Linux Audio

Check our new training course

Loading...
   1/*
   2 * ARMv7 Cortex-A8 and Cortex-A9 Performance Events handling code.
   3 *
   4 * ARMv7 support: Jean Pihet <jpihet@mvista.com>
   5 * 2010 (c) MontaVista Software, LLC.
   6 *
   7 * Copied from ARMv6 code, with the low level code inspired
   8 *  by the ARMv7 Oprofile code.
   9 *
  10 * Cortex-A8 has up to 4 configurable performance counters and
  11 *  a single cycle counter.
  12 * Cortex-A9 has up to 31 configurable performance counters and
  13 *  a single cycle counter.
  14 *
  15 * All counters can be enabled/disabled and IRQ masked separately. The cycle
  16 *  counter and all 4 performance counters together can be reset separately.
  17 */
  18
  19#ifdef CONFIG_CPU_V7
  20
  21#include <asm/cp15.h>
  22#include <asm/cputype.h>
  23#include <asm/irq_regs.h>
  24#include <asm/vfp.h>
  25#include "../vfp/vfpinstr.h"
  26
  27#include <linux/of.h>
  28#include <linux/perf/arm_pmu.h>
  29#include <linux/platform_device.h>
  30
  31/*
  32 * Common ARMv7 event types
  33 *
  34 * Note: An implementation may not be able to count all of these events
  35 * but the encodings are considered to be `reserved' in the case that
  36 * they are not available.
  37 */
  38#define ARMV7_PERFCTR_PMNC_SW_INCR			0x00
  39#define ARMV7_PERFCTR_L1_ICACHE_REFILL			0x01
  40#define ARMV7_PERFCTR_ITLB_REFILL			0x02
  41#define ARMV7_PERFCTR_L1_DCACHE_REFILL			0x03
  42#define ARMV7_PERFCTR_L1_DCACHE_ACCESS			0x04
  43#define ARMV7_PERFCTR_DTLB_REFILL			0x05
  44#define ARMV7_PERFCTR_MEM_READ				0x06
  45#define ARMV7_PERFCTR_MEM_WRITE				0x07
  46#define ARMV7_PERFCTR_INSTR_EXECUTED			0x08
  47#define ARMV7_PERFCTR_EXC_TAKEN				0x09
  48#define ARMV7_PERFCTR_EXC_EXECUTED			0x0A
  49#define ARMV7_PERFCTR_CID_WRITE				0x0B
  50
  51/*
  52 * ARMV7_PERFCTR_PC_WRITE is equivalent to HW_BRANCH_INSTRUCTIONS.
  53 * It counts:
  54 *  - all (taken) branch instructions,
  55 *  - instructions that explicitly write the PC,
  56 *  - exception generating instructions.
  57 */
  58#define ARMV7_PERFCTR_PC_WRITE				0x0C
  59#define ARMV7_PERFCTR_PC_IMM_BRANCH			0x0D
  60#define ARMV7_PERFCTR_PC_PROC_RETURN			0x0E
  61#define ARMV7_PERFCTR_MEM_UNALIGNED_ACCESS		0x0F
  62#define ARMV7_PERFCTR_PC_BRANCH_MIS_PRED		0x10
  63#define ARMV7_PERFCTR_CLOCK_CYCLES			0x11
  64#define ARMV7_PERFCTR_PC_BRANCH_PRED			0x12
  65
  66/* These events are defined by the PMUv2 supplement (ARM DDI 0457A). */
  67#define ARMV7_PERFCTR_MEM_ACCESS			0x13
  68#define ARMV7_PERFCTR_L1_ICACHE_ACCESS			0x14
  69#define ARMV7_PERFCTR_L1_DCACHE_WB			0x15
  70#define ARMV7_PERFCTR_L2_CACHE_ACCESS			0x16
  71#define ARMV7_PERFCTR_L2_CACHE_REFILL			0x17
  72#define ARMV7_PERFCTR_L2_CACHE_WB			0x18
  73#define ARMV7_PERFCTR_BUS_ACCESS			0x19
  74#define ARMV7_PERFCTR_MEM_ERROR				0x1A
  75#define ARMV7_PERFCTR_INSTR_SPEC			0x1B
  76#define ARMV7_PERFCTR_TTBR_WRITE			0x1C
  77#define ARMV7_PERFCTR_BUS_CYCLES			0x1D
  78
  79#define ARMV7_PERFCTR_CPU_CYCLES			0xFF
  80
  81/* ARMv7 Cortex-A8 specific event types */
  82#define ARMV7_A8_PERFCTR_L2_CACHE_ACCESS		0x43
  83#define ARMV7_A8_PERFCTR_L2_CACHE_REFILL		0x44
  84#define ARMV7_A8_PERFCTR_L1_ICACHE_ACCESS		0x50
  85#define ARMV7_A8_PERFCTR_STALL_ISIDE			0x56
  86
  87/* ARMv7 Cortex-A9 specific event types */
  88#define ARMV7_A9_PERFCTR_INSTR_CORE_RENAME		0x68
  89#define ARMV7_A9_PERFCTR_STALL_ICACHE			0x60
  90#define ARMV7_A9_PERFCTR_STALL_DISPATCH			0x66
  91
  92/* ARMv7 Cortex-A5 specific event types */
  93#define ARMV7_A5_PERFCTR_PREFETCH_LINEFILL		0xc2
  94#define ARMV7_A5_PERFCTR_PREFETCH_LINEFILL_DROP		0xc3
  95
  96/* ARMv7 Cortex-A15 specific event types */
  97#define ARMV7_A15_PERFCTR_L1_DCACHE_ACCESS_READ		0x40
  98#define ARMV7_A15_PERFCTR_L1_DCACHE_ACCESS_WRITE	0x41
  99#define ARMV7_A15_PERFCTR_L1_DCACHE_REFILL_READ		0x42
 100#define ARMV7_A15_PERFCTR_L1_DCACHE_REFILL_WRITE	0x43
 101
 102#define ARMV7_A15_PERFCTR_DTLB_REFILL_L1_READ		0x4C
 103#define ARMV7_A15_PERFCTR_DTLB_REFILL_L1_WRITE		0x4D
 104
 105#define ARMV7_A15_PERFCTR_L2_CACHE_ACCESS_READ		0x50
 106#define ARMV7_A15_PERFCTR_L2_CACHE_ACCESS_WRITE		0x51
 107#define ARMV7_A15_PERFCTR_L2_CACHE_REFILL_READ		0x52
 108#define ARMV7_A15_PERFCTR_L2_CACHE_REFILL_WRITE		0x53
 109
 110#define ARMV7_A15_PERFCTR_PC_WRITE_SPEC			0x76
 111
 112/* ARMv7 Cortex-A12 specific event types */
 113#define ARMV7_A12_PERFCTR_L1_DCACHE_ACCESS_READ		0x40
 114#define ARMV7_A12_PERFCTR_L1_DCACHE_ACCESS_WRITE	0x41
 115
 116#define ARMV7_A12_PERFCTR_L2_CACHE_ACCESS_READ		0x50
 117#define ARMV7_A12_PERFCTR_L2_CACHE_ACCESS_WRITE		0x51
 118
 119#define ARMV7_A12_PERFCTR_PC_WRITE_SPEC			0x76
 120
 121#define ARMV7_A12_PERFCTR_PF_TLB_REFILL			0xe7
 122
 123/* ARMv7 Krait specific event types */
 124#define KRAIT_PMRESR0_GROUP0				0xcc
 125#define KRAIT_PMRESR1_GROUP0				0xd0
 126#define KRAIT_PMRESR2_GROUP0				0xd4
 127#define KRAIT_VPMRESR0_GROUP0				0xd8
 128
 129#define KRAIT_PERFCTR_L1_ICACHE_ACCESS			0x10011
 130#define KRAIT_PERFCTR_L1_ICACHE_MISS			0x10010
 131
 132#define KRAIT_PERFCTR_L1_ITLB_ACCESS			0x12222
 133#define KRAIT_PERFCTR_L1_DTLB_ACCESS			0x12210
 134
 135/* ARMv7 Scorpion specific event types */
 136#define SCORPION_LPM0_GROUP0				0x4c
 137#define SCORPION_LPM1_GROUP0				0x50
 138#define SCORPION_LPM2_GROUP0				0x54
 139#define SCORPION_L2LPM_GROUP0				0x58
 140#define SCORPION_VLPM_GROUP0				0x5c
 141
 142#define SCORPION_ICACHE_ACCESS				0x10053
 143#define SCORPION_ICACHE_MISS				0x10052
 144
 145#define SCORPION_DTLB_ACCESS				0x12013
 146#define SCORPION_DTLB_MISS				0x12012
 147
 148#define SCORPION_ITLB_MISS				0x12021
 149
 150/*
 151 * Cortex-A8 HW events mapping
 152 *
 153 * The hardware events that we support. We do support cache operations but
 154 * we have harvard caches and no way to combine instruction and data
 155 * accesses/misses in hardware.
 156 */
 157static const unsigned armv7_a8_perf_map[PERF_COUNT_HW_MAX] = {
 158	PERF_MAP_ALL_UNSUPPORTED,
 159	[PERF_COUNT_HW_CPU_CYCLES]		= ARMV7_PERFCTR_CPU_CYCLES,
 160	[PERF_COUNT_HW_INSTRUCTIONS]		= ARMV7_PERFCTR_INSTR_EXECUTED,
 161	[PERF_COUNT_HW_CACHE_REFERENCES]	= ARMV7_PERFCTR_L1_DCACHE_ACCESS,
 162	[PERF_COUNT_HW_CACHE_MISSES]		= ARMV7_PERFCTR_L1_DCACHE_REFILL,
 163	[PERF_COUNT_HW_BRANCH_INSTRUCTIONS]	= ARMV7_PERFCTR_PC_WRITE,
 164	[PERF_COUNT_HW_BRANCH_MISSES]		= ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
 165	[PERF_COUNT_HW_STALLED_CYCLES_FRONTEND]	= ARMV7_A8_PERFCTR_STALL_ISIDE,
 166};
 167
 168static const unsigned armv7_a8_perf_cache_map[PERF_COUNT_HW_CACHE_MAX]
 169					  [PERF_COUNT_HW_CACHE_OP_MAX]
 170					  [PERF_COUNT_HW_CACHE_RESULT_MAX] = {
 171	PERF_CACHE_MAP_ALL_UNSUPPORTED,
 172
 173	/*
 174	 * The performance counters don't differentiate between read and write
 175	 * accesses/misses so this isn't strictly correct, but it's the best we
 176	 * can do. Writes and reads get combined.
 177	 */
 178	[C(L1D)][C(OP_READ)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_L1_DCACHE_ACCESS,
 179	[C(L1D)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_L1_DCACHE_REFILL,
 180	[C(L1D)][C(OP_WRITE)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_L1_DCACHE_ACCESS,
 181	[C(L1D)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_L1_DCACHE_REFILL,
 182
 183	[C(L1I)][C(OP_READ)][C(RESULT_ACCESS)]	= ARMV7_A8_PERFCTR_L1_ICACHE_ACCESS,
 184	[C(L1I)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_L1_ICACHE_REFILL,
 185
 186	[C(LL)][C(OP_READ)][C(RESULT_ACCESS)]	= ARMV7_A8_PERFCTR_L2_CACHE_ACCESS,
 187	[C(LL)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_A8_PERFCTR_L2_CACHE_REFILL,
 188	[C(LL)][C(OP_WRITE)][C(RESULT_ACCESS)]	= ARMV7_A8_PERFCTR_L2_CACHE_ACCESS,
 189	[C(LL)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_A8_PERFCTR_L2_CACHE_REFILL,
 190
 191	[C(DTLB)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_DTLB_REFILL,
 192	[C(DTLB)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_DTLB_REFILL,
 193
 194	[C(ITLB)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_ITLB_REFILL,
 195	[C(ITLB)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_ITLB_REFILL,
 196
 197	[C(BPU)][C(OP_READ)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_PC_BRANCH_PRED,
 198	[C(BPU)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
 199	[C(BPU)][C(OP_WRITE)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_PC_BRANCH_PRED,
 200	[C(BPU)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
 201};
 202
 203/*
 204 * Cortex-A9 HW events mapping
 205 */
 206static const unsigned armv7_a9_perf_map[PERF_COUNT_HW_MAX] = {
 207	PERF_MAP_ALL_UNSUPPORTED,
 208	[PERF_COUNT_HW_CPU_CYCLES]		= ARMV7_PERFCTR_CPU_CYCLES,
 209	[PERF_COUNT_HW_INSTRUCTIONS]		= ARMV7_A9_PERFCTR_INSTR_CORE_RENAME,
 210	[PERF_COUNT_HW_CACHE_REFERENCES]	= ARMV7_PERFCTR_L1_DCACHE_ACCESS,
 211	[PERF_COUNT_HW_CACHE_MISSES]		= ARMV7_PERFCTR_L1_DCACHE_REFILL,
 212	[PERF_COUNT_HW_BRANCH_INSTRUCTIONS]	= ARMV7_PERFCTR_PC_WRITE,
 213	[PERF_COUNT_HW_BRANCH_MISSES]		= ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
 214	[PERF_COUNT_HW_STALLED_CYCLES_FRONTEND]	= ARMV7_A9_PERFCTR_STALL_ICACHE,
 215	[PERF_COUNT_HW_STALLED_CYCLES_BACKEND]	= ARMV7_A9_PERFCTR_STALL_DISPATCH,
 216};
 217
 218static const unsigned armv7_a9_perf_cache_map[PERF_COUNT_HW_CACHE_MAX]
 219					  [PERF_COUNT_HW_CACHE_OP_MAX]
 220					  [PERF_COUNT_HW_CACHE_RESULT_MAX] = {
 221	PERF_CACHE_MAP_ALL_UNSUPPORTED,
 222
 223	/*
 224	 * The performance counters don't differentiate between read and write
 225	 * accesses/misses so this isn't strictly correct, but it's the best we
 226	 * can do. Writes and reads get combined.
 227	 */
 228	[C(L1D)][C(OP_READ)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_L1_DCACHE_ACCESS,
 229	[C(L1D)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_L1_DCACHE_REFILL,
 230	[C(L1D)][C(OP_WRITE)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_L1_DCACHE_ACCESS,
 231	[C(L1D)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_L1_DCACHE_REFILL,
 232
 233	[C(L1I)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_L1_ICACHE_REFILL,
 234
 235	[C(DTLB)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_DTLB_REFILL,
 236	[C(DTLB)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_DTLB_REFILL,
 237
 238	[C(ITLB)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_ITLB_REFILL,
 239	[C(ITLB)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_ITLB_REFILL,
 240
 241	[C(BPU)][C(OP_READ)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_PC_BRANCH_PRED,
 242	[C(BPU)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
 243	[C(BPU)][C(OP_WRITE)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_PC_BRANCH_PRED,
 244	[C(BPU)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
 245};
 246
 247/*
 248 * Cortex-A5 HW events mapping
 249 */
 250static const unsigned armv7_a5_perf_map[PERF_COUNT_HW_MAX] = {
 251	PERF_MAP_ALL_UNSUPPORTED,
 252	[PERF_COUNT_HW_CPU_CYCLES]		= ARMV7_PERFCTR_CPU_CYCLES,
 253	[PERF_COUNT_HW_INSTRUCTIONS]		= ARMV7_PERFCTR_INSTR_EXECUTED,
 254	[PERF_COUNT_HW_CACHE_REFERENCES]	= ARMV7_PERFCTR_L1_DCACHE_ACCESS,
 255	[PERF_COUNT_HW_CACHE_MISSES]		= ARMV7_PERFCTR_L1_DCACHE_REFILL,
 256	[PERF_COUNT_HW_BRANCH_INSTRUCTIONS]	= ARMV7_PERFCTR_PC_WRITE,
 257	[PERF_COUNT_HW_BRANCH_MISSES]		= ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
 258};
 259
 260static const unsigned armv7_a5_perf_cache_map[PERF_COUNT_HW_CACHE_MAX]
 261					[PERF_COUNT_HW_CACHE_OP_MAX]
 262					[PERF_COUNT_HW_CACHE_RESULT_MAX] = {
 263	PERF_CACHE_MAP_ALL_UNSUPPORTED,
 264
 265	[C(L1D)][C(OP_READ)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_L1_DCACHE_ACCESS,
 266	[C(L1D)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_L1_DCACHE_REFILL,
 267	[C(L1D)][C(OP_WRITE)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_L1_DCACHE_ACCESS,
 268	[C(L1D)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_L1_DCACHE_REFILL,
 269	[C(L1D)][C(OP_PREFETCH)][C(RESULT_ACCESS)]	= ARMV7_A5_PERFCTR_PREFETCH_LINEFILL,
 270	[C(L1D)][C(OP_PREFETCH)][C(RESULT_MISS)]	= ARMV7_A5_PERFCTR_PREFETCH_LINEFILL_DROP,
 271
 272	[C(L1I)][C(OP_READ)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_L1_ICACHE_ACCESS,
 273	[C(L1I)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_L1_ICACHE_REFILL,
 274	/*
 275	 * The prefetch counters don't differentiate between the I side and the
 276	 * D side.
 277	 */
 278	[C(L1I)][C(OP_PREFETCH)][C(RESULT_ACCESS)]	= ARMV7_A5_PERFCTR_PREFETCH_LINEFILL,
 279	[C(L1I)][C(OP_PREFETCH)][C(RESULT_MISS)]	= ARMV7_A5_PERFCTR_PREFETCH_LINEFILL_DROP,
 280
 281	[C(DTLB)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_DTLB_REFILL,
 282	[C(DTLB)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_DTLB_REFILL,
 283
 284	[C(ITLB)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_ITLB_REFILL,
 285	[C(ITLB)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_ITLB_REFILL,
 286
 287	[C(BPU)][C(OP_READ)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_PC_BRANCH_PRED,
 288	[C(BPU)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
 289	[C(BPU)][C(OP_WRITE)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_PC_BRANCH_PRED,
 290	[C(BPU)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
 291};
 292
 293/*
 294 * Cortex-A15 HW events mapping
 295 */
 296static const unsigned armv7_a15_perf_map[PERF_COUNT_HW_MAX] = {
 297	PERF_MAP_ALL_UNSUPPORTED,
 298	[PERF_COUNT_HW_CPU_CYCLES]		= ARMV7_PERFCTR_CPU_CYCLES,
 299	[PERF_COUNT_HW_INSTRUCTIONS]		= ARMV7_PERFCTR_INSTR_EXECUTED,
 300	[PERF_COUNT_HW_CACHE_REFERENCES]	= ARMV7_PERFCTR_L1_DCACHE_ACCESS,
 301	[PERF_COUNT_HW_CACHE_MISSES]		= ARMV7_PERFCTR_L1_DCACHE_REFILL,
 302	[PERF_COUNT_HW_BRANCH_INSTRUCTIONS]	= ARMV7_A15_PERFCTR_PC_WRITE_SPEC,
 303	[PERF_COUNT_HW_BRANCH_MISSES]		= ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
 304	[PERF_COUNT_HW_BUS_CYCLES]		= ARMV7_PERFCTR_BUS_CYCLES,
 305};
 306
 307static const unsigned armv7_a15_perf_cache_map[PERF_COUNT_HW_CACHE_MAX]
 308					[PERF_COUNT_HW_CACHE_OP_MAX]
 309					[PERF_COUNT_HW_CACHE_RESULT_MAX] = {
 310	PERF_CACHE_MAP_ALL_UNSUPPORTED,
 311
 312	[C(L1D)][C(OP_READ)][C(RESULT_ACCESS)]	= ARMV7_A15_PERFCTR_L1_DCACHE_ACCESS_READ,
 313	[C(L1D)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_A15_PERFCTR_L1_DCACHE_REFILL_READ,
 314	[C(L1D)][C(OP_WRITE)][C(RESULT_ACCESS)]	= ARMV7_A15_PERFCTR_L1_DCACHE_ACCESS_WRITE,
 315	[C(L1D)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_A15_PERFCTR_L1_DCACHE_REFILL_WRITE,
 316
 317	/*
 318	 * Not all performance counters differentiate between read and write
 319	 * accesses/misses so we're not always strictly correct, but it's the
 320	 * best we can do. Writes and reads get combined in these cases.
 321	 */
 322	[C(L1I)][C(OP_READ)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_L1_ICACHE_ACCESS,
 323	[C(L1I)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_L1_ICACHE_REFILL,
 324
 325	[C(LL)][C(OP_READ)][C(RESULT_ACCESS)]	= ARMV7_A15_PERFCTR_L2_CACHE_ACCESS_READ,
 326	[C(LL)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_A15_PERFCTR_L2_CACHE_REFILL_READ,
 327	[C(LL)][C(OP_WRITE)][C(RESULT_ACCESS)]	= ARMV7_A15_PERFCTR_L2_CACHE_ACCESS_WRITE,
 328	[C(LL)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_A15_PERFCTR_L2_CACHE_REFILL_WRITE,
 329
 330	[C(DTLB)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_A15_PERFCTR_DTLB_REFILL_L1_READ,
 331	[C(DTLB)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_A15_PERFCTR_DTLB_REFILL_L1_WRITE,
 332
 333	[C(ITLB)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_ITLB_REFILL,
 334	[C(ITLB)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_ITLB_REFILL,
 335
 336	[C(BPU)][C(OP_READ)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_PC_BRANCH_PRED,
 337	[C(BPU)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
 338	[C(BPU)][C(OP_WRITE)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_PC_BRANCH_PRED,
 339	[C(BPU)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
 340};
 341
 342/*
 343 * Cortex-A7 HW events mapping
 344 */
 345static const unsigned armv7_a7_perf_map[PERF_COUNT_HW_MAX] = {
 346	PERF_MAP_ALL_UNSUPPORTED,
 347	[PERF_COUNT_HW_CPU_CYCLES]		= ARMV7_PERFCTR_CPU_CYCLES,
 348	[PERF_COUNT_HW_INSTRUCTIONS]		= ARMV7_PERFCTR_INSTR_EXECUTED,
 349	[PERF_COUNT_HW_CACHE_REFERENCES]	= ARMV7_PERFCTR_L1_DCACHE_ACCESS,
 350	[PERF_COUNT_HW_CACHE_MISSES]		= ARMV7_PERFCTR_L1_DCACHE_REFILL,
 351	[PERF_COUNT_HW_BRANCH_INSTRUCTIONS]	= ARMV7_PERFCTR_PC_WRITE,
 352	[PERF_COUNT_HW_BRANCH_MISSES]		= ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
 353	[PERF_COUNT_HW_BUS_CYCLES]		= ARMV7_PERFCTR_BUS_CYCLES,
 354};
 355
 356static const unsigned armv7_a7_perf_cache_map[PERF_COUNT_HW_CACHE_MAX]
 357					[PERF_COUNT_HW_CACHE_OP_MAX]
 358					[PERF_COUNT_HW_CACHE_RESULT_MAX] = {
 359	PERF_CACHE_MAP_ALL_UNSUPPORTED,
 360
 361	/*
 362	 * The performance counters don't differentiate between read and write
 363	 * accesses/misses so this isn't strictly correct, but it's the best we
 364	 * can do. Writes and reads get combined.
 365	 */
 366	[C(L1D)][C(OP_READ)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_L1_DCACHE_ACCESS,
 367	[C(L1D)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_L1_DCACHE_REFILL,
 368	[C(L1D)][C(OP_WRITE)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_L1_DCACHE_ACCESS,
 369	[C(L1D)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_L1_DCACHE_REFILL,
 370
 371	[C(L1I)][C(OP_READ)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_L1_ICACHE_ACCESS,
 372	[C(L1I)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_L1_ICACHE_REFILL,
 373
 374	[C(LL)][C(OP_READ)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_L2_CACHE_ACCESS,
 375	[C(LL)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_L2_CACHE_REFILL,
 376	[C(LL)][C(OP_WRITE)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_L2_CACHE_ACCESS,
 377	[C(LL)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_L2_CACHE_REFILL,
 378
 379	[C(DTLB)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_DTLB_REFILL,
 380	[C(DTLB)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_DTLB_REFILL,
 381
 382	[C(ITLB)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_ITLB_REFILL,
 383	[C(ITLB)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_ITLB_REFILL,
 384
 385	[C(BPU)][C(OP_READ)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_PC_BRANCH_PRED,
 386	[C(BPU)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
 387	[C(BPU)][C(OP_WRITE)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_PC_BRANCH_PRED,
 388	[C(BPU)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
 389};
 390
 391/*
 392 * Cortex-A12 HW events mapping
 393 */
 394static const unsigned armv7_a12_perf_map[PERF_COUNT_HW_MAX] = {
 395	PERF_MAP_ALL_UNSUPPORTED,
 396	[PERF_COUNT_HW_CPU_CYCLES]		= ARMV7_PERFCTR_CPU_CYCLES,
 397	[PERF_COUNT_HW_INSTRUCTIONS]		= ARMV7_PERFCTR_INSTR_EXECUTED,
 398	[PERF_COUNT_HW_CACHE_REFERENCES]	= ARMV7_PERFCTR_L1_DCACHE_ACCESS,
 399	[PERF_COUNT_HW_CACHE_MISSES]		= ARMV7_PERFCTR_L1_DCACHE_REFILL,
 400	[PERF_COUNT_HW_BRANCH_INSTRUCTIONS]	= ARMV7_A12_PERFCTR_PC_WRITE_SPEC,
 401	[PERF_COUNT_HW_BRANCH_MISSES]		= ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
 402	[PERF_COUNT_HW_BUS_CYCLES]		= ARMV7_PERFCTR_BUS_CYCLES,
 403};
 404
 405static const unsigned armv7_a12_perf_cache_map[PERF_COUNT_HW_CACHE_MAX]
 406					[PERF_COUNT_HW_CACHE_OP_MAX]
 407					[PERF_COUNT_HW_CACHE_RESULT_MAX] = {
 408	PERF_CACHE_MAP_ALL_UNSUPPORTED,
 409
 410	[C(L1D)][C(OP_READ)][C(RESULT_ACCESS)]	= ARMV7_A12_PERFCTR_L1_DCACHE_ACCESS_READ,
 411	[C(L1D)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_L1_DCACHE_REFILL,
 412	[C(L1D)][C(OP_WRITE)][C(RESULT_ACCESS)]	= ARMV7_A12_PERFCTR_L1_DCACHE_ACCESS_WRITE,
 413	[C(L1D)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_L1_DCACHE_REFILL,
 414
 415	/*
 416	 * Not all performance counters differentiate between read and write
 417	 * accesses/misses so we're not always strictly correct, but it's the
 418	 * best we can do. Writes and reads get combined in these cases.
 419	 */
 420	[C(L1I)][C(OP_READ)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_L1_ICACHE_ACCESS,
 421	[C(L1I)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_L1_ICACHE_REFILL,
 422
 423	[C(LL)][C(OP_READ)][C(RESULT_ACCESS)]	= ARMV7_A12_PERFCTR_L2_CACHE_ACCESS_READ,
 424	[C(LL)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_L2_CACHE_REFILL,
 425	[C(LL)][C(OP_WRITE)][C(RESULT_ACCESS)]	= ARMV7_A12_PERFCTR_L2_CACHE_ACCESS_WRITE,
 426	[C(LL)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_L2_CACHE_REFILL,
 427
 428	[C(DTLB)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_DTLB_REFILL,
 429	[C(DTLB)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_DTLB_REFILL,
 430	[C(DTLB)][C(OP_PREFETCH)][C(RESULT_MISS)]	= ARMV7_A12_PERFCTR_PF_TLB_REFILL,
 431
 432	[C(ITLB)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_ITLB_REFILL,
 433	[C(ITLB)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_ITLB_REFILL,
 434
 435	[C(BPU)][C(OP_READ)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_PC_BRANCH_PRED,
 436	[C(BPU)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
 437	[C(BPU)][C(OP_WRITE)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_PC_BRANCH_PRED,
 438	[C(BPU)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
 439};
 440
 441/*
 442 * Krait HW events mapping
 443 */
 444static const unsigned krait_perf_map[PERF_COUNT_HW_MAX] = {
 445	PERF_MAP_ALL_UNSUPPORTED,
 446	[PERF_COUNT_HW_CPU_CYCLES]	    = ARMV7_PERFCTR_CPU_CYCLES,
 447	[PERF_COUNT_HW_INSTRUCTIONS]	    = ARMV7_PERFCTR_INSTR_EXECUTED,
 448	[PERF_COUNT_HW_BRANCH_INSTRUCTIONS] = ARMV7_PERFCTR_PC_WRITE,
 449	[PERF_COUNT_HW_BRANCH_MISSES]	    = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
 450	[PERF_COUNT_HW_BUS_CYCLES]	    = ARMV7_PERFCTR_CLOCK_CYCLES,
 451};
 452
 453static const unsigned krait_perf_map_no_branch[PERF_COUNT_HW_MAX] = {
 454	PERF_MAP_ALL_UNSUPPORTED,
 455	[PERF_COUNT_HW_CPU_CYCLES]	    = ARMV7_PERFCTR_CPU_CYCLES,
 456	[PERF_COUNT_HW_INSTRUCTIONS]	    = ARMV7_PERFCTR_INSTR_EXECUTED,
 457	[PERF_COUNT_HW_BRANCH_MISSES]	    = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
 458	[PERF_COUNT_HW_BUS_CYCLES]	    = ARMV7_PERFCTR_CLOCK_CYCLES,
 459};
 460
 461static const unsigned krait_perf_cache_map[PERF_COUNT_HW_CACHE_MAX]
 462					  [PERF_COUNT_HW_CACHE_OP_MAX]
 463					  [PERF_COUNT_HW_CACHE_RESULT_MAX] = {
 464	PERF_CACHE_MAP_ALL_UNSUPPORTED,
 465
 466	/*
 467	 * The performance counters don't differentiate between read and write
 468	 * accesses/misses so this isn't strictly correct, but it's the best we
 469	 * can do. Writes and reads get combined.
 470	 */
 471	[C(L1D)][C(OP_READ)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_L1_DCACHE_ACCESS,
 472	[C(L1D)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_L1_DCACHE_REFILL,
 473	[C(L1D)][C(OP_WRITE)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_L1_DCACHE_ACCESS,
 474	[C(L1D)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_L1_DCACHE_REFILL,
 475
 476	[C(L1I)][C(OP_READ)][C(RESULT_ACCESS)]	= KRAIT_PERFCTR_L1_ICACHE_ACCESS,
 477	[C(L1I)][C(OP_READ)][C(RESULT_MISS)]	= KRAIT_PERFCTR_L1_ICACHE_MISS,
 478
 479	[C(DTLB)][C(OP_READ)][C(RESULT_ACCESS)]	= KRAIT_PERFCTR_L1_DTLB_ACCESS,
 480	[C(DTLB)][C(OP_WRITE)][C(RESULT_ACCESS)]	= KRAIT_PERFCTR_L1_DTLB_ACCESS,
 481
 482	[C(ITLB)][C(OP_READ)][C(RESULT_ACCESS)]	= KRAIT_PERFCTR_L1_ITLB_ACCESS,
 483	[C(ITLB)][C(OP_WRITE)][C(RESULT_ACCESS)]	= KRAIT_PERFCTR_L1_ITLB_ACCESS,
 484
 485	[C(BPU)][C(OP_READ)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_PC_BRANCH_PRED,
 486	[C(BPU)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
 487	[C(BPU)][C(OP_WRITE)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_PC_BRANCH_PRED,
 488	[C(BPU)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
 489};
 490
 491/*
 492 * Scorpion HW events mapping
 493 */
 494static const unsigned scorpion_perf_map[PERF_COUNT_HW_MAX] = {
 495	PERF_MAP_ALL_UNSUPPORTED,
 496	[PERF_COUNT_HW_CPU_CYCLES]	    = ARMV7_PERFCTR_CPU_CYCLES,
 497	[PERF_COUNT_HW_INSTRUCTIONS]	    = ARMV7_PERFCTR_INSTR_EXECUTED,
 498	[PERF_COUNT_HW_BRANCH_INSTRUCTIONS] = ARMV7_PERFCTR_PC_WRITE,
 499	[PERF_COUNT_HW_BRANCH_MISSES]	    = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
 500	[PERF_COUNT_HW_BUS_CYCLES]	    = ARMV7_PERFCTR_CLOCK_CYCLES,
 501};
 502
 503static const unsigned scorpion_perf_cache_map[PERF_COUNT_HW_CACHE_MAX]
 504					    [PERF_COUNT_HW_CACHE_OP_MAX]
 505					    [PERF_COUNT_HW_CACHE_RESULT_MAX] = {
 506	PERF_CACHE_MAP_ALL_UNSUPPORTED,
 507	/*
 508	 * The performance counters don't differentiate between read and write
 509	 * accesses/misses so this isn't strictly correct, but it's the best we
 510	 * can do. Writes and reads get combined.
 511	 */
 512	[C(L1D)][C(OP_READ)][C(RESULT_ACCESS)] = ARMV7_PERFCTR_L1_DCACHE_ACCESS,
 513	[C(L1D)][C(OP_READ)][C(RESULT_MISS)] = ARMV7_PERFCTR_L1_DCACHE_REFILL,
 514	[C(L1D)][C(OP_WRITE)][C(RESULT_ACCESS)] = ARMV7_PERFCTR_L1_DCACHE_ACCESS,
 515	[C(L1D)][C(OP_WRITE)][C(RESULT_MISS)] = ARMV7_PERFCTR_L1_DCACHE_REFILL,
 516	[C(L1I)][C(OP_READ)][C(RESULT_ACCESS)] = SCORPION_ICACHE_ACCESS,
 517	[C(L1I)][C(OP_READ)][C(RESULT_MISS)] = SCORPION_ICACHE_MISS,
 518	/*
 519	 * Only ITLB misses and DTLB refills are supported.  If users want the
 520	 * DTLB refills misses a raw counter must be used.
 521	 */
 522	[C(DTLB)][C(OP_READ)][C(RESULT_ACCESS)] = SCORPION_DTLB_ACCESS,
 523	[C(DTLB)][C(OP_READ)][C(RESULT_MISS)] = SCORPION_DTLB_MISS,
 524	[C(DTLB)][C(OP_WRITE)][C(RESULT_ACCESS)] = SCORPION_DTLB_ACCESS,
 525	[C(DTLB)][C(OP_WRITE)][C(RESULT_MISS)] = SCORPION_DTLB_MISS,
 526	[C(ITLB)][C(OP_READ)][C(RESULT_MISS)] = SCORPION_ITLB_MISS,
 527	[C(ITLB)][C(OP_WRITE)][C(RESULT_MISS)] = SCORPION_ITLB_MISS,
 528	[C(BPU)][C(OP_READ)][C(RESULT_ACCESS)] = ARMV7_PERFCTR_PC_BRANCH_PRED,
 529	[C(BPU)][C(OP_READ)][C(RESULT_MISS)] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
 530	[C(BPU)][C(OP_WRITE)][C(RESULT_ACCESS)] = ARMV7_PERFCTR_PC_BRANCH_PRED,
 531	[C(BPU)][C(OP_WRITE)][C(RESULT_MISS)] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
 532};
 533
 534PMU_FORMAT_ATTR(event, "config:0-7");
 535
 536static struct attribute *armv7_pmu_format_attrs[] = {
 537	&format_attr_event.attr,
 538	NULL,
 539};
 540
 541static struct attribute_group armv7_pmu_format_attr_group = {
 542	.name = "format",
 543	.attrs = armv7_pmu_format_attrs,
 544};
 545
 546#define ARMV7_EVENT_ATTR_RESOLVE(m) #m
 547#define ARMV7_EVENT_ATTR(name, config) \
 548	PMU_EVENT_ATTR_STRING(name, armv7_event_attr_##name, \
 549			      "event=" ARMV7_EVENT_ATTR_RESOLVE(config))
 550
 551ARMV7_EVENT_ATTR(sw_incr, ARMV7_PERFCTR_PMNC_SW_INCR);
 552ARMV7_EVENT_ATTR(l1i_cache_refill, ARMV7_PERFCTR_L1_ICACHE_REFILL);
 553ARMV7_EVENT_ATTR(l1i_tlb_refill, ARMV7_PERFCTR_ITLB_REFILL);
 554ARMV7_EVENT_ATTR(l1d_cache_refill, ARMV7_PERFCTR_L1_DCACHE_REFILL);
 555ARMV7_EVENT_ATTR(l1d_cache, ARMV7_PERFCTR_L1_DCACHE_ACCESS);
 556ARMV7_EVENT_ATTR(l1d_tlb_refill, ARMV7_PERFCTR_DTLB_REFILL);
 557ARMV7_EVENT_ATTR(ld_retired, ARMV7_PERFCTR_MEM_READ);
 558ARMV7_EVENT_ATTR(st_retired, ARMV7_PERFCTR_MEM_WRITE);
 559ARMV7_EVENT_ATTR(inst_retired, ARMV7_PERFCTR_INSTR_EXECUTED);
 560ARMV7_EVENT_ATTR(exc_taken, ARMV7_PERFCTR_EXC_TAKEN);
 561ARMV7_EVENT_ATTR(exc_return, ARMV7_PERFCTR_EXC_EXECUTED);
 562ARMV7_EVENT_ATTR(cid_write_retired, ARMV7_PERFCTR_CID_WRITE);
 563ARMV7_EVENT_ATTR(pc_write_retired, ARMV7_PERFCTR_PC_WRITE);
 564ARMV7_EVENT_ATTR(br_immed_retired, ARMV7_PERFCTR_PC_IMM_BRANCH);
 565ARMV7_EVENT_ATTR(br_return_retired, ARMV7_PERFCTR_PC_PROC_RETURN);
 566ARMV7_EVENT_ATTR(unaligned_ldst_retired, ARMV7_PERFCTR_MEM_UNALIGNED_ACCESS);
 567ARMV7_EVENT_ATTR(br_mis_pred, ARMV7_PERFCTR_PC_BRANCH_MIS_PRED);
 568ARMV7_EVENT_ATTR(cpu_cycles, ARMV7_PERFCTR_CLOCK_CYCLES);
 569ARMV7_EVENT_ATTR(br_pred, ARMV7_PERFCTR_PC_BRANCH_PRED);
 570
 571static struct attribute *armv7_pmuv1_event_attrs[] = {
 572	&armv7_event_attr_sw_incr.attr.attr,
 573	&armv7_event_attr_l1i_cache_refill.attr.attr,
 574	&armv7_event_attr_l1i_tlb_refill.attr.attr,
 575	&armv7_event_attr_l1d_cache_refill.attr.attr,
 576	&armv7_event_attr_l1d_cache.attr.attr,
 577	&armv7_event_attr_l1d_tlb_refill.attr.attr,
 578	&armv7_event_attr_ld_retired.attr.attr,
 579	&armv7_event_attr_st_retired.attr.attr,
 580	&armv7_event_attr_inst_retired.attr.attr,
 581	&armv7_event_attr_exc_taken.attr.attr,
 582	&armv7_event_attr_exc_return.attr.attr,
 583	&armv7_event_attr_cid_write_retired.attr.attr,
 584	&armv7_event_attr_pc_write_retired.attr.attr,
 585	&armv7_event_attr_br_immed_retired.attr.attr,
 586	&armv7_event_attr_br_return_retired.attr.attr,
 587	&armv7_event_attr_unaligned_ldst_retired.attr.attr,
 588	&armv7_event_attr_br_mis_pred.attr.attr,
 589	&armv7_event_attr_cpu_cycles.attr.attr,
 590	&armv7_event_attr_br_pred.attr.attr,
 591	NULL,
 592};
 593
 594static struct attribute_group armv7_pmuv1_events_attr_group = {
 595	.name = "events",
 596	.attrs = armv7_pmuv1_event_attrs,
 597};
 598
 599static const struct attribute_group *armv7_pmuv1_attr_groups[] = {
 600	&armv7_pmuv1_events_attr_group,
 601	&armv7_pmu_format_attr_group,
 602	NULL,
 603};
 604
 605ARMV7_EVENT_ATTR(mem_access, ARMV7_PERFCTR_MEM_ACCESS);
 606ARMV7_EVENT_ATTR(l1i_cache, ARMV7_PERFCTR_L1_ICACHE_ACCESS);
 607ARMV7_EVENT_ATTR(l1d_cache_wb, ARMV7_PERFCTR_L1_DCACHE_WB);
 608ARMV7_EVENT_ATTR(l2d_cache, ARMV7_PERFCTR_L2_CACHE_ACCESS);
 609ARMV7_EVENT_ATTR(l2d_cache_refill, ARMV7_PERFCTR_L2_CACHE_REFILL);
 610ARMV7_EVENT_ATTR(l2d_cache_wb, ARMV7_PERFCTR_L2_CACHE_WB);
 611ARMV7_EVENT_ATTR(bus_access, ARMV7_PERFCTR_BUS_ACCESS);
 612ARMV7_EVENT_ATTR(memory_error, ARMV7_PERFCTR_MEM_ERROR);
 613ARMV7_EVENT_ATTR(inst_spec, ARMV7_PERFCTR_INSTR_SPEC);
 614ARMV7_EVENT_ATTR(ttbr_write_retired, ARMV7_PERFCTR_TTBR_WRITE);
 615ARMV7_EVENT_ATTR(bus_cycles, ARMV7_PERFCTR_BUS_CYCLES);
 616
 617static struct attribute *armv7_pmuv2_event_attrs[] = {
 618	&armv7_event_attr_sw_incr.attr.attr,
 619	&armv7_event_attr_l1i_cache_refill.attr.attr,
 620	&armv7_event_attr_l1i_tlb_refill.attr.attr,
 621	&armv7_event_attr_l1d_cache_refill.attr.attr,
 622	&armv7_event_attr_l1d_cache.attr.attr,
 623	&armv7_event_attr_l1d_tlb_refill.attr.attr,
 624	&armv7_event_attr_ld_retired.attr.attr,
 625	&armv7_event_attr_st_retired.attr.attr,
 626	&armv7_event_attr_inst_retired.attr.attr,
 627	&armv7_event_attr_exc_taken.attr.attr,
 628	&armv7_event_attr_exc_return.attr.attr,
 629	&armv7_event_attr_cid_write_retired.attr.attr,
 630	&armv7_event_attr_pc_write_retired.attr.attr,
 631	&armv7_event_attr_br_immed_retired.attr.attr,
 632	&armv7_event_attr_br_return_retired.attr.attr,
 633	&armv7_event_attr_unaligned_ldst_retired.attr.attr,
 634	&armv7_event_attr_br_mis_pred.attr.attr,
 635	&armv7_event_attr_cpu_cycles.attr.attr,
 636	&armv7_event_attr_br_pred.attr.attr,
 637	&armv7_event_attr_mem_access.attr.attr,
 638	&armv7_event_attr_l1i_cache.attr.attr,
 639	&armv7_event_attr_l1d_cache_wb.attr.attr,
 640	&armv7_event_attr_l2d_cache.attr.attr,
 641	&armv7_event_attr_l2d_cache_refill.attr.attr,
 642	&armv7_event_attr_l2d_cache_wb.attr.attr,
 643	&armv7_event_attr_bus_access.attr.attr,
 644	&armv7_event_attr_memory_error.attr.attr,
 645	&armv7_event_attr_inst_spec.attr.attr,
 646	&armv7_event_attr_ttbr_write_retired.attr.attr,
 647	&armv7_event_attr_bus_cycles.attr.attr,
 648	NULL,
 649};
 650
 651static struct attribute_group armv7_pmuv2_events_attr_group = {
 652	.name = "events",
 653	.attrs = armv7_pmuv2_event_attrs,
 654};
 655
 656static const struct attribute_group *armv7_pmuv2_attr_groups[] = {
 657	&armv7_pmuv2_events_attr_group,
 658	&armv7_pmu_format_attr_group,
 659	NULL,
 660};
 661
 662/*
 663 * Perf Events' indices
 664 */
 665#define	ARMV7_IDX_CYCLE_COUNTER	0
 666#define	ARMV7_IDX_COUNTER0	1
 667#define	ARMV7_IDX_COUNTER_LAST(cpu_pmu) \
 668	(ARMV7_IDX_CYCLE_COUNTER + cpu_pmu->num_events - 1)
 669
 670#define	ARMV7_MAX_COUNTERS	32
 671#define	ARMV7_COUNTER_MASK	(ARMV7_MAX_COUNTERS - 1)
 672
 673/*
 674 * ARMv7 low level PMNC access
 675 */
 676
 677/*
 678 * Perf Event to low level counters mapping
 679 */
 680#define	ARMV7_IDX_TO_COUNTER(x)	\
 681	(((x) - ARMV7_IDX_COUNTER0) & ARMV7_COUNTER_MASK)
 682
 683/*
 684 * Per-CPU PMNC: config reg
 685 */
 686#define ARMV7_PMNC_E		(1 << 0) /* Enable all counters */
 687#define ARMV7_PMNC_P		(1 << 1) /* Reset all counters */
 688#define ARMV7_PMNC_C		(1 << 2) /* Cycle counter reset */
 689#define ARMV7_PMNC_D		(1 << 3) /* CCNT counts every 64th cpu cycle */
 690#define ARMV7_PMNC_X		(1 << 4) /* Export to ETM */
 691#define ARMV7_PMNC_DP		(1 << 5) /* Disable CCNT if non-invasive debug*/
 692#define	ARMV7_PMNC_N_SHIFT	11	 /* Number of counters supported */
 693#define	ARMV7_PMNC_N_MASK	0x1f
 694#define	ARMV7_PMNC_MASK		0x3f	 /* Mask for writable bits */
 695
 696/*
 697 * FLAG: counters overflow flag status reg
 698 */
 699#define	ARMV7_FLAG_MASK		0xffffffff	/* Mask for writable bits */
 700#define	ARMV7_OVERFLOWED_MASK	ARMV7_FLAG_MASK
 701
 702/*
 703 * PMXEVTYPER: Event selection reg
 704 */
 705#define	ARMV7_EVTYPE_MASK	0xc80000ff	/* Mask for writable bits */
 706#define	ARMV7_EVTYPE_EVENT	0xff		/* Mask for EVENT bits */
 707
 708/*
 709 * Event filters for PMUv2
 710 */
 711#define	ARMV7_EXCLUDE_PL1	(1 << 31)
 712#define	ARMV7_EXCLUDE_USER	(1 << 30)
 713#define	ARMV7_INCLUDE_HYP	(1 << 27)
 714
 715/*
 716 * Secure debug enable reg
 717 */
 718#define ARMV7_SDER_SUNIDEN	BIT(1) /* Permit non-invasive debug */
 719
 720static inline u32 armv7_pmnc_read(void)
 721{
 722	u32 val;
 723	asm volatile("mrc p15, 0, %0, c9, c12, 0" : "=r"(val));
 724	return val;
 725}
 726
 727static inline void armv7_pmnc_write(u32 val)
 728{
 729	val &= ARMV7_PMNC_MASK;
 730	isb();
 731	asm volatile("mcr p15, 0, %0, c9, c12, 0" : : "r"(val));
 732}
 733
 734static inline int armv7_pmnc_has_overflowed(u32 pmnc)
 735{
 736	return pmnc & ARMV7_OVERFLOWED_MASK;
 737}
 738
 739static inline int armv7_pmnc_counter_valid(struct arm_pmu *cpu_pmu, int idx)
 740{
 741	return idx >= ARMV7_IDX_CYCLE_COUNTER &&
 742		idx <= ARMV7_IDX_COUNTER_LAST(cpu_pmu);
 743}
 744
 745static inline int armv7_pmnc_counter_has_overflowed(u32 pmnc, int idx)
 746{
 747	return pmnc & BIT(ARMV7_IDX_TO_COUNTER(idx));
 748}
 749
 750static inline void armv7_pmnc_select_counter(int idx)
 751{
 752	u32 counter = ARMV7_IDX_TO_COUNTER(idx);
 753	asm volatile("mcr p15, 0, %0, c9, c12, 5" : : "r" (counter));
 754	isb();
 755}
 756
 757static inline u32 armv7pmu_read_counter(struct perf_event *event)
 758{
 759	struct arm_pmu *cpu_pmu = to_arm_pmu(event->pmu);
 760	struct hw_perf_event *hwc = &event->hw;
 761	int idx = hwc->idx;
 762	u32 value = 0;
 763
 764	if (!armv7_pmnc_counter_valid(cpu_pmu, idx)) {
 765		pr_err("CPU%u reading wrong counter %d\n",
 766			smp_processor_id(), idx);
 767	} else if (idx == ARMV7_IDX_CYCLE_COUNTER) {
 768		asm volatile("mrc p15, 0, %0, c9, c13, 0" : "=r" (value));
 769	} else {
 770		armv7_pmnc_select_counter(idx);
 771		asm volatile("mrc p15, 0, %0, c9, c13, 2" : "=r" (value));
 772	}
 773
 774	return value;
 775}
 776
 777static inline void armv7pmu_write_counter(struct perf_event *event, u32 value)
 778{
 779	struct arm_pmu *cpu_pmu = to_arm_pmu(event->pmu);
 780	struct hw_perf_event *hwc = &event->hw;
 781	int idx = hwc->idx;
 782
 783	if (!armv7_pmnc_counter_valid(cpu_pmu, idx)) {
 784		pr_err("CPU%u writing wrong counter %d\n",
 785			smp_processor_id(), idx);
 786	} else if (idx == ARMV7_IDX_CYCLE_COUNTER) {
 787		asm volatile("mcr p15, 0, %0, c9, c13, 0" : : "r" (value));
 788	} else {
 789		armv7_pmnc_select_counter(idx);
 790		asm volatile("mcr p15, 0, %0, c9, c13, 2" : : "r" (value));
 791	}
 792}
 793
 794static inline void armv7_pmnc_write_evtsel(int idx, u32 val)
 795{
 796	armv7_pmnc_select_counter(idx);
 797	val &= ARMV7_EVTYPE_MASK;
 798	asm volatile("mcr p15, 0, %0, c9, c13, 1" : : "r" (val));
 799}
 800
 801static inline void armv7_pmnc_enable_counter(int idx)
 802{
 803	u32 counter = ARMV7_IDX_TO_COUNTER(idx);
 804	asm volatile("mcr p15, 0, %0, c9, c12, 1" : : "r" (BIT(counter)));
 805}
 806
 807static inline void armv7_pmnc_disable_counter(int idx)
 808{
 809	u32 counter = ARMV7_IDX_TO_COUNTER(idx);
 810	asm volatile("mcr p15, 0, %0, c9, c12, 2" : : "r" (BIT(counter)));
 811}
 812
 813static inline void armv7_pmnc_enable_intens(int idx)
 814{
 815	u32 counter = ARMV7_IDX_TO_COUNTER(idx);
 816	asm volatile("mcr p15, 0, %0, c9, c14, 1" : : "r" (BIT(counter)));
 817}
 818
 819static inline void armv7_pmnc_disable_intens(int idx)
 820{
 821	u32 counter = ARMV7_IDX_TO_COUNTER(idx);
 822	asm volatile("mcr p15, 0, %0, c9, c14, 2" : : "r" (BIT(counter)));
 823	isb();
 824	/* Clear the overflow flag in case an interrupt is pending. */
 825	asm volatile("mcr p15, 0, %0, c9, c12, 3" : : "r" (BIT(counter)));
 826	isb();
 827}
 828
 829static inline u32 armv7_pmnc_getreset_flags(void)
 830{
 831	u32 val;
 832
 833	/* Read */
 834	asm volatile("mrc p15, 0, %0, c9, c12, 3" : "=r" (val));
 835
 836	/* Write to clear flags */
 837	val &= ARMV7_FLAG_MASK;
 838	asm volatile("mcr p15, 0, %0, c9, c12, 3" : : "r" (val));
 839
 840	return val;
 841}
 842
 843#ifdef DEBUG
 844static void armv7_pmnc_dump_regs(struct arm_pmu *cpu_pmu)
 845{
 846	u32 val;
 847	unsigned int cnt;
 848
 849	pr_info("PMNC registers dump:\n");
 850
 851	asm volatile("mrc p15, 0, %0, c9, c12, 0" : "=r" (val));
 852	pr_info("PMNC  =0x%08x\n", val);
 853
 854	asm volatile("mrc p15, 0, %0, c9, c12, 1" : "=r" (val));
 855	pr_info("CNTENS=0x%08x\n", val);
 856
 857	asm volatile("mrc p15, 0, %0, c9, c14, 1" : "=r" (val));
 858	pr_info("INTENS=0x%08x\n", val);
 859
 860	asm volatile("mrc p15, 0, %0, c9, c12, 3" : "=r" (val));
 861	pr_info("FLAGS =0x%08x\n", val);
 862
 863	asm volatile("mrc p15, 0, %0, c9, c12, 5" : "=r" (val));
 864	pr_info("SELECT=0x%08x\n", val);
 865
 866	asm volatile("mrc p15, 0, %0, c9, c13, 0" : "=r" (val));
 867	pr_info("CCNT  =0x%08x\n", val);
 868
 869	for (cnt = ARMV7_IDX_COUNTER0;
 870			cnt <= ARMV7_IDX_COUNTER_LAST(cpu_pmu); cnt++) {
 871		armv7_pmnc_select_counter(cnt);
 872		asm volatile("mrc p15, 0, %0, c9, c13, 2" : "=r" (val));
 873		pr_info("CNT[%d] count =0x%08x\n",
 874			ARMV7_IDX_TO_COUNTER(cnt), val);
 875		asm volatile("mrc p15, 0, %0, c9, c13, 1" : "=r" (val));
 876		pr_info("CNT[%d] evtsel=0x%08x\n",
 877			ARMV7_IDX_TO_COUNTER(cnt), val);
 878	}
 879}
 880#endif
 881
 882static void armv7pmu_enable_event(struct perf_event *event)
 883{
 884	unsigned long flags;
 885	struct hw_perf_event *hwc = &event->hw;
 886	struct arm_pmu *cpu_pmu = to_arm_pmu(event->pmu);
 887	struct pmu_hw_events *events = this_cpu_ptr(cpu_pmu->hw_events);
 888	int idx = hwc->idx;
 889
 890	if (!armv7_pmnc_counter_valid(cpu_pmu, idx)) {
 891		pr_err("CPU%u enabling wrong PMNC counter IRQ enable %d\n",
 892			smp_processor_id(), idx);
 893		return;
 894	}
 895
 896	/*
 897	 * Enable counter and interrupt, and set the counter to count
 898	 * the event that we're interested in.
 899	 */
 900	raw_spin_lock_irqsave(&events->pmu_lock, flags);
 901
 902	/*
 903	 * Disable counter
 904	 */
 905	armv7_pmnc_disable_counter(idx);
 906
 907	/*
 908	 * Set event (if destined for PMNx counters)
 909	 * We only need to set the event for the cycle counter if we
 910	 * have the ability to perform event filtering.
 911	 */
 912	if (cpu_pmu->set_event_filter || idx != ARMV7_IDX_CYCLE_COUNTER)
 913		armv7_pmnc_write_evtsel(idx, hwc->config_base);
 914
 915	/*
 916	 * Enable interrupt for this counter
 917	 */
 918	armv7_pmnc_enable_intens(idx);
 919
 920	/*
 921	 * Enable counter
 922	 */
 923	armv7_pmnc_enable_counter(idx);
 924
 925	raw_spin_unlock_irqrestore(&events->pmu_lock, flags);
 926}
 927
 928static void armv7pmu_disable_event(struct perf_event *event)
 929{
 930	unsigned long flags;
 931	struct hw_perf_event *hwc = &event->hw;
 932	struct arm_pmu *cpu_pmu = to_arm_pmu(event->pmu);
 933	struct pmu_hw_events *events = this_cpu_ptr(cpu_pmu->hw_events);
 934	int idx = hwc->idx;
 935
 936	if (!armv7_pmnc_counter_valid(cpu_pmu, idx)) {
 937		pr_err("CPU%u disabling wrong PMNC counter IRQ enable %d\n",
 938			smp_processor_id(), idx);
 939		return;
 940	}
 941
 942	/*
 943	 * Disable counter and interrupt
 944	 */
 945	raw_spin_lock_irqsave(&events->pmu_lock, flags);
 946
 947	/*
 948	 * Disable counter
 949	 */
 950	armv7_pmnc_disable_counter(idx);
 951
 952	/*
 953	 * Disable interrupt for this counter
 954	 */
 955	armv7_pmnc_disable_intens(idx);
 956
 957	raw_spin_unlock_irqrestore(&events->pmu_lock, flags);
 958}
 959
 960static irqreturn_t armv7pmu_handle_irq(int irq_num, void *dev)
 961{
 962	u32 pmnc;
 963	struct perf_sample_data data;
 964	struct arm_pmu *cpu_pmu = (struct arm_pmu *)dev;
 965	struct pmu_hw_events *cpuc = this_cpu_ptr(cpu_pmu->hw_events);
 966	struct pt_regs *regs;
 967	int idx;
 968
 969	/*
 970	 * Get and reset the IRQ flags
 971	 */
 972	pmnc = armv7_pmnc_getreset_flags();
 973
 974	/*
 975	 * Did an overflow occur?
 976	 */
 977	if (!armv7_pmnc_has_overflowed(pmnc))
 978		return IRQ_NONE;
 979
 980	/*
 981	 * Handle the counter(s) overflow(s)
 982	 */
 983	regs = get_irq_regs();
 984
 985	for (idx = 0; idx < cpu_pmu->num_events; ++idx) {
 986		struct perf_event *event = cpuc->events[idx];
 987		struct hw_perf_event *hwc;
 988
 989		/* Ignore if we don't have an event. */
 990		if (!event)
 991			continue;
 992
 993		/*
 994		 * We have a single interrupt for all counters. Check that
 995		 * each counter has overflowed before we process it.
 996		 */
 997		if (!armv7_pmnc_counter_has_overflowed(pmnc, idx))
 998			continue;
 999
1000		hwc = &event->hw;
1001		armpmu_event_update(event);
1002		perf_sample_data_init(&data, 0, hwc->last_period);
1003		if (!armpmu_event_set_period(event))
1004			continue;
1005
1006		if (perf_event_overflow(event, &data, regs))
1007			cpu_pmu->disable(event);
1008	}
1009
1010	/*
1011	 * Handle the pending perf events.
1012	 *
1013	 * Note: this call *must* be run with interrupts disabled. For
1014	 * platforms that can have the PMU interrupts raised as an NMI, this
1015	 * will not work.
1016	 */
1017	irq_work_run();
1018
1019	return IRQ_HANDLED;
1020}
1021
1022static void armv7pmu_start(struct arm_pmu *cpu_pmu)
1023{
1024	unsigned long flags;
1025	struct pmu_hw_events *events = this_cpu_ptr(cpu_pmu->hw_events);
1026
1027	raw_spin_lock_irqsave(&events->pmu_lock, flags);
1028	/* Enable all counters */
1029	armv7_pmnc_write(armv7_pmnc_read() | ARMV7_PMNC_E);
1030	raw_spin_unlock_irqrestore(&events->pmu_lock, flags);
1031}
1032
1033static void armv7pmu_stop(struct arm_pmu *cpu_pmu)
1034{
1035	unsigned long flags;
1036	struct pmu_hw_events *events = this_cpu_ptr(cpu_pmu->hw_events);
1037
1038	raw_spin_lock_irqsave(&events->pmu_lock, flags);
1039	/* Disable all counters */
1040	armv7_pmnc_write(armv7_pmnc_read() & ~ARMV7_PMNC_E);
1041	raw_spin_unlock_irqrestore(&events->pmu_lock, flags);
1042}
1043
1044static int armv7pmu_get_event_idx(struct pmu_hw_events *cpuc,
1045				  struct perf_event *event)
1046{
1047	int idx;
1048	struct arm_pmu *cpu_pmu = to_arm_pmu(event->pmu);
1049	struct hw_perf_event *hwc = &event->hw;
1050	unsigned long evtype = hwc->config_base & ARMV7_EVTYPE_EVENT;
1051
1052	/* Always place a cycle counter into the cycle counter. */
1053	if (evtype == ARMV7_PERFCTR_CPU_CYCLES) {
1054		if (test_and_set_bit(ARMV7_IDX_CYCLE_COUNTER, cpuc->used_mask))
1055			return -EAGAIN;
1056
1057		return ARMV7_IDX_CYCLE_COUNTER;
1058	}
1059
1060	/*
1061	 * For anything other than a cycle counter, try and use
1062	 * the events counters
1063	 */
1064	for (idx = ARMV7_IDX_COUNTER0; idx < cpu_pmu->num_events; ++idx) {
1065		if (!test_and_set_bit(idx, cpuc->used_mask))
1066			return idx;
1067	}
1068
1069	/* The counters are all in use. */
1070	return -EAGAIN;
1071}
1072
1073/*
1074 * Add an event filter to a given event. This will only work for PMUv2 PMUs.
1075 */
1076static int armv7pmu_set_event_filter(struct hw_perf_event *event,
1077				     struct perf_event_attr *attr)
1078{
1079	unsigned long config_base = 0;
1080
1081	if (attr->exclude_idle)
1082		return -EPERM;
1083	if (attr->exclude_user)
1084		config_base |= ARMV7_EXCLUDE_USER;
1085	if (attr->exclude_kernel)
1086		config_base |= ARMV7_EXCLUDE_PL1;
1087	if (!attr->exclude_hv)
1088		config_base |= ARMV7_INCLUDE_HYP;
1089
1090	/*
1091	 * Install the filter into config_base as this is used to
1092	 * construct the event type.
1093	 */
1094	event->config_base = config_base;
1095
1096	return 0;
1097}
1098
1099static void armv7pmu_reset(void *info)
1100{
1101	struct arm_pmu *cpu_pmu = (struct arm_pmu *)info;
1102	u32 idx, nb_cnt = cpu_pmu->num_events, val;
1103
1104	if (cpu_pmu->secure_access) {
1105		asm volatile("mrc p15, 0, %0, c1, c1, 1" : "=r" (val));
1106		val |= ARMV7_SDER_SUNIDEN;
1107		asm volatile("mcr p15, 0, %0, c1, c1, 1" : : "r" (val));
1108	}
1109
1110	/* The counter and interrupt enable registers are unknown at reset. */
1111	for (idx = ARMV7_IDX_CYCLE_COUNTER; idx < nb_cnt; ++idx) {
1112		armv7_pmnc_disable_counter(idx);
1113		armv7_pmnc_disable_intens(idx);
1114	}
1115
1116	/* Initialize & Reset PMNC: C and P bits */
1117	armv7_pmnc_write(ARMV7_PMNC_P | ARMV7_PMNC_C);
1118}
1119
1120static int armv7_a8_map_event(struct perf_event *event)
1121{
1122	return armpmu_map_event(event, &armv7_a8_perf_map,
1123				&armv7_a8_perf_cache_map, 0xFF);
1124}
1125
1126static int armv7_a9_map_event(struct perf_event *event)
1127{
1128	return armpmu_map_event(event, &armv7_a9_perf_map,
1129				&armv7_a9_perf_cache_map, 0xFF);
1130}
1131
1132static int armv7_a5_map_event(struct perf_event *event)
1133{
1134	return armpmu_map_event(event, &armv7_a5_perf_map,
1135				&armv7_a5_perf_cache_map, 0xFF);
1136}
1137
1138static int armv7_a15_map_event(struct perf_event *event)
1139{
1140	return armpmu_map_event(event, &armv7_a15_perf_map,
1141				&armv7_a15_perf_cache_map, 0xFF);
1142}
1143
1144static int armv7_a7_map_event(struct perf_event *event)
1145{
1146	return armpmu_map_event(event, &armv7_a7_perf_map,
1147				&armv7_a7_perf_cache_map, 0xFF);
1148}
1149
1150static int armv7_a12_map_event(struct perf_event *event)
1151{
1152	return armpmu_map_event(event, &armv7_a12_perf_map,
1153				&armv7_a12_perf_cache_map, 0xFF);
1154}
1155
1156static int krait_map_event(struct perf_event *event)
1157{
1158	return armpmu_map_event(event, &krait_perf_map,
1159				&krait_perf_cache_map, 0xFFFFF);
1160}
1161
1162static int krait_map_event_no_branch(struct perf_event *event)
1163{
1164	return armpmu_map_event(event, &krait_perf_map_no_branch,
1165				&krait_perf_cache_map, 0xFFFFF);
1166}
1167
1168static int scorpion_map_event(struct perf_event *event)
1169{
1170	return armpmu_map_event(event, &scorpion_perf_map,
1171				&scorpion_perf_cache_map, 0xFFFFF);
1172}
1173
1174static void armv7pmu_init(struct arm_pmu *cpu_pmu)
1175{
1176	cpu_pmu->handle_irq	= armv7pmu_handle_irq;
1177	cpu_pmu->enable		= armv7pmu_enable_event;
1178	cpu_pmu->disable	= armv7pmu_disable_event;
1179	cpu_pmu->read_counter	= armv7pmu_read_counter;
1180	cpu_pmu->write_counter	= armv7pmu_write_counter;
1181	cpu_pmu->get_event_idx	= armv7pmu_get_event_idx;
1182	cpu_pmu->start		= armv7pmu_start;
1183	cpu_pmu->stop		= armv7pmu_stop;
1184	cpu_pmu->reset		= armv7pmu_reset;
1185	cpu_pmu->max_period	= (1LLU << 32) - 1;
1186};
1187
1188static void armv7_read_num_pmnc_events(void *info)
1189{
1190	int *nb_cnt = info;
1191
1192	/* Read the nb of CNTx counters supported from PMNC */
1193	*nb_cnt = (armv7_pmnc_read() >> ARMV7_PMNC_N_SHIFT) & ARMV7_PMNC_N_MASK;
1194
1195	/* Add the CPU cycles counter */
1196	*nb_cnt += 1;
1197}
1198
1199static int armv7_probe_num_events(struct arm_pmu *arm_pmu)
1200{
1201	return smp_call_function_any(&arm_pmu->supported_cpus,
1202				     armv7_read_num_pmnc_events,
1203				     &arm_pmu->num_events, 1);
1204}
1205
1206static int armv7_a8_pmu_init(struct arm_pmu *cpu_pmu)
1207{
1208	armv7pmu_init(cpu_pmu);
1209	cpu_pmu->name		= "armv7_cortex_a8";
1210	cpu_pmu->map_event	= armv7_a8_map_event;
1211	cpu_pmu->pmu.attr_groups = armv7_pmuv1_attr_groups;
1212	return armv7_probe_num_events(cpu_pmu);
1213}
1214
1215static int armv7_a9_pmu_init(struct arm_pmu *cpu_pmu)
1216{
1217	armv7pmu_init(cpu_pmu);
1218	cpu_pmu->name		= "armv7_cortex_a9";
1219	cpu_pmu->map_event	= armv7_a9_map_event;
1220	cpu_pmu->pmu.attr_groups = armv7_pmuv1_attr_groups;
1221	return armv7_probe_num_events(cpu_pmu);
1222}
1223
1224static int armv7_a5_pmu_init(struct arm_pmu *cpu_pmu)
1225{
1226	armv7pmu_init(cpu_pmu);
1227	cpu_pmu->name		= "armv7_cortex_a5";
1228	cpu_pmu->map_event	= armv7_a5_map_event;
1229	cpu_pmu->pmu.attr_groups = armv7_pmuv1_attr_groups;
1230	return armv7_probe_num_events(cpu_pmu);
1231}
1232
1233static int armv7_a15_pmu_init(struct arm_pmu *cpu_pmu)
1234{
1235	armv7pmu_init(cpu_pmu);
1236	cpu_pmu->name		= "armv7_cortex_a15";
1237	cpu_pmu->map_event	= armv7_a15_map_event;
1238	cpu_pmu->set_event_filter = armv7pmu_set_event_filter;
1239	cpu_pmu->pmu.attr_groups = armv7_pmuv2_attr_groups;
1240	return armv7_probe_num_events(cpu_pmu);
1241}
1242
1243static int armv7_a7_pmu_init(struct arm_pmu *cpu_pmu)
1244{
1245	armv7pmu_init(cpu_pmu);
1246	cpu_pmu->name		= "armv7_cortex_a7";
1247	cpu_pmu->map_event	= armv7_a7_map_event;
1248	cpu_pmu->set_event_filter = armv7pmu_set_event_filter;
1249	cpu_pmu->pmu.attr_groups = armv7_pmuv2_attr_groups;
1250	return armv7_probe_num_events(cpu_pmu);
1251}
1252
1253static int armv7_a12_pmu_init(struct arm_pmu *cpu_pmu)
1254{
1255	armv7pmu_init(cpu_pmu);
1256	cpu_pmu->name		= "armv7_cortex_a12";
1257	cpu_pmu->map_event	= armv7_a12_map_event;
1258	cpu_pmu->set_event_filter = armv7pmu_set_event_filter;
1259	cpu_pmu->pmu.attr_groups = armv7_pmuv2_attr_groups;
1260	return armv7_probe_num_events(cpu_pmu);
1261}
1262
1263static int armv7_a17_pmu_init(struct arm_pmu *cpu_pmu)
1264{
1265	int ret = armv7_a12_pmu_init(cpu_pmu);
1266	cpu_pmu->name = "armv7_cortex_a17";
1267	cpu_pmu->pmu.attr_groups = armv7_pmuv2_attr_groups;
1268	return ret;
1269}
1270
1271/*
1272 * Krait Performance Monitor Region Event Selection Register (PMRESRn)
1273 *
1274 *            31   30     24     16     8      0
1275 *            +--------------------------------+
1276 *  PMRESR0   | EN |  CC  |  CC  |  CC  |  CC  |   N = 1, R = 0
1277 *            +--------------------------------+
1278 *  PMRESR1   | EN |  CC  |  CC  |  CC  |  CC  |   N = 1, R = 1
1279 *            +--------------------------------+
1280 *  PMRESR2   | EN |  CC  |  CC  |  CC  |  CC  |   N = 1, R = 2
1281 *            +--------------------------------+
1282 *  VPMRESR0  | EN |  CC  |  CC  |  CC  |  CC  |   N = 2, R = ?
1283 *            +--------------------------------+
1284 *              EN | G=3  | G=2  | G=1  | G=0
1285 *
1286 *  Event Encoding:
1287 *
1288 *      hwc->config_base = 0xNRCCG
1289 *
1290 *      N  = prefix, 1 for Krait CPU (PMRESRn), 2 for Venum VFP (VPMRESR)
1291 *      R  = region register
1292 *      CC = class of events the group G is choosing from
1293 *      G  = group or particular event
1294 *
1295 *  Example: 0x12021 is a Krait CPU event in PMRESR2's group 1 with code 2
1296 *
1297 *  A region (R) corresponds to a piece of the CPU (execution unit, instruction
1298 *  unit, etc.) while the event code (CC) corresponds to a particular class of
1299 *  events (interrupts for example). An event code is broken down into
1300 *  groups (G) that can be mapped into the PMU (irq, fiqs, and irq+fiqs for
1301 *  example).
1302 */
1303
1304#define KRAIT_EVENT		(1 << 16)
1305#define VENUM_EVENT		(2 << 16)
1306#define KRAIT_EVENT_MASK	(KRAIT_EVENT | VENUM_EVENT)
1307#define PMRESRn_EN		BIT(31)
1308
1309#define EVENT_REGION(event)	(((event) >> 12) & 0xf)		/* R */
1310#define EVENT_GROUP(event)	((event) & 0xf)			/* G */
1311#define EVENT_CODE(event)	(((event) >> 4) & 0xff)		/* CC */
1312#define EVENT_VENUM(event)	(!!(event & VENUM_EVENT))	/* N=2 */
1313#define EVENT_CPU(event)	(!!(event & KRAIT_EVENT))	/* N=1 */
1314
1315static u32 krait_read_pmresrn(int n)
1316{
1317	u32 val;
1318
1319	switch (n) {
1320	case 0:
1321		asm volatile("mrc p15, 1, %0, c9, c15, 0" : "=r" (val));
1322		break;
1323	case 1:
1324		asm volatile("mrc p15, 1, %0, c9, c15, 1" : "=r" (val));
1325		break;
1326	case 2:
1327		asm volatile("mrc p15, 1, %0, c9, c15, 2" : "=r" (val));
1328		break;
1329	default:
1330		BUG(); /* Should be validated in krait_pmu_get_event_idx() */
1331	}
1332
1333	return val;
1334}
1335
1336static void krait_write_pmresrn(int n, u32 val)
1337{
1338	switch (n) {
1339	case 0:
1340		asm volatile("mcr p15, 1, %0, c9, c15, 0" : : "r" (val));
1341		break;
1342	case 1:
1343		asm volatile("mcr p15, 1, %0, c9, c15, 1" : : "r" (val));
1344		break;
1345	case 2:
1346		asm volatile("mcr p15, 1, %0, c9, c15, 2" : : "r" (val));
1347		break;
1348	default:
1349		BUG(); /* Should be validated in krait_pmu_get_event_idx() */
1350	}
1351}
1352
1353static u32 venum_read_pmresr(void)
1354{
1355	u32 val;
1356	asm volatile("mrc p10, 7, %0, c11, c0, 0" : "=r" (val));
1357	return val;
1358}
1359
1360static void venum_write_pmresr(u32 val)
1361{
1362	asm volatile("mcr p10, 7, %0, c11, c0, 0" : : "r" (val));
1363}
1364
1365static void venum_pre_pmresr(u32 *venum_orig_val, u32 *fp_orig_val)
1366{
1367	u32 venum_new_val;
1368	u32 fp_new_val;
1369
1370	BUG_ON(preemptible());
1371	/* CPACR Enable CP10 and CP11 access */
1372	*venum_orig_val = get_copro_access();
1373	venum_new_val = *venum_orig_val | CPACC_SVC(10) | CPACC_SVC(11);
1374	set_copro_access(venum_new_val);
1375
1376	/* Enable FPEXC */
1377	*fp_orig_val = fmrx(FPEXC);
1378	fp_new_val = *fp_orig_val | FPEXC_EN;
1379	fmxr(FPEXC, fp_new_val);
1380}
1381
1382static void venum_post_pmresr(u32 venum_orig_val, u32 fp_orig_val)
1383{
1384	BUG_ON(preemptible());
1385	/* Restore FPEXC */
1386	fmxr(FPEXC, fp_orig_val);
1387	isb();
1388	/* Restore CPACR */
1389	set_copro_access(venum_orig_val);
1390}
1391
1392static u32 krait_get_pmresrn_event(unsigned int region)
1393{
1394	static const u32 pmresrn_table[] = { KRAIT_PMRESR0_GROUP0,
1395					     KRAIT_PMRESR1_GROUP0,
1396					     KRAIT_PMRESR2_GROUP0 };
1397	return pmresrn_table[region];
1398}
1399
1400static void krait_evt_setup(int idx, u32 config_base)
1401{
1402	u32 val;
1403	u32 mask;
1404	u32 vval, fval;
1405	unsigned int region = EVENT_REGION(config_base);
1406	unsigned int group = EVENT_GROUP(config_base);
1407	unsigned int code = EVENT_CODE(config_base);
1408	unsigned int group_shift;
1409	bool venum_event = EVENT_VENUM(config_base);
1410
1411	group_shift = group * 8;
1412	mask = 0xff << group_shift;
1413
1414	/* Configure evtsel for the region and group */
1415	if (venum_event)
1416		val = KRAIT_VPMRESR0_GROUP0;
1417	else
1418		val = krait_get_pmresrn_event(region);
1419	val += group;
1420	/* Mix in mode-exclusion bits */
1421	val |= config_base & (ARMV7_EXCLUDE_USER | ARMV7_EXCLUDE_PL1);
1422	armv7_pmnc_write_evtsel(idx, val);
1423
1424	if (venum_event) {
1425		venum_pre_pmresr(&vval, &fval);
1426		val = venum_read_pmresr();
1427		val &= ~mask;
1428		val |= code << group_shift;
1429		val |= PMRESRn_EN;
1430		venum_write_pmresr(val);
1431		venum_post_pmresr(vval, fval);
1432	} else {
1433		val = krait_read_pmresrn(region);
1434		val &= ~mask;
1435		val |= code << group_shift;
1436		val |= PMRESRn_EN;
1437		krait_write_pmresrn(region, val);
1438	}
1439}
1440
1441static u32 clear_pmresrn_group(u32 val, int group)
1442{
1443	u32 mask;
1444	int group_shift;
1445
1446	group_shift = group * 8;
1447	mask = 0xff << group_shift;
1448	val &= ~mask;
1449
1450	/* Don't clear enable bit if entire region isn't disabled */
1451	if (val & ~PMRESRn_EN)
1452		return val |= PMRESRn_EN;
1453
1454	return 0;
1455}
1456
1457static void krait_clearpmu(u32 config_base)
1458{
1459	u32 val;
1460	u32 vval, fval;
1461	unsigned int region = EVENT_REGION(config_base);
1462	unsigned int group = EVENT_GROUP(config_base);
1463	bool venum_event = EVENT_VENUM(config_base);
1464
1465	if (venum_event) {
1466		venum_pre_pmresr(&vval, &fval);
1467		val = venum_read_pmresr();
1468		val = clear_pmresrn_group(val, group);
1469		venum_write_pmresr(val);
1470		venum_post_pmresr(vval, fval);
1471	} else {
1472		val = krait_read_pmresrn(region);
1473		val = clear_pmresrn_group(val, group);
1474		krait_write_pmresrn(region, val);
1475	}
1476}
1477
1478static void krait_pmu_disable_event(struct perf_event *event)
1479{
1480	unsigned long flags;
1481	struct hw_perf_event *hwc = &event->hw;
1482	int idx = hwc->idx;
1483	struct arm_pmu *cpu_pmu = to_arm_pmu(event->pmu);
1484	struct pmu_hw_events *events = this_cpu_ptr(cpu_pmu->hw_events);
1485
1486	/* Disable counter and interrupt */
1487	raw_spin_lock_irqsave(&events->pmu_lock, flags);
1488
1489	/* Disable counter */
1490	armv7_pmnc_disable_counter(idx);
1491
1492	/*
1493	 * Clear pmresr code (if destined for PMNx counters)
1494	 */
1495	if (hwc->config_base & KRAIT_EVENT_MASK)
1496		krait_clearpmu(hwc->config_base);
1497
1498	/* Disable interrupt for this counter */
1499	armv7_pmnc_disable_intens(idx);
1500
1501	raw_spin_unlock_irqrestore(&events->pmu_lock, flags);
1502}
1503
1504static void krait_pmu_enable_event(struct perf_event *event)
1505{
1506	unsigned long flags;
1507	struct hw_perf_event *hwc = &event->hw;
1508	int idx = hwc->idx;
1509	struct arm_pmu *cpu_pmu = to_arm_pmu(event->pmu);
1510	struct pmu_hw_events *events = this_cpu_ptr(cpu_pmu->hw_events);
1511
1512	/*
1513	 * Enable counter and interrupt, and set the counter to count
1514	 * the event that we're interested in.
1515	 */
1516	raw_spin_lock_irqsave(&events->pmu_lock, flags);
1517
1518	/* Disable counter */
1519	armv7_pmnc_disable_counter(idx);
1520
1521	/*
1522	 * Set event (if destined for PMNx counters)
1523	 * We set the event for the cycle counter because we
1524	 * have the ability to perform event filtering.
1525	 */
1526	if (hwc->config_base & KRAIT_EVENT_MASK)
1527		krait_evt_setup(idx, hwc->config_base);
1528	else
1529		armv7_pmnc_write_evtsel(idx, hwc->config_base);
1530
1531	/* Enable interrupt for this counter */
1532	armv7_pmnc_enable_intens(idx);
1533
1534	/* Enable counter */
1535	armv7_pmnc_enable_counter(idx);
1536
1537	raw_spin_unlock_irqrestore(&events->pmu_lock, flags);
1538}
1539
1540static void krait_pmu_reset(void *info)
1541{
1542	u32 vval, fval;
1543	struct arm_pmu *cpu_pmu = info;
1544	u32 idx, nb_cnt = cpu_pmu->num_events;
1545
1546	armv7pmu_reset(info);
1547
1548	/* Clear all pmresrs */
1549	krait_write_pmresrn(0, 0);
1550	krait_write_pmresrn(1, 0);
1551	krait_write_pmresrn(2, 0);
1552
1553	venum_pre_pmresr(&vval, &fval);
1554	venum_write_pmresr(0);
1555	venum_post_pmresr(vval, fval);
1556
1557	/* Reset PMxEVNCTCR to sane default */
1558	for (idx = ARMV7_IDX_CYCLE_COUNTER; idx < nb_cnt; ++idx) {
1559		armv7_pmnc_select_counter(idx);
1560		asm volatile("mcr p15, 0, %0, c9, c15, 0" : : "r" (0));
1561	}
1562
1563}
1564
1565static int krait_event_to_bit(struct perf_event *event, unsigned int region,
1566			      unsigned int group)
1567{
1568	int bit;
1569	struct hw_perf_event *hwc = &event->hw;
1570	struct arm_pmu *cpu_pmu = to_arm_pmu(event->pmu);
1571
1572	if (hwc->config_base & VENUM_EVENT)
1573		bit = KRAIT_VPMRESR0_GROUP0;
1574	else
1575		bit = krait_get_pmresrn_event(region);
1576	bit -= krait_get_pmresrn_event(0);
1577	bit += group;
1578	/*
1579	 * Lower bits are reserved for use by the counters (see
1580	 * armv7pmu_get_event_idx() for more info)
1581	 */
1582	bit += ARMV7_IDX_COUNTER_LAST(cpu_pmu) + 1;
1583
1584	return bit;
1585}
1586
1587/*
1588 * We check for column exclusion constraints here.
1589 * Two events cant use the same group within a pmresr register.
1590 */
1591static int krait_pmu_get_event_idx(struct pmu_hw_events *cpuc,
1592				   struct perf_event *event)
1593{
1594	int idx;
1595	int bit = -1;
1596	struct hw_perf_event *hwc = &event->hw;
1597	unsigned int region = EVENT_REGION(hwc->config_base);
1598	unsigned int code = EVENT_CODE(hwc->config_base);
1599	unsigned int group = EVENT_GROUP(hwc->config_base);
1600	bool venum_event = EVENT_VENUM(hwc->config_base);
1601	bool krait_event = EVENT_CPU(hwc->config_base);
1602
1603	if (venum_event || krait_event) {
1604		/* Ignore invalid events */
1605		if (group > 3 || region > 2)
1606			return -EINVAL;
1607		if (venum_event && (code & 0xe0))
1608			return -EINVAL;
1609
1610		bit = krait_event_to_bit(event, region, group);
1611		if (test_and_set_bit(bit, cpuc->used_mask))
1612			return -EAGAIN;
1613	}
1614
1615	idx = armv7pmu_get_event_idx(cpuc, event);
1616	if (idx < 0 && bit >= 0)
1617		clear_bit(bit, cpuc->used_mask);
1618
1619	return idx;
1620}
1621
1622static void krait_pmu_clear_event_idx(struct pmu_hw_events *cpuc,
1623				      struct perf_event *event)
1624{
1625	int bit;
1626	struct hw_perf_event *hwc = &event->hw;
1627	unsigned int region = EVENT_REGION(hwc->config_base);
1628	unsigned int group = EVENT_GROUP(hwc->config_base);
1629	bool venum_event = EVENT_VENUM(hwc->config_base);
1630	bool krait_event = EVENT_CPU(hwc->config_base);
1631
1632	if (venum_event || krait_event) {
1633		bit = krait_event_to_bit(event, region, group);
1634		clear_bit(bit, cpuc->used_mask);
1635	}
1636}
1637
1638static int krait_pmu_init(struct arm_pmu *cpu_pmu)
1639{
1640	armv7pmu_init(cpu_pmu);
1641	cpu_pmu->name		= "armv7_krait";
1642	/* Some early versions of Krait don't support PC write events */
1643	if (of_property_read_bool(cpu_pmu->plat_device->dev.of_node,
1644				  "qcom,no-pc-write"))
1645		cpu_pmu->map_event = krait_map_event_no_branch;
1646	else
1647		cpu_pmu->map_event = krait_map_event;
1648	cpu_pmu->set_event_filter = armv7pmu_set_event_filter;
1649	cpu_pmu->reset		= krait_pmu_reset;
1650	cpu_pmu->enable		= krait_pmu_enable_event;
1651	cpu_pmu->disable	= krait_pmu_disable_event;
1652	cpu_pmu->get_event_idx	= krait_pmu_get_event_idx;
1653	cpu_pmu->clear_event_idx = krait_pmu_clear_event_idx;
1654	return armv7_probe_num_events(cpu_pmu);
1655}
1656
1657/*
1658 * Scorpion Local Performance Monitor Register (LPMn)
1659 *
1660 *            31   30     24     16     8      0
1661 *            +--------------------------------+
1662 *  LPM0      | EN |  CC  |  CC  |  CC  |  CC  |   N = 1, R = 0
1663 *            +--------------------------------+
1664 *  LPM1      | EN |  CC  |  CC  |  CC  |  CC  |   N = 1, R = 1
1665 *            +--------------------------------+
1666 *  LPM2      | EN |  CC  |  CC  |  CC  |  CC  |   N = 1, R = 2
1667 *            +--------------------------------+
1668 *  L2LPM     | EN |  CC  |  CC  |  CC  |  CC  |   N = 1, R = 3
1669 *            +--------------------------------+
1670 *  VLPM      | EN |  CC  |  CC  |  CC  |  CC  |   N = 2, R = ?
1671 *            +--------------------------------+
1672 *              EN | G=3  | G=2  | G=1  | G=0
1673 *
1674 *
1675 *  Event Encoding:
1676 *
1677 *      hwc->config_base = 0xNRCCG
1678 *
1679 *      N  = prefix, 1 for Scorpion CPU (LPMn/L2LPM), 2 for Venum VFP (VLPM)
1680 *      R  = region register
1681 *      CC = class of events the group G is choosing from
1682 *      G  = group or particular event
1683 *
1684 *  Example: 0x12021 is a Scorpion CPU event in LPM2's group 1 with code 2
1685 *
1686 *  A region (R) corresponds to a piece of the CPU (execution unit, instruction
1687 *  unit, etc.) while the event code (CC) corresponds to a particular class of
1688 *  events (interrupts for example). An event code is broken down into
1689 *  groups (G) that can be mapped into the PMU (irq, fiqs, and irq+fiqs for
1690 *  example).
1691 */
1692
1693static u32 scorpion_read_pmresrn(int n)
1694{
1695	u32 val;
1696
1697	switch (n) {
1698	case 0:
1699		asm volatile("mrc p15, 0, %0, c15, c0, 0" : "=r" (val));
1700		break;
1701	case 1:
1702		asm volatile("mrc p15, 1, %0, c15, c0, 0" : "=r" (val));
1703		break;
1704	case 2:
1705		asm volatile("mrc p15, 2, %0, c15, c0, 0" : "=r" (val));
1706		break;
1707	case 3:
1708		asm volatile("mrc p15, 3, %0, c15, c2, 0" : "=r" (val));
1709		break;
1710	default:
1711		BUG(); /* Should be validated in scorpion_pmu_get_event_idx() */
1712	}
1713
1714	return val;
1715}
1716
1717static void scorpion_write_pmresrn(int n, u32 val)
1718{
1719	switch (n) {
1720	case 0:
1721		asm volatile("mcr p15, 0, %0, c15, c0, 0" : : "r" (val));
1722		break;
1723	case 1:
1724		asm volatile("mcr p15, 1, %0, c15, c0, 0" : : "r" (val));
1725		break;
1726	case 2:
1727		asm volatile("mcr p15, 2, %0, c15, c0, 0" : : "r" (val));
1728		break;
1729	case 3:
1730		asm volatile("mcr p15, 3, %0, c15, c2, 0" : : "r" (val));
1731		break;
1732	default:
1733		BUG(); /* Should be validated in scorpion_pmu_get_event_idx() */
1734	}
1735}
1736
1737static u32 scorpion_get_pmresrn_event(unsigned int region)
1738{
1739	static const u32 pmresrn_table[] = { SCORPION_LPM0_GROUP0,
1740					     SCORPION_LPM1_GROUP0,
1741					     SCORPION_LPM2_GROUP0,
1742					     SCORPION_L2LPM_GROUP0 };
1743	return pmresrn_table[region];
1744}
1745
1746static void scorpion_evt_setup(int idx, u32 config_base)
1747{
1748	u32 val;
1749	u32 mask;
1750	u32 vval, fval;
1751	unsigned int region = EVENT_REGION(config_base);
1752	unsigned int group = EVENT_GROUP(config_base);
1753	unsigned int code = EVENT_CODE(config_base);
1754	unsigned int group_shift;
1755	bool venum_event = EVENT_VENUM(config_base);
1756
1757	group_shift = group * 8;
1758	mask = 0xff << group_shift;
1759
1760	/* Configure evtsel for the region and group */
1761	if (venum_event)
1762		val = SCORPION_VLPM_GROUP0;
1763	else
1764		val = scorpion_get_pmresrn_event(region);
1765	val += group;
1766	/* Mix in mode-exclusion bits */
1767	val |= config_base & (ARMV7_EXCLUDE_USER | ARMV7_EXCLUDE_PL1);
1768	armv7_pmnc_write_evtsel(idx, val);
1769
1770	asm volatile("mcr p15, 0, %0, c9, c15, 0" : : "r" (0));
1771
1772	if (venum_event) {
1773		venum_pre_pmresr(&vval, &fval);
1774		val = venum_read_pmresr();
1775		val &= ~mask;
1776		val |= code << group_shift;
1777		val |= PMRESRn_EN;
1778		venum_write_pmresr(val);
1779		venum_post_pmresr(vval, fval);
1780	} else {
1781		val = scorpion_read_pmresrn(region);
1782		val &= ~mask;
1783		val |= code << group_shift;
1784		val |= PMRESRn_EN;
1785		scorpion_write_pmresrn(region, val);
1786	}
1787}
1788
1789static void scorpion_clearpmu(u32 config_base)
1790{
1791	u32 val;
1792	u32 vval, fval;
1793	unsigned int region = EVENT_REGION(config_base);
1794	unsigned int group = EVENT_GROUP(config_base);
1795	bool venum_event = EVENT_VENUM(config_base);
1796
1797	if (venum_event) {
1798		venum_pre_pmresr(&vval, &fval);
1799		val = venum_read_pmresr();
1800		val = clear_pmresrn_group(val, group);
1801		venum_write_pmresr(val);
1802		venum_post_pmresr(vval, fval);
1803	} else {
1804		val = scorpion_read_pmresrn(region);
1805		val = clear_pmresrn_group(val, group);
1806		scorpion_write_pmresrn(region, val);
1807	}
1808}
1809
1810static void scorpion_pmu_disable_event(struct perf_event *event)
1811{
1812	unsigned long flags;
1813	struct hw_perf_event *hwc = &event->hw;
1814	int idx = hwc->idx;
1815	struct arm_pmu *cpu_pmu = to_arm_pmu(event->pmu);
1816	struct pmu_hw_events *events = this_cpu_ptr(cpu_pmu->hw_events);
1817
1818	/* Disable counter and interrupt */
1819	raw_spin_lock_irqsave(&events->pmu_lock, flags);
1820
1821	/* Disable counter */
1822	armv7_pmnc_disable_counter(idx);
1823
1824	/*
1825	 * Clear pmresr code (if destined for PMNx counters)
1826	 */
1827	if (hwc->config_base & KRAIT_EVENT_MASK)
1828		scorpion_clearpmu(hwc->config_base);
1829
1830	/* Disable interrupt for this counter */
1831	armv7_pmnc_disable_intens(idx);
1832
1833	raw_spin_unlock_irqrestore(&events->pmu_lock, flags);
1834}
1835
1836static void scorpion_pmu_enable_event(struct perf_event *event)
1837{
1838	unsigned long flags;
1839	struct hw_perf_event *hwc = &event->hw;
1840	int idx = hwc->idx;
1841	struct arm_pmu *cpu_pmu = to_arm_pmu(event->pmu);
1842	struct pmu_hw_events *events = this_cpu_ptr(cpu_pmu->hw_events);
1843
1844	/*
1845	 * Enable counter and interrupt, and set the counter to count
1846	 * the event that we're interested in.
1847	 */
1848	raw_spin_lock_irqsave(&events->pmu_lock, flags);
1849
1850	/* Disable counter */
1851	armv7_pmnc_disable_counter(idx);
1852
1853	/*
1854	 * Set event (if destined for PMNx counters)
1855	 * We don't set the event for the cycle counter because we
1856	 * don't have the ability to perform event filtering.
1857	 */
1858	if (hwc->config_base & KRAIT_EVENT_MASK)
1859		scorpion_evt_setup(idx, hwc->config_base);
1860	else if (idx != ARMV7_IDX_CYCLE_COUNTER)
1861		armv7_pmnc_write_evtsel(idx, hwc->config_base);
1862
1863	/* Enable interrupt for this counter */
1864	armv7_pmnc_enable_intens(idx);
1865
1866	/* Enable counter */
1867	armv7_pmnc_enable_counter(idx);
1868
1869	raw_spin_unlock_irqrestore(&events->pmu_lock, flags);
1870}
1871
1872static void scorpion_pmu_reset(void *info)
1873{
1874	u32 vval, fval;
1875	struct arm_pmu *cpu_pmu = info;
1876	u32 idx, nb_cnt = cpu_pmu->num_events;
1877
1878	armv7pmu_reset(info);
1879
1880	/* Clear all pmresrs */
1881	scorpion_write_pmresrn(0, 0);
1882	scorpion_write_pmresrn(1, 0);
1883	scorpion_write_pmresrn(2, 0);
1884	scorpion_write_pmresrn(3, 0);
1885
1886	venum_pre_pmresr(&vval, &fval);
1887	venum_write_pmresr(0);
1888	venum_post_pmresr(vval, fval);
1889
1890	/* Reset PMxEVNCTCR to sane default */
1891	for (idx = ARMV7_IDX_CYCLE_COUNTER; idx < nb_cnt; ++idx) {
1892		armv7_pmnc_select_counter(idx);
1893		asm volatile("mcr p15, 0, %0, c9, c15, 0" : : "r" (0));
1894	}
1895}
1896
1897static int scorpion_event_to_bit(struct perf_event *event, unsigned int region,
1898			      unsigned int group)
1899{
1900	int bit;
1901	struct hw_perf_event *hwc = &event->hw;
1902	struct arm_pmu *cpu_pmu = to_arm_pmu(event->pmu);
1903
1904	if (hwc->config_base & VENUM_EVENT)
1905		bit = SCORPION_VLPM_GROUP0;
1906	else
1907		bit = scorpion_get_pmresrn_event(region);
1908	bit -= scorpion_get_pmresrn_event(0);
1909	bit += group;
1910	/*
1911	 * Lower bits are reserved for use by the counters (see
1912	 * armv7pmu_get_event_idx() for more info)
1913	 */
1914	bit += ARMV7_IDX_COUNTER_LAST(cpu_pmu) + 1;
1915
1916	return bit;
1917}
1918
1919/*
1920 * We check for column exclusion constraints here.
1921 * Two events cant use the same group within a pmresr register.
1922 */
1923static int scorpion_pmu_get_event_idx(struct pmu_hw_events *cpuc,
1924				   struct perf_event *event)
1925{
1926	int idx;
1927	int bit = -1;
1928	struct hw_perf_event *hwc = &event->hw;
1929	unsigned int region = EVENT_REGION(hwc->config_base);
1930	unsigned int group = EVENT_GROUP(hwc->config_base);
1931	bool venum_event = EVENT_VENUM(hwc->config_base);
1932	bool scorpion_event = EVENT_CPU(hwc->config_base);
1933
1934	if (venum_event || scorpion_event) {
1935		/* Ignore invalid events */
1936		if (group > 3 || region > 3)
1937			return -EINVAL;
1938
1939		bit = scorpion_event_to_bit(event, region, group);
1940		if (test_and_set_bit(bit, cpuc->used_mask))
1941			return -EAGAIN;
1942	}
1943
1944	idx = armv7pmu_get_event_idx(cpuc, event);
1945	if (idx < 0 && bit >= 0)
1946		clear_bit(bit, cpuc->used_mask);
1947
1948	return idx;
1949}
1950
1951static void scorpion_pmu_clear_event_idx(struct pmu_hw_events *cpuc,
1952				      struct perf_event *event)
1953{
1954	int bit;
1955	struct hw_perf_event *hwc = &event->hw;
1956	unsigned int region = EVENT_REGION(hwc->config_base);
1957	unsigned int group = EVENT_GROUP(hwc->config_base);
1958	bool venum_event = EVENT_VENUM(hwc->config_base);
1959	bool scorpion_event = EVENT_CPU(hwc->config_base);
1960
1961	if (venum_event || scorpion_event) {
1962		bit = scorpion_event_to_bit(event, region, group);
1963		clear_bit(bit, cpuc->used_mask);
1964	}
1965}
1966
1967static int scorpion_pmu_init(struct arm_pmu *cpu_pmu)
1968{
1969	armv7pmu_init(cpu_pmu);
1970	cpu_pmu->name		= "armv7_scorpion";
1971	cpu_pmu->map_event	= scorpion_map_event;
1972	cpu_pmu->reset		= scorpion_pmu_reset;
1973	cpu_pmu->enable		= scorpion_pmu_enable_event;
1974	cpu_pmu->disable	= scorpion_pmu_disable_event;
1975	cpu_pmu->get_event_idx	= scorpion_pmu_get_event_idx;
1976	cpu_pmu->clear_event_idx = scorpion_pmu_clear_event_idx;
1977	return armv7_probe_num_events(cpu_pmu);
1978}
1979
1980static int scorpion_mp_pmu_init(struct arm_pmu *cpu_pmu)
1981{
1982	armv7pmu_init(cpu_pmu);
1983	cpu_pmu->name		= "armv7_scorpion_mp";
1984	cpu_pmu->map_event	= scorpion_map_event;
1985	cpu_pmu->reset		= scorpion_pmu_reset;
1986	cpu_pmu->enable		= scorpion_pmu_enable_event;
1987	cpu_pmu->disable	= scorpion_pmu_disable_event;
1988	cpu_pmu->get_event_idx	= scorpion_pmu_get_event_idx;
1989	cpu_pmu->clear_event_idx = scorpion_pmu_clear_event_idx;
1990	return armv7_probe_num_events(cpu_pmu);
1991}
1992
1993static const struct of_device_id armv7_pmu_of_device_ids[] = {
1994	{.compatible = "arm,cortex-a17-pmu",	.data = armv7_a17_pmu_init},
1995	{.compatible = "arm,cortex-a15-pmu",	.data = armv7_a15_pmu_init},
1996	{.compatible = "arm,cortex-a12-pmu",	.data = armv7_a12_pmu_init},
1997	{.compatible = "arm,cortex-a9-pmu",	.data = armv7_a9_pmu_init},
1998	{.compatible = "arm,cortex-a8-pmu",	.data = armv7_a8_pmu_init},
1999	{.compatible = "arm,cortex-a7-pmu",	.data = armv7_a7_pmu_init},
2000	{.compatible = "arm,cortex-a5-pmu",	.data = armv7_a5_pmu_init},
2001	{.compatible = "qcom,krait-pmu",	.data = krait_pmu_init},
2002	{.compatible = "qcom,scorpion-pmu",	.data = scorpion_pmu_init},
2003	{.compatible = "qcom,scorpion-mp-pmu",	.data = scorpion_mp_pmu_init},
2004	{},
2005};
2006
2007static const struct pmu_probe_info armv7_pmu_probe_table[] = {
2008	ARM_PMU_PROBE(ARM_CPU_PART_CORTEX_A8, armv7_a8_pmu_init),
2009	ARM_PMU_PROBE(ARM_CPU_PART_CORTEX_A9, armv7_a9_pmu_init),
2010	{ /* sentinel value */ }
2011};
2012
2013
2014static int armv7_pmu_device_probe(struct platform_device *pdev)
2015{
2016	return arm_pmu_device_probe(pdev, armv7_pmu_of_device_ids,
2017				    armv7_pmu_probe_table);
2018}
2019
2020static struct platform_driver armv7_pmu_driver = {
2021	.driver		= {
2022		.name	= "armv7-pmu",
2023		.of_match_table = armv7_pmu_of_device_ids,
2024	},
2025	.probe		= armv7_pmu_device_probe,
2026};
2027
2028static int __init register_armv7_pmu_driver(void)
2029{
2030	return platform_driver_register(&armv7_pmu_driver);
2031}
2032device_initcall(register_armv7_pmu_driver);
2033#endif	/* CONFIG_CPU_V7 */
   1// SPDX-License-Identifier: GPL-2.0
   2/*
   3 * ARMv7 Cortex-A8 and Cortex-A9 Performance Events handling code.
   4 *
   5 * ARMv7 support: Jean Pihet <jpihet@mvista.com>
   6 * 2010 (c) MontaVista Software, LLC.
   7 *
   8 * Copied from ARMv6 code, with the low level code inspired
   9 *  by the ARMv7 Oprofile code.
  10 *
  11 * Cortex-A8 has up to 4 configurable performance counters and
  12 *  a single cycle counter.
  13 * Cortex-A9 has up to 31 configurable performance counters and
  14 *  a single cycle counter.
  15 *
  16 * All counters can be enabled/disabled and IRQ masked separately. The cycle
  17 *  counter and all 4 performance counters together can be reset separately.
  18 */
  19
  20#ifdef CONFIG_CPU_V7
  21
  22#include <asm/cp15.h>
  23#include <asm/cputype.h>
  24#include <asm/irq_regs.h>
  25#include <asm/vfp.h>
  26#include "../vfp/vfpinstr.h"
  27
  28#include <linux/of.h>
  29#include <linux/perf/arm_pmu.h>
  30#include <linux/platform_device.h>
  31
  32/*
  33 * Common ARMv7 event types
  34 *
  35 * Note: An implementation may not be able to count all of these events
  36 * but the encodings are considered to be `reserved' in the case that
  37 * they are not available.
  38 */
  39#define ARMV7_PERFCTR_PMNC_SW_INCR			0x00
  40#define ARMV7_PERFCTR_L1_ICACHE_REFILL			0x01
  41#define ARMV7_PERFCTR_ITLB_REFILL			0x02
  42#define ARMV7_PERFCTR_L1_DCACHE_REFILL			0x03
  43#define ARMV7_PERFCTR_L1_DCACHE_ACCESS			0x04
  44#define ARMV7_PERFCTR_DTLB_REFILL			0x05
  45#define ARMV7_PERFCTR_MEM_READ				0x06
  46#define ARMV7_PERFCTR_MEM_WRITE				0x07
  47#define ARMV7_PERFCTR_INSTR_EXECUTED			0x08
  48#define ARMV7_PERFCTR_EXC_TAKEN				0x09
  49#define ARMV7_PERFCTR_EXC_EXECUTED			0x0A
  50#define ARMV7_PERFCTR_CID_WRITE				0x0B
  51
  52/*
  53 * ARMV7_PERFCTR_PC_WRITE is equivalent to HW_BRANCH_INSTRUCTIONS.
  54 * It counts:
  55 *  - all (taken) branch instructions,
  56 *  - instructions that explicitly write the PC,
  57 *  - exception generating instructions.
  58 */
  59#define ARMV7_PERFCTR_PC_WRITE				0x0C
  60#define ARMV7_PERFCTR_PC_IMM_BRANCH			0x0D
  61#define ARMV7_PERFCTR_PC_PROC_RETURN			0x0E
  62#define ARMV7_PERFCTR_MEM_UNALIGNED_ACCESS		0x0F
  63#define ARMV7_PERFCTR_PC_BRANCH_MIS_PRED		0x10
  64#define ARMV7_PERFCTR_CLOCK_CYCLES			0x11
  65#define ARMV7_PERFCTR_PC_BRANCH_PRED			0x12
  66
  67/* These events are defined by the PMUv2 supplement (ARM DDI 0457A). */
  68#define ARMV7_PERFCTR_MEM_ACCESS			0x13
  69#define ARMV7_PERFCTR_L1_ICACHE_ACCESS			0x14
  70#define ARMV7_PERFCTR_L1_DCACHE_WB			0x15
  71#define ARMV7_PERFCTR_L2_CACHE_ACCESS			0x16
  72#define ARMV7_PERFCTR_L2_CACHE_REFILL			0x17
  73#define ARMV7_PERFCTR_L2_CACHE_WB			0x18
  74#define ARMV7_PERFCTR_BUS_ACCESS			0x19
  75#define ARMV7_PERFCTR_MEM_ERROR				0x1A
  76#define ARMV7_PERFCTR_INSTR_SPEC			0x1B
  77#define ARMV7_PERFCTR_TTBR_WRITE			0x1C
  78#define ARMV7_PERFCTR_BUS_CYCLES			0x1D
  79
  80#define ARMV7_PERFCTR_CPU_CYCLES			0xFF
  81
  82/* ARMv7 Cortex-A8 specific event types */
  83#define ARMV7_A8_PERFCTR_L2_CACHE_ACCESS		0x43
  84#define ARMV7_A8_PERFCTR_L2_CACHE_REFILL		0x44
  85#define ARMV7_A8_PERFCTR_L1_ICACHE_ACCESS		0x50
  86#define ARMV7_A8_PERFCTR_STALL_ISIDE			0x56
  87
  88/* ARMv7 Cortex-A9 specific event types */
  89#define ARMV7_A9_PERFCTR_INSTR_CORE_RENAME		0x68
  90#define ARMV7_A9_PERFCTR_STALL_ICACHE			0x60
  91#define ARMV7_A9_PERFCTR_STALL_DISPATCH			0x66
  92
  93/* ARMv7 Cortex-A5 specific event types */
  94#define ARMV7_A5_PERFCTR_PREFETCH_LINEFILL		0xc2
  95#define ARMV7_A5_PERFCTR_PREFETCH_LINEFILL_DROP		0xc3
  96
  97/* ARMv7 Cortex-A15 specific event types */
  98#define ARMV7_A15_PERFCTR_L1_DCACHE_ACCESS_READ		0x40
  99#define ARMV7_A15_PERFCTR_L1_DCACHE_ACCESS_WRITE	0x41
 100#define ARMV7_A15_PERFCTR_L1_DCACHE_REFILL_READ		0x42
 101#define ARMV7_A15_PERFCTR_L1_DCACHE_REFILL_WRITE	0x43
 102
 103#define ARMV7_A15_PERFCTR_DTLB_REFILL_L1_READ		0x4C
 104#define ARMV7_A15_PERFCTR_DTLB_REFILL_L1_WRITE		0x4D
 105
 106#define ARMV7_A15_PERFCTR_L2_CACHE_ACCESS_READ		0x50
 107#define ARMV7_A15_PERFCTR_L2_CACHE_ACCESS_WRITE		0x51
 108#define ARMV7_A15_PERFCTR_L2_CACHE_REFILL_READ		0x52
 109#define ARMV7_A15_PERFCTR_L2_CACHE_REFILL_WRITE		0x53
 110
 111#define ARMV7_A15_PERFCTR_PC_WRITE_SPEC			0x76
 112
 113/* ARMv7 Cortex-A12 specific event types */
 114#define ARMV7_A12_PERFCTR_L1_DCACHE_ACCESS_READ		0x40
 115#define ARMV7_A12_PERFCTR_L1_DCACHE_ACCESS_WRITE	0x41
 116
 117#define ARMV7_A12_PERFCTR_L2_CACHE_ACCESS_READ		0x50
 118#define ARMV7_A12_PERFCTR_L2_CACHE_ACCESS_WRITE		0x51
 119
 120#define ARMV7_A12_PERFCTR_PC_WRITE_SPEC			0x76
 121
 122#define ARMV7_A12_PERFCTR_PF_TLB_REFILL			0xe7
 123
 124/* ARMv7 Krait specific event types */
 125#define KRAIT_PMRESR0_GROUP0				0xcc
 126#define KRAIT_PMRESR1_GROUP0				0xd0
 127#define KRAIT_PMRESR2_GROUP0				0xd4
 128#define KRAIT_VPMRESR0_GROUP0				0xd8
 129
 130#define KRAIT_PERFCTR_L1_ICACHE_ACCESS			0x10011
 131#define KRAIT_PERFCTR_L1_ICACHE_MISS			0x10010
 132
 133#define KRAIT_PERFCTR_L1_ITLB_ACCESS			0x12222
 134#define KRAIT_PERFCTR_L1_DTLB_ACCESS			0x12210
 135
 136/* ARMv7 Scorpion specific event types */
 137#define SCORPION_LPM0_GROUP0				0x4c
 138#define SCORPION_LPM1_GROUP0				0x50
 139#define SCORPION_LPM2_GROUP0				0x54
 140#define SCORPION_L2LPM_GROUP0				0x58
 141#define SCORPION_VLPM_GROUP0				0x5c
 142
 143#define SCORPION_ICACHE_ACCESS				0x10053
 144#define SCORPION_ICACHE_MISS				0x10052
 145
 146#define SCORPION_DTLB_ACCESS				0x12013
 147#define SCORPION_DTLB_MISS				0x12012
 148
 149#define SCORPION_ITLB_MISS				0x12021
 150
 151/*
 152 * Cortex-A8 HW events mapping
 153 *
 154 * The hardware events that we support. We do support cache operations but
 155 * we have harvard caches and no way to combine instruction and data
 156 * accesses/misses in hardware.
 157 */
 158static const unsigned armv7_a8_perf_map[PERF_COUNT_HW_MAX] = {
 159	PERF_MAP_ALL_UNSUPPORTED,
 160	[PERF_COUNT_HW_CPU_CYCLES]		= ARMV7_PERFCTR_CPU_CYCLES,
 161	[PERF_COUNT_HW_INSTRUCTIONS]		= ARMV7_PERFCTR_INSTR_EXECUTED,
 162	[PERF_COUNT_HW_CACHE_REFERENCES]	= ARMV7_PERFCTR_L1_DCACHE_ACCESS,
 163	[PERF_COUNT_HW_CACHE_MISSES]		= ARMV7_PERFCTR_L1_DCACHE_REFILL,
 164	[PERF_COUNT_HW_BRANCH_INSTRUCTIONS]	= ARMV7_PERFCTR_PC_WRITE,
 165	[PERF_COUNT_HW_BRANCH_MISSES]		= ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
 166	[PERF_COUNT_HW_STALLED_CYCLES_FRONTEND]	= ARMV7_A8_PERFCTR_STALL_ISIDE,
 167};
 168
 169static const unsigned armv7_a8_perf_cache_map[PERF_COUNT_HW_CACHE_MAX]
 170					  [PERF_COUNT_HW_CACHE_OP_MAX]
 171					  [PERF_COUNT_HW_CACHE_RESULT_MAX] = {
 172	PERF_CACHE_MAP_ALL_UNSUPPORTED,
 173
 174	/*
 175	 * The performance counters don't differentiate between read and write
 176	 * accesses/misses so this isn't strictly correct, but it's the best we
 177	 * can do. Writes and reads get combined.
 178	 */
 179	[C(L1D)][C(OP_READ)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_L1_DCACHE_ACCESS,
 180	[C(L1D)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_L1_DCACHE_REFILL,
 181	[C(L1D)][C(OP_WRITE)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_L1_DCACHE_ACCESS,
 182	[C(L1D)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_L1_DCACHE_REFILL,
 183
 184	[C(L1I)][C(OP_READ)][C(RESULT_ACCESS)]	= ARMV7_A8_PERFCTR_L1_ICACHE_ACCESS,
 185	[C(L1I)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_L1_ICACHE_REFILL,
 186
 187	[C(LL)][C(OP_READ)][C(RESULT_ACCESS)]	= ARMV7_A8_PERFCTR_L2_CACHE_ACCESS,
 188	[C(LL)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_A8_PERFCTR_L2_CACHE_REFILL,
 189	[C(LL)][C(OP_WRITE)][C(RESULT_ACCESS)]	= ARMV7_A8_PERFCTR_L2_CACHE_ACCESS,
 190	[C(LL)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_A8_PERFCTR_L2_CACHE_REFILL,
 191
 192	[C(DTLB)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_DTLB_REFILL,
 193	[C(DTLB)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_DTLB_REFILL,
 194
 195	[C(ITLB)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_ITLB_REFILL,
 196	[C(ITLB)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_ITLB_REFILL,
 197
 198	[C(BPU)][C(OP_READ)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_PC_BRANCH_PRED,
 199	[C(BPU)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
 200	[C(BPU)][C(OP_WRITE)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_PC_BRANCH_PRED,
 201	[C(BPU)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
 202};
 203
 204/*
 205 * Cortex-A9 HW events mapping
 206 */
 207static const unsigned armv7_a9_perf_map[PERF_COUNT_HW_MAX] = {
 208	PERF_MAP_ALL_UNSUPPORTED,
 209	[PERF_COUNT_HW_CPU_CYCLES]		= ARMV7_PERFCTR_CPU_CYCLES,
 210	[PERF_COUNT_HW_INSTRUCTIONS]		= ARMV7_A9_PERFCTR_INSTR_CORE_RENAME,
 211	[PERF_COUNT_HW_CACHE_REFERENCES]	= ARMV7_PERFCTR_L1_DCACHE_ACCESS,
 212	[PERF_COUNT_HW_CACHE_MISSES]		= ARMV7_PERFCTR_L1_DCACHE_REFILL,
 213	[PERF_COUNT_HW_BRANCH_INSTRUCTIONS]	= ARMV7_PERFCTR_PC_WRITE,
 214	[PERF_COUNT_HW_BRANCH_MISSES]		= ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
 215	[PERF_COUNT_HW_STALLED_CYCLES_FRONTEND]	= ARMV7_A9_PERFCTR_STALL_ICACHE,
 216	[PERF_COUNT_HW_STALLED_CYCLES_BACKEND]	= ARMV7_A9_PERFCTR_STALL_DISPATCH,
 217};
 218
 219static const unsigned armv7_a9_perf_cache_map[PERF_COUNT_HW_CACHE_MAX]
 220					  [PERF_COUNT_HW_CACHE_OP_MAX]
 221					  [PERF_COUNT_HW_CACHE_RESULT_MAX] = {
 222	PERF_CACHE_MAP_ALL_UNSUPPORTED,
 223
 224	/*
 225	 * The performance counters don't differentiate between read and write
 226	 * accesses/misses so this isn't strictly correct, but it's the best we
 227	 * can do. Writes and reads get combined.
 228	 */
 229	[C(L1D)][C(OP_READ)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_L1_DCACHE_ACCESS,
 230	[C(L1D)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_L1_DCACHE_REFILL,
 231	[C(L1D)][C(OP_WRITE)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_L1_DCACHE_ACCESS,
 232	[C(L1D)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_L1_DCACHE_REFILL,
 233
 234	[C(L1I)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_L1_ICACHE_REFILL,
 235
 236	[C(DTLB)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_DTLB_REFILL,
 237	[C(DTLB)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_DTLB_REFILL,
 238
 239	[C(ITLB)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_ITLB_REFILL,
 240	[C(ITLB)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_ITLB_REFILL,
 241
 242	[C(BPU)][C(OP_READ)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_PC_BRANCH_PRED,
 243	[C(BPU)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
 244	[C(BPU)][C(OP_WRITE)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_PC_BRANCH_PRED,
 245	[C(BPU)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
 246};
 247
 248/*
 249 * Cortex-A5 HW events mapping
 250 */
 251static const unsigned armv7_a5_perf_map[PERF_COUNT_HW_MAX] = {
 252	PERF_MAP_ALL_UNSUPPORTED,
 253	[PERF_COUNT_HW_CPU_CYCLES]		= ARMV7_PERFCTR_CPU_CYCLES,
 254	[PERF_COUNT_HW_INSTRUCTIONS]		= ARMV7_PERFCTR_INSTR_EXECUTED,
 255	[PERF_COUNT_HW_CACHE_REFERENCES]	= ARMV7_PERFCTR_L1_DCACHE_ACCESS,
 256	[PERF_COUNT_HW_CACHE_MISSES]		= ARMV7_PERFCTR_L1_DCACHE_REFILL,
 257	[PERF_COUNT_HW_BRANCH_INSTRUCTIONS]	= ARMV7_PERFCTR_PC_WRITE,
 258	[PERF_COUNT_HW_BRANCH_MISSES]		= ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
 259};
 260
 261static const unsigned armv7_a5_perf_cache_map[PERF_COUNT_HW_CACHE_MAX]
 262					[PERF_COUNT_HW_CACHE_OP_MAX]
 263					[PERF_COUNT_HW_CACHE_RESULT_MAX] = {
 264	PERF_CACHE_MAP_ALL_UNSUPPORTED,
 265
 266	[C(L1D)][C(OP_READ)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_L1_DCACHE_ACCESS,
 267	[C(L1D)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_L1_DCACHE_REFILL,
 268	[C(L1D)][C(OP_WRITE)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_L1_DCACHE_ACCESS,
 269	[C(L1D)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_L1_DCACHE_REFILL,
 270	[C(L1D)][C(OP_PREFETCH)][C(RESULT_ACCESS)]	= ARMV7_A5_PERFCTR_PREFETCH_LINEFILL,
 271	[C(L1D)][C(OP_PREFETCH)][C(RESULT_MISS)]	= ARMV7_A5_PERFCTR_PREFETCH_LINEFILL_DROP,
 272
 273	[C(L1I)][C(OP_READ)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_L1_ICACHE_ACCESS,
 274	[C(L1I)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_L1_ICACHE_REFILL,
 275	/*
 276	 * The prefetch counters don't differentiate between the I side and the
 277	 * D side.
 278	 */
 279	[C(L1I)][C(OP_PREFETCH)][C(RESULT_ACCESS)]	= ARMV7_A5_PERFCTR_PREFETCH_LINEFILL,
 280	[C(L1I)][C(OP_PREFETCH)][C(RESULT_MISS)]	= ARMV7_A5_PERFCTR_PREFETCH_LINEFILL_DROP,
 281
 282	[C(DTLB)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_DTLB_REFILL,
 283	[C(DTLB)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_DTLB_REFILL,
 284
 285	[C(ITLB)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_ITLB_REFILL,
 286	[C(ITLB)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_ITLB_REFILL,
 287
 288	[C(BPU)][C(OP_READ)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_PC_BRANCH_PRED,
 289	[C(BPU)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
 290	[C(BPU)][C(OP_WRITE)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_PC_BRANCH_PRED,
 291	[C(BPU)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
 292};
 293
 294/*
 295 * Cortex-A15 HW events mapping
 296 */
 297static const unsigned armv7_a15_perf_map[PERF_COUNT_HW_MAX] = {
 298	PERF_MAP_ALL_UNSUPPORTED,
 299	[PERF_COUNT_HW_CPU_CYCLES]		= ARMV7_PERFCTR_CPU_CYCLES,
 300	[PERF_COUNT_HW_INSTRUCTIONS]		= ARMV7_PERFCTR_INSTR_EXECUTED,
 301	[PERF_COUNT_HW_CACHE_REFERENCES]	= ARMV7_PERFCTR_L1_DCACHE_ACCESS,
 302	[PERF_COUNT_HW_CACHE_MISSES]		= ARMV7_PERFCTR_L1_DCACHE_REFILL,
 303	[PERF_COUNT_HW_BRANCH_INSTRUCTIONS]	= ARMV7_A15_PERFCTR_PC_WRITE_SPEC,
 304	[PERF_COUNT_HW_BRANCH_MISSES]		= ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
 305	[PERF_COUNT_HW_BUS_CYCLES]		= ARMV7_PERFCTR_BUS_CYCLES,
 306};
 307
 308static const unsigned armv7_a15_perf_cache_map[PERF_COUNT_HW_CACHE_MAX]
 309					[PERF_COUNT_HW_CACHE_OP_MAX]
 310					[PERF_COUNT_HW_CACHE_RESULT_MAX] = {
 311	PERF_CACHE_MAP_ALL_UNSUPPORTED,
 312
 313	[C(L1D)][C(OP_READ)][C(RESULT_ACCESS)]	= ARMV7_A15_PERFCTR_L1_DCACHE_ACCESS_READ,
 314	[C(L1D)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_A15_PERFCTR_L1_DCACHE_REFILL_READ,
 315	[C(L1D)][C(OP_WRITE)][C(RESULT_ACCESS)]	= ARMV7_A15_PERFCTR_L1_DCACHE_ACCESS_WRITE,
 316	[C(L1D)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_A15_PERFCTR_L1_DCACHE_REFILL_WRITE,
 317
 318	/*
 319	 * Not all performance counters differentiate between read and write
 320	 * accesses/misses so we're not always strictly correct, but it's the
 321	 * best we can do. Writes and reads get combined in these cases.
 322	 */
 323	[C(L1I)][C(OP_READ)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_L1_ICACHE_ACCESS,
 324	[C(L1I)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_L1_ICACHE_REFILL,
 325
 326	[C(LL)][C(OP_READ)][C(RESULT_ACCESS)]	= ARMV7_A15_PERFCTR_L2_CACHE_ACCESS_READ,
 327	[C(LL)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_A15_PERFCTR_L2_CACHE_REFILL_READ,
 328	[C(LL)][C(OP_WRITE)][C(RESULT_ACCESS)]	= ARMV7_A15_PERFCTR_L2_CACHE_ACCESS_WRITE,
 329	[C(LL)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_A15_PERFCTR_L2_CACHE_REFILL_WRITE,
 330
 331	[C(DTLB)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_A15_PERFCTR_DTLB_REFILL_L1_READ,
 332	[C(DTLB)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_A15_PERFCTR_DTLB_REFILL_L1_WRITE,
 333
 334	[C(ITLB)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_ITLB_REFILL,
 335	[C(ITLB)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_ITLB_REFILL,
 336
 337	[C(BPU)][C(OP_READ)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_PC_BRANCH_PRED,
 338	[C(BPU)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
 339	[C(BPU)][C(OP_WRITE)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_PC_BRANCH_PRED,
 340	[C(BPU)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
 341};
 342
 343/*
 344 * Cortex-A7 HW events mapping
 345 */
 346static const unsigned armv7_a7_perf_map[PERF_COUNT_HW_MAX] = {
 347	PERF_MAP_ALL_UNSUPPORTED,
 348	[PERF_COUNT_HW_CPU_CYCLES]		= ARMV7_PERFCTR_CPU_CYCLES,
 349	[PERF_COUNT_HW_INSTRUCTIONS]		= ARMV7_PERFCTR_INSTR_EXECUTED,
 350	[PERF_COUNT_HW_CACHE_REFERENCES]	= ARMV7_PERFCTR_L1_DCACHE_ACCESS,
 351	[PERF_COUNT_HW_CACHE_MISSES]		= ARMV7_PERFCTR_L1_DCACHE_REFILL,
 352	[PERF_COUNT_HW_BRANCH_INSTRUCTIONS]	= ARMV7_PERFCTR_PC_WRITE,
 353	[PERF_COUNT_HW_BRANCH_MISSES]		= ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
 354	[PERF_COUNT_HW_BUS_CYCLES]		= ARMV7_PERFCTR_BUS_CYCLES,
 355};
 356
 357static const unsigned armv7_a7_perf_cache_map[PERF_COUNT_HW_CACHE_MAX]
 358					[PERF_COUNT_HW_CACHE_OP_MAX]
 359					[PERF_COUNT_HW_CACHE_RESULT_MAX] = {
 360	PERF_CACHE_MAP_ALL_UNSUPPORTED,
 361
 362	/*
 363	 * The performance counters don't differentiate between read and write
 364	 * accesses/misses so this isn't strictly correct, but it's the best we
 365	 * can do. Writes and reads get combined.
 366	 */
 367	[C(L1D)][C(OP_READ)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_L1_DCACHE_ACCESS,
 368	[C(L1D)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_L1_DCACHE_REFILL,
 369	[C(L1D)][C(OP_WRITE)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_L1_DCACHE_ACCESS,
 370	[C(L1D)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_L1_DCACHE_REFILL,
 371
 372	[C(L1I)][C(OP_READ)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_L1_ICACHE_ACCESS,
 373	[C(L1I)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_L1_ICACHE_REFILL,
 374
 375	[C(LL)][C(OP_READ)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_L2_CACHE_ACCESS,
 376	[C(LL)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_L2_CACHE_REFILL,
 377	[C(LL)][C(OP_WRITE)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_L2_CACHE_ACCESS,
 378	[C(LL)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_L2_CACHE_REFILL,
 379
 380	[C(DTLB)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_DTLB_REFILL,
 381	[C(DTLB)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_DTLB_REFILL,
 382
 383	[C(ITLB)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_ITLB_REFILL,
 384	[C(ITLB)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_ITLB_REFILL,
 385
 386	[C(BPU)][C(OP_READ)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_PC_BRANCH_PRED,
 387	[C(BPU)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
 388	[C(BPU)][C(OP_WRITE)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_PC_BRANCH_PRED,
 389	[C(BPU)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
 390};
 391
 392/*
 393 * Cortex-A12 HW events mapping
 394 */
 395static const unsigned armv7_a12_perf_map[PERF_COUNT_HW_MAX] = {
 396	PERF_MAP_ALL_UNSUPPORTED,
 397	[PERF_COUNT_HW_CPU_CYCLES]		= ARMV7_PERFCTR_CPU_CYCLES,
 398	[PERF_COUNT_HW_INSTRUCTIONS]		= ARMV7_PERFCTR_INSTR_EXECUTED,
 399	[PERF_COUNT_HW_CACHE_REFERENCES]	= ARMV7_PERFCTR_L1_DCACHE_ACCESS,
 400	[PERF_COUNT_HW_CACHE_MISSES]		= ARMV7_PERFCTR_L1_DCACHE_REFILL,
 401	[PERF_COUNT_HW_BRANCH_INSTRUCTIONS]	= ARMV7_A12_PERFCTR_PC_WRITE_SPEC,
 402	[PERF_COUNT_HW_BRANCH_MISSES]		= ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
 403	[PERF_COUNT_HW_BUS_CYCLES]		= ARMV7_PERFCTR_BUS_CYCLES,
 404};
 405
 406static const unsigned armv7_a12_perf_cache_map[PERF_COUNT_HW_CACHE_MAX]
 407					[PERF_COUNT_HW_CACHE_OP_MAX]
 408					[PERF_COUNT_HW_CACHE_RESULT_MAX] = {
 409	PERF_CACHE_MAP_ALL_UNSUPPORTED,
 410
 411	[C(L1D)][C(OP_READ)][C(RESULT_ACCESS)]	= ARMV7_A12_PERFCTR_L1_DCACHE_ACCESS_READ,
 412	[C(L1D)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_L1_DCACHE_REFILL,
 413	[C(L1D)][C(OP_WRITE)][C(RESULT_ACCESS)]	= ARMV7_A12_PERFCTR_L1_DCACHE_ACCESS_WRITE,
 414	[C(L1D)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_L1_DCACHE_REFILL,
 415
 416	/*
 417	 * Not all performance counters differentiate between read and write
 418	 * accesses/misses so we're not always strictly correct, but it's the
 419	 * best we can do. Writes and reads get combined in these cases.
 420	 */
 421	[C(L1I)][C(OP_READ)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_L1_ICACHE_ACCESS,
 422	[C(L1I)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_L1_ICACHE_REFILL,
 423
 424	[C(LL)][C(OP_READ)][C(RESULT_ACCESS)]	= ARMV7_A12_PERFCTR_L2_CACHE_ACCESS_READ,
 425	[C(LL)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_L2_CACHE_REFILL,
 426	[C(LL)][C(OP_WRITE)][C(RESULT_ACCESS)]	= ARMV7_A12_PERFCTR_L2_CACHE_ACCESS_WRITE,
 427	[C(LL)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_L2_CACHE_REFILL,
 428
 429	[C(DTLB)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_DTLB_REFILL,
 430	[C(DTLB)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_DTLB_REFILL,
 431	[C(DTLB)][C(OP_PREFETCH)][C(RESULT_MISS)]	= ARMV7_A12_PERFCTR_PF_TLB_REFILL,
 432
 433	[C(ITLB)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_ITLB_REFILL,
 434	[C(ITLB)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_ITLB_REFILL,
 435
 436	[C(BPU)][C(OP_READ)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_PC_BRANCH_PRED,
 437	[C(BPU)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
 438	[C(BPU)][C(OP_WRITE)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_PC_BRANCH_PRED,
 439	[C(BPU)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
 440};
 441
 442/*
 443 * Krait HW events mapping
 444 */
 445static const unsigned krait_perf_map[PERF_COUNT_HW_MAX] = {
 446	PERF_MAP_ALL_UNSUPPORTED,
 447	[PERF_COUNT_HW_CPU_CYCLES]	    = ARMV7_PERFCTR_CPU_CYCLES,
 448	[PERF_COUNT_HW_INSTRUCTIONS]	    = ARMV7_PERFCTR_INSTR_EXECUTED,
 449	[PERF_COUNT_HW_BRANCH_INSTRUCTIONS] = ARMV7_PERFCTR_PC_WRITE,
 450	[PERF_COUNT_HW_BRANCH_MISSES]	    = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
 451	[PERF_COUNT_HW_BUS_CYCLES]	    = ARMV7_PERFCTR_CLOCK_CYCLES,
 452};
 453
 454static const unsigned krait_perf_map_no_branch[PERF_COUNT_HW_MAX] = {
 455	PERF_MAP_ALL_UNSUPPORTED,
 456	[PERF_COUNT_HW_CPU_CYCLES]	    = ARMV7_PERFCTR_CPU_CYCLES,
 457	[PERF_COUNT_HW_INSTRUCTIONS]	    = ARMV7_PERFCTR_INSTR_EXECUTED,
 458	[PERF_COUNT_HW_BRANCH_MISSES]	    = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
 459	[PERF_COUNT_HW_BUS_CYCLES]	    = ARMV7_PERFCTR_CLOCK_CYCLES,
 460};
 461
 462static const unsigned krait_perf_cache_map[PERF_COUNT_HW_CACHE_MAX]
 463					  [PERF_COUNT_HW_CACHE_OP_MAX]
 464					  [PERF_COUNT_HW_CACHE_RESULT_MAX] = {
 465	PERF_CACHE_MAP_ALL_UNSUPPORTED,
 466
 467	/*
 468	 * The performance counters don't differentiate between read and write
 469	 * accesses/misses so this isn't strictly correct, but it's the best we
 470	 * can do. Writes and reads get combined.
 471	 */
 472	[C(L1D)][C(OP_READ)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_L1_DCACHE_ACCESS,
 473	[C(L1D)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_L1_DCACHE_REFILL,
 474	[C(L1D)][C(OP_WRITE)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_L1_DCACHE_ACCESS,
 475	[C(L1D)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_L1_DCACHE_REFILL,
 476
 477	[C(L1I)][C(OP_READ)][C(RESULT_ACCESS)]	= KRAIT_PERFCTR_L1_ICACHE_ACCESS,
 478	[C(L1I)][C(OP_READ)][C(RESULT_MISS)]	= KRAIT_PERFCTR_L1_ICACHE_MISS,
 479
 480	[C(DTLB)][C(OP_READ)][C(RESULT_ACCESS)]	= KRAIT_PERFCTR_L1_DTLB_ACCESS,
 481	[C(DTLB)][C(OP_WRITE)][C(RESULT_ACCESS)]	= KRAIT_PERFCTR_L1_DTLB_ACCESS,
 482
 483	[C(ITLB)][C(OP_READ)][C(RESULT_ACCESS)]	= KRAIT_PERFCTR_L1_ITLB_ACCESS,
 484	[C(ITLB)][C(OP_WRITE)][C(RESULT_ACCESS)]	= KRAIT_PERFCTR_L1_ITLB_ACCESS,
 485
 486	[C(BPU)][C(OP_READ)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_PC_BRANCH_PRED,
 487	[C(BPU)][C(OP_READ)][C(RESULT_MISS)]	= ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
 488	[C(BPU)][C(OP_WRITE)][C(RESULT_ACCESS)]	= ARMV7_PERFCTR_PC_BRANCH_PRED,
 489	[C(BPU)][C(OP_WRITE)][C(RESULT_MISS)]	= ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
 490};
 491
 492/*
 493 * Scorpion HW events mapping
 494 */
 495static const unsigned scorpion_perf_map[PERF_COUNT_HW_MAX] = {
 496	PERF_MAP_ALL_UNSUPPORTED,
 497	[PERF_COUNT_HW_CPU_CYCLES]	    = ARMV7_PERFCTR_CPU_CYCLES,
 498	[PERF_COUNT_HW_INSTRUCTIONS]	    = ARMV7_PERFCTR_INSTR_EXECUTED,
 499	[PERF_COUNT_HW_BRANCH_INSTRUCTIONS] = ARMV7_PERFCTR_PC_WRITE,
 500	[PERF_COUNT_HW_BRANCH_MISSES]	    = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
 501	[PERF_COUNT_HW_BUS_CYCLES]	    = ARMV7_PERFCTR_CLOCK_CYCLES,
 502};
 503
 504static const unsigned scorpion_perf_cache_map[PERF_COUNT_HW_CACHE_MAX]
 505					    [PERF_COUNT_HW_CACHE_OP_MAX]
 506					    [PERF_COUNT_HW_CACHE_RESULT_MAX] = {
 507	PERF_CACHE_MAP_ALL_UNSUPPORTED,
 508	/*
 509	 * The performance counters don't differentiate between read and write
 510	 * accesses/misses so this isn't strictly correct, but it's the best we
 511	 * can do. Writes and reads get combined.
 512	 */
 513	[C(L1D)][C(OP_READ)][C(RESULT_ACCESS)] = ARMV7_PERFCTR_L1_DCACHE_ACCESS,
 514	[C(L1D)][C(OP_READ)][C(RESULT_MISS)] = ARMV7_PERFCTR_L1_DCACHE_REFILL,
 515	[C(L1D)][C(OP_WRITE)][C(RESULT_ACCESS)] = ARMV7_PERFCTR_L1_DCACHE_ACCESS,
 516	[C(L1D)][C(OP_WRITE)][C(RESULT_MISS)] = ARMV7_PERFCTR_L1_DCACHE_REFILL,
 517	[C(L1I)][C(OP_READ)][C(RESULT_ACCESS)] = SCORPION_ICACHE_ACCESS,
 518	[C(L1I)][C(OP_READ)][C(RESULT_MISS)] = SCORPION_ICACHE_MISS,
 519	/*
 520	 * Only ITLB misses and DTLB refills are supported.  If users want the
 521	 * DTLB refills misses a raw counter must be used.
 522	 */
 523	[C(DTLB)][C(OP_READ)][C(RESULT_ACCESS)] = SCORPION_DTLB_ACCESS,
 524	[C(DTLB)][C(OP_READ)][C(RESULT_MISS)] = SCORPION_DTLB_MISS,
 525	[C(DTLB)][C(OP_WRITE)][C(RESULT_ACCESS)] = SCORPION_DTLB_ACCESS,
 526	[C(DTLB)][C(OP_WRITE)][C(RESULT_MISS)] = SCORPION_DTLB_MISS,
 527	[C(ITLB)][C(OP_READ)][C(RESULT_MISS)] = SCORPION_ITLB_MISS,
 528	[C(ITLB)][C(OP_WRITE)][C(RESULT_MISS)] = SCORPION_ITLB_MISS,
 529	[C(BPU)][C(OP_READ)][C(RESULT_ACCESS)] = ARMV7_PERFCTR_PC_BRANCH_PRED,
 530	[C(BPU)][C(OP_READ)][C(RESULT_MISS)] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
 531	[C(BPU)][C(OP_WRITE)][C(RESULT_ACCESS)] = ARMV7_PERFCTR_PC_BRANCH_PRED,
 532	[C(BPU)][C(OP_WRITE)][C(RESULT_MISS)] = ARMV7_PERFCTR_PC_BRANCH_MIS_PRED,
 533};
 534
 535PMU_FORMAT_ATTR(event, "config:0-7");
 536
 537static struct attribute *armv7_pmu_format_attrs[] = {
 538	&format_attr_event.attr,
 539	NULL,
 540};
 541
 542static struct attribute_group armv7_pmu_format_attr_group = {
 543	.name = "format",
 544	.attrs = armv7_pmu_format_attrs,
 545};
 546
 547#define ARMV7_EVENT_ATTR_RESOLVE(m) #m
 548#define ARMV7_EVENT_ATTR(name, config) \
 549	PMU_EVENT_ATTR_STRING(name, armv7_event_attr_##name, \
 550			      "event=" ARMV7_EVENT_ATTR_RESOLVE(config))
 551
 552ARMV7_EVENT_ATTR(sw_incr, ARMV7_PERFCTR_PMNC_SW_INCR);
 553ARMV7_EVENT_ATTR(l1i_cache_refill, ARMV7_PERFCTR_L1_ICACHE_REFILL);
 554ARMV7_EVENT_ATTR(l1i_tlb_refill, ARMV7_PERFCTR_ITLB_REFILL);
 555ARMV7_EVENT_ATTR(l1d_cache_refill, ARMV7_PERFCTR_L1_DCACHE_REFILL);
 556ARMV7_EVENT_ATTR(l1d_cache, ARMV7_PERFCTR_L1_DCACHE_ACCESS);
 557ARMV7_EVENT_ATTR(l1d_tlb_refill, ARMV7_PERFCTR_DTLB_REFILL);
 558ARMV7_EVENT_ATTR(ld_retired, ARMV7_PERFCTR_MEM_READ);
 559ARMV7_EVENT_ATTR(st_retired, ARMV7_PERFCTR_MEM_WRITE);
 560ARMV7_EVENT_ATTR(inst_retired, ARMV7_PERFCTR_INSTR_EXECUTED);
 561ARMV7_EVENT_ATTR(exc_taken, ARMV7_PERFCTR_EXC_TAKEN);
 562ARMV7_EVENT_ATTR(exc_return, ARMV7_PERFCTR_EXC_EXECUTED);
 563ARMV7_EVENT_ATTR(cid_write_retired, ARMV7_PERFCTR_CID_WRITE);
 564ARMV7_EVENT_ATTR(pc_write_retired, ARMV7_PERFCTR_PC_WRITE);
 565ARMV7_EVENT_ATTR(br_immed_retired, ARMV7_PERFCTR_PC_IMM_BRANCH);
 566ARMV7_EVENT_ATTR(br_return_retired, ARMV7_PERFCTR_PC_PROC_RETURN);
 567ARMV7_EVENT_ATTR(unaligned_ldst_retired, ARMV7_PERFCTR_MEM_UNALIGNED_ACCESS);
 568ARMV7_EVENT_ATTR(br_mis_pred, ARMV7_PERFCTR_PC_BRANCH_MIS_PRED);
 569ARMV7_EVENT_ATTR(cpu_cycles, ARMV7_PERFCTR_CLOCK_CYCLES);
 570ARMV7_EVENT_ATTR(br_pred, ARMV7_PERFCTR_PC_BRANCH_PRED);
 571
 572static struct attribute *armv7_pmuv1_event_attrs[] = {
 573	&armv7_event_attr_sw_incr.attr.attr,
 574	&armv7_event_attr_l1i_cache_refill.attr.attr,
 575	&armv7_event_attr_l1i_tlb_refill.attr.attr,
 576	&armv7_event_attr_l1d_cache_refill.attr.attr,
 577	&armv7_event_attr_l1d_cache.attr.attr,
 578	&armv7_event_attr_l1d_tlb_refill.attr.attr,
 579	&armv7_event_attr_ld_retired.attr.attr,
 580	&armv7_event_attr_st_retired.attr.attr,
 581	&armv7_event_attr_inst_retired.attr.attr,
 582	&armv7_event_attr_exc_taken.attr.attr,
 583	&armv7_event_attr_exc_return.attr.attr,
 584	&armv7_event_attr_cid_write_retired.attr.attr,
 585	&armv7_event_attr_pc_write_retired.attr.attr,
 586	&armv7_event_attr_br_immed_retired.attr.attr,
 587	&armv7_event_attr_br_return_retired.attr.attr,
 588	&armv7_event_attr_unaligned_ldst_retired.attr.attr,
 589	&armv7_event_attr_br_mis_pred.attr.attr,
 590	&armv7_event_attr_cpu_cycles.attr.attr,
 591	&armv7_event_attr_br_pred.attr.attr,
 592	NULL,
 593};
 594
 595static struct attribute_group armv7_pmuv1_events_attr_group = {
 596	.name = "events",
 597	.attrs = armv7_pmuv1_event_attrs,
 598};
 599
 600ARMV7_EVENT_ATTR(mem_access, ARMV7_PERFCTR_MEM_ACCESS);
 601ARMV7_EVENT_ATTR(l1i_cache, ARMV7_PERFCTR_L1_ICACHE_ACCESS);
 602ARMV7_EVENT_ATTR(l1d_cache_wb, ARMV7_PERFCTR_L1_DCACHE_WB);
 603ARMV7_EVENT_ATTR(l2d_cache, ARMV7_PERFCTR_L2_CACHE_ACCESS);
 604ARMV7_EVENT_ATTR(l2d_cache_refill, ARMV7_PERFCTR_L2_CACHE_REFILL);
 605ARMV7_EVENT_ATTR(l2d_cache_wb, ARMV7_PERFCTR_L2_CACHE_WB);
 606ARMV7_EVENT_ATTR(bus_access, ARMV7_PERFCTR_BUS_ACCESS);
 607ARMV7_EVENT_ATTR(memory_error, ARMV7_PERFCTR_MEM_ERROR);
 608ARMV7_EVENT_ATTR(inst_spec, ARMV7_PERFCTR_INSTR_SPEC);
 609ARMV7_EVENT_ATTR(ttbr_write_retired, ARMV7_PERFCTR_TTBR_WRITE);
 610ARMV7_EVENT_ATTR(bus_cycles, ARMV7_PERFCTR_BUS_CYCLES);
 611
 612static struct attribute *armv7_pmuv2_event_attrs[] = {
 613	&armv7_event_attr_sw_incr.attr.attr,
 614	&armv7_event_attr_l1i_cache_refill.attr.attr,
 615	&armv7_event_attr_l1i_tlb_refill.attr.attr,
 616	&armv7_event_attr_l1d_cache_refill.attr.attr,
 617	&armv7_event_attr_l1d_cache.attr.attr,
 618	&armv7_event_attr_l1d_tlb_refill.attr.attr,
 619	&armv7_event_attr_ld_retired.attr.attr,
 620	&armv7_event_attr_st_retired.attr.attr,
 621	&armv7_event_attr_inst_retired.attr.attr,
 622	&armv7_event_attr_exc_taken.attr.attr,
 623	&armv7_event_attr_exc_return.attr.attr,
 624	&armv7_event_attr_cid_write_retired.attr.attr,
 625	&armv7_event_attr_pc_write_retired.attr.attr,
 626	&armv7_event_attr_br_immed_retired.attr.attr,
 627	&armv7_event_attr_br_return_retired.attr.attr,
 628	&armv7_event_attr_unaligned_ldst_retired.attr.attr,
 629	&armv7_event_attr_br_mis_pred.attr.attr,
 630	&armv7_event_attr_cpu_cycles.attr.attr,
 631	&armv7_event_attr_br_pred.attr.attr,
 632	&armv7_event_attr_mem_access.attr.attr,
 633	&armv7_event_attr_l1i_cache.attr.attr,
 634	&armv7_event_attr_l1d_cache_wb.attr.attr,
 635	&armv7_event_attr_l2d_cache.attr.attr,
 636	&armv7_event_attr_l2d_cache_refill.attr.attr,
 637	&armv7_event_attr_l2d_cache_wb.attr.attr,
 638	&armv7_event_attr_bus_access.attr.attr,
 639	&armv7_event_attr_memory_error.attr.attr,
 640	&armv7_event_attr_inst_spec.attr.attr,
 641	&armv7_event_attr_ttbr_write_retired.attr.attr,
 642	&armv7_event_attr_bus_cycles.attr.attr,
 643	NULL,
 644};
 645
 646static struct attribute_group armv7_pmuv2_events_attr_group = {
 647	.name = "events",
 648	.attrs = armv7_pmuv2_event_attrs,
 649};
 650
 651/*
 652 * Perf Events' indices
 653 */
 654#define	ARMV7_IDX_CYCLE_COUNTER	0
 655#define	ARMV7_IDX_COUNTER0	1
 656#define	ARMV7_IDX_COUNTER_LAST(cpu_pmu) \
 657	(ARMV7_IDX_CYCLE_COUNTER + cpu_pmu->num_events - 1)
 658
 659#define	ARMV7_MAX_COUNTERS	32
 660#define	ARMV7_COUNTER_MASK	(ARMV7_MAX_COUNTERS - 1)
 661
 662/*
 663 * ARMv7 low level PMNC access
 664 */
 665
 666/*
 667 * Perf Event to low level counters mapping
 668 */
 669#define	ARMV7_IDX_TO_COUNTER(x)	\
 670	(((x) - ARMV7_IDX_COUNTER0) & ARMV7_COUNTER_MASK)
 671
 672/*
 673 * Per-CPU PMNC: config reg
 674 */
 675#define ARMV7_PMNC_E		(1 << 0) /* Enable all counters */
 676#define ARMV7_PMNC_P		(1 << 1) /* Reset all counters */
 677#define ARMV7_PMNC_C		(1 << 2) /* Cycle counter reset */
 678#define ARMV7_PMNC_D		(1 << 3) /* CCNT counts every 64th cpu cycle */
 679#define ARMV7_PMNC_X		(1 << 4) /* Export to ETM */
 680#define ARMV7_PMNC_DP		(1 << 5) /* Disable CCNT if non-invasive debug*/
 681#define	ARMV7_PMNC_N_SHIFT	11	 /* Number of counters supported */
 682#define	ARMV7_PMNC_N_MASK	0x1f
 683#define	ARMV7_PMNC_MASK		0x3f	 /* Mask for writable bits */
 684
 685/*
 686 * FLAG: counters overflow flag status reg
 687 */
 688#define	ARMV7_FLAG_MASK		0xffffffff	/* Mask for writable bits */
 689#define	ARMV7_OVERFLOWED_MASK	ARMV7_FLAG_MASK
 690
 691/*
 692 * PMXEVTYPER: Event selection reg
 693 */
 694#define	ARMV7_EVTYPE_MASK	0xc80000ff	/* Mask for writable bits */
 695#define	ARMV7_EVTYPE_EVENT	0xff		/* Mask for EVENT bits */
 696
 697/*
 698 * Event filters for PMUv2
 699 */
 700#define	ARMV7_EXCLUDE_PL1	BIT(31)
 701#define	ARMV7_EXCLUDE_USER	BIT(30)
 702#define	ARMV7_INCLUDE_HYP	BIT(27)
 703
 704/*
 705 * Secure debug enable reg
 706 */
 707#define ARMV7_SDER_SUNIDEN	BIT(1) /* Permit non-invasive debug */
 708
 709static inline u32 armv7_pmnc_read(void)
 710{
 711	u32 val;
 712	asm volatile("mrc p15, 0, %0, c9, c12, 0" : "=r"(val));
 713	return val;
 714}
 715
 716static inline void armv7_pmnc_write(u32 val)
 717{
 718	val &= ARMV7_PMNC_MASK;
 719	isb();
 720	asm volatile("mcr p15, 0, %0, c9, c12, 0" : : "r"(val));
 721}
 722
 723static inline int armv7_pmnc_has_overflowed(u32 pmnc)
 724{
 725	return pmnc & ARMV7_OVERFLOWED_MASK;
 726}
 727
 728static inline int armv7_pmnc_counter_valid(struct arm_pmu *cpu_pmu, int idx)
 729{
 730	return idx >= ARMV7_IDX_CYCLE_COUNTER &&
 731		idx <= ARMV7_IDX_COUNTER_LAST(cpu_pmu);
 732}
 733
 734static inline int armv7_pmnc_counter_has_overflowed(u32 pmnc, int idx)
 735{
 736	return pmnc & BIT(ARMV7_IDX_TO_COUNTER(idx));
 737}
 738
 739static inline void armv7_pmnc_select_counter(int idx)
 740{
 741	u32 counter = ARMV7_IDX_TO_COUNTER(idx);
 742	asm volatile("mcr p15, 0, %0, c9, c12, 5" : : "r" (counter));
 743	isb();
 744}
 745
 746static inline u64 armv7pmu_read_counter(struct perf_event *event)
 747{
 748	struct arm_pmu *cpu_pmu = to_arm_pmu(event->pmu);
 749	struct hw_perf_event *hwc = &event->hw;
 750	int idx = hwc->idx;
 751	u32 value = 0;
 752
 753	if (!armv7_pmnc_counter_valid(cpu_pmu, idx)) {
 754		pr_err("CPU%u reading wrong counter %d\n",
 755			smp_processor_id(), idx);
 756	} else if (idx == ARMV7_IDX_CYCLE_COUNTER) {
 757		asm volatile("mrc p15, 0, %0, c9, c13, 0" : "=r" (value));
 758	} else {
 759		armv7_pmnc_select_counter(idx);
 760		asm volatile("mrc p15, 0, %0, c9, c13, 2" : "=r" (value));
 761	}
 762
 763	return value;
 764}
 765
 766static inline void armv7pmu_write_counter(struct perf_event *event, u64 value)
 767{
 768	struct arm_pmu *cpu_pmu = to_arm_pmu(event->pmu);
 769	struct hw_perf_event *hwc = &event->hw;
 770	int idx = hwc->idx;
 771
 772	if (!armv7_pmnc_counter_valid(cpu_pmu, idx)) {
 773		pr_err("CPU%u writing wrong counter %d\n",
 774			smp_processor_id(), idx);
 775	} else if (idx == ARMV7_IDX_CYCLE_COUNTER) {
 776		asm volatile("mcr p15, 0, %0, c9, c13, 0" : : "r" ((u32)value));
 777	} else {
 778		armv7_pmnc_select_counter(idx);
 779		asm volatile("mcr p15, 0, %0, c9, c13, 2" : : "r" ((u32)value));
 780	}
 781}
 782
 783static inline void armv7_pmnc_write_evtsel(int idx, u32 val)
 784{
 785	armv7_pmnc_select_counter(idx);
 786	val &= ARMV7_EVTYPE_MASK;
 787	asm volatile("mcr p15, 0, %0, c9, c13, 1" : : "r" (val));
 788}
 789
 790static inline void armv7_pmnc_enable_counter(int idx)
 791{
 792	u32 counter = ARMV7_IDX_TO_COUNTER(idx);
 793	asm volatile("mcr p15, 0, %0, c9, c12, 1" : : "r" (BIT(counter)));
 794}
 795
 796static inline void armv7_pmnc_disable_counter(int idx)
 797{
 798	u32 counter = ARMV7_IDX_TO_COUNTER(idx);
 799	asm volatile("mcr p15, 0, %0, c9, c12, 2" : : "r" (BIT(counter)));
 800}
 801
 802static inline void armv7_pmnc_enable_intens(int idx)
 803{
 804	u32 counter = ARMV7_IDX_TO_COUNTER(idx);
 805	asm volatile("mcr p15, 0, %0, c9, c14, 1" : : "r" (BIT(counter)));
 806}
 807
 808static inline void armv7_pmnc_disable_intens(int idx)
 809{
 810	u32 counter = ARMV7_IDX_TO_COUNTER(idx);
 811	asm volatile("mcr p15, 0, %0, c9, c14, 2" : : "r" (BIT(counter)));
 812	isb();
 813	/* Clear the overflow flag in case an interrupt is pending. */
 814	asm volatile("mcr p15, 0, %0, c9, c12, 3" : : "r" (BIT(counter)));
 815	isb();
 816}
 817
 818static inline u32 armv7_pmnc_getreset_flags(void)
 819{
 820	u32 val;
 821
 822	/* Read */
 823	asm volatile("mrc p15, 0, %0, c9, c12, 3" : "=r" (val));
 824
 825	/* Write to clear flags */
 826	val &= ARMV7_FLAG_MASK;
 827	asm volatile("mcr p15, 0, %0, c9, c12, 3" : : "r" (val));
 828
 829	return val;
 830}
 831
 832#ifdef DEBUG
 833static void armv7_pmnc_dump_regs(struct arm_pmu *cpu_pmu)
 834{
 835	u32 val;
 836	unsigned int cnt;
 837
 838	pr_info("PMNC registers dump:\n");
 839
 840	asm volatile("mrc p15, 0, %0, c9, c12, 0" : "=r" (val));
 841	pr_info("PMNC  =0x%08x\n", val);
 842
 843	asm volatile("mrc p15, 0, %0, c9, c12, 1" : "=r" (val));
 844	pr_info("CNTENS=0x%08x\n", val);
 845
 846	asm volatile("mrc p15, 0, %0, c9, c14, 1" : "=r" (val));
 847	pr_info("INTENS=0x%08x\n", val);
 848
 849	asm volatile("mrc p15, 0, %0, c9, c12, 3" : "=r" (val));
 850	pr_info("FLAGS =0x%08x\n", val);
 851
 852	asm volatile("mrc p15, 0, %0, c9, c12, 5" : "=r" (val));
 853	pr_info("SELECT=0x%08x\n", val);
 854
 855	asm volatile("mrc p15, 0, %0, c9, c13, 0" : "=r" (val));
 856	pr_info("CCNT  =0x%08x\n", val);
 857
 858	for (cnt = ARMV7_IDX_COUNTER0;
 859			cnt <= ARMV7_IDX_COUNTER_LAST(cpu_pmu); cnt++) {
 860		armv7_pmnc_select_counter(cnt);
 861		asm volatile("mrc p15, 0, %0, c9, c13, 2" : "=r" (val));
 862		pr_info("CNT[%d] count =0x%08x\n",
 863			ARMV7_IDX_TO_COUNTER(cnt), val);
 864		asm volatile("mrc p15, 0, %0, c9, c13, 1" : "=r" (val));
 865		pr_info("CNT[%d] evtsel=0x%08x\n",
 866			ARMV7_IDX_TO_COUNTER(cnt), val);
 867	}
 868}
 869#endif
 870
 871static void armv7pmu_enable_event(struct perf_event *event)
 872{
 873	unsigned long flags;
 874	struct hw_perf_event *hwc = &event->hw;
 875	struct arm_pmu *cpu_pmu = to_arm_pmu(event->pmu);
 876	struct pmu_hw_events *events = this_cpu_ptr(cpu_pmu->hw_events);
 877	int idx = hwc->idx;
 878
 879	if (!armv7_pmnc_counter_valid(cpu_pmu, idx)) {
 880		pr_err("CPU%u enabling wrong PMNC counter IRQ enable %d\n",
 881			smp_processor_id(), idx);
 882		return;
 883	}
 884
 885	/*
 886	 * Enable counter and interrupt, and set the counter to count
 887	 * the event that we're interested in.
 888	 */
 889	raw_spin_lock_irqsave(&events->pmu_lock, flags);
 890
 891	/*
 892	 * Disable counter
 893	 */
 894	armv7_pmnc_disable_counter(idx);
 895
 896	/*
 897	 * Set event (if destined for PMNx counters)
 898	 * We only need to set the event for the cycle counter if we
 899	 * have the ability to perform event filtering.
 900	 */
 901	if (cpu_pmu->set_event_filter || idx != ARMV7_IDX_CYCLE_COUNTER)
 902		armv7_pmnc_write_evtsel(idx, hwc->config_base);
 903
 904	/*
 905	 * Enable interrupt for this counter
 906	 */
 907	armv7_pmnc_enable_intens(idx);
 908
 909	/*
 910	 * Enable counter
 911	 */
 912	armv7_pmnc_enable_counter(idx);
 913
 914	raw_spin_unlock_irqrestore(&events->pmu_lock, flags);
 915}
 916
 917static void armv7pmu_disable_event(struct perf_event *event)
 918{
 919	unsigned long flags;
 920	struct hw_perf_event *hwc = &event->hw;
 921	struct arm_pmu *cpu_pmu = to_arm_pmu(event->pmu);
 922	struct pmu_hw_events *events = this_cpu_ptr(cpu_pmu->hw_events);
 923	int idx = hwc->idx;
 924
 925	if (!armv7_pmnc_counter_valid(cpu_pmu, idx)) {
 926		pr_err("CPU%u disabling wrong PMNC counter IRQ enable %d\n",
 927			smp_processor_id(), idx);
 928		return;
 929	}
 930
 931	/*
 932	 * Disable counter and interrupt
 933	 */
 934	raw_spin_lock_irqsave(&events->pmu_lock, flags);
 935
 936	/*
 937	 * Disable counter
 938	 */
 939	armv7_pmnc_disable_counter(idx);
 940
 941	/*
 942	 * Disable interrupt for this counter
 943	 */
 944	armv7_pmnc_disable_intens(idx);
 945
 946	raw_spin_unlock_irqrestore(&events->pmu_lock, flags);
 947}
 948
 949static irqreturn_t armv7pmu_handle_irq(struct arm_pmu *cpu_pmu)
 950{
 951	u32 pmnc;
 952	struct perf_sample_data data;
 953	struct pmu_hw_events *cpuc = this_cpu_ptr(cpu_pmu->hw_events);
 954	struct pt_regs *regs;
 955	int idx;
 956
 957	/*
 958	 * Get and reset the IRQ flags
 959	 */
 960	pmnc = armv7_pmnc_getreset_flags();
 961
 962	/*
 963	 * Did an overflow occur?
 964	 */
 965	if (!armv7_pmnc_has_overflowed(pmnc))
 966		return IRQ_NONE;
 967
 968	/*
 969	 * Handle the counter(s) overflow(s)
 970	 */
 971	regs = get_irq_regs();
 972
 973	for (idx = 0; idx < cpu_pmu->num_events; ++idx) {
 974		struct perf_event *event = cpuc->events[idx];
 975		struct hw_perf_event *hwc;
 976
 977		/* Ignore if we don't have an event. */
 978		if (!event)
 979			continue;
 980
 981		/*
 982		 * We have a single interrupt for all counters. Check that
 983		 * each counter has overflowed before we process it.
 984		 */
 985		if (!armv7_pmnc_counter_has_overflowed(pmnc, idx))
 986			continue;
 987
 988		hwc = &event->hw;
 989		armpmu_event_update(event);
 990		perf_sample_data_init(&data, 0, hwc->last_period);
 991		if (!armpmu_event_set_period(event))
 992			continue;
 993
 994		if (perf_event_overflow(event, &data, regs))
 995			cpu_pmu->disable(event);
 996	}
 997
 998	/*
 999	 * Handle the pending perf events.
1000	 *
1001	 * Note: this call *must* be run with interrupts disabled. For
1002	 * platforms that can have the PMU interrupts raised as an NMI, this
1003	 * will not work.
1004	 */
1005	irq_work_run();
1006
1007	return IRQ_HANDLED;
1008}
1009
1010static void armv7pmu_start(struct arm_pmu *cpu_pmu)
1011{
1012	unsigned long flags;
1013	struct pmu_hw_events *events = this_cpu_ptr(cpu_pmu->hw_events);
1014
1015	raw_spin_lock_irqsave(&events->pmu_lock, flags);
1016	/* Enable all counters */
1017	armv7_pmnc_write(armv7_pmnc_read() | ARMV7_PMNC_E);
1018	raw_spin_unlock_irqrestore(&events->pmu_lock, flags);
1019}
1020
1021static void armv7pmu_stop(struct arm_pmu *cpu_pmu)
1022{
1023	unsigned long flags;
1024	struct pmu_hw_events *events = this_cpu_ptr(cpu_pmu->hw_events);
1025
1026	raw_spin_lock_irqsave(&events->pmu_lock, flags);
1027	/* Disable all counters */
1028	armv7_pmnc_write(armv7_pmnc_read() & ~ARMV7_PMNC_E);
1029	raw_spin_unlock_irqrestore(&events->pmu_lock, flags);
1030}
1031
1032static int armv7pmu_get_event_idx(struct pmu_hw_events *cpuc,
1033				  struct perf_event *event)
1034{
1035	int idx;
1036	struct arm_pmu *cpu_pmu = to_arm_pmu(event->pmu);
1037	struct hw_perf_event *hwc = &event->hw;
1038	unsigned long evtype = hwc->config_base & ARMV7_EVTYPE_EVENT;
1039
1040	/* Always place a cycle counter into the cycle counter. */
1041	if (evtype == ARMV7_PERFCTR_CPU_CYCLES) {
1042		if (test_and_set_bit(ARMV7_IDX_CYCLE_COUNTER, cpuc->used_mask))
1043			return -EAGAIN;
1044
1045		return ARMV7_IDX_CYCLE_COUNTER;
1046	}
1047
1048	/*
1049	 * For anything other than a cycle counter, try and use
1050	 * the events counters
1051	 */
1052	for (idx = ARMV7_IDX_COUNTER0; idx < cpu_pmu->num_events; ++idx) {
1053		if (!test_and_set_bit(idx, cpuc->used_mask))
1054			return idx;
1055	}
1056
1057	/* The counters are all in use. */
1058	return -EAGAIN;
1059}
1060
1061static void armv7pmu_clear_event_idx(struct pmu_hw_events *cpuc,
1062				     struct perf_event *event)
1063{
1064	clear_bit(event->hw.idx, cpuc->used_mask);
1065}
1066
1067/*
1068 * Add an event filter to a given event. This will only work for PMUv2 PMUs.
1069 */
1070static int armv7pmu_set_event_filter(struct hw_perf_event *event,
1071				     struct perf_event_attr *attr)
1072{
1073	unsigned long config_base = 0;
1074
1075	if (attr->exclude_idle)
1076		return -EPERM;
1077	if (attr->exclude_user)
1078		config_base |= ARMV7_EXCLUDE_USER;
1079	if (attr->exclude_kernel)
1080		config_base |= ARMV7_EXCLUDE_PL1;
1081	if (!attr->exclude_hv)
1082		config_base |= ARMV7_INCLUDE_HYP;
1083
1084	/*
1085	 * Install the filter into config_base as this is used to
1086	 * construct the event type.
1087	 */
1088	event->config_base = config_base;
1089
1090	return 0;
1091}
1092
1093static void armv7pmu_reset(void *info)
1094{
1095	struct arm_pmu *cpu_pmu = (struct arm_pmu *)info;
1096	u32 idx, nb_cnt = cpu_pmu->num_events, val;
1097
1098	if (cpu_pmu->secure_access) {
1099		asm volatile("mrc p15, 0, %0, c1, c1, 1" : "=r" (val));
1100		val |= ARMV7_SDER_SUNIDEN;
1101		asm volatile("mcr p15, 0, %0, c1, c1, 1" : : "r" (val));
1102	}
1103
1104	/* The counter and interrupt enable registers are unknown at reset. */
1105	for (idx = ARMV7_IDX_CYCLE_COUNTER; idx < nb_cnt; ++idx) {
1106		armv7_pmnc_disable_counter(idx);
1107		armv7_pmnc_disable_intens(idx);
1108	}
1109
1110	/* Initialize & Reset PMNC: C and P bits */
1111	armv7_pmnc_write(ARMV7_PMNC_P | ARMV7_PMNC_C);
1112}
1113
1114static int armv7_a8_map_event(struct perf_event *event)
1115{
1116	return armpmu_map_event(event, &armv7_a8_perf_map,
1117				&armv7_a8_perf_cache_map, 0xFF);
1118}
1119
1120static int armv7_a9_map_event(struct perf_event *event)
1121{
1122	return armpmu_map_event(event, &armv7_a9_perf_map,
1123				&armv7_a9_perf_cache_map, 0xFF);
1124}
1125
1126static int armv7_a5_map_event(struct perf_event *event)
1127{
1128	return armpmu_map_event(event, &armv7_a5_perf_map,
1129				&armv7_a5_perf_cache_map, 0xFF);
1130}
1131
1132static int armv7_a15_map_event(struct perf_event *event)
1133{
1134	return armpmu_map_event(event, &armv7_a15_perf_map,
1135				&armv7_a15_perf_cache_map, 0xFF);
1136}
1137
1138static int armv7_a7_map_event(struct perf_event *event)
1139{
1140	return armpmu_map_event(event, &armv7_a7_perf_map,
1141				&armv7_a7_perf_cache_map, 0xFF);
1142}
1143
1144static int armv7_a12_map_event(struct perf_event *event)
1145{
1146	return armpmu_map_event(event, &armv7_a12_perf_map,
1147				&armv7_a12_perf_cache_map, 0xFF);
1148}
1149
1150static int krait_map_event(struct perf_event *event)
1151{
1152	return armpmu_map_event(event, &krait_perf_map,
1153				&krait_perf_cache_map, 0xFFFFF);
1154}
1155
1156static int krait_map_event_no_branch(struct perf_event *event)
1157{
1158	return armpmu_map_event(event, &krait_perf_map_no_branch,
1159				&krait_perf_cache_map, 0xFFFFF);
1160}
1161
1162static int scorpion_map_event(struct perf_event *event)
1163{
1164	return armpmu_map_event(event, &scorpion_perf_map,
1165				&scorpion_perf_cache_map, 0xFFFFF);
1166}
1167
1168static void armv7pmu_init(struct arm_pmu *cpu_pmu)
1169{
1170	cpu_pmu->handle_irq	= armv7pmu_handle_irq;
1171	cpu_pmu->enable		= armv7pmu_enable_event;
1172	cpu_pmu->disable	= armv7pmu_disable_event;
1173	cpu_pmu->read_counter	= armv7pmu_read_counter;
1174	cpu_pmu->write_counter	= armv7pmu_write_counter;
1175	cpu_pmu->get_event_idx	= armv7pmu_get_event_idx;
1176	cpu_pmu->clear_event_idx = armv7pmu_clear_event_idx;
1177	cpu_pmu->start		= armv7pmu_start;
1178	cpu_pmu->stop		= armv7pmu_stop;
1179	cpu_pmu->reset		= armv7pmu_reset;
1180};
1181
1182static void armv7_read_num_pmnc_events(void *info)
1183{
1184	int *nb_cnt = info;
1185
1186	/* Read the nb of CNTx counters supported from PMNC */
1187	*nb_cnt = (armv7_pmnc_read() >> ARMV7_PMNC_N_SHIFT) & ARMV7_PMNC_N_MASK;
1188
1189	/* Add the CPU cycles counter */
1190	*nb_cnt += 1;
1191}
1192
1193static int armv7_probe_num_events(struct arm_pmu *arm_pmu)
1194{
1195	return smp_call_function_any(&arm_pmu->supported_cpus,
1196				     armv7_read_num_pmnc_events,
1197				     &arm_pmu->num_events, 1);
1198}
1199
1200static int armv7_a8_pmu_init(struct arm_pmu *cpu_pmu)
1201{
1202	armv7pmu_init(cpu_pmu);
1203	cpu_pmu->name		= "armv7_cortex_a8";
1204	cpu_pmu->map_event	= armv7_a8_map_event;
1205	cpu_pmu->attr_groups[ARMPMU_ATTR_GROUP_EVENTS] =
1206		&armv7_pmuv1_events_attr_group;
1207	cpu_pmu->attr_groups[ARMPMU_ATTR_GROUP_FORMATS] =
1208		&armv7_pmu_format_attr_group;
1209	return armv7_probe_num_events(cpu_pmu);
1210}
1211
1212static int armv7_a9_pmu_init(struct arm_pmu *cpu_pmu)
1213{
1214	armv7pmu_init(cpu_pmu);
1215	cpu_pmu->name		= "armv7_cortex_a9";
1216	cpu_pmu->map_event	= armv7_a9_map_event;
1217	cpu_pmu->attr_groups[ARMPMU_ATTR_GROUP_EVENTS] =
1218		&armv7_pmuv1_events_attr_group;
1219	cpu_pmu->attr_groups[ARMPMU_ATTR_GROUP_FORMATS] =
1220		&armv7_pmu_format_attr_group;
1221	return armv7_probe_num_events(cpu_pmu);
1222}
1223
1224static int armv7_a5_pmu_init(struct arm_pmu *cpu_pmu)
1225{
1226	armv7pmu_init(cpu_pmu);
1227	cpu_pmu->name		= "armv7_cortex_a5";
1228	cpu_pmu->map_event	= armv7_a5_map_event;
1229	cpu_pmu->attr_groups[ARMPMU_ATTR_GROUP_EVENTS] =
1230		&armv7_pmuv1_events_attr_group;
1231	cpu_pmu->attr_groups[ARMPMU_ATTR_GROUP_FORMATS] =
1232		&armv7_pmu_format_attr_group;
1233	return armv7_probe_num_events(cpu_pmu);
1234}
1235
1236static int armv7_a15_pmu_init(struct arm_pmu *cpu_pmu)
1237{
1238	armv7pmu_init(cpu_pmu);
1239	cpu_pmu->name		= "armv7_cortex_a15";
1240	cpu_pmu->map_event	= armv7_a15_map_event;
1241	cpu_pmu->set_event_filter = armv7pmu_set_event_filter;
1242	cpu_pmu->attr_groups[ARMPMU_ATTR_GROUP_EVENTS] =
1243		&armv7_pmuv2_events_attr_group;
1244	cpu_pmu->attr_groups[ARMPMU_ATTR_GROUP_FORMATS] =
1245		&armv7_pmu_format_attr_group;
1246	return armv7_probe_num_events(cpu_pmu);
1247}
1248
1249static int armv7_a7_pmu_init(struct arm_pmu *cpu_pmu)
1250{
1251	armv7pmu_init(cpu_pmu);
1252	cpu_pmu->name		= "armv7_cortex_a7";
1253	cpu_pmu->map_event	= armv7_a7_map_event;
1254	cpu_pmu->set_event_filter = armv7pmu_set_event_filter;
1255	cpu_pmu->attr_groups[ARMPMU_ATTR_GROUP_EVENTS] =
1256		&armv7_pmuv2_events_attr_group;
1257	cpu_pmu->attr_groups[ARMPMU_ATTR_GROUP_FORMATS] =
1258		&armv7_pmu_format_attr_group;
1259	return armv7_probe_num_events(cpu_pmu);
1260}
1261
1262static int armv7_a12_pmu_init(struct arm_pmu *cpu_pmu)
1263{
1264	armv7pmu_init(cpu_pmu);
1265	cpu_pmu->name		= "armv7_cortex_a12";
1266	cpu_pmu->map_event	= armv7_a12_map_event;
1267	cpu_pmu->set_event_filter = armv7pmu_set_event_filter;
1268	cpu_pmu->attr_groups[ARMPMU_ATTR_GROUP_EVENTS] =
1269		&armv7_pmuv2_events_attr_group;
1270	cpu_pmu->attr_groups[ARMPMU_ATTR_GROUP_FORMATS] =
1271		&armv7_pmu_format_attr_group;
1272	return armv7_probe_num_events(cpu_pmu);
1273}
1274
1275static int armv7_a17_pmu_init(struct arm_pmu *cpu_pmu)
1276{
1277	int ret = armv7_a12_pmu_init(cpu_pmu);
1278	cpu_pmu->name = "armv7_cortex_a17";
1279	cpu_pmu->attr_groups[ARMPMU_ATTR_GROUP_EVENTS] =
1280		&armv7_pmuv2_events_attr_group;
1281	cpu_pmu->attr_groups[ARMPMU_ATTR_GROUP_FORMATS] =
1282		&armv7_pmu_format_attr_group;
1283	return ret;
1284}
1285
1286/*
1287 * Krait Performance Monitor Region Event Selection Register (PMRESRn)
1288 *
1289 *            31   30     24     16     8      0
1290 *            +--------------------------------+
1291 *  PMRESR0   | EN |  CC  |  CC  |  CC  |  CC  |   N = 1, R = 0
1292 *            +--------------------------------+
1293 *  PMRESR1   | EN |  CC  |  CC  |  CC  |  CC  |   N = 1, R = 1
1294 *            +--------------------------------+
1295 *  PMRESR2   | EN |  CC  |  CC  |  CC  |  CC  |   N = 1, R = 2
1296 *            +--------------------------------+
1297 *  VPMRESR0  | EN |  CC  |  CC  |  CC  |  CC  |   N = 2, R = ?
1298 *            +--------------------------------+
1299 *              EN | G=3  | G=2  | G=1  | G=0
1300 *
1301 *  Event Encoding:
1302 *
1303 *      hwc->config_base = 0xNRCCG
1304 *
1305 *      N  = prefix, 1 for Krait CPU (PMRESRn), 2 for Venum VFP (VPMRESR)
1306 *      R  = region register
1307 *      CC = class of events the group G is choosing from
1308 *      G  = group or particular event
1309 *
1310 *  Example: 0x12021 is a Krait CPU event in PMRESR2's group 1 with code 2
1311 *
1312 *  A region (R) corresponds to a piece of the CPU (execution unit, instruction
1313 *  unit, etc.) while the event code (CC) corresponds to a particular class of
1314 *  events (interrupts for example). An event code is broken down into
1315 *  groups (G) that can be mapped into the PMU (irq, fiqs, and irq+fiqs for
1316 *  example).
1317 */
1318
1319#define KRAIT_EVENT		(1 << 16)
1320#define VENUM_EVENT		(2 << 16)
1321#define KRAIT_EVENT_MASK	(KRAIT_EVENT | VENUM_EVENT)
1322#define PMRESRn_EN		BIT(31)
1323
1324#define EVENT_REGION(event)	(((event) >> 12) & 0xf)		/* R */
1325#define EVENT_GROUP(event)	((event) & 0xf)			/* G */
1326#define EVENT_CODE(event)	(((event) >> 4) & 0xff)		/* CC */
1327#define EVENT_VENUM(event)	(!!(event & VENUM_EVENT))	/* N=2 */
1328#define EVENT_CPU(event)	(!!(event & KRAIT_EVENT))	/* N=1 */
1329
1330static u32 krait_read_pmresrn(int n)
1331{
1332	u32 val;
1333
1334	switch (n) {
1335	case 0:
1336		asm volatile("mrc p15, 1, %0, c9, c15, 0" : "=r" (val));
1337		break;
1338	case 1:
1339		asm volatile("mrc p15, 1, %0, c9, c15, 1" : "=r" (val));
1340		break;
1341	case 2:
1342		asm volatile("mrc p15, 1, %0, c9, c15, 2" : "=r" (val));
1343		break;
1344	default:
1345		BUG(); /* Should be validated in krait_pmu_get_event_idx() */
1346	}
1347
1348	return val;
1349}
1350
1351static void krait_write_pmresrn(int n, u32 val)
1352{
1353	switch (n) {
1354	case 0:
1355		asm volatile("mcr p15, 1, %0, c9, c15, 0" : : "r" (val));
1356		break;
1357	case 1:
1358		asm volatile("mcr p15, 1, %0, c9, c15, 1" : : "r" (val));
1359		break;
1360	case 2:
1361		asm volatile("mcr p15, 1, %0, c9, c15, 2" : : "r" (val));
1362		break;
1363	default:
1364		BUG(); /* Should be validated in krait_pmu_get_event_idx() */
1365	}
1366}
1367
1368static u32 venum_read_pmresr(void)
1369{
1370	u32 val;
1371	asm volatile("mrc p10, 7, %0, c11, c0, 0" : "=r" (val));
1372	return val;
1373}
1374
1375static void venum_write_pmresr(u32 val)
1376{
1377	asm volatile("mcr p10, 7, %0, c11, c0, 0" : : "r" (val));
1378}
1379
1380static void venum_pre_pmresr(u32 *venum_orig_val, u32 *fp_orig_val)
1381{
1382	u32 venum_new_val;
1383	u32 fp_new_val;
1384
1385	BUG_ON(preemptible());
1386	/* CPACR Enable CP10 and CP11 access */
1387	*venum_orig_val = get_copro_access();
1388	venum_new_val = *venum_orig_val | CPACC_SVC(10) | CPACC_SVC(11);
1389	set_copro_access(venum_new_val);
1390
1391	/* Enable FPEXC */
1392	*fp_orig_val = fmrx(FPEXC);
1393	fp_new_val = *fp_orig_val | FPEXC_EN;
1394	fmxr(FPEXC, fp_new_val);
1395}
1396
1397static void venum_post_pmresr(u32 venum_orig_val, u32 fp_orig_val)
1398{
1399	BUG_ON(preemptible());
1400	/* Restore FPEXC */
1401	fmxr(FPEXC, fp_orig_val);
1402	isb();
1403	/* Restore CPACR */
1404	set_copro_access(venum_orig_val);
1405}
1406
1407static u32 krait_get_pmresrn_event(unsigned int region)
1408{
1409	static const u32 pmresrn_table[] = { KRAIT_PMRESR0_GROUP0,
1410					     KRAIT_PMRESR1_GROUP0,
1411					     KRAIT_PMRESR2_GROUP0 };
1412	return pmresrn_table[region];
1413}
1414
1415static void krait_evt_setup(int idx, u32 config_base)
1416{
1417	u32 val;
1418	u32 mask;
1419	u32 vval, fval;
1420	unsigned int region = EVENT_REGION(config_base);
1421	unsigned int group = EVENT_GROUP(config_base);
1422	unsigned int code = EVENT_CODE(config_base);
1423	unsigned int group_shift;
1424	bool venum_event = EVENT_VENUM(config_base);
1425
1426	group_shift = group * 8;
1427	mask = 0xff << group_shift;
1428
1429	/* Configure evtsel for the region and group */
1430	if (venum_event)
1431		val = KRAIT_VPMRESR0_GROUP0;
1432	else
1433		val = krait_get_pmresrn_event(region);
1434	val += group;
1435	/* Mix in mode-exclusion bits */
1436	val |= config_base & (ARMV7_EXCLUDE_USER | ARMV7_EXCLUDE_PL1);
1437	armv7_pmnc_write_evtsel(idx, val);
1438
1439	if (venum_event) {
1440		venum_pre_pmresr(&vval, &fval);
1441		val = venum_read_pmresr();
1442		val &= ~mask;
1443		val |= code << group_shift;
1444		val |= PMRESRn_EN;
1445		venum_write_pmresr(val);
1446		venum_post_pmresr(vval, fval);
1447	} else {
1448		val = krait_read_pmresrn(region);
1449		val &= ~mask;
1450		val |= code << group_shift;
1451		val |= PMRESRn_EN;
1452		krait_write_pmresrn(region, val);
1453	}
1454}
1455
1456static u32 clear_pmresrn_group(u32 val, int group)
1457{
1458	u32 mask;
1459	int group_shift;
1460
1461	group_shift = group * 8;
1462	mask = 0xff << group_shift;
1463	val &= ~mask;
1464
1465	/* Don't clear enable bit if entire region isn't disabled */
1466	if (val & ~PMRESRn_EN)
1467		return val |= PMRESRn_EN;
1468
1469	return 0;
1470}
1471
1472static void krait_clearpmu(u32 config_base)
1473{
1474	u32 val;
1475	u32 vval, fval;
1476	unsigned int region = EVENT_REGION(config_base);
1477	unsigned int group = EVENT_GROUP(config_base);
1478	bool venum_event = EVENT_VENUM(config_base);
1479
1480	if (venum_event) {
1481		venum_pre_pmresr(&vval, &fval);
1482		val = venum_read_pmresr();
1483		val = clear_pmresrn_group(val, group);
1484		venum_write_pmresr(val);
1485		venum_post_pmresr(vval, fval);
1486	} else {
1487		val = krait_read_pmresrn(region);
1488		val = clear_pmresrn_group(val, group);
1489		krait_write_pmresrn(region, val);
1490	}
1491}
1492
1493static void krait_pmu_disable_event(struct perf_event *event)
1494{
1495	unsigned long flags;
1496	struct hw_perf_event *hwc = &event->hw;
1497	int idx = hwc->idx;
1498	struct arm_pmu *cpu_pmu = to_arm_pmu(event->pmu);
1499	struct pmu_hw_events *events = this_cpu_ptr(cpu_pmu->hw_events);
1500
1501	/* Disable counter and interrupt */
1502	raw_spin_lock_irqsave(&events->pmu_lock, flags);
1503
1504	/* Disable counter */
1505	armv7_pmnc_disable_counter(idx);
1506
1507	/*
1508	 * Clear pmresr code (if destined for PMNx counters)
1509	 */
1510	if (hwc->config_base & KRAIT_EVENT_MASK)
1511		krait_clearpmu(hwc->config_base);
1512
1513	/* Disable interrupt for this counter */
1514	armv7_pmnc_disable_intens(idx);
1515
1516	raw_spin_unlock_irqrestore(&events->pmu_lock, flags);
1517}
1518
1519static void krait_pmu_enable_event(struct perf_event *event)
1520{
1521	unsigned long flags;
1522	struct hw_perf_event *hwc = &event->hw;
1523	int idx = hwc->idx;
1524	struct arm_pmu *cpu_pmu = to_arm_pmu(event->pmu);
1525	struct pmu_hw_events *events = this_cpu_ptr(cpu_pmu->hw_events);
1526
1527	/*
1528	 * Enable counter and interrupt, and set the counter to count
1529	 * the event that we're interested in.
1530	 */
1531	raw_spin_lock_irqsave(&events->pmu_lock, flags);
1532
1533	/* Disable counter */
1534	armv7_pmnc_disable_counter(idx);
1535
1536	/*
1537	 * Set event (if destined for PMNx counters)
1538	 * We set the event for the cycle counter because we
1539	 * have the ability to perform event filtering.
1540	 */
1541	if (hwc->config_base & KRAIT_EVENT_MASK)
1542		krait_evt_setup(idx, hwc->config_base);
1543	else
1544		armv7_pmnc_write_evtsel(idx, hwc->config_base);
1545
1546	/* Enable interrupt for this counter */
1547	armv7_pmnc_enable_intens(idx);
1548
1549	/* Enable counter */
1550	armv7_pmnc_enable_counter(idx);
1551
1552	raw_spin_unlock_irqrestore(&events->pmu_lock, flags);
1553}
1554
1555static void krait_pmu_reset(void *info)
1556{
1557	u32 vval, fval;
1558	struct arm_pmu *cpu_pmu = info;
1559	u32 idx, nb_cnt = cpu_pmu->num_events;
1560
1561	armv7pmu_reset(info);
1562
1563	/* Clear all pmresrs */
1564	krait_write_pmresrn(0, 0);
1565	krait_write_pmresrn(1, 0);
1566	krait_write_pmresrn(2, 0);
1567
1568	venum_pre_pmresr(&vval, &fval);
1569	venum_write_pmresr(0);
1570	venum_post_pmresr(vval, fval);
1571
1572	/* Reset PMxEVNCTCR to sane default */
1573	for (idx = ARMV7_IDX_CYCLE_COUNTER; idx < nb_cnt; ++idx) {
1574		armv7_pmnc_select_counter(idx);
1575		asm volatile("mcr p15, 0, %0, c9, c15, 0" : : "r" (0));
1576	}
1577
1578}
1579
1580static int krait_event_to_bit(struct perf_event *event, unsigned int region,
1581			      unsigned int group)
1582{
1583	int bit;
1584	struct hw_perf_event *hwc = &event->hw;
1585	struct arm_pmu *cpu_pmu = to_arm_pmu(event->pmu);
1586
1587	if (hwc->config_base & VENUM_EVENT)
1588		bit = KRAIT_VPMRESR0_GROUP0;
1589	else
1590		bit = krait_get_pmresrn_event(region);
1591	bit -= krait_get_pmresrn_event(0);
1592	bit += group;
1593	/*
1594	 * Lower bits are reserved for use by the counters (see
1595	 * armv7pmu_get_event_idx() for more info)
1596	 */
1597	bit += ARMV7_IDX_COUNTER_LAST(cpu_pmu) + 1;
1598
1599	return bit;
1600}
1601
1602/*
1603 * We check for column exclusion constraints here.
1604 * Two events cant use the same group within a pmresr register.
1605 */
1606static int krait_pmu_get_event_idx(struct pmu_hw_events *cpuc,
1607				   struct perf_event *event)
1608{
1609	int idx;
1610	int bit = -1;
1611	struct hw_perf_event *hwc = &event->hw;
1612	unsigned int region = EVENT_REGION(hwc->config_base);
1613	unsigned int code = EVENT_CODE(hwc->config_base);
1614	unsigned int group = EVENT_GROUP(hwc->config_base);
1615	bool venum_event = EVENT_VENUM(hwc->config_base);
1616	bool krait_event = EVENT_CPU(hwc->config_base);
1617
1618	if (venum_event || krait_event) {
1619		/* Ignore invalid events */
1620		if (group > 3 || region > 2)
1621			return -EINVAL;
1622		if (venum_event && (code & 0xe0))
1623			return -EINVAL;
1624
1625		bit = krait_event_to_bit(event, region, group);
1626		if (test_and_set_bit(bit, cpuc->used_mask))
1627			return -EAGAIN;
1628	}
1629
1630	idx = armv7pmu_get_event_idx(cpuc, event);
1631	if (idx < 0 && bit >= 0)
1632		clear_bit(bit, cpuc->used_mask);
1633
1634	return idx;
1635}
1636
1637static void krait_pmu_clear_event_idx(struct pmu_hw_events *cpuc,
1638				      struct perf_event *event)
1639{
1640	int bit;
1641	struct hw_perf_event *hwc = &event->hw;
1642	unsigned int region = EVENT_REGION(hwc->config_base);
1643	unsigned int group = EVENT_GROUP(hwc->config_base);
1644	bool venum_event = EVENT_VENUM(hwc->config_base);
1645	bool krait_event = EVENT_CPU(hwc->config_base);
1646
1647	armv7pmu_clear_event_idx(cpuc, event);
1648	if (venum_event || krait_event) {
1649		bit = krait_event_to_bit(event, region, group);
1650		clear_bit(bit, cpuc->used_mask);
1651	}
1652}
1653
1654static int krait_pmu_init(struct arm_pmu *cpu_pmu)
1655{
1656	armv7pmu_init(cpu_pmu);
1657	cpu_pmu->name		= "armv7_krait";
1658	/* Some early versions of Krait don't support PC write events */
1659	if (of_property_read_bool(cpu_pmu->plat_device->dev.of_node,
1660				  "qcom,no-pc-write"))
1661		cpu_pmu->map_event = krait_map_event_no_branch;
1662	else
1663		cpu_pmu->map_event = krait_map_event;
1664	cpu_pmu->set_event_filter = armv7pmu_set_event_filter;
1665	cpu_pmu->reset		= krait_pmu_reset;
1666	cpu_pmu->enable		= krait_pmu_enable_event;
1667	cpu_pmu->disable	= krait_pmu_disable_event;
1668	cpu_pmu->get_event_idx	= krait_pmu_get_event_idx;
1669	cpu_pmu->clear_event_idx = krait_pmu_clear_event_idx;
1670	return armv7_probe_num_events(cpu_pmu);
1671}
1672
1673/*
1674 * Scorpion Local Performance Monitor Register (LPMn)
1675 *
1676 *            31   30     24     16     8      0
1677 *            +--------------------------------+
1678 *  LPM0      | EN |  CC  |  CC  |  CC  |  CC  |   N = 1, R = 0
1679 *            +--------------------------------+
1680 *  LPM1      | EN |  CC  |  CC  |  CC  |  CC  |   N = 1, R = 1
1681 *            +--------------------------------+
1682 *  LPM2      | EN |  CC  |  CC  |  CC  |  CC  |   N = 1, R = 2
1683 *            +--------------------------------+
1684 *  L2LPM     | EN |  CC  |  CC  |  CC  |  CC  |   N = 1, R = 3
1685 *            +--------------------------------+
1686 *  VLPM      | EN |  CC  |  CC  |  CC  |  CC  |   N = 2, R = ?
1687 *            +--------------------------------+
1688 *              EN | G=3  | G=2  | G=1  | G=0
1689 *
1690 *
1691 *  Event Encoding:
1692 *
1693 *      hwc->config_base = 0xNRCCG
1694 *
1695 *      N  = prefix, 1 for Scorpion CPU (LPMn/L2LPM), 2 for Venum VFP (VLPM)
1696 *      R  = region register
1697 *      CC = class of events the group G is choosing from
1698 *      G  = group or particular event
1699 *
1700 *  Example: 0x12021 is a Scorpion CPU event in LPM2's group 1 with code 2
1701 *
1702 *  A region (R) corresponds to a piece of the CPU (execution unit, instruction
1703 *  unit, etc.) while the event code (CC) corresponds to a particular class of
1704 *  events (interrupts for example). An event code is broken down into
1705 *  groups (G) that can be mapped into the PMU (irq, fiqs, and irq+fiqs for
1706 *  example).
1707 */
1708
1709static u32 scorpion_read_pmresrn(int n)
1710{
1711	u32 val;
1712
1713	switch (n) {
1714	case 0:
1715		asm volatile("mrc p15, 0, %0, c15, c0, 0" : "=r" (val));
1716		break;
1717	case 1:
1718		asm volatile("mrc p15, 1, %0, c15, c0, 0" : "=r" (val));
1719		break;
1720	case 2:
1721		asm volatile("mrc p15, 2, %0, c15, c0, 0" : "=r" (val));
1722		break;
1723	case 3:
1724		asm volatile("mrc p15, 3, %0, c15, c2, 0" : "=r" (val));
1725		break;
1726	default:
1727		BUG(); /* Should be validated in scorpion_pmu_get_event_idx() */
1728	}
1729
1730	return val;
1731}
1732
1733static void scorpion_write_pmresrn(int n, u32 val)
1734{
1735	switch (n) {
1736	case 0:
1737		asm volatile("mcr p15, 0, %0, c15, c0, 0" : : "r" (val));
1738		break;
1739	case 1:
1740		asm volatile("mcr p15, 1, %0, c15, c0, 0" : : "r" (val));
1741		break;
1742	case 2:
1743		asm volatile("mcr p15, 2, %0, c15, c0, 0" : : "r" (val));
1744		break;
1745	case 3:
1746		asm volatile("mcr p15, 3, %0, c15, c2, 0" : : "r" (val));
1747		break;
1748	default:
1749		BUG(); /* Should be validated in scorpion_pmu_get_event_idx() */
1750	}
1751}
1752
1753static u32 scorpion_get_pmresrn_event(unsigned int region)
1754{
1755	static const u32 pmresrn_table[] = { SCORPION_LPM0_GROUP0,
1756					     SCORPION_LPM1_GROUP0,
1757					     SCORPION_LPM2_GROUP0,
1758					     SCORPION_L2LPM_GROUP0 };
1759	return pmresrn_table[region];
1760}
1761
1762static void scorpion_evt_setup(int idx, u32 config_base)
1763{
1764	u32 val;
1765	u32 mask;
1766	u32 vval, fval;
1767	unsigned int region = EVENT_REGION(config_base);
1768	unsigned int group = EVENT_GROUP(config_base);
1769	unsigned int code = EVENT_CODE(config_base);
1770	unsigned int group_shift;
1771	bool venum_event = EVENT_VENUM(config_base);
1772
1773	group_shift = group * 8;
1774	mask = 0xff << group_shift;
1775
1776	/* Configure evtsel for the region and group */
1777	if (venum_event)
1778		val = SCORPION_VLPM_GROUP0;
1779	else
1780		val = scorpion_get_pmresrn_event(region);
1781	val += group;
1782	/* Mix in mode-exclusion bits */
1783	val |= config_base & (ARMV7_EXCLUDE_USER | ARMV7_EXCLUDE_PL1);
1784	armv7_pmnc_write_evtsel(idx, val);
1785
1786	asm volatile("mcr p15, 0, %0, c9, c15, 0" : : "r" (0));
1787
1788	if (venum_event) {
1789		venum_pre_pmresr(&vval, &fval);
1790		val = venum_read_pmresr();
1791		val &= ~mask;
1792		val |= code << group_shift;
1793		val |= PMRESRn_EN;
1794		venum_write_pmresr(val);
1795		venum_post_pmresr(vval, fval);
1796	} else {
1797		val = scorpion_read_pmresrn(region);
1798		val &= ~mask;
1799		val |= code << group_shift;
1800		val |= PMRESRn_EN;
1801		scorpion_write_pmresrn(region, val);
1802	}
1803}
1804
1805static void scorpion_clearpmu(u32 config_base)
1806{
1807	u32 val;
1808	u32 vval, fval;
1809	unsigned int region = EVENT_REGION(config_base);
1810	unsigned int group = EVENT_GROUP(config_base);
1811	bool venum_event = EVENT_VENUM(config_base);
1812
1813	if (venum_event) {
1814		venum_pre_pmresr(&vval, &fval);
1815		val = venum_read_pmresr();
1816		val = clear_pmresrn_group(val, group);
1817		venum_write_pmresr(val);
1818		venum_post_pmresr(vval, fval);
1819	} else {
1820		val = scorpion_read_pmresrn(region);
1821		val = clear_pmresrn_group(val, group);
1822		scorpion_write_pmresrn(region, val);
1823	}
1824}
1825
1826static void scorpion_pmu_disable_event(struct perf_event *event)
1827{
1828	unsigned long flags;
1829	struct hw_perf_event *hwc = &event->hw;
1830	int idx = hwc->idx;
1831	struct arm_pmu *cpu_pmu = to_arm_pmu(event->pmu);
1832	struct pmu_hw_events *events = this_cpu_ptr(cpu_pmu->hw_events);
1833
1834	/* Disable counter and interrupt */
1835	raw_spin_lock_irqsave(&events->pmu_lock, flags);
1836
1837	/* Disable counter */
1838	armv7_pmnc_disable_counter(idx);
1839
1840	/*
1841	 * Clear pmresr code (if destined for PMNx counters)
1842	 */
1843	if (hwc->config_base & KRAIT_EVENT_MASK)
1844		scorpion_clearpmu(hwc->config_base);
1845
1846	/* Disable interrupt for this counter */
1847	armv7_pmnc_disable_intens(idx);
1848
1849	raw_spin_unlock_irqrestore(&events->pmu_lock, flags);
1850}
1851
1852static void scorpion_pmu_enable_event(struct perf_event *event)
1853{
1854	unsigned long flags;
1855	struct hw_perf_event *hwc = &event->hw;
1856	int idx = hwc->idx;
1857	struct arm_pmu *cpu_pmu = to_arm_pmu(event->pmu);
1858	struct pmu_hw_events *events = this_cpu_ptr(cpu_pmu->hw_events);
1859
1860	/*
1861	 * Enable counter and interrupt, and set the counter to count
1862	 * the event that we're interested in.
1863	 */
1864	raw_spin_lock_irqsave(&events->pmu_lock, flags);
1865
1866	/* Disable counter */
1867	armv7_pmnc_disable_counter(idx);
1868
1869	/*
1870	 * Set event (if destined for PMNx counters)
1871	 * We don't set the event for the cycle counter because we
1872	 * don't have the ability to perform event filtering.
1873	 */
1874	if (hwc->config_base & KRAIT_EVENT_MASK)
1875		scorpion_evt_setup(idx, hwc->config_base);
1876	else if (idx != ARMV7_IDX_CYCLE_COUNTER)
1877		armv7_pmnc_write_evtsel(idx, hwc->config_base);
1878
1879	/* Enable interrupt for this counter */
1880	armv7_pmnc_enable_intens(idx);
1881
1882	/* Enable counter */
1883	armv7_pmnc_enable_counter(idx);
1884
1885	raw_spin_unlock_irqrestore(&events->pmu_lock, flags);
1886}
1887
1888static void scorpion_pmu_reset(void *info)
1889{
1890	u32 vval, fval;
1891	struct arm_pmu *cpu_pmu = info;
1892	u32 idx, nb_cnt = cpu_pmu->num_events;
1893
1894	armv7pmu_reset(info);
1895
1896	/* Clear all pmresrs */
1897	scorpion_write_pmresrn(0, 0);
1898	scorpion_write_pmresrn(1, 0);
1899	scorpion_write_pmresrn(2, 0);
1900	scorpion_write_pmresrn(3, 0);
1901
1902	venum_pre_pmresr(&vval, &fval);
1903	venum_write_pmresr(0);
1904	venum_post_pmresr(vval, fval);
1905
1906	/* Reset PMxEVNCTCR to sane default */
1907	for (idx = ARMV7_IDX_CYCLE_COUNTER; idx < nb_cnt; ++idx) {
1908		armv7_pmnc_select_counter(idx);
1909		asm volatile("mcr p15, 0, %0, c9, c15, 0" : : "r" (0));
1910	}
1911}
1912
1913static int scorpion_event_to_bit(struct perf_event *event, unsigned int region,
1914			      unsigned int group)
1915{
1916	int bit;
1917	struct hw_perf_event *hwc = &event->hw;
1918	struct arm_pmu *cpu_pmu = to_arm_pmu(event->pmu);
1919
1920	if (hwc->config_base & VENUM_EVENT)
1921		bit = SCORPION_VLPM_GROUP0;
1922	else
1923		bit = scorpion_get_pmresrn_event(region);
1924	bit -= scorpion_get_pmresrn_event(0);
1925	bit += group;
1926	/*
1927	 * Lower bits are reserved for use by the counters (see
1928	 * armv7pmu_get_event_idx() for more info)
1929	 */
1930	bit += ARMV7_IDX_COUNTER_LAST(cpu_pmu) + 1;
1931
1932	return bit;
1933}
1934
1935/*
1936 * We check for column exclusion constraints here.
1937 * Two events cant use the same group within a pmresr register.
1938 */
1939static int scorpion_pmu_get_event_idx(struct pmu_hw_events *cpuc,
1940				   struct perf_event *event)
1941{
1942	int idx;
1943	int bit = -1;
1944	struct hw_perf_event *hwc = &event->hw;
1945	unsigned int region = EVENT_REGION(hwc->config_base);
1946	unsigned int group = EVENT_GROUP(hwc->config_base);
1947	bool venum_event = EVENT_VENUM(hwc->config_base);
1948	bool scorpion_event = EVENT_CPU(hwc->config_base);
1949
1950	if (venum_event || scorpion_event) {
1951		/* Ignore invalid events */
1952		if (group > 3 || region > 3)
1953			return -EINVAL;
1954
1955		bit = scorpion_event_to_bit(event, region, group);
1956		if (test_and_set_bit(bit, cpuc->used_mask))
1957			return -EAGAIN;
1958	}
1959
1960	idx = armv7pmu_get_event_idx(cpuc, event);
1961	if (idx < 0 && bit >= 0)
1962		clear_bit(bit, cpuc->used_mask);
1963
1964	return idx;
1965}
1966
1967static void scorpion_pmu_clear_event_idx(struct pmu_hw_events *cpuc,
1968				      struct perf_event *event)
1969{
1970	int bit;
1971	struct hw_perf_event *hwc = &event->hw;
1972	unsigned int region = EVENT_REGION(hwc->config_base);
1973	unsigned int group = EVENT_GROUP(hwc->config_base);
1974	bool venum_event = EVENT_VENUM(hwc->config_base);
1975	bool scorpion_event = EVENT_CPU(hwc->config_base);
1976
1977	armv7pmu_clear_event_idx(cpuc, event);
1978	if (venum_event || scorpion_event) {
1979		bit = scorpion_event_to_bit(event, region, group);
1980		clear_bit(bit, cpuc->used_mask);
1981	}
1982}
1983
1984static int scorpion_pmu_init(struct arm_pmu *cpu_pmu)
1985{
1986	armv7pmu_init(cpu_pmu);
1987	cpu_pmu->name		= "armv7_scorpion";
1988	cpu_pmu->map_event	= scorpion_map_event;
1989	cpu_pmu->reset		= scorpion_pmu_reset;
1990	cpu_pmu->enable		= scorpion_pmu_enable_event;
1991	cpu_pmu->disable	= scorpion_pmu_disable_event;
1992	cpu_pmu->get_event_idx	= scorpion_pmu_get_event_idx;
1993	cpu_pmu->clear_event_idx = scorpion_pmu_clear_event_idx;
1994	return armv7_probe_num_events(cpu_pmu);
1995}
1996
1997static int scorpion_mp_pmu_init(struct arm_pmu *cpu_pmu)
1998{
1999	armv7pmu_init(cpu_pmu);
2000	cpu_pmu->name		= "armv7_scorpion_mp";
2001	cpu_pmu->map_event	= scorpion_map_event;
2002	cpu_pmu->reset		= scorpion_pmu_reset;
2003	cpu_pmu->enable		= scorpion_pmu_enable_event;
2004	cpu_pmu->disable	= scorpion_pmu_disable_event;
2005	cpu_pmu->get_event_idx	= scorpion_pmu_get_event_idx;
2006	cpu_pmu->clear_event_idx = scorpion_pmu_clear_event_idx;
2007	return armv7_probe_num_events(cpu_pmu);
2008}
2009
2010static const struct of_device_id armv7_pmu_of_device_ids[] = {
2011	{.compatible = "arm,cortex-a17-pmu",	.data = armv7_a17_pmu_init},
2012	{.compatible = "arm,cortex-a15-pmu",	.data = armv7_a15_pmu_init},
2013	{.compatible = "arm,cortex-a12-pmu",	.data = armv7_a12_pmu_init},
2014	{.compatible = "arm,cortex-a9-pmu",	.data = armv7_a9_pmu_init},
2015	{.compatible = "arm,cortex-a8-pmu",	.data = armv7_a8_pmu_init},
2016	{.compatible = "arm,cortex-a7-pmu",	.data = armv7_a7_pmu_init},
2017	{.compatible = "arm,cortex-a5-pmu",	.data = armv7_a5_pmu_init},
2018	{.compatible = "qcom,krait-pmu",	.data = krait_pmu_init},
2019	{.compatible = "qcom,scorpion-pmu",	.data = scorpion_pmu_init},
2020	{.compatible = "qcom,scorpion-mp-pmu",	.data = scorpion_mp_pmu_init},
2021	{},
2022};
2023
2024static const struct pmu_probe_info armv7_pmu_probe_table[] = {
2025	ARM_PMU_PROBE(ARM_CPU_PART_CORTEX_A8, armv7_a8_pmu_init),
2026	ARM_PMU_PROBE(ARM_CPU_PART_CORTEX_A9, armv7_a9_pmu_init),
2027	{ /* sentinel value */ }
2028};
2029
2030
2031static int armv7_pmu_device_probe(struct platform_device *pdev)
2032{
2033	return arm_pmu_device_probe(pdev, armv7_pmu_of_device_ids,
2034				    armv7_pmu_probe_table);
2035}
2036
2037static struct platform_driver armv7_pmu_driver = {
2038	.driver		= {
2039		.name	= "armv7-pmu",
2040		.of_match_table = armv7_pmu_of_device_ids,
2041		.suppress_bind_attrs = true,
2042	},
2043	.probe		= armv7_pmu_device_probe,
2044};
2045
2046builtin_platform_driver(armv7_pmu_driver);
2047#endif	/* CONFIG_CPU_V7 */