• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 // SPDX-License-Identifier: GPL-2.0
2 /*
3  * ARMv5 [xscale] Performance counter handling code.
4  *
5  * Copyright (C) 2010, ARM Ltd., Will Deacon <will.deacon@arm.com>
6  *
7  * Based on the previous xscale OProfile code.
8  *
9  * There are two variants of the xscale PMU that we support:
10  * 	- xscale1pmu: 2 event counters and a cycle counter
11  * 	- xscale2pmu: 4 event counters and a cycle counter
12  * The two variants share event definitions, but have different
13  * PMU structures.
14  */
15 
16 #ifdef CONFIG_CPU_XSCALE
17 
18 #include <asm/cputype.h>
19 #include <asm/irq_regs.h>
20 
21 #include <linux/of.h>
22 #include <linux/perf/arm_pmu.h>
23 #include <linux/platform_device.h>
24 
25 enum xscale_perf_types {
26 	XSCALE_PERFCTR_ICACHE_MISS		= 0x00,
27 	XSCALE_PERFCTR_ICACHE_NO_DELIVER	= 0x01,
28 	XSCALE_PERFCTR_DATA_STALL		= 0x02,
29 	XSCALE_PERFCTR_ITLB_MISS		= 0x03,
30 	XSCALE_PERFCTR_DTLB_MISS		= 0x04,
31 	XSCALE_PERFCTR_BRANCH			= 0x05,
32 	XSCALE_PERFCTR_BRANCH_MISS		= 0x06,
33 	XSCALE_PERFCTR_INSTRUCTION		= 0x07,
34 	XSCALE_PERFCTR_DCACHE_FULL_STALL	= 0x08,
35 	XSCALE_PERFCTR_DCACHE_FULL_STALL_CONTIG	= 0x09,
36 	XSCALE_PERFCTR_DCACHE_ACCESS		= 0x0A,
37 	XSCALE_PERFCTR_DCACHE_MISS		= 0x0B,
38 	XSCALE_PERFCTR_DCACHE_WRITE_BACK	= 0x0C,
39 	XSCALE_PERFCTR_PC_CHANGED		= 0x0D,
40 	XSCALE_PERFCTR_BCU_REQUEST		= 0x10,
41 	XSCALE_PERFCTR_BCU_FULL			= 0x11,
42 	XSCALE_PERFCTR_BCU_DRAIN		= 0x12,
43 	XSCALE_PERFCTR_BCU_ECC_NO_ELOG		= 0x14,
44 	XSCALE_PERFCTR_BCU_1_BIT_ERR		= 0x15,
45 	XSCALE_PERFCTR_RMW			= 0x16,
46 	/* XSCALE_PERFCTR_CCNT is not hardware defined */
47 	XSCALE_PERFCTR_CCNT			= 0xFE,
48 	XSCALE_PERFCTR_UNUSED			= 0xFF,
49 };
50 
51 enum xscale_counters {
52 	XSCALE_CYCLE_COUNTER	= 0,
53 	XSCALE_COUNTER0,
54 	XSCALE_COUNTER1,
55 	XSCALE_COUNTER2,
56 	XSCALE_COUNTER3,
57 };
58 
59 static const unsigned xscale_perf_map[PERF_COUNT_HW_MAX] = {
60 	PERF_MAP_ALL_UNSUPPORTED,
61 	[PERF_COUNT_HW_CPU_CYCLES]		= XSCALE_PERFCTR_CCNT,
62 	[PERF_COUNT_HW_INSTRUCTIONS]		= XSCALE_PERFCTR_INSTRUCTION,
63 	[PERF_COUNT_HW_BRANCH_INSTRUCTIONS]	= XSCALE_PERFCTR_BRANCH,
64 	[PERF_COUNT_HW_BRANCH_MISSES]		= XSCALE_PERFCTR_BRANCH_MISS,
65 	[PERF_COUNT_HW_STALLED_CYCLES_FRONTEND]	= XSCALE_PERFCTR_ICACHE_NO_DELIVER,
66 };
67 
68 static const unsigned xscale_perf_cache_map[PERF_COUNT_HW_CACHE_MAX]
69 					   [PERF_COUNT_HW_CACHE_OP_MAX]
70 					   [PERF_COUNT_HW_CACHE_RESULT_MAX] = {
71 	PERF_CACHE_MAP_ALL_UNSUPPORTED,
72 
73 	[C(L1D)][C(OP_READ)][C(RESULT_ACCESS)]	= XSCALE_PERFCTR_DCACHE_ACCESS,
74 	[C(L1D)][C(OP_READ)][C(RESULT_MISS)]	= XSCALE_PERFCTR_DCACHE_MISS,
75 	[C(L1D)][C(OP_WRITE)][C(RESULT_ACCESS)]	= XSCALE_PERFCTR_DCACHE_ACCESS,
76 	[C(L1D)][C(OP_WRITE)][C(RESULT_MISS)]	= XSCALE_PERFCTR_DCACHE_MISS,
77 
78 	[C(L1I)][C(OP_READ)][C(RESULT_MISS)]	= XSCALE_PERFCTR_ICACHE_MISS,
79 
80 	[C(DTLB)][C(OP_READ)][C(RESULT_MISS)]	= XSCALE_PERFCTR_DTLB_MISS,
81 	[C(DTLB)][C(OP_WRITE)][C(RESULT_MISS)]	= XSCALE_PERFCTR_DTLB_MISS,
82 
83 	[C(ITLB)][C(OP_READ)][C(RESULT_MISS)]	= XSCALE_PERFCTR_ITLB_MISS,
84 	[C(ITLB)][C(OP_WRITE)][C(RESULT_MISS)]	= XSCALE_PERFCTR_ITLB_MISS,
85 };
86 
87 #define	XSCALE_PMU_ENABLE	0x001
88 #define XSCALE_PMN_RESET	0x002
89 #define	XSCALE_CCNT_RESET	0x004
90 #define	XSCALE_PMU_RESET	(CCNT_RESET | PMN_RESET)
91 #define XSCALE_PMU_CNT64	0x008
92 
93 #define XSCALE1_OVERFLOWED_MASK	0x700
94 #define XSCALE1_CCOUNT_OVERFLOW	0x400
95 #define XSCALE1_COUNT0_OVERFLOW	0x100
96 #define XSCALE1_COUNT1_OVERFLOW	0x200
97 #define XSCALE1_CCOUNT_INT_EN	0x040
98 #define XSCALE1_COUNT0_INT_EN	0x010
99 #define XSCALE1_COUNT1_INT_EN	0x020
100 #define XSCALE1_COUNT0_EVT_SHFT	12
101 #define XSCALE1_COUNT0_EVT_MASK	(0xff << XSCALE1_COUNT0_EVT_SHFT)
102 #define XSCALE1_COUNT1_EVT_SHFT	20
103 #define XSCALE1_COUNT1_EVT_MASK	(0xff << XSCALE1_COUNT1_EVT_SHFT)
104 
105 static inline u32
xscale1pmu_read_pmnc(void)106 xscale1pmu_read_pmnc(void)
107 {
108 	u32 val;
109 	asm volatile("mrc p14, 0, %0, c0, c0, 0" : "=r" (val));
110 	return val;
111 }
112 
113 static inline void
xscale1pmu_write_pmnc(u32 val)114 xscale1pmu_write_pmnc(u32 val)
115 {
116 	/* upper 4bits and 7, 11 are write-as-0 */
117 	val &= 0xffff77f;
118 	asm volatile("mcr p14, 0, %0, c0, c0, 0" : : "r" (val));
119 }
120 
121 static inline int
xscale1_pmnc_counter_has_overflowed(unsigned long pmnc,enum xscale_counters counter)122 xscale1_pmnc_counter_has_overflowed(unsigned long pmnc,
123 					enum xscale_counters counter)
124 {
125 	int ret = 0;
126 
127 	switch (counter) {
128 	case XSCALE_CYCLE_COUNTER:
129 		ret = pmnc & XSCALE1_CCOUNT_OVERFLOW;
130 		break;
131 	case XSCALE_COUNTER0:
132 		ret = pmnc & XSCALE1_COUNT0_OVERFLOW;
133 		break;
134 	case XSCALE_COUNTER1:
135 		ret = pmnc & XSCALE1_COUNT1_OVERFLOW;
136 		break;
137 	default:
138 		WARN_ONCE(1, "invalid counter number (%d)\n", counter);
139 	}
140 
141 	return ret;
142 }
143 
144 static irqreturn_t
xscale1pmu_handle_irq(struct arm_pmu * cpu_pmu)145 xscale1pmu_handle_irq(struct arm_pmu *cpu_pmu)
146 {
147 	unsigned long pmnc;
148 	struct perf_sample_data data;
149 	struct pmu_hw_events *cpuc = this_cpu_ptr(cpu_pmu->hw_events);
150 	struct pt_regs *regs;
151 	int idx;
152 
153 	/*
154 	 * NOTE: there's an A stepping erratum that states if an overflow
155 	 *       bit already exists and another occurs, the previous
156 	 *       Overflow bit gets cleared. There's no workaround.
157 	 *	 Fixed in B stepping or later.
158 	 */
159 	pmnc = xscale1pmu_read_pmnc();
160 
161 	/*
162 	 * Write the value back to clear the overflow flags. Overflow
163 	 * flags remain in pmnc for use below. We also disable the PMU
164 	 * while we process the interrupt.
165 	 */
166 	xscale1pmu_write_pmnc(pmnc & ~XSCALE_PMU_ENABLE);
167 
168 	if (!(pmnc & XSCALE1_OVERFLOWED_MASK))
169 		return IRQ_NONE;
170 
171 	regs = get_irq_regs();
172 
173 	for (idx = 0; idx < cpu_pmu->num_events; ++idx) {
174 		struct perf_event *event = cpuc->events[idx];
175 		struct hw_perf_event *hwc;
176 
177 		if (!event)
178 			continue;
179 
180 		if (!xscale1_pmnc_counter_has_overflowed(pmnc, idx))
181 			continue;
182 
183 		hwc = &event->hw;
184 		armpmu_event_update(event);
185 		perf_sample_data_init(&data, 0, hwc->last_period);
186 		if (!armpmu_event_set_period(event))
187 			continue;
188 
189 		if (perf_event_overflow(event, &data, regs))
190 			cpu_pmu->disable(event);
191 	}
192 
193 	irq_work_run();
194 
195 	/*
196 	 * Re-enable the PMU.
197 	 */
198 	pmnc = xscale1pmu_read_pmnc() | XSCALE_PMU_ENABLE;
199 	xscale1pmu_write_pmnc(pmnc);
200 
201 	return IRQ_HANDLED;
202 }
203 
xscale1pmu_enable_event(struct perf_event * event)204 static void xscale1pmu_enable_event(struct perf_event *event)
205 {
206 	unsigned long val, mask, evt, flags;
207 	struct arm_pmu *cpu_pmu = to_arm_pmu(event->pmu);
208 	struct hw_perf_event *hwc = &event->hw;
209 	struct pmu_hw_events *events = this_cpu_ptr(cpu_pmu->hw_events);
210 	int idx = hwc->idx;
211 
212 	switch (idx) {
213 	case XSCALE_CYCLE_COUNTER:
214 		mask = 0;
215 		evt = XSCALE1_CCOUNT_INT_EN;
216 		break;
217 	case XSCALE_COUNTER0:
218 		mask = XSCALE1_COUNT0_EVT_MASK;
219 		evt = (hwc->config_base << XSCALE1_COUNT0_EVT_SHFT) |
220 			XSCALE1_COUNT0_INT_EN;
221 		break;
222 	case XSCALE_COUNTER1:
223 		mask = XSCALE1_COUNT1_EVT_MASK;
224 		evt = (hwc->config_base << XSCALE1_COUNT1_EVT_SHFT) |
225 			XSCALE1_COUNT1_INT_EN;
226 		break;
227 	default:
228 		WARN_ONCE(1, "invalid counter number (%d)\n", idx);
229 		return;
230 	}
231 
232 	raw_spin_lock_irqsave(&events->pmu_lock, flags);
233 	val = xscale1pmu_read_pmnc();
234 	val &= ~mask;
235 	val |= evt;
236 	xscale1pmu_write_pmnc(val);
237 	raw_spin_unlock_irqrestore(&events->pmu_lock, flags);
238 }
239 
xscale1pmu_disable_event(struct perf_event * event)240 static void xscale1pmu_disable_event(struct perf_event *event)
241 {
242 	unsigned long val, mask, evt, flags;
243 	struct arm_pmu *cpu_pmu = to_arm_pmu(event->pmu);
244 	struct hw_perf_event *hwc = &event->hw;
245 	struct pmu_hw_events *events = this_cpu_ptr(cpu_pmu->hw_events);
246 	int idx = hwc->idx;
247 
248 	switch (idx) {
249 	case XSCALE_CYCLE_COUNTER:
250 		mask = XSCALE1_CCOUNT_INT_EN;
251 		evt = 0;
252 		break;
253 	case XSCALE_COUNTER0:
254 		mask = XSCALE1_COUNT0_INT_EN | XSCALE1_COUNT0_EVT_MASK;
255 		evt = XSCALE_PERFCTR_UNUSED << XSCALE1_COUNT0_EVT_SHFT;
256 		break;
257 	case XSCALE_COUNTER1:
258 		mask = XSCALE1_COUNT1_INT_EN | XSCALE1_COUNT1_EVT_MASK;
259 		evt = XSCALE_PERFCTR_UNUSED << XSCALE1_COUNT1_EVT_SHFT;
260 		break;
261 	default:
262 		WARN_ONCE(1, "invalid counter number (%d)\n", idx);
263 		return;
264 	}
265 
266 	raw_spin_lock_irqsave(&events->pmu_lock, flags);
267 	val = xscale1pmu_read_pmnc();
268 	val &= ~mask;
269 	val |= evt;
270 	xscale1pmu_write_pmnc(val);
271 	raw_spin_unlock_irqrestore(&events->pmu_lock, flags);
272 }
273 
274 static int
xscale1pmu_get_event_idx(struct pmu_hw_events * cpuc,struct perf_event * event)275 xscale1pmu_get_event_idx(struct pmu_hw_events *cpuc,
276 				struct perf_event *event)
277 {
278 	struct hw_perf_event *hwc = &event->hw;
279 	if (XSCALE_PERFCTR_CCNT == hwc->config_base) {
280 		if (test_and_set_bit(XSCALE_CYCLE_COUNTER, cpuc->used_mask))
281 			return -EAGAIN;
282 
283 		return XSCALE_CYCLE_COUNTER;
284 	} else {
285 		if (!test_and_set_bit(XSCALE_COUNTER1, cpuc->used_mask))
286 			return XSCALE_COUNTER1;
287 
288 		if (!test_and_set_bit(XSCALE_COUNTER0, cpuc->used_mask))
289 			return XSCALE_COUNTER0;
290 
291 		return -EAGAIN;
292 	}
293 }
294 
xscalepmu_clear_event_idx(struct pmu_hw_events * cpuc,struct perf_event * event)295 static void xscalepmu_clear_event_idx(struct pmu_hw_events *cpuc,
296 				     struct perf_event *event)
297 {
298 	clear_bit(event->hw.idx, cpuc->used_mask);
299 }
300 
xscale1pmu_start(struct arm_pmu * cpu_pmu)301 static void xscale1pmu_start(struct arm_pmu *cpu_pmu)
302 {
303 	unsigned long flags, val;
304 	struct pmu_hw_events *events = this_cpu_ptr(cpu_pmu->hw_events);
305 
306 	raw_spin_lock_irqsave(&events->pmu_lock, flags);
307 	val = xscale1pmu_read_pmnc();
308 	val |= XSCALE_PMU_ENABLE;
309 	xscale1pmu_write_pmnc(val);
310 	raw_spin_unlock_irqrestore(&events->pmu_lock, flags);
311 }
312 
xscale1pmu_stop(struct arm_pmu * cpu_pmu)313 static void xscale1pmu_stop(struct arm_pmu *cpu_pmu)
314 {
315 	unsigned long flags, val;
316 	struct pmu_hw_events *events = this_cpu_ptr(cpu_pmu->hw_events);
317 
318 	raw_spin_lock_irqsave(&events->pmu_lock, flags);
319 	val = xscale1pmu_read_pmnc();
320 	val &= ~XSCALE_PMU_ENABLE;
321 	xscale1pmu_write_pmnc(val);
322 	raw_spin_unlock_irqrestore(&events->pmu_lock, flags);
323 }
324 
xscale1pmu_read_counter(struct perf_event * event)325 static inline u64 xscale1pmu_read_counter(struct perf_event *event)
326 {
327 	struct hw_perf_event *hwc = &event->hw;
328 	int counter = hwc->idx;
329 	u32 val = 0;
330 
331 	switch (counter) {
332 	case XSCALE_CYCLE_COUNTER:
333 		asm volatile("mrc p14, 0, %0, c1, c0, 0" : "=r" (val));
334 		break;
335 	case XSCALE_COUNTER0:
336 		asm volatile("mrc p14, 0, %0, c2, c0, 0" : "=r" (val));
337 		break;
338 	case XSCALE_COUNTER1:
339 		asm volatile("mrc p14, 0, %0, c3, c0, 0" : "=r" (val));
340 		break;
341 	}
342 
343 	return val;
344 }
345 
xscale1pmu_write_counter(struct perf_event * event,u64 val)346 static inline void xscale1pmu_write_counter(struct perf_event *event, u64 val)
347 {
348 	struct hw_perf_event *hwc = &event->hw;
349 	int counter = hwc->idx;
350 
351 	switch (counter) {
352 	case XSCALE_CYCLE_COUNTER:
353 		asm volatile("mcr p14, 0, %0, c1, c0, 0" : : "r" (val));
354 		break;
355 	case XSCALE_COUNTER0:
356 		asm volatile("mcr p14, 0, %0, c2, c0, 0" : : "r" (val));
357 		break;
358 	case XSCALE_COUNTER1:
359 		asm volatile("mcr p14, 0, %0, c3, c0, 0" : : "r" (val));
360 		break;
361 	}
362 }
363 
xscale_map_event(struct perf_event * event)364 static int xscale_map_event(struct perf_event *event)
365 {
366 	return armpmu_map_event(event, &xscale_perf_map,
367 				&xscale_perf_cache_map, 0xFF);
368 }
369 
xscale1pmu_init(struct arm_pmu * cpu_pmu)370 static int xscale1pmu_init(struct arm_pmu *cpu_pmu)
371 {
372 	cpu_pmu->name		= "armv5_xscale1";
373 	cpu_pmu->handle_irq	= xscale1pmu_handle_irq;
374 	cpu_pmu->enable		= xscale1pmu_enable_event;
375 	cpu_pmu->disable	= xscale1pmu_disable_event;
376 	cpu_pmu->read_counter	= xscale1pmu_read_counter;
377 	cpu_pmu->write_counter	= xscale1pmu_write_counter;
378 	cpu_pmu->get_event_idx	= xscale1pmu_get_event_idx;
379 	cpu_pmu->clear_event_idx = xscalepmu_clear_event_idx;
380 	cpu_pmu->start		= xscale1pmu_start;
381 	cpu_pmu->stop		= xscale1pmu_stop;
382 	cpu_pmu->map_event	= xscale_map_event;
383 	cpu_pmu->num_events	= 3;
384 
385 	return 0;
386 }
387 
388 #define XSCALE2_OVERFLOWED_MASK	0x01f
389 #define XSCALE2_CCOUNT_OVERFLOW	0x001
390 #define XSCALE2_COUNT0_OVERFLOW	0x002
391 #define XSCALE2_COUNT1_OVERFLOW	0x004
392 #define XSCALE2_COUNT2_OVERFLOW	0x008
393 #define XSCALE2_COUNT3_OVERFLOW	0x010
394 #define XSCALE2_CCOUNT_INT_EN	0x001
395 #define XSCALE2_COUNT0_INT_EN	0x002
396 #define XSCALE2_COUNT1_INT_EN	0x004
397 #define XSCALE2_COUNT2_INT_EN	0x008
398 #define XSCALE2_COUNT3_INT_EN	0x010
399 #define XSCALE2_COUNT0_EVT_SHFT	0
400 #define XSCALE2_COUNT0_EVT_MASK	(0xff << XSCALE2_COUNT0_EVT_SHFT)
401 #define XSCALE2_COUNT1_EVT_SHFT	8
402 #define XSCALE2_COUNT1_EVT_MASK	(0xff << XSCALE2_COUNT1_EVT_SHFT)
403 #define XSCALE2_COUNT2_EVT_SHFT	16
404 #define XSCALE2_COUNT2_EVT_MASK	(0xff << XSCALE2_COUNT2_EVT_SHFT)
405 #define XSCALE2_COUNT3_EVT_SHFT	24
406 #define XSCALE2_COUNT3_EVT_MASK	(0xff << XSCALE2_COUNT3_EVT_SHFT)
407 
408 static inline u32
xscale2pmu_read_pmnc(void)409 xscale2pmu_read_pmnc(void)
410 {
411 	u32 val;
412 	asm volatile("mrc p14, 0, %0, c0, c1, 0" : "=r" (val));
413 	/* bits 1-2 and 4-23 are read-unpredictable */
414 	return val & 0xff000009;
415 }
416 
417 static inline void
xscale2pmu_write_pmnc(u32 val)418 xscale2pmu_write_pmnc(u32 val)
419 {
420 	/* bits 4-23 are write-as-0, 24-31 are write ignored */
421 	val &= 0xf;
422 	asm volatile("mcr p14, 0, %0, c0, c1, 0" : : "r" (val));
423 }
424 
425 static inline u32
xscale2pmu_read_overflow_flags(void)426 xscale2pmu_read_overflow_flags(void)
427 {
428 	u32 val;
429 	asm volatile("mrc p14, 0, %0, c5, c1, 0" : "=r" (val));
430 	return val;
431 }
432 
433 static inline void
xscale2pmu_write_overflow_flags(u32 val)434 xscale2pmu_write_overflow_flags(u32 val)
435 {
436 	asm volatile("mcr p14, 0, %0, c5, c1, 0" : : "r" (val));
437 }
438 
439 static inline u32
xscale2pmu_read_event_select(void)440 xscale2pmu_read_event_select(void)
441 {
442 	u32 val;
443 	asm volatile("mrc p14, 0, %0, c8, c1, 0" : "=r" (val));
444 	return val;
445 }
446 
447 static inline void
xscale2pmu_write_event_select(u32 val)448 xscale2pmu_write_event_select(u32 val)
449 {
450 	asm volatile("mcr p14, 0, %0, c8, c1, 0" : : "r"(val));
451 }
452 
453 static inline u32
xscale2pmu_read_int_enable(void)454 xscale2pmu_read_int_enable(void)
455 {
456 	u32 val;
457 	asm volatile("mrc p14, 0, %0, c4, c1, 0" : "=r" (val));
458 	return val;
459 }
460 
461 static void
xscale2pmu_write_int_enable(u32 val)462 xscale2pmu_write_int_enable(u32 val)
463 {
464 	asm volatile("mcr p14, 0, %0, c4, c1, 0" : : "r" (val));
465 }
466 
467 static inline int
xscale2_pmnc_counter_has_overflowed(unsigned long of_flags,enum xscale_counters counter)468 xscale2_pmnc_counter_has_overflowed(unsigned long of_flags,
469 					enum xscale_counters counter)
470 {
471 	int ret = 0;
472 
473 	switch (counter) {
474 	case XSCALE_CYCLE_COUNTER:
475 		ret = of_flags & XSCALE2_CCOUNT_OVERFLOW;
476 		break;
477 	case XSCALE_COUNTER0:
478 		ret = of_flags & XSCALE2_COUNT0_OVERFLOW;
479 		break;
480 	case XSCALE_COUNTER1:
481 		ret = of_flags & XSCALE2_COUNT1_OVERFLOW;
482 		break;
483 	case XSCALE_COUNTER2:
484 		ret = of_flags & XSCALE2_COUNT2_OVERFLOW;
485 		break;
486 	case XSCALE_COUNTER3:
487 		ret = of_flags & XSCALE2_COUNT3_OVERFLOW;
488 		break;
489 	default:
490 		WARN_ONCE(1, "invalid counter number (%d)\n", counter);
491 	}
492 
493 	return ret;
494 }
495 
496 static irqreturn_t
xscale2pmu_handle_irq(struct arm_pmu * cpu_pmu)497 xscale2pmu_handle_irq(struct arm_pmu *cpu_pmu)
498 {
499 	unsigned long pmnc, of_flags;
500 	struct perf_sample_data data;
501 	struct pmu_hw_events *cpuc = this_cpu_ptr(cpu_pmu->hw_events);
502 	struct pt_regs *regs;
503 	int idx;
504 
505 	/* Disable the PMU. */
506 	pmnc = xscale2pmu_read_pmnc();
507 	xscale2pmu_write_pmnc(pmnc & ~XSCALE_PMU_ENABLE);
508 
509 	/* Check the overflow flag register. */
510 	of_flags = xscale2pmu_read_overflow_flags();
511 	if (!(of_flags & XSCALE2_OVERFLOWED_MASK))
512 		return IRQ_NONE;
513 
514 	/* Clear the overflow bits. */
515 	xscale2pmu_write_overflow_flags(of_flags);
516 
517 	regs = get_irq_regs();
518 
519 	for (idx = 0; idx < cpu_pmu->num_events; ++idx) {
520 		struct perf_event *event = cpuc->events[idx];
521 		struct hw_perf_event *hwc;
522 
523 		if (!event)
524 			continue;
525 
526 		if (!xscale2_pmnc_counter_has_overflowed(of_flags, idx))
527 			continue;
528 
529 		hwc = &event->hw;
530 		armpmu_event_update(event);
531 		perf_sample_data_init(&data, 0, hwc->last_period);
532 		if (!armpmu_event_set_period(event))
533 			continue;
534 
535 		if (perf_event_overflow(event, &data, regs))
536 			cpu_pmu->disable(event);
537 	}
538 
539 	irq_work_run();
540 
541 	/*
542 	 * Re-enable the PMU.
543 	 */
544 	pmnc = xscale2pmu_read_pmnc() | XSCALE_PMU_ENABLE;
545 	xscale2pmu_write_pmnc(pmnc);
546 
547 	return IRQ_HANDLED;
548 }
549 
xscale2pmu_enable_event(struct perf_event * event)550 static void xscale2pmu_enable_event(struct perf_event *event)
551 {
552 	unsigned long flags, ien, evtsel;
553 	struct arm_pmu *cpu_pmu = to_arm_pmu(event->pmu);
554 	struct hw_perf_event *hwc = &event->hw;
555 	struct pmu_hw_events *events = this_cpu_ptr(cpu_pmu->hw_events);
556 	int idx = hwc->idx;
557 
558 	ien = xscale2pmu_read_int_enable();
559 	evtsel = xscale2pmu_read_event_select();
560 
561 	switch (idx) {
562 	case XSCALE_CYCLE_COUNTER:
563 		ien |= XSCALE2_CCOUNT_INT_EN;
564 		break;
565 	case XSCALE_COUNTER0:
566 		ien |= XSCALE2_COUNT0_INT_EN;
567 		evtsel &= ~XSCALE2_COUNT0_EVT_MASK;
568 		evtsel |= hwc->config_base << XSCALE2_COUNT0_EVT_SHFT;
569 		break;
570 	case XSCALE_COUNTER1:
571 		ien |= XSCALE2_COUNT1_INT_EN;
572 		evtsel &= ~XSCALE2_COUNT1_EVT_MASK;
573 		evtsel |= hwc->config_base << XSCALE2_COUNT1_EVT_SHFT;
574 		break;
575 	case XSCALE_COUNTER2:
576 		ien |= XSCALE2_COUNT2_INT_EN;
577 		evtsel &= ~XSCALE2_COUNT2_EVT_MASK;
578 		evtsel |= hwc->config_base << XSCALE2_COUNT2_EVT_SHFT;
579 		break;
580 	case XSCALE_COUNTER3:
581 		ien |= XSCALE2_COUNT3_INT_EN;
582 		evtsel &= ~XSCALE2_COUNT3_EVT_MASK;
583 		evtsel |= hwc->config_base << XSCALE2_COUNT3_EVT_SHFT;
584 		break;
585 	default:
586 		WARN_ONCE(1, "invalid counter number (%d)\n", idx);
587 		return;
588 	}
589 
590 	raw_spin_lock_irqsave(&events->pmu_lock, flags);
591 	xscale2pmu_write_event_select(evtsel);
592 	xscale2pmu_write_int_enable(ien);
593 	raw_spin_unlock_irqrestore(&events->pmu_lock, flags);
594 }
595 
xscale2pmu_disable_event(struct perf_event * event)596 static void xscale2pmu_disable_event(struct perf_event *event)
597 {
598 	unsigned long flags, ien, evtsel, of_flags;
599 	struct arm_pmu *cpu_pmu = to_arm_pmu(event->pmu);
600 	struct hw_perf_event *hwc = &event->hw;
601 	struct pmu_hw_events *events = this_cpu_ptr(cpu_pmu->hw_events);
602 	int idx = hwc->idx;
603 
604 	ien = xscale2pmu_read_int_enable();
605 	evtsel = xscale2pmu_read_event_select();
606 
607 	switch (idx) {
608 	case XSCALE_CYCLE_COUNTER:
609 		ien &= ~XSCALE2_CCOUNT_INT_EN;
610 		of_flags = XSCALE2_CCOUNT_OVERFLOW;
611 		break;
612 	case XSCALE_COUNTER0:
613 		ien &= ~XSCALE2_COUNT0_INT_EN;
614 		evtsel &= ~XSCALE2_COUNT0_EVT_MASK;
615 		evtsel |= XSCALE_PERFCTR_UNUSED << XSCALE2_COUNT0_EVT_SHFT;
616 		of_flags = XSCALE2_COUNT0_OVERFLOW;
617 		break;
618 	case XSCALE_COUNTER1:
619 		ien &= ~XSCALE2_COUNT1_INT_EN;
620 		evtsel &= ~XSCALE2_COUNT1_EVT_MASK;
621 		evtsel |= XSCALE_PERFCTR_UNUSED << XSCALE2_COUNT1_EVT_SHFT;
622 		of_flags = XSCALE2_COUNT1_OVERFLOW;
623 		break;
624 	case XSCALE_COUNTER2:
625 		ien &= ~XSCALE2_COUNT2_INT_EN;
626 		evtsel &= ~XSCALE2_COUNT2_EVT_MASK;
627 		evtsel |= XSCALE_PERFCTR_UNUSED << XSCALE2_COUNT2_EVT_SHFT;
628 		of_flags = XSCALE2_COUNT2_OVERFLOW;
629 		break;
630 	case XSCALE_COUNTER3:
631 		ien &= ~XSCALE2_COUNT3_INT_EN;
632 		evtsel &= ~XSCALE2_COUNT3_EVT_MASK;
633 		evtsel |= XSCALE_PERFCTR_UNUSED << XSCALE2_COUNT3_EVT_SHFT;
634 		of_flags = XSCALE2_COUNT3_OVERFLOW;
635 		break;
636 	default:
637 		WARN_ONCE(1, "invalid counter number (%d)\n", idx);
638 		return;
639 	}
640 
641 	raw_spin_lock_irqsave(&events->pmu_lock, flags);
642 	xscale2pmu_write_event_select(evtsel);
643 	xscale2pmu_write_int_enable(ien);
644 	xscale2pmu_write_overflow_flags(of_flags);
645 	raw_spin_unlock_irqrestore(&events->pmu_lock, flags);
646 }
647 
648 static int
xscale2pmu_get_event_idx(struct pmu_hw_events * cpuc,struct perf_event * event)649 xscale2pmu_get_event_idx(struct pmu_hw_events *cpuc,
650 				struct perf_event *event)
651 {
652 	int idx = xscale1pmu_get_event_idx(cpuc, event);
653 	if (idx >= 0)
654 		goto out;
655 
656 	if (!test_and_set_bit(XSCALE_COUNTER3, cpuc->used_mask))
657 		idx = XSCALE_COUNTER3;
658 	else if (!test_and_set_bit(XSCALE_COUNTER2, cpuc->used_mask))
659 		idx = XSCALE_COUNTER2;
660 out:
661 	return idx;
662 }
663 
xscale2pmu_start(struct arm_pmu * cpu_pmu)664 static void xscale2pmu_start(struct arm_pmu *cpu_pmu)
665 {
666 	unsigned long flags, val;
667 	struct pmu_hw_events *events = this_cpu_ptr(cpu_pmu->hw_events);
668 
669 	raw_spin_lock_irqsave(&events->pmu_lock, flags);
670 	val = xscale2pmu_read_pmnc() & ~XSCALE_PMU_CNT64;
671 	val |= XSCALE_PMU_ENABLE;
672 	xscale2pmu_write_pmnc(val);
673 	raw_spin_unlock_irqrestore(&events->pmu_lock, flags);
674 }
675 
xscale2pmu_stop(struct arm_pmu * cpu_pmu)676 static void xscale2pmu_stop(struct arm_pmu *cpu_pmu)
677 {
678 	unsigned long flags, val;
679 	struct pmu_hw_events *events = this_cpu_ptr(cpu_pmu->hw_events);
680 
681 	raw_spin_lock_irqsave(&events->pmu_lock, flags);
682 	val = xscale2pmu_read_pmnc();
683 	val &= ~XSCALE_PMU_ENABLE;
684 	xscale2pmu_write_pmnc(val);
685 	raw_spin_unlock_irqrestore(&events->pmu_lock, flags);
686 }
687 
xscale2pmu_read_counter(struct perf_event * event)688 static inline u64 xscale2pmu_read_counter(struct perf_event *event)
689 {
690 	struct hw_perf_event *hwc = &event->hw;
691 	int counter = hwc->idx;
692 	u32 val = 0;
693 
694 	switch (counter) {
695 	case XSCALE_CYCLE_COUNTER:
696 		asm volatile("mrc p14, 0, %0, c1, c1, 0" : "=r" (val));
697 		break;
698 	case XSCALE_COUNTER0:
699 		asm volatile("mrc p14, 0, %0, c0, c2, 0" : "=r" (val));
700 		break;
701 	case XSCALE_COUNTER1:
702 		asm volatile("mrc p14, 0, %0, c1, c2, 0" : "=r" (val));
703 		break;
704 	case XSCALE_COUNTER2:
705 		asm volatile("mrc p14, 0, %0, c2, c2, 0" : "=r" (val));
706 		break;
707 	case XSCALE_COUNTER3:
708 		asm volatile("mrc p14, 0, %0, c3, c2, 0" : "=r" (val));
709 		break;
710 	}
711 
712 	return val;
713 }
714 
xscale2pmu_write_counter(struct perf_event * event,u64 val)715 static inline void xscale2pmu_write_counter(struct perf_event *event, u64 val)
716 {
717 	struct hw_perf_event *hwc = &event->hw;
718 	int counter = hwc->idx;
719 
720 	switch (counter) {
721 	case XSCALE_CYCLE_COUNTER:
722 		asm volatile("mcr p14, 0, %0, c1, c1, 0" : : "r" (val));
723 		break;
724 	case XSCALE_COUNTER0:
725 		asm volatile("mcr p14, 0, %0, c0, c2, 0" : : "r" (val));
726 		break;
727 	case XSCALE_COUNTER1:
728 		asm volatile("mcr p14, 0, %0, c1, c2, 0" : : "r" (val));
729 		break;
730 	case XSCALE_COUNTER2:
731 		asm volatile("mcr p14, 0, %0, c2, c2, 0" : : "r" (val));
732 		break;
733 	case XSCALE_COUNTER3:
734 		asm volatile("mcr p14, 0, %0, c3, c2, 0" : : "r" (val));
735 		break;
736 	}
737 }
738 
xscale2pmu_init(struct arm_pmu * cpu_pmu)739 static int xscale2pmu_init(struct arm_pmu *cpu_pmu)
740 {
741 	cpu_pmu->name		= "armv5_xscale2";
742 	cpu_pmu->handle_irq	= xscale2pmu_handle_irq;
743 	cpu_pmu->enable		= xscale2pmu_enable_event;
744 	cpu_pmu->disable	= xscale2pmu_disable_event;
745 	cpu_pmu->read_counter	= xscale2pmu_read_counter;
746 	cpu_pmu->write_counter	= xscale2pmu_write_counter;
747 	cpu_pmu->get_event_idx	= xscale2pmu_get_event_idx;
748 	cpu_pmu->clear_event_idx = xscalepmu_clear_event_idx;
749 	cpu_pmu->start		= xscale2pmu_start;
750 	cpu_pmu->stop		= xscale2pmu_stop;
751 	cpu_pmu->map_event	= xscale_map_event;
752 	cpu_pmu->num_events	= 5;
753 
754 	return 0;
755 }
756 
757 static const struct pmu_probe_info xscale_pmu_probe_table[] = {
758 	XSCALE_PMU_PROBE(ARM_CPU_XSCALE_ARCH_V1, xscale1pmu_init),
759 	XSCALE_PMU_PROBE(ARM_CPU_XSCALE_ARCH_V2, xscale2pmu_init),
760 	{ /* sentinel value */ }
761 };
762 
xscale_pmu_device_probe(struct platform_device * pdev)763 static int xscale_pmu_device_probe(struct platform_device *pdev)
764 {
765 	return arm_pmu_device_probe(pdev, NULL, xscale_pmu_probe_table);
766 }
767 
768 static struct platform_driver xscale_pmu_driver = {
769 	.driver		= {
770 		.name	= "xscale-pmu",
771 	},
772 	.probe		= xscale_pmu_device_probe,
773 };
774 
775 builtin_platform_driver(xscale_pmu_driver);
776 #endif	/* CONFIG_CPU_XSCALE */
777