1 #if defined(CONFIG_CPU_MIPS32) || defined(CONFIG_CPU_MIPS64) || \
2 defined(CONFIG_CPU_R10000) || defined(CONFIG_CPU_SB1)
4 #define M_CONFIG1_PC (1 << 4)
6 #define M_PERFCTL_EXL (1UL << 0)
7 #define M_PERFCTL_KERNEL (1UL << 1)
8 #define M_PERFCTL_SUPERVISOR (1UL << 2)
9 #define M_PERFCTL_USER (1UL << 3)
10 #define M_PERFCTL_INTERRUPT_ENABLE (1UL << 4)
11 #define M_PERFCTL_EVENT(event) (((event) & 0x3ff) << 5)
12 #define M_PERFCTL_VPEID(vpe) ((vpe) << 16)
13 #define M_PERFCTL_MT_EN(filter) ((filter) << 20)
14 #define M_TC_EN_ALL M_PERFCTL_MT_EN(0)
15 #define M_TC_EN_VPE M_PERFCTL_MT_EN(1)
16 #define M_TC_EN_TC M_PERFCTL_MT_EN(2)
17 #define M_PERFCTL_TCID(tcid) ((tcid) << 22)
18 #define M_PERFCTL_WIDE (1UL << 30)
19 #define M_PERFCTL_MORE (1UL << 31)
21 #define M_PERFCTL_COUNT_EVENT_WHENEVER (M_PERFCTL_EXL | \
24 M_PERFCTL_SUPERVISOR | \
25 M_PERFCTL_INTERRUPT_ENABLE)
27 #ifdef CONFIG_MIPS_MT_SMP
28 #define M_PERFCTL_CONFIG_MASK 0x3fff801f
30 #define M_PERFCTL_CONFIG_MASK 0x1f
32 #define M_PERFCTL_EVENT_MASK 0xfe0
34 #define M_COUNTER_OVERFLOW (1UL << 31)
36 #ifdef CONFIG_MIPS_MT_SMP
37 static int cpu_has_mipsmt_pertccounters
;
40 * FIXME: For VSMP, vpe_id() is redefined for Perf-events, because
41 * cpu_data[cpuid].vpe_id reports 0 for _both_ CPUs.
43 #if defined(CONFIG_HW_PERF_EVENTS)
44 #define vpe_id() (cpu_has_mipsmt_pertccounters ? \
45 0 : smp_processor_id())
47 #define vpe_id() (cpu_has_mipsmt_pertccounters ? \
48 0 : cpu_data[smp_processor_id()].vpe_id)
51 /* Copied from op_model_mipsxx.c */
52 static inline unsigned int vpe_shift(void)
54 if (num_possible_cpus() > 1)
59 #else /* !CONFIG_MIPS_MT_SMP */
62 static inline unsigned int vpe_shift(void)
66 #endif /* CONFIG_MIPS_MT_SMP */
68 static inline unsigned int
69 counters_total_to_per_cpu(unsigned int counters
)
71 return counters
>> vpe_shift();
74 static inline unsigned int
75 counters_per_cpu_to_total(unsigned int counters
)
77 return counters
<< vpe_shift();
80 #define __define_perf_accessors(r, n, np) \
82 static inline unsigned int r_c0_ ## r ## n(void) \
84 unsigned int cpu = vpe_id(); \
88 return read_c0_ ## r ## n(); \
90 return read_c0_ ## r ## np(); \
97 static inline void w_c0_ ## r ## n(unsigned int value) \
99 unsigned int cpu = vpe_id(); \
103 write_c0_ ## r ## n(value); \
106 write_c0_ ## r ## np(value); \
114 __define_perf_accessors(perfcntr, 0, 2)
115 __define_perf_accessors(perfcntr
, 1, 3)
116 __define_perf_accessors(perfcntr
, 2, 0)
117 __define_perf_accessors(perfcntr
, 3, 1)
119 __define_perf_accessors(perfctrl
, 0, 2)
120 __define_perf_accessors(perfctrl
, 1, 3)
121 __define_perf_accessors(perfctrl
, 2, 0)
122 __define_perf_accessors(perfctrl
, 3, 1)
124 static inline int __n_counters(void)
126 if (!(read_c0_config1() & M_CONFIG1_PC
))
128 if (!(read_c0_perfctrl0() & M_PERFCTL_MORE
))
130 if (!(read_c0_perfctrl1() & M_PERFCTL_MORE
))
132 if (!(read_c0_perfctrl2() & M_PERFCTL_MORE
))
138 static inline int n_counters(void)
142 switch (current_cpu_type()) {
153 counters
= __n_counters();
159 static void reset_counters(void *arg
)
161 int counters
= (int)(long)arg
;
179 mipsxx_pmu_read_counter(unsigned int idx
)
183 return r_c0_perfcntr0();
185 return r_c0_perfcntr1();
187 return r_c0_perfcntr2();
189 return r_c0_perfcntr3();
191 WARN_ONCE(1, "Invalid performance counter number (%d)\n", idx
);
197 mipsxx_pmu_write_counter(unsigned int idx
, u64 val
)
215 static inline unsigned int
216 mipsxx_pmu_read_control(unsigned int idx
)
220 return r_c0_perfctrl0();
222 return r_c0_perfctrl1();
224 return r_c0_perfctrl2();
226 return r_c0_perfctrl3();
228 WARN_ONCE(1, "Invalid performance counter number (%d)\n", idx
);
234 mipsxx_pmu_write_control(unsigned int idx
, unsigned int val
)
252 #ifdef CONFIG_MIPS_MT_SMP
253 static DEFINE_RWLOCK(pmuint_rwlock
);
256 /* 24K/34K/1004K cores can share the same event map. */
257 static const struct mips_perf_event mipsxxcore_event_map
258 [PERF_COUNT_HW_MAX
] = {
259 [PERF_COUNT_HW_CPU_CYCLES
] = { 0x00, CNTR_EVEN
| CNTR_ODD
, P
},
260 [PERF_COUNT_HW_INSTRUCTIONS
] = { 0x01, CNTR_EVEN
| CNTR_ODD
, T
},
261 [PERF_COUNT_HW_CACHE_REFERENCES
] = { UNSUPPORTED_PERF_EVENT_ID
},
262 [PERF_COUNT_HW_CACHE_MISSES
] = { UNSUPPORTED_PERF_EVENT_ID
},
263 [PERF_COUNT_HW_BRANCH_INSTRUCTIONS
] = { 0x02, CNTR_EVEN
, T
},
264 [PERF_COUNT_HW_BRANCH_MISSES
] = { 0x02, CNTR_ODD
, T
},
265 [PERF_COUNT_HW_BUS_CYCLES
] = { UNSUPPORTED_PERF_EVENT_ID
},
268 /* 74K core has different branch event code. */
269 static const struct mips_perf_event mipsxx74Kcore_event_map
270 [PERF_COUNT_HW_MAX
] = {
271 [PERF_COUNT_HW_CPU_CYCLES
] = { 0x00, CNTR_EVEN
| CNTR_ODD
, P
},
272 [PERF_COUNT_HW_INSTRUCTIONS
] = { 0x01, CNTR_EVEN
| CNTR_ODD
, T
},
273 [PERF_COUNT_HW_CACHE_REFERENCES
] = { UNSUPPORTED_PERF_EVENT_ID
},
274 [PERF_COUNT_HW_CACHE_MISSES
] = { UNSUPPORTED_PERF_EVENT_ID
},
275 [PERF_COUNT_HW_BRANCH_INSTRUCTIONS
] = { 0x27, CNTR_EVEN
, T
},
276 [PERF_COUNT_HW_BRANCH_MISSES
] = { 0x27, CNTR_ODD
, T
},
277 [PERF_COUNT_HW_BUS_CYCLES
] = { UNSUPPORTED_PERF_EVENT_ID
},
280 /* 24K/34K/1004K cores can share the same cache event map. */
281 static const struct mips_perf_event mipsxxcore_cache_map
282 [PERF_COUNT_HW_CACHE_MAX
]
283 [PERF_COUNT_HW_CACHE_OP_MAX
]
284 [PERF_COUNT_HW_CACHE_RESULT_MAX
] = {
287 * Like some other architectures (e.g. ARM), the performance
288 * counters don't differentiate between read and write
289 * accesses/misses, so this isn't strictly correct, but it's the
290 * best we can do. Writes and reads get combined.
293 [C(RESULT_ACCESS
)] = { 0x0a, CNTR_EVEN
, T
},
294 [C(RESULT_MISS
)] = { 0x0b, CNTR_EVEN
| CNTR_ODD
, T
},
297 [C(RESULT_ACCESS
)] = { 0x0a, CNTR_EVEN
, T
},
298 [C(RESULT_MISS
)] = { 0x0b, CNTR_EVEN
| CNTR_ODD
, T
},
301 [C(RESULT_ACCESS
)] = { UNSUPPORTED_PERF_EVENT_ID
},
302 [C(RESULT_MISS
)] = { UNSUPPORTED_PERF_EVENT_ID
},
307 [C(RESULT_ACCESS
)] = { 0x09, CNTR_EVEN
, T
},
308 [C(RESULT_MISS
)] = { 0x09, CNTR_ODD
, T
},
311 [C(RESULT_ACCESS
)] = { 0x09, CNTR_EVEN
, T
},
312 [C(RESULT_MISS
)] = { 0x09, CNTR_ODD
, T
},
315 [C(RESULT_ACCESS
)] = { 0x14, CNTR_EVEN
, T
},
317 * Note that MIPS has only "hit" events countable for
318 * the prefetch operation.
320 [C(RESULT_MISS
)] = { UNSUPPORTED_PERF_EVENT_ID
},
325 [C(RESULT_ACCESS
)] = { 0x15, CNTR_ODD
, P
},
326 [C(RESULT_MISS
)] = { 0x16, CNTR_EVEN
, P
},
329 [C(RESULT_ACCESS
)] = { 0x15, CNTR_ODD
, P
},
330 [C(RESULT_MISS
)] = { 0x16, CNTR_EVEN
, P
},
333 [C(RESULT_ACCESS
)] = { UNSUPPORTED_PERF_EVENT_ID
},
334 [C(RESULT_MISS
)] = { UNSUPPORTED_PERF_EVENT_ID
},
339 [C(RESULT_ACCESS
)] = { 0x06, CNTR_EVEN
, T
},
340 [C(RESULT_MISS
)] = { 0x06, CNTR_ODD
, T
},
343 [C(RESULT_ACCESS
)] = { 0x06, CNTR_EVEN
, T
},
344 [C(RESULT_MISS
)] = { 0x06, CNTR_ODD
, T
},
347 [C(RESULT_ACCESS
)] = { UNSUPPORTED_PERF_EVENT_ID
},
348 [C(RESULT_MISS
)] = { UNSUPPORTED_PERF_EVENT_ID
},
353 [C(RESULT_ACCESS
)] = { 0x05, CNTR_EVEN
, T
},
354 [C(RESULT_MISS
)] = { 0x05, CNTR_ODD
, T
},
357 [C(RESULT_ACCESS
)] = { 0x05, CNTR_EVEN
, T
},
358 [C(RESULT_MISS
)] = { 0x05, CNTR_ODD
, T
},
361 [C(RESULT_ACCESS
)] = { UNSUPPORTED_PERF_EVENT_ID
},
362 [C(RESULT_MISS
)] = { UNSUPPORTED_PERF_EVENT_ID
},
366 /* Using the same code for *HW_BRANCH* */
368 [C(RESULT_ACCESS
)] = { 0x02, CNTR_EVEN
, T
},
369 [C(RESULT_MISS
)] = { 0x02, CNTR_ODD
, T
},
372 [C(RESULT_ACCESS
)] = { 0x02, CNTR_EVEN
, T
},
373 [C(RESULT_MISS
)] = { 0x02, CNTR_ODD
, T
},
376 [C(RESULT_ACCESS
)] = { UNSUPPORTED_PERF_EVENT_ID
},
377 [C(RESULT_MISS
)] = { UNSUPPORTED_PERF_EVENT_ID
},
382 [C(RESULT_ACCESS
)] = { UNSUPPORTED_PERF_EVENT_ID
},
383 [C(RESULT_MISS
)] = { UNSUPPORTED_PERF_EVENT_ID
},
386 [C(RESULT_ACCESS
)] = { UNSUPPORTED_PERF_EVENT_ID
},
387 [C(RESULT_MISS
)] = { UNSUPPORTED_PERF_EVENT_ID
},
390 [C(RESULT_ACCESS
)] = { UNSUPPORTED_PERF_EVENT_ID
},
391 [C(RESULT_MISS
)] = { UNSUPPORTED_PERF_EVENT_ID
},
396 /* 74K core has completely different cache event map. */
397 static const struct mips_perf_event mipsxx74Kcore_cache_map
398 [PERF_COUNT_HW_CACHE_MAX
]
399 [PERF_COUNT_HW_CACHE_OP_MAX
]
400 [PERF_COUNT_HW_CACHE_RESULT_MAX
] = {
403 * Like some other architectures (e.g. ARM), the performance
404 * counters don't differentiate between read and write
405 * accesses/misses, so this isn't strictly correct, but it's the
406 * best we can do. Writes and reads get combined.
409 [C(RESULT_ACCESS
)] = { 0x17, CNTR_ODD
, T
},
410 [C(RESULT_MISS
)] = { 0x18, CNTR_ODD
, T
},
413 [C(RESULT_ACCESS
)] = { 0x17, CNTR_ODD
, T
},
414 [C(RESULT_MISS
)] = { 0x18, CNTR_ODD
, T
},
417 [C(RESULT_ACCESS
)] = { UNSUPPORTED_PERF_EVENT_ID
},
418 [C(RESULT_MISS
)] = { UNSUPPORTED_PERF_EVENT_ID
},
423 [C(RESULT_ACCESS
)] = { 0x06, CNTR_EVEN
, T
},
424 [C(RESULT_MISS
)] = { 0x06, CNTR_ODD
, T
},
427 [C(RESULT_ACCESS
)] = { 0x06, CNTR_EVEN
, T
},
428 [C(RESULT_MISS
)] = { 0x06, CNTR_ODD
, T
},
431 [C(RESULT_ACCESS
)] = { 0x34, CNTR_EVEN
, T
},
433 * Note that MIPS has only "hit" events countable for
434 * the prefetch operation.
436 [C(RESULT_MISS
)] = { UNSUPPORTED_PERF_EVENT_ID
},
441 [C(RESULT_ACCESS
)] = { 0x1c, CNTR_ODD
, P
},
442 [C(RESULT_MISS
)] = { 0x1d, CNTR_EVEN
| CNTR_ODD
, P
},
445 [C(RESULT_ACCESS
)] = { 0x1c, CNTR_ODD
, P
},
446 [C(RESULT_MISS
)] = { 0x1d, CNTR_EVEN
| CNTR_ODD
, P
},
449 [C(RESULT_ACCESS
)] = { UNSUPPORTED_PERF_EVENT_ID
},
450 [C(RESULT_MISS
)] = { UNSUPPORTED_PERF_EVENT_ID
},
454 /* 74K core does not have specific DTLB events. */
456 [C(RESULT_ACCESS
)] = { UNSUPPORTED_PERF_EVENT_ID
},
457 [C(RESULT_MISS
)] = { UNSUPPORTED_PERF_EVENT_ID
},
460 [C(RESULT_ACCESS
)] = { UNSUPPORTED_PERF_EVENT_ID
},
461 [C(RESULT_MISS
)] = { UNSUPPORTED_PERF_EVENT_ID
},
464 [C(RESULT_ACCESS
)] = { UNSUPPORTED_PERF_EVENT_ID
},
465 [C(RESULT_MISS
)] = { UNSUPPORTED_PERF_EVENT_ID
},
470 [C(RESULT_ACCESS
)] = { 0x04, CNTR_EVEN
, T
},
471 [C(RESULT_MISS
)] = { 0x04, CNTR_ODD
, T
},
474 [C(RESULT_ACCESS
)] = { 0x04, CNTR_EVEN
, T
},
475 [C(RESULT_MISS
)] = { 0x04, CNTR_ODD
, T
},
478 [C(RESULT_ACCESS
)] = { UNSUPPORTED_PERF_EVENT_ID
},
479 [C(RESULT_MISS
)] = { UNSUPPORTED_PERF_EVENT_ID
},
483 /* Using the same code for *HW_BRANCH* */
485 [C(RESULT_ACCESS
)] = { 0x27, CNTR_EVEN
, T
},
486 [C(RESULT_MISS
)] = { 0x27, CNTR_ODD
, T
},
489 [C(RESULT_ACCESS
)] = { 0x27, CNTR_EVEN
, T
},
490 [C(RESULT_MISS
)] = { 0x27, CNTR_ODD
, T
},
493 [C(RESULT_ACCESS
)] = { UNSUPPORTED_PERF_EVENT_ID
},
494 [C(RESULT_MISS
)] = { UNSUPPORTED_PERF_EVENT_ID
},
499 [C(RESULT_ACCESS
)] = { UNSUPPORTED_PERF_EVENT_ID
},
500 [C(RESULT_MISS
)] = { UNSUPPORTED_PERF_EVENT_ID
},
503 [C(RESULT_ACCESS
)] = { UNSUPPORTED_PERF_EVENT_ID
},
504 [C(RESULT_MISS
)] = { UNSUPPORTED_PERF_EVENT_ID
},
507 [C(RESULT_ACCESS
)] = { UNSUPPORTED_PERF_EVENT_ID
},
508 [C(RESULT_MISS
)] = { UNSUPPORTED_PERF_EVENT_ID
},
513 #ifdef CONFIG_MIPS_MT_SMP
515 check_and_calc_range(struct perf_event
*event
,
516 const struct mips_perf_event
*pev
)
518 struct hw_perf_event
*hwc
= &event
->hw
;
520 if (event
->cpu
>= 0) {
521 if (pev
->range
> V
) {
523 * The user selected an event that is processor
524 * wide, while expecting it to be VPE wide.
526 hwc
->config_base
|= M_TC_EN_ALL
;
529 * FIXME: cpu_data[event->cpu].vpe_id reports 0
532 hwc
->config_base
|= M_PERFCTL_VPEID(event
->cpu
);
533 hwc
->config_base
|= M_TC_EN_VPE
;
536 hwc
->config_base
|= M_TC_EN_ALL
;
540 check_and_calc_range(struct perf_event
*event
,
541 const struct mips_perf_event
*pev
)
546 static int __hw_perf_event_init(struct perf_event
*event
)
548 struct perf_event_attr
*attr
= &event
->attr
;
549 struct hw_perf_event
*hwc
= &event
->hw
;
550 const struct mips_perf_event
*pev
;
553 /* Returning MIPS event descriptor for generic perf event. */
554 if (PERF_TYPE_HARDWARE
== event
->attr
.type
) {
555 if (event
->attr
.config
>= PERF_COUNT_HW_MAX
)
557 pev
= mipspmu_map_general_event(event
->attr
.config
);
558 } else if (PERF_TYPE_HW_CACHE
== event
->attr
.type
) {
559 pev
= mipspmu_map_cache_event(event
->attr
.config
);
560 } else if (PERF_TYPE_RAW
== event
->attr
.type
) {
561 /* We are working on the global raw event. */
562 mutex_lock(&raw_event_mutex
);
563 pev
= mipspmu
->map_raw_event(event
->attr
.config
);
565 /* The event type is not (yet) supported. */
570 if (PERF_TYPE_RAW
== event
->attr
.type
)
571 mutex_unlock(&raw_event_mutex
);
576 * We allow max flexibility on how each individual counter shared
577 * by the single CPU operates (the mode exclusion and the range).
579 hwc
->config_base
= M_PERFCTL_INTERRUPT_ENABLE
;
581 /* Calculate range bits and validate it. */
582 if (num_possible_cpus() > 1)
583 check_and_calc_range(event
, pev
);
585 hwc
->event_base
= mipspmu_perf_event_encode(pev
);
586 if (PERF_TYPE_RAW
== event
->attr
.type
)
587 mutex_unlock(&raw_event_mutex
);
589 if (!attr
->exclude_user
)
590 hwc
->config_base
|= M_PERFCTL_USER
;
591 if (!attr
->exclude_kernel
) {
592 hwc
->config_base
|= M_PERFCTL_KERNEL
;
593 /* MIPS kernel mode: KSU == 00b || EXL == 1 || ERL == 1 */
594 hwc
->config_base
|= M_PERFCTL_EXL
;
596 if (!attr
->exclude_hv
)
597 hwc
->config_base
|= M_PERFCTL_SUPERVISOR
;
599 hwc
->config_base
&= M_PERFCTL_CONFIG_MASK
;
601 * The event can belong to another cpu. We do not assign a local
602 * counter for it for now.
607 if (!hwc
->sample_period
) {
608 hwc
->sample_period
= MAX_PERIOD
;
609 hwc
->last_period
= hwc
->sample_period
;
610 local64_set(&hwc
->period_left
, hwc
->sample_period
);
614 if (event
->group_leader
!= event
) {
615 err
= validate_group(event
);
620 event
->destroy
= hw_perf_event_destroy
;
625 static void pause_local_counters(void)
627 struct cpu_hw_events
*cpuc
= &__get_cpu_var(cpu_hw_events
);
628 int counters
= mipspmu
->num_counters
;
631 local_irq_save(flags
);
634 cpuc
->saved_ctrl
[3] = r_c0_perfctrl3();
635 w_c0_perfctrl3(cpuc
->saved_ctrl
[3] &
636 ~M_PERFCTL_COUNT_EVENT_WHENEVER
);
638 cpuc
->saved_ctrl
[2] = r_c0_perfctrl2();
639 w_c0_perfctrl2(cpuc
->saved_ctrl
[2] &
640 ~M_PERFCTL_COUNT_EVENT_WHENEVER
);
642 cpuc
->saved_ctrl
[1] = r_c0_perfctrl1();
643 w_c0_perfctrl1(cpuc
->saved_ctrl
[1] &
644 ~M_PERFCTL_COUNT_EVENT_WHENEVER
);
646 cpuc
->saved_ctrl
[0] = r_c0_perfctrl0();
647 w_c0_perfctrl0(cpuc
->saved_ctrl
[0] &
648 ~M_PERFCTL_COUNT_EVENT_WHENEVER
);
650 local_irq_restore(flags
);
653 static void resume_local_counters(void)
655 struct cpu_hw_events
*cpuc
= &__get_cpu_var(cpu_hw_events
);
656 int counters
= mipspmu
->num_counters
;
659 local_irq_save(flags
);
662 w_c0_perfctrl3(cpuc
->saved_ctrl
[3]);
664 w_c0_perfctrl2(cpuc
->saved_ctrl
[2]);
666 w_c0_perfctrl1(cpuc
->saved_ctrl
[1]);
668 w_c0_perfctrl0(cpuc
->saved_ctrl
[0]);
670 local_irq_restore(flags
);
673 static int mipsxx_pmu_handle_shared_irq(void)
675 struct cpu_hw_events
*cpuc
= &__get_cpu_var(cpu_hw_events
);
676 struct perf_sample_data data
;
677 unsigned int counters
= mipspmu
->num_counters
;
678 unsigned int counter
;
679 int handled
= IRQ_NONE
;
680 struct pt_regs
*regs
;
682 if (cpu_has_mips_r2
&& !(read_c0_cause() & (1 << 26)))
686 * First we pause the local counters, so that when we are locked
687 * here, the counters are all paused. When it gets locked due to
688 * perf_disable(), the timer interrupt handler will be delayed.
690 * See also mipsxx_pmu_start().
692 pause_local_counters();
693 #ifdef CONFIG_MIPS_MT_SMP
694 read_lock(&pmuint_rwlock
);
697 regs
= get_irq_regs();
699 perf_sample_data_init(&data
, 0);
702 #define HANDLE_COUNTER(n) \
704 if (test_bit(n, cpuc->used_mask)) { \
705 counter = r_c0_perfcntr ## n(); \
706 if (counter & M_COUNTER_OVERFLOW) { \
707 w_c0_perfcntr ## n(counter & \
709 if (test_and_change_bit(n, cpuc->msbs)) \
710 handle_associated_event(cpuc, \
712 handled = IRQ_HANDLED; \
722 * Do all the work for the pending perf events. We can do this
723 * in here because the performance counter interrupt is a regular
724 * interrupt, not NMI.
726 if (handled
== IRQ_HANDLED
)
729 #ifdef CONFIG_MIPS_MT_SMP
730 read_unlock(&pmuint_rwlock
);
732 resume_local_counters();
737 mipsxx_pmu_handle_irq(int irq
, void *dev
)
739 return mipsxx_pmu_handle_shared_irq();
742 static void mipsxx_pmu_start(void)
744 #ifdef CONFIG_MIPS_MT_SMP
745 write_unlock(&pmuint_rwlock
);
747 resume_local_counters();
751 * MIPS performance counters can be per-TC. The control registers can
752 * not be directly accessed across CPUs. Hence if we want to do global
753 * control, we need cross CPU calls. on_each_cpu() can help us, but we
754 * can not make sure this function is called with interrupts enabled. So
755 * here we pause local counters and then grab a rwlock and leave the
756 * counters on other CPUs alone. If any counter interrupt raises while
757 * we own the write lock, simply pause local counters on that CPU and
758 * spin in the handler. Also we know we won't be switched to another
759 * CPU after pausing local counters and before grabbing the lock.
761 static void mipsxx_pmu_stop(void)
763 pause_local_counters();
764 #ifdef CONFIG_MIPS_MT_SMP
765 write_lock(&pmuint_rwlock
);
770 mipsxx_pmu_alloc_counter(struct cpu_hw_events
*cpuc
,
771 struct hw_perf_event
*hwc
)
776 * We only need to care the counter mask. The range has been
777 * checked definitely.
779 unsigned long cntr_mask
= (hwc
->event_base
>> 8) & 0xffff;
781 for (i
= mipspmu
->num_counters
- 1; i
>= 0; i
--) {
783 * Note that some MIPS perf events can be counted by both
784 * even and odd counters, wheresas many other are only by
785 * even _or_ odd counters. This introduces an issue that
786 * when the former kind of event takes the counter the
787 * latter kind of event wants to use, then the "counter
788 * allocation" for the latter event will fail. In fact if
789 * they can be dynamically swapped, they both feel happy.
790 * But here we leave this issue alone for now.
792 if (test_bit(i
, &cntr_mask
) &&
793 !test_and_set_bit(i
, cpuc
->used_mask
))
801 mipsxx_pmu_enable_event(struct hw_perf_event
*evt
, int idx
)
803 struct cpu_hw_events
*cpuc
= &__get_cpu_var(cpu_hw_events
);
806 WARN_ON(idx
< 0 || idx
>= mipspmu
->num_counters
);
808 local_irq_save(flags
);
809 cpuc
->saved_ctrl
[idx
] = M_PERFCTL_EVENT(evt
->event_base
& 0xff) |
810 (evt
->config_base
& M_PERFCTL_CONFIG_MASK
) |
811 /* Make sure interrupt enabled. */
812 M_PERFCTL_INTERRUPT_ENABLE
;
814 * We do not actually let the counter run. Leave it until start().
816 local_irq_restore(flags
);
820 mipsxx_pmu_disable_event(int idx
)
822 struct cpu_hw_events
*cpuc
= &__get_cpu_var(cpu_hw_events
);
825 WARN_ON(idx
< 0 || idx
>= mipspmu
->num_counters
);
827 local_irq_save(flags
);
828 cpuc
->saved_ctrl
[idx
] = mipsxx_pmu_read_control(idx
) &
829 ~M_PERFCTL_COUNT_EVENT_WHENEVER
;
830 mipsxx_pmu_write_control(idx
, cpuc
->saved_ctrl
[idx
]);
831 local_irq_restore(flags
);
835 #define IS_UNSUPPORTED_24K_EVENT(r, b) \
836 ((b) == 12 || (r) == 151 || (r) == 152 || (b) == 26 || \
837 (b) == 27 || (r) == 28 || (r) == 158 || (b) == 31 || \
838 (b) == 32 || (b) == 34 || (b) == 36 || (r) == 168 || \
839 (r) == 172 || (b) == 47 || ((b) >= 56 && (b) <= 63) || \
840 ((b) >= 68 && (b) <= 127))
841 #define IS_BOTH_COUNTERS_24K_EVENT(b) \
842 ((b) == 0 || (b) == 1 || (b) == 11)
845 #define IS_UNSUPPORTED_34K_EVENT(r, b) \
846 ((b) == 12 || (r) == 27 || (r) == 158 || (b) == 36 || \
847 (b) == 38 || (r) == 175 || ((b) >= 56 && (b) <= 63) || \
848 ((b) >= 68 && (b) <= 127))
849 #define IS_BOTH_COUNTERS_34K_EVENT(b) \
850 ((b) == 0 || (b) == 1 || (b) == 11)
851 #ifdef CONFIG_MIPS_MT_SMP
852 #define IS_RANGE_P_34K_EVENT(r, b) \
853 ((b) == 0 || (r) == 18 || (b) == 21 || (b) == 22 || \
854 (b) == 25 || (b) == 39 || (r) == 44 || (r) == 174 || \
855 (r) == 176 || ((b) >= 50 && (b) <= 55) || \
856 ((b) >= 64 && (b) <= 67))
857 #define IS_RANGE_V_34K_EVENT(r) ((r) == 47)
861 #define IS_UNSUPPORTED_74K_EVENT(r, b) \
862 ((r) == 5 || ((r) >= 135 && (r) <= 137) || \
863 ((b) >= 10 && (b) <= 12) || (b) == 22 || (b) == 27 || \
864 (b) == 33 || (b) == 34 || ((b) >= 47 && (b) <= 49) || \
865 (r) == 178 || (b) == 55 || (b) == 57 || (b) == 60 || \
866 (b) == 61 || (r) == 62 || (r) == 191 || \
867 ((b) >= 64 && (b) <= 127))
868 #define IS_BOTH_COUNTERS_74K_EVENT(b) \
869 ((b) == 0 || (b) == 1)
872 #define IS_UNSUPPORTED_1004K_EVENT(r, b) \
873 ((b) == 12 || (r) == 27 || (r) == 158 || (b) == 38 || \
874 (r) == 175 || (b) == 63 || ((b) >= 68 && (b) <= 127))
875 #define IS_BOTH_COUNTERS_1004K_EVENT(b) \
876 ((b) == 0 || (b) == 1 || (b) == 11)
877 #ifdef CONFIG_MIPS_MT_SMP
878 #define IS_RANGE_P_1004K_EVENT(r, b) \
879 ((b) == 0 || (r) == 18 || (b) == 21 || (b) == 22 || \
880 (b) == 25 || (b) == 36 || (b) == 39 || (r) == 44 || \
881 (r) == 174 || (r) == 176 || ((b) >= 50 && (b) <= 59) || \
882 (r) == 188 || (b) == 61 || (b) == 62 || \
883 ((b) >= 64 && (b) <= 67))
884 #define IS_RANGE_V_1004K_EVENT(r) ((r) == 47)
888 * User can use 0-255 raw events, where 0-127 for the events of even
889 * counters, and 128-255 for odd counters. Note that bit 7 is used to
890 * indicate the parity. So, for example, when user wants to take the
891 * Event Num of 15 for odd counters (by referring to the user manual),
892 * then 128 needs to be added to 15 as the input for the event config,
893 * i.e., 143 (0x8F) to be used.
895 static const struct mips_perf_event
*
896 mipsxx_pmu_map_raw_event(u64 config
)
898 unsigned int raw_id
= config
& 0xff;
899 unsigned int base_id
= raw_id
& 0x7f;
901 switch (current_cpu_type()) {
903 if (IS_UNSUPPORTED_24K_EVENT(raw_id
, base_id
))
904 return ERR_PTR(-EOPNOTSUPP
);
905 raw_event
.event_id
= base_id
;
906 if (IS_BOTH_COUNTERS_24K_EVENT(base_id
))
907 raw_event
.cntr_mask
= CNTR_EVEN
| CNTR_ODD
;
909 raw_event
.cntr_mask
=
910 raw_id
> 127 ? CNTR_ODD
: CNTR_EVEN
;
911 #ifdef CONFIG_MIPS_MT_SMP
913 * This is actually doing nothing. Non-multithreading
914 * CPUs will not check and calculate the range.
920 if (IS_UNSUPPORTED_34K_EVENT(raw_id
, base_id
))
921 return ERR_PTR(-EOPNOTSUPP
);
922 raw_event
.event_id
= base_id
;
923 if (IS_BOTH_COUNTERS_34K_EVENT(base_id
))
924 raw_event
.cntr_mask
= CNTR_EVEN
| CNTR_ODD
;
926 raw_event
.cntr_mask
=
927 raw_id
> 127 ? CNTR_ODD
: CNTR_EVEN
;
928 #ifdef CONFIG_MIPS_MT_SMP
929 if (IS_RANGE_P_34K_EVENT(raw_id
, base_id
))
931 else if (unlikely(IS_RANGE_V_34K_EVENT(raw_id
)))
938 if (IS_UNSUPPORTED_74K_EVENT(raw_id
, base_id
))
939 return ERR_PTR(-EOPNOTSUPP
);
940 raw_event
.event_id
= base_id
;
941 if (IS_BOTH_COUNTERS_74K_EVENT(base_id
))
942 raw_event
.cntr_mask
= CNTR_EVEN
| CNTR_ODD
;
944 raw_event
.cntr_mask
=
945 raw_id
> 127 ? CNTR_ODD
: CNTR_EVEN
;
946 #ifdef CONFIG_MIPS_MT_SMP
951 if (IS_UNSUPPORTED_1004K_EVENT(raw_id
, base_id
))
952 return ERR_PTR(-EOPNOTSUPP
);
953 raw_event
.event_id
= base_id
;
954 if (IS_BOTH_COUNTERS_1004K_EVENT(base_id
))
955 raw_event
.cntr_mask
= CNTR_EVEN
| CNTR_ODD
;
957 raw_event
.cntr_mask
=
958 raw_id
> 127 ? CNTR_ODD
: CNTR_EVEN
;
959 #ifdef CONFIG_MIPS_MT_SMP
960 if (IS_RANGE_P_1004K_EVENT(raw_id
, base_id
))
962 else if (unlikely(IS_RANGE_V_1004K_EVENT(raw_id
)))
973 static struct mips_pmu mipsxxcore_pmu
= {
974 .handle_irq
= mipsxx_pmu_handle_irq
,
975 .handle_shared_irq
= mipsxx_pmu_handle_shared_irq
,
976 .start
= mipsxx_pmu_start
,
977 .stop
= mipsxx_pmu_stop
,
978 .alloc_counter
= mipsxx_pmu_alloc_counter
,
979 .read_counter
= mipsxx_pmu_read_counter
,
980 .write_counter
= mipsxx_pmu_write_counter
,
981 .enable_event
= mipsxx_pmu_enable_event
,
982 .disable_event
= mipsxx_pmu_disable_event
,
983 .map_raw_event
= mipsxx_pmu_map_raw_event
,
984 .general_event_map
= &mipsxxcore_event_map
,
985 .cache_event_map
= &mipsxxcore_cache_map
,
988 static struct mips_pmu mipsxx74Kcore_pmu
= {
989 .handle_irq
= mipsxx_pmu_handle_irq
,
990 .handle_shared_irq
= mipsxx_pmu_handle_shared_irq
,
991 .start
= mipsxx_pmu_start
,
992 .stop
= mipsxx_pmu_stop
,
993 .alloc_counter
= mipsxx_pmu_alloc_counter
,
994 .read_counter
= mipsxx_pmu_read_counter
,
995 .write_counter
= mipsxx_pmu_write_counter
,
996 .enable_event
= mipsxx_pmu_enable_event
,
997 .disable_event
= mipsxx_pmu_disable_event
,
998 .map_raw_event
= mipsxx_pmu_map_raw_event
,
999 .general_event_map
= &mipsxx74Kcore_event_map
,
1000 .cache_event_map
= &mipsxx74Kcore_cache_map
,
1004 init_hw_perf_events(void)
1008 pr_info("Performance counters: ");
1010 counters
= n_counters();
1011 if (counters
== 0) {
1012 pr_cont("No available PMU.\n");
1016 #ifdef CONFIG_MIPS_MT_SMP
1017 cpu_has_mipsmt_pertccounters
= read_c0_config7() & (1<<19);
1018 if (!cpu_has_mipsmt_pertccounters
)
1019 counters
= counters_total_to_per_cpu(counters
);
1022 #ifdef MSC01E_INT_BASE
1025 * Using platform specific interrupt controller defines.
1027 irq
= MSC01E_INT_BASE
+ MSC01E_INT_PERFCTR
;
1030 if (cp0_perfcount_irq
>= 0)
1031 irq
= MIPS_CPU_IRQ_BASE
+ cp0_perfcount_irq
;
1034 #ifdef MSC01E_INT_BASE
1038 on_each_cpu(reset_counters
, (void *)(long)counters
, 1);
1040 switch (current_cpu_type()) {
1042 mipsxxcore_pmu
.name
= "mips/24K";
1043 mipsxxcore_pmu
.num_counters
= counters
;
1044 mipsxxcore_pmu
.irq
= irq
;
1045 mipspmu
= &mipsxxcore_pmu
;
1048 mipsxxcore_pmu
.name
= "mips/34K";
1049 mipsxxcore_pmu
.num_counters
= counters
;
1050 mipsxxcore_pmu
.irq
= irq
;
1051 mipspmu
= &mipsxxcore_pmu
;
1054 mipsxx74Kcore_pmu
.name
= "mips/74K";
1055 mipsxx74Kcore_pmu
.num_counters
= counters
;
1056 mipsxx74Kcore_pmu
.irq
= irq
;
1057 mipspmu
= &mipsxx74Kcore_pmu
;
1060 mipsxxcore_pmu
.name
= "mips/1004K";
1061 mipsxxcore_pmu
.num_counters
= counters
;
1062 mipsxxcore_pmu
.irq
= irq
;
1063 mipspmu
= &mipsxxcore_pmu
;
1066 pr_cont("Either hardware does not support performance "
1067 "counters, or not yet implemented.\n");
1072 pr_cont("%s PMU enabled, %d counters available to each "
1073 "CPU, irq %d%s\n", mipspmu
->name
, counters
, irq
,
1074 irq
< 0 ? " (share with timer interrupt)" : "");
1076 perf_pmu_register(&pmu
, "cpu", PERF_TYPE_RAW
);
1080 early_initcall(init_hw_perf_events
);
1082 #endif /* defined(CONFIG_CPU_MIPS32)... */