/*
 * HiSilicon SoC Hardware event counters support
 *
 * Copyright (C) 2017 Hisilicon Limited
 * Author: Anurup M <anurup.m@huawei.com>
 *         Shaokun Zhang <zhangshaokun@hisilicon.com>
 *
 * This code is based on the uncore PMUs like arm-cci and arm-ccn.
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License version 2 as
 * published by the Free Software Foundation.
 */
14 #include <linux/bitmap.h>
15 #include <linux/bitops.h>
16 #include <linux/bug.h>
17 #include <linux/err.h>
18 #include <linux/errno.h>
19 #include <linux/interrupt.h>
21 #include <asm/local64.h>
23 #include "hisi_uncore_pmu.h"
/* Low 8 bits of the event's hw.config_base, used as the hardware event code. */
#define HISI_GET_EVENTID(ev) ((ev)->hw.config_base & 0xff)
/* All-ones mask for an nr-bit wide counter (BIT_ULL(nr) - 1). */
#define HISI_MAX_PERIOD(nr) (BIT_ULL(nr) - 1)
29 * PMU format attributes
31 ssize_t
hisi_format_sysfs_show(struct device
*dev
,
32 struct device_attribute
*attr
, char *buf
)
34 struct dev_ext_attribute
*eattr
;
36 eattr
= container_of(attr
, struct dev_ext_attribute
, attr
);
38 return sprintf(buf
, "%s\n", (char *)eattr
->var
);
42 * PMU event attributes
44 ssize_t
hisi_event_sysfs_show(struct device
*dev
,
45 struct device_attribute
*attr
, char *page
)
47 struct dev_ext_attribute
*eattr
;
49 eattr
= container_of(attr
, struct dev_ext_attribute
, attr
);
51 return sprintf(page
, "config=0x%lx\n", (unsigned long)eattr
->var
);
55 * sysfs cpumask attributes. For uncore PMU, we only have a single CPU to show
57 ssize_t
hisi_cpumask_sysfs_show(struct device
*dev
,
58 struct device_attribute
*attr
, char *buf
)
60 struct hisi_pmu
*hisi_pmu
= to_hisi_pmu(dev_get_drvdata(dev
));
62 return sprintf(buf
, "%d\n", hisi_pmu
->on_cpu
);
65 static bool hisi_validate_event_group(struct perf_event
*event
)
67 struct perf_event
*sibling
, *leader
= event
->group_leader
;
68 struct hisi_pmu
*hisi_pmu
= to_hisi_pmu(event
->pmu
);
69 /* Include count for the event */
72 if (!is_software_event(leader
)) {
74 * We must NOT create groups containing mixed PMUs, although
75 * software events are acceptable
77 if (leader
->pmu
!= event
->pmu
)
80 /* Increment counter for the leader */
85 list_for_each_entry(sibling
, &event
->group_leader
->sibling_list
,
87 if (is_software_event(sibling
))
89 if (sibling
->pmu
!= event
->pmu
)
91 /* Increment counter for each sibling */
95 /* The group can not count events more than the counters in the HW */
96 return counters
<= hisi_pmu
->num_counters
;
99 int hisi_uncore_pmu_counter_valid(struct hisi_pmu
*hisi_pmu
, int idx
)
101 return idx
>= 0 && idx
< hisi_pmu
->num_counters
;
104 int hisi_uncore_pmu_get_event_idx(struct perf_event
*event
)
106 struct hisi_pmu
*hisi_pmu
= to_hisi_pmu(event
->pmu
);
107 unsigned long *used_mask
= hisi_pmu
->pmu_events
.used_mask
;
108 u32 num_counters
= hisi_pmu
->num_counters
;
111 idx
= find_first_zero_bit(used_mask
, num_counters
);
112 if (idx
== num_counters
)
115 set_bit(idx
, used_mask
);
120 static void hisi_uncore_pmu_clear_event_idx(struct hisi_pmu
*hisi_pmu
, int idx
)
122 if (!hisi_uncore_pmu_counter_valid(hisi_pmu
, idx
)) {
123 dev_err(hisi_pmu
->dev
, "Unsupported event index:%d!\n", idx
);
127 clear_bit(idx
, hisi_pmu
->pmu_events
.used_mask
);
130 int hisi_uncore_pmu_event_init(struct perf_event
*event
)
132 struct hw_perf_event
*hwc
= &event
->hw
;
133 struct hisi_pmu
*hisi_pmu
;
135 if (event
->attr
.type
!= event
->pmu
->type
)
139 * We do not support sampling as the counters are all
140 * shared by all CPU cores in a CPU die(SCCL). Also we
141 * do not support attach to a task(per-process mode)
143 if (is_sampling_event(event
) || event
->attach_state
& PERF_ATTACH_TASK
)
146 /* counters do not have these bits */
147 if (event
->attr
.exclude_user
||
148 event
->attr
.exclude_kernel
||
149 event
->attr
.exclude_host
||
150 event
->attr
.exclude_guest
||
151 event
->attr
.exclude_hv
||
152 event
->attr
.exclude_idle
)
156 * The uncore counters not specific to any CPU, so cannot
163 * Validate if the events in group does not exceed the
164 * available counters in hardware.
166 if (!hisi_validate_event_group(event
))
169 hisi_pmu
= to_hisi_pmu(event
->pmu
);
170 if (event
->attr
.config
> hisi_pmu
->check_event
)
173 if (hisi_pmu
->on_cpu
== -1)
176 * We don't assign an index until we actually place the event onto
177 * hardware. Use -1 to signify that we haven't decided where to put it
181 hwc
->config_base
= event
->attr
.config
;
183 /* Enforce to use the same CPU for all events in this PMU */
184 event
->cpu
= hisi_pmu
->on_cpu
;
190 * Set the counter to count the event that we're interested in,
191 * and enable interrupt and counter.
193 static void hisi_uncore_pmu_enable_event(struct perf_event
*event
)
195 struct hisi_pmu
*hisi_pmu
= to_hisi_pmu(event
->pmu
);
196 struct hw_perf_event
*hwc
= &event
->hw
;
198 hisi_pmu
->ops
->write_evtype(hisi_pmu
, hwc
->idx
,
199 HISI_GET_EVENTID(event
));
201 hisi_pmu
->ops
->enable_counter_int(hisi_pmu
, hwc
);
202 hisi_pmu
->ops
->enable_counter(hisi_pmu
, hwc
);
206 * Disable counter and interrupt.
208 static void hisi_uncore_pmu_disable_event(struct perf_event
*event
)
210 struct hisi_pmu
*hisi_pmu
= to_hisi_pmu(event
->pmu
);
211 struct hw_perf_event
*hwc
= &event
->hw
;
213 hisi_pmu
->ops
->disable_counter(hisi_pmu
, hwc
);
214 hisi_pmu
->ops
->disable_counter_int(hisi_pmu
, hwc
);
217 void hisi_uncore_pmu_set_event_period(struct perf_event
*event
)
219 struct hisi_pmu
*hisi_pmu
= to_hisi_pmu(event
->pmu
);
220 struct hw_perf_event
*hwc
= &event
->hw
;
223 * The HiSilicon PMU counters support 32 bits or 48 bits, depending on
224 * the PMU. We reduce it to 2^(counter_bits - 1) to account for the
225 * extreme interrupt latency. So we could hopefully handle the overflow
226 * interrupt before another 2^(counter_bits - 1) events occur and the
227 * counter overtakes its previous value.
229 u64 val
= BIT_ULL(hisi_pmu
->counter_bits
- 1);
231 local64_set(&hwc
->prev_count
, val
);
232 /* Write start value to the hardware event counter */
233 hisi_pmu
->ops
->write_counter(hisi_pmu
, hwc
, val
);
236 void hisi_uncore_pmu_event_update(struct perf_event
*event
)
238 struct hisi_pmu
*hisi_pmu
= to_hisi_pmu(event
->pmu
);
239 struct hw_perf_event
*hwc
= &event
->hw
;
240 u64 delta
, prev_raw_count
, new_raw_count
;
243 /* Read the count from the counter register */
244 new_raw_count
= hisi_pmu
->ops
->read_counter(hisi_pmu
, hwc
);
245 prev_raw_count
= local64_read(&hwc
->prev_count
);
246 } while (local64_cmpxchg(&hwc
->prev_count
, prev_raw_count
,
247 new_raw_count
) != prev_raw_count
);
251 delta
= (new_raw_count
- prev_raw_count
) &
252 HISI_MAX_PERIOD(hisi_pmu
->counter_bits
);
253 local64_add(delta
, &event
->count
);
256 void hisi_uncore_pmu_start(struct perf_event
*event
, int flags
)
258 struct hisi_pmu
*hisi_pmu
= to_hisi_pmu(event
->pmu
);
259 struct hw_perf_event
*hwc
= &event
->hw
;
261 if (WARN_ON_ONCE(!(hwc
->state
& PERF_HES_STOPPED
)))
264 WARN_ON_ONCE(!(hwc
->state
& PERF_HES_UPTODATE
));
266 hisi_uncore_pmu_set_event_period(event
);
268 if (flags
& PERF_EF_RELOAD
) {
269 u64 prev_raw_count
= local64_read(&hwc
->prev_count
);
271 hisi_pmu
->ops
->write_counter(hisi_pmu
, hwc
, prev_raw_count
);
274 hisi_uncore_pmu_enable_event(event
);
275 perf_event_update_userpage(event
);
278 void hisi_uncore_pmu_stop(struct perf_event
*event
, int flags
)
280 struct hw_perf_event
*hwc
= &event
->hw
;
282 hisi_uncore_pmu_disable_event(event
);
283 WARN_ON_ONCE(hwc
->state
& PERF_HES_STOPPED
);
284 hwc
->state
|= PERF_HES_STOPPED
;
286 if (hwc
->state
& PERF_HES_UPTODATE
)
289 /* Read hardware counter and update the perf counter statistics */
290 hisi_uncore_pmu_event_update(event
);
291 hwc
->state
|= PERF_HES_UPTODATE
;
294 int hisi_uncore_pmu_add(struct perf_event
*event
, int flags
)
296 struct hisi_pmu
*hisi_pmu
= to_hisi_pmu(event
->pmu
);
297 struct hw_perf_event
*hwc
= &event
->hw
;
300 hwc
->state
= PERF_HES_STOPPED
| PERF_HES_UPTODATE
;
302 /* Get an available counter index for counting */
303 idx
= hisi_pmu
->ops
->get_event_idx(event
);
308 hisi_pmu
->pmu_events
.hw_events
[idx
] = event
;
310 if (flags
& PERF_EF_START
)
311 hisi_uncore_pmu_start(event
, PERF_EF_RELOAD
);
316 void hisi_uncore_pmu_del(struct perf_event
*event
, int flags
)
318 struct hisi_pmu
*hisi_pmu
= to_hisi_pmu(event
->pmu
);
319 struct hw_perf_event
*hwc
= &event
->hw
;
321 hisi_uncore_pmu_stop(event
, PERF_EF_UPDATE
);
322 hisi_uncore_pmu_clear_event_idx(hisi_pmu
, hwc
->idx
);
323 perf_event_update_userpage(event
);
324 hisi_pmu
->pmu_events
.hw_events
[hwc
->idx
] = NULL
;
/* Bring event->count up to date with the hardware counter. */
void hisi_uncore_pmu_read(struct perf_event *event)
{
	/* Read hardware counter and update the perf counter statistics */
	hisi_uncore_pmu_event_update(event);
}
333 void hisi_uncore_pmu_enable(struct pmu
*pmu
)
335 struct hisi_pmu
*hisi_pmu
= to_hisi_pmu(pmu
);
336 int enabled
= bitmap_weight(hisi_pmu
->pmu_events
.used_mask
,
337 hisi_pmu
->num_counters
);
342 hisi_pmu
->ops
->start_counters(hisi_pmu
);
345 void hisi_uncore_pmu_disable(struct pmu
*pmu
)
347 struct hisi_pmu
*hisi_pmu
= to_hisi_pmu(pmu
);
349 hisi_pmu
->ops
->stop_counters(hisi_pmu
);
353 * Read Super CPU cluster and CPU cluster ID from MPIDR_EL1.
354 * If multi-threading is supported, SCCL_ID is in MPIDR[aff3] and CCL_ID
355 * is in MPIDR[aff2]; if not, SCCL_ID is in MPIDR[aff2] and CCL_ID is
356 * in MPIDR[aff1]. If this changes in future, this shall be updated.
358 static void hisi_read_sccl_and_ccl_id(int *sccl_id
, int *ccl_id
)
360 u64 mpidr
= read_cpuid_mpidr();
362 if (mpidr
& MPIDR_MT_BITMASK
) {
364 *sccl_id
= MPIDR_AFFINITY_LEVEL(mpidr
, 3);
366 *ccl_id
= MPIDR_AFFINITY_LEVEL(mpidr
, 2);
369 *sccl_id
= MPIDR_AFFINITY_LEVEL(mpidr
, 2);
371 *ccl_id
= MPIDR_AFFINITY_LEVEL(mpidr
, 1);
376 * Check whether the CPU is associated with this uncore PMU
378 static bool hisi_pmu_cpu_is_associated_pmu(struct hisi_pmu
*hisi_pmu
)
382 if (hisi_pmu
->ccl_id
== -1) {
383 /* If CCL_ID is -1, the PMU only shares the same SCCL */
384 hisi_read_sccl_and_ccl_id(&sccl_id
, NULL
);
386 return sccl_id
== hisi_pmu
->sccl_id
;
389 hisi_read_sccl_and_ccl_id(&sccl_id
, &ccl_id
);
391 return sccl_id
== hisi_pmu
->sccl_id
&& ccl_id
== hisi_pmu
->ccl_id
;
394 int hisi_uncore_pmu_online_cpu(unsigned int cpu
, struct hlist_node
*node
)
396 struct hisi_pmu
*hisi_pmu
= hlist_entry_safe(node
, struct hisi_pmu
,
399 if (!hisi_pmu_cpu_is_associated_pmu(hisi_pmu
))
402 cpumask_set_cpu(cpu
, &hisi_pmu
->associated_cpus
);
404 /* If another CPU is already managing this PMU, simply return. */
405 if (hisi_pmu
->on_cpu
!= -1)
408 /* Use this CPU in cpumask for event counting */
409 hisi_pmu
->on_cpu
= cpu
;
411 /* Overflow interrupt also should use the same CPU */
412 WARN_ON(irq_set_affinity(hisi_pmu
->irq
, cpumask_of(cpu
)));
417 int hisi_uncore_pmu_offline_cpu(unsigned int cpu
, struct hlist_node
*node
)
419 struct hisi_pmu
*hisi_pmu
= hlist_entry_safe(node
, struct hisi_pmu
,
421 cpumask_t pmu_online_cpus
;
424 if (!cpumask_test_and_clear_cpu(cpu
, &hisi_pmu
->associated_cpus
))
427 /* Nothing to do if this CPU doesn't own the PMU */
428 if (hisi_pmu
->on_cpu
!= cpu
)
431 /* Give up ownership of the PMU */
432 hisi_pmu
->on_cpu
= -1;
434 /* Choose a new CPU to migrate ownership of the PMU to */
435 cpumask_and(&pmu_online_cpus
, &hisi_pmu
->associated_cpus
,
437 target
= cpumask_any_but(&pmu_online_cpus
, cpu
);
438 if (target
>= nr_cpu_ids
)
441 perf_pmu_migrate_context(&hisi_pmu
->pmu
, cpu
, target
);
442 /* Use this CPU for event counting */
443 hisi_pmu
->on_cpu
= target
;
444 WARN_ON(irq_set_affinity(hisi_pmu
->irq
, cpumask_of(target
)));