18c2ecf20Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0-only 28c2ecf20Sopenharmony_ci#undef DEBUG 38c2ecf20Sopenharmony_ci 48c2ecf20Sopenharmony_ci/* 58c2ecf20Sopenharmony_ci * ARM performance counter support. 68c2ecf20Sopenharmony_ci * 78c2ecf20Sopenharmony_ci * Copyright (C) 2009 picoChip Designs, Ltd., Jamie Iles 88c2ecf20Sopenharmony_ci * Copyright (C) 2010 ARM Ltd., Will Deacon <will.deacon@arm.com> 98c2ecf20Sopenharmony_ci * 108c2ecf20Sopenharmony_ci * This code is based on the sparc64 perf event code, which is in turn based 118c2ecf20Sopenharmony_ci * on the x86 code. 128c2ecf20Sopenharmony_ci */ 138c2ecf20Sopenharmony_ci#define pr_fmt(fmt) "hw perfevents: " fmt 148c2ecf20Sopenharmony_ci 158c2ecf20Sopenharmony_ci#include <linux/bitmap.h> 168c2ecf20Sopenharmony_ci#include <linux/cpumask.h> 178c2ecf20Sopenharmony_ci#include <linux/cpu_pm.h> 188c2ecf20Sopenharmony_ci#include <linux/export.h> 198c2ecf20Sopenharmony_ci#include <linux/kernel.h> 208c2ecf20Sopenharmony_ci#include <linux/perf/arm_pmu.h> 218c2ecf20Sopenharmony_ci#include <linux/slab.h> 228c2ecf20Sopenharmony_ci#include <linux/sched/clock.h> 238c2ecf20Sopenharmony_ci#include <linux/spinlock.h> 248c2ecf20Sopenharmony_ci#include <linux/irq.h> 258c2ecf20Sopenharmony_ci#include <linux/irqdesc.h> 268c2ecf20Sopenharmony_ci 278c2ecf20Sopenharmony_ci#include <asm/irq_regs.h> 288c2ecf20Sopenharmony_ci 298c2ecf20Sopenharmony_cistatic int armpmu_count_irq_users(const int irq); 308c2ecf20Sopenharmony_ci 318c2ecf20Sopenharmony_cistruct pmu_irq_ops { 328c2ecf20Sopenharmony_ci void (*enable_pmuirq)(unsigned int irq); 338c2ecf20Sopenharmony_ci void (*disable_pmuirq)(unsigned int irq); 348c2ecf20Sopenharmony_ci void (*free_pmuirq)(unsigned int irq, int cpu, void __percpu *devid); 358c2ecf20Sopenharmony_ci}; 368c2ecf20Sopenharmony_ci 378c2ecf20Sopenharmony_cistatic void armpmu_free_pmuirq(unsigned int irq, int cpu, void __percpu *devid) 388c2ecf20Sopenharmony_ci{ 398c2ecf20Sopenharmony_ci free_irq(irq, per_cpu_ptr(devid, cpu)); 408c2ecf20Sopenharmony_ci} 418c2ecf20Sopenharmony_ci 428c2ecf20Sopenharmony_cistatic const struct pmu_irq_ops pmuirq_ops = { 438c2ecf20Sopenharmony_ci .enable_pmuirq = enable_irq, 448c2ecf20Sopenharmony_ci .disable_pmuirq = disable_irq_nosync, 458c2ecf20Sopenharmony_ci .free_pmuirq = armpmu_free_pmuirq 468c2ecf20Sopenharmony_ci}; 478c2ecf20Sopenharmony_ci 488c2ecf20Sopenharmony_cistatic void armpmu_free_pmunmi(unsigned int irq, int cpu, void __percpu *devid) 498c2ecf20Sopenharmony_ci{ 508c2ecf20Sopenharmony_ci free_nmi(irq, per_cpu_ptr(devid, cpu)); 518c2ecf20Sopenharmony_ci} 528c2ecf20Sopenharmony_ci 538c2ecf20Sopenharmony_cistatic const struct pmu_irq_ops pmunmi_ops = { 548c2ecf20Sopenharmony_ci .enable_pmuirq = enable_nmi, 558c2ecf20Sopenharmony_ci .disable_pmuirq = disable_nmi_nosync, 568c2ecf20Sopenharmony_ci .free_pmuirq = armpmu_free_pmunmi 578c2ecf20Sopenharmony_ci}; 588c2ecf20Sopenharmony_ci 598c2ecf20Sopenharmony_cistatic void armpmu_enable_percpu_pmuirq(unsigned int irq) 608c2ecf20Sopenharmony_ci{ 618c2ecf20Sopenharmony_ci enable_percpu_irq(irq, IRQ_TYPE_NONE); 628c2ecf20Sopenharmony_ci} 638c2ecf20Sopenharmony_ci 648c2ecf20Sopenharmony_cistatic void armpmu_free_percpu_pmuirq(unsigned int irq, int cpu, 658c2ecf20Sopenharmony_ci void __percpu *devid) 668c2ecf20Sopenharmony_ci{ 678c2ecf20Sopenharmony_ci if (armpmu_count_irq_users(irq) == 1) 688c2ecf20Sopenharmony_ci free_percpu_irq(irq, devid); 698c2ecf20Sopenharmony_ci} 708c2ecf20Sopenharmony_ci 718c2ecf20Sopenharmony_cistatic const struct pmu_irq_ops percpu_pmuirq_ops = { 728c2ecf20Sopenharmony_ci .enable_pmuirq = armpmu_enable_percpu_pmuirq, 738c2ecf20Sopenharmony_ci .disable_pmuirq = disable_percpu_irq, 748c2ecf20Sopenharmony_ci .free_pmuirq = armpmu_free_percpu_pmuirq 758c2ecf20Sopenharmony_ci}; 768c2ecf20Sopenharmony_ci 778c2ecf20Sopenharmony_cistatic void armpmu_enable_percpu_pmunmi(unsigned int irq) 788c2ecf20Sopenharmony_ci{ 798c2ecf20Sopenharmony_ci if (!prepare_percpu_nmi(irq)) 808c2ecf20Sopenharmony_ci enable_percpu_nmi(irq, IRQ_TYPE_NONE); 818c2ecf20Sopenharmony_ci} 828c2ecf20Sopenharmony_ci 838c2ecf20Sopenharmony_cistatic void armpmu_disable_percpu_pmunmi(unsigned int irq) 848c2ecf20Sopenharmony_ci{ 858c2ecf20Sopenharmony_ci disable_percpu_nmi(irq); 868c2ecf20Sopenharmony_ci teardown_percpu_nmi(irq); 878c2ecf20Sopenharmony_ci} 888c2ecf20Sopenharmony_ci 898c2ecf20Sopenharmony_cistatic void armpmu_free_percpu_pmunmi(unsigned int irq, int cpu, 908c2ecf20Sopenharmony_ci void __percpu *devid) 918c2ecf20Sopenharmony_ci{ 928c2ecf20Sopenharmony_ci if (armpmu_count_irq_users(irq) == 1) 938c2ecf20Sopenharmony_ci free_percpu_nmi(irq, devid); 948c2ecf20Sopenharmony_ci} 958c2ecf20Sopenharmony_ci 968c2ecf20Sopenharmony_cistatic const struct pmu_irq_ops percpu_pmunmi_ops = { 978c2ecf20Sopenharmony_ci .enable_pmuirq = armpmu_enable_percpu_pmunmi, 988c2ecf20Sopenharmony_ci .disable_pmuirq = armpmu_disable_percpu_pmunmi, 998c2ecf20Sopenharmony_ci .free_pmuirq = armpmu_free_percpu_pmunmi 1008c2ecf20Sopenharmony_ci}; 1018c2ecf20Sopenharmony_ci 1028c2ecf20Sopenharmony_cistatic DEFINE_PER_CPU(struct arm_pmu *, cpu_armpmu); 1038c2ecf20Sopenharmony_cistatic DEFINE_PER_CPU(int, cpu_irq); 1048c2ecf20Sopenharmony_cistatic DEFINE_PER_CPU(const struct pmu_irq_ops *, cpu_irq_ops); 1058c2ecf20Sopenharmony_ci 1068c2ecf20Sopenharmony_cistatic bool has_nmi; 1078c2ecf20Sopenharmony_ci 1088c2ecf20Sopenharmony_cistatic inline u64 arm_pmu_event_max_period(struct perf_event *event) 1098c2ecf20Sopenharmony_ci{ 1108c2ecf20Sopenharmony_ci if (event->hw.flags & ARMPMU_EVT_64BIT) 1118c2ecf20Sopenharmony_ci return GENMASK_ULL(63, 0); 1128c2ecf20Sopenharmony_ci else 1138c2ecf20Sopenharmony_ci return GENMASK_ULL(31, 0); 1148c2ecf20Sopenharmony_ci} 1158c2ecf20Sopenharmony_ci 1168c2ecf20Sopenharmony_cistatic int 1178c2ecf20Sopenharmony_ciarmpmu_map_cache_event(const unsigned (*cache_map) 1188c2ecf20Sopenharmony_ci [PERF_COUNT_HW_CACHE_MAX] 1198c2ecf20Sopenharmony_ci [PERF_COUNT_HW_CACHE_OP_MAX] 1208c2ecf20Sopenharmony_ci [PERF_COUNT_HW_CACHE_RESULT_MAX], 1218c2ecf20Sopenharmony_ci u64 config) 1228c2ecf20Sopenharmony_ci{ 1238c2ecf20Sopenharmony_ci unsigned int cache_type, cache_op, cache_result, ret; 1248c2ecf20Sopenharmony_ci 1258c2ecf20Sopenharmony_ci cache_type = (config >> 0) & 0xff; 1268c2ecf20Sopenharmony_ci if (cache_type >= PERF_COUNT_HW_CACHE_MAX) 1278c2ecf20Sopenharmony_ci return -EINVAL; 1288c2ecf20Sopenharmony_ci 1298c2ecf20Sopenharmony_ci cache_op = (config >> 8) & 0xff; 1308c2ecf20Sopenharmony_ci if (cache_op >= PERF_COUNT_HW_CACHE_OP_MAX) 1318c2ecf20Sopenharmony_ci return -EINVAL; 1328c2ecf20Sopenharmony_ci 1338c2ecf20Sopenharmony_ci cache_result = (config >> 16) & 0xff; 1348c2ecf20Sopenharmony_ci if (cache_result >= PERF_COUNT_HW_CACHE_RESULT_MAX) 1358c2ecf20Sopenharmony_ci return -EINVAL; 1368c2ecf20Sopenharmony_ci 1378c2ecf20Sopenharmony_ci if (!cache_map) 1388c2ecf20Sopenharmony_ci return -ENOENT; 1398c2ecf20Sopenharmony_ci 1408c2ecf20Sopenharmony_ci ret = (int)(*cache_map)[cache_type][cache_op][cache_result]; 1418c2ecf20Sopenharmony_ci 1428c2ecf20Sopenharmony_ci if (ret == CACHE_OP_UNSUPPORTED) 1438c2ecf20Sopenharmony_ci return -ENOENT; 1448c2ecf20Sopenharmony_ci 1458c2ecf20Sopenharmony_ci return ret; 1468c2ecf20Sopenharmony_ci} 1478c2ecf20Sopenharmony_ci 1488c2ecf20Sopenharmony_cistatic int 1498c2ecf20Sopenharmony_ciarmpmu_map_hw_event(const unsigned (*event_map)[PERF_COUNT_HW_MAX], u64 config) 1508c2ecf20Sopenharmony_ci{ 1518c2ecf20Sopenharmony_ci int mapping; 1528c2ecf20Sopenharmony_ci 1538c2ecf20Sopenharmony_ci if (config >= PERF_COUNT_HW_MAX) 1548c2ecf20Sopenharmony_ci return -EINVAL; 1558c2ecf20Sopenharmony_ci 1568c2ecf20Sopenharmony_ci if (!event_map) 1578c2ecf20Sopenharmony_ci return -ENOENT; 1588c2ecf20Sopenharmony_ci 1598c2ecf20Sopenharmony_ci mapping = (*event_map)[config]; 1608c2ecf20Sopenharmony_ci return mapping == HW_OP_UNSUPPORTED ? -ENOENT : mapping; 1618c2ecf20Sopenharmony_ci} 1628c2ecf20Sopenharmony_ci 1638c2ecf20Sopenharmony_cistatic int 1648c2ecf20Sopenharmony_ciarmpmu_map_raw_event(u32 raw_event_mask, u64 config) 1658c2ecf20Sopenharmony_ci{ 1668c2ecf20Sopenharmony_ci return (int)(config & raw_event_mask); 1678c2ecf20Sopenharmony_ci} 1688c2ecf20Sopenharmony_ci 1698c2ecf20Sopenharmony_ciint 1708c2ecf20Sopenharmony_ciarmpmu_map_event(struct perf_event *event, 1718c2ecf20Sopenharmony_ci const unsigned (*event_map)[PERF_COUNT_HW_MAX], 1728c2ecf20Sopenharmony_ci const unsigned (*cache_map) 1738c2ecf20Sopenharmony_ci [PERF_COUNT_HW_CACHE_MAX] 1748c2ecf20Sopenharmony_ci [PERF_COUNT_HW_CACHE_OP_MAX] 1758c2ecf20Sopenharmony_ci [PERF_COUNT_HW_CACHE_RESULT_MAX], 1768c2ecf20Sopenharmony_ci u32 raw_event_mask) 1778c2ecf20Sopenharmony_ci{ 1788c2ecf20Sopenharmony_ci u64 config = event->attr.config; 1798c2ecf20Sopenharmony_ci int type = event->attr.type; 1808c2ecf20Sopenharmony_ci 1818c2ecf20Sopenharmony_ci if (type == event->pmu->type) 1828c2ecf20Sopenharmony_ci return armpmu_map_raw_event(raw_event_mask, config); 1838c2ecf20Sopenharmony_ci 1848c2ecf20Sopenharmony_ci switch (type) { 1858c2ecf20Sopenharmony_ci case PERF_TYPE_HARDWARE: 1868c2ecf20Sopenharmony_ci return armpmu_map_hw_event(event_map, config); 1878c2ecf20Sopenharmony_ci case PERF_TYPE_HW_CACHE: 1888c2ecf20Sopenharmony_ci return armpmu_map_cache_event(cache_map, config); 1898c2ecf20Sopenharmony_ci case PERF_TYPE_RAW: 1908c2ecf20Sopenharmony_ci return armpmu_map_raw_event(raw_event_mask, config); 1918c2ecf20Sopenharmony_ci } 1928c2ecf20Sopenharmony_ci 1938c2ecf20Sopenharmony_ci return -ENOENT; 1948c2ecf20Sopenharmony_ci} 1958c2ecf20Sopenharmony_ci 1968c2ecf20Sopenharmony_ciint armpmu_event_set_period(struct perf_event *event) 1978c2ecf20Sopenharmony_ci{ 1988c2ecf20Sopenharmony_ci struct arm_pmu *armpmu = to_arm_pmu(event->pmu); 1998c2ecf20Sopenharmony_ci struct hw_perf_event *hwc = &event->hw; 2008c2ecf20Sopenharmony_ci s64 left = local64_read(&hwc->period_left); 2018c2ecf20Sopenharmony_ci s64 period = hwc->sample_period; 2028c2ecf20Sopenharmony_ci u64 max_period; 2038c2ecf20Sopenharmony_ci int ret = 0; 2048c2ecf20Sopenharmony_ci 2058c2ecf20Sopenharmony_ci max_period = arm_pmu_event_max_period(event); 2068c2ecf20Sopenharmony_ci if (unlikely(left <= -period)) { 2078c2ecf20Sopenharmony_ci left = period; 2088c2ecf20Sopenharmony_ci local64_set(&hwc->period_left, left); 2098c2ecf20Sopenharmony_ci hwc->last_period = period; 2108c2ecf20Sopenharmony_ci ret = 1; 2118c2ecf20Sopenharmony_ci } 2128c2ecf20Sopenharmony_ci 2138c2ecf20Sopenharmony_ci if (unlikely(left <= 0)) { 2148c2ecf20Sopenharmony_ci left += period; 2158c2ecf20Sopenharmony_ci local64_set(&hwc->period_left, left); 2168c2ecf20Sopenharmony_ci hwc->last_period = period; 2178c2ecf20Sopenharmony_ci ret = 1; 2188c2ecf20Sopenharmony_ci } 2198c2ecf20Sopenharmony_ci 2208c2ecf20Sopenharmony_ci /* 2218c2ecf20Sopenharmony_ci * Limit the maximum period to prevent the counter value 2228c2ecf20Sopenharmony_ci * from overtaking the one we are about to program. In 2238c2ecf20Sopenharmony_ci * effect we are reducing max_period to account for 2248c2ecf20Sopenharmony_ci * interrupt latency (and we are being very conservative). 2258c2ecf20Sopenharmony_ci */ 2268c2ecf20Sopenharmony_ci if (left > (max_period >> 1)) 2278c2ecf20Sopenharmony_ci left = (max_period >> 1); 2288c2ecf20Sopenharmony_ci 2298c2ecf20Sopenharmony_ci local64_set(&hwc->prev_count, (u64)-left); 2308c2ecf20Sopenharmony_ci 2318c2ecf20Sopenharmony_ci armpmu->write_counter(event, (u64)(-left) & max_period); 2328c2ecf20Sopenharmony_ci 2338c2ecf20Sopenharmony_ci perf_event_update_userpage(event); 2348c2ecf20Sopenharmony_ci 2358c2ecf20Sopenharmony_ci return ret; 2368c2ecf20Sopenharmony_ci} 2378c2ecf20Sopenharmony_ci 2388c2ecf20Sopenharmony_ciu64 armpmu_event_update(struct perf_event *event) 2398c2ecf20Sopenharmony_ci{ 2408c2ecf20Sopenharmony_ci struct arm_pmu *armpmu = to_arm_pmu(event->pmu); 2418c2ecf20Sopenharmony_ci struct hw_perf_event *hwc = &event->hw; 2428c2ecf20Sopenharmony_ci u64 delta, prev_raw_count, new_raw_count; 2438c2ecf20Sopenharmony_ci u64 max_period = arm_pmu_event_max_period(event); 2448c2ecf20Sopenharmony_ci 2458c2ecf20Sopenharmony_ciagain: 2468c2ecf20Sopenharmony_ci prev_raw_count = local64_read(&hwc->prev_count); 2478c2ecf20Sopenharmony_ci new_raw_count = armpmu->read_counter(event); 2488c2ecf20Sopenharmony_ci 2498c2ecf20Sopenharmony_ci if (local64_cmpxchg(&hwc->prev_count, prev_raw_count, 2508c2ecf20Sopenharmony_ci new_raw_count) != prev_raw_count) 2518c2ecf20Sopenharmony_ci goto again; 2528c2ecf20Sopenharmony_ci 2538c2ecf20Sopenharmony_ci delta = (new_raw_count - prev_raw_count) & max_period; 2548c2ecf20Sopenharmony_ci 2558c2ecf20Sopenharmony_ci local64_add(delta, &event->count); 2568c2ecf20Sopenharmony_ci local64_sub(delta, &hwc->period_left); 2578c2ecf20Sopenharmony_ci 2588c2ecf20Sopenharmony_ci return new_raw_count; 2598c2ecf20Sopenharmony_ci} 2608c2ecf20Sopenharmony_ci 2618c2ecf20Sopenharmony_cistatic void 2628c2ecf20Sopenharmony_ciarmpmu_read(struct perf_event *event) 2638c2ecf20Sopenharmony_ci{ 2648c2ecf20Sopenharmony_ci armpmu_event_update(event); 2658c2ecf20Sopenharmony_ci} 2668c2ecf20Sopenharmony_ci 2678c2ecf20Sopenharmony_cistatic void 2688c2ecf20Sopenharmony_ciarmpmu_stop(struct perf_event *event, int flags) 2698c2ecf20Sopenharmony_ci{ 2708c2ecf20Sopenharmony_ci struct arm_pmu *armpmu = to_arm_pmu(event->pmu); 2718c2ecf20Sopenharmony_ci struct hw_perf_event *hwc = &event->hw; 2728c2ecf20Sopenharmony_ci 2738c2ecf20Sopenharmony_ci /* 2748c2ecf20Sopenharmony_ci * ARM pmu always has to update the counter, so ignore 2758c2ecf20Sopenharmony_ci * PERF_EF_UPDATE, see comments in armpmu_start(). 2768c2ecf20Sopenharmony_ci */ 2778c2ecf20Sopenharmony_ci if (!(hwc->state & PERF_HES_STOPPED)) { 2788c2ecf20Sopenharmony_ci armpmu->disable(event); 2798c2ecf20Sopenharmony_ci armpmu_event_update(event); 2808c2ecf20Sopenharmony_ci hwc->state |= PERF_HES_STOPPED | PERF_HES_UPTODATE; 2818c2ecf20Sopenharmony_ci } 2828c2ecf20Sopenharmony_ci} 2838c2ecf20Sopenharmony_ci 2848c2ecf20Sopenharmony_cistatic void armpmu_start(struct perf_event *event, int flags) 2858c2ecf20Sopenharmony_ci{ 2868c2ecf20Sopenharmony_ci struct arm_pmu *armpmu = to_arm_pmu(event->pmu); 2878c2ecf20Sopenharmony_ci struct hw_perf_event *hwc = &event->hw; 2888c2ecf20Sopenharmony_ci 2898c2ecf20Sopenharmony_ci /* 2908c2ecf20Sopenharmony_ci * ARM pmu always has to reprogram the period, so ignore 2918c2ecf20Sopenharmony_ci * PERF_EF_RELOAD, see the comment below. 2928c2ecf20Sopenharmony_ci */ 2938c2ecf20Sopenharmony_ci if (flags & PERF_EF_RELOAD) 2948c2ecf20Sopenharmony_ci WARN_ON_ONCE(!(hwc->state & PERF_HES_UPTODATE)); 2958c2ecf20Sopenharmony_ci 2968c2ecf20Sopenharmony_ci hwc->state = 0; 2978c2ecf20Sopenharmony_ci /* 2988c2ecf20Sopenharmony_ci * Set the period again. Some counters can't be stopped, so when we 2998c2ecf20Sopenharmony_ci * were stopped we simply disabled the IRQ source and the counter 3008c2ecf20Sopenharmony_ci * may have been left counting. If we don't do this step then we may 3018c2ecf20Sopenharmony_ci * get an interrupt too soon or *way* too late if the overflow has 3028c2ecf20Sopenharmony_ci * happened since disabling. 3038c2ecf20Sopenharmony_ci */ 3048c2ecf20Sopenharmony_ci armpmu_event_set_period(event); 3058c2ecf20Sopenharmony_ci armpmu->enable(event); 3068c2ecf20Sopenharmony_ci} 3078c2ecf20Sopenharmony_ci 3088c2ecf20Sopenharmony_cistatic void 3098c2ecf20Sopenharmony_ciarmpmu_del(struct perf_event *event, int flags) 3108c2ecf20Sopenharmony_ci{ 3118c2ecf20Sopenharmony_ci struct arm_pmu *armpmu = to_arm_pmu(event->pmu); 3128c2ecf20Sopenharmony_ci struct pmu_hw_events *hw_events = this_cpu_ptr(armpmu->hw_events); 3138c2ecf20Sopenharmony_ci struct hw_perf_event *hwc = &event->hw; 3148c2ecf20Sopenharmony_ci int idx = hwc->idx; 3158c2ecf20Sopenharmony_ci 3168c2ecf20Sopenharmony_ci armpmu_stop(event, PERF_EF_UPDATE); 3178c2ecf20Sopenharmony_ci hw_events->events[idx] = NULL; 3188c2ecf20Sopenharmony_ci armpmu->clear_event_idx(hw_events, event); 3198c2ecf20Sopenharmony_ci perf_event_update_userpage(event); 3208c2ecf20Sopenharmony_ci /* Clear the allocated counter */ 3218c2ecf20Sopenharmony_ci hwc->idx = -1; 3228c2ecf20Sopenharmony_ci} 3238c2ecf20Sopenharmony_ci 3248c2ecf20Sopenharmony_cistatic int 3258c2ecf20Sopenharmony_ciarmpmu_add(struct perf_event *event, int flags) 3268c2ecf20Sopenharmony_ci{ 3278c2ecf20Sopenharmony_ci struct arm_pmu *armpmu = to_arm_pmu(event->pmu); 3288c2ecf20Sopenharmony_ci struct pmu_hw_events *hw_events = this_cpu_ptr(armpmu->hw_events); 3298c2ecf20Sopenharmony_ci struct hw_perf_event *hwc = &event->hw; 3308c2ecf20Sopenharmony_ci int idx; 3318c2ecf20Sopenharmony_ci 3328c2ecf20Sopenharmony_ci /* An event following a process won't be stopped earlier */ 3338c2ecf20Sopenharmony_ci if (!cpumask_test_cpu(smp_processor_id(), &armpmu->supported_cpus)) 3348c2ecf20Sopenharmony_ci return -ENOENT; 3358c2ecf20Sopenharmony_ci 3368c2ecf20Sopenharmony_ci /* If we don't have a space for the counter then finish early. */ 3378c2ecf20Sopenharmony_ci idx = armpmu->get_event_idx(hw_events, event); 3388c2ecf20Sopenharmony_ci if (idx < 0) 3398c2ecf20Sopenharmony_ci return idx; 3408c2ecf20Sopenharmony_ci 3418c2ecf20Sopenharmony_ci /* 3428c2ecf20Sopenharmony_ci * If there is an event in the counter we are going to use then make 3438c2ecf20Sopenharmony_ci * sure it is disabled. 3448c2ecf20Sopenharmony_ci */ 3458c2ecf20Sopenharmony_ci event->hw.idx = idx; 3468c2ecf20Sopenharmony_ci armpmu->disable(event); 3478c2ecf20Sopenharmony_ci hw_events->events[idx] = event; 3488c2ecf20Sopenharmony_ci 3498c2ecf20Sopenharmony_ci hwc->state = PERF_HES_STOPPED | PERF_HES_UPTODATE; 3508c2ecf20Sopenharmony_ci if (flags & PERF_EF_START) 3518c2ecf20Sopenharmony_ci armpmu_start(event, PERF_EF_RELOAD); 3528c2ecf20Sopenharmony_ci 3538c2ecf20Sopenharmony_ci /* Propagate our changes to the userspace mapping. */ 3548c2ecf20Sopenharmony_ci perf_event_update_userpage(event); 3558c2ecf20Sopenharmony_ci 3568c2ecf20Sopenharmony_ci return 0; 3578c2ecf20Sopenharmony_ci} 3588c2ecf20Sopenharmony_ci 3598c2ecf20Sopenharmony_cistatic int 3608c2ecf20Sopenharmony_civalidate_event(struct pmu *pmu, struct pmu_hw_events *hw_events, 3618c2ecf20Sopenharmony_ci struct perf_event *event) 3628c2ecf20Sopenharmony_ci{ 3638c2ecf20Sopenharmony_ci struct arm_pmu *armpmu; 3648c2ecf20Sopenharmony_ci 3658c2ecf20Sopenharmony_ci if (is_software_event(event)) 3668c2ecf20Sopenharmony_ci return 1; 3678c2ecf20Sopenharmony_ci 3688c2ecf20Sopenharmony_ci /* 3698c2ecf20Sopenharmony_ci * Reject groups spanning multiple HW PMUs (e.g. CPU + CCI). The 3708c2ecf20Sopenharmony_ci * core perf code won't check that the pmu->ctx == leader->ctx 3718c2ecf20Sopenharmony_ci * until after pmu->event_init(event). 3728c2ecf20Sopenharmony_ci */ 3738c2ecf20Sopenharmony_ci if (event->pmu != pmu) 3748c2ecf20Sopenharmony_ci return 0; 3758c2ecf20Sopenharmony_ci 3768c2ecf20Sopenharmony_ci if (event->state < PERF_EVENT_STATE_OFF) 3778c2ecf20Sopenharmony_ci return 1; 3788c2ecf20Sopenharmony_ci 3798c2ecf20Sopenharmony_ci if (event->state == PERF_EVENT_STATE_OFF && !event->attr.enable_on_exec) 3808c2ecf20Sopenharmony_ci return 1; 3818c2ecf20Sopenharmony_ci 3828c2ecf20Sopenharmony_ci armpmu = to_arm_pmu(event->pmu); 3838c2ecf20Sopenharmony_ci return armpmu->get_event_idx(hw_events, event) >= 0; 3848c2ecf20Sopenharmony_ci} 3858c2ecf20Sopenharmony_ci 3868c2ecf20Sopenharmony_cistatic int 3878c2ecf20Sopenharmony_civalidate_group(struct perf_event *event) 3888c2ecf20Sopenharmony_ci{ 3898c2ecf20Sopenharmony_ci struct perf_event *sibling, *leader = event->group_leader; 3908c2ecf20Sopenharmony_ci struct pmu_hw_events fake_pmu; 3918c2ecf20Sopenharmony_ci 3928c2ecf20Sopenharmony_ci /* 3938c2ecf20Sopenharmony_ci * Initialise the fake PMU. We only need to populate the 3948c2ecf20Sopenharmony_ci * used_mask for the purposes of validation. 3958c2ecf20Sopenharmony_ci */ 3968c2ecf20Sopenharmony_ci memset(&fake_pmu.used_mask, 0, sizeof(fake_pmu.used_mask)); 3978c2ecf20Sopenharmony_ci 3988c2ecf20Sopenharmony_ci if (!validate_event(event->pmu, &fake_pmu, leader)) 3998c2ecf20Sopenharmony_ci return -EINVAL; 4008c2ecf20Sopenharmony_ci 4018c2ecf20Sopenharmony_ci if (event == leader) 4028c2ecf20Sopenharmony_ci return 0; 4038c2ecf20Sopenharmony_ci 4048c2ecf20Sopenharmony_ci for_each_sibling_event(sibling, leader) { 4058c2ecf20Sopenharmony_ci if (!validate_event(event->pmu, &fake_pmu, sibling)) 4068c2ecf20Sopenharmony_ci return -EINVAL; 4078c2ecf20Sopenharmony_ci } 4088c2ecf20Sopenharmony_ci 4098c2ecf20Sopenharmony_ci if (!validate_event(event->pmu, &fake_pmu, event)) 4108c2ecf20Sopenharmony_ci return -EINVAL; 4118c2ecf20Sopenharmony_ci 4128c2ecf20Sopenharmony_ci return 0; 4138c2ecf20Sopenharmony_ci} 4148c2ecf20Sopenharmony_ci 4158c2ecf20Sopenharmony_cistatic irqreturn_t armpmu_dispatch_irq(int irq, void *dev) 4168c2ecf20Sopenharmony_ci{ 4178c2ecf20Sopenharmony_ci struct arm_pmu *armpmu; 4188c2ecf20Sopenharmony_ci int ret; 4198c2ecf20Sopenharmony_ci u64 start_clock, finish_clock; 4208c2ecf20Sopenharmony_ci 4218c2ecf20Sopenharmony_ci /* 4228c2ecf20Sopenharmony_ci * we request the IRQ with a (possibly percpu) struct arm_pmu**, but 4238c2ecf20Sopenharmony_ci * the handlers expect a struct arm_pmu*. The percpu_irq framework will 4248c2ecf20Sopenharmony_ci * do any necessary shifting, we just need to perform the first 4258c2ecf20Sopenharmony_ci * dereference. 4268c2ecf20Sopenharmony_ci */ 4278c2ecf20Sopenharmony_ci armpmu = *(void **)dev; 4288c2ecf20Sopenharmony_ci if (WARN_ON_ONCE(!armpmu)) 4298c2ecf20Sopenharmony_ci return IRQ_NONE; 4308c2ecf20Sopenharmony_ci 4318c2ecf20Sopenharmony_ci start_clock = sched_clock(); 4328c2ecf20Sopenharmony_ci ret = armpmu->handle_irq(armpmu); 4338c2ecf20Sopenharmony_ci finish_clock = sched_clock(); 4348c2ecf20Sopenharmony_ci 4358c2ecf20Sopenharmony_ci perf_sample_event_took(finish_clock - start_clock); 4368c2ecf20Sopenharmony_ci return ret; 4378c2ecf20Sopenharmony_ci} 4388c2ecf20Sopenharmony_ci 4398c2ecf20Sopenharmony_cistatic int 4408c2ecf20Sopenharmony_ci__hw_perf_event_init(struct perf_event *event) 4418c2ecf20Sopenharmony_ci{ 4428c2ecf20Sopenharmony_ci struct arm_pmu *armpmu = to_arm_pmu(event->pmu); 4438c2ecf20Sopenharmony_ci struct hw_perf_event *hwc = &event->hw; 4448c2ecf20Sopenharmony_ci int mapping; 4458c2ecf20Sopenharmony_ci 4468c2ecf20Sopenharmony_ci hwc->flags = 0; 4478c2ecf20Sopenharmony_ci mapping = armpmu->map_event(event); 4488c2ecf20Sopenharmony_ci 4498c2ecf20Sopenharmony_ci if (mapping < 0) { 4508c2ecf20Sopenharmony_ci pr_debug("event %x:%llx not supported\n", event->attr.type, 4518c2ecf20Sopenharmony_ci event->attr.config); 4528c2ecf20Sopenharmony_ci return mapping; 4538c2ecf20Sopenharmony_ci } 4548c2ecf20Sopenharmony_ci 4558c2ecf20Sopenharmony_ci /* 4568c2ecf20Sopenharmony_ci * We don't assign an index until we actually place the event onto 4578c2ecf20Sopenharmony_ci * hardware. Use -1 to signify that we haven't decided where to put it 4588c2ecf20Sopenharmony_ci * yet. For SMP systems, each core has it's own PMU so we can't do any 4598c2ecf20Sopenharmony_ci * clever allocation or constraints checking at this point. 4608c2ecf20Sopenharmony_ci */ 4618c2ecf20Sopenharmony_ci hwc->idx = -1; 4628c2ecf20Sopenharmony_ci hwc->config_base = 0; 4638c2ecf20Sopenharmony_ci hwc->config = 0; 4648c2ecf20Sopenharmony_ci hwc->event_base = 0; 4658c2ecf20Sopenharmony_ci 4668c2ecf20Sopenharmony_ci /* 4678c2ecf20Sopenharmony_ci * Check whether we need to exclude the counter from certain modes. 4688c2ecf20Sopenharmony_ci */ 4698c2ecf20Sopenharmony_ci if (armpmu->set_event_filter && 4708c2ecf20Sopenharmony_ci armpmu->set_event_filter(hwc, &event->attr)) { 4718c2ecf20Sopenharmony_ci pr_debug("ARM performance counters do not support " 4728c2ecf20Sopenharmony_ci "mode exclusion\n"); 4738c2ecf20Sopenharmony_ci return -EOPNOTSUPP; 4748c2ecf20Sopenharmony_ci } 4758c2ecf20Sopenharmony_ci 4768c2ecf20Sopenharmony_ci /* 4778c2ecf20Sopenharmony_ci * Store the event encoding into the config_base field. 4788c2ecf20Sopenharmony_ci */ 4798c2ecf20Sopenharmony_ci hwc->config_base |= (unsigned long)mapping; 4808c2ecf20Sopenharmony_ci 4818c2ecf20Sopenharmony_ci if (!is_sampling_event(event)) { 4828c2ecf20Sopenharmony_ci /* 4838c2ecf20Sopenharmony_ci * For non-sampling runs, limit the sample_period to half 4848c2ecf20Sopenharmony_ci * of the counter width. That way, the new counter value 4858c2ecf20Sopenharmony_ci * is far less likely to overtake the previous one unless 4868c2ecf20Sopenharmony_ci * you have some serious IRQ latency issues. 4878c2ecf20Sopenharmony_ci */ 4888c2ecf20Sopenharmony_ci hwc->sample_period = arm_pmu_event_max_period(event) >> 1; 4898c2ecf20Sopenharmony_ci hwc->last_period = hwc->sample_period; 4908c2ecf20Sopenharmony_ci local64_set(&hwc->period_left, hwc->sample_period); 4918c2ecf20Sopenharmony_ci } 4928c2ecf20Sopenharmony_ci 4938c2ecf20Sopenharmony_ci return validate_group(event); 4948c2ecf20Sopenharmony_ci} 4958c2ecf20Sopenharmony_ci 4968c2ecf20Sopenharmony_cistatic int armpmu_event_init(struct perf_event *event) 4978c2ecf20Sopenharmony_ci{ 4988c2ecf20Sopenharmony_ci struct arm_pmu *armpmu = to_arm_pmu(event->pmu); 4998c2ecf20Sopenharmony_ci 5008c2ecf20Sopenharmony_ci /* 5018c2ecf20Sopenharmony_ci * Reject CPU-affine events for CPUs that are of a different class to 5028c2ecf20Sopenharmony_ci * that which this PMU handles. Process-following events (where 5038c2ecf20Sopenharmony_ci * event->cpu == -1) can be migrated between CPUs, and thus we have to 5048c2ecf20Sopenharmony_ci * reject them later (in armpmu_add) if they're scheduled on a 5058c2ecf20Sopenharmony_ci * different class of CPU. 5068c2ecf20Sopenharmony_ci */ 5078c2ecf20Sopenharmony_ci if (event->cpu != -1 && 5088c2ecf20Sopenharmony_ci !cpumask_test_cpu(event->cpu, &armpmu->supported_cpus)) 5098c2ecf20Sopenharmony_ci return -ENOENT; 5108c2ecf20Sopenharmony_ci 5118c2ecf20Sopenharmony_ci /* does not support taken branch sampling */ 5128c2ecf20Sopenharmony_ci if (has_branch_stack(event)) 5138c2ecf20Sopenharmony_ci return -EOPNOTSUPP; 5148c2ecf20Sopenharmony_ci 5158c2ecf20Sopenharmony_ci if (armpmu->map_event(event) == -ENOENT) 5168c2ecf20Sopenharmony_ci return -ENOENT; 5178c2ecf20Sopenharmony_ci 5188c2ecf20Sopenharmony_ci return __hw_perf_event_init(event); 5198c2ecf20Sopenharmony_ci} 5208c2ecf20Sopenharmony_ci 5218c2ecf20Sopenharmony_cistatic void armpmu_enable(struct pmu *pmu) 5228c2ecf20Sopenharmony_ci{ 5238c2ecf20Sopenharmony_ci struct arm_pmu *armpmu = to_arm_pmu(pmu); 5248c2ecf20Sopenharmony_ci struct pmu_hw_events *hw_events = this_cpu_ptr(armpmu->hw_events); 5258c2ecf20Sopenharmony_ci int enabled = bitmap_weight(hw_events->used_mask, armpmu->num_events); 5268c2ecf20Sopenharmony_ci 5278c2ecf20Sopenharmony_ci /* For task-bound events we may be called on other CPUs */ 5288c2ecf20Sopenharmony_ci if (!cpumask_test_cpu(smp_processor_id(), &armpmu->supported_cpus)) 5298c2ecf20Sopenharmony_ci return; 5308c2ecf20Sopenharmony_ci 5318c2ecf20Sopenharmony_ci if (enabled) 5328c2ecf20Sopenharmony_ci armpmu->start(armpmu); 5338c2ecf20Sopenharmony_ci} 5348c2ecf20Sopenharmony_ci 5358c2ecf20Sopenharmony_cistatic void armpmu_disable(struct pmu *pmu) 5368c2ecf20Sopenharmony_ci{ 5378c2ecf20Sopenharmony_ci struct arm_pmu *armpmu = to_arm_pmu(pmu); 5388c2ecf20Sopenharmony_ci 5398c2ecf20Sopenharmony_ci /* For task-bound events we may be called on other CPUs */ 5408c2ecf20Sopenharmony_ci if (!cpumask_test_cpu(smp_processor_id(), &armpmu->supported_cpus)) 5418c2ecf20Sopenharmony_ci return; 5428c2ecf20Sopenharmony_ci 5438c2ecf20Sopenharmony_ci armpmu->stop(armpmu); 5448c2ecf20Sopenharmony_ci} 5458c2ecf20Sopenharmony_ci 5468c2ecf20Sopenharmony_ci/* 5478c2ecf20Sopenharmony_ci * In heterogeneous systems, events are specific to a particular 5488c2ecf20Sopenharmony_ci * microarchitecture, and aren't suitable for another. Thus, only match CPUs of 5498c2ecf20Sopenharmony_ci * the same microarchitecture. 5508c2ecf20Sopenharmony_ci */ 5518c2ecf20Sopenharmony_cistatic int armpmu_filter_match(struct perf_event *event) 5528c2ecf20Sopenharmony_ci{ 5538c2ecf20Sopenharmony_ci struct arm_pmu *armpmu = to_arm_pmu(event->pmu); 5548c2ecf20Sopenharmony_ci unsigned int cpu = smp_processor_id(); 5558c2ecf20Sopenharmony_ci int ret; 5568c2ecf20Sopenharmony_ci 5578c2ecf20Sopenharmony_ci ret = cpumask_test_cpu(cpu, &armpmu->supported_cpus); 5588c2ecf20Sopenharmony_ci if (ret && armpmu->filter_match) 5598c2ecf20Sopenharmony_ci return armpmu->filter_match(event); 5608c2ecf20Sopenharmony_ci 5618c2ecf20Sopenharmony_ci return ret; 5628c2ecf20Sopenharmony_ci} 5638c2ecf20Sopenharmony_ci 5648c2ecf20Sopenharmony_cistatic ssize_t armpmu_cpumask_show(struct device *dev, 5658c2ecf20Sopenharmony_ci struct device_attribute *attr, char *buf) 5668c2ecf20Sopenharmony_ci{ 5678c2ecf20Sopenharmony_ci struct arm_pmu *armpmu = to_arm_pmu(dev_get_drvdata(dev)); 5688c2ecf20Sopenharmony_ci return cpumap_print_to_pagebuf(true, buf, &armpmu->supported_cpus); 5698c2ecf20Sopenharmony_ci} 5708c2ecf20Sopenharmony_ci 5718c2ecf20Sopenharmony_cistatic DEVICE_ATTR(cpus, S_IRUGO, armpmu_cpumask_show, NULL); 5728c2ecf20Sopenharmony_ci 5738c2ecf20Sopenharmony_cistatic struct attribute *armpmu_common_attrs[] = { 5748c2ecf20Sopenharmony_ci &dev_attr_cpus.attr, 5758c2ecf20Sopenharmony_ci NULL, 5768c2ecf20Sopenharmony_ci}; 5778c2ecf20Sopenharmony_ci 5788c2ecf20Sopenharmony_cistatic struct attribute_group armpmu_common_attr_group = { 5798c2ecf20Sopenharmony_ci .attrs = armpmu_common_attrs, 5808c2ecf20Sopenharmony_ci}; 5818c2ecf20Sopenharmony_ci 5828c2ecf20Sopenharmony_ci/* Set at runtime when we know what CPU type we are. */ 5838c2ecf20Sopenharmony_cistatic struct arm_pmu *__oprofile_cpu_pmu; 5848c2ecf20Sopenharmony_ci 5858c2ecf20Sopenharmony_ci/* 5868c2ecf20Sopenharmony_ci * Despite the names, these two functions are CPU-specific and are used 5878c2ecf20Sopenharmony_ci * by the OProfile/perf code. 5888c2ecf20Sopenharmony_ci */ 5898c2ecf20Sopenharmony_ciconst char *perf_pmu_name(void) 5908c2ecf20Sopenharmony_ci{ 5918c2ecf20Sopenharmony_ci if (!__oprofile_cpu_pmu) 5928c2ecf20Sopenharmony_ci return NULL; 5938c2ecf20Sopenharmony_ci 5948c2ecf20Sopenharmony_ci return __oprofile_cpu_pmu->name; 5958c2ecf20Sopenharmony_ci} 5968c2ecf20Sopenharmony_ciEXPORT_SYMBOL_GPL(perf_pmu_name); 5978c2ecf20Sopenharmony_ci 5988c2ecf20Sopenharmony_ciint perf_num_counters(void) 5998c2ecf20Sopenharmony_ci{ 6008c2ecf20Sopenharmony_ci int max_events = 0; 6018c2ecf20Sopenharmony_ci 6028c2ecf20Sopenharmony_ci if (__oprofile_cpu_pmu != NULL) 6038c2ecf20Sopenharmony_ci max_events = __oprofile_cpu_pmu->num_events; 6048c2ecf20Sopenharmony_ci 6058c2ecf20Sopenharmony_ci return max_events; 6068c2ecf20Sopenharmony_ci} 6078c2ecf20Sopenharmony_ciEXPORT_SYMBOL_GPL(perf_num_counters); 6088c2ecf20Sopenharmony_ci 6098c2ecf20Sopenharmony_cistatic int armpmu_count_irq_users(const int irq) 6108c2ecf20Sopenharmony_ci{ 6118c2ecf20Sopenharmony_ci int cpu, count = 0; 6128c2ecf20Sopenharmony_ci 6138c2ecf20Sopenharmony_ci for_each_possible_cpu(cpu) { 6148c2ecf20Sopenharmony_ci if (per_cpu(cpu_irq, cpu) == irq) 6158c2ecf20Sopenharmony_ci count++; 6168c2ecf20Sopenharmony_ci } 6178c2ecf20Sopenharmony_ci 6188c2ecf20Sopenharmony_ci return count; 6198c2ecf20Sopenharmony_ci} 6208c2ecf20Sopenharmony_ci 6218c2ecf20Sopenharmony_cistatic const struct pmu_irq_ops *armpmu_find_irq_ops(int irq) 6228c2ecf20Sopenharmony_ci{ 6238c2ecf20Sopenharmony_ci const struct pmu_irq_ops *ops = NULL; 6248c2ecf20Sopenharmony_ci int cpu; 6258c2ecf20Sopenharmony_ci 6268c2ecf20Sopenharmony_ci for_each_possible_cpu(cpu) { 6278c2ecf20Sopenharmony_ci if (per_cpu(cpu_irq, cpu) != irq) 6288c2ecf20Sopenharmony_ci continue; 6298c2ecf20Sopenharmony_ci 6308c2ecf20Sopenharmony_ci ops = per_cpu(cpu_irq_ops, cpu); 6318c2ecf20Sopenharmony_ci if (ops) 6328c2ecf20Sopenharmony_ci break; 6338c2ecf20Sopenharmony_ci } 6348c2ecf20Sopenharmony_ci 6358c2ecf20Sopenharmony_ci return ops; 6368c2ecf20Sopenharmony_ci} 6378c2ecf20Sopenharmony_ci 6388c2ecf20Sopenharmony_civoid armpmu_free_irq(int irq, int cpu) 6398c2ecf20Sopenharmony_ci{ 6408c2ecf20Sopenharmony_ci if (per_cpu(cpu_irq, cpu) == 0) 6418c2ecf20Sopenharmony_ci return; 6428c2ecf20Sopenharmony_ci if (WARN_ON(irq != per_cpu(cpu_irq, cpu))) 6438c2ecf20Sopenharmony_ci return; 6448c2ecf20Sopenharmony_ci 6458c2ecf20Sopenharmony_ci per_cpu(cpu_irq_ops, cpu)->free_pmuirq(irq, cpu, &cpu_armpmu); 6468c2ecf20Sopenharmony_ci 6478c2ecf20Sopenharmony_ci per_cpu(cpu_irq, cpu) = 0; 6488c2ecf20Sopenharmony_ci per_cpu(cpu_irq_ops, cpu) = NULL; 6498c2ecf20Sopenharmony_ci} 6508c2ecf20Sopenharmony_ci 6518c2ecf20Sopenharmony_ciint armpmu_request_irq(int irq, int cpu) 6528c2ecf20Sopenharmony_ci{ 6538c2ecf20Sopenharmony_ci int err = 0; 6548c2ecf20Sopenharmony_ci const irq_handler_t handler = armpmu_dispatch_irq; 6558c2ecf20Sopenharmony_ci const struct pmu_irq_ops *irq_ops; 6568c2ecf20Sopenharmony_ci 6578c2ecf20Sopenharmony_ci if (!irq) 6588c2ecf20Sopenharmony_ci return 0; 6598c2ecf20Sopenharmony_ci 6608c2ecf20Sopenharmony_ci if (!irq_is_percpu_devid(irq)) { 6618c2ecf20Sopenharmony_ci unsigned long irq_flags; 6628c2ecf20Sopenharmony_ci 6638c2ecf20Sopenharmony_ci err = irq_force_affinity(irq, cpumask_of(cpu)); 6648c2ecf20Sopenharmony_ci 6658c2ecf20Sopenharmony_ci if (err && num_possible_cpus() > 1) { 6668c2ecf20Sopenharmony_ci pr_warn("unable to set irq affinity (irq=%d, cpu=%u)\n", 6678c2ecf20Sopenharmony_ci irq, cpu); 6688c2ecf20Sopenharmony_ci goto err_out; 6698c2ecf20Sopenharmony_ci } 6708c2ecf20Sopenharmony_ci 6718c2ecf20Sopenharmony_ci irq_flags = IRQF_PERCPU | 6728c2ecf20Sopenharmony_ci IRQF_NOBALANCING | 6738c2ecf20Sopenharmony_ci IRQF_NO_THREAD; 6748c2ecf20Sopenharmony_ci 6758c2ecf20Sopenharmony_ci irq_set_status_flags(irq, IRQ_NOAUTOEN); 6768c2ecf20Sopenharmony_ci 6778c2ecf20Sopenharmony_ci err = request_nmi(irq, handler, irq_flags, "arm-pmu", 6788c2ecf20Sopenharmony_ci per_cpu_ptr(&cpu_armpmu, cpu)); 6798c2ecf20Sopenharmony_ci 6808c2ecf20Sopenharmony_ci /* If cannot get an NMI, get a normal interrupt */ 6818c2ecf20Sopenharmony_ci if (err) { 6828c2ecf20Sopenharmony_ci err = request_irq(irq, handler, irq_flags, "arm-pmu", 6838c2ecf20Sopenharmony_ci per_cpu_ptr(&cpu_armpmu, cpu)); 6848c2ecf20Sopenharmony_ci irq_ops = &pmuirq_ops; 6858c2ecf20Sopenharmony_ci } else { 6868c2ecf20Sopenharmony_ci has_nmi = true; 6878c2ecf20Sopenharmony_ci irq_ops = &pmunmi_ops; 6888c2ecf20Sopenharmony_ci } 6898c2ecf20Sopenharmony_ci } else if (armpmu_count_irq_users(irq) == 0) { 6908c2ecf20Sopenharmony_ci err = request_percpu_nmi(irq, handler, "arm-pmu", &cpu_armpmu); 6918c2ecf20Sopenharmony_ci 6928c2ecf20Sopenharmony_ci /* If cannot get an NMI, get a normal interrupt */ 6938c2ecf20Sopenharmony_ci if (err) { 6948c2ecf20Sopenharmony_ci err = request_percpu_irq(irq, handler, "arm-pmu", 6958c2ecf20Sopenharmony_ci &cpu_armpmu); 6968c2ecf20Sopenharmony_ci irq_ops = &percpu_pmuirq_ops; 6978c2ecf20Sopenharmony_ci } else { 6988c2ecf20Sopenharmony_ci has_nmi= true; 6998c2ecf20Sopenharmony_ci irq_ops = &percpu_pmunmi_ops; 7008c2ecf20Sopenharmony_ci } 7018c2ecf20Sopenharmony_ci } else { 7028c2ecf20Sopenharmony_ci /* Per cpudevid irq was already requested by another CPU */ 7038c2ecf20Sopenharmony_ci irq_ops = armpmu_find_irq_ops(irq); 7048c2ecf20Sopenharmony_ci 7058c2ecf20Sopenharmony_ci if (WARN_ON(!irq_ops)) 7068c2ecf20Sopenharmony_ci err = -EINVAL; 7078c2ecf20Sopenharmony_ci } 7088c2ecf20Sopenharmony_ci 7098c2ecf20Sopenharmony_ci if (err) 7108c2ecf20Sopenharmony_ci goto err_out; 7118c2ecf20Sopenharmony_ci 7128c2ecf20Sopenharmony_ci per_cpu(cpu_irq, cpu) = irq; 7138c2ecf20Sopenharmony_ci per_cpu(cpu_irq_ops, cpu) = irq_ops; 7148c2ecf20Sopenharmony_ci return 0; 7158c2ecf20Sopenharmony_ci 7168c2ecf20Sopenharmony_cierr_out: 7178c2ecf20Sopenharmony_ci pr_err("unable to request IRQ%d for ARM PMU counters\n", irq); 7188c2ecf20Sopenharmony_ci return err; 7198c2ecf20Sopenharmony_ci} 7208c2ecf20Sopenharmony_ci 7218c2ecf20Sopenharmony_cistatic int armpmu_get_cpu_irq(struct arm_pmu *pmu, int cpu) 7228c2ecf20Sopenharmony_ci{ 7238c2ecf20Sopenharmony_ci struct pmu_hw_events __percpu *hw_events = pmu->hw_events; 7248c2ecf20Sopenharmony_ci return per_cpu(hw_events->irq, cpu); 7258c2ecf20Sopenharmony_ci} 7268c2ecf20Sopenharmony_ci 7278c2ecf20Sopenharmony_ci/* 7288c2ecf20Sopenharmony_ci * PMU hardware loses all context when a CPU goes offline. 7298c2ecf20Sopenharmony_ci * When a CPU is hotplugged back in, since some hardware registers are 7308c2ecf20Sopenharmony_ci * UNKNOWN at reset, the PMU must be explicitly reset to avoid reading 7318c2ecf20Sopenharmony_ci * junk values out of them. 7328c2ecf20Sopenharmony_ci */ 7338c2ecf20Sopenharmony_cistatic int arm_perf_starting_cpu(unsigned int cpu, struct hlist_node *node) 7348c2ecf20Sopenharmony_ci{ 7358c2ecf20Sopenharmony_ci struct arm_pmu *pmu = hlist_entry_safe(node, struct arm_pmu, node); 7368c2ecf20Sopenharmony_ci int irq; 7378c2ecf20Sopenharmony_ci 7388c2ecf20Sopenharmony_ci if (!cpumask_test_cpu(cpu, &pmu->supported_cpus)) 7398c2ecf20Sopenharmony_ci return 0; 7408c2ecf20Sopenharmony_ci if (pmu->reset) 7418c2ecf20Sopenharmony_ci pmu->reset(pmu); 7428c2ecf20Sopenharmony_ci 7438c2ecf20Sopenharmony_ci per_cpu(cpu_armpmu, cpu) = pmu; 7448c2ecf20Sopenharmony_ci 7458c2ecf20Sopenharmony_ci irq = armpmu_get_cpu_irq(pmu, cpu); 7468c2ecf20Sopenharmony_ci if (irq) 7478c2ecf20Sopenharmony_ci per_cpu(cpu_irq_ops, cpu)->enable_pmuirq(irq); 7488c2ecf20Sopenharmony_ci 7498c2ecf20Sopenharmony_ci return 0; 7508c2ecf20Sopenharmony_ci} 7518c2ecf20Sopenharmony_ci 7528c2ecf20Sopenharmony_cistatic int arm_perf_teardown_cpu(unsigned int cpu, struct hlist_node *node) 7538c2ecf20Sopenharmony_ci{ 7548c2ecf20Sopenharmony_ci struct arm_pmu *pmu = hlist_entry_safe(node, struct arm_pmu, node); 7558c2ecf20Sopenharmony_ci int irq; 7568c2ecf20Sopenharmony_ci 7578c2ecf20Sopenharmony_ci if (!cpumask_test_cpu(cpu, &pmu->supported_cpus)) 7588c2ecf20Sopenharmony_ci return 0; 7598c2ecf20Sopenharmony_ci 7608c2ecf20Sopenharmony_ci irq = armpmu_get_cpu_irq(pmu, cpu); 7618c2ecf20Sopenharmony_ci if (irq) 7628c2ecf20Sopenharmony_ci per_cpu(cpu_irq_ops, cpu)->disable_pmuirq(irq); 7638c2ecf20Sopenharmony_ci 7648c2ecf20Sopenharmony_ci per_cpu(cpu_armpmu, cpu) = NULL; 7658c2ecf20Sopenharmony_ci 7668c2ecf20Sopenharmony_ci return 0; 7678c2ecf20Sopenharmony_ci} 7688c2ecf20Sopenharmony_ci 7698c2ecf20Sopenharmony_ci#ifdef CONFIG_CPU_PM 7708c2ecf20Sopenharmony_cistatic void cpu_pm_pmu_setup(struct arm_pmu *armpmu, unsigned long cmd) 7718c2ecf20Sopenharmony_ci{ 7728c2ecf20Sopenharmony_ci struct pmu_hw_events *hw_events = this_cpu_ptr(armpmu->hw_events); 7738c2ecf20Sopenharmony_ci struct perf_event *event; 7748c2ecf20Sopenharmony_ci int idx; 7758c2ecf20Sopenharmony_ci 7768c2ecf20Sopenharmony_ci for (idx = 0; idx < armpmu->num_events; idx++) { 7778c2ecf20Sopenharmony_ci event = hw_events->events[idx]; 7788c2ecf20Sopenharmony_ci if (!event) 7798c2ecf20Sopenharmony_ci continue; 7808c2ecf20Sopenharmony_ci 7818c2ecf20Sopenharmony_ci switch (cmd) { 7828c2ecf20Sopenharmony_ci case CPU_PM_ENTER: 7838c2ecf20Sopenharmony_ci /* 7848c2ecf20Sopenharmony_ci * Stop and update the counter 7858c2ecf20Sopenharmony_ci */ 7868c2ecf20Sopenharmony_ci armpmu_stop(event, PERF_EF_UPDATE); 7878c2ecf20Sopenharmony_ci break; 7888c2ecf20Sopenharmony_ci case CPU_PM_EXIT: 7898c2ecf20Sopenharmony_ci case CPU_PM_ENTER_FAILED: 7908c2ecf20Sopenharmony_ci /* 7918c2ecf20Sopenharmony_ci * Restore and enable the counter. 7928c2ecf20Sopenharmony_ci * armpmu_start() indirectly calls 7938c2ecf20Sopenharmony_ci * 7948c2ecf20Sopenharmony_ci * perf_event_update_userpage() 7958c2ecf20Sopenharmony_ci * 7968c2ecf20Sopenharmony_ci * that requires RCU read locking to be functional, 7978c2ecf20Sopenharmony_ci * wrap the call within RCU_NONIDLE to make the 7988c2ecf20Sopenharmony_ci * RCU subsystem aware this cpu is not idle from 7998c2ecf20Sopenharmony_ci * an RCU perspective for the armpmu_start() call 8008c2ecf20Sopenharmony_ci * duration. 8018c2ecf20Sopenharmony_ci */ 8028c2ecf20Sopenharmony_ci RCU_NONIDLE(armpmu_start(event, PERF_EF_RELOAD)); 8038c2ecf20Sopenharmony_ci break; 8048c2ecf20Sopenharmony_ci default: 8058c2ecf20Sopenharmony_ci break; 8068c2ecf20Sopenharmony_ci } 8078c2ecf20Sopenharmony_ci } 8088c2ecf20Sopenharmony_ci} 8098c2ecf20Sopenharmony_ci 8108c2ecf20Sopenharmony_cistatic int cpu_pm_pmu_notify(struct notifier_block *b, unsigned long cmd, 8118c2ecf20Sopenharmony_ci void *v) 8128c2ecf20Sopenharmony_ci{ 8138c2ecf20Sopenharmony_ci struct arm_pmu *armpmu = container_of(b, struct arm_pmu, cpu_pm_nb); 8148c2ecf20Sopenharmony_ci struct pmu_hw_events *hw_events = this_cpu_ptr(armpmu->hw_events); 8158c2ecf20Sopenharmony_ci int enabled = bitmap_weight(hw_events->used_mask, armpmu->num_events); 8168c2ecf20Sopenharmony_ci 8178c2ecf20Sopenharmony_ci if (!cpumask_test_cpu(smp_processor_id(), &armpmu->supported_cpus)) 8188c2ecf20Sopenharmony_ci return NOTIFY_DONE; 8198c2ecf20Sopenharmony_ci 8208c2ecf20Sopenharmony_ci /* 8218c2ecf20Sopenharmony_ci * Always reset the PMU registers on power-up even if 8228c2ecf20Sopenharmony_ci * there are no events running. 8238c2ecf20Sopenharmony_ci */ 8248c2ecf20Sopenharmony_ci if (cmd == CPU_PM_EXIT && armpmu->reset) 8258c2ecf20Sopenharmony_ci armpmu->reset(armpmu); 8268c2ecf20Sopenharmony_ci 8278c2ecf20Sopenharmony_ci if (!enabled) 8288c2ecf20Sopenharmony_ci return NOTIFY_OK; 8298c2ecf20Sopenharmony_ci 8308c2ecf20Sopenharmony_ci switch (cmd) { 8318c2ecf20Sopenharmony_ci case CPU_PM_ENTER: 8328c2ecf20Sopenharmony_ci armpmu->stop(armpmu); 8338c2ecf20Sopenharmony_ci cpu_pm_pmu_setup(armpmu, cmd); 8348c2ecf20Sopenharmony_ci break; 8358c2ecf20Sopenharmony_ci case CPU_PM_EXIT: 8368c2ecf20Sopenharmony_ci case CPU_PM_ENTER_FAILED: 8378c2ecf20Sopenharmony_ci cpu_pm_pmu_setup(armpmu, cmd); 8388c2ecf20Sopenharmony_ci armpmu->start(armpmu); 8398c2ecf20Sopenharmony_ci break; 8408c2ecf20Sopenharmony_ci default: 8418c2ecf20Sopenharmony_ci return NOTIFY_DONE; 8428c2ecf20Sopenharmony_ci } 8438c2ecf20Sopenharmony_ci 8448c2ecf20Sopenharmony_ci return NOTIFY_OK; 8458c2ecf20Sopenharmony_ci} 8468c2ecf20Sopenharmony_ci 8478c2ecf20Sopenharmony_cistatic int cpu_pm_pmu_register(struct arm_pmu *cpu_pmu) 8488c2ecf20Sopenharmony_ci{ 8498c2ecf20Sopenharmony_ci cpu_pmu->cpu_pm_nb.notifier_call = cpu_pm_pmu_notify; 8508c2ecf20Sopenharmony_ci return cpu_pm_register_notifier(&cpu_pmu->cpu_pm_nb); 8518c2ecf20Sopenharmony_ci} 8528c2ecf20Sopenharmony_ci 8538c2ecf20Sopenharmony_cistatic void cpu_pm_pmu_unregister(struct arm_pmu *cpu_pmu) 8548c2ecf20Sopenharmony_ci{ 8558c2ecf20Sopenharmony_ci cpu_pm_unregister_notifier(&cpu_pmu->cpu_pm_nb); 8568c2ecf20Sopenharmony_ci} 8578c2ecf20Sopenharmony_ci#else 8588c2ecf20Sopenharmony_cistatic inline int cpu_pm_pmu_register(struct arm_pmu *cpu_pmu) { return 0; } 8598c2ecf20Sopenharmony_cistatic inline void cpu_pm_pmu_unregister(struct arm_pmu *cpu_pmu) { } 8608c2ecf20Sopenharmony_ci#endif 8618c2ecf20Sopenharmony_ci 8628c2ecf20Sopenharmony_cistatic int cpu_pmu_init(struct arm_pmu *cpu_pmu) 8638c2ecf20Sopenharmony_ci{ 8648c2ecf20Sopenharmony_ci int err; 8658c2ecf20Sopenharmony_ci 8668c2ecf20Sopenharmony_ci err = cpuhp_state_add_instance(CPUHP_AP_PERF_ARM_STARTING, 8678c2ecf20Sopenharmony_ci &cpu_pmu->node); 8688c2ecf20Sopenharmony_ci if (err) 8698c2ecf20Sopenharmony_ci goto out; 8708c2ecf20Sopenharmony_ci 8718c2ecf20Sopenharmony_ci err = cpu_pm_pmu_register(cpu_pmu); 8728c2ecf20Sopenharmony_ci if (err) 8738c2ecf20Sopenharmony_ci goto out_unregister; 8748c2ecf20Sopenharmony_ci 8758c2ecf20Sopenharmony_ci return 0; 8768c2ecf20Sopenharmony_ci 8778c2ecf20Sopenharmony_ciout_unregister: 8788c2ecf20Sopenharmony_ci cpuhp_state_remove_instance_nocalls(CPUHP_AP_PERF_ARM_STARTING, 8798c2ecf20Sopenharmony_ci &cpu_pmu->node); 8808c2ecf20Sopenharmony_ciout: 8818c2ecf20Sopenharmony_ci return err; 8828c2ecf20Sopenharmony_ci} 8838c2ecf20Sopenharmony_ci 8848c2ecf20Sopenharmony_cistatic void cpu_pmu_destroy(struct arm_pmu *cpu_pmu) 8858c2ecf20Sopenharmony_ci{ 8868c2ecf20Sopenharmony_ci cpu_pm_pmu_unregister(cpu_pmu); 8878c2ecf20Sopenharmony_ci cpuhp_state_remove_instance_nocalls(CPUHP_AP_PERF_ARM_STARTING, 8888c2ecf20Sopenharmony_ci &cpu_pmu->node); 8898c2ecf20Sopenharmony_ci} 8908c2ecf20Sopenharmony_ci 8918c2ecf20Sopenharmony_cistatic struct arm_pmu *__armpmu_alloc(gfp_t flags) 8928c2ecf20Sopenharmony_ci{ 8938c2ecf20Sopenharmony_ci struct arm_pmu *pmu; 8948c2ecf20Sopenharmony_ci int cpu; 8958c2ecf20Sopenharmony_ci 8968c2ecf20Sopenharmony_ci pmu = kzalloc(sizeof(*pmu), flags); 8978c2ecf20Sopenharmony_ci if (!pmu) { 8988c2ecf20Sopenharmony_ci pr_info("failed to allocate PMU device!\n"); 8998c2ecf20Sopenharmony_ci goto out; 9008c2ecf20Sopenharmony_ci } 9018c2ecf20Sopenharmony_ci 9028c2ecf20Sopenharmony_ci pmu->hw_events = alloc_percpu_gfp(struct pmu_hw_events, flags); 9038c2ecf20Sopenharmony_ci if (!pmu->hw_events) { 9048c2ecf20Sopenharmony_ci pr_info("failed to allocate per-cpu PMU data.\n"); 9058c2ecf20Sopenharmony_ci goto out_free_pmu; 9068c2ecf20Sopenharmony_ci } 9078c2ecf20Sopenharmony_ci 9088c2ecf20Sopenharmony_ci pmu->pmu = (struct pmu) { 9098c2ecf20Sopenharmony_ci .pmu_enable = armpmu_enable, 9108c2ecf20Sopenharmony_ci .pmu_disable = armpmu_disable, 9118c2ecf20Sopenharmony_ci .event_init = armpmu_event_init, 9128c2ecf20Sopenharmony_ci .add = armpmu_add, 9138c2ecf20Sopenharmony_ci .del = armpmu_del, 9148c2ecf20Sopenharmony_ci .start = armpmu_start, 9158c2ecf20Sopenharmony_ci .stop = armpmu_stop, 9168c2ecf20Sopenharmony_ci .read = armpmu_read, 9178c2ecf20Sopenharmony_ci .filter_match = armpmu_filter_match, 9188c2ecf20Sopenharmony_ci .attr_groups = pmu->attr_groups, 9198c2ecf20Sopenharmony_ci /* 9208c2ecf20Sopenharmony_ci * This is a CPU PMU potentially in a heterogeneous 9218c2ecf20Sopenharmony_ci * configuration (e.g. big.LITTLE). This is not an uncore PMU, 9228c2ecf20Sopenharmony_ci * and we have taken ctx sharing into account (e.g. with our 9238c2ecf20Sopenharmony_ci * pmu::filter_match callback and pmu::event_init group 9248c2ecf20Sopenharmony_ci * validation). 9258c2ecf20Sopenharmony_ci */ 9268c2ecf20Sopenharmony_ci .capabilities = PERF_PMU_CAP_HETEROGENEOUS_CPUS, 9278c2ecf20Sopenharmony_ci }; 9288c2ecf20Sopenharmony_ci 9298c2ecf20Sopenharmony_ci pmu->attr_groups[ARMPMU_ATTR_GROUP_COMMON] = 9308c2ecf20Sopenharmony_ci &armpmu_common_attr_group; 9318c2ecf20Sopenharmony_ci 9328c2ecf20Sopenharmony_ci for_each_possible_cpu(cpu) { 9338c2ecf20Sopenharmony_ci struct pmu_hw_events *events; 9348c2ecf20Sopenharmony_ci 9358c2ecf20Sopenharmony_ci events = per_cpu_ptr(pmu->hw_events, cpu); 9368c2ecf20Sopenharmony_ci raw_spin_lock_init(&events->pmu_lock); 9378c2ecf20Sopenharmony_ci events->percpu_pmu = pmu; 9388c2ecf20Sopenharmony_ci } 9398c2ecf20Sopenharmony_ci 9408c2ecf20Sopenharmony_ci return pmu; 9418c2ecf20Sopenharmony_ci 9428c2ecf20Sopenharmony_ciout_free_pmu: 9438c2ecf20Sopenharmony_ci kfree(pmu); 9448c2ecf20Sopenharmony_ciout: 9458c2ecf20Sopenharmony_ci return NULL; 9468c2ecf20Sopenharmony_ci} 9478c2ecf20Sopenharmony_ci 9488c2ecf20Sopenharmony_cistruct arm_pmu *armpmu_alloc(void) 9498c2ecf20Sopenharmony_ci{ 9508c2ecf20Sopenharmony_ci return __armpmu_alloc(GFP_KERNEL); 9518c2ecf20Sopenharmony_ci} 9528c2ecf20Sopenharmony_ci 9538c2ecf20Sopenharmony_cistruct arm_pmu *armpmu_alloc_atomic(void) 9548c2ecf20Sopenharmony_ci{ 9558c2ecf20Sopenharmony_ci return __armpmu_alloc(GFP_ATOMIC); 9568c2ecf20Sopenharmony_ci} 9578c2ecf20Sopenharmony_ci 9588c2ecf20Sopenharmony_ci 9598c2ecf20Sopenharmony_civoid armpmu_free(struct arm_pmu *pmu) 9608c2ecf20Sopenharmony_ci{ 9618c2ecf20Sopenharmony_ci free_percpu(pmu->hw_events); 9628c2ecf20Sopenharmony_ci kfree(pmu); 9638c2ecf20Sopenharmony_ci} 9648c2ecf20Sopenharmony_ci 9658c2ecf20Sopenharmony_ciint armpmu_register(struct arm_pmu *pmu) 9668c2ecf20Sopenharmony_ci{ 9678c2ecf20Sopenharmony_ci int ret; 9688c2ecf20Sopenharmony_ci 9698c2ecf20Sopenharmony_ci ret = cpu_pmu_init(pmu); 9708c2ecf20Sopenharmony_ci if (ret) 9718c2ecf20Sopenharmony_ci return ret; 9728c2ecf20Sopenharmony_ci 9738c2ecf20Sopenharmony_ci if (!pmu->set_event_filter) 9748c2ecf20Sopenharmony_ci pmu->pmu.capabilities |= PERF_PMU_CAP_NO_EXCLUDE; 9758c2ecf20Sopenharmony_ci 9768c2ecf20Sopenharmony_ci ret = perf_pmu_register(&pmu->pmu, pmu->name, -1); 9778c2ecf20Sopenharmony_ci if (ret) 9788c2ecf20Sopenharmony_ci goto out_destroy; 9798c2ecf20Sopenharmony_ci 9808c2ecf20Sopenharmony_ci if (!__oprofile_cpu_pmu) 9818c2ecf20Sopenharmony_ci __oprofile_cpu_pmu = pmu; 9828c2ecf20Sopenharmony_ci 9838c2ecf20Sopenharmony_ci pr_info("enabled with %s PMU driver, %d counters available%s\n", 9848c2ecf20Sopenharmony_ci pmu->name, pmu->num_events, 9858c2ecf20Sopenharmony_ci has_nmi ? ", using NMIs" : ""); 9868c2ecf20Sopenharmony_ci 9878c2ecf20Sopenharmony_ci return 0; 9888c2ecf20Sopenharmony_ci 9898c2ecf20Sopenharmony_ciout_destroy: 9908c2ecf20Sopenharmony_ci cpu_pmu_destroy(pmu); 9918c2ecf20Sopenharmony_ci return ret; 9928c2ecf20Sopenharmony_ci} 9938c2ecf20Sopenharmony_ci 9948c2ecf20Sopenharmony_cistatic int arm_pmu_hp_init(void) 9958c2ecf20Sopenharmony_ci{ 9968c2ecf20Sopenharmony_ci int ret; 9978c2ecf20Sopenharmony_ci 9988c2ecf20Sopenharmony_ci ret = cpuhp_setup_state_multi(CPUHP_AP_PERF_ARM_STARTING, 9998c2ecf20Sopenharmony_ci "perf/arm/pmu:starting", 10008c2ecf20Sopenharmony_ci arm_perf_starting_cpu, 10018c2ecf20Sopenharmony_ci arm_perf_teardown_cpu); 10028c2ecf20Sopenharmony_ci if (ret) 10038c2ecf20Sopenharmony_ci pr_err("CPU hotplug notifier for ARM PMU could not be registered: %d\n", 10048c2ecf20Sopenharmony_ci ret); 10058c2ecf20Sopenharmony_ci return ret; 10068c2ecf20Sopenharmony_ci} 10078c2ecf20Sopenharmony_cisubsys_initcall(arm_pmu_hp_init); 1008