162306a36Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0 262306a36Sopenharmony_ci/* 362306a36Sopenharmony_ci * CPU PMU driver for the Apple M1 and derivatives 462306a36Sopenharmony_ci * 562306a36Sopenharmony_ci * Copyright (C) 2021 Google LLC 662306a36Sopenharmony_ci * 762306a36Sopenharmony_ci * Author: Marc Zyngier <maz@kernel.org> 862306a36Sopenharmony_ci * 962306a36Sopenharmony_ci * Most of the information used in this driver was provided by the 1062306a36Sopenharmony_ci * Asahi Linux project. The rest was experimentally discovered. 1162306a36Sopenharmony_ci */ 1262306a36Sopenharmony_ci 1362306a36Sopenharmony_ci#include <linux/of.h> 1462306a36Sopenharmony_ci#include <linux/perf/arm_pmu.h> 1562306a36Sopenharmony_ci#include <linux/platform_device.h> 1662306a36Sopenharmony_ci 1762306a36Sopenharmony_ci#include <asm/apple_m1_pmu.h> 1862306a36Sopenharmony_ci#include <asm/irq_regs.h> 1962306a36Sopenharmony_ci#include <asm/perf_event.h> 2062306a36Sopenharmony_ci 2162306a36Sopenharmony_ci#define M1_PMU_NR_COUNTERS 10 2262306a36Sopenharmony_ci 2362306a36Sopenharmony_ci#define M1_PMU_CFG_EVENT GENMASK(7, 0) 2462306a36Sopenharmony_ci 2562306a36Sopenharmony_ci#define ANY_BUT_0_1 GENMASK(9, 2) 2662306a36Sopenharmony_ci#define ONLY_2_TO_7 GENMASK(7, 2) 2762306a36Sopenharmony_ci#define ONLY_2_4_6 (BIT(2) | BIT(4) | BIT(6)) 2862306a36Sopenharmony_ci#define ONLY_5_6_7 (BIT(5) | BIT(6) | BIT(7)) 2962306a36Sopenharmony_ci 3062306a36Sopenharmony_ci/* 3162306a36Sopenharmony_ci * Description of the events we actually know about, as well as those with 3262306a36Sopenharmony_ci * a specific counter affinity. Yes, this is a grand total of two known 3362306a36Sopenharmony_ci * counters, and the rest is anybody's guess. 3462306a36Sopenharmony_ci * 3562306a36Sopenharmony_ci * Not all counters can count all events. Counters #0 and #1 are wired to 3662306a36Sopenharmony_ci * count cycles and instructions respectively, and some events have 3762306a36Sopenharmony_ci * bizarre mappings (every other counter, or even *one* counter). These 3862306a36Sopenharmony_ci * restrictions equally apply to both P and E cores. 3962306a36Sopenharmony_ci * 4062306a36Sopenharmony_ci * It is worth noting that the PMUs attached to P and E cores are likely 4162306a36Sopenharmony_ci * to be different because the underlying uarches are different. At the 4262306a36Sopenharmony_ci * moment, we don't really need to distinguish between the two because we 4362306a36Sopenharmony_ci * know next to nothing about the events themselves, and we already have 4462306a36Sopenharmony_ci * per cpu-type PMU abstractions. 4562306a36Sopenharmony_ci * 4662306a36Sopenharmony_ci * If we eventually find out that the events are different across 4762306a36Sopenharmony_ci * implementations, we'll have to introduce per cpu-type tables. 4862306a36Sopenharmony_ci */ 4962306a36Sopenharmony_cienum m1_pmu_events { 5062306a36Sopenharmony_ci M1_PMU_PERFCTR_UNKNOWN_01 = 0x01, 5162306a36Sopenharmony_ci M1_PMU_PERFCTR_CPU_CYCLES = 0x02, 5262306a36Sopenharmony_ci M1_PMU_PERFCTR_INSTRUCTIONS = 0x8c, 5362306a36Sopenharmony_ci M1_PMU_PERFCTR_UNKNOWN_8d = 0x8d, 5462306a36Sopenharmony_ci M1_PMU_PERFCTR_UNKNOWN_8e = 0x8e, 5562306a36Sopenharmony_ci M1_PMU_PERFCTR_UNKNOWN_8f = 0x8f, 5662306a36Sopenharmony_ci M1_PMU_PERFCTR_UNKNOWN_90 = 0x90, 5762306a36Sopenharmony_ci M1_PMU_PERFCTR_UNKNOWN_93 = 0x93, 5862306a36Sopenharmony_ci M1_PMU_PERFCTR_UNKNOWN_94 = 0x94, 5962306a36Sopenharmony_ci M1_PMU_PERFCTR_UNKNOWN_95 = 0x95, 6062306a36Sopenharmony_ci M1_PMU_PERFCTR_UNKNOWN_96 = 0x96, 6162306a36Sopenharmony_ci M1_PMU_PERFCTR_UNKNOWN_97 = 0x97, 6262306a36Sopenharmony_ci M1_PMU_PERFCTR_UNKNOWN_98 = 0x98, 6362306a36Sopenharmony_ci M1_PMU_PERFCTR_UNKNOWN_99 = 0x99, 6462306a36Sopenharmony_ci M1_PMU_PERFCTR_UNKNOWN_9a = 0x9a, 6562306a36Sopenharmony_ci M1_PMU_PERFCTR_UNKNOWN_9b = 0x9b, 6662306a36Sopenharmony_ci M1_PMU_PERFCTR_UNKNOWN_9c = 0x9c, 6762306a36Sopenharmony_ci M1_PMU_PERFCTR_UNKNOWN_9f = 0x9f, 6862306a36Sopenharmony_ci M1_PMU_PERFCTR_UNKNOWN_bf = 0xbf, 6962306a36Sopenharmony_ci M1_PMU_PERFCTR_UNKNOWN_c0 = 0xc0, 7062306a36Sopenharmony_ci M1_PMU_PERFCTR_UNKNOWN_c1 = 0xc1, 7162306a36Sopenharmony_ci M1_PMU_PERFCTR_UNKNOWN_c4 = 0xc4, 7262306a36Sopenharmony_ci M1_PMU_PERFCTR_UNKNOWN_c5 = 0xc5, 7362306a36Sopenharmony_ci M1_PMU_PERFCTR_UNKNOWN_c6 = 0xc6, 7462306a36Sopenharmony_ci M1_PMU_PERFCTR_UNKNOWN_c8 = 0xc8, 7562306a36Sopenharmony_ci M1_PMU_PERFCTR_UNKNOWN_ca = 0xca, 7662306a36Sopenharmony_ci M1_PMU_PERFCTR_UNKNOWN_cb = 0xcb, 7762306a36Sopenharmony_ci M1_PMU_PERFCTR_UNKNOWN_f5 = 0xf5, 7862306a36Sopenharmony_ci M1_PMU_PERFCTR_UNKNOWN_f6 = 0xf6, 7962306a36Sopenharmony_ci M1_PMU_PERFCTR_UNKNOWN_f7 = 0xf7, 8062306a36Sopenharmony_ci M1_PMU_PERFCTR_UNKNOWN_f8 = 0xf8, 8162306a36Sopenharmony_ci M1_PMU_PERFCTR_UNKNOWN_fd = 0xfd, 8262306a36Sopenharmony_ci M1_PMU_PERFCTR_LAST = M1_PMU_CFG_EVENT, 8362306a36Sopenharmony_ci 8462306a36Sopenharmony_ci /* 8562306a36Sopenharmony_ci * From this point onwards, these are not actual HW events, 8662306a36Sopenharmony_ci * but attributes that get stored in hw->config_base. 8762306a36Sopenharmony_ci */ 8862306a36Sopenharmony_ci M1_PMU_CFG_COUNT_USER = BIT(8), 8962306a36Sopenharmony_ci M1_PMU_CFG_COUNT_KERNEL = BIT(9), 9062306a36Sopenharmony_ci}; 9162306a36Sopenharmony_ci 9262306a36Sopenharmony_ci/* 9362306a36Sopenharmony_ci * Per-event affinity table. Most events can be installed on counter 9462306a36Sopenharmony_ci * 2-9, but there are a number of exceptions. Note that this table 9562306a36Sopenharmony_ci * has been created experimentally, and I wouldn't be surprised if more 9662306a36Sopenharmony_ci * counters had strange affinities. 9762306a36Sopenharmony_ci */ 9862306a36Sopenharmony_cistatic const u16 m1_pmu_event_affinity[M1_PMU_PERFCTR_LAST + 1] = { 9962306a36Sopenharmony_ci [0 ... M1_PMU_PERFCTR_LAST] = ANY_BUT_0_1, 10062306a36Sopenharmony_ci [M1_PMU_PERFCTR_UNKNOWN_01] = BIT(7), 10162306a36Sopenharmony_ci [M1_PMU_PERFCTR_CPU_CYCLES] = ANY_BUT_0_1 | BIT(0), 10262306a36Sopenharmony_ci [M1_PMU_PERFCTR_INSTRUCTIONS] = BIT(7) | BIT(1), 10362306a36Sopenharmony_ci [M1_PMU_PERFCTR_UNKNOWN_8d] = ONLY_5_6_7, 10462306a36Sopenharmony_ci [M1_PMU_PERFCTR_UNKNOWN_8e] = ONLY_5_6_7, 10562306a36Sopenharmony_ci [M1_PMU_PERFCTR_UNKNOWN_8f] = ONLY_5_6_7, 10662306a36Sopenharmony_ci [M1_PMU_PERFCTR_UNKNOWN_90] = ONLY_5_6_7, 10762306a36Sopenharmony_ci [M1_PMU_PERFCTR_UNKNOWN_93] = ONLY_5_6_7, 10862306a36Sopenharmony_ci [M1_PMU_PERFCTR_UNKNOWN_94] = ONLY_5_6_7, 10962306a36Sopenharmony_ci [M1_PMU_PERFCTR_UNKNOWN_95] = ONLY_5_6_7, 11062306a36Sopenharmony_ci [M1_PMU_PERFCTR_UNKNOWN_96] = ONLY_5_6_7, 11162306a36Sopenharmony_ci [M1_PMU_PERFCTR_UNKNOWN_97] = BIT(7), 11262306a36Sopenharmony_ci [M1_PMU_PERFCTR_UNKNOWN_98] = ONLY_5_6_7, 11362306a36Sopenharmony_ci [M1_PMU_PERFCTR_UNKNOWN_99] = ONLY_5_6_7, 11462306a36Sopenharmony_ci [M1_PMU_PERFCTR_UNKNOWN_9a] = BIT(7), 11562306a36Sopenharmony_ci [M1_PMU_PERFCTR_UNKNOWN_9b] = ONLY_5_6_7, 11662306a36Sopenharmony_ci [M1_PMU_PERFCTR_UNKNOWN_9c] = ONLY_5_6_7, 11762306a36Sopenharmony_ci [M1_PMU_PERFCTR_UNKNOWN_9f] = BIT(7), 11862306a36Sopenharmony_ci [M1_PMU_PERFCTR_UNKNOWN_bf] = ONLY_5_6_7, 11962306a36Sopenharmony_ci [M1_PMU_PERFCTR_UNKNOWN_c0] = ONLY_5_6_7, 12062306a36Sopenharmony_ci [M1_PMU_PERFCTR_UNKNOWN_c1] = ONLY_5_6_7, 12162306a36Sopenharmony_ci [M1_PMU_PERFCTR_UNKNOWN_c4] = ONLY_5_6_7, 12262306a36Sopenharmony_ci [M1_PMU_PERFCTR_UNKNOWN_c5] = ONLY_5_6_7, 12362306a36Sopenharmony_ci [M1_PMU_PERFCTR_UNKNOWN_c6] = ONLY_5_6_7, 12462306a36Sopenharmony_ci [M1_PMU_PERFCTR_UNKNOWN_c8] = ONLY_5_6_7, 12562306a36Sopenharmony_ci [M1_PMU_PERFCTR_UNKNOWN_ca] = ONLY_5_6_7, 12662306a36Sopenharmony_ci [M1_PMU_PERFCTR_UNKNOWN_cb] = ONLY_5_6_7, 12762306a36Sopenharmony_ci [M1_PMU_PERFCTR_UNKNOWN_f5] = ONLY_2_4_6, 12862306a36Sopenharmony_ci [M1_PMU_PERFCTR_UNKNOWN_f6] = ONLY_2_4_6, 12962306a36Sopenharmony_ci [M1_PMU_PERFCTR_UNKNOWN_f7] = ONLY_2_4_6, 13062306a36Sopenharmony_ci [M1_PMU_PERFCTR_UNKNOWN_f8] = ONLY_2_TO_7, 13162306a36Sopenharmony_ci [M1_PMU_PERFCTR_UNKNOWN_fd] = ONLY_2_4_6, 13262306a36Sopenharmony_ci}; 13362306a36Sopenharmony_ci 13462306a36Sopenharmony_cistatic const unsigned m1_pmu_perf_map[PERF_COUNT_HW_MAX] = { 13562306a36Sopenharmony_ci PERF_MAP_ALL_UNSUPPORTED, 13662306a36Sopenharmony_ci [PERF_COUNT_HW_CPU_CYCLES] = M1_PMU_PERFCTR_CPU_CYCLES, 13762306a36Sopenharmony_ci [PERF_COUNT_HW_INSTRUCTIONS] = M1_PMU_PERFCTR_INSTRUCTIONS, 13862306a36Sopenharmony_ci /* No idea about the rest yet */ 13962306a36Sopenharmony_ci}; 14062306a36Sopenharmony_ci 14162306a36Sopenharmony_ci/* sysfs definitions */ 14262306a36Sopenharmony_cistatic ssize_t m1_pmu_events_sysfs_show(struct device *dev, 14362306a36Sopenharmony_ci struct device_attribute *attr, 14462306a36Sopenharmony_ci char *page) 14562306a36Sopenharmony_ci{ 14662306a36Sopenharmony_ci struct perf_pmu_events_attr *pmu_attr; 14762306a36Sopenharmony_ci 14862306a36Sopenharmony_ci pmu_attr = container_of(attr, struct perf_pmu_events_attr, attr); 14962306a36Sopenharmony_ci 15062306a36Sopenharmony_ci return sprintf(page, "event=0x%04llx\n", pmu_attr->id); 15162306a36Sopenharmony_ci} 15262306a36Sopenharmony_ci 15362306a36Sopenharmony_ci#define M1_PMU_EVENT_ATTR(name, config) \ 15462306a36Sopenharmony_ci PMU_EVENT_ATTR_ID(name, m1_pmu_events_sysfs_show, config) 15562306a36Sopenharmony_ci 15662306a36Sopenharmony_cistatic struct attribute *m1_pmu_event_attrs[] = { 15762306a36Sopenharmony_ci M1_PMU_EVENT_ATTR(cycles, M1_PMU_PERFCTR_CPU_CYCLES), 15862306a36Sopenharmony_ci M1_PMU_EVENT_ATTR(instructions, M1_PMU_PERFCTR_INSTRUCTIONS), 15962306a36Sopenharmony_ci NULL, 16062306a36Sopenharmony_ci}; 16162306a36Sopenharmony_ci 16262306a36Sopenharmony_cistatic const struct attribute_group m1_pmu_events_attr_group = { 16362306a36Sopenharmony_ci .name = "events", 16462306a36Sopenharmony_ci .attrs = m1_pmu_event_attrs, 16562306a36Sopenharmony_ci}; 16662306a36Sopenharmony_ci 16762306a36Sopenharmony_ciPMU_FORMAT_ATTR(event, "config:0-7"); 16862306a36Sopenharmony_ci 16962306a36Sopenharmony_cistatic struct attribute *m1_pmu_format_attrs[] = { 17062306a36Sopenharmony_ci &format_attr_event.attr, 17162306a36Sopenharmony_ci NULL, 17262306a36Sopenharmony_ci}; 17362306a36Sopenharmony_ci 17462306a36Sopenharmony_cistatic const struct attribute_group m1_pmu_format_attr_group = { 17562306a36Sopenharmony_ci .name = "format", 17662306a36Sopenharmony_ci .attrs = m1_pmu_format_attrs, 17762306a36Sopenharmony_ci}; 17862306a36Sopenharmony_ci 17962306a36Sopenharmony_ci/* Low level accessors. No synchronisation. */ 18062306a36Sopenharmony_ci#define PMU_READ_COUNTER(_idx) \ 18162306a36Sopenharmony_ci case _idx: return read_sysreg_s(SYS_IMP_APL_PMC## _idx ##_EL1) 18262306a36Sopenharmony_ci 18362306a36Sopenharmony_ci#define PMU_WRITE_COUNTER(_val, _idx) \ 18462306a36Sopenharmony_ci case _idx: \ 18562306a36Sopenharmony_ci write_sysreg_s(_val, SYS_IMP_APL_PMC## _idx ##_EL1); \ 18662306a36Sopenharmony_ci return 18762306a36Sopenharmony_ci 18862306a36Sopenharmony_cistatic u64 m1_pmu_read_hw_counter(unsigned int index) 18962306a36Sopenharmony_ci{ 19062306a36Sopenharmony_ci switch (index) { 19162306a36Sopenharmony_ci PMU_READ_COUNTER(0); 19262306a36Sopenharmony_ci PMU_READ_COUNTER(1); 19362306a36Sopenharmony_ci PMU_READ_COUNTER(2); 19462306a36Sopenharmony_ci PMU_READ_COUNTER(3); 19562306a36Sopenharmony_ci PMU_READ_COUNTER(4); 19662306a36Sopenharmony_ci PMU_READ_COUNTER(5); 19762306a36Sopenharmony_ci PMU_READ_COUNTER(6); 19862306a36Sopenharmony_ci PMU_READ_COUNTER(7); 19962306a36Sopenharmony_ci PMU_READ_COUNTER(8); 20062306a36Sopenharmony_ci PMU_READ_COUNTER(9); 20162306a36Sopenharmony_ci } 20262306a36Sopenharmony_ci 20362306a36Sopenharmony_ci BUG(); 20462306a36Sopenharmony_ci} 20562306a36Sopenharmony_ci 20662306a36Sopenharmony_cistatic void m1_pmu_write_hw_counter(u64 val, unsigned int index) 20762306a36Sopenharmony_ci{ 20862306a36Sopenharmony_ci switch (index) { 20962306a36Sopenharmony_ci PMU_WRITE_COUNTER(val, 0); 21062306a36Sopenharmony_ci PMU_WRITE_COUNTER(val, 1); 21162306a36Sopenharmony_ci PMU_WRITE_COUNTER(val, 2); 21262306a36Sopenharmony_ci PMU_WRITE_COUNTER(val, 3); 21362306a36Sopenharmony_ci PMU_WRITE_COUNTER(val, 4); 21462306a36Sopenharmony_ci PMU_WRITE_COUNTER(val, 5); 21562306a36Sopenharmony_ci PMU_WRITE_COUNTER(val, 6); 21662306a36Sopenharmony_ci PMU_WRITE_COUNTER(val, 7); 21762306a36Sopenharmony_ci PMU_WRITE_COUNTER(val, 8); 21862306a36Sopenharmony_ci PMU_WRITE_COUNTER(val, 9); 21962306a36Sopenharmony_ci } 22062306a36Sopenharmony_ci 22162306a36Sopenharmony_ci BUG(); 22262306a36Sopenharmony_ci} 22362306a36Sopenharmony_ci 22462306a36Sopenharmony_ci#define get_bit_offset(index, mask) (__ffs(mask) + (index)) 22562306a36Sopenharmony_ci 22662306a36Sopenharmony_cistatic void __m1_pmu_enable_counter(unsigned int index, bool en) 22762306a36Sopenharmony_ci{ 22862306a36Sopenharmony_ci u64 val, bit; 22962306a36Sopenharmony_ci 23062306a36Sopenharmony_ci switch (index) { 23162306a36Sopenharmony_ci case 0 ... 7: 23262306a36Sopenharmony_ci bit = BIT(get_bit_offset(index, PMCR0_CNT_ENABLE_0_7)); 23362306a36Sopenharmony_ci break; 23462306a36Sopenharmony_ci case 8 ... 9: 23562306a36Sopenharmony_ci bit = BIT(get_bit_offset(index - 8, PMCR0_CNT_ENABLE_8_9)); 23662306a36Sopenharmony_ci break; 23762306a36Sopenharmony_ci default: 23862306a36Sopenharmony_ci BUG(); 23962306a36Sopenharmony_ci } 24062306a36Sopenharmony_ci 24162306a36Sopenharmony_ci val = read_sysreg_s(SYS_IMP_APL_PMCR0_EL1); 24262306a36Sopenharmony_ci 24362306a36Sopenharmony_ci if (en) 24462306a36Sopenharmony_ci val |= bit; 24562306a36Sopenharmony_ci else 24662306a36Sopenharmony_ci val &= ~bit; 24762306a36Sopenharmony_ci 24862306a36Sopenharmony_ci write_sysreg_s(val, SYS_IMP_APL_PMCR0_EL1); 24962306a36Sopenharmony_ci} 25062306a36Sopenharmony_ci 25162306a36Sopenharmony_cistatic void m1_pmu_enable_counter(unsigned int index) 25262306a36Sopenharmony_ci{ 25362306a36Sopenharmony_ci __m1_pmu_enable_counter(index, true); 25462306a36Sopenharmony_ci} 25562306a36Sopenharmony_ci 25662306a36Sopenharmony_cistatic void m1_pmu_disable_counter(unsigned int index) 25762306a36Sopenharmony_ci{ 25862306a36Sopenharmony_ci __m1_pmu_enable_counter(index, false); 25962306a36Sopenharmony_ci} 26062306a36Sopenharmony_ci 26162306a36Sopenharmony_cistatic void __m1_pmu_enable_counter_interrupt(unsigned int index, bool en) 26262306a36Sopenharmony_ci{ 26362306a36Sopenharmony_ci u64 val, bit; 26462306a36Sopenharmony_ci 26562306a36Sopenharmony_ci switch (index) { 26662306a36Sopenharmony_ci case 0 ... 7: 26762306a36Sopenharmony_ci bit = BIT(get_bit_offset(index, PMCR0_PMI_ENABLE_0_7)); 26862306a36Sopenharmony_ci break; 26962306a36Sopenharmony_ci case 8 ... 9: 27062306a36Sopenharmony_ci bit = BIT(get_bit_offset(index - 8, PMCR0_PMI_ENABLE_8_9)); 27162306a36Sopenharmony_ci break; 27262306a36Sopenharmony_ci default: 27362306a36Sopenharmony_ci BUG(); 27462306a36Sopenharmony_ci } 27562306a36Sopenharmony_ci 27662306a36Sopenharmony_ci val = read_sysreg_s(SYS_IMP_APL_PMCR0_EL1); 27762306a36Sopenharmony_ci 27862306a36Sopenharmony_ci if (en) 27962306a36Sopenharmony_ci val |= bit; 28062306a36Sopenharmony_ci else 28162306a36Sopenharmony_ci val &= ~bit; 28262306a36Sopenharmony_ci 28362306a36Sopenharmony_ci write_sysreg_s(val, SYS_IMP_APL_PMCR0_EL1); 28462306a36Sopenharmony_ci} 28562306a36Sopenharmony_ci 28662306a36Sopenharmony_cistatic void m1_pmu_enable_counter_interrupt(unsigned int index) 28762306a36Sopenharmony_ci{ 28862306a36Sopenharmony_ci __m1_pmu_enable_counter_interrupt(index, true); 28962306a36Sopenharmony_ci} 29062306a36Sopenharmony_ci 29162306a36Sopenharmony_cistatic void m1_pmu_disable_counter_interrupt(unsigned int index) 29262306a36Sopenharmony_ci{ 29362306a36Sopenharmony_ci __m1_pmu_enable_counter_interrupt(index, false); 29462306a36Sopenharmony_ci} 29562306a36Sopenharmony_ci 29662306a36Sopenharmony_cistatic void m1_pmu_configure_counter(unsigned int index, u8 event, 29762306a36Sopenharmony_ci bool user, bool kernel) 29862306a36Sopenharmony_ci{ 29962306a36Sopenharmony_ci u64 val, user_bit, kernel_bit; 30062306a36Sopenharmony_ci int shift; 30162306a36Sopenharmony_ci 30262306a36Sopenharmony_ci switch (index) { 30362306a36Sopenharmony_ci case 0 ... 7: 30462306a36Sopenharmony_ci user_bit = BIT(get_bit_offset(index, PMCR1_COUNT_A64_EL0_0_7)); 30562306a36Sopenharmony_ci kernel_bit = BIT(get_bit_offset(index, PMCR1_COUNT_A64_EL1_0_7)); 30662306a36Sopenharmony_ci break; 30762306a36Sopenharmony_ci case 8 ... 9: 30862306a36Sopenharmony_ci user_bit = BIT(get_bit_offset(index - 8, PMCR1_COUNT_A64_EL0_8_9)); 30962306a36Sopenharmony_ci kernel_bit = BIT(get_bit_offset(index - 8, PMCR1_COUNT_A64_EL1_8_9)); 31062306a36Sopenharmony_ci break; 31162306a36Sopenharmony_ci default: 31262306a36Sopenharmony_ci BUG(); 31362306a36Sopenharmony_ci } 31462306a36Sopenharmony_ci 31562306a36Sopenharmony_ci val = read_sysreg_s(SYS_IMP_APL_PMCR1_EL1); 31662306a36Sopenharmony_ci 31762306a36Sopenharmony_ci if (user) 31862306a36Sopenharmony_ci val |= user_bit; 31962306a36Sopenharmony_ci else 32062306a36Sopenharmony_ci val &= ~user_bit; 32162306a36Sopenharmony_ci 32262306a36Sopenharmony_ci if (kernel) 32362306a36Sopenharmony_ci val |= kernel_bit; 32462306a36Sopenharmony_ci else 32562306a36Sopenharmony_ci val &= ~kernel_bit; 32662306a36Sopenharmony_ci 32762306a36Sopenharmony_ci write_sysreg_s(val, SYS_IMP_APL_PMCR1_EL1); 32862306a36Sopenharmony_ci 32962306a36Sopenharmony_ci /* 33062306a36Sopenharmony_ci * Counters 0 and 1 have fixed events. For anything else, 33162306a36Sopenharmony_ci * place the event at the expected location in the relevant 33262306a36Sopenharmony_ci * register (PMESR0 holds the event configuration for counters 33362306a36Sopenharmony_ci * 2-5, resp. PMESR1 for counters 6-9). 33462306a36Sopenharmony_ci */ 33562306a36Sopenharmony_ci switch (index) { 33662306a36Sopenharmony_ci case 0 ... 1: 33762306a36Sopenharmony_ci break; 33862306a36Sopenharmony_ci case 2 ... 5: 33962306a36Sopenharmony_ci shift = (index - 2) * 8; 34062306a36Sopenharmony_ci val = read_sysreg_s(SYS_IMP_APL_PMESR0_EL1); 34162306a36Sopenharmony_ci val &= ~((u64)0xff << shift); 34262306a36Sopenharmony_ci val |= (u64)event << shift; 34362306a36Sopenharmony_ci write_sysreg_s(val, SYS_IMP_APL_PMESR0_EL1); 34462306a36Sopenharmony_ci break; 34562306a36Sopenharmony_ci case 6 ... 9: 34662306a36Sopenharmony_ci shift = (index - 6) * 8; 34762306a36Sopenharmony_ci val = read_sysreg_s(SYS_IMP_APL_PMESR1_EL1); 34862306a36Sopenharmony_ci val &= ~((u64)0xff << shift); 34962306a36Sopenharmony_ci val |= (u64)event << shift; 35062306a36Sopenharmony_ci write_sysreg_s(val, SYS_IMP_APL_PMESR1_EL1); 35162306a36Sopenharmony_ci break; 35262306a36Sopenharmony_ci } 35362306a36Sopenharmony_ci} 35462306a36Sopenharmony_ci 35562306a36Sopenharmony_ci/* arm_pmu backend */ 35662306a36Sopenharmony_cistatic void m1_pmu_enable_event(struct perf_event *event) 35762306a36Sopenharmony_ci{ 35862306a36Sopenharmony_ci bool user, kernel; 35962306a36Sopenharmony_ci u8 evt; 36062306a36Sopenharmony_ci 36162306a36Sopenharmony_ci evt = event->hw.config_base & M1_PMU_CFG_EVENT; 36262306a36Sopenharmony_ci user = event->hw.config_base & M1_PMU_CFG_COUNT_USER; 36362306a36Sopenharmony_ci kernel = event->hw.config_base & M1_PMU_CFG_COUNT_KERNEL; 36462306a36Sopenharmony_ci 36562306a36Sopenharmony_ci m1_pmu_disable_counter_interrupt(event->hw.idx); 36662306a36Sopenharmony_ci m1_pmu_disable_counter(event->hw.idx); 36762306a36Sopenharmony_ci isb(); 36862306a36Sopenharmony_ci 36962306a36Sopenharmony_ci m1_pmu_configure_counter(event->hw.idx, evt, user, kernel); 37062306a36Sopenharmony_ci m1_pmu_enable_counter(event->hw.idx); 37162306a36Sopenharmony_ci m1_pmu_enable_counter_interrupt(event->hw.idx); 37262306a36Sopenharmony_ci isb(); 37362306a36Sopenharmony_ci} 37462306a36Sopenharmony_ci 37562306a36Sopenharmony_cistatic void m1_pmu_disable_event(struct perf_event *event) 37662306a36Sopenharmony_ci{ 37762306a36Sopenharmony_ci m1_pmu_disable_counter_interrupt(event->hw.idx); 37862306a36Sopenharmony_ci m1_pmu_disable_counter(event->hw.idx); 37962306a36Sopenharmony_ci isb(); 38062306a36Sopenharmony_ci} 38162306a36Sopenharmony_ci 38262306a36Sopenharmony_cistatic irqreturn_t m1_pmu_handle_irq(struct arm_pmu *cpu_pmu) 38362306a36Sopenharmony_ci{ 38462306a36Sopenharmony_ci struct pmu_hw_events *cpuc = this_cpu_ptr(cpu_pmu->hw_events); 38562306a36Sopenharmony_ci struct pt_regs *regs; 38662306a36Sopenharmony_ci u64 overflow, state; 38762306a36Sopenharmony_ci int idx; 38862306a36Sopenharmony_ci 38962306a36Sopenharmony_ci overflow = read_sysreg_s(SYS_IMP_APL_PMSR_EL1); 39062306a36Sopenharmony_ci if (!overflow) { 39162306a36Sopenharmony_ci /* Spurious interrupt? */ 39262306a36Sopenharmony_ci state = read_sysreg_s(SYS_IMP_APL_PMCR0_EL1); 39362306a36Sopenharmony_ci state &= ~PMCR0_IACT; 39462306a36Sopenharmony_ci write_sysreg_s(state, SYS_IMP_APL_PMCR0_EL1); 39562306a36Sopenharmony_ci isb(); 39662306a36Sopenharmony_ci return IRQ_NONE; 39762306a36Sopenharmony_ci } 39862306a36Sopenharmony_ci 39962306a36Sopenharmony_ci cpu_pmu->stop(cpu_pmu); 40062306a36Sopenharmony_ci 40162306a36Sopenharmony_ci regs = get_irq_regs(); 40262306a36Sopenharmony_ci 40362306a36Sopenharmony_ci for (idx = 0; idx < cpu_pmu->num_events; idx++) { 40462306a36Sopenharmony_ci struct perf_event *event = cpuc->events[idx]; 40562306a36Sopenharmony_ci struct perf_sample_data data; 40662306a36Sopenharmony_ci 40762306a36Sopenharmony_ci if (!event) 40862306a36Sopenharmony_ci continue; 40962306a36Sopenharmony_ci 41062306a36Sopenharmony_ci armpmu_event_update(event); 41162306a36Sopenharmony_ci perf_sample_data_init(&data, 0, event->hw.last_period); 41262306a36Sopenharmony_ci if (!armpmu_event_set_period(event)) 41362306a36Sopenharmony_ci continue; 41462306a36Sopenharmony_ci 41562306a36Sopenharmony_ci if (perf_event_overflow(event, &data, regs)) 41662306a36Sopenharmony_ci m1_pmu_disable_event(event); 41762306a36Sopenharmony_ci } 41862306a36Sopenharmony_ci 41962306a36Sopenharmony_ci cpu_pmu->start(cpu_pmu); 42062306a36Sopenharmony_ci 42162306a36Sopenharmony_ci return IRQ_HANDLED; 42262306a36Sopenharmony_ci} 42362306a36Sopenharmony_ci 42462306a36Sopenharmony_cistatic u64 m1_pmu_read_counter(struct perf_event *event) 42562306a36Sopenharmony_ci{ 42662306a36Sopenharmony_ci return m1_pmu_read_hw_counter(event->hw.idx); 42762306a36Sopenharmony_ci} 42862306a36Sopenharmony_ci 42962306a36Sopenharmony_cistatic void m1_pmu_write_counter(struct perf_event *event, u64 value) 43062306a36Sopenharmony_ci{ 43162306a36Sopenharmony_ci m1_pmu_write_hw_counter(value, event->hw.idx); 43262306a36Sopenharmony_ci isb(); 43362306a36Sopenharmony_ci} 43462306a36Sopenharmony_ci 43562306a36Sopenharmony_cistatic int m1_pmu_get_event_idx(struct pmu_hw_events *cpuc, 43662306a36Sopenharmony_ci struct perf_event *event) 43762306a36Sopenharmony_ci{ 43862306a36Sopenharmony_ci unsigned long evtype = event->hw.config_base & M1_PMU_CFG_EVENT; 43962306a36Sopenharmony_ci unsigned long affinity = m1_pmu_event_affinity[evtype]; 44062306a36Sopenharmony_ci int idx; 44162306a36Sopenharmony_ci 44262306a36Sopenharmony_ci /* 44362306a36Sopenharmony_ci * Place the event on the first free counter that can count 44462306a36Sopenharmony_ci * this event. 44562306a36Sopenharmony_ci * 44662306a36Sopenharmony_ci * We could do a better job if we had a view of all the events 44762306a36Sopenharmony_ci * counting on the PMU at any given time, and by placing the 44862306a36Sopenharmony_ci * most constraining events first. 44962306a36Sopenharmony_ci */ 45062306a36Sopenharmony_ci for_each_set_bit(idx, &affinity, M1_PMU_NR_COUNTERS) { 45162306a36Sopenharmony_ci if (!test_and_set_bit(idx, cpuc->used_mask)) 45262306a36Sopenharmony_ci return idx; 45362306a36Sopenharmony_ci } 45462306a36Sopenharmony_ci 45562306a36Sopenharmony_ci return -EAGAIN; 45662306a36Sopenharmony_ci} 45762306a36Sopenharmony_ci 45862306a36Sopenharmony_cistatic void m1_pmu_clear_event_idx(struct pmu_hw_events *cpuc, 45962306a36Sopenharmony_ci struct perf_event *event) 46062306a36Sopenharmony_ci{ 46162306a36Sopenharmony_ci clear_bit(event->hw.idx, cpuc->used_mask); 46262306a36Sopenharmony_ci} 46362306a36Sopenharmony_ci 46462306a36Sopenharmony_cistatic void __m1_pmu_set_mode(u8 mode) 46562306a36Sopenharmony_ci{ 46662306a36Sopenharmony_ci u64 val; 46762306a36Sopenharmony_ci 46862306a36Sopenharmony_ci val = read_sysreg_s(SYS_IMP_APL_PMCR0_EL1); 46962306a36Sopenharmony_ci val &= ~(PMCR0_IMODE | PMCR0_IACT); 47062306a36Sopenharmony_ci val |= FIELD_PREP(PMCR0_IMODE, mode); 47162306a36Sopenharmony_ci write_sysreg_s(val, SYS_IMP_APL_PMCR0_EL1); 47262306a36Sopenharmony_ci isb(); 47362306a36Sopenharmony_ci} 47462306a36Sopenharmony_ci 47562306a36Sopenharmony_cistatic void m1_pmu_start(struct arm_pmu *cpu_pmu) 47662306a36Sopenharmony_ci{ 47762306a36Sopenharmony_ci __m1_pmu_set_mode(PMCR0_IMODE_FIQ); 47862306a36Sopenharmony_ci} 47962306a36Sopenharmony_ci 48062306a36Sopenharmony_cistatic void m1_pmu_stop(struct arm_pmu *cpu_pmu) 48162306a36Sopenharmony_ci{ 48262306a36Sopenharmony_ci __m1_pmu_set_mode(PMCR0_IMODE_OFF); 48362306a36Sopenharmony_ci} 48462306a36Sopenharmony_ci 48562306a36Sopenharmony_cistatic int m1_pmu_map_event(struct perf_event *event) 48662306a36Sopenharmony_ci{ 48762306a36Sopenharmony_ci /* 48862306a36Sopenharmony_ci * Although the counters are 48bit wide, bit 47 is what 48962306a36Sopenharmony_ci * triggers the overflow interrupt. Advertise the counters 49062306a36Sopenharmony_ci * being 47bit wide to mimick the behaviour of the ARM PMU. 49162306a36Sopenharmony_ci */ 49262306a36Sopenharmony_ci event->hw.flags |= ARMPMU_EVT_47BIT; 49362306a36Sopenharmony_ci return armpmu_map_event(event, &m1_pmu_perf_map, NULL, M1_PMU_CFG_EVENT); 49462306a36Sopenharmony_ci} 49562306a36Sopenharmony_ci 49662306a36Sopenharmony_cistatic int m2_pmu_map_event(struct perf_event *event) 49762306a36Sopenharmony_ci{ 49862306a36Sopenharmony_ci /* 49962306a36Sopenharmony_ci * Same deal as the above, except that M2 has 64bit counters. 50062306a36Sopenharmony_ci * Which, as far as we're concerned, actually means 63 bits. 50162306a36Sopenharmony_ci * Yes, this is getting awkward. 50262306a36Sopenharmony_ci */ 50362306a36Sopenharmony_ci event->hw.flags |= ARMPMU_EVT_63BIT; 50462306a36Sopenharmony_ci return armpmu_map_event(event, &m1_pmu_perf_map, NULL, M1_PMU_CFG_EVENT); 50562306a36Sopenharmony_ci} 50662306a36Sopenharmony_ci 50762306a36Sopenharmony_cistatic void m1_pmu_reset(void *info) 50862306a36Sopenharmony_ci{ 50962306a36Sopenharmony_ci int i; 51062306a36Sopenharmony_ci 51162306a36Sopenharmony_ci __m1_pmu_set_mode(PMCR0_IMODE_OFF); 51262306a36Sopenharmony_ci 51362306a36Sopenharmony_ci for (i = 0; i < M1_PMU_NR_COUNTERS; i++) { 51462306a36Sopenharmony_ci m1_pmu_disable_counter(i); 51562306a36Sopenharmony_ci m1_pmu_disable_counter_interrupt(i); 51662306a36Sopenharmony_ci m1_pmu_write_hw_counter(0, i); 51762306a36Sopenharmony_ci } 51862306a36Sopenharmony_ci 51962306a36Sopenharmony_ci isb(); 52062306a36Sopenharmony_ci} 52162306a36Sopenharmony_ci 52262306a36Sopenharmony_cistatic int m1_pmu_set_event_filter(struct hw_perf_event *event, 52362306a36Sopenharmony_ci struct perf_event_attr *attr) 52462306a36Sopenharmony_ci{ 52562306a36Sopenharmony_ci unsigned long config_base = 0; 52662306a36Sopenharmony_ci 52762306a36Sopenharmony_ci if (!attr->exclude_guest) 52862306a36Sopenharmony_ci return -EINVAL; 52962306a36Sopenharmony_ci if (!attr->exclude_kernel) 53062306a36Sopenharmony_ci config_base |= M1_PMU_CFG_COUNT_KERNEL; 53162306a36Sopenharmony_ci if (!attr->exclude_user) 53262306a36Sopenharmony_ci config_base |= M1_PMU_CFG_COUNT_USER; 53362306a36Sopenharmony_ci 53462306a36Sopenharmony_ci event->config_base = config_base; 53562306a36Sopenharmony_ci 53662306a36Sopenharmony_ci return 0; 53762306a36Sopenharmony_ci} 53862306a36Sopenharmony_ci 53962306a36Sopenharmony_cistatic int m1_pmu_init(struct arm_pmu *cpu_pmu, u32 flags) 54062306a36Sopenharmony_ci{ 54162306a36Sopenharmony_ci cpu_pmu->handle_irq = m1_pmu_handle_irq; 54262306a36Sopenharmony_ci cpu_pmu->enable = m1_pmu_enable_event; 54362306a36Sopenharmony_ci cpu_pmu->disable = m1_pmu_disable_event; 54462306a36Sopenharmony_ci cpu_pmu->read_counter = m1_pmu_read_counter; 54562306a36Sopenharmony_ci cpu_pmu->write_counter = m1_pmu_write_counter; 54662306a36Sopenharmony_ci cpu_pmu->get_event_idx = m1_pmu_get_event_idx; 54762306a36Sopenharmony_ci cpu_pmu->clear_event_idx = m1_pmu_clear_event_idx; 54862306a36Sopenharmony_ci cpu_pmu->start = m1_pmu_start; 54962306a36Sopenharmony_ci cpu_pmu->stop = m1_pmu_stop; 55062306a36Sopenharmony_ci 55162306a36Sopenharmony_ci if (flags & ARMPMU_EVT_47BIT) 55262306a36Sopenharmony_ci cpu_pmu->map_event = m1_pmu_map_event; 55362306a36Sopenharmony_ci else if (flags & ARMPMU_EVT_63BIT) 55462306a36Sopenharmony_ci cpu_pmu->map_event = m2_pmu_map_event; 55562306a36Sopenharmony_ci else 55662306a36Sopenharmony_ci return WARN_ON(-EINVAL); 55762306a36Sopenharmony_ci 55862306a36Sopenharmony_ci cpu_pmu->reset = m1_pmu_reset; 55962306a36Sopenharmony_ci cpu_pmu->set_event_filter = m1_pmu_set_event_filter; 56062306a36Sopenharmony_ci 56162306a36Sopenharmony_ci cpu_pmu->num_events = M1_PMU_NR_COUNTERS; 56262306a36Sopenharmony_ci cpu_pmu->attr_groups[ARMPMU_ATTR_GROUP_EVENTS] = &m1_pmu_events_attr_group; 56362306a36Sopenharmony_ci cpu_pmu->attr_groups[ARMPMU_ATTR_GROUP_FORMATS] = &m1_pmu_format_attr_group; 56462306a36Sopenharmony_ci return 0; 56562306a36Sopenharmony_ci} 56662306a36Sopenharmony_ci 56762306a36Sopenharmony_ci/* Device driver gunk */ 56862306a36Sopenharmony_cistatic int m1_pmu_ice_init(struct arm_pmu *cpu_pmu) 56962306a36Sopenharmony_ci{ 57062306a36Sopenharmony_ci cpu_pmu->name = "apple_icestorm_pmu"; 57162306a36Sopenharmony_ci return m1_pmu_init(cpu_pmu, ARMPMU_EVT_47BIT); 57262306a36Sopenharmony_ci} 57362306a36Sopenharmony_ci 57462306a36Sopenharmony_cistatic int m1_pmu_fire_init(struct arm_pmu *cpu_pmu) 57562306a36Sopenharmony_ci{ 57662306a36Sopenharmony_ci cpu_pmu->name = "apple_firestorm_pmu"; 57762306a36Sopenharmony_ci return m1_pmu_init(cpu_pmu, ARMPMU_EVT_47BIT); 57862306a36Sopenharmony_ci} 57962306a36Sopenharmony_ci 58062306a36Sopenharmony_cistatic int m2_pmu_avalanche_init(struct arm_pmu *cpu_pmu) 58162306a36Sopenharmony_ci{ 58262306a36Sopenharmony_ci cpu_pmu->name = "apple_avalanche_pmu"; 58362306a36Sopenharmony_ci return m1_pmu_init(cpu_pmu, ARMPMU_EVT_63BIT); 58462306a36Sopenharmony_ci} 58562306a36Sopenharmony_ci 58662306a36Sopenharmony_cistatic int m2_pmu_blizzard_init(struct arm_pmu *cpu_pmu) 58762306a36Sopenharmony_ci{ 58862306a36Sopenharmony_ci cpu_pmu->name = "apple_blizzard_pmu"; 58962306a36Sopenharmony_ci return m1_pmu_init(cpu_pmu, ARMPMU_EVT_63BIT); 59062306a36Sopenharmony_ci} 59162306a36Sopenharmony_ci 59262306a36Sopenharmony_cistatic const struct of_device_id m1_pmu_of_device_ids[] = { 59362306a36Sopenharmony_ci { .compatible = "apple,avalanche-pmu", .data = m2_pmu_avalanche_init, }, 59462306a36Sopenharmony_ci { .compatible = "apple,blizzard-pmu", .data = m2_pmu_blizzard_init, }, 59562306a36Sopenharmony_ci { .compatible = "apple,icestorm-pmu", .data = m1_pmu_ice_init, }, 59662306a36Sopenharmony_ci { .compatible = "apple,firestorm-pmu", .data = m1_pmu_fire_init, }, 59762306a36Sopenharmony_ci { }, 59862306a36Sopenharmony_ci}; 59962306a36Sopenharmony_ciMODULE_DEVICE_TABLE(of, m1_pmu_of_device_ids); 60062306a36Sopenharmony_ci 60162306a36Sopenharmony_cistatic int m1_pmu_device_probe(struct platform_device *pdev) 60262306a36Sopenharmony_ci{ 60362306a36Sopenharmony_ci return arm_pmu_device_probe(pdev, m1_pmu_of_device_ids, NULL); 60462306a36Sopenharmony_ci} 60562306a36Sopenharmony_ci 60662306a36Sopenharmony_cistatic struct platform_driver m1_pmu_driver = { 60762306a36Sopenharmony_ci .driver = { 60862306a36Sopenharmony_ci .name = "apple-m1-cpu-pmu", 60962306a36Sopenharmony_ci .of_match_table = m1_pmu_of_device_ids, 61062306a36Sopenharmony_ci .suppress_bind_attrs = true, 61162306a36Sopenharmony_ci }, 61262306a36Sopenharmony_ci .probe = m1_pmu_device_probe, 61362306a36Sopenharmony_ci}; 61462306a36Sopenharmony_ci 61562306a36Sopenharmony_cimodule_platform_driver(m1_pmu_driver); 616