18c2ecf20Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0-only 28c2ecf20Sopenharmony_ci/* 38c2ecf20Sopenharmony_ci * Intel(R) Processor Trace PMU driver for perf 48c2ecf20Sopenharmony_ci * Copyright (c) 2013-2014, Intel Corporation. 58c2ecf20Sopenharmony_ci * 68c2ecf20Sopenharmony_ci * Intel PT is specified in the Intel Architecture Instruction Set Extensions 78c2ecf20Sopenharmony_ci * Programming Reference: 88c2ecf20Sopenharmony_ci * http://software.intel.com/en-us/intel-isa-extensions 98c2ecf20Sopenharmony_ci */ 108c2ecf20Sopenharmony_ci 118c2ecf20Sopenharmony_ci#undef DEBUG 128c2ecf20Sopenharmony_ci 138c2ecf20Sopenharmony_ci#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt 148c2ecf20Sopenharmony_ci 158c2ecf20Sopenharmony_ci#include <linux/types.h> 168c2ecf20Sopenharmony_ci#include <linux/bits.h> 178c2ecf20Sopenharmony_ci#include <linux/limits.h> 188c2ecf20Sopenharmony_ci#include <linux/slab.h> 198c2ecf20Sopenharmony_ci#include <linux/device.h> 208c2ecf20Sopenharmony_ci 218c2ecf20Sopenharmony_ci#include <asm/perf_event.h> 228c2ecf20Sopenharmony_ci#include <asm/insn.h> 238c2ecf20Sopenharmony_ci#include <asm/io.h> 248c2ecf20Sopenharmony_ci#include <asm/intel_pt.h> 258c2ecf20Sopenharmony_ci#include <asm/intel-family.h> 268c2ecf20Sopenharmony_ci 278c2ecf20Sopenharmony_ci#include "../perf_event.h" 288c2ecf20Sopenharmony_ci#include "pt.h" 298c2ecf20Sopenharmony_ci 308c2ecf20Sopenharmony_cistatic DEFINE_PER_CPU(struct pt, pt_ctx); 318c2ecf20Sopenharmony_ci 328c2ecf20Sopenharmony_cistatic struct pt_pmu pt_pmu; 338c2ecf20Sopenharmony_ci 348c2ecf20Sopenharmony_ci/* 358c2ecf20Sopenharmony_ci * Capabilities of Intel PT hardware, such as number of address bits or 368c2ecf20Sopenharmony_ci * supported output schemes, are cached and exported to userspace as "caps" 378c2ecf20Sopenharmony_ci * attribute group of pt pmu device 388c2ecf20Sopenharmony_ci * (/sys/bus/event_source/devices/intel_pt/caps/) so that userspace can store 398c2ecf20Sopenharmony_ci * relevant bits together with intel_pt traces. 408c2ecf20Sopenharmony_ci * 418c2ecf20Sopenharmony_ci * These are necessary for both trace decoding (payloads_lip, contains address 428c2ecf20Sopenharmony_ci * width encoded in IP-related packets), and event configuration (bitmasks with 438c2ecf20Sopenharmony_ci * permitted values for certain bit fields). 448c2ecf20Sopenharmony_ci */ 458c2ecf20Sopenharmony_ci#define PT_CAP(_n, _l, _r, _m) \ 468c2ecf20Sopenharmony_ci [PT_CAP_ ## _n] = { .name = __stringify(_n), .leaf = _l, \ 478c2ecf20Sopenharmony_ci .reg = _r, .mask = _m } 488c2ecf20Sopenharmony_ci 498c2ecf20Sopenharmony_cistatic struct pt_cap_desc { 508c2ecf20Sopenharmony_ci const char *name; 518c2ecf20Sopenharmony_ci u32 leaf; 528c2ecf20Sopenharmony_ci u8 reg; 538c2ecf20Sopenharmony_ci u32 mask; 548c2ecf20Sopenharmony_ci} pt_caps[] = { 558c2ecf20Sopenharmony_ci PT_CAP(max_subleaf, 0, CPUID_EAX, 0xffffffff), 568c2ecf20Sopenharmony_ci PT_CAP(cr3_filtering, 0, CPUID_EBX, BIT(0)), 578c2ecf20Sopenharmony_ci PT_CAP(psb_cyc, 0, CPUID_EBX, BIT(1)), 588c2ecf20Sopenharmony_ci PT_CAP(ip_filtering, 0, CPUID_EBX, BIT(2)), 598c2ecf20Sopenharmony_ci PT_CAP(mtc, 0, CPUID_EBX, BIT(3)), 608c2ecf20Sopenharmony_ci PT_CAP(ptwrite, 0, CPUID_EBX, BIT(4)), 618c2ecf20Sopenharmony_ci PT_CAP(power_event_trace, 0, CPUID_EBX, BIT(5)), 628c2ecf20Sopenharmony_ci PT_CAP(topa_output, 0, CPUID_ECX, BIT(0)), 638c2ecf20Sopenharmony_ci PT_CAP(topa_multiple_entries, 0, CPUID_ECX, BIT(1)), 648c2ecf20Sopenharmony_ci PT_CAP(single_range_output, 0, CPUID_ECX, BIT(2)), 658c2ecf20Sopenharmony_ci PT_CAP(output_subsys, 0, CPUID_ECX, BIT(3)), 668c2ecf20Sopenharmony_ci PT_CAP(payloads_lip, 0, CPUID_ECX, BIT(31)), 678c2ecf20Sopenharmony_ci PT_CAP(num_address_ranges, 1, CPUID_EAX, 0x7), 688c2ecf20Sopenharmony_ci PT_CAP(mtc_periods, 1, CPUID_EAX, 0xffff0000), 698c2ecf20Sopenharmony_ci PT_CAP(cycle_thresholds, 1, CPUID_EBX, 0xffff), 708c2ecf20Sopenharmony_ci PT_CAP(psb_periods, 1, CPUID_EBX, 0xffff0000), 718c2ecf20Sopenharmony_ci}; 728c2ecf20Sopenharmony_ci 738c2ecf20Sopenharmony_ciu32 intel_pt_validate_cap(u32 *caps, enum pt_capabilities capability) 748c2ecf20Sopenharmony_ci{ 758c2ecf20Sopenharmony_ci struct pt_cap_desc *cd = &pt_caps[capability]; 768c2ecf20Sopenharmony_ci u32 c = caps[cd->leaf * PT_CPUID_REGS_NUM + cd->reg]; 778c2ecf20Sopenharmony_ci unsigned int shift = __ffs(cd->mask); 788c2ecf20Sopenharmony_ci 798c2ecf20Sopenharmony_ci return (c & cd->mask) >> shift; 808c2ecf20Sopenharmony_ci} 818c2ecf20Sopenharmony_ciEXPORT_SYMBOL_GPL(intel_pt_validate_cap); 828c2ecf20Sopenharmony_ci 838c2ecf20Sopenharmony_ciu32 intel_pt_validate_hw_cap(enum pt_capabilities cap) 848c2ecf20Sopenharmony_ci{ 858c2ecf20Sopenharmony_ci return intel_pt_validate_cap(pt_pmu.caps, cap); 868c2ecf20Sopenharmony_ci} 878c2ecf20Sopenharmony_ciEXPORT_SYMBOL_GPL(intel_pt_validate_hw_cap); 888c2ecf20Sopenharmony_ci 898c2ecf20Sopenharmony_cistatic ssize_t pt_cap_show(struct device *cdev, 908c2ecf20Sopenharmony_ci struct device_attribute *attr, 918c2ecf20Sopenharmony_ci char *buf) 928c2ecf20Sopenharmony_ci{ 938c2ecf20Sopenharmony_ci struct dev_ext_attribute *ea = 948c2ecf20Sopenharmony_ci container_of(attr, struct dev_ext_attribute, attr); 958c2ecf20Sopenharmony_ci enum pt_capabilities cap = (long)ea->var; 968c2ecf20Sopenharmony_ci 978c2ecf20Sopenharmony_ci return snprintf(buf, PAGE_SIZE, "%x\n", intel_pt_validate_hw_cap(cap)); 988c2ecf20Sopenharmony_ci} 998c2ecf20Sopenharmony_ci 1008c2ecf20Sopenharmony_cistatic struct attribute_group pt_cap_group __ro_after_init = { 1018c2ecf20Sopenharmony_ci .name = "caps", 1028c2ecf20Sopenharmony_ci}; 1038c2ecf20Sopenharmony_ci 1048c2ecf20Sopenharmony_ciPMU_FORMAT_ATTR(pt, "config:0" ); 1058c2ecf20Sopenharmony_ciPMU_FORMAT_ATTR(cyc, "config:1" ); 1068c2ecf20Sopenharmony_ciPMU_FORMAT_ATTR(pwr_evt, "config:4" ); 1078c2ecf20Sopenharmony_ciPMU_FORMAT_ATTR(fup_on_ptw, "config:5" ); 1088c2ecf20Sopenharmony_ciPMU_FORMAT_ATTR(mtc, "config:9" ); 1098c2ecf20Sopenharmony_ciPMU_FORMAT_ATTR(tsc, "config:10" ); 1108c2ecf20Sopenharmony_ciPMU_FORMAT_ATTR(noretcomp, "config:11" ); 1118c2ecf20Sopenharmony_ciPMU_FORMAT_ATTR(ptw, "config:12" ); 1128c2ecf20Sopenharmony_ciPMU_FORMAT_ATTR(branch, "config:13" ); 1138c2ecf20Sopenharmony_ciPMU_FORMAT_ATTR(mtc_period, "config:14-17" ); 1148c2ecf20Sopenharmony_ciPMU_FORMAT_ATTR(cyc_thresh, "config:19-22" ); 1158c2ecf20Sopenharmony_ciPMU_FORMAT_ATTR(psb_period, "config:24-27" ); 1168c2ecf20Sopenharmony_ci 1178c2ecf20Sopenharmony_cistatic struct attribute *pt_formats_attr[] = { 1188c2ecf20Sopenharmony_ci &format_attr_pt.attr, 1198c2ecf20Sopenharmony_ci &format_attr_cyc.attr, 1208c2ecf20Sopenharmony_ci &format_attr_pwr_evt.attr, 1218c2ecf20Sopenharmony_ci &format_attr_fup_on_ptw.attr, 1228c2ecf20Sopenharmony_ci &format_attr_mtc.attr, 1238c2ecf20Sopenharmony_ci &format_attr_tsc.attr, 1248c2ecf20Sopenharmony_ci &format_attr_noretcomp.attr, 1258c2ecf20Sopenharmony_ci &format_attr_ptw.attr, 1268c2ecf20Sopenharmony_ci &format_attr_branch.attr, 1278c2ecf20Sopenharmony_ci &format_attr_mtc_period.attr, 1288c2ecf20Sopenharmony_ci &format_attr_cyc_thresh.attr, 1298c2ecf20Sopenharmony_ci &format_attr_psb_period.attr, 1308c2ecf20Sopenharmony_ci NULL, 1318c2ecf20Sopenharmony_ci}; 1328c2ecf20Sopenharmony_ci 1338c2ecf20Sopenharmony_cistatic struct attribute_group pt_format_group = { 1348c2ecf20Sopenharmony_ci .name = "format", 1358c2ecf20Sopenharmony_ci .attrs = pt_formats_attr, 1368c2ecf20Sopenharmony_ci}; 1378c2ecf20Sopenharmony_ci 1388c2ecf20Sopenharmony_cistatic ssize_t 1398c2ecf20Sopenharmony_cipt_timing_attr_show(struct device *dev, struct device_attribute *attr, 1408c2ecf20Sopenharmony_ci char *page) 1418c2ecf20Sopenharmony_ci{ 1428c2ecf20Sopenharmony_ci struct perf_pmu_events_attr *pmu_attr = 1438c2ecf20Sopenharmony_ci container_of(attr, struct perf_pmu_events_attr, attr); 1448c2ecf20Sopenharmony_ci 1458c2ecf20Sopenharmony_ci switch (pmu_attr->id) { 1468c2ecf20Sopenharmony_ci case 0: 1478c2ecf20Sopenharmony_ci return sprintf(page, "%lu\n", pt_pmu.max_nonturbo_ratio); 1488c2ecf20Sopenharmony_ci case 1: 1498c2ecf20Sopenharmony_ci return sprintf(page, "%u:%u\n", 1508c2ecf20Sopenharmony_ci pt_pmu.tsc_art_num, 1518c2ecf20Sopenharmony_ci pt_pmu.tsc_art_den); 1528c2ecf20Sopenharmony_ci default: 1538c2ecf20Sopenharmony_ci break; 1548c2ecf20Sopenharmony_ci } 1558c2ecf20Sopenharmony_ci 1568c2ecf20Sopenharmony_ci return -EINVAL; 1578c2ecf20Sopenharmony_ci} 1588c2ecf20Sopenharmony_ci 1598c2ecf20Sopenharmony_ciPMU_EVENT_ATTR(max_nonturbo_ratio, timing_attr_max_nonturbo_ratio, 0, 1608c2ecf20Sopenharmony_ci pt_timing_attr_show); 1618c2ecf20Sopenharmony_ciPMU_EVENT_ATTR(tsc_art_ratio, timing_attr_tsc_art_ratio, 1, 1628c2ecf20Sopenharmony_ci pt_timing_attr_show); 1638c2ecf20Sopenharmony_ci 1648c2ecf20Sopenharmony_cistatic struct attribute *pt_timing_attr[] = { 1658c2ecf20Sopenharmony_ci &timing_attr_max_nonturbo_ratio.attr.attr, 1668c2ecf20Sopenharmony_ci &timing_attr_tsc_art_ratio.attr.attr, 1678c2ecf20Sopenharmony_ci NULL, 1688c2ecf20Sopenharmony_ci}; 1698c2ecf20Sopenharmony_ci 1708c2ecf20Sopenharmony_cistatic struct attribute_group pt_timing_group = { 1718c2ecf20Sopenharmony_ci .attrs = pt_timing_attr, 1728c2ecf20Sopenharmony_ci}; 1738c2ecf20Sopenharmony_ci 1748c2ecf20Sopenharmony_cistatic const struct attribute_group *pt_attr_groups[] = { 1758c2ecf20Sopenharmony_ci &pt_cap_group, 1768c2ecf20Sopenharmony_ci &pt_format_group, 1778c2ecf20Sopenharmony_ci &pt_timing_group, 1788c2ecf20Sopenharmony_ci NULL, 1798c2ecf20Sopenharmony_ci}; 1808c2ecf20Sopenharmony_ci 1818c2ecf20Sopenharmony_cistatic int __init pt_pmu_hw_init(void) 1828c2ecf20Sopenharmony_ci{ 1838c2ecf20Sopenharmony_ci struct dev_ext_attribute *de_attrs; 1848c2ecf20Sopenharmony_ci struct attribute **attrs; 1858c2ecf20Sopenharmony_ci size_t size; 1868c2ecf20Sopenharmony_ci u64 reg; 1878c2ecf20Sopenharmony_ci int ret; 1888c2ecf20Sopenharmony_ci long i; 1898c2ecf20Sopenharmony_ci 1908c2ecf20Sopenharmony_ci rdmsrl(MSR_PLATFORM_INFO, reg); 1918c2ecf20Sopenharmony_ci pt_pmu.max_nonturbo_ratio = (reg & 0xff00) >> 8; 1928c2ecf20Sopenharmony_ci 1938c2ecf20Sopenharmony_ci /* 1948c2ecf20Sopenharmony_ci * if available, read in TSC to core crystal clock ratio, 1958c2ecf20Sopenharmony_ci * otherwise, zero for numerator stands for "not enumerated" 1968c2ecf20Sopenharmony_ci * as per SDM 1978c2ecf20Sopenharmony_ci */ 1988c2ecf20Sopenharmony_ci if (boot_cpu_data.cpuid_level >= CPUID_TSC_LEAF) { 1998c2ecf20Sopenharmony_ci u32 eax, ebx, ecx, edx; 2008c2ecf20Sopenharmony_ci 2018c2ecf20Sopenharmony_ci cpuid(CPUID_TSC_LEAF, &eax, &ebx, &ecx, &edx); 2028c2ecf20Sopenharmony_ci 2038c2ecf20Sopenharmony_ci pt_pmu.tsc_art_num = ebx; 2048c2ecf20Sopenharmony_ci pt_pmu.tsc_art_den = eax; 2058c2ecf20Sopenharmony_ci } 2068c2ecf20Sopenharmony_ci 2078c2ecf20Sopenharmony_ci /* model-specific quirks */ 2088c2ecf20Sopenharmony_ci switch (boot_cpu_data.x86_model) { 2098c2ecf20Sopenharmony_ci case INTEL_FAM6_BROADWELL: 2108c2ecf20Sopenharmony_ci case INTEL_FAM6_BROADWELL_D: 2118c2ecf20Sopenharmony_ci case INTEL_FAM6_BROADWELL_G: 2128c2ecf20Sopenharmony_ci case INTEL_FAM6_BROADWELL_X: 2138c2ecf20Sopenharmony_ci /* not setting BRANCH_EN will #GP, erratum BDM106 */ 2148c2ecf20Sopenharmony_ci pt_pmu.branch_en_always_on = true; 2158c2ecf20Sopenharmony_ci break; 2168c2ecf20Sopenharmony_ci default: 2178c2ecf20Sopenharmony_ci break; 2188c2ecf20Sopenharmony_ci } 2198c2ecf20Sopenharmony_ci 2208c2ecf20Sopenharmony_ci if (boot_cpu_has(X86_FEATURE_VMX)) { 2218c2ecf20Sopenharmony_ci /* 2228c2ecf20Sopenharmony_ci * Intel SDM, 36.5 "Tracing post-VMXON" says that 2238c2ecf20Sopenharmony_ci * "IA32_VMX_MISC[bit 14]" being 1 means PT can trace 2248c2ecf20Sopenharmony_ci * post-VMXON. 2258c2ecf20Sopenharmony_ci */ 2268c2ecf20Sopenharmony_ci rdmsrl(MSR_IA32_VMX_MISC, reg); 2278c2ecf20Sopenharmony_ci if (reg & BIT(14)) 2288c2ecf20Sopenharmony_ci pt_pmu.vmx = true; 2298c2ecf20Sopenharmony_ci } 2308c2ecf20Sopenharmony_ci 2318c2ecf20Sopenharmony_ci for (i = 0; i < PT_CPUID_LEAVES; i++) { 2328c2ecf20Sopenharmony_ci cpuid_count(20, i, 2338c2ecf20Sopenharmony_ci &pt_pmu.caps[CPUID_EAX + i*PT_CPUID_REGS_NUM], 2348c2ecf20Sopenharmony_ci &pt_pmu.caps[CPUID_EBX + i*PT_CPUID_REGS_NUM], 2358c2ecf20Sopenharmony_ci &pt_pmu.caps[CPUID_ECX + i*PT_CPUID_REGS_NUM], 2368c2ecf20Sopenharmony_ci &pt_pmu.caps[CPUID_EDX + i*PT_CPUID_REGS_NUM]); 2378c2ecf20Sopenharmony_ci } 2388c2ecf20Sopenharmony_ci 2398c2ecf20Sopenharmony_ci ret = -ENOMEM; 2408c2ecf20Sopenharmony_ci size = sizeof(struct attribute *) * (ARRAY_SIZE(pt_caps)+1); 2418c2ecf20Sopenharmony_ci attrs = kzalloc(size, GFP_KERNEL); 2428c2ecf20Sopenharmony_ci if (!attrs) 2438c2ecf20Sopenharmony_ci goto fail; 2448c2ecf20Sopenharmony_ci 2458c2ecf20Sopenharmony_ci size = sizeof(struct dev_ext_attribute) * (ARRAY_SIZE(pt_caps)+1); 2468c2ecf20Sopenharmony_ci de_attrs = kzalloc(size, GFP_KERNEL); 2478c2ecf20Sopenharmony_ci if (!de_attrs) 2488c2ecf20Sopenharmony_ci goto fail; 2498c2ecf20Sopenharmony_ci 2508c2ecf20Sopenharmony_ci for (i = 0; i < ARRAY_SIZE(pt_caps); i++) { 2518c2ecf20Sopenharmony_ci struct dev_ext_attribute *de_attr = de_attrs + i; 2528c2ecf20Sopenharmony_ci 2538c2ecf20Sopenharmony_ci de_attr->attr.attr.name = pt_caps[i].name; 2548c2ecf20Sopenharmony_ci 2558c2ecf20Sopenharmony_ci sysfs_attr_init(&de_attr->attr.attr); 2568c2ecf20Sopenharmony_ci 2578c2ecf20Sopenharmony_ci de_attr->attr.attr.mode = S_IRUGO; 2588c2ecf20Sopenharmony_ci de_attr->attr.show = pt_cap_show; 2598c2ecf20Sopenharmony_ci de_attr->var = (void *)i; 2608c2ecf20Sopenharmony_ci 2618c2ecf20Sopenharmony_ci attrs[i] = &de_attr->attr.attr; 2628c2ecf20Sopenharmony_ci } 2638c2ecf20Sopenharmony_ci 2648c2ecf20Sopenharmony_ci pt_cap_group.attrs = attrs; 2658c2ecf20Sopenharmony_ci 2668c2ecf20Sopenharmony_ci return 0; 2678c2ecf20Sopenharmony_ci 2688c2ecf20Sopenharmony_cifail: 2698c2ecf20Sopenharmony_ci kfree(attrs); 2708c2ecf20Sopenharmony_ci 2718c2ecf20Sopenharmony_ci return ret; 2728c2ecf20Sopenharmony_ci} 2738c2ecf20Sopenharmony_ci 2748c2ecf20Sopenharmony_ci#define RTIT_CTL_CYC_PSB (RTIT_CTL_CYCLEACC | \ 2758c2ecf20Sopenharmony_ci RTIT_CTL_CYC_THRESH | \ 2768c2ecf20Sopenharmony_ci RTIT_CTL_PSB_FREQ) 2778c2ecf20Sopenharmony_ci 2788c2ecf20Sopenharmony_ci#define RTIT_CTL_MTC (RTIT_CTL_MTC_EN | \ 2798c2ecf20Sopenharmony_ci RTIT_CTL_MTC_RANGE) 2808c2ecf20Sopenharmony_ci 2818c2ecf20Sopenharmony_ci#define RTIT_CTL_PTW (RTIT_CTL_PTW_EN | \ 2828c2ecf20Sopenharmony_ci RTIT_CTL_FUP_ON_PTW) 2838c2ecf20Sopenharmony_ci 2848c2ecf20Sopenharmony_ci/* 2858c2ecf20Sopenharmony_ci * Bit 0 (TraceEn) in the attr.config is meaningless as the 2868c2ecf20Sopenharmony_ci * corresponding bit in the RTIT_CTL can only be controlled 2878c2ecf20Sopenharmony_ci * by the driver; therefore, repurpose it to mean: pass 2888c2ecf20Sopenharmony_ci * through the bit that was previously assumed to be always 2898c2ecf20Sopenharmony_ci * on for PT, thereby allowing the user to *not* set it if 2908c2ecf20Sopenharmony_ci * they so wish. See also pt_event_valid() and pt_config(). 2918c2ecf20Sopenharmony_ci */ 2928c2ecf20Sopenharmony_ci#define RTIT_CTL_PASSTHROUGH RTIT_CTL_TRACEEN 2938c2ecf20Sopenharmony_ci 2948c2ecf20Sopenharmony_ci#define PT_CONFIG_MASK (RTIT_CTL_TRACEEN | \ 2958c2ecf20Sopenharmony_ci RTIT_CTL_TSC_EN | \ 2968c2ecf20Sopenharmony_ci RTIT_CTL_DISRETC | \ 2978c2ecf20Sopenharmony_ci RTIT_CTL_BRANCH_EN | \ 2988c2ecf20Sopenharmony_ci RTIT_CTL_CYC_PSB | \ 2998c2ecf20Sopenharmony_ci RTIT_CTL_MTC | \ 3008c2ecf20Sopenharmony_ci RTIT_CTL_PWR_EVT_EN | \ 3018c2ecf20Sopenharmony_ci RTIT_CTL_FUP_ON_PTW | \ 3028c2ecf20Sopenharmony_ci RTIT_CTL_PTW_EN) 3038c2ecf20Sopenharmony_ci 3048c2ecf20Sopenharmony_cistatic bool pt_event_valid(struct perf_event *event) 3058c2ecf20Sopenharmony_ci{ 3068c2ecf20Sopenharmony_ci u64 config = event->attr.config; 3078c2ecf20Sopenharmony_ci u64 allowed, requested; 3088c2ecf20Sopenharmony_ci 3098c2ecf20Sopenharmony_ci if ((config & PT_CONFIG_MASK) != config) 3108c2ecf20Sopenharmony_ci return false; 3118c2ecf20Sopenharmony_ci 3128c2ecf20Sopenharmony_ci if (config & RTIT_CTL_CYC_PSB) { 3138c2ecf20Sopenharmony_ci if (!intel_pt_validate_hw_cap(PT_CAP_psb_cyc)) 3148c2ecf20Sopenharmony_ci return false; 3158c2ecf20Sopenharmony_ci 3168c2ecf20Sopenharmony_ci allowed = intel_pt_validate_hw_cap(PT_CAP_psb_periods); 3178c2ecf20Sopenharmony_ci requested = (config & RTIT_CTL_PSB_FREQ) >> 3188c2ecf20Sopenharmony_ci RTIT_CTL_PSB_FREQ_OFFSET; 3198c2ecf20Sopenharmony_ci if (requested && (!(allowed & BIT(requested)))) 3208c2ecf20Sopenharmony_ci return false; 3218c2ecf20Sopenharmony_ci 3228c2ecf20Sopenharmony_ci allowed = intel_pt_validate_hw_cap(PT_CAP_cycle_thresholds); 3238c2ecf20Sopenharmony_ci requested = (config & RTIT_CTL_CYC_THRESH) >> 3248c2ecf20Sopenharmony_ci RTIT_CTL_CYC_THRESH_OFFSET; 3258c2ecf20Sopenharmony_ci if (requested && (!(allowed & BIT(requested)))) 3268c2ecf20Sopenharmony_ci return false; 3278c2ecf20Sopenharmony_ci } 3288c2ecf20Sopenharmony_ci 3298c2ecf20Sopenharmony_ci if (config & RTIT_CTL_MTC) { 3308c2ecf20Sopenharmony_ci /* 3318c2ecf20Sopenharmony_ci * In the unlikely case that CPUID lists valid mtc periods, 3328c2ecf20Sopenharmony_ci * but not the mtc capability, drop out here. 3338c2ecf20Sopenharmony_ci * 3348c2ecf20Sopenharmony_ci * Spec says that setting mtc period bits while mtc bit in 3358c2ecf20Sopenharmony_ci * CPUID is 0 will #GP, so better safe than sorry. 3368c2ecf20Sopenharmony_ci */ 3378c2ecf20Sopenharmony_ci if (!intel_pt_validate_hw_cap(PT_CAP_mtc)) 3388c2ecf20Sopenharmony_ci return false; 3398c2ecf20Sopenharmony_ci 3408c2ecf20Sopenharmony_ci allowed = intel_pt_validate_hw_cap(PT_CAP_mtc_periods); 3418c2ecf20Sopenharmony_ci if (!allowed) 3428c2ecf20Sopenharmony_ci return false; 3438c2ecf20Sopenharmony_ci 3448c2ecf20Sopenharmony_ci requested = (config & RTIT_CTL_MTC_RANGE) >> 3458c2ecf20Sopenharmony_ci RTIT_CTL_MTC_RANGE_OFFSET; 3468c2ecf20Sopenharmony_ci 3478c2ecf20Sopenharmony_ci if (!(allowed & BIT(requested))) 3488c2ecf20Sopenharmony_ci return false; 3498c2ecf20Sopenharmony_ci } 3508c2ecf20Sopenharmony_ci 3518c2ecf20Sopenharmony_ci if (config & RTIT_CTL_PWR_EVT_EN && 3528c2ecf20Sopenharmony_ci !intel_pt_validate_hw_cap(PT_CAP_power_event_trace)) 3538c2ecf20Sopenharmony_ci return false; 3548c2ecf20Sopenharmony_ci 3558c2ecf20Sopenharmony_ci if (config & RTIT_CTL_PTW) { 3568c2ecf20Sopenharmony_ci if (!intel_pt_validate_hw_cap(PT_CAP_ptwrite)) 3578c2ecf20Sopenharmony_ci return false; 3588c2ecf20Sopenharmony_ci 3598c2ecf20Sopenharmony_ci /* FUPonPTW without PTW doesn't make sense */ 3608c2ecf20Sopenharmony_ci if ((config & RTIT_CTL_FUP_ON_PTW) && 3618c2ecf20Sopenharmony_ci !(config & RTIT_CTL_PTW_EN)) 3628c2ecf20Sopenharmony_ci return false; 3638c2ecf20Sopenharmony_ci } 3648c2ecf20Sopenharmony_ci 3658c2ecf20Sopenharmony_ci /* 3668c2ecf20Sopenharmony_ci * Setting bit 0 (TraceEn in RTIT_CTL MSR) in the attr.config 3678c2ecf20Sopenharmony_ci * clears the assomption that BranchEn must always be enabled, 3688c2ecf20Sopenharmony_ci * as was the case with the first implementation of PT. 3698c2ecf20Sopenharmony_ci * If this bit is not set, the legacy behavior is preserved 3708c2ecf20Sopenharmony_ci * for compatibility with the older userspace. 3718c2ecf20Sopenharmony_ci * 3728c2ecf20Sopenharmony_ci * Re-using bit 0 for this purpose is fine because it is never 3738c2ecf20Sopenharmony_ci * directly set by the user; previous attempts at setting it in 3748c2ecf20Sopenharmony_ci * the attr.config resulted in -EINVAL. 3758c2ecf20Sopenharmony_ci */ 3768c2ecf20Sopenharmony_ci if (config & RTIT_CTL_PASSTHROUGH) { 3778c2ecf20Sopenharmony_ci /* 3788c2ecf20Sopenharmony_ci * Disallow not setting BRANCH_EN where BRANCH_EN is 3798c2ecf20Sopenharmony_ci * always required. 3808c2ecf20Sopenharmony_ci */ 3818c2ecf20Sopenharmony_ci if (pt_pmu.branch_en_always_on && 3828c2ecf20Sopenharmony_ci !(config & RTIT_CTL_BRANCH_EN)) 3838c2ecf20Sopenharmony_ci return false; 3848c2ecf20Sopenharmony_ci } else { 3858c2ecf20Sopenharmony_ci /* 3868c2ecf20Sopenharmony_ci * Disallow BRANCH_EN without the PASSTHROUGH. 3878c2ecf20Sopenharmony_ci */ 3888c2ecf20Sopenharmony_ci if (config & RTIT_CTL_BRANCH_EN) 3898c2ecf20Sopenharmony_ci return false; 3908c2ecf20Sopenharmony_ci } 3918c2ecf20Sopenharmony_ci 3928c2ecf20Sopenharmony_ci return true; 3938c2ecf20Sopenharmony_ci} 3948c2ecf20Sopenharmony_ci 3958c2ecf20Sopenharmony_ci/* 3968c2ecf20Sopenharmony_ci * PT configuration helpers 3978c2ecf20Sopenharmony_ci * These all are cpu affine and operate on a local PT 3988c2ecf20Sopenharmony_ci */ 3998c2ecf20Sopenharmony_ci 4008c2ecf20Sopenharmony_cistatic void pt_config_start(struct perf_event *event) 4018c2ecf20Sopenharmony_ci{ 4028c2ecf20Sopenharmony_ci struct pt *pt = this_cpu_ptr(&pt_ctx); 4038c2ecf20Sopenharmony_ci u64 ctl = event->hw.config; 4048c2ecf20Sopenharmony_ci 4058c2ecf20Sopenharmony_ci ctl |= RTIT_CTL_TRACEEN; 4068c2ecf20Sopenharmony_ci if (READ_ONCE(pt->vmx_on)) 4078c2ecf20Sopenharmony_ci perf_aux_output_flag(&pt->handle, PERF_AUX_FLAG_PARTIAL); 4088c2ecf20Sopenharmony_ci else 4098c2ecf20Sopenharmony_ci wrmsrl(MSR_IA32_RTIT_CTL, ctl); 4108c2ecf20Sopenharmony_ci 4118c2ecf20Sopenharmony_ci WRITE_ONCE(event->hw.config, ctl); 4128c2ecf20Sopenharmony_ci} 4138c2ecf20Sopenharmony_ci 4148c2ecf20Sopenharmony_ci/* Address ranges and their corresponding msr configuration registers */ 4158c2ecf20Sopenharmony_cistatic const struct pt_address_range { 4168c2ecf20Sopenharmony_ci unsigned long msr_a; 4178c2ecf20Sopenharmony_ci unsigned long msr_b; 4188c2ecf20Sopenharmony_ci unsigned int reg_off; 4198c2ecf20Sopenharmony_ci} pt_address_ranges[] = { 4208c2ecf20Sopenharmony_ci { 4218c2ecf20Sopenharmony_ci .msr_a = MSR_IA32_RTIT_ADDR0_A, 4228c2ecf20Sopenharmony_ci .msr_b = MSR_IA32_RTIT_ADDR0_B, 4238c2ecf20Sopenharmony_ci .reg_off = RTIT_CTL_ADDR0_OFFSET, 4248c2ecf20Sopenharmony_ci }, 4258c2ecf20Sopenharmony_ci { 4268c2ecf20Sopenharmony_ci .msr_a = MSR_IA32_RTIT_ADDR1_A, 4278c2ecf20Sopenharmony_ci .msr_b = MSR_IA32_RTIT_ADDR1_B, 4288c2ecf20Sopenharmony_ci .reg_off = RTIT_CTL_ADDR1_OFFSET, 4298c2ecf20Sopenharmony_ci }, 4308c2ecf20Sopenharmony_ci { 4318c2ecf20Sopenharmony_ci .msr_a = MSR_IA32_RTIT_ADDR2_A, 4328c2ecf20Sopenharmony_ci .msr_b = MSR_IA32_RTIT_ADDR2_B, 4338c2ecf20Sopenharmony_ci .reg_off = RTIT_CTL_ADDR2_OFFSET, 4348c2ecf20Sopenharmony_ci }, 4358c2ecf20Sopenharmony_ci { 4368c2ecf20Sopenharmony_ci .msr_a = MSR_IA32_RTIT_ADDR3_A, 4378c2ecf20Sopenharmony_ci .msr_b = MSR_IA32_RTIT_ADDR3_B, 4388c2ecf20Sopenharmony_ci .reg_off = RTIT_CTL_ADDR3_OFFSET, 4398c2ecf20Sopenharmony_ci } 4408c2ecf20Sopenharmony_ci}; 4418c2ecf20Sopenharmony_ci 4428c2ecf20Sopenharmony_cistatic u64 pt_config_filters(struct perf_event *event) 4438c2ecf20Sopenharmony_ci{ 4448c2ecf20Sopenharmony_ci struct pt_filters *filters = event->hw.addr_filters; 4458c2ecf20Sopenharmony_ci struct pt *pt = this_cpu_ptr(&pt_ctx); 4468c2ecf20Sopenharmony_ci unsigned int range = 0; 4478c2ecf20Sopenharmony_ci u64 rtit_ctl = 0; 4488c2ecf20Sopenharmony_ci 4498c2ecf20Sopenharmony_ci if (!filters) 4508c2ecf20Sopenharmony_ci return 0; 4518c2ecf20Sopenharmony_ci 4528c2ecf20Sopenharmony_ci perf_event_addr_filters_sync(event); 4538c2ecf20Sopenharmony_ci 4548c2ecf20Sopenharmony_ci for (range = 0; range < filters->nr_filters; range++) { 4558c2ecf20Sopenharmony_ci struct pt_filter *filter = &filters->filter[range]; 4568c2ecf20Sopenharmony_ci 4578c2ecf20Sopenharmony_ci /* 4588c2ecf20Sopenharmony_ci * Note, if the range has zero start/end addresses due 4598c2ecf20Sopenharmony_ci * to its dynamic object not being loaded yet, we just 4608c2ecf20Sopenharmony_ci * go ahead and program zeroed range, which will simply 4618c2ecf20Sopenharmony_ci * produce no data. Note^2: if executable code at 0x0 4628c2ecf20Sopenharmony_ci * is a concern, we can set up an "invalid" configuration 4638c2ecf20Sopenharmony_ci * such as msr_b < msr_a. 4648c2ecf20Sopenharmony_ci */ 4658c2ecf20Sopenharmony_ci 4668c2ecf20Sopenharmony_ci /* avoid redundant msr writes */ 4678c2ecf20Sopenharmony_ci if (pt->filters.filter[range].msr_a != filter->msr_a) { 4688c2ecf20Sopenharmony_ci wrmsrl(pt_address_ranges[range].msr_a, filter->msr_a); 4698c2ecf20Sopenharmony_ci pt->filters.filter[range].msr_a = filter->msr_a; 4708c2ecf20Sopenharmony_ci } 4718c2ecf20Sopenharmony_ci 4728c2ecf20Sopenharmony_ci if (pt->filters.filter[range].msr_b != filter->msr_b) { 4738c2ecf20Sopenharmony_ci wrmsrl(pt_address_ranges[range].msr_b, filter->msr_b); 4748c2ecf20Sopenharmony_ci pt->filters.filter[range].msr_b = filter->msr_b; 4758c2ecf20Sopenharmony_ci } 4768c2ecf20Sopenharmony_ci 4778c2ecf20Sopenharmony_ci rtit_ctl |= (u64)filter->config << pt_address_ranges[range].reg_off; 4788c2ecf20Sopenharmony_ci } 4798c2ecf20Sopenharmony_ci 4808c2ecf20Sopenharmony_ci return rtit_ctl; 4818c2ecf20Sopenharmony_ci} 4828c2ecf20Sopenharmony_ci 4838c2ecf20Sopenharmony_cistatic void pt_config(struct perf_event *event) 4848c2ecf20Sopenharmony_ci{ 4858c2ecf20Sopenharmony_ci struct pt *pt = this_cpu_ptr(&pt_ctx); 4868c2ecf20Sopenharmony_ci struct pt_buffer *buf = perf_get_aux(&pt->handle); 4878c2ecf20Sopenharmony_ci u64 reg; 4888c2ecf20Sopenharmony_ci 4898c2ecf20Sopenharmony_ci /* First round: clear STATUS, in particular the PSB byte counter. */ 4908c2ecf20Sopenharmony_ci if (!event->hw.config) { 4918c2ecf20Sopenharmony_ci perf_event_itrace_started(event); 4928c2ecf20Sopenharmony_ci wrmsrl(MSR_IA32_RTIT_STATUS, 0); 4938c2ecf20Sopenharmony_ci } 4948c2ecf20Sopenharmony_ci 4958c2ecf20Sopenharmony_ci reg = pt_config_filters(event); 4968c2ecf20Sopenharmony_ci reg |= RTIT_CTL_TRACEEN; 4978c2ecf20Sopenharmony_ci if (!buf->single) 4988c2ecf20Sopenharmony_ci reg |= RTIT_CTL_TOPA; 4998c2ecf20Sopenharmony_ci 5008c2ecf20Sopenharmony_ci /* 5018c2ecf20Sopenharmony_ci * Previously, we had BRANCH_EN on by default, but now that PT has 5028c2ecf20Sopenharmony_ci * grown features outside of branch tracing, it is useful to allow 5038c2ecf20Sopenharmony_ci * the user to disable it. Setting bit 0 in the event's attr.config 5048c2ecf20Sopenharmony_ci * allows BRANCH_EN to pass through instead of being always on. See 5058c2ecf20Sopenharmony_ci * also the comment in pt_event_valid(). 5068c2ecf20Sopenharmony_ci */ 5078c2ecf20Sopenharmony_ci if (event->attr.config & BIT(0)) { 5088c2ecf20Sopenharmony_ci reg |= event->attr.config & RTIT_CTL_BRANCH_EN; 5098c2ecf20Sopenharmony_ci } else { 5108c2ecf20Sopenharmony_ci reg |= RTIT_CTL_BRANCH_EN; 5118c2ecf20Sopenharmony_ci } 5128c2ecf20Sopenharmony_ci 5138c2ecf20Sopenharmony_ci if (!event->attr.exclude_kernel) 5148c2ecf20Sopenharmony_ci reg |= RTIT_CTL_OS; 5158c2ecf20Sopenharmony_ci if (!event->attr.exclude_user) 5168c2ecf20Sopenharmony_ci reg |= RTIT_CTL_USR; 5178c2ecf20Sopenharmony_ci 5188c2ecf20Sopenharmony_ci reg |= (event->attr.config & PT_CONFIG_MASK); 5198c2ecf20Sopenharmony_ci 5208c2ecf20Sopenharmony_ci event->hw.config = reg; 5218c2ecf20Sopenharmony_ci pt_config_start(event); 5228c2ecf20Sopenharmony_ci} 5238c2ecf20Sopenharmony_ci 5248c2ecf20Sopenharmony_cistatic void pt_config_stop(struct perf_event *event) 5258c2ecf20Sopenharmony_ci{ 5268c2ecf20Sopenharmony_ci struct pt *pt = this_cpu_ptr(&pt_ctx); 5278c2ecf20Sopenharmony_ci u64 ctl = READ_ONCE(event->hw.config); 5288c2ecf20Sopenharmony_ci 5298c2ecf20Sopenharmony_ci /* may be already stopped by a PMI */ 5308c2ecf20Sopenharmony_ci if (!(ctl & RTIT_CTL_TRACEEN)) 5318c2ecf20Sopenharmony_ci return; 5328c2ecf20Sopenharmony_ci 5338c2ecf20Sopenharmony_ci ctl &= ~RTIT_CTL_TRACEEN; 5348c2ecf20Sopenharmony_ci if (!READ_ONCE(pt->vmx_on)) 5358c2ecf20Sopenharmony_ci wrmsrl(MSR_IA32_RTIT_CTL, ctl); 5368c2ecf20Sopenharmony_ci 5378c2ecf20Sopenharmony_ci WRITE_ONCE(event->hw.config, ctl); 5388c2ecf20Sopenharmony_ci 5398c2ecf20Sopenharmony_ci /* 5408c2ecf20Sopenharmony_ci * A wrmsr that disables trace generation serializes other PT 5418c2ecf20Sopenharmony_ci * registers and causes all data packets to be written to memory, 5428c2ecf20Sopenharmony_ci * but a fence is required for the data to become globally visible. 5438c2ecf20Sopenharmony_ci * 5448c2ecf20Sopenharmony_ci * The below WMB, separating data store and aux_head store matches 5458c2ecf20Sopenharmony_ci * the consumer's RMB that separates aux_head load and data load. 5468c2ecf20Sopenharmony_ci */ 5478c2ecf20Sopenharmony_ci wmb(); 5488c2ecf20Sopenharmony_ci} 5498c2ecf20Sopenharmony_ci 5508c2ecf20Sopenharmony_ci/** 5518c2ecf20Sopenharmony_ci * struct topa - ToPA metadata 5528c2ecf20Sopenharmony_ci * @list: linkage to struct pt_buffer's list of tables 5538c2ecf20Sopenharmony_ci * @offset: offset of the first entry in this table in the buffer 5548c2ecf20Sopenharmony_ci * @size: total size of all entries in this table 5558c2ecf20Sopenharmony_ci * @last: index of the last initialized entry in this table 5568c2ecf20Sopenharmony_ci * @z_count: how many times the first entry repeats 5578c2ecf20Sopenharmony_ci */ 5588c2ecf20Sopenharmony_cistruct topa { 5598c2ecf20Sopenharmony_ci struct list_head list; 5608c2ecf20Sopenharmony_ci u64 offset; 5618c2ecf20Sopenharmony_ci size_t size; 5628c2ecf20Sopenharmony_ci int last; 5638c2ecf20Sopenharmony_ci unsigned int z_count; 5648c2ecf20Sopenharmony_ci}; 5658c2ecf20Sopenharmony_ci 5668c2ecf20Sopenharmony_ci/* 5678c2ecf20Sopenharmony_ci * Keep ToPA table-related metadata on the same page as the actual table, 5688c2ecf20Sopenharmony_ci * taking up a few words from the top 5698c2ecf20Sopenharmony_ci */ 5708c2ecf20Sopenharmony_ci 5718c2ecf20Sopenharmony_ci#define TENTS_PER_PAGE \ 5728c2ecf20Sopenharmony_ci ((PAGE_SIZE - sizeof(struct topa)) / sizeof(struct topa_entry)) 5738c2ecf20Sopenharmony_ci 5748c2ecf20Sopenharmony_ci/** 5758c2ecf20Sopenharmony_ci * struct topa_page - page-sized ToPA table with metadata at the top 5768c2ecf20Sopenharmony_ci * @table: actual ToPA table entries, as understood by PT hardware 5778c2ecf20Sopenharmony_ci * @topa: metadata 5788c2ecf20Sopenharmony_ci */ 5798c2ecf20Sopenharmony_cistruct topa_page { 5808c2ecf20Sopenharmony_ci struct topa_entry table[TENTS_PER_PAGE]; 5818c2ecf20Sopenharmony_ci struct topa topa; 5828c2ecf20Sopenharmony_ci}; 5838c2ecf20Sopenharmony_ci 5848c2ecf20Sopenharmony_cistatic inline struct topa_page *topa_to_page(struct topa *topa) 5858c2ecf20Sopenharmony_ci{ 5868c2ecf20Sopenharmony_ci return container_of(topa, struct topa_page, topa); 5878c2ecf20Sopenharmony_ci} 5888c2ecf20Sopenharmony_ci 5898c2ecf20Sopenharmony_cistatic inline struct topa_page *topa_entry_to_page(struct topa_entry *te) 5908c2ecf20Sopenharmony_ci{ 5918c2ecf20Sopenharmony_ci return (struct topa_page *)((unsigned long)te & PAGE_MASK); 5928c2ecf20Sopenharmony_ci} 5938c2ecf20Sopenharmony_ci 5948c2ecf20Sopenharmony_cistatic inline phys_addr_t topa_pfn(struct topa *topa) 5958c2ecf20Sopenharmony_ci{ 5968c2ecf20Sopenharmony_ci return PFN_DOWN(virt_to_phys(topa_to_page(topa))); 5978c2ecf20Sopenharmony_ci} 5988c2ecf20Sopenharmony_ci 5998c2ecf20Sopenharmony_ci/* make -1 stand for the last table entry */ 6008c2ecf20Sopenharmony_ci#define TOPA_ENTRY(t, i) \ 6018c2ecf20Sopenharmony_ci ((i) == -1 \ 6028c2ecf20Sopenharmony_ci ? &topa_to_page(t)->table[(t)->last] \ 6038c2ecf20Sopenharmony_ci : &topa_to_page(t)->table[(i)]) 6048c2ecf20Sopenharmony_ci#define TOPA_ENTRY_SIZE(t, i) (sizes(TOPA_ENTRY((t), (i))->size)) 6058c2ecf20Sopenharmony_ci#define TOPA_ENTRY_PAGES(t, i) (1 << TOPA_ENTRY((t), (i))->size) 6068c2ecf20Sopenharmony_ci 6078c2ecf20Sopenharmony_cistatic void pt_config_buffer(struct pt_buffer *buf) 6088c2ecf20Sopenharmony_ci{ 6098c2ecf20Sopenharmony_ci struct pt *pt = this_cpu_ptr(&pt_ctx); 6108c2ecf20Sopenharmony_ci u64 reg, mask; 6118c2ecf20Sopenharmony_ci void *base; 6128c2ecf20Sopenharmony_ci 6138c2ecf20Sopenharmony_ci if (buf->single) { 6148c2ecf20Sopenharmony_ci base = buf->data_pages[0]; 6158c2ecf20Sopenharmony_ci mask = (buf->nr_pages * PAGE_SIZE - 1) >> 7; 6168c2ecf20Sopenharmony_ci } else { 6178c2ecf20Sopenharmony_ci base = topa_to_page(buf->cur)->table; 6188c2ecf20Sopenharmony_ci mask = (u64)buf->cur_idx; 6198c2ecf20Sopenharmony_ci } 6208c2ecf20Sopenharmony_ci 6218c2ecf20Sopenharmony_ci reg = virt_to_phys(base); 6228c2ecf20Sopenharmony_ci if (pt->output_base != reg) { 6238c2ecf20Sopenharmony_ci pt->output_base = reg; 6248c2ecf20Sopenharmony_ci wrmsrl(MSR_IA32_RTIT_OUTPUT_BASE, reg); 6258c2ecf20Sopenharmony_ci } 6268c2ecf20Sopenharmony_ci 6278c2ecf20Sopenharmony_ci reg = 0x7f | (mask << 7) | ((u64)buf->output_off << 32); 6288c2ecf20Sopenharmony_ci if (pt->output_mask != reg) { 6298c2ecf20Sopenharmony_ci pt->output_mask = reg; 6308c2ecf20Sopenharmony_ci wrmsrl(MSR_IA32_RTIT_OUTPUT_MASK, reg); 6318c2ecf20Sopenharmony_ci } 6328c2ecf20Sopenharmony_ci} 6338c2ecf20Sopenharmony_ci 6348c2ecf20Sopenharmony_ci/** 6358c2ecf20Sopenharmony_ci * topa_alloc() - allocate page-sized ToPA table 6368c2ecf20Sopenharmony_ci * @cpu: CPU on which to allocate. 6378c2ecf20Sopenharmony_ci * @gfp: Allocation flags. 6388c2ecf20Sopenharmony_ci * 6398c2ecf20Sopenharmony_ci * Return: On success, return the pointer to ToPA table page. 6408c2ecf20Sopenharmony_ci */ 6418c2ecf20Sopenharmony_cistatic struct topa *topa_alloc(int cpu, gfp_t gfp) 6428c2ecf20Sopenharmony_ci{ 6438c2ecf20Sopenharmony_ci int node = cpu_to_node(cpu); 6448c2ecf20Sopenharmony_ci struct topa_page *tp; 6458c2ecf20Sopenharmony_ci struct page *p; 6468c2ecf20Sopenharmony_ci 6478c2ecf20Sopenharmony_ci p = alloc_pages_node(node, gfp | __GFP_ZERO, 0); 6488c2ecf20Sopenharmony_ci if (!p) 6498c2ecf20Sopenharmony_ci return NULL; 6508c2ecf20Sopenharmony_ci 6518c2ecf20Sopenharmony_ci tp = page_address(p); 6528c2ecf20Sopenharmony_ci tp->topa.last = 0; 6538c2ecf20Sopenharmony_ci 6548c2ecf20Sopenharmony_ci /* 6558c2ecf20Sopenharmony_ci * In case of singe-entry ToPA, always put the self-referencing END 6568c2ecf20Sopenharmony_ci * link as the 2nd entry in the table 6578c2ecf20Sopenharmony_ci */ 6588c2ecf20Sopenharmony_ci if (!intel_pt_validate_hw_cap(PT_CAP_topa_multiple_entries)) { 6598c2ecf20Sopenharmony_ci TOPA_ENTRY(&tp->topa, 1)->base = page_to_phys(p) >> TOPA_SHIFT; 6608c2ecf20Sopenharmony_ci TOPA_ENTRY(&tp->topa, 1)->end = 1; 6618c2ecf20Sopenharmony_ci } 6628c2ecf20Sopenharmony_ci 6638c2ecf20Sopenharmony_ci return &tp->topa; 6648c2ecf20Sopenharmony_ci} 6658c2ecf20Sopenharmony_ci 6668c2ecf20Sopenharmony_ci/** 6678c2ecf20Sopenharmony_ci * topa_free() - free a page-sized ToPA table 6688c2ecf20Sopenharmony_ci * @topa: Table to deallocate. 6698c2ecf20Sopenharmony_ci */ 6708c2ecf20Sopenharmony_cistatic void topa_free(struct topa *topa) 6718c2ecf20Sopenharmony_ci{ 6728c2ecf20Sopenharmony_ci free_page((unsigned long)topa); 6738c2ecf20Sopenharmony_ci} 6748c2ecf20Sopenharmony_ci 6758c2ecf20Sopenharmony_ci/** 6768c2ecf20Sopenharmony_ci * topa_insert_table() - insert a ToPA table into a buffer 6778c2ecf20Sopenharmony_ci * @buf: PT buffer that's being extended. 6788c2ecf20Sopenharmony_ci * @topa: New topa table to be inserted. 6798c2ecf20Sopenharmony_ci * 6808c2ecf20Sopenharmony_ci * If it's the first table in this buffer, set up buffer's pointers 6818c2ecf20Sopenharmony_ci * accordingly; otherwise, add a END=1 link entry to @topa to the current 6828c2ecf20Sopenharmony_ci * "last" table and adjust the last table pointer to @topa. 6838c2ecf20Sopenharmony_ci */ 6848c2ecf20Sopenharmony_cistatic void topa_insert_table(struct pt_buffer *buf, struct topa *topa) 6858c2ecf20Sopenharmony_ci{ 6868c2ecf20Sopenharmony_ci struct topa *last = buf->last; 6878c2ecf20Sopenharmony_ci 6888c2ecf20Sopenharmony_ci list_add_tail(&topa->list, &buf->tables); 6898c2ecf20Sopenharmony_ci 6908c2ecf20Sopenharmony_ci if (!buf->first) { 6918c2ecf20Sopenharmony_ci buf->first = buf->last = buf->cur = topa; 6928c2ecf20Sopenharmony_ci return; 6938c2ecf20Sopenharmony_ci } 6948c2ecf20Sopenharmony_ci 6958c2ecf20Sopenharmony_ci topa->offset = last->offset + last->size; 6968c2ecf20Sopenharmony_ci buf->last = topa; 6978c2ecf20Sopenharmony_ci 6988c2ecf20Sopenharmony_ci if (!intel_pt_validate_hw_cap(PT_CAP_topa_multiple_entries)) 6998c2ecf20Sopenharmony_ci return; 7008c2ecf20Sopenharmony_ci 7018c2ecf20Sopenharmony_ci BUG_ON(last->last != TENTS_PER_PAGE - 1); 7028c2ecf20Sopenharmony_ci 7038c2ecf20Sopenharmony_ci TOPA_ENTRY(last, -1)->base = topa_pfn(topa); 7048c2ecf20Sopenharmony_ci TOPA_ENTRY(last, -1)->end = 1; 7058c2ecf20Sopenharmony_ci} 7068c2ecf20Sopenharmony_ci 7078c2ecf20Sopenharmony_ci/** 7088c2ecf20Sopenharmony_ci * topa_table_full() - check if a ToPA table is filled up 7098c2ecf20Sopenharmony_ci * @topa: ToPA table. 7108c2ecf20Sopenharmony_ci */ 7118c2ecf20Sopenharmony_cistatic bool topa_table_full(struct topa *topa) 7128c2ecf20Sopenharmony_ci{ 7138c2ecf20Sopenharmony_ci /* single-entry ToPA is a special case */ 7148c2ecf20Sopenharmony_ci if (!intel_pt_validate_hw_cap(PT_CAP_topa_multiple_entries)) 7158c2ecf20Sopenharmony_ci return !!topa->last; 7168c2ecf20Sopenharmony_ci 7178c2ecf20Sopenharmony_ci return topa->last == TENTS_PER_PAGE - 1; 7188c2ecf20Sopenharmony_ci} 7198c2ecf20Sopenharmony_ci 7208c2ecf20Sopenharmony_ci/** 7218c2ecf20Sopenharmony_ci * topa_insert_pages() - create a list of ToPA tables 7228c2ecf20Sopenharmony_ci * @buf: PT buffer being initialized. 7238c2ecf20Sopenharmony_ci * @gfp: Allocation flags. 7248c2ecf20Sopenharmony_ci * 7258c2ecf20Sopenharmony_ci * This initializes a list of ToPA tables with entries from 7268c2ecf20Sopenharmony_ci * the data_pages provided by rb_alloc_aux(). 7278c2ecf20Sopenharmony_ci * 7288c2ecf20Sopenharmony_ci * Return: 0 on success or error code. 7298c2ecf20Sopenharmony_ci */ 7308c2ecf20Sopenharmony_cistatic int topa_insert_pages(struct pt_buffer *buf, int cpu, gfp_t gfp) 7318c2ecf20Sopenharmony_ci{ 7328c2ecf20Sopenharmony_ci struct topa *topa = buf->last; 7338c2ecf20Sopenharmony_ci int order = 0; 7348c2ecf20Sopenharmony_ci struct page *p; 7358c2ecf20Sopenharmony_ci 7368c2ecf20Sopenharmony_ci p = virt_to_page(buf->data_pages[buf->nr_pages]); 7378c2ecf20Sopenharmony_ci if (PagePrivate(p)) 7388c2ecf20Sopenharmony_ci order = page_private(p); 7398c2ecf20Sopenharmony_ci 7408c2ecf20Sopenharmony_ci if (topa_table_full(topa)) { 7418c2ecf20Sopenharmony_ci topa = topa_alloc(cpu, gfp); 7428c2ecf20Sopenharmony_ci if (!topa) 7438c2ecf20Sopenharmony_ci return -ENOMEM; 7448c2ecf20Sopenharmony_ci 7458c2ecf20Sopenharmony_ci topa_insert_table(buf, topa); 7468c2ecf20Sopenharmony_ci } 7478c2ecf20Sopenharmony_ci 7488c2ecf20Sopenharmony_ci if (topa->z_count == topa->last - 1) { 7498c2ecf20Sopenharmony_ci if (order == TOPA_ENTRY(topa, topa->last - 1)->size) 7508c2ecf20Sopenharmony_ci topa->z_count++; 7518c2ecf20Sopenharmony_ci } 7528c2ecf20Sopenharmony_ci 7538c2ecf20Sopenharmony_ci TOPA_ENTRY(topa, -1)->base = page_to_phys(p) >> TOPA_SHIFT; 7548c2ecf20Sopenharmony_ci TOPA_ENTRY(topa, -1)->size = order; 7558c2ecf20Sopenharmony_ci if (!buf->snapshot && 7568c2ecf20Sopenharmony_ci !intel_pt_validate_hw_cap(PT_CAP_topa_multiple_entries)) { 7578c2ecf20Sopenharmony_ci TOPA_ENTRY(topa, -1)->intr = 1; 7588c2ecf20Sopenharmony_ci TOPA_ENTRY(topa, -1)->stop = 1; 7598c2ecf20Sopenharmony_ci } 7608c2ecf20Sopenharmony_ci 7618c2ecf20Sopenharmony_ci topa->last++; 7628c2ecf20Sopenharmony_ci topa->size += sizes(order); 7638c2ecf20Sopenharmony_ci 7648c2ecf20Sopenharmony_ci buf->nr_pages += 1ul << order; 7658c2ecf20Sopenharmony_ci 7668c2ecf20Sopenharmony_ci return 0; 7678c2ecf20Sopenharmony_ci} 7688c2ecf20Sopenharmony_ci 7698c2ecf20Sopenharmony_ci/** 7708c2ecf20Sopenharmony_ci * pt_topa_dump() - print ToPA tables and their entries 7718c2ecf20Sopenharmony_ci * @buf: PT buffer. 7728c2ecf20Sopenharmony_ci */ 7738c2ecf20Sopenharmony_cistatic void pt_topa_dump(struct pt_buffer *buf) 7748c2ecf20Sopenharmony_ci{ 7758c2ecf20Sopenharmony_ci struct topa *topa; 7768c2ecf20Sopenharmony_ci 7778c2ecf20Sopenharmony_ci list_for_each_entry(topa, &buf->tables, list) { 7788c2ecf20Sopenharmony_ci struct topa_page *tp = topa_to_page(topa); 7798c2ecf20Sopenharmony_ci int i; 7808c2ecf20Sopenharmony_ci 7818c2ecf20Sopenharmony_ci pr_debug("# table @%p, off %llx size %zx\n", tp->table, 7828c2ecf20Sopenharmony_ci topa->offset, topa->size); 7838c2ecf20Sopenharmony_ci for (i = 0; i < TENTS_PER_PAGE; i++) { 7848c2ecf20Sopenharmony_ci pr_debug("# entry @%p (%lx sz %u %c%c%c) raw=%16llx\n", 7858c2ecf20Sopenharmony_ci &tp->table[i], 7868c2ecf20Sopenharmony_ci (unsigned long)tp->table[i].base << TOPA_SHIFT, 7878c2ecf20Sopenharmony_ci sizes(tp->table[i].size), 7888c2ecf20Sopenharmony_ci tp->table[i].end ? 'E' : ' ', 7898c2ecf20Sopenharmony_ci tp->table[i].intr ? 'I' : ' ', 7908c2ecf20Sopenharmony_ci tp->table[i].stop ? 'S' : ' ', 7918c2ecf20Sopenharmony_ci *(u64 *)&tp->table[i]); 7928c2ecf20Sopenharmony_ci if ((intel_pt_validate_hw_cap(PT_CAP_topa_multiple_entries) && 7938c2ecf20Sopenharmony_ci tp->table[i].stop) || 7948c2ecf20Sopenharmony_ci tp->table[i].end) 7958c2ecf20Sopenharmony_ci break; 7968c2ecf20Sopenharmony_ci if (!i && topa->z_count) 7978c2ecf20Sopenharmony_ci i += topa->z_count; 7988c2ecf20Sopenharmony_ci } 7998c2ecf20Sopenharmony_ci } 8008c2ecf20Sopenharmony_ci} 8018c2ecf20Sopenharmony_ci 8028c2ecf20Sopenharmony_ci/** 8038c2ecf20Sopenharmony_ci * pt_buffer_advance() - advance to the next output region 8048c2ecf20Sopenharmony_ci * @buf: PT buffer. 8058c2ecf20Sopenharmony_ci * 8068c2ecf20Sopenharmony_ci * Advance the current pointers in the buffer to the next ToPA entry. 8078c2ecf20Sopenharmony_ci */ 8088c2ecf20Sopenharmony_cistatic void pt_buffer_advance(struct pt_buffer *buf) 8098c2ecf20Sopenharmony_ci{ 8108c2ecf20Sopenharmony_ci buf->output_off = 0; 8118c2ecf20Sopenharmony_ci buf->cur_idx++; 8128c2ecf20Sopenharmony_ci 8138c2ecf20Sopenharmony_ci if (buf->cur_idx == buf->cur->last) { 8148c2ecf20Sopenharmony_ci if (buf->cur == buf->last) 8158c2ecf20Sopenharmony_ci buf->cur = buf->first; 8168c2ecf20Sopenharmony_ci else 8178c2ecf20Sopenharmony_ci buf->cur = list_entry(buf->cur->list.next, struct topa, 8188c2ecf20Sopenharmony_ci list); 8198c2ecf20Sopenharmony_ci buf->cur_idx = 0; 8208c2ecf20Sopenharmony_ci } 8218c2ecf20Sopenharmony_ci} 8228c2ecf20Sopenharmony_ci 8238c2ecf20Sopenharmony_ci/** 8248c2ecf20Sopenharmony_ci * pt_update_head() - calculate current offsets and sizes 8258c2ecf20Sopenharmony_ci * @pt: Per-cpu pt context. 8268c2ecf20Sopenharmony_ci * 8278c2ecf20Sopenharmony_ci * Update buffer's current write pointer position and data size. 8288c2ecf20Sopenharmony_ci */ 8298c2ecf20Sopenharmony_cistatic void pt_update_head(struct pt *pt) 8308c2ecf20Sopenharmony_ci{ 8318c2ecf20Sopenharmony_ci struct pt_buffer *buf = perf_get_aux(&pt->handle); 8328c2ecf20Sopenharmony_ci u64 topa_idx, base, old; 8338c2ecf20Sopenharmony_ci 8348c2ecf20Sopenharmony_ci if (buf->single) { 8358c2ecf20Sopenharmony_ci local_set(&buf->data_size, buf->output_off); 8368c2ecf20Sopenharmony_ci return; 8378c2ecf20Sopenharmony_ci } 8388c2ecf20Sopenharmony_ci 8398c2ecf20Sopenharmony_ci /* offset of the first region in this table from the beginning of buf */ 8408c2ecf20Sopenharmony_ci base = buf->cur->offset + buf->output_off; 8418c2ecf20Sopenharmony_ci 8428c2ecf20Sopenharmony_ci /* offset of the current output region within this table */ 8438c2ecf20Sopenharmony_ci for (topa_idx = 0; topa_idx < buf->cur_idx; topa_idx++) 8448c2ecf20Sopenharmony_ci base += TOPA_ENTRY_SIZE(buf->cur, topa_idx); 8458c2ecf20Sopenharmony_ci 8468c2ecf20Sopenharmony_ci if (buf->snapshot) { 8478c2ecf20Sopenharmony_ci local_set(&buf->data_size, base); 8488c2ecf20Sopenharmony_ci } else { 8498c2ecf20Sopenharmony_ci old = (local64_xchg(&buf->head, base) & 8508c2ecf20Sopenharmony_ci ((buf->nr_pages << PAGE_SHIFT) - 1)); 8518c2ecf20Sopenharmony_ci if (base < old) 8528c2ecf20Sopenharmony_ci base += buf->nr_pages << PAGE_SHIFT; 8538c2ecf20Sopenharmony_ci 8548c2ecf20Sopenharmony_ci local_add(base - old, &buf->data_size); 8558c2ecf20Sopenharmony_ci } 8568c2ecf20Sopenharmony_ci} 8578c2ecf20Sopenharmony_ci 8588c2ecf20Sopenharmony_ci/** 8598c2ecf20Sopenharmony_ci * pt_buffer_region() - obtain current output region's address 8608c2ecf20Sopenharmony_ci * @buf: PT buffer. 8618c2ecf20Sopenharmony_ci */ 8628c2ecf20Sopenharmony_cistatic void *pt_buffer_region(struct pt_buffer *buf) 8638c2ecf20Sopenharmony_ci{ 8648c2ecf20Sopenharmony_ci return phys_to_virt(TOPA_ENTRY(buf->cur, buf->cur_idx)->base << TOPA_SHIFT); 8658c2ecf20Sopenharmony_ci} 8668c2ecf20Sopenharmony_ci 8678c2ecf20Sopenharmony_ci/** 8688c2ecf20Sopenharmony_ci * pt_buffer_region_size() - obtain current output region's size 8698c2ecf20Sopenharmony_ci * @buf: PT buffer. 8708c2ecf20Sopenharmony_ci */ 8718c2ecf20Sopenharmony_cistatic size_t pt_buffer_region_size(struct pt_buffer *buf) 8728c2ecf20Sopenharmony_ci{ 8738c2ecf20Sopenharmony_ci return TOPA_ENTRY_SIZE(buf->cur, buf->cur_idx); 8748c2ecf20Sopenharmony_ci} 8758c2ecf20Sopenharmony_ci 8768c2ecf20Sopenharmony_ci/** 8778c2ecf20Sopenharmony_ci * pt_handle_status() - take care of possible status conditions 8788c2ecf20Sopenharmony_ci * @pt: Per-cpu pt context. 8798c2ecf20Sopenharmony_ci */ 8808c2ecf20Sopenharmony_cistatic void pt_handle_status(struct pt *pt) 8818c2ecf20Sopenharmony_ci{ 8828c2ecf20Sopenharmony_ci struct pt_buffer *buf = perf_get_aux(&pt->handle); 8838c2ecf20Sopenharmony_ci int advance = 0; 8848c2ecf20Sopenharmony_ci u64 status; 8858c2ecf20Sopenharmony_ci 8868c2ecf20Sopenharmony_ci rdmsrl(MSR_IA32_RTIT_STATUS, status); 8878c2ecf20Sopenharmony_ci 8888c2ecf20Sopenharmony_ci if (status & RTIT_STATUS_ERROR) { 8898c2ecf20Sopenharmony_ci pr_err_ratelimited("ToPA ERROR encountered, trying to recover\n"); 8908c2ecf20Sopenharmony_ci pt_topa_dump(buf); 8918c2ecf20Sopenharmony_ci status &= ~RTIT_STATUS_ERROR; 8928c2ecf20Sopenharmony_ci } 8938c2ecf20Sopenharmony_ci 8948c2ecf20Sopenharmony_ci if (status & RTIT_STATUS_STOPPED) { 8958c2ecf20Sopenharmony_ci status &= ~RTIT_STATUS_STOPPED; 8968c2ecf20Sopenharmony_ci 8978c2ecf20Sopenharmony_ci /* 8988c2ecf20Sopenharmony_ci * On systems that only do single-entry ToPA, hitting STOP 8998c2ecf20Sopenharmony_ci * means we are already losing data; need to let the decoder 9008c2ecf20Sopenharmony_ci * know. 9018c2ecf20Sopenharmony_ci */ 9028c2ecf20Sopenharmony_ci if (!buf->single && 9038c2ecf20Sopenharmony_ci (!intel_pt_validate_hw_cap(PT_CAP_topa_multiple_entries) || 9048c2ecf20Sopenharmony_ci buf->output_off == pt_buffer_region_size(buf))) { 9058c2ecf20Sopenharmony_ci perf_aux_output_flag(&pt->handle, 9068c2ecf20Sopenharmony_ci PERF_AUX_FLAG_TRUNCATED); 9078c2ecf20Sopenharmony_ci advance++; 9088c2ecf20Sopenharmony_ci } 9098c2ecf20Sopenharmony_ci } 9108c2ecf20Sopenharmony_ci 9118c2ecf20Sopenharmony_ci /* 9128c2ecf20Sopenharmony_ci * Also on single-entry ToPA implementations, interrupt will come 9138c2ecf20Sopenharmony_ci * before the output reaches its output region's boundary. 9148c2ecf20Sopenharmony_ci */ 9158c2ecf20Sopenharmony_ci if (!intel_pt_validate_hw_cap(PT_CAP_topa_multiple_entries) && 9168c2ecf20Sopenharmony_ci !buf->snapshot && 9178c2ecf20Sopenharmony_ci pt_buffer_region_size(buf) - buf->output_off <= TOPA_PMI_MARGIN) { 9188c2ecf20Sopenharmony_ci void *head = pt_buffer_region(buf); 9198c2ecf20Sopenharmony_ci 9208c2ecf20Sopenharmony_ci /* everything within this margin needs to be zeroed out */ 9218c2ecf20Sopenharmony_ci memset(head + buf->output_off, 0, 9228c2ecf20Sopenharmony_ci pt_buffer_region_size(buf) - 9238c2ecf20Sopenharmony_ci buf->output_off); 9248c2ecf20Sopenharmony_ci advance++; 9258c2ecf20Sopenharmony_ci } 9268c2ecf20Sopenharmony_ci 9278c2ecf20Sopenharmony_ci if (advance) 9288c2ecf20Sopenharmony_ci pt_buffer_advance(buf); 9298c2ecf20Sopenharmony_ci 9308c2ecf20Sopenharmony_ci wrmsrl(MSR_IA32_RTIT_STATUS, status); 9318c2ecf20Sopenharmony_ci} 9328c2ecf20Sopenharmony_ci 9338c2ecf20Sopenharmony_ci/** 9348c2ecf20Sopenharmony_ci * pt_read_offset() - translate registers into buffer pointers 9358c2ecf20Sopenharmony_ci * @buf: PT buffer. 9368c2ecf20Sopenharmony_ci * 9378c2ecf20Sopenharmony_ci * Set buffer's output pointers from MSR values. 9388c2ecf20Sopenharmony_ci */ 9398c2ecf20Sopenharmony_cistatic void pt_read_offset(struct pt_buffer *buf) 9408c2ecf20Sopenharmony_ci{ 9418c2ecf20Sopenharmony_ci struct pt *pt = this_cpu_ptr(&pt_ctx); 9428c2ecf20Sopenharmony_ci struct topa_page *tp; 9438c2ecf20Sopenharmony_ci 9448c2ecf20Sopenharmony_ci if (!buf->single) { 9458c2ecf20Sopenharmony_ci rdmsrl(MSR_IA32_RTIT_OUTPUT_BASE, pt->output_base); 9468c2ecf20Sopenharmony_ci tp = phys_to_virt(pt->output_base); 9478c2ecf20Sopenharmony_ci buf->cur = &tp->topa; 9488c2ecf20Sopenharmony_ci } 9498c2ecf20Sopenharmony_ci 9508c2ecf20Sopenharmony_ci rdmsrl(MSR_IA32_RTIT_OUTPUT_MASK, pt->output_mask); 9518c2ecf20Sopenharmony_ci /* offset within current output region */ 9528c2ecf20Sopenharmony_ci buf->output_off = pt->output_mask >> 32; 9538c2ecf20Sopenharmony_ci /* index of current output region within this table */ 9548c2ecf20Sopenharmony_ci if (!buf->single) 9558c2ecf20Sopenharmony_ci buf->cur_idx = (pt->output_mask & 0xffffff80) >> 7; 9568c2ecf20Sopenharmony_ci} 9578c2ecf20Sopenharmony_ci 9588c2ecf20Sopenharmony_cistatic struct topa_entry * 9598c2ecf20Sopenharmony_cipt_topa_entry_for_page(struct pt_buffer *buf, unsigned int pg) 9608c2ecf20Sopenharmony_ci{ 9618c2ecf20Sopenharmony_ci struct topa_page *tp; 9628c2ecf20Sopenharmony_ci struct topa *topa; 9638c2ecf20Sopenharmony_ci unsigned int idx, cur_pg = 0, z_pg = 0, start_idx = 0; 9648c2ecf20Sopenharmony_ci 9658c2ecf20Sopenharmony_ci /* 9668c2ecf20Sopenharmony_ci * Indicates a bug in the caller. 9678c2ecf20Sopenharmony_ci */ 9688c2ecf20Sopenharmony_ci if (WARN_ON_ONCE(pg >= buf->nr_pages)) 9698c2ecf20Sopenharmony_ci return NULL; 9708c2ecf20Sopenharmony_ci 9718c2ecf20Sopenharmony_ci /* 9728c2ecf20Sopenharmony_ci * First, find the ToPA table where @pg fits. With high 9738c2ecf20Sopenharmony_ci * order allocations, there shouldn't be many of these. 9748c2ecf20Sopenharmony_ci */ 9758c2ecf20Sopenharmony_ci list_for_each_entry(topa, &buf->tables, list) { 9768c2ecf20Sopenharmony_ci if (topa->offset + topa->size > pg << PAGE_SHIFT) 9778c2ecf20Sopenharmony_ci goto found; 9788c2ecf20Sopenharmony_ci } 9798c2ecf20Sopenharmony_ci 9808c2ecf20Sopenharmony_ci /* 9818c2ecf20Sopenharmony_ci * Hitting this means we have a problem in the ToPA 9828c2ecf20Sopenharmony_ci * allocation code. 9838c2ecf20Sopenharmony_ci */ 9848c2ecf20Sopenharmony_ci WARN_ON_ONCE(1); 9858c2ecf20Sopenharmony_ci 9868c2ecf20Sopenharmony_ci return NULL; 9878c2ecf20Sopenharmony_ci 9888c2ecf20Sopenharmony_cifound: 9898c2ecf20Sopenharmony_ci /* 9908c2ecf20Sopenharmony_ci * Indicates a problem in the ToPA allocation code. 9918c2ecf20Sopenharmony_ci */ 9928c2ecf20Sopenharmony_ci if (WARN_ON_ONCE(topa->last == -1)) 9938c2ecf20Sopenharmony_ci return NULL; 9948c2ecf20Sopenharmony_ci 9958c2ecf20Sopenharmony_ci tp = topa_to_page(topa); 9968c2ecf20Sopenharmony_ci cur_pg = PFN_DOWN(topa->offset); 9978c2ecf20Sopenharmony_ci if (topa->z_count) { 9988c2ecf20Sopenharmony_ci z_pg = TOPA_ENTRY_PAGES(topa, 0) * (topa->z_count + 1); 9998c2ecf20Sopenharmony_ci start_idx = topa->z_count + 1; 10008c2ecf20Sopenharmony_ci } 10018c2ecf20Sopenharmony_ci 10028c2ecf20Sopenharmony_ci /* 10038c2ecf20Sopenharmony_ci * Multiple entries at the beginning of the table have the same size, 10048c2ecf20Sopenharmony_ci * ideally all of them; if @pg falls there, the search is done. 10058c2ecf20Sopenharmony_ci */ 10068c2ecf20Sopenharmony_ci if (pg >= cur_pg && pg < cur_pg + z_pg) { 10078c2ecf20Sopenharmony_ci idx = (pg - cur_pg) / TOPA_ENTRY_PAGES(topa, 0); 10088c2ecf20Sopenharmony_ci return &tp->table[idx]; 10098c2ecf20Sopenharmony_ci } 10108c2ecf20Sopenharmony_ci 10118c2ecf20Sopenharmony_ci /* 10128c2ecf20Sopenharmony_ci * Otherwise, slow path: iterate through the remaining entries. 10138c2ecf20Sopenharmony_ci */ 10148c2ecf20Sopenharmony_ci for (idx = start_idx, cur_pg += z_pg; idx < topa->last; idx++) { 10158c2ecf20Sopenharmony_ci if (cur_pg + TOPA_ENTRY_PAGES(topa, idx) > pg) 10168c2ecf20Sopenharmony_ci return &tp->table[idx]; 10178c2ecf20Sopenharmony_ci 10188c2ecf20Sopenharmony_ci cur_pg += TOPA_ENTRY_PAGES(topa, idx); 10198c2ecf20Sopenharmony_ci } 10208c2ecf20Sopenharmony_ci 10218c2ecf20Sopenharmony_ci /* 10228c2ecf20Sopenharmony_ci * Means we couldn't find a ToPA entry in the table that does match. 10238c2ecf20Sopenharmony_ci */ 10248c2ecf20Sopenharmony_ci WARN_ON_ONCE(1); 10258c2ecf20Sopenharmony_ci 10268c2ecf20Sopenharmony_ci return NULL; 10278c2ecf20Sopenharmony_ci} 10288c2ecf20Sopenharmony_ci 10298c2ecf20Sopenharmony_cistatic struct topa_entry * 10308c2ecf20Sopenharmony_cipt_topa_prev_entry(struct pt_buffer *buf, struct topa_entry *te) 10318c2ecf20Sopenharmony_ci{ 10328c2ecf20Sopenharmony_ci unsigned long table = (unsigned long)te & ~(PAGE_SIZE - 1); 10338c2ecf20Sopenharmony_ci struct topa_page *tp; 10348c2ecf20Sopenharmony_ci struct topa *topa; 10358c2ecf20Sopenharmony_ci 10368c2ecf20Sopenharmony_ci tp = (struct topa_page *)table; 10378c2ecf20Sopenharmony_ci if (tp->table != te) 10388c2ecf20Sopenharmony_ci return --te; 10398c2ecf20Sopenharmony_ci 10408c2ecf20Sopenharmony_ci topa = &tp->topa; 10418c2ecf20Sopenharmony_ci if (topa == buf->first) 10428c2ecf20Sopenharmony_ci topa = buf->last; 10438c2ecf20Sopenharmony_ci else 10448c2ecf20Sopenharmony_ci topa = list_prev_entry(topa, list); 10458c2ecf20Sopenharmony_ci 10468c2ecf20Sopenharmony_ci tp = topa_to_page(topa); 10478c2ecf20Sopenharmony_ci 10488c2ecf20Sopenharmony_ci return &tp->table[topa->last - 1]; 10498c2ecf20Sopenharmony_ci} 10508c2ecf20Sopenharmony_ci 10518c2ecf20Sopenharmony_ci/** 10528c2ecf20Sopenharmony_ci * pt_buffer_reset_markers() - place interrupt and stop bits in the buffer 10538c2ecf20Sopenharmony_ci * @buf: PT buffer. 10548c2ecf20Sopenharmony_ci * @handle: Current output handle. 10558c2ecf20Sopenharmony_ci * 10568c2ecf20Sopenharmony_ci * Place INT and STOP marks to prevent overwriting old data that the consumer 10578c2ecf20Sopenharmony_ci * hasn't yet collected and waking up the consumer after a certain fraction of 10588c2ecf20Sopenharmony_ci * the buffer has filled up. Only needed and sensible for non-snapshot counters. 10598c2ecf20Sopenharmony_ci * 10608c2ecf20Sopenharmony_ci * This obviously relies on buf::head to figure out buffer markers, so it has 10618c2ecf20Sopenharmony_ci * to be called after pt_buffer_reset_offsets() and before the hardware tracing 10628c2ecf20Sopenharmony_ci * is enabled. 10638c2ecf20Sopenharmony_ci */ 10648c2ecf20Sopenharmony_cistatic int pt_buffer_reset_markers(struct pt_buffer *buf, 10658c2ecf20Sopenharmony_ci struct perf_output_handle *handle) 10668c2ecf20Sopenharmony_ci 10678c2ecf20Sopenharmony_ci{ 10688c2ecf20Sopenharmony_ci unsigned long head = local64_read(&buf->head); 10698c2ecf20Sopenharmony_ci unsigned long idx, npages, wakeup; 10708c2ecf20Sopenharmony_ci 10718c2ecf20Sopenharmony_ci if (buf->single) 10728c2ecf20Sopenharmony_ci return 0; 10738c2ecf20Sopenharmony_ci 10748c2ecf20Sopenharmony_ci /* can't stop in the middle of an output region */ 10758c2ecf20Sopenharmony_ci if (buf->output_off + handle->size + 1 < pt_buffer_region_size(buf)) { 10768c2ecf20Sopenharmony_ci perf_aux_output_flag(handle, PERF_AUX_FLAG_TRUNCATED); 10778c2ecf20Sopenharmony_ci return -EINVAL; 10788c2ecf20Sopenharmony_ci } 10798c2ecf20Sopenharmony_ci 10808c2ecf20Sopenharmony_ci 10818c2ecf20Sopenharmony_ci /* single entry ToPA is handled by marking all regions STOP=1 INT=1 */ 10828c2ecf20Sopenharmony_ci if (!intel_pt_validate_hw_cap(PT_CAP_topa_multiple_entries)) 10838c2ecf20Sopenharmony_ci return 0; 10848c2ecf20Sopenharmony_ci 10858c2ecf20Sopenharmony_ci /* clear STOP and INT from current entry */ 10868c2ecf20Sopenharmony_ci if (buf->stop_te) { 10878c2ecf20Sopenharmony_ci buf->stop_te->stop = 0; 10888c2ecf20Sopenharmony_ci buf->stop_te->intr = 0; 10898c2ecf20Sopenharmony_ci } 10908c2ecf20Sopenharmony_ci 10918c2ecf20Sopenharmony_ci if (buf->intr_te) 10928c2ecf20Sopenharmony_ci buf->intr_te->intr = 0; 10938c2ecf20Sopenharmony_ci 10948c2ecf20Sopenharmony_ci /* how many pages till the STOP marker */ 10958c2ecf20Sopenharmony_ci npages = handle->size >> PAGE_SHIFT; 10968c2ecf20Sopenharmony_ci 10978c2ecf20Sopenharmony_ci /* if it's on a page boundary, fill up one more page */ 10988c2ecf20Sopenharmony_ci if (!offset_in_page(head + handle->size + 1)) 10998c2ecf20Sopenharmony_ci npages++; 11008c2ecf20Sopenharmony_ci 11018c2ecf20Sopenharmony_ci idx = (head >> PAGE_SHIFT) + npages; 11028c2ecf20Sopenharmony_ci idx &= buf->nr_pages - 1; 11038c2ecf20Sopenharmony_ci 11048c2ecf20Sopenharmony_ci if (idx != buf->stop_pos) { 11058c2ecf20Sopenharmony_ci buf->stop_pos = idx; 11068c2ecf20Sopenharmony_ci buf->stop_te = pt_topa_entry_for_page(buf, idx); 11078c2ecf20Sopenharmony_ci buf->stop_te = pt_topa_prev_entry(buf, buf->stop_te); 11088c2ecf20Sopenharmony_ci } 11098c2ecf20Sopenharmony_ci 11108c2ecf20Sopenharmony_ci wakeup = handle->wakeup >> PAGE_SHIFT; 11118c2ecf20Sopenharmony_ci 11128c2ecf20Sopenharmony_ci /* in the worst case, wake up the consumer one page before hard stop */ 11138c2ecf20Sopenharmony_ci idx = (head >> PAGE_SHIFT) + npages - 1; 11148c2ecf20Sopenharmony_ci if (idx > wakeup) 11158c2ecf20Sopenharmony_ci idx = wakeup; 11168c2ecf20Sopenharmony_ci 11178c2ecf20Sopenharmony_ci idx &= buf->nr_pages - 1; 11188c2ecf20Sopenharmony_ci if (idx != buf->intr_pos) { 11198c2ecf20Sopenharmony_ci buf->intr_pos = idx; 11208c2ecf20Sopenharmony_ci buf->intr_te = pt_topa_entry_for_page(buf, idx); 11218c2ecf20Sopenharmony_ci buf->intr_te = pt_topa_prev_entry(buf, buf->intr_te); 11228c2ecf20Sopenharmony_ci } 11238c2ecf20Sopenharmony_ci 11248c2ecf20Sopenharmony_ci buf->stop_te->stop = 1; 11258c2ecf20Sopenharmony_ci buf->stop_te->intr = 1; 11268c2ecf20Sopenharmony_ci buf->intr_te->intr = 1; 11278c2ecf20Sopenharmony_ci 11288c2ecf20Sopenharmony_ci return 0; 11298c2ecf20Sopenharmony_ci} 11308c2ecf20Sopenharmony_ci 11318c2ecf20Sopenharmony_ci/** 11328c2ecf20Sopenharmony_ci * pt_buffer_reset_offsets() - adjust buffer's write pointers from aux_head 11338c2ecf20Sopenharmony_ci * @buf: PT buffer. 11348c2ecf20Sopenharmony_ci * @head: Write pointer (aux_head) from AUX buffer. 11358c2ecf20Sopenharmony_ci * 11368c2ecf20Sopenharmony_ci * Find the ToPA table and entry corresponding to given @head and set buffer's 11378c2ecf20Sopenharmony_ci * "current" pointers accordingly. This is done after we have obtained the 11388c2ecf20Sopenharmony_ci * current aux_head position from a successful call to perf_aux_output_begin() 11398c2ecf20Sopenharmony_ci * to make sure the hardware is writing to the right place. 11408c2ecf20Sopenharmony_ci * 11418c2ecf20Sopenharmony_ci * This function modifies buf::{cur,cur_idx,output_off} that will be programmed 11428c2ecf20Sopenharmony_ci * into PT msrs when the tracing is enabled and buf::head and buf::data_size, 11438c2ecf20Sopenharmony_ci * which are used to determine INT and STOP markers' locations by a subsequent 11448c2ecf20Sopenharmony_ci * call to pt_buffer_reset_markers(). 11458c2ecf20Sopenharmony_ci */ 11468c2ecf20Sopenharmony_cistatic void pt_buffer_reset_offsets(struct pt_buffer *buf, unsigned long head) 11478c2ecf20Sopenharmony_ci{ 11488c2ecf20Sopenharmony_ci struct topa_page *cur_tp; 11498c2ecf20Sopenharmony_ci struct topa_entry *te; 11508c2ecf20Sopenharmony_ci int pg; 11518c2ecf20Sopenharmony_ci 11528c2ecf20Sopenharmony_ci if (buf->snapshot) 11538c2ecf20Sopenharmony_ci head &= (buf->nr_pages << PAGE_SHIFT) - 1; 11548c2ecf20Sopenharmony_ci 11558c2ecf20Sopenharmony_ci if (!buf->single) { 11568c2ecf20Sopenharmony_ci pg = (head >> PAGE_SHIFT) & (buf->nr_pages - 1); 11578c2ecf20Sopenharmony_ci te = pt_topa_entry_for_page(buf, pg); 11588c2ecf20Sopenharmony_ci 11598c2ecf20Sopenharmony_ci cur_tp = topa_entry_to_page(te); 11608c2ecf20Sopenharmony_ci buf->cur = &cur_tp->topa; 11618c2ecf20Sopenharmony_ci buf->cur_idx = te - TOPA_ENTRY(buf->cur, 0); 11628c2ecf20Sopenharmony_ci buf->output_off = head & (pt_buffer_region_size(buf) - 1); 11638c2ecf20Sopenharmony_ci } else { 11648c2ecf20Sopenharmony_ci buf->output_off = head; 11658c2ecf20Sopenharmony_ci } 11668c2ecf20Sopenharmony_ci 11678c2ecf20Sopenharmony_ci local64_set(&buf->head, head); 11688c2ecf20Sopenharmony_ci local_set(&buf->data_size, 0); 11698c2ecf20Sopenharmony_ci} 11708c2ecf20Sopenharmony_ci 11718c2ecf20Sopenharmony_ci/** 11728c2ecf20Sopenharmony_ci * pt_buffer_fini_topa() - deallocate ToPA structure of a buffer 11738c2ecf20Sopenharmony_ci * @buf: PT buffer. 11748c2ecf20Sopenharmony_ci */ 11758c2ecf20Sopenharmony_cistatic void pt_buffer_fini_topa(struct pt_buffer *buf) 11768c2ecf20Sopenharmony_ci{ 11778c2ecf20Sopenharmony_ci struct topa *topa, *iter; 11788c2ecf20Sopenharmony_ci 11798c2ecf20Sopenharmony_ci if (buf->single) 11808c2ecf20Sopenharmony_ci return; 11818c2ecf20Sopenharmony_ci 11828c2ecf20Sopenharmony_ci list_for_each_entry_safe(topa, iter, &buf->tables, list) { 11838c2ecf20Sopenharmony_ci /* 11848c2ecf20Sopenharmony_ci * right now, this is in free_aux() path only, so 11858c2ecf20Sopenharmony_ci * no need to unlink this table from the list 11868c2ecf20Sopenharmony_ci */ 11878c2ecf20Sopenharmony_ci topa_free(topa); 11888c2ecf20Sopenharmony_ci } 11898c2ecf20Sopenharmony_ci} 11908c2ecf20Sopenharmony_ci 11918c2ecf20Sopenharmony_ci/** 11928c2ecf20Sopenharmony_ci * pt_buffer_init_topa() - initialize ToPA table for pt buffer 11938c2ecf20Sopenharmony_ci * @buf: PT buffer. 11948c2ecf20Sopenharmony_ci * @size: Total size of all regions within this ToPA. 11958c2ecf20Sopenharmony_ci * @gfp: Allocation flags. 11968c2ecf20Sopenharmony_ci */ 11978c2ecf20Sopenharmony_cistatic int pt_buffer_init_topa(struct pt_buffer *buf, int cpu, 11988c2ecf20Sopenharmony_ci unsigned long nr_pages, gfp_t gfp) 11998c2ecf20Sopenharmony_ci{ 12008c2ecf20Sopenharmony_ci struct topa *topa; 12018c2ecf20Sopenharmony_ci int err; 12028c2ecf20Sopenharmony_ci 12038c2ecf20Sopenharmony_ci topa = topa_alloc(cpu, gfp); 12048c2ecf20Sopenharmony_ci if (!topa) 12058c2ecf20Sopenharmony_ci return -ENOMEM; 12068c2ecf20Sopenharmony_ci 12078c2ecf20Sopenharmony_ci topa_insert_table(buf, topa); 12088c2ecf20Sopenharmony_ci 12098c2ecf20Sopenharmony_ci while (buf->nr_pages < nr_pages) { 12108c2ecf20Sopenharmony_ci err = topa_insert_pages(buf, cpu, gfp); 12118c2ecf20Sopenharmony_ci if (err) { 12128c2ecf20Sopenharmony_ci pt_buffer_fini_topa(buf); 12138c2ecf20Sopenharmony_ci return -ENOMEM; 12148c2ecf20Sopenharmony_ci } 12158c2ecf20Sopenharmony_ci } 12168c2ecf20Sopenharmony_ci 12178c2ecf20Sopenharmony_ci /* link last table to the first one, unless we're double buffering */ 12188c2ecf20Sopenharmony_ci if (intel_pt_validate_hw_cap(PT_CAP_topa_multiple_entries)) { 12198c2ecf20Sopenharmony_ci TOPA_ENTRY(buf->last, -1)->base = topa_pfn(buf->first); 12208c2ecf20Sopenharmony_ci TOPA_ENTRY(buf->last, -1)->end = 1; 12218c2ecf20Sopenharmony_ci } 12228c2ecf20Sopenharmony_ci 12238c2ecf20Sopenharmony_ci pt_topa_dump(buf); 12248c2ecf20Sopenharmony_ci return 0; 12258c2ecf20Sopenharmony_ci} 12268c2ecf20Sopenharmony_ci 12278c2ecf20Sopenharmony_cistatic int pt_buffer_try_single(struct pt_buffer *buf, int nr_pages) 12288c2ecf20Sopenharmony_ci{ 12298c2ecf20Sopenharmony_ci struct page *p = virt_to_page(buf->data_pages[0]); 12308c2ecf20Sopenharmony_ci int ret = -ENOTSUPP, order = 0; 12318c2ecf20Sopenharmony_ci 12328c2ecf20Sopenharmony_ci /* 12338c2ecf20Sopenharmony_ci * We can use single range output mode 12348c2ecf20Sopenharmony_ci * + in snapshot mode, where we don't need interrupts; 12358c2ecf20Sopenharmony_ci * + if the hardware supports it; 12368c2ecf20Sopenharmony_ci * + if the entire buffer is one contiguous allocation. 12378c2ecf20Sopenharmony_ci */ 12388c2ecf20Sopenharmony_ci if (!buf->snapshot) 12398c2ecf20Sopenharmony_ci goto out; 12408c2ecf20Sopenharmony_ci 12418c2ecf20Sopenharmony_ci if (!intel_pt_validate_hw_cap(PT_CAP_single_range_output)) 12428c2ecf20Sopenharmony_ci goto out; 12438c2ecf20Sopenharmony_ci 12448c2ecf20Sopenharmony_ci if (PagePrivate(p)) 12458c2ecf20Sopenharmony_ci order = page_private(p); 12468c2ecf20Sopenharmony_ci 12478c2ecf20Sopenharmony_ci if (1 << order != nr_pages) 12488c2ecf20Sopenharmony_ci goto out; 12498c2ecf20Sopenharmony_ci 12508c2ecf20Sopenharmony_ci /* 12518c2ecf20Sopenharmony_ci * Some processors cannot always support single range for more than 12528c2ecf20Sopenharmony_ci * 4KB - refer errata TGL052, ADL037 and RPL017. Future processors might 12538c2ecf20Sopenharmony_ci * also be affected, so for now rather than trying to keep track of 12548c2ecf20Sopenharmony_ci * which ones, just disable it for all. 12558c2ecf20Sopenharmony_ci */ 12568c2ecf20Sopenharmony_ci if (nr_pages > 1) 12578c2ecf20Sopenharmony_ci goto out; 12588c2ecf20Sopenharmony_ci 12598c2ecf20Sopenharmony_ci buf->single = true; 12608c2ecf20Sopenharmony_ci buf->nr_pages = nr_pages; 12618c2ecf20Sopenharmony_ci ret = 0; 12628c2ecf20Sopenharmony_ciout: 12638c2ecf20Sopenharmony_ci return ret; 12648c2ecf20Sopenharmony_ci} 12658c2ecf20Sopenharmony_ci 12668c2ecf20Sopenharmony_ci/** 12678c2ecf20Sopenharmony_ci * pt_buffer_setup_aux() - set up topa tables for a PT buffer 12688c2ecf20Sopenharmony_ci * @cpu: Cpu on which to allocate, -1 means current. 12698c2ecf20Sopenharmony_ci * @pages: Array of pointers to buffer pages passed from perf core. 12708c2ecf20Sopenharmony_ci * @nr_pages: Number of pages in the buffer. 12718c2ecf20Sopenharmony_ci * @snapshot: If this is a snapshot/overwrite counter. 12728c2ecf20Sopenharmony_ci * 12738c2ecf20Sopenharmony_ci * This is a pmu::setup_aux callback that sets up ToPA tables and all the 12748c2ecf20Sopenharmony_ci * bookkeeping for an AUX buffer. 12758c2ecf20Sopenharmony_ci * 12768c2ecf20Sopenharmony_ci * Return: Our private PT buffer structure. 12778c2ecf20Sopenharmony_ci */ 12788c2ecf20Sopenharmony_cistatic void * 12798c2ecf20Sopenharmony_cipt_buffer_setup_aux(struct perf_event *event, void **pages, 12808c2ecf20Sopenharmony_ci int nr_pages, bool snapshot) 12818c2ecf20Sopenharmony_ci{ 12828c2ecf20Sopenharmony_ci struct pt_buffer *buf; 12838c2ecf20Sopenharmony_ci int node, ret, cpu = event->cpu; 12848c2ecf20Sopenharmony_ci 12858c2ecf20Sopenharmony_ci if (!nr_pages) 12868c2ecf20Sopenharmony_ci return NULL; 12878c2ecf20Sopenharmony_ci 12888c2ecf20Sopenharmony_ci /* 12898c2ecf20Sopenharmony_ci * Only support AUX sampling in snapshot mode, where we don't 12908c2ecf20Sopenharmony_ci * generate NMIs. 12918c2ecf20Sopenharmony_ci */ 12928c2ecf20Sopenharmony_ci if (event->attr.aux_sample_size && !snapshot) 12938c2ecf20Sopenharmony_ci return NULL; 12948c2ecf20Sopenharmony_ci 12958c2ecf20Sopenharmony_ci if (cpu == -1) 12968c2ecf20Sopenharmony_ci cpu = raw_smp_processor_id(); 12978c2ecf20Sopenharmony_ci node = cpu_to_node(cpu); 12988c2ecf20Sopenharmony_ci 12998c2ecf20Sopenharmony_ci buf = kzalloc_node(sizeof(struct pt_buffer), GFP_KERNEL, node); 13008c2ecf20Sopenharmony_ci if (!buf) 13018c2ecf20Sopenharmony_ci return NULL; 13028c2ecf20Sopenharmony_ci 13038c2ecf20Sopenharmony_ci buf->snapshot = snapshot; 13048c2ecf20Sopenharmony_ci buf->data_pages = pages; 13058c2ecf20Sopenharmony_ci buf->stop_pos = -1; 13068c2ecf20Sopenharmony_ci buf->intr_pos = -1; 13078c2ecf20Sopenharmony_ci 13088c2ecf20Sopenharmony_ci INIT_LIST_HEAD(&buf->tables); 13098c2ecf20Sopenharmony_ci 13108c2ecf20Sopenharmony_ci ret = pt_buffer_try_single(buf, nr_pages); 13118c2ecf20Sopenharmony_ci if (!ret) 13128c2ecf20Sopenharmony_ci return buf; 13138c2ecf20Sopenharmony_ci 13148c2ecf20Sopenharmony_ci ret = pt_buffer_init_topa(buf, cpu, nr_pages, GFP_KERNEL); 13158c2ecf20Sopenharmony_ci if (ret) { 13168c2ecf20Sopenharmony_ci kfree(buf); 13178c2ecf20Sopenharmony_ci return NULL; 13188c2ecf20Sopenharmony_ci } 13198c2ecf20Sopenharmony_ci 13208c2ecf20Sopenharmony_ci return buf; 13218c2ecf20Sopenharmony_ci} 13228c2ecf20Sopenharmony_ci 13238c2ecf20Sopenharmony_ci/** 13248c2ecf20Sopenharmony_ci * pt_buffer_free_aux() - perf AUX deallocation path callback 13258c2ecf20Sopenharmony_ci * @data: PT buffer. 13268c2ecf20Sopenharmony_ci */ 13278c2ecf20Sopenharmony_cistatic void pt_buffer_free_aux(void *data) 13288c2ecf20Sopenharmony_ci{ 13298c2ecf20Sopenharmony_ci struct pt_buffer *buf = data; 13308c2ecf20Sopenharmony_ci 13318c2ecf20Sopenharmony_ci pt_buffer_fini_topa(buf); 13328c2ecf20Sopenharmony_ci kfree(buf); 13338c2ecf20Sopenharmony_ci} 13348c2ecf20Sopenharmony_ci 13358c2ecf20Sopenharmony_cistatic int pt_addr_filters_init(struct perf_event *event) 13368c2ecf20Sopenharmony_ci{ 13378c2ecf20Sopenharmony_ci struct pt_filters *filters; 13388c2ecf20Sopenharmony_ci int node = event->cpu == -1 ? -1 : cpu_to_node(event->cpu); 13398c2ecf20Sopenharmony_ci 13408c2ecf20Sopenharmony_ci if (!intel_pt_validate_hw_cap(PT_CAP_num_address_ranges)) 13418c2ecf20Sopenharmony_ci return 0; 13428c2ecf20Sopenharmony_ci 13438c2ecf20Sopenharmony_ci filters = kzalloc_node(sizeof(struct pt_filters), GFP_KERNEL, node); 13448c2ecf20Sopenharmony_ci if (!filters) 13458c2ecf20Sopenharmony_ci return -ENOMEM; 13468c2ecf20Sopenharmony_ci 13478c2ecf20Sopenharmony_ci if (event->parent) 13488c2ecf20Sopenharmony_ci memcpy(filters, event->parent->hw.addr_filters, 13498c2ecf20Sopenharmony_ci sizeof(*filters)); 13508c2ecf20Sopenharmony_ci 13518c2ecf20Sopenharmony_ci event->hw.addr_filters = filters; 13528c2ecf20Sopenharmony_ci 13538c2ecf20Sopenharmony_ci return 0; 13548c2ecf20Sopenharmony_ci} 13558c2ecf20Sopenharmony_ci 13568c2ecf20Sopenharmony_cistatic void pt_addr_filters_fini(struct perf_event *event) 13578c2ecf20Sopenharmony_ci{ 13588c2ecf20Sopenharmony_ci kfree(event->hw.addr_filters); 13598c2ecf20Sopenharmony_ci event->hw.addr_filters = NULL; 13608c2ecf20Sopenharmony_ci} 13618c2ecf20Sopenharmony_ci 13628c2ecf20Sopenharmony_ci#ifdef CONFIG_X86_64 13638c2ecf20Sopenharmony_ci/* Clamp to a canonical address greater-than-or-equal-to the address given */ 13648c2ecf20Sopenharmony_cistatic u64 clamp_to_ge_canonical_addr(u64 vaddr, u8 vaddr_bits) 13658c2ecf20Sopenharmony_ci{ 13668c2ecf20Sopenharmony_ci return __is_canonical_address(vaddr, vaddr_bits) ? 13678c2ecf20Sopenharmony_ci vaddr : 13688c2ecf20Sopenharmony_ci -BIT_ULL(vaddr_bits - 1); 13698c2ecf20Sopenharmony_ci} 13708c2ecf20Sopenharmony_ci 13718c2ecf20Sopenharmony_ci/* Clamp to a canonical address less-than-or-equal-to the address given */ 13728c2ecf20Sopenharmony_cistatic u64 clamp_to_le_canonical_addr(u64 vaddr, u8 vaddr_bits) 13738c2ecf20Sopenharmony_ci{ 13748c2ecf20Sopenharmony_ci return __is_canonical_address(vaddr, vaddr_bits) ? 13758c2ecf20Sopenharmony_ci vaddr : 13768c2ecf20Sopenharmony_ci BIT_ULL(vaddr_bits - 1) - 1; 13778c2ecf20Sopenharmony_ci} 13788c2ecf20Sopenharmony_ci#else 13798c2ecf20Sopenharmony_ci#define clamp_to_ge_canonical_addr(x, y) (x) 13808c2ecf20Sopenharmony_ci#define clamp_to_le_canonical_addr(x, y) (x) 13818c2ecf20Sopenharmony_ci#endif 13828c2ecf20Sopenharmony_ci 13838c2ecf20Sopenharmony_cistatic int pt_event_addr_filters_validate(struct list_head *filters) 13848c2ecf20Sopenharmony_ci{ 13858c2ecf20Sopenharmony_ci struct perf_addr_filter *filter; 13868c2ecf20Sopenharmony_ci int range = 0; 13878c2ecf20Sopenharmony_ci 13888c2ecf20Sopenharmony_ci list_for_each_entry(filter, filters, entry) { 13898c2ecf20Sopenharmony_ci /* 13908c2ecf20Sopenharmony_ci * PT doesn't support single address triggers and 13918c2ecf20Sopenharmony_ci * 'start' filters. 13928c2ecf20Sopenharmony_ci */ 13938c2ecf20Sopenharmony_ci if (!filter->size || 13948c2ecf20Sopenharmony_ci filter->action == PERF_ADDR_FILTER_ACTION_START) 13958c2ecf20Sopenharmony_ci return -EOPNOTSUPP; 13968c2ecf20Sopenharmony_ci 13978c2ecf20Sopenharmony_ci if (++range > intel_pt_validate_hw_cap(PT_CAP_num_address_ranges)) 13988c2ecf20Sopenharmony_ci return -EOPNOTSUPP; 13998c2ecf20Sopenharmony_ci } 14008c2ecf20Sopenharmony_ci 14018c2ecf20Sopenharmony_ci return 0; 14028c2ecf20Sopenharmony_ci} 14038c2ecf20Sopenharmony_ci 14048c2ecf20Sopenharmony_cistatic void pt_event_addr_filters_sync(struct perf_event *event) 14058c2ecf20Sopenharmony_ci{ 14068c2ecf20Sopenharmony_ci struct perf_addr_filters_head *head = perf_event_addr_filters(event); 14078c2ecf20Sopenharmony_ci unsigned long msr_a, msr_b; 14088c2ecf20Sopenharmony_ci struct perf_addr_filter_range *fr = event->addr_filter_ranges; 14098c2ecf20Sopenharmony_ci struct pt_filters *filters = event->hw.addr_filters; 14108c2ecf20Sopenharmony_ci struct perf_addr_filter *filter; 14118c2ecf20Sopenharmony_ci int range = 0; 14128c2ecf20Sopenharmony_ci 14138c2ecf20Sopenharmony_ci if (!filters) 14148c2ecf20Sopenharmony_ci return; 14158c2ecf20Sopenharmony_ci 14168c2ecf20Sopenharmony_ci list_for_each_entry(filter, &head->list, entry) { 14178c2ecf20Sopenharmony_ci if (filter->path.dentry && !fr[range].start) { 14188c2ecf20Sopenharmony_ci msr_a = msr_b = 0; 14198c2ecf20Sopenharmony_ci } else { 14208c2ecf20Sopenharmony_ci unsigned long n = fr[range].size - 1; 14218c2ecf20Sopenharmony_ci unsigned long a = fr[range].start; 14228c2ecf20Sopenharmony_ci unsigned long b; 14238c2ecf20Sopenharmony_ci 14248c2ecf20Sopenharmony_ci if (a > ULONG_MAX - n) 14258c2ecf20Sopenharmony_ci b = ULONG_MAX; 14268c2ecf20Sopenharmony_ci else 14278c2ecf20Sopenharmony_ci b = a + n; 14288c2ecf20Sopenharmony_ci /* 14298c2ecf20Sopenharmony_ci * Apply the offset. 64-bit addresses written to the 14308c2ecf20Sopenharmony_ci * MSRs must be canonical, but the range can encompass 14318c2ecf20Sopenharmony_ci * non-canonical addresses. Since software cannot 14328c2ecf20Sopenharmony_ci * execute at non-canonical addresses, adjusting to 14338c2ecf20Sopenharmony_ci * canonical addresses does not affect the result of the 14348c2ecf20Sopenharmony_ci * address filter. 14358c2ecf20Sopenharmony_ci */ 14368c2ecf20Sopenharmony_ci msr_a = clamp_to_ge_canonical_addr(a, boot_cpu_data.x86_virt_bits); 14378c2ecf20Sopenharmony_ci msr_b = clamp_to_le_canonical_addr(b, boot_cpu_data.x86_virt_bits); 14388c2ecf20Sopenharmony_ci if (msr_b < msr_a) 14398c2ecf20Sopenharmony_ci msr_a = msr_b = 0; 14408c2ecf20Sopenharmony_ci } 14418c2ecf20Sopenharmony_ci 14428c2ecf20Sopenharmony_ci filters->filter[range].msr_a = msr_a; 14438c2ecf20Sopenharmony_ci filters->filter[range].msr_b = msr_b; 14448c2ecf20Sopenharmony_ci if (filter->action == PERF_ADDR_FILTER_ACTION_FILTER) 14458c2ecf20Sopenharmony_ci filters->filter[range].config = 1; 14468c2ecf20Sopenharmony_ci else 14478c2ecf20Sopenharmony_ci filters->filter[range].config = 2; 14488c2ecf20Sopenharmony_ci range++; 14498c2ecf20Sopenharmony_ci } 14508c2ecf20Sopenharmony_ci 14518c2ecf20Sopenharmony_ci filters->nr_filters = range; 14528c2ecf20Sopenharmony_ci} 14538c2ecf20Sopenharmony_ci 14548c2ecf20Sopenharmony_ci/** 14558c2ecf20Sopenharmony_ci * intel_pt_interrupt() - PT PMI handler 14568c2ecf20Sopenharmony_ci */ 14578c2ecf20Sopenharmony_civoid intel_pt_interrupt(void) 14588c2ecf20Sopenharmony_ci{ 14598c2ecf20Sopenharmony_ci struct pt *pt = this_cpu_ptr(&pt_ctx); 14608c2ecf20Sopenharmony_ci struct pt_buffer *buf; 14618c2ecf20Sopenharmony_ci struct perf_event *event = pt->handle.event; 14628c2ecf20Sopenharmony_ci 14638c2ecf20Sopenharmony_ci /* 14648c2ecf20Sopenharmony_ci * There may be a dangling PT bit in the interrupt status register 14658c2ecf20Sopenharmony_ci * after PT has been disabled by pt_event_stop(). Make sure we don't 14668c2ecf20Sopenharmony_ci * do anything (particularly, re-enable) for this event here. 14678c2ecf20Sopenharmony_ci */ 14688c2ecf20Sopenharmony_ci if (!READ_ONCE(pt->handle_nmi)) 14698c2ecf20Sopenharmony_ci return; 14708c2ecf20Sopenharmony_ci 14718c2ecf20Sopenharmony_ci if (!event) 14728c2ecf20Sopenharmony_ci return; 14738c2ecf20Sopenharmony_ci 14748c2ecf20Sopenharmony_ci pt_config_stop(event); 14758c2ecf20Sopenharmony_ci 14768c2ecf20Sopenharmony_ci buf = perf_get_aux(&pt->handle); 14778c2ecf20Sopenharmony_ci if (!buf) 14788c2ecf20Sopenharmony_ci return; 14798c2ecf20Sopenharmony_ci 14808c2ecf20Sopenharmony_ci pt_read_offset(buf); 14818c2ecf20Sopenharmony_ci 14828c2ecf20Sopenharmony_ci pt_handle_status(pt); 14838c2ecf20Sopenharmony_ci 14848c2ecf20Sopenharmony_ci pt_update_head(pt); 14858c2ecf20Sopenharmony_ci 14868c2ecf20Sopenharmony_ci perf_aux_output_end(&pt->handle, local_xchg(&buf->data_size, 0)); 14878c2ecf20Sopenharmony_ci 14888c2ecf20Sopenharmony_ci if (!event->hw.state) { 14898c2ecf20Sopenharmony_ci int ret; 14908c2ecf20Sopenharmony_ci 14918c2ecf20Sopenharmony_ci buf = perf_aux_output_begin(&pt->handle, event); 14928c2ecf20Sopenharmony_ci if (!buf) { 14938c2ecf20Sopenharmony_ci event->hw.state = PERF_HES_STOPPED; 14948c2ecf20Sopenharmony_ci return; 14958c2ecf20Sopenharmony_ci } 14968c2ecf20Sopenharmony_ci 14978c2ecf20Sopenharmony_ci pt_buffer_reset_offsets(buf, pt->handle.head); 14988c2ecf20Sopenharmony_ci /* snapshot counters don't use PMI, so it's safe */ 14998c2ecf20Sopenharmony_ci ret = pt_buffer_reset_markers(buf, &pt->handle); 15008c2ecf20Sopenharmony_ci if (ret) { 15018c2ecf20Sopenharmony_ci perf_aux_output_end(&pt->handle, 0); 15028c2ecf20Sopenharmony_ci return; 15038c2ecf20Sopenharmony_ci } 15048c2ecf20Sopenharmony_ci 15058c2ecf20Sopenharmony_ci pt_config_buffer(buf); 15068c2ecf20Sopenharmony_ci pt_config_start(event); 15078c2ecf20Sopenharmony_ci } 15088c2ecf20Sopenharmony_ci} 15098c2ecf20Sopenharmony_ci 15108c2ecf20Sopenharmony_civoid intel_pt_handle_vmx(int on) 15118c2ecf20Sopenharmony_ci{ 15128c2ecf20Sopenharmony_ci struct pt *pt = this_cpu_ptr(&pt_ctx); 15138c2ecf20Sopenharmony_ci struct perf_event *event; 15148c2ecf20Sopenharmony_ci unsigned long flags; 15158c2ecf20Sopenharmony_ci 15168c2ecf20Sopenharmony_ci /* PT plays nice with VMX, do nothing */ 15178c2ecf20Sopenharmony_ci if (pt_pmu.vmx) 15188c2ecf20Sopenharmony_ci return; 15198c2ecf20Sopenharmony_ci 15208c2ecf20Sopenharmony_ci /* 15218c2ecf20Sopenharmony_ci * VMXON will clear RTIT_CTL.TraceEn; we need to make 15228c2ecf20Sopenharmony_ci * sure to not try to set it while VMX is on. Disable 15238c2ecf20Sopenharmony_ci * interrupts to avoid racing with pmu callbacks; 15248c2ecf20Sopenharmony_ci * concurrent PMI should be handled fine. 15258c2ecf20Sopenharmony_ci */ 15268c2ecf20Sopenharmony_ci local_irq_save(flags); 15278c2ecf20Sopenharmony_ci WRITE_ONCE(pt->vmx_on, on); 15288c2ecf20Sopenharmony_ci 15298c2ecf20Sopenharmony_ci /* 15308c2ecf20Sopenharmony_ci * If an AUX transaction is in progress, it will contain 15318c2ecf20Sopenharmony_ci * gap(s), so flag it PARTIAL to inform the user. 15328c2ecf20Sopenharmony_ci */ 15338c2ecf20Sopenharmony_ci event = pt->handle.event; 15348c2ecf20Sopenharmony_ci if (event) 15358c2ecf20Sopenharmony_ci perf_aux_output_flag(&pt->handle, 15368c2ecf20Sopenharmony_ci PERF_AUX_FLAG_PARTIAL); 15378c2ecf20Sopenharmony_ci 15388c2ecf20Sopenharmony_ci /* Turn PTs back on */ 15398c2ecf20Sopenharmony_ci if (!on && event) 15408c2ecf20Sopenharmony_ci wrmsrl(MSR_IA32_RTIT_CTL, event->hw.config); 15418c2ecf20Sopenharmony_ci 15428c2ecf20Sopenharmony_ci local_irq_restore(flags); 15438c2ecf20Sopenharmony_ci} 15448c2ecf20Sopenharmony_ciEXPORT_SYMBOL_GPL(intel_pt_handle_vmx); 15458c2ecf20Sopenharmony_ci 15468c2ecf20Sopenharmony_ci/* 15478c2ecf20Sopenharmony_ci * PMU callbacks 15488c2ecf20Sopenharmony_ci */ 15498c2ecf20Sopenharmony_ci 15508c2ecf20Sopenharmony_cistatic void pt_event_start(struct perf_event *event, int mode) 15518c2ecf20Sopenharmony_ci{ 15528c2ecf20Sopenharmony_ci struct hw_perf_event *hwc = &event->hw; 15538c2ecf20Sopenharmony_ci struct pt *pt = this_cpu_ptr(&pt_ctx); 15548c2ecf20Sopenharmony_ci struct pt_buffer *buf; 15558c2ecf20Sopenharmony_ci 15568c2ecf20Sopenharmony_ci buf = perf_aux_output_begin(&pt->handle, event); 15578c2ecf20Sopenharmony_ci if (!buf) 15588c2ecf20Sopenharmony_ci goto fail_stop; 15598c2ecf20Sopenharmony_ci 15608c2ecf20Sopenharmony_ci pt_buffer_reset_offsets(buf, pt->handle.head); 15618c2ecf20Sopenharmony_ci if (!buf->snapshot) { 15628c2ecf20Sopenharmony_ci if (pt_buffer_reset_markers(buf, &pt->handle)) 15638c2ecf20Sopenharmony_ci goto fail_end_stop; 15648c2ecf20Sopenharmony_ci } 15658c2ecf20Sopenharmony_ci 15668c2ecf20Sopenharmony_ci WRITE_ONCE(pt->handle_nmi, 1); 15678c2ecf20Sopenharmony_ci hwc->state = 0; 15688c2ecf20Sopenharmony_ci 15698c2ecf20Sopenharmony_ci pt_config_buffer(buf); 15708c2ecf20Sopenharmony_ci pt_config(event); 15718c2ecf20Sopenharmony_ci 15728c2ecf20Sopenharmony_ci return; 15738c2ecf20Sopenharmony_ci 15748c2ecf20Sopenharmony_cifail_end_stop: 15758c2ecf20Sopenharmony_ci perf_aux_output_end(&pt->handle, 0); 15768c2ecf20Sopenharmony_cifail_stop: 15778c2ecf20Sopenharmony_ci hwc->state = PERF_HES_STOPPED; 15788c2ecf20Sopenharmony_ci} 15798c2ecf20Sopenharmony_ci 15808c2ecf20Sopenharmony_cistatic void pt_event_stop(struct perf_event *event, int mode) 15818c2ecf20Sopenharmony_ci{ 15828c2ecf20Sopenharmony_ci struct pt *pt = this_cpu_ptr(&pt_ctx); 15838c2ecf20Sopenharmony_ci 15848c2ecf20Sopenharmony_ci /* 15858c2ecf20Sopenharmony_ci * Protect against the PMI racing with disabling wrmsr, 15868c2ecf20Sopenharmony_ci * see comment in intel_pt_interrupt(). 15878c2ecf20Sopenharmony_ci */ 15888c2ecf20Sopenharmony_ci WRITE_ONCE(pt->handle_nmi, 0); 15898c2ecf20Sopenharmony_ci 15908c2ecf20Sopenharmony_ci pt_config_stop(event); 15918c2ecf20Sopenharmony_ci 15928c2ecf20Sopenharmony_ci if (event->hw.state == PERF_HES_STOPPED) 15938c2ecf20Sopenharmony_ci return; 15948c2ecf20Sopenharmony_ci 15958c2ecf20Sopenharmony_ci event->hw.state = PERF_HES_STOPPED; 15968c2ecf20Sopenharmony_ci 15978c2ecf20Sopenharmony_ci if (mode & PERF_EF_UPDATE) { 15988c2ecf20Sopenharmony_ci struct pt_buffer *buf = perf_get_aux(&pt->handle); 15998c2ecf20Sopenharmony_ci 16008c2ecf20Sopenharmony_ci if (!buf) 16018c2ecf20Sopenharmony_ci return; 16028c2ecf20Sopenharmony_ci 16038c2ecf20Sopenharmony_ci if (WARN_ON_ONCE(pt->handle.event != event)) 16048c2ecf20Sopenharmony_ci return; 16058c2ecf20Sopenharmony_ci 16068c2ecf20Sopenharmony_ci pt_read_offset(buf); 16078c2ecf20Sopenharmony_ci 16088c2ecf20Sopenharmony_ci pt_handle_status(pt); 16098c2ecf20Sopenharmony_ci 16108c2ecf20Sopenharmony_ci pt_update_head(pt); 16118c2ecf20Sopenharmony_ci 16128c2ecf20Sopenharmony_ci if (buf->snapshot) 16138c2ecf20Sopenharmony_ci pt->handle.head = 16148c2ecf20Sopenharmony_ci local_xchg(&buf->data_size, 16158c2ecf20Sopenharmony_ci buf->nr_pages << PAGE_SHIFT); 16168c2ecf20Sopenharmony_ci perf_aux_output_end(&pt->handle, local_xchg(&buf->data_size, 0)); 16178c2ecf20Sopenharmony_ci } 16188c2ecf20Sopenharmony_ci} 16198c2ecf20Sopenharmony_ci 16208c2ecf20Sopenharmony_cistatic long pt_event_snapshot_aux(struct perf_event *event, 16218c2ecf20Sopenharmony_ci struct perf_output_handle *handle, 16228c2ecf20Sopenharmony_ci unsigned long size) 16238c2ecf20Sopenharmony_ci{ 16248c2ecf20Sopenharmony_ci struct pt *pt = this_cpu_ptr(&pt_ctx); 16258c2ecf20Sopenharmony_ci struct pt_buffer *buf = perf_get_aux(&pt->handle); 16268c2ecf20Sopenharmony_ci unsigned long from = 0, to; 16278c2ecf20Sopenharmony_ci long ret; 16288c2ecf20Sopenharmony_ci 16298c2ecf20Sopenharmony_ci if (WARN_ON_ONCE(!buf)) 16308c2ecf20Sopenharmony_ci return 0; 16318c2ecf20Sopenharmony_ci 16328c2ecf20Sopenharmony_ci /* 16338c2ecf20Sopenharmony_ci * Sampling is only allowed on snapshot events; 16348c2ecf20Sopenharmony_ci * see pt_buffer_setup_aux(). 16358c2ecf20Sopenharmony_ci */ 16368c2ecf20Sopenharmony_ci if (WARN_ON_ONCE(!buf->snapshot)) 16378c2ecf20Sopenharmony_ci return 0; 16388c2ecf20Sopenharmony_ci 16398c2ecf20Sopenharmony_ci /* 16408c2ecf20Sopenharmony_ci * Here, handle_nmi tells us if the tracing is on 16418c2ecf20Sopenharmony_ci */ 16428c2ecf20Sopenharmony_ci if (READ_ONCE(pt->handle_nmi)) 16438c2ecf20Sopenharmony_ci pt_config_stop(event); 16448c2ecf20Sopenharmony_ci 16458c2ecf20Sopenharmony_ci pt_read_offset(buf); 16468c2ecf20Sopenharmony_ci pt_update_head(pt); 16478c2ecf20Sopenharmony_ci 16488c2ecf20Sopenharmony_ci to = local_read(&buf->data_size); 16498c2ecf20Sopenharmony_ci if (to < size) 16508c2ecf20Sopenharmony_ci from = buf->nr_pages << PAGE_SHIFT; 16518c2ecf20Sopenharmony_ci from += to - size; 16528c2ecf20Sopenharmony_ci 16538c2ecf20Sopenharmony_ci ret = perf_output_copy_aux(&pt->handle, handle, from, to); 16548c2ecf20Sopenharmony_ci 16558c2ecf20Sopenharmony_ci /* 16568c2ecf20Sopenharmony_ci * If the tracing was on when we turned up, restart it. 16578c2ecf20Sopenharmony_ci * Compiler barrier not needed as we couldn't have been 16588c2ecf20Sopenharmony_ci * preempted by anything that touches pt->handle_nmi. 16598c2ecf20Sopenharmony_ci */ 16608c2ecf20Sopenharmony_ci if (pt->handle_nmi) 16618c2ecf20Sopenharmony_ci pt_config_start(event); 16628c2ecf20Sopenharmony_ci 16638c2ecf20Sopenharmony_ci return ret; 16648c2ecf20Sopenharmony_ci} 16658c2ecf20Sopenharmony_ci 16668c2ecf20Sopenharmony_cistatic void pt_event_del(struct perf_event *event, int mode) 16678c2ecf20Sopenharmony_ci{ 16688c2ecf20Sopenharmony_ci pt_event_stop(event, PERF_EF_UPDATE); 16698c2ecf20Sopenharmony_ci} 16708c2ecf20Sopenharmony_ci 16718c2ecf20Sopenharmony_cistatic int pt_event_add(struct perf_event *event, int mode) 16728c2ecf20Sopenharmony_ci{ 16738c2ecf20Sopenharmony_ci struct pt *pt = this_cpu_ptr(&pt_ctx); 16748c2ecf20Sopenharmony_ci struct hw_perf_event *hwc = &event->hw; 16758c2ecf20Sopenharmony_ci int ret = -EBUSY; 16768c2ecf20Sopenharmony_ci 16778c2ecf20Sopenharmony_ci if (pt->handle.event) 16788c2ecf20Sopenharmony_ci goto fail; 16798c2ecf20Sopenharmony_ci 16808c2ecf20Sopenharmony_ci if (mode & PERF_EF_START) { 16818c2ecf20Sopenharmony_ci pt_event_start(event, 0); 16828c2ecf20Sopenharmony_ci ret = -EINVAL; 16838c2ecf20Sopenharmony_ci if (hwc->state == PERF_HES_STOPPED) 16848c2ecf20Sopenharmony_ci goto fail; 16858c2ecf20Sopenharmony_ci } else { 16868c2ecf20Sopenharmony_ci hwc->state = PERF_HES_STOPPED; 16878c2ecf20Sopenharmony_ci } 16888c2ecf20Sopenharmony_ci 16898c2ecf20Sopenharmony_ci ret = 0; 16908c2ecf20Sopenharmony_cifail: 16918c2ecf20Sopenharmony_ci 16928c2ecf20Sopenharmony_ci return ret; 16938c2ecf20Sopenharmony_ci} 16948c2ecf20Sopenharmony_ci 16958c2ecf20Sopenharmony_cistatic void pt_event_read(struct perf_event *event) 16968c2ecf20Sopenharmony_ci{ 16978c2ecf20Sopenharmony_ci} 16988c2ecf20Sopenharmony_ci 16998c2ecf20Sopenharmony_cistatic void pt_event_destroy(struct perf_event *event) 17008c2ecf20Sopenharmony_ci{ 17018c2ecf20Sopenharmony_ci pt_addr_filters_fini(event); 17028c2ecf20Sopenharmony_ci x86_del_exclusive(x86_lbr_exclusive_pt); 17038c2ecf20Sopenharmony_ci} 17048c2ecf20Sopenharmony_ci 17058c2ecf20Sopenharmony_cistatic int pt_event_init(struct perf_event *event) 17068c2ecf20Sopenharmony_ci{ 17078c2ecf20Sopenharmony_ci if (event->attr.type != pt_pmu.pmu.type) 17088c2ecf20Sopenharmony_ci return -ENOENT; 17098c2ecf20Sopenharmony_ci 17108c2ecf20Sopenharmony_ci if (!pt_event_valid(event)) 17118c2ecf20Sopenharmony_ci return -EINVAL; 17128c2ecf20Sopenharmony_ci 17138c2ecf20Sopenharmony_ci if (x86_add_exclusive(x86_lbr_exclusive_pt)) 17148c2ecf20Sopenharmony_ci return -EBUSY; 17158c2ecf20Sopenharmony_ci 17168c2ecf20Sopenharmony_ci if (pt_addr_filters_init(event)) { 17178c2ecf20Sopenharmony_ci x86_del_exclusive(x86_lbr_exclusive_pt); 17188c2ecf20Sopenharmony_ci return -ENOMEM; 17198c2ecf20Sopenharmony_ci } 17208c2ecf20Sopenharmony_ci 17218c2ecf20Sopenharmony_ci event->destroy = pt_event_destroy; 17228c2ecf20Sopenharmony_ci 17238c2ecf20Sopenharmony_ci return 0; 17248c2ecf20Sopenharmony_ci} 17258c2ecf20Sopenharmony_ci 17268c2ecf20Sopenharmony_civoid cpu_emergency_stop_pt(void) 17278c2ecf20Sopenharmony_ci{ 17288c2ecf20Sopenharmony_ci struct pt *pt = this_cpu_ptr(&pt_ctx); 17298c2ecf20Sopenharmony_ci 17308c2ecf20Sopenharmony_ci if (pt->handle.event) 17318c2ecf20Sopenharmony_ci pt_event_stop(pt->handle.event, PERF_EF_UPDATE); 17328c2ecf20Sopenharmony_ci} 17338c2ecf20Sopenharmony_ci 17348c2ecf20Sopenharmony_ciint is_intel_pt_event(struct perf_event *event) 17358c2ecf20Sopenharmony_ci{ 17368c2ecf20Sopenharmony_ci return event->pmu == &pt_pmu.pmu; 17378c2ecf20Sopenharmony_ci} 17388c2ecf20Sopenharmony_ci 17398c2ecf20Sopenharmony_cistatic __init int pt_init(void) 17408c2ecf20Sopenharmony_ci{ 17418c2ecf20Sopenharmony_ci int ret, cpu, prior_warn = 0; 17428c2ecf20Sopenharmony_ci 17438c2ecf20Sopenharmony_ci BUILD_BUG_ON(sizeof(struct topa) > PAGE_SIZE); 17448c2ecf20Sopenharmony_ci 17458c2ecf20Sopenharmony_ci if (!boot_cpu_has(X86_FEATURE_INTEL_PT)) 17468c2ecf20Sopenharmony_ci return -ENODEV; 17478c2ecf20Sopenharmony_ci 17488c2ecf20Sopenharmony_ci get_online_cpus(); 17498c2ecf20Sopenharmony_ci for_each_online_cpu(cpu) { 17508c2ecf20Sopenharmony_ci u64 ctl; 17518c2ecf20Sopenharmony_ci 17528c2ecf20Sopenharmony_ci ret = rdmsrl_safe_on_cpu(cpu, MSR_IA32_RTIT_CTL, &ctl); 17538c2ecf20Sopenharmony_ci if (!ret && (ctl & RTIT_CTL_TRACEEN)) 17548c2ecf20Sopenharmony_ci prior_warn++; 17558c2ecf20Sopenharmony_ci } 17568c2ecf20Sopenharmony_ci put_online_cpus(); 17578c2ecf20Sopenharmony_ci 17588c2ecf20Sopenharmony_ci if (prior_warn) { 17598c2ecf20Sopenharmony_ci x86_add_exclusive(x86_lbr_exclusive_pt); 17608c2ecf20Sopenharmony_ci pr_warn("PT is enabled at boot time, doing nothing\n"); 17618c2ecf20Sopenharmony_ci 17628c2ecf20Sopenharmony_ci return -EBUSY; 17638c2ecf20Sopenharmony_ci } 17648c2ecf20Sopenharmony_ci 17658c2ecf20Sopenharmony_ci ret = pt_pmu_hw_init(); 17668c2ecf20Sopenharmony_ci if (ret) 17678c2ecf20Sopenharmony_ci return ret; 17688c2ecf20Sopenharmony_ci 17698c2ecf20Sopenharmony_ci if (!intel_pt_validate_hw_cap(PT_CAP_topa_output)) { 17708c2ecf20Sopenharmony_ci pr_warn("ToPA output is not supported on this CPU\n"); 17718c2ecf20Sopenharmony_ci return -ENODEV; 17728c2ecf20Sopenharmony_ci } 17738c2ecf20Sopenharmony_ci 17748c2ecf20Sopenharmony_ci if (!intel_pt_validate_hw_cap(PT_CAP_topa_multiple_entries)) 17758c2ecf20Sopenharmony_ci pt_pmu.pmu.capabilities = PERF_PMU_CAP_AUX_NO_SG; 17768c2ecf20Sopenharmony_ci 17778c2ecf20Sopenharmony_ci pt_pmu.pmu.capabilities |= PERF_PMU_CAP_EXCLUSIVE | PERF_PMU_CAP_ITRACE; 17788c2ecf20Sopenharmony_ci pt_pmu.pmu.attr_groups = pt_attr_groups; 17798c2ecf20Sopenharmony_ci pt_pmu.pmu.task_ctx_nr = perf_sw_context; 17808c2ecf20Sopenharmony_ci pt_pmu.pmu.event_init = pt_event_init; 17818c2ecf20Sopenharmony_ci pt_pmu.pmu.add = pt_event_add; 17828c2ecf20Sopenharmony_ci pt_pmu.pmu.del = pt_event_del; 17838c2ecf20Sopenharmony_ci pt_pmu.pmu.start = pt_event_start; 17848c2ecf20Sopenharmony_ci pt_pmu.pmu.stop = pt_event_stop; 17858c2ecf20Sopenharmony_ci pt_pmu.pmu.snapshot_aux = pt_event_snapshot_aux; 17868c2ecf20Sopenharmony_ci pt_pmu.pmu.read = pt_event_read; 17878c2ecf20Sopenharmony_ci pt_pmu.pmu.setup_aux = pt_buffer_setup_aux; 17888c2ecf20Sopenharmony_ci pt_pmu.pmu.free_aux = pt_buffer_free_aux; 17898c2ecf20Sopenharmony_ci pt_pmu.pmu.addr_filters_sync = pt_event_addr_filters_sync; 17908c2ecf20Sopenharmony_ci pt_pmu.pmu.addr_filters_validate = pt_event_addr_filters_validate; 17918c2ecf20Sopenharmony_ci pt_pmu.pmu.nr_addr_filters = 17928c2ecf20Sopenharmony_ci intel_pt_validate_hw_cap(PT_CAP_num_address_ranges); 17938c2ecf20Sopenharmony_ci 17948c2ecf20Sopenharmony_ci ret = perf_pmu_register(&pt_pmu.pmu, "intel_pt", -1); 17958c2ecf20Sopenharmony_ci 17968c2ecf20Sopenharmony_ci return ret; 17978c2ecf20Sopenharmony_ci} 17988c2ecf20Sopenharmony_ciarch_initcall(pt_init); 1799