162306a36Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0-or-later 262306a36Sopenharmony_ci/* 362306a36Sopenharmony_ci * Use DWARF Debug information to skip unnecessary callchain entries. 462306a36Sopenharmony_ci * 562306a36Sopenharmony_ci * Copyright (C) 2014 Sukadev Bhattiprolu, IBM Corporation. 662306a36Sopenharmony_ci * Copyright (C) 2014 Ulrich Weigand, IBM Corporation. 762306a36Sopenharmony_ci */ 862306a36Sopenharmony_ci#include <inttypes.h> 962306a36Sopenharmony_ci#include <dwarf.h> 1062306a36Sopenharmony_ci#include <elfutils/libdwfl.h> 1162306a36Sopenharmony_ci 1262306a36Sopenharmony_ci#include "util/thread.h" 1362306a36Sopenharmony_ci#include "util/callchain.h" 1462306a36Sopenharmony_ci#include "util/debug.h" 1562306a36Sopenharmony_ci#include "util/dso.h" 1662306a36Sopenharmony_ci#include "util/event.h" // struct ip_callchain 1762306a36Sopenharmony_ci#include "util/map.h" 1862306a36Sopenharmony_ci#include "util/symbol.h" 1962306a36Sopenharmony_ci 2062306a36Sopenharmony_ci/* 2162306a36Sopenharmony_ci * When saving the callchain on Power, the kernel conservatively saves 2262306a36Sopenharmony_ci * excess entries in the callchain. A few of these entries are needed 2362306a36Sopenharmony_ci * in some cases but not others. If the unnecessary entries are not 2462306a36Sopenharmony_ci * ignored, we end up with duplicate arcs in the call-graphs. Use 2562306a36Sopenharmony_ci * DWARF debug information to skip over any unnecessary callchain 2662306a36Sopenharmony_ci * entries. 2762306a36Sopenharmony_ci * 2862306a36Sopenharmony_ci * See function header for arch_adjust_callchain() below for more details. 2962306a36Sopenharmony_ci * 3062306a36Sopenharmony_ci * The libdwfl code in this file is based on code from elfutils 3162306a36Sopenharmony_ci * (libdwfl/argp-std.c, libdwfl/tests/addrcfi.c, etc). 3262306a36Sopenharmony_ci */ 3362306a36Sopenharmony_cistatic char *debuginfo_path; 3462306a36Sopenharmony_ci 3562306a36Sopenharmony_cistatic const Dwfl_Callbacks offline_callbacks = { 3662306a36Sopenharmony_ci .debuginfo_path = &debuginfo_path, 3762306a36Sopenharmony_ci .find_debuginfo = dwfl_standard_find_debuginfo, 3862306a36Sopenharmony_ci .section_address = dwfl_offline_section_address, 3962306a36Sopenharmony_ci}; 4062306a36Sopenharmony_ci 4162306a36Sopenharmony_ci 4262306a36Sopenharmony_ci/* 4362306a36Sopenharmony_ci * Use the DWARF expression for the Call-frame-address and determine 4462306a36Sopenharmony_ci * if return address is in LR and if a new frame was allocated. 4562306a36Sopenharmony_ci */ 4662306a36Sopenharmony_cistatic int check_return_reg(int ra_regno, Dwarf_Frame *frame) 4762306a36Sopenharmony_ci{ 4862306a36Sopenharmony_ci Dwarf_Op ops_mem[3]; 4962306a36Sopenharmony_ci Dwarf_Op dummy; 5062306a36Sopenharmony_ci Dwarf_Op *ops = &dummy; 5162306a36Sopenharmony_ci size_t nops; 5262306a36Sopenharmony_ci int result; 5362306a36Sopenharmony_ci 5462306a36Sopenharmony_ci result = dwarf_frame_register(frame, ra_regno, ops_mem, &ops, &nops); 5562306a36Sopenharmony_ci if (result < 0) { 5662306a36Sopenharmony_ci pr_debug("dwarf_frame_register() %s\n", dwarf_errmsg(-1)); 5762306a36Sopenharmony_ci return -1; 5862306a36Sopenharmony_ci } 5962306a36Sopenharmony_ci 6062306a36Sopenharmony_ci /* 6162306a36Sopenharmony_ci * Check if return address is on the stack. If return address 6262306a36Sopenharmony_ci * is in a register (typically R0), it is yet to be saved on 6362306a36Sopenharmony_ci * the stack. 6462306a36Sopenharmony_ci */ 6562306a36Sopenharmony_ci if ((nops != 0 || ops != NULL) && 6662306a36Sopenharmony_ci !(nops == 1 && ops[0].atom == DW_OP_regx && 6762306a36Sopenharmony_ci ops[0].number2 == 0 && ops[0].offset == 0)) 6862306a36Sopenharmony_ci return 0; 6962306a36Sopenharmony_ci 7062306a36Sopenharmony_ci /* 7162306a36Sopenharmony_ci * Return address is in LR. Check if a frame was allocated 7262306a36Sopenharmony_ci * but not-yet used. 7362306a36Sopenharmony_ci */ 7462306a36Sopenharmony_ci result = dwarf_frame_cfa(frame, &ops, &nops); 7562306a36Sopenharmony_ci if (result < 0) { 7662306a36Sopenharmony_ci pr_debug("dwarf_frame_cfa() returns %d, %s\n", result, 7762306a36Sopenharmony_ci dwarf_errmsg(-1)); 7862306a36Sopenharmony_ci return -1; 7962306a36Sopenharmony_ci } 8062306a36Sopenharmony_ci 8162306a36Sopenharmony_ci /* 8262306a36Sopenharmony_ci * If call frame address is in r1, no new frame was allocated. 8362306a36Sopenharmony_ci */ 8462306a36Sopenharmony_ci if (nops == 1 && ops[0].atom == DW_OP_bregx && ops[0].number == 1 && 8562306a36Sopenharmony_ci ops[0].number2 == 0) 8662306a36Sopenharmony_ci return 1; 8762306a36Sopenharmony_ci 8862306a36Sopenharmony_ci /* 8962306a36Sopenharmony_ci * A new frame was allocated but has not yet been used. 9062306a36Sopenharmony_ci */ 9162306a36Sopenharmony_ci return 2; 9262306a36Sopenharmony_ci} 9362306a36Sopenharmony_ci 9462306a36Sopenharmony_ci/* 9562306a36Sopenharmony_ci * Get the DWARF frame from the .eh_frame section. 9662306a36Sopenharmony_ci */ 9762306a36Sopenharmony_cistatic Dwarf_Frame *get_eh_frame(Dwfl_Module *mod, Dwarf_Addr pc) 9862306a36Sopenharmony_ci{ 9962306a36Sopenharmony_ci int result; 10062306a36Sopenharmony_ci Dwarf_Addr bias; 10162306a36Sopenharmony_ci Dwarf_CFI *cfi; 10262306a36Sopenharmony_ci Dwarf_Frame *frame; 10362306a36Sopenharmony_ci 10462306a36Sopenharmony_ci cfi = dwfl_module_eh_cfi(mod, &bias); 10562306a36Sopenharmony_ci if (!cfi) { 10662306a36Sopenharmony_ci pr_debug("%s(): no CFI - %s\n", __func__, dwfl_errmsg(-1)); 10762306a36Sopenharmony_ci return NULL; 10862306a36Sopenharmony_ci } 10962306a36Sopenharmony_ci 11062306a36Sopenharmony_ci result = dwarf_cfi_addrframe(cfi, pc-bias, &frame); 11162306a36Sopenharmony_ci if (result) { 11262306a36Sopenharmony_ci pr_debug("%s(): %s\n", __func__, dwfl_errmsg(-1)); 11362306a36Sopenharmony_ci return NULL; 11462306a36Sopenharmony_ci } 11562306a36Sopenharmony_ci 11662306a36Sopenharmony_ci return frame; 11762306a36Sopenharmony_ci} 11862306a36Sopenharmony_ci 11962306a36Sopenharmony_ci/* 12062306a36Sopenharmony_ci * Get the DWARF frame from the .debug_frame section. 12162306a36Sopenharmony_ci */ 12262306a36Sopenharmony_cistatic Dwarf_Frame *get_dwarf_frame(Dwfl_Module *mod, Dwarf_Addr pc) 12362306a36Sopenharmony_ci{ 12462306a36Sopenharmony_ci Dwarf_CFI *cfi; 12562306a36Sopenharmony_ci Dwarf_Addr bias; 12662306a36Sopenharmony_ci Dwarf_Frame *frame; 12762306a36Sopenharmony_ci int result; 12862306a36Sopenharmony_ci 12962306a36Sopenharmony_ci cfi = dwfl_module_dwarf_cfi(mod, &bias); 13062306a36Sopenharmony_ci if (!cfi) { 13162306a36Sopenharmony_ci pr_debug("%s(): no CFI - %s\n", __func__, dwfl_errmsg(-1)); 13262306a36Sopenharmony_ci return NULL; 13362306a36Sopenharmony_ci } 13462306a36Sopenharmony_ci 13562306a36Sopenharmony_ci result = dwarf_cfi_addrframe(cfi, pc-bias, &frame); 13662306a36Sopenharmony_ci if (result) { 13762306a36Sopenharmony_ci pr_debug("%s(): %s\n", __func__, dwfl_errmsg(-1)); 13862306a36Sopenharmony_ci return NULL; 13962306a36Sopenharmony_ci } 14062306a36Sopenharmony_ci 14162306a36Sopenharmony_ci return frame; 14262306a36Sopenharmony_ci} 14362306a36Sopenharmony_ci 14462306a36Sopenharmony_ci/* 14562306a36Sopenharmony_ci * Return: 14662306a36Sopenharmony_ci * 0 if return address for the program counter @pc is on stack 14762306a36Sopenharmony_ci * 1 if return address is in LR and no new stack frame was allocated 14862306a36Sopenharmony_ci * 2 if return address is in LR and a new frame was allocated (but not 14962306a36Sopenharmony_ci * yet used) 15062306a36Sopenharmony_ci * -1 in case of errors 15162306a36Sopenharmony_ci */ 15262306a36Sopenharmony_cistatic int check_return_addr(struct dso *dso, u64 map_start, Dwarf_Addr pc) 15362306a36Sopenharmony_ci{ 15462306a36Sopenharmony_ci int rc = -1; 15562306a36Sopenharmony_ci Dwfl *dwfl; 15662306a36Sopenharmony_ci Dwfl_Module *mod; 15762306a36Sopenharmony_ci Dwarf_Frame *frame; 15862306a36Sopenharmony_ci int ra_regno; 15962306a36Sopenharmony_ci Dwarf_Addr start = pc; 16062306a36Sopenharmony_ci Dwarf_Addr end = pc; 16162306a36Sopenharmony_ci bool signalp; 16262306a36Sopenharmony_ci const char *exec_file = dso->long_name; 16362306a36Sopenharmony_ci 16462306a36Sopenharmony_ci dwfl = dso->dwfl; 16562306a36Sopenharmony_ci 16662306a36Sopenharmony_ci if (!dwfl) { 16762306a36Sopenharmony_ci dwfl = dwfl_begin(&offline_callbacks); 16862306a36Sopenharmony_ci if (!dwfl) { 16962306a36Sopenharmony_ci pr_debug("dwfl_begin() failed: %s\n", dwarf_errmsg(-1)); 17062306a36Sopenharmony_ci return -1; 17162306a36Sopenharmony_ci } 17262306a36Sopenharmony_ci 17362306a36Sopenharmony_ci mod = dwfl_report_elf(dwfl, exec_file, exec_file, -1, 17462306a36Sopenharmony_ci map_start, false); 17562306a36Sopenharmony_ci if (!mod) { 17662306a36Sopenharmony_ci pr_debug("dwfl_report_elf() failed %s\n", 17762306a36Sopenharmony_ci dwarf_errmsg(-1)); 17862306a36Sopenharmony_ci /* 17962306a36Sopenharmony_ci * We normally cache the DWARF debug info and never 18062306a36Sopenharmony_ci * call dwfl_end(). But to prevent fd leak, free in 18162306a36Sopenharmony_ci * case of error. 18262306a36Sopenharmony_ci */ 18362306a36Sopenharmony_ci dwfl_end(dwfl); 18462306a36Sopenharmony_ci goto out; 18562306a36Sopenharmony_ci } 18662306a36Sopenharmony_ci dso->dwfl = dwfl; 18762306a36Sopenharmony_ci } 18862306a36Sopenharmony_ci 18962306a36Sopenharmony_ci mod = dwfl_addrmodule(dwfl, pc); 19062306a36Sopenharmony_ci if (!mod) { 19162306a36Sopenharmony_ci pr_debug("dwfl_addrmodule() failed, %s\n", dwarf_errmsg(-1)); 19262306a36Sopenharmony_ci goto out; 19362306a36Sopenharmony_ci } 19462306a36Sopenharmony_ci 19562306a36Sopenharmony_ci /* 19662306a36Sopenharmony_ci * To work with split debug info files (eg: glibc), check both 19762306a36Sopenharmony_ci * .eh_frame and .debug_frame sections of the ELF header. 19862306a36Sopenharmony_ci */ 19962306a36Sopenharmony_ci frame = get_eh_frame(mod, pc); 20062306a36Sopenharmony_ci if (!frame) { 20162306a36Sopenharmony_ci frame = get_dwarf_frame(mod, pc); 20262306a36Sopenharmony_ci if (!frame) 20362306a36Sopenharmony_ci goto out; 20462306a36Sopenharmony_ci } 20562306a36Sopenharmony_ci 20662306a36Sopenharmony_ci ra_regno = dwarf_frame_info(frame, &start, &end, &signalp); 20762306a36Sopenharmony_ci if (ra_regno < 0) { 20862306a36Sopenharmony_ci pr_debug("Return address register unavailable: %s\n", 20962306a36Sopenharmony_ci dwarf_errmsg(-1)); 21062306a36Sopenharmony_ci goto out; 21162306a36Sopenharmony_ci } 21262306a36Sopenharmony_ci 21362306a36Sopenharmony_ci rc = check_return_reg(ra_regno, frame); 21462306a36Sopenharmony_ci 21562306a36Sopenharmony_ciout: 21662306a36Sopenharmony_ci return rc; 21762306a36Sopenharmony_ci} 21862306a36Sopenharmony_ci 21962306a36Sopenharmony_ci/* 22062306a36Sopenharmony_ci * The callchain saved by the kernel always includes the link register (LR). 22162306a36Sopenharmony_ci * 22262306a36Sopenharmony_ci * 0: PERF_CONTEXT_USER 22362306a36Sopenharmony_ci * 1: Program counter (Next instruction pointer) 22462306a36Sopenharmony_ci * 2: LR value 22562306a36Sopenharmony_ci * 3: Caller's caller 22662306a36Sopenharmony_ci * 4: ... 22762306a36Sopenharmony_ci * 22862306a36Sopenharmony_ci * The value in LR is only needed when it holds a return address. If the 22962306a36Sopenharmony_ci * return address is on the stack, we should ignore the LR value. 23062306a36Sopenharmony_ci * 23162306a36Sopenharmony_ci * Further, when the return address is in the LR, if a new frame was just 23262306a36Sopenharmony_ci * allocated but the LR was not saved into it, then the LR contains the 23362306a36Sopenharmony_ci * caller, slot 4: contains the caller's caller and the contents of slot 3: 23462306a36Sopenharmony_ci * (chain->ips[3]) is undefined and must be ignored. 23562306a36Sopenharmony_ci * 23662306a36Sopenharmony_ci * Use DWARF debug information to determine if any entries need to be skipped. 23762306a36Sopenharmony_ci * 23862306a36Sopenharmony_ci * Return: 23962306a36Sopenharmony_ci * index: of callchain entry that needs to be ignored (if any) 24062306a36Sopenharmony_ci * -1 if no entry needs to be ignored or in case of errors 24162306a36Sopenharmony_ci */ 24262306a36Sopenharmony_ciint arch_skip_callchain_idx(struct thread *thread, struct ip_callchain *chain) 24362306a36Sopenharmony_ci{ 24462306a36Sopenharmony_ci struct addr_location al; 24562306a36Sopenharmony_ci struct dso *dso = NULL; 24662306a36Sopenharmony_ci int rc; 24762306a36Sopenharmony_ci u64 ip; 24862306a36Sopenharmony_ci u64 skip_slot = -1; 24962306a36Sopenharmony_ci 25062306a36Sopenharmony_ci if (!chain || chain->nr < 3) 25162306a36Sopenharmony_ci return skip_slot; 25262306a36Sopenharmony_ci 25362306a36Sopenharmony_ci addr_location__init(&al); 25462306a36Sopenharmony_ci ip = chain->ips[1]; 25562306a36Sopenharmony_ci 25662306a36Sopenharmony_ci thread__find_symbol(thread, PERF_RECORD_MISC_USER, ip, &al); 25762306a36Sopenharmony_ci 25862306a36Sopenharmony_ci if (al.map) 25962306a36Sopenharmony_ci dso = map__dso(al.map); 26062306a36Sopenharmony_ci 26162306a36Sopenharmony_ci if (!dso) { 26262306a36Sopenharmony_ci pr_debug("%" PRIx64 " dso is NULL\n", ip); 26362306a36Sopenharmony_ci addr_location__exit(&al); 26462306a36Sopenharmony_ci return skip_slot; 26562306a36Sopenharmony_ci } 26662306a36Sopenharmony_ci 26762306a36Sopenharmony_ci rc = check_return_addr(dso, map__start(al.map), ip); 26862306a36Sopenharmony_ci 26962306a36Sopenharmony_ci pr_debug("[DSO %s, sym %s, ip 0x%" PRIx64 "] rc %d\n", 27062306a36Sopenharmony_ci dso->long_name, al.sym->name, ip, rc); 27162306a36Sopenharmony_ci 27262306a36Sopenharmony_ci if (rc == 0) { 27362306a36Sopenharmony_ci /* 27462306a36Sopenharmony_ci * Return address on stack. Ignore LR value in callchain 27562306a36Sopenharmony_ci */ 27662306a36Sopenharmony_ci skip_slot = 2; 27762306a36Sopenharmony_ci } else if (rc == 2) { 27862306a36Sopenharmony_ci /* 27962306a36Sopenharmony_ci * New frame allocated but return address still in LR. 28062306a36Sopenharmony_ci * Ignore the caller's caller entry in callchain. 28162306a36Sopenharmony_ci */ 28262306a36Sopenharmony_ci skip_slot = 3; 28362306a36Sopenharmony_ci } 28462306a36Sopenharmony_ci 28562306a36Sopenharmony_ci addr_location__exit(&al); 28662306a36Sopenharmony_ci return skip_slot; 28762306a36Sopenharmony_ci} 288