162306a36Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0-only 262306a36Sopenharmony_ci/* 362306a36Sopenharmony_ci * thread-stack.c: Synthesize a thread's stack using call / return events 462306a36Sopenharmony_ci * Copyright (c) 2014, Intel Corporation. 562306a36Sopenharmony_ci */ 662306a36Sopenharmony_ci 762306a36Sopenharmony_ci#include <linux/rbtree.h> 862306a36Sopenharmony_ci#include <linux/list.h> 962306a36Sopenharmony_ci#include <linux/log2.h> 1062306a36Sopenharmony_ci#include <linux/zalloc.h> 1162306a36Sopenharmony_ci#include <errno.h> 1262306a36Sopenharmony_ci#include <stdlib.h> 1362306a36Sopenharmony_ci#include <string.h> 1462306a36Sopenharmony_ci#include "thread.h" 1562306a36Sopenharmony_ci#include "event.h" 1662306a36Sopenharmony_ci#include "machine.h" 1762306a36Sopenharmony_ci#include "env.h" 1862306a36Sopenharmony_ci#include "debug.h" 1962306a36Sopenharmony_ci#include "symbol.h" 2062306a36Sopenharmony_ci#include "comm.h" 2162306a36Sopenharmony_ci#include "call-path.h" 2262306a36Sopenharmony_ci#include "thread-stack.h" 2362306a36Sopenharmony_ci 2462306a36Sopenharmony_ci#define STACK_GROWTH 2048 2562306a36Sopenharmony_ci 2662306a36Sopenharmony_ci/* 2762306a36Sopenharmony_ci * State of retpoline detection. 2862306a36Sopenharmony_ci * 2962306a36Sopenharmony_ci * RETPOLINE_NONE: no retpoline detection 3062306a36Sopenharmony_ci * X86_RETPOLINE_POSSIBLE: x86 retpoline possible 3162306a36Sopenharmony_ci * X86_RETPOLINE_DETECTED: x86 retpoline detected 3262306a36Sopenharmony_ci */ 3362306a36Sopenharmony_cienum retpoline_state_t { 3462306a36Sopenharmony_ci RETPOLINE_NONE, 3562306a36Sopenharmony_ci X86_RETPOLINE_POSSIBLE, 3662306a36Sopenharmony_ci X86_RETPOLINE_DETECTED, 3762306a36Sopenharmony_ci}; 3862306a36Sopenharmony_ci 3962306a36Sopenharmony_ci/** 4062306a36Sopenharmony_ci * struct thread_stack_entry - thread stack entry. 4162306a36Sopenharmony_ci * @ret_addr: return address 4262306a36Sopenharmony_ci * @timestamp: timestamp (if known) 4362306a36Sopenharmony_ci * @ref: external reference (e.g. db_id of sample) 4462306a36Sopenharmony_ci * @branch_count: the branch count when the entry was created 4562306a36Sopenharmony_ci * @insn_count: the instruction count when the entry was created 4662306a36Sopenharmony_ci * @cyc_count the cycle count when the entry was created 4762306a36Sopenharmony_ci * @db_id: id used for db-export 4862306a36Sopenharmony_ci * @cp: call path 4962306a36Sopenharmony_ci * @no_call: a 'call' was not seen 5062306a36Sopenharmony_ci * @trace_end: a 'call' but trace ended 5162306a36Sopenharmony_ci * @non_call: a branch but not a 'call' to the start of a different symbol 5262306a36Sopenharmony_ci */ 5362306a36Sopenharmony_cistruct thread_stack_entry { 5462306a36Sopenharmony_ci u64 ret_addr; 5562306a36Sopenharmony_ci u64 timestamp; 5662306a36Sopenharmony_ci u64 ref; 5762306a36Sopenharmony_ci u64 branch_count; 5862306a36Sopenharmony_ci u64 insn_count; 5962306a36Sopenharmony_ci u64 cyc_count; 6062306a36Sopenharmony_ci u64 db_id; 6162306a36Sopenharmony_ci struct call_path *cp; 6262306a36Sopenharmony_ci bool no_call; 6362306a36Sopenharmony_ci bool trace_end; 6462306a36Sopenharmony_ci bool non_call; 6562306a36Sopenharmony_ci}; 6662306a36Sopenharmony_ci 6762306a36Sopenharmony_ci/** 6862306a36Sopenharmony_ci * struct thread_stack - thread stack constructed from 'call' and 'return' 6962306a36Sopenharmony_ci * branch samples. 7062306a36Sopenharmony_ci * @stack: array that holds the stack 7162306a36Sopenharmony_ci * @cnt: number of entries in the stack 7262306a36Sopenharmony_ci * @sz: current maximum stack size 7362306a36Sopenharmony_ci * @trace_nr: current trace number 7462306a36Sopenharmony_ci * @branch_count: running branch count 7562306a36Sopenharmony_ci * @insn_count: running instruction count 7662306a36Sopenharmony_ci * @cyc_count running cycle count 7762306a36Sopenharmony_ci * @kernel_start: kernel start address 7862306a36Sopenharmony_ci * @last_time: last timestamp 7962306a36Sopenharmony_ci * @crp: call/return processor 8062306a36Sopenharmony_ci * @comm: current comm 8162306a36Sopenharmony_ci * @arr_sz: size of array if this is the first element of an array 8262306a36Sopenharmony_ci * @rstate: used to detect retpolines 8362306a36Sopenharmony_ci * @br_stack_rb: branch stack (ring buffer) 8462306a36Sopenharmony_ci * @br_stack_sz: maximum branch stack size 8562306a36Sopenharmony_ci * @br_stack_pos: current position in @br_stack_rb 8662306a36Sopenharmony_ci * @mispred_all: mark all branches as mispredicted 8762306a36Sopenharmony_ci */ 8862306a36Sopenharmony_cistruct thread_stack { 8962306a36Sopenharmony_ci struct thread_stack_entry *stack; 9062306a36Sopenharmony_ci size_t cnt; 9162306a36Sopenharmony_ci size_t sz; 9262306a36Sopenharmony_ci u64 trace_nr; 9362306a36Sopenharmony_ci u64 branch_count; 9462306a36Sopenharmony_ci u64 insn_count; 9562306a36Sopenharmony_ci u64 cyc_count; 9662306a36Sopenharmony_ci u64 kernel_start; 9762306a36Sopenharmony_ci u64 last_time; 9862306a36Sopenharmony_ci struct call_return_processor *crp; 9962306a36Sopenharmony_ci struct comm *comm; 10062306a36Sopenharmony_ci unsigned int arr_sz; 10162306a36Sopenharmony_ci enum retpoline_state_t rstate; 10262306a36Sopenharmony_ci struct branch_stack *br_stack_rb; 10362306a36Sopenharmony_ci unsigned int br_stack_sz; 10462306a36Sopenharmony_ci unsigned int br_stack_pos; 10562306a36Sopenharmony_ci bool mispred_all; 10662306a36Sopenharmony_ci}; 10762306a36Sopenharmony_ci 10862306a36Sopenharmony_ci/* 10962306a36Sopenharmony_ci * Assume pid == tid == 0 identifies the idle task as defined by 11062306a36Sopenharmony_ci * perf_session__register_idle_thread(). The idle task is really 1 task per cpu, 11162306a36Sopenharmony_ci * and therefore requires a stack for each cpu. 11262306a36Sopenharmony_ci */ 11362306a36Sopenharmony_cistatic inline bool thread_stack__per_cpu(struct thread *thread) 11462306a36Sopenharmony_ci{ 11562306a36Sopenharmony_ci return !(thread__tid(thread) || thread__pid(thread)); 11662306a36Sopenharmony_ci} 11762306a36Sopenharmony_ci 11862306a36Sopenharmony_cistatic int thread_stack__grow(struct thread_stack *ts) 11962306a36Sopenharmony_ci{ 12062306a36Sopenharmony_ci struct thread_stack_entry *new_stack; 12162306a36Sopenharmony_ci size_t sz, new_sz; 12262306a36Sopenharmony_ci 12362306a36Sopenharmony_ci new_sz = ts->sz + STACK_GROWTH; 12462306a36Sopenharmony_ci sz = new_sz * sizeof(struct thread_stack_entry); 12562306a36Sopenharmony_ci 12662306a36Sopenharmony_ci new_stack = realloc(ts->stack, sz); 12762306a36Sopenharmony_ci if (!new_stack) 12862306a36Sopenharmony_ci return -ENOMEM; 12962306a36Sopenharmony_ci 13062306a36Sopenharmony_ci ts->stack = new_stack; 13162306a36Sopenharmony_ci ts->sz = new_sz; 13262306a36Sopenharmony_ci 13362306a36Sopenharmony_ci return 0; 13462306a36Sopenharmony_ci} 13562306a36Sopenharmony_ci 13662306a36Sopenharmony_cistatic int thread_stack__init(struct thread_stack *ts, struct thread *thread, 13762306a36Sopenharmony_ci struct call_return_processor *crp, 13862306a36Sopenharmony_ci bool callstack, unsigned int br_stack_sz) 13962306a36Sopenharmony_ci{ 14062306a36Sopenharmony_ci int err; 14162306a36Sopenharmony_ci 14262306a36Sopenharmony_ci if (callstack) { 14362306a36Sopenharmony_ci err = thread_stack__grow(ts); 14462306a36Sopenharmony_ci if (err) 14562306a36Sopenharmony_ci return err; 14662306a36Sopenharmony_ci } 14762306a36Sopenharmony_ci 14862306a36Sopenharmony_ci if (br_stack_sz) { 14962306a36Sopenharmony_ci size_t sz = sizeof(struct branch_stack); 15062306a36Sopenharmony_ci 15162306a36Sopenharmony_ci sz += br_stack_sz * sizeof(struct branch_entry); 15262306a36Sopenharmony_ci ts->br_stack_rb = zalloc(sz); 15362306a36Sopenharmony_ci if (!ts->br_stack_rb) 15462306a36Sopenharmony_ci return -ENOMEM; 15562306a36Sopenharmony_ci ts->br_stack_sz = br_stack_sz; 15662306a36Sopenharmony_ci } 15762306a36Sopenharmony_ci 15862306a36Sopenharmony_ci if (thread__maps(thread) && maps__machine(thread__maps(thread))) { 15962306a36Sopenharmony_ci struct machine *machine = maps__machine(thread__maps(thread)); 16062306a36Sopenharmony_ci const char *arch = perf_env__arch(machine->env); 16162306a36Sopenharmony_ci 16262306a36Sopenharmony_ci ts->kernel_start = machine__kernel_start(machine); 16362306a36Sopenharmony_ci if (!strcmp(arch, "x86")) 16462306a36Sopenharmony_ci ts->rstate = X86_RETPOLINE_POSSIBLE; 16562306a36Sopenharmony_ci } else { 16662306a36Sopenharmony_ci ts->kernel_start = 1ULL << 63; 16762306a36Sopenharmony_ci } 16862306a36Sopenharmony_ci ts->crp = crp; 16962306a36Sopenharmony_ci 17062306a36Sopenharmony_ci return 0; 17162306a36Sopenharmony_ci} 17262306a36Sopenharmony_ci 17362306a36Sopenharmony_cistatic struct thread_stack *thread_stack__new(struct thread *thread, int cpu, 17462306a36Sopenharmony_ci struct call_return_processor *crp, 17562306a36Sopenharmony_ci bool callstack, 17662306a36Sopenharmony_ci unsigned int br_stack_sz) 17762306a36Sopenharmony_ci{ 17862306a36Sopenharmony_ci struct thread_stack *ts = thread__ts(thread), *new_ts; 17962306a36Sopenharmony_ci unsigned int old_sz = ts ? ts->arr_sz : 0; 18062306a36Sopenharmony_ci unsigned int new_sz = 1; 18162306a36Sopenharmony_ci 18262306a36Sopenharmony_ci if (thread_stack__per_cpu(thread) && cpu > 0) 18362306a36Sopenharmony_ci new_sz = roundup_pow_of_two(cpu + 1); 18462306a36Sopenharmony_ci 18562306a36Sopenharmony_ci if (!ts || new_sz > old_sz) { 18662306a36Sopenharmony_ci new_ts = calloc(new_sz, sizeof(*ts)); 18762306a36Sopenharmony_ci if (!new_ts) 18862306a36Sopenharmony_ci return NULL; 18962306a36Sopenharmony_ci if (ts) 19062306a36Sopenharmony_ci memcpy(new_ts, ts, old_sz * sizeof(*ts)); 19162306a36Sopenharmony_ci new_ts->arr_sz = new_sz; 19262306a36Sopenharmony_ci free(thread__ts(thread)); 19362306a36Sopenharmony_ci thread__set_ts(thread, new_ts); 19462306a36Sopenharmony_ci ts = new_ts; 19562306a36Sopenharmony_ci } 19662306a36Sopenharmony_ci 19762306a36Sopenharmony_ci if (thread_stack__per_cpu(thread) && cpu > 0 && 19862306a36Sopenharmony_ci (unsigned int)cpu < ts->arr_sz) 19962306a36Sopenharmony_ci ts += cpu; 20062306a36Sopenharmony_ci 20162306a36Sopenharmony_ci if (!ts->stack && 20262306a36Sopenharmony_ci thread_stack__init(ts, thread, crp, callstack, br_stack_sz)) 20362306a36Sopenharmony_ci return NULL; 20462306a36Sopenharmony_ci 20562306a36Sopenharmony_ci return ts; 20662306a36Sopenharmony_ci} 20762306a36Sopenharmony_ci 20862306a36Sopenharmony_cistatic struct thread_stack *thread__cpu_stack(struct thread *thread, int cpu) 20962306a36Sopenharmony_ci{ 21062306a36Sopenharmony_ci struct thread_stack *ts = thread__ts(thread); 21162306a36Sopenharmony_ci 21262306a36Sopenharmony_ci if (cpu < 0) 21362306a36Sopenharmony_ci cpu = 0; 21462306a36Sopenharmony_ci 21562306a36Sopenharmony_ci if (!ts || (unsigned int)cpu >= ts->arr_sz) 21662306a36Sopenharmony_ci return NULL; 21762306a36Sopenharmony_ci 21862306a36Sopenharmony_ci ts += cpu; 21962306a36Sopenharmony_ci 22062306a36Sopenharmony_ci if (!ts->stack) 22162306a36Sopenharmony_ci return NULL; 22262306a36Sopenharmony_ci 22362306a36Sopenharmony_ci return ts; 22462306a36Sopenharmony_ci} 22562306a36Sopenharmony_ci 22662306a36Sopenharmony_cistatic inline struct thread_stack *thread__stack(struct thread *thread, 22762306a36Sopenharmony_ci int cpu) 22862306a36Sopenharmony_ci{ 22962306a36Sopenharmony_ci if (!thread) 23062306a36Sopenharmony_ci return NULL; 23162306a36Sopenharmony_ci 23262306a36Sopenharmony_ci if (thread_stack__per_cpu(thread)) 23362306a36Sopenharmony_ci return thread__cpu_stack(thread, cpu); 23462306a36Sopenharmony_ci 23562306a36Sopenharmony_ci return thread__ts(thread); 23662306a36Sopenharmony_ci} 23762306a36Sopenharmony_ci 23862306a36Sopenharmony_cistatic int thread_stack__push(struct thread_stack *ts, u64 ret_addr, 23962306a36Sopenharmony_ci bool trace_end) 24062306a36Sopenharmony_ci{ 24162306a36Sopenharmony_ci int err = 0; 24262306a36Sopenharmony_ci 24362306a36Sopenharmony_ci if (ts->cnt == ts->sz) { 24462306a36Sopenharmony_ci err = thread_stack__grow(ts); 24562306a36Sopenharmony_ci if (err) { 24662306a36Sopenharmony_ci pr_warning("Out of memory: discarding thread stack\n"); 24762306a36Sopenharmony_ci ts->cnt = 0; 24862306a36Sopenharmony_ci } 24962306a36Sopenharmony_ci } 25062306a36Sopenharmony_ci 25162306a36Sopenharmony_ci ts->stack[ts->cnt].trace_end = trace_end; 25262306a36Sopenharmony_ci ts->stack[ts->cnt++].ret_addr = ret_addr; 25362306a36Sopenharmony_ci 25462306a36Sopenharmony_ci return err; 25562306a36Sopenharmony_ci} 25662306a36Sopenharmony_ci 25762306a36Sopenharmony_cistatic void thread_stack__pop(struct thread_stack *ts, u64 ret_addr) 25862306a36Sopenharmony_ci{ 25962306a36Sopenharmony_ci size_t i; 26062306a36Sopenharmony_ci 26162306a36Sopenharmony_ci /* 26262306a36Sopenharmony_ci * In some cases there may be functions which are not seen to return. 26362306a36Sopenharmony_ci * For example when setjmp / longjmp has been used. Or the perf context 26462306a36Sopenharmony_ci * switch in the kernel which doesn't stop and start tracing in exactly 26562306a36Sopenharmony_ci * the same code path. When that happens the return address will be 26662306a36Sopenharmony_ci * further down the stack. If the return address is not found at all, 26762306a36Sopenharmony_ci * we assume the opposite (i.e. this is a return for a call that wasn't 26862306a36Sopenharmony_ci * seen for some reason) and leave the stack alone. 26962306a36Sopenharmony_ci */ 27062306a36Sopenharmony_ci for (i = ts->cnt; i; ) { 27162306a36Sopenharmony_ci if (ts->stack[--i].ret_addr == ret_addr) { 27262306a36Sopenharmony_ci ts->cnt = i; 27362306a36Sopenharmony_ci return; 27462306a36Sopenharmony_ci } 27562306a36Sopenharmony_ci } 27662306a36Sopenharmony_ci} 27762306a36Sopenharmony_ci 27862306a36Sopenharmony_cistatic void thread_stack__pop_trace_end(struct thread_stack *ts) 27962306a36Sopenharmony_ci{ 28062306a36Sopenharmony_ci size_t i; 28162306a36Sopenharmony_ci 28262306a36Sopenharmony_ci for (i = ts->cnt; i; ) { 28362306a36Sopenharmony_ci if (ts->stack[--i].trace_end) 28462306a36Sopenharmony_ci ts->cnt = i; 28562306a36Sopenharmony_ci else 28662306a36Sopenharmony_ci return; 28762306a36Sopenharmony_ci } 28862306a36Sopenharmony_ci} 28962306a36Sopenharmony_ci 29062306a36Sopenharmony_cistatic bool thread_stack__in_kernel(struct thread_stack *ts) 29162306a36Sopenharmony_ci{ 29262306a36Sopenharmony_ci if (!ts->cnt) 29362306a36Sopenharmony_ci return false; 29462306a36Sopenharmony_ci 29562306a36Sopenharmony_ci return ts->stack[ts->cnt - 1].cp->in_kernel; 29662306a36Sopenharmony_ci} 29762306a36Sopenharmony_ci 29862306a36Sopenharmony_cistatic int thread_stack__call_return(struct thread *thread, 29962306a36Sopenharmony_ci struct thread_stack *ts, size_t idx, 30062306a36Sopenharmony_ci u64 timestamp, u64 ref, bool no_return) 30162306a36Sopenharmony_ci{ 30262306a36Sopenharmony_ci struct call_return_processor *crp = ts->crp; 30362306a36Sopenharmony_ci struct thread_stack_entry *tse; 30462306a36Sopenharmony_ci struct call_return cr = { 30562306a36Sopenharmony_ci .thread = thread, 30662306a36Sopenharmony_ci .comm = ts->comm, 30762306a36Sopenharmony_ci .db_id = 0, 30862306a36Sopenharmony_ci }; 30962306a36Sopenharmony_ci u64 *parent_db_id; 31062306a36Sopenharmony_ci 31162306a36Sopenharmony_ci tse = &ts->stack[idx]; 31262306a36Sopenharmony_ci cr.cp = tse->cp; 31362306a36Sopenharmony_ci cr.call_time = tse->timestamp; 31462306a36Sopenharmony_ci cr.return_time = timestamp; 31562306a36Sopenharmony_ci cr.branch_count = ts->branch_count - tse->branch_count; 31662306a36Sopenharmony_ci cr.insn_count = ts->insn_count - tse->insn_count; 31762306a36Sopenharmony_ci cr.cyc_count = ts->cyc_count - tse->cyc_count; 31862306a36Sopenharmony_ci cr.db_id = tse->db_id; 31962306a36Sopenharmony_ci cr.call_ref = tse->ref; 32062306a36Sopenharmony_ci cr.return_ref = ref; 32162306a36Sopenharmony_ci if (tse->no_call) 32262306a36Sopenharmony_ci cr.flags |= CALL_RETURN_NO_CALL; 32362306a36Sopenharmony_ci if (no_return) 32462306a36Sopenharmony_ci cr.flags |= CALL_RETURN_NO_RETURN; 32562306a36Sopenharmony_ci if (tse->non_call) 32662306a36Sopenharmony_ci cr.flags |= CALL_RETURN_NON_CALL; 32762306a36Sopenharmony_ci 32862306a36Sopenharmony_ci /* 32962306a36Sopenharmony_ci * The parent db_id must be assigned before exporting the child. Note 33062306a36Sopenharmony_ci * it is not possible to export the parent first because its information 33162306a36Sopenharmony_ci * is not yet complete because its 'return' has not yet been processed. 33262306a36Sopenharmony_ci */ 33362306a36Sopenharmony_ci parent_db_id = idx ? &(tse - 1)->db_id : NULL; 33462306a36Sopenharmony_ci 33562306a36Sopenharmony_ci return crp->process(&cr, parent_db_id, crp->data); 33662306a36Sopenharmony_ci} 33762306a36Sopenharmony_ci 33862306a36Sopenharmony_cistatic int __thread_stack__flush(struct thread *thread, struct thread_stack *ts) 33962306a36Sopenharmony_ci{ 34062306a36Sopenharmony_ci struct call_return_processor *crp = ts->crp; 34162306a36Sopenharmony_ci int err; 34262306a36Sopenharmony_ci 34362306a36Sopenharmony_ci if (!crp) { 34462306a36Sopenharmony_ci ts->cnt = 0; 34562306a36Sopenharmony_ci ts->br_stack_pos = 0; 34662306a36Sopenharmony_ci if (ts->br_stack_rb) 34762306a36Sopenharmony_ci ts->br_stack_rb->nr = 0; 34862306a36Sopenharmony_ci return 0; 34962306a36Sopenharmony_ci } 35062306a36Sopenharmony_ci 35162306a36Sopenharmony_ci while (ts->cnt) { 35262306a36Sopenharmony_ci err = thread_stack__call_return(thread, ts, --ts->cnt, 35362306a36Sopenharmony_ci ts->last_time, 0, true); 35462306a36Sopenharmony_ci if (err) { 35562306a36Sopenharmony_ci pr_err("Error flushing thread stack!\n"); 35662306a36Sopenharmony_ci ts->cnt = 0; 35762306a36Sopenharmony_ci return err; 35862306a36Sopenharmony_ci } 35962306a36Sopenharmony_ci } 36062306a36Sopenharmony_ci 36162306a36Sopenharmony_ci return 0; 36262306a36Sopenharmony_ci} 36362306a36Sopenharmony_ci 36462306a36Sopenharmony_ciint thread_stack__flush(struct thread *thread) 36562306a36Sopenharmony_ci{ 36662306a36Sopenharmony_ci struct thread_stack *ts = thread__ts(thread); 36762306a36Sopenharmony_ci unsigned int pos; 36862306a36Sopenharmony_ci int err = 0; 36962306a36Sopenharmony_ci 37062306a36Sopenharmony_ci if (ts) { 37162306a36Sopenharmony_ci for (pos = 0; pos < ts->arr_sz; pos++) { 37262306a36Sopenharmony_ci int ret = __thread_stack__flush(thread, ts + pos); 37362306a36Sopenharmony_ci 37462306a36Sopenharmony_ci if (ret) 37562306a36Sopenharmony_ci err = ret; 37662306a36Sopenharmony_ci } 37762306a36Sopenharmony_ci } 37862306a36Sopenharmony_ci 37962306a36Sopenharmony_ci return err; 38062306a36Sopenharmony_ci} 38162306a36Sopenharmony_ci 38262306a36Sopenharmony_cistatic void thread_stack__update_br_stack(struct thread_stack *ts, u32 flags, 38362306a36Sopenharmony_ci u64 from_ip, u64 to_ip) 38462306a36Sopenharmony_ci{ 38562306a36Sopenharmony_ci struct branch_stack *bs = ts->br_stack_rb; 38662306a36Sopenharmony_ci struct branch_entry *be; 38762306a36Sopenharmony_ci 38862306a36Sopenharmony_ci if (!ts->br_stack_pos) 38962306a36Sopenharmony_ci ts->br_stack_pos = ts->br_stack_sz; 39062306a36Sopenharmony_ci 39162306a36Sopenharmony_ci ts->br_stack_pos -= 1; 39262306a36Sopenharmony_ci 39362306a36Sopenharmony_ci be = &bs->entries[ts->br_stack_pos]; 39462306a36Sopenharmony_ci be->from = from_ip; 39562306a36Sopenharmony_ci be->to = to_ip; 39662306a36Sopenharmony_ci be->flags.value = 0; 39762306a36Sopenharmony_ci be->flags.abort = !!(flags & PERF_IP_FLAG_TX_ABORT); 39862306a36Sopenharmony_ci be->flags.in_tx = !!(flags & PERF_IP_FLAG_IN_TX); 39962306a36Sopenharmony_ci /* No support for mispredict */ 40062306a36Sopenharmony_ci be->flags.mispred = ts->mispred_all; 40162306a36Sopenharmony_ci 40262306a36Sopenharmony_ci if (bs->nr < ts->br_stack_sz) 40362306a36Sopenharmony_ci bs->nr += 1; 40462306a36Sopenharmony_ci} 40562306a36Sopenharmony_ci 40662306a36Sopenharmony_ciint thread_stack__event(struct thread *thread, int cpu, u32 flags, u64 from_ip, 40762306a36Sopenharmony_ci u64 to_ip, u16 insn_len, u64 trace_nr, bool callstack, 40862306a36Sopenharmony_ci unsigned int br_stack_sz, bool mispred_all) 40962306a36Sopenharmony_ci{ 41062306a36Sopenharmony_ci struct thread_stack *ts = thread__stack(thread, cpu); 41162306a36Sopenharmony_ci 41262306a36Sopenharmony_ci if (!thread) 41362306a36Sopenharmony_ci return -EINVAL; 41462306a36Sopenharmony_ci 41562306a36Sopenharmony_ci if (!ts) { 41662306a36Sopenharmony_ci ts = thread_stack__new(thread, cpu, NULL, callstack, br_stack_sz); 41762306a36Sopenharmony_ci if (!ts) { 41862306a36Sopenharmony_ci pr_warning("Out of memory: no thread stack\n"); 41962306a36Sopenharmony_ci return -ENOMEM; 42062306a36Sopenharmony_ci } 42162306a36Sopenharmony_ci ts->trace_nr = trace_nr; 42262306a36Sopenharmony_ci ts->mispred_all = mispred_all; 42362306a36Sopenharmony_ci } 42462306a36Sopenharmony_ci 42562306a36Sopenharmony_ci /* 42662306a36Sopenharmony_ci * When the trace is discontinuous, the trace_nr changes. In that case 42762306a36Sopenharmony_ci * the stack might be completely invalid. Better to report nothing than 42862306a36Sopenharmony_ci * to report something misleading, so flush the stack. 42962306a36Sopenharmony_ci */ 43062306a36Sopenharmony_ci if (trace_nr != ts->trace_nr) { 43162306a36Sopenharmony_ci if (ts->trace_nr) 43262306a36Sopenharmony_ci __thread_stack__flush(thread, ts); 43362306a36Sopenharmony_ci ts->trace_nr = trace_nr; 43462306a36Sopenharmony_ci } 43562306a36Sopenharmony_ci 43662306a36Sopenharmony_ci if (br_stack_sz) 43762306a36Sopenharmony_ci thread_stack__update_br_stack(ts, flags, from_ip, to_ip); 43862306a36Sopenharmony_ci 43962306a36Sopenharmony_ci /* 44062306a36Sopenharmony_ci * Stop here if thread_stack__process() is in use, or not recording call 44162306a36Sopenharmony_ci * stack. 44262306a36Sopenharmony_ci */ 44362306a36Sopenharmony_ci if (ts->crp || !callstack) 44462306a36Sopenharmony_ci return 0; 44562306a36Sopenharmony_ci 44662306a36Sopenharmony_ci if (flags & PERF_IP_FLAG_CALL) { 44762306a36Sopenharmony_ci u64 ret_addr; 44862306a36Sopenharmony_ci 44962306a36Sopenharmony_ci if (!to_ip) 45062306a36Sopenharmony_ci return 0; 45162306a36Sopenharmony_ci ret_addr = from_ip + insn_len; 45262306a36Sopenharmony_ci if (ret_addr == to_ip) 45362306a36Sopenharmony_ci return 0; /* Zero-length calls are excluded */ 45462306a36Sopenharmony_ci return thread_stack__push(ts, ret_addr, 45562306a36Sopenharmony_ci flags & PERF_IP_FLAG_TRACE_END); 45662306a36Sopenharmony_ci } else if (flags & PERF_IP_FLAG_TRACE_BEGIN) { 45762306a36Sopenharmony_ci /* 45862306a36Sopenharmony_ci * If the caller did not change the trace number (which would 45962306a36Sopenharmony_ci * have flushed the stack) then try to make sense of the stack. 46062306a36Sopenharmony_ci * Possibly, tracing began after returning to the current 46162306a36Sopenharmony_ci * address, so try to pop that. Also, do not expect a call made 46262306a36Sopenharmony_ci * when the trace ended, to return, so pop that. 46362306a36Sopenharmony_ci */ 46462306a36Sopenharmony_ci thread_stack__pop(ts, to_ip); 46562306a36Sopenharmony_ci thread_stack__pop_trace_end(ts); 46662306a36Sopenharmony_ci } else if ((flags & PERF_IP_FLAG_RETURN) && from_ip) { 46762306a36Sopenharmony_ci thread_stack__pop(ts, to_ip); 46862306a36Sopenharmony_ci } 46962306a36Sopenharmony_ci 47062306a36Sopenharmony_ci return 0; 47162306a36Sopenharmony_ci} 47262306a36Sopenharmony_ci 47362306a36Sopenharmony_civoid thread_stack__set_trace_nr(struct thread *thread, int cpu, u64 trace_nr) 47462306a36Sopenharmony_ci{ 47562306a36Sopenharmony_ci struct thread_stack *ts = thread__stack(thread, cpu); 47662306a36Sopenharmony_ci 47762306a36Sopenharmony_ci if (!ts) 47862306a36Sopenharmony_ci return; 47962306a36Sopenharmony_ci 48062306a36Sopenharmony_ci if (trace_nr != ts->trace_nr) { 48162306a36Sopenharmony_ci if (ts->trace_nr) 48262306a36Sopenharmony_ci __thread_stack__flush(thread, ts); 48362306a36Sopenharmony_ci ts->trace_nr = trace_nr; 48462306a36Sopenharmony_ci } 48562306a36Sopenharmony_ci} 48662306a36Sopenharmony_ci 48762306a36Sopenharmony_cistatic void __thread_stack__free(struct thread *thread, struct thread_stack *ts) 48862306a36Sopenharmony_ci{ 48962306a36Sopenharmony_ci __thread_stack__flush(thread, ts); 49062306a36Sopenharmony_ci zfree(&ts->stack); 49162306a36Sopenharmony_ci zfree(&ts->br_stack_rb); 49262306a36Sopenharmony_ci} 49362306a36Sopenharmony_ci 49462306a36Sopenharmony_cistatic void thread_stack__reset(struct thread *thread, struct thread_stack *ts) 49562306a36Sopenharmony_ci{ 49662306a36Sopenharmony_ci unsigned int arr_sz = ts->arr_sz; 49762306a36Sopenharmony_ci 49862306a36Sopenharmony_ci __thread_stack__free(thread, ts); 49962306a36Sopenharmony_ci memset(ts, 0, sizeof(*ts)); 50062306a36Sopenharmony_ci ts->arr_sz = arr_sz; 50162306a36Sopenharmony_ci} 50262306a36Sopenharmony_ci 50362306a36Sopenharmony_civoid thread_stack__free(struct thread *thread) 50462306a36Sopenharmony_ci{ 50562306a36Sopenharmony_ci struct thread_stack *ts = thread__ts(thread); 50662306a36Sopenharmony_ci unsigned int pos; 50762306a36Sopenharmony_ci 50862306a36Sopenharmony_ci if (ts) { 50962306a36Sopenharmony_ci for (pos = 0; pos < ts->arr_sz; pos++) 51062306a36Sopenharmony_ci __thread_stack__free(thread, ts + pos); 51162306a36Sopenharmony_ci free(thread__ts(thread)); 51262306a36Sopenharmony_ci thread__set_ts(thread, NULL); 51362306a36Sopenharmony_ci } 51462306a36Sopenharmony_ci} 51562306a36Sopenharmony_ci 51662306a36Sopenharmony_cistatic inline u64 callchain_context(u64 ip, u64 kernel_start) 51762306a36Sopenharmony_ci{ 51862306a36Sopenharmony_ci return ip < kernel_start ? PERF_CONTEXT_USER : PERF_CONTEXT_KERNEL; 51962306a36Sopenharmony_ci} 52062306a36Sopenharmony_ci 52162306a36Sopenharmony_civoid thread_stack__sample(struct thread *thread, int cpu, 52262306a36Sopenharmony_ci struct ip_callchain *chain, 52362306a36Sopenharmony_ci size_t sz, u64 ip, u64 kernel_start) 52462306a36Sopenharmony_ci{ 52562306a36Sopenharmony_ci struct thread_stack *ts = thread__stack(thread, cpu); 52662306a36Sopenharmony_ci u64 context = callchain_context(ip, kernel_start); 52762306a36Sopenharmony_ci u64 last_context; 52862306a36Sopenharmony_ci size_t i, j; 52962306a36Sopenharmony_ci 53062306a36Sopenharmony_ci if (sz < 2) { 53162306a36Sopenharmony_ci chain->nr = 0; 53262306a36Sopenharmony_ci return; 53362306a36Sopenharmony_ci } 53462306a36Sopenharmony_ci 53562306a36Sopenharmony_ci chain->ips[0] = context; 53662306a36Sopenharmony_ci chain->ips[1] = ip; 53762306a36Sopenharmony_ci 53862306a36Sopenharmony_ci if (!ts) { 53962306a36Sopenharmony_ci chain->nr = 2; 54062306a36Sopenharmony_ci return; 54162306a36Sopenharmony_ci } 54262306a36Sopenharmony_ci 54362306a36Sopenharmony_ci last_context = context; 54462306a36Sopenharmony_ci 54562306a36Sopenharmony_ci for (i = 2, j = 1; i < sz && j <= ts->cnt; i++, j++) { 54662306a36Sopenharmony_ci ip = ts->stack[ts->cnt - j].ret_addr; 54762306a36Sopenharmony_ci context = callchain_context(ip, kernel_start); 54862306a36Sopenharmony_ci if (context != last_context) { 54962306a36Sopenharmony_ci if (i >= sz - 1) 55062306a36Sopenharmony_ci break; 55162306a36Sopenharmony_ci chain->ips[i++] = context; 55262306a36Sopenharmony_ci last_context = context; 55362306a36Sopenharmony_ci } 55462306a36Sopenharmony_ci chain->ips[i] = ip; 55562306a36Sopenharmony_ci } 55662306a36Sopenharmony_ci 55762306a36Sopenharmony_ci chain->nr = i; 55862306a36Sopenharmony_ci} 55962306a36Sopenharmony_ci 56062306a36Sopenharmony_ci/* 56162306a36Sopenharmony_ci * Hardware sample records, created some time after the event occurred, need to 56262306a36Sopenharmony_ci * have subsequent addresses removed from the call chain. 56362306a36Sopenharmony_ci */ 56462306a36Sopenharmony_civoid thread_stack__sample_late(struct thread *thread, int cpu, 56562306a36Sopenharmony_ci struct ip_callchain *chain, size_t sz, 56662306a36Sopenharmony_ci u64 sample_ip, u64 kernel_start) 56762306a36Sopenharmony_ci{ 56862306a36Sopenharmony_ci struct thread_stack *ts = thread__stack(thread, cpu); 56962306a36Sopenharmony_ci u64 sample_context = callchain_context(sample_ip, kernel_start); 57062306a36Sopenharmony_ci u64 last_context, context, ip; 57162306a36Sopenharmony_ci size_t nr = 0, j; 57262306a36Sopenharmony_ci 57362306a36Sopenharmony_ci if (sz < 2) { 57462306a36Sopenharmony_ci chain->nr = 0; 57562306a36Sopenharmony_ci return; 57662306a36Sopenharmony_ci } 57762306a36Sopenharmony_ci 57862306a36Sopenharmony_ci if (!ts) 57962306a36Sopenharmony_ci goto out; 58062306a36Sopenharmony_ci 58162306a36Sopenharmony_ci /* 58262306a36Sopenharmony_ci * When tracing kernel space, kernel addresses occur at the top of the 58362306a36Sopenharmony_ci * call chain after the event occurred but before tracing stopped. 58462306a36Sopenharmony_ci * Skip them. 58562306a36Sopenharmony_ci */ 58662306a36Sopenharmony_ci for (j = 1; j <= ts->cnt; j++) { 58762306a36Sopenharmony_ci ip = ts->stack[ts->cnt - j].ret_addr; 58862306a36Sopenharmony_ci context = callchain_context(ip, kernel_start); 58962306a36Sopenharmony_ci if (context == PERF_CONTEXT_USER || 59062306a36Sopenharmony_ci (context == sample_context && ip == sample_ip)) 59162306a36Sopenharmony_ci break; 59262306a36Sopenharmony_ci } 59362306a36Sopenharmony_ci 59462306a36Sopenharmony_ci last_context = sample_ip; /* Use sample_ip as an invalid context */ 59562306a36Sopenharmony_ci 59662306a36Sopenharmony_ci for (; nr < sz && j <= ts->cnt; nr++, j++) { 59762306a36Sopenharmony_ci ip = ts->stack[ts->cnt - j].ret_addr; 59862306a36Sopenharmony_ci context = callchain_context(ip, kernel_start); 59962306a36Sopenharmony_ci if (context != last_context) { 60062306a36Sopenharmony_ci if (nr >= sz - 1) 60162306a36Sopenharmony_ci break; 60262306a36Sopenharmony_ci chain->ips[nr++] = context; 60362306a36Sopenharmony_ci last_context = context; 60462306a36Sopenharmony_ci } 60562306a36Sopenharmony_ci chain->ips[nr] = ip; 60662306a36Sopenharmony_ci } 60762306a36Sopenharmony_ciout: 60862306a36Sopenharmony_ci if (nr) { 60962306a36Sopenharmony_ci chain->nr = nr; 61062306a36Sopenharmony_ci } else { 61162306a36Sopenharmony_ci chain->ips[0] = sample_context; 61262306a36Sopenharmony_ci chain->ips[1] = sample_ip; 61362306a36Sopenharmony_ci chain->nr = 2; 61462306a36Sopenharmony_ci } 61562306a36Sopenharmony_ci} 61662306a36Sopenharmony_ci 61762306a36Sopenharmony_civoid thread_stack__br_sample(struct thread *thread, int cpu, 61862306a36Sopenharmony_ci struct branch_stack *dst, unsigned int sz) 61962306a36Sopenharmony_ci{ 62062306a36Sopenharmony_ci struct thread_stack *ts = thread__stack(thread, cpu); 62162306a36Sopenharmony_ci const size_t bsz = sizeof(struct branch_entry); 62262306a36Sopenharmony_ci struct branch_stack *src; 62362306a36Sopenharmony_ci struct branch_entry *be; 62462306a36Sopenharmony_ci unsigned int nr; 62562306a36Sopenharmony_ci 62662306a36Sopenharmony_ci dst->nr = 0; 62762306a36Sopenharmony_ci 62862306a36Sopenharmony_ci if (!ts) 62962306a36Sopenharmony_ci return; 63062306a36Sopenharmony_ci 63162306a36Sopenharmony_ci src = ts->br_stack_rb; 63262306a36Sopenharmony_ci if (!src->nr) 63362306a36Sopenharmony_ci return; 63462306a36Sopenharmony_ci 63562306a36Sopenharmony_ci dst->nr = min((unsigned int)src->nr, sz); 63662306a36Sopenharmony_ci 63762306a36Sopenharmony_ci be = &dst->entries[0]; 63862306a36Sopenharmony_ci nr = min(ts->br_stack_sz - ts->br_stack_pos, (unsigned int)dst->nr); 63962306a36Sopenharmony_ci memcpy(be, &src->entries[ts->br_stack_pos], bsz * nr); 64062306a36Sopenharmony_ci 64162306a36Sopenharmony_ci if (src->nr >= ts->br_stack_sz) { 64262306a36Sopenharmony_ci sz -= nr; 64362306a36Sopenharmony_ci be = &dst->entries[nr]; 64462306a36Sopenharmony_ci nr = min(ts->br_stack_pos, sz); 64562306a36Sopenharmony_ci memcpy(be, &src->entries[0], bsz * ts->br_stack_pos); 64662306a36Sopenharmony_ci } 64762306a36Sopenharmony_ci} 64862306a36Sopenharmony_ci 64962306a36Sopenharmony_ci/* Start of user space branch entries */ 65062306a36Sopenharmony_cistatic bool us_start(struct branch_entry *be, u64 kernel_start, bool *start) 65162306a36Sopenharmony_ci{ 65262306a36Sopenharmony_ci if (!*start) 65362306a36Sopenharmony_ci *start = be->to && be->to < kernel_start; 65462306a36Sopenharmony_ci 65562306a36Sopenharmony_ci return *start; 65662306a36Sopenharmony_ci} 65762306a36Sopenharmony_ci 65862306a36Sopenharmony_ci/* 65962306a36Sopenharmony_ci * Start of branch entries after the ip fell in between 2 branches, or user 66062306a36Sopenharmony_ci * space branch entries. 66162306a36Sopenharmony_ci */ 66262306a36Sopenharmony_cistatic bool ks_start(struct branch_entry *be, u64 sample_ip, u64 kernel_start, 66362306a36Sopenharmony_ci bool *start, struct branch_entry *nb) 66462306a36Sopenharmony_ci{ 66562306a36Sopenharmony_ci if (!*start) { 66662306a36Sopenharmony_ci *start = (nb && sample_ip >= be->to && sample_ip <= nb->from) || 66762306a36Sopenharmony_ci be->from < kernel_start || 66862306a36Sopenharmony_ci (be->to && be->to < kernel_start); 66962306a36Sopenharmony_ci } 67062306a36Sopenharmony_ci 67162306a36Sopenharmony_ci return *start; 67262306a36Sopenharmony_ci} 67362306a36Sopenharmony_ci 67462306a36Sopenharmony_ci/* 67562306a36Sopenharmony_ci * Hardware sample records, created some time after the event occurred, need to 67662306a36Sopenharmony_ci * have subsequent addresses removed from the branch stack. 67762306a36Sopenharmony_ci */ 67862306a36Sopenharmony_civoid thread_stack__br_sample_late(struct thread *thread, int cpu, 67962306a36Sopenharmony_ci struct branch_stack *dst, unsigned int sz, 68062306a36Sopenharmony_ci u64 ip, u64 kernel_start) 68162306a36Sopenharmony_ci{ 68262306a36Sopenharmony_ci struct thread_stack *ts = thread__stack(thread, cpu); 68362306a36Sopenharmony_ci struct branch_entry *d, *s, *spos, *ssz; 68462306a36Sopenharmony_ci struct branch_stack *src; 68562306a36Sopenharmony_ci unsigned int nr = 0; 68662306a36Sopenharmony_ci bool start = false; 68762306a36Sopenharmony_ci 68862306a36Sopenharmony_ci dst->nr = 0; 68962306a36Sopenharmony_ci 69062306a36Sopenharmony_ci if (!ts) 69162306a36Sopenharmony_ci return; 69262306a36Sopenharmony_ci 69362306a36Sopenharmony_ci src = ts->br_stack_rb; 69462306a36Sopenharmony_ci if (!src->nr) 69562306a36Sopenharmony_ci return; 69662306a36Sopenharmony_ci 69762306a36Sopenharmony_ci spos = &src->entries[ts->br_stack_pos]; 69862306a36Sopenharmony_ci ssz = &src->entries[ts->br_stack_sz]; 69962306a36Sopenharmony_ci 70062306a36Sopenharmony_ci d = &dst->entries[0]; 70162306a36Sopenharmony_ci s = spos; 70262306a36Sopenharmony_ci 70362306a36Sopenharmony_ci if (ip < kernel_start) { 70462306a36Sopenharmony_ci /* 70562306a36Sopenharmony_ci * User space sample: start copying branch entries when the 70662306a36Sopenharmony_ci * branch is in user space. 70762306a36Sopenharmony_ci */ 70862306a36Sopenharmony_ci for (s = spos; s < ssz && nr < sz; s++) { 70962306a36Sopenharmony_ci if (us_start(s, kernel_start, &start)) { 71062306a36Sopenharmony_ci *d++ = *s; 71162306a36Sopenharmony_ci nr += 1; 71262306a36Sopenharmony_ci } 71362306a36Sopenharmony_ci } 71462306a36Sopenharmony_ci 71562306a36Sopenharmony_ci if (src->nr >= ts->br_stack_sz) { 71662306a36Sopenharmony_ci for (s = &src->entries[0]; s < spos && nr < sz; s++) { 71762306a36Sopenharmony_ci if (us_start(s, kernel_start, &start)) { 71862306a36Sopenharmony_ci *d++ = *s; 71962306a36Sopenharmony_ci nr += 1; 72062306a36Sopenharmony_ci } 72162306a36Sopenharmony_ci } 72262306a36Sopenharmony_ci } 72362306a36Sopenharmony_ci } else { 72462306a36Sopenharmony_ci struct branch_entry *nb = NULL; 72562306a36Sopenharmony_ci 72662306a36Sopenharmony_ci /* 72762306a36Sopenharmony_ci * Kernel space sample: start copying branch entries when the ip 72862306a36Sopenharmony_ci * falls in between 2 branches (or the branch is in user space 72962306a36Sopenharmony_ci * because then the start must have been missed). 73062306a36Sopenharmony_ci */ 73162306a36Sopenharmony_ci for (s = spos; s < ssz && nr < sz; s++) { 73262306a36Sopenharmony_ci if (ks_start(s, ip, kernel_start, &start, nb)) { 73362306a36Sopenharmony_ci *d++ = *s; 73462306a36Sopenharmony_ci nr += 1; 73562306a36Sopenharmony_ci } 73662306a36Sopenharmony_ci nb = s; 73762306a36Sopenharmony_ci } 73862306a36Sopenharmony_ci 73962306a36Sopenharmony_ci if (src->nr >= ts->br_stack_sz) { 74062306a36Sopenharmony_ci for (s = &src->entries[0]; s < spos && nr < sz; s++) { 74162306a36Sopenharmony_ci if (ks_start(s, ip, kernel_start, &start, nb)) { 74262306a36Sopenharmony_ci *d++ = *s; 74362306a36Sopenharmony_ci nr += 1; 74462306a36Sopenharmony_ci } 74562306a36Sopenharmony_ci nb = s; 74662306a36Sopenharmony_ci } 74762306a36Sopenharmony_ci } 74862306a36Sopenharmony_ci } 74962306a36Sopenharmony_ci 75062306a36Sopenharmony_ci dst->nr = nr; 75162306a36Sopenharmony_ci} 75262306a36Sopenharmony_ci 75362306a36Sopenharmony_cistruct call_return_processor * 75462306a36Sopenharmony_cicall_return_processor__new(int (*process)(struct call_return *cr, u64 *parent_db_id, void *data), 75562306a36Sopenharmony_ci void *data) 75662306a36Sopenharmony_ci{ 75762306a36Sopenharmony_ci struct call_return_processor *crp; 75862306a36Sopenharmony_ci 75962306a36Sopenharmony_ci crp = zalloc(sizeof(struct call_return_processor)); 76062306a36Sopenharmony_ci if (!crp) 76162306a36Sopenharmony_ci return NULL; 76262306a36Sopenharmony_ci crp->cpr = call_path_root__new(); 76362306a36Sopenharmony_ci if (!crp->cpr) 76462306a36Sopenharmony_ci goto out_free; 76562306a36Sopenharmony_ci crp->process = process; 76662306a36Sopenharmony_ci crp->data = data; 76762306a36Sopenharmony_ci return crp; 76862306a36Sopenharmony_ci 76962306a36Sopenharmony_ciout_free: 77062306a36Sopenharmony_ci free(crp); 77162306a36Sopenharmony_ci return NULL; 77262306a36Sopenharmony_ci} 77362306a36Sopenharmony_ci 77462306a36Sopenharmony_civoid call_return_processor__free(struct call_return_processor *crp) 77562306a36Sopenharmony_ci{ 77662306a36Sopenharmony_ci if (crp) { 77762306a36Sopenharmony_ci call_path_root__free(crp->cpr); 77862306a36Sopenharmony_ci free(crp); 77962306a36Sopenharmony_ci } 78062306a36Sopenharmony_ci} 78162306a36Sopenharmony_ci 78262306a36Sopenharmony_cistatic int thread_stack__push_cp(struct thread_stack *ts, u64 ret_addr, 78362306a36Sopenharmony_ci u64 timestamp, u64 ref, struct call_path *cp, 78462306a36Sopenharmony_ci bool no_call, bool trace_end) 78562306a36Sopenharmony_ci{ 78662306a36Sopenharmony_ci struct thread_stack_entry *tse; 78762306a36Sopenharmony_ci int err; 78862306a36Sopenharmony_ci 78962306a36Sopenharmony_ci if (!cp) 79062306a36Sopenharmony_ci return -ENOMEM; 79162306a36Sopenharmony_ci 79262306a36Sopenharmony_ci if (ts->cnt == ts->sz) { 79362306a36Sopenharmony_ci err = thread_stack__grow(ts); 79462306a36Sopenharmony_ci if (err) 79562306a36Sopenharmony_ci return err; 79662306a36Sopenharmony_ci } 79762306a36Sopenharmony_ci 79862306a36Sopenharmony_ci tse = &ts->stack[ts->cnt++]; 79962306a36Sopenharmony_ci tse->ret_addr = ret_addr; 80062306a36Sopenharmony_ci tse->timestamp = timestamp; 80162306a36Sopenharmony_ci tse->ref = ref; 80262306a36Sopenharmony_ci tse->branch_count = ts->branch_count; 80362306a36Sopenharmony_ci tse->insn_count = ts->insn_count; 80462306a36Sopenharmony_ci tse->cyc_count = ts->cyc_count; 80562306a36Sopenharmony_ci tse->cp = cp; 80662306a36Sopenharmony_ci tse->no_call = no_call; 80762306a36Sopenharmony_ci tse->trace_end = trace_end; 80862306a36Sopenharmony_ci tse->non_call = false; 80962306a36Sopenharmony_ci tse->db_id = 0; 81062306a36Sopenharmony_ci 81162306a36Sopenharmony_ci return 0; 81262306a36Sopenharmony_ci} 81362306a36Sopenharmony_ci 81462306a36Sopenharmony_cistatic int thread_stack__pop_cp(struct thread *thread, struct thread_stack *ts, 81562306a36Sopenharmony_ci u64 ret_addr, u64 timestamp, u64 ref, 81662306a36Sopenharmony_ci struct symbol *sym) 81762306a36Sopenharmony_ci{ 81862306a36Sopenharmony_ci int err; 81962306a36Sopenharmony_ci 82062306a36Sopenharmony_ci if (!ts->cnt) 82162306a36Sopenharmony_ci return 1; 82262306a36Sopenharmony_ci 82362306a36Sopenharmony_ci if (ts->cnt == 1) { 82462306a36Sopenharmony_ci struct thread_stack_entry *tse = &ts->stack[0]; 82562306a36Sopenharmony_ci 82662306a36Sopenharmony_ci if (tse->cp->sym == sym) 82762306a36Sopenharmony_ci return thread_stack__call_return(thread, ts, --ts->cnt, 82862306a36Sopenharmony_ci timestamp, ref, false); 82962306a36Sopenharmony_ci } 83062306a36Sopenharmony_ci 83162306a36Sopenharmony_ci if (ts->stack[ts->cnt - 1].ret_addr == ret_addr && 83262306a36Sopenharmony_ci !ts->stack[ts->cnt - 1].non_call) { 83362306a36Sopenharmony_ci return thread_stack__call_return(thread, ts, --ts->cnt, 83462306a36Sopenharmony_ci timestamp, ref, false); 83562306a36Sopenharmony_ci } else { 83662306a36Sopenharmony_ci size_t i = ts->cnt - 1; 83762306a36Sopenharmony_ci 83862306a36Sopenharmony_ci while (i--) { 83962306a36Sopenharmony_ci if (ts->stack[i].ret_addr != ret_addr || 84062306a36Sopenharmony_ci ts->stack[i].non_call) 84162306a36Sopenharmony_ci continue; 84262306a36Sopenharmony_ci i += 1; 84362306a36Sopenharmony_ci while (ts->cnt > i) { 84462306a36Sopenharmony_ci err = thread_stack__call_return(thread, ts, 84562306a36Sopenharmony_ci --ts->cnt, 84662306a36Sopenharmony_ci timestamp, ref, 84762306a36Sopenharmony_ci true); 84862306a36Sopenharmony_ci if (err) 84962306a36Sopenharmony_ci return err; 85062306a36Sopenharmony_ci } 85162306a36Sopenharmony_ci return thread_stack__call_return(thread, ts, --ts->cnt, 85262306a36Sopenharmony_ci timestamp, ref, false); 85362306a36Sopenharmony_ci } 85462306a36Sopenharmony_ci } 85562306a36Sopenharmony_ci 85662306a36Sopenharmony_ci return 1; 85762306a36Sopenharmony_ci} 85862306a36Sopenharmony_ci 85962306a36Sopenharmony_cistatic int thread_stack__bottom(struct thread_stack *ts, 86062306a36Sopenharmony_ci struct perf_sample *sample, 86162306a36Sopenharmony_ci struct addr_location *from_al, 86262306a36Sopenharmony_ci struct addr_location *to_al, u64 ref) 86362306a36Sopenharmony_ci{ 86462306a36Sopenharmony_ci struct call_path_root *cpr = ts->crp->cpr; 86562306a36Sopenharmony_ci struct call_path *cp; 86662306a36Sopenharmony_ci struct symbol *sym; 86762306a36Sopenharmony_ci u64 ip; 86862306a36Sopenharmony_ci 86962306a36Sopenharmony_ci if (sample->ip) { 87062306a36Sopenharmony_ci ip = sample->ip; 87162306a36Sopenharmony_ci sym = from_al->sym; 87262306a36Sopenharmony_ci } else if (sample->addr) { 87362306a36Sopenharmony_ci ip = sample->addr; 87462306a36Sopenharmony_ci sym = to_al->sym; 87562306a36Sopenharmony_ci } else { 87662306a36Sopenharmony_ci return 0; 87762306a36Sopenharmony_ci } 87862306a36Sopenharmony_ci 87962306a36Sopenharmony_ci cp = call_path__findnew(cpr, &cpr->call_path, sym, ip, 88062306a36Sopenharmony_ci ts->kernel_start); 88162306a36Sopenharmony_ci 88262306a36Sopenharmony_ci return thread_stack__push_cp(ts, ip, sample->time, ref, cp, 88362306a36Sopenharmony_ci true, false); 88462306a36Sopenharmony_ci} 88562306a36Sopenharmony_ci 88662306a36Sopenharmony_cistatic int thread_stack__pop_ks(struct thread *thread, struct thread_stack *ts, 88762306a36Sopenharmony_ci struct perf_sample *sample, u64 ref) 88862306a36Sopenharmony_ci{ 88962306a36Sopenharmony_ci u64 tm = sample->time; 89062306a36Sopenharmony_ci int err; 89162306a36Sopenharmony_ci 89262306a36Sopenharmony_ci /* Return to userspace, so pop all kernel addresses */ 89362306a36Sopenharmony_ci while (thread_stack__in_kernel(ts)) { 89462306a36Sopenharmony_ci err = thread_stack__call_return(thread, ts, --ts->cnt, 89562306a36Sopenharmony_ci tm, ref, true); 89662306a36Sopenharmony_ci if (err) 89762306a36Sopenharmony_ci return err; 89862306a36Sopenharmony_ci } 89962306a36Sopenharmony_ci 90062306a36Sopenharmony_ci return 0; 90162306a36Sopenharmony_ci} 90262306a36Sopenharmony_ci 90362306a36Sopenharmony_cistatic int thread_stack__no_call_return(struct thread *thread, 90462306a36Sopenharmony_ci struct thread_stack *ts, 90562306a36Sopenharmony_ci struct perf_sample *sample, 90662306a36Sopenharmony_ci struct addr_location *from_al, 90762306a36Sopenharmony_ci struct addr_location *to_al, u64 ref) 90862306a36Sopenharmony_ci{ 90962306a36Sopenharmony_ci struct call_path_root *cpr = ts->crp->cpr; 91062306a36Sopenharmony_ci struct call_path *root = &cpr->call_path; 91162306a36Sopenharmony_ci struct symbol *fsym = from_al->sym; 91262306a36Sopenharmony_ci struct symbol *tsym = to_al->sym; 91362306a36Sopenharmony_ci struct call_path *cp, *parent; 91462306a36Sopenharmony_ci u64 ks = ts->kernel_start; 91562306a36Sopenharmony_ci u64 addr = sample->addr; 91662306a36Sopenharmony_ci u64 tm = sample->time; 91762306a36Sopenharmony_ci u64 ip = sample->ip; 91862306a36Sopenharmony_ci int err; 91962306a36Sopenharmony_ci 92062306a36Sopenharmony_ci if (ip >= ks && addr < ks) { 92162306a36Sopenharmony_ci /* Return to userspace, so pop all kernel addresses */ 92262306a36Sopenharmony_ci err = thread_stack__pop_ks(thread, ts, sample, ref); 92362306a36Sopenharmony_ci if (err) 92462306a36Sopenharmony_ci return err; 92562306a36Sopenharmony_ci 92662306a36Sopenharmony_ci /* If the stack is empty, push the userspace address */ 92762306a36Sopenharmony_ci if (!ts->cnt) { 92862306a36Sopenharmony_ci cp = call_path__findnew(cpr, root, tsym, addr, ks); 92962306a36Sopenharmony_ci return thread_stack__push_cp(ts, 0, tm, ref, cp, true, 93062306a36Sopenharmony_ci false); 93162306a36Sopenharmony_ci } 93262306a36Sopenharmony_ci } else if (thread_stack__in_kernel(ts) && ip < ks) { 93362306a36Sopenharmony_ci /* Return to userspace, so pop all kernel addresses */ 93462306a36Sopenharmony_ci err = thread_stack__pop_ks(thread, ts, sample, ref); 93562306a36Sopenharmony_ci if (err) 93662306a36Sopenharmony_ci return err; 93762306a36Sopenharmony_ci } 93862306a36Sopenharmony_ci 93962306a36Sopenharmony_ci if (ts->cnt) 94062306a36Sopenharmony_ci parent = ts->stack[ts->cnt - 1].cp; 94162306a36Sopenharmony_ci else 94262306a36Sopenharmony_ci parent = root; 94362306a36Sopenharmony_ci 94462306a36Sopenharmony_ci if (parent->sym == from_al->sym) { 94562306a36Sopenharmony_ci /* 94662306a36Sopenharmony_ci * At the bottom of the stack, assume the missing 'call' was 94762306a36Sopenharmony_ci * before the trace started. So, pop the current symbol and push 94862306a36Sopenharmony_ci * the 'to' symbol. 94962306a36Sopenharmony_ci */ 95062306a36Sopenharmony_ci if (ts->cnt == 1) { 95162306a36Sopenharmony_ci err = thread_stack__call_return(thread, ts, --ts->cnt, 95262306a36Sopenharmony_ci tm, ref, false); 95362306a36Sopenharmony_ci if (err) 95462306a36Sopenharmony_ci return err; 95562306a36Sopenharmony_ci } 95662306a36Sopenharmony_ci 95762306a36Sopenharmony_ci if (!ts->cnt) { 95862306a36Sopenharmony_ci cp = call_path__findnew(cpr, root, tsym, addr, ks); 95962306a36Sopenharmony_ci 96062306a36Sopenharmony_ci return thread_stack__push_cp(ts, addr, tm, ref, cp, 96162306a36Sopenharmony_ci true, false); 96262306a36Sopenharmony_ci } 96362306a36Sopenharmony_ci 96462306a36Sopenharmony_ci /* 96562306a36Sopenharmony_ci * Otherwise assume the 'return' is being used as a jump (e.g. 96662306a36Sopenharmony_ci * retpoline) and just push the 'to' symbol. 96762306a36Sopenharmony_ci */ 96862306a36Sopenharmony_ci cp = call_path__findnew(cpr, parent, tsym, addr, ks); 96962306a36Sopenharmony_ci 97062306a36Sopenharmony_ci err = thread_stack__push_cp(ts, 0, tm, ref, cp, true, false); 97162306a36Sopenharmony_ci if (!err) 97262306a36Sopenharmony_ci ts->stack[ts->cnt - 1].non_call = true; 97362306a36Sopenharmony_ci 97462306a36Sopenharmony_ci return err; 97562306a36Sopenharmony_ci } 97662306a36Sopenharmony_ci 97762306a36Sopenharmony_ci /* 97862306a36Sopenharmony_ci * Assume 'parent' has not yet returned, so push 'to', and then push and 97962306a36Sopenharmony_ci * pop 'from'. 98062306a36Sopenharmony_ci */ 98162306a36Sopenharmony_ci 98262306a36Sopenharmony_ci cp = call_path__findnew(cpr, parent, tsym, addr, ks); 98362306a36Sopenharmony_ci 98462306a36Sopenharmony_ci err = thread_stack__push_cp(ts, addr, tm, ref, cp, true, false); 98562306a36Sopenharmony_ci if (err) 98662306a36Sopenharmony_ci return err; 98762306a36Sopenharmony_ci 98862306a36Sopenharmony_ci cp = call_path__findnew(cpr, cp, fsym, ip, ks); 98962306a36Sopenharmony_ci 99062306a36Sopenharmony_ci err = thread_stack__push_cp(ts, ip, tm, ref, cp, true, false); 99162306a36Sopenharmony_ci if (err) 99262306a36Sopenharmony_ci return err; 99362306a36Sopenharmony_ci 99462306a36Sopenharmony_ci return thread_stack__call_return(thread, ts, --ts->cnt, tm, ref, false); 99562306a36Sopenharmony_ci} 99662306a36Sopenharmony_ci 99762306a36Sopenharmony_cistatic int thread_stack__trace_begin(struct thread *thread, 99862306a36Sopenharmony_ci struct thread_stack *ts, u64 timestamp, 99962306a36Sopenharmony_ci u64 ref) 100062306a36Sopenharmony_ci{ 100162306a36Sopenharmony_ci struct thread_stack_entry *tse; 100262306a36Sopenharmony_ci int err; 100362306a36Sopenharmony_ci 100462306a36Sopenharmony_ci if (!ts->cnt) 100562306a36Sopenharmony_ci return 0; 100662306a36Sopenharmony_ci 100762306a36Sopenharmony_ci /* Pop trace end */ 100862306a36Sopenharmony_ci tse = &ts->stack[ts->cnt - 1]; 100962306a36Sopenharmony_ci if (tse->trace_end) { 101062306a36Sopenharmony_ci err = thread_stack__call_return(thread, ts, --ts->cnt, 101162306a36Sopenharmony_ci timestamp, ref, false); 101262306a36Sopenharmony_ci if (err) 101362306a36Sopenharmony_ci return err; 101462306a36Sopenharmony_ci } 101562306a36Sopenharmony_ci 101662306a36Sopenharmony_ci return 0; 101762306a36Sopenharmony_ci} 101862306a36Sopenharmony_ci 101962306a36Sopenharmony_cistatic int thread_stack__trace_end(struct thread_stack *ts, 102062306a36Sopenharmony_ci struct perf_sample *sample, u64 ref) 102162306a36Sopenharmony_ci{ 102262306a36Sopenharmony_ci struct call_path_root *cpr = ts->crp->cpr; 102362306a36Sopenharmony_ci struct call_path *cp; 102462306a36Sopenharmony_ci u64 ret_addr; 102562306a36Sopenharmony_ci 102662306a36Sopenharmony_ci /* No point having 'trace end' on the bottom of the stack */ 102762306a36Sopenharmony_ci if (!ts->cnt || (ts->cnt == 1 && ts->stack[0].ref == ref)) 102862306a36Sopenharmony_ci return 0; 102962306a36Sopenharmony_ci 103062306a36Sopenharmony_ci cp = call_path__findnew(cpr, ts->stack[ts->cnt - 1].cp, NULL, 0, 103162306a36Sopenharmony_ci ts->kernel_start); 103262306a36Sopenharmony_ci 103362306a36Sopenharmony_ci ret_addr = sample->ip + sample->insn_len; 103462306a36Sopenharmony_ci 103562306a36Sopenharmony_ci return thread_stack__push_cp(ts, ret_addr, sample->time, ref, cp, 103662306a36Sopenharmony_ci false, true); 103762306a36Sopenharmony_ci} 103862306a36Sopenharmony_ci 103962306a36Sopenharmony_cistatic bool is_x86_retpoline(const char *name) 104062306a36Sopenharmony_ci{ 104162306a36Sopenharmony_ci return strstr(name, "__x86_indirect_thunk_") == name; 104262306a36Sopenharmony_ci} 104362306a36Sopenharmony_ci 104462306a36Sopenharmony_ci/* 104562306a36Sopenharmony_ci * x86 retpoline functions pollute the call graph. This function removes them. 104662306a36Sopenharmony_ci * This does not handle function return thunks, nor is there any improvement 104762306a36Sopenharmony_ci * for the handling of inline thunks or extern thunks. 104862306a36Sopenharmony_ci */ 104962306a36Sopenharmony_cistatic int thread_stack__x86_retpoline(struct thread_stack *ts, 105062306a36Sopenharmony_ci struct perf_sample *sample, 105162306a36Sopenharmony_ci struct addr_location *to_al) 105262306a36Sopenharmony_ci{ 105362306a36Sopenharmony_ci struct thread_stack_entry *tse = &ts->stack[ts->cnt - 1]; 105462306a36Sopenharmony_ci struct call_path_root *cpr = ts->crp->cpr; 105562306a36Sopenharmony_ci struct symbol *sym = tse->cp->sym; 105662306a36Sopenharmony_ci struct symbol *tsym = to_al->sym; 105762306a36Sopenharmony_ci struct call_path *cp; 105862306a36Sopenharmony_ci 105962306a36Sopenharmony_ci if (sym && is_x86_retpoline(sym->name)) { 106062306a36Sopenharmony_ci /* 106162306a36Sopenharmony_ci * This is a x86 retpoline fn. It pollutes the call graph by 106262306a36Sopenharmony_ci * showing up everywhere there is an indirect branch, but does 106362306a36Sopenharmony_ci * not itself mean anything. Here the top-of-stack is removed, 106462306a36Sopenharmony_ci * by decrementing the stack count, and then further down, the 106562306a36Sopenharmony_ci * resulting top-of-stack is replaced with the actual target. 106662306a36Sopenharmony_ci * The result is that the retpoline functions will no longer 106762306a36Sopenharmony_ci * appear in the call graph. Note this only affects the call 106862306a36Sopenharmony_ci * graph, since all the original branches are left unchanged. 106962306a36Sopenharmony_ci */ 107062306a36Sopenharmony_ci ts->cnt -= 1; 107162306a36Sopenharmony_ci sym = ts->stack[ts->cnt - 2].cp->sym; 107262306a36Sopenharmony_ci if (sym && sym == tsym && to_al->addr != tsym->start) { 107362306a36Sopenharmony_ci /* 107462306a36Sopenharmony_ci * Target is back to the middle of the symbol we came 107562306a36Sopenharmony_ci * from so assume it is an indirect jmp and forget it 107662306a36Sopenharmony_ci * altogether. 107762306a36Sopenharmony_ci */ 107862306a36Sopenharmony_ci ts->cnt -= 1; 107962306a36Sopenharmony_ci return 0; 108062306a36Sopenharmony_ci } 108162306a36Sopenharmony_ci } else if (sym && sym == tsym) { 108262306a36Sopenharmony_ci /* 108362306a36Sopenharmony_ci * Target is back to the symbol we came from so assume it is an 108462306a36Sopenharmony_ci * indirect jmp and forget it altogether. 108562306a36Sopenharmony_ci */ 108662306a36Sopenharmony_ci ts->cnt -= 1; 108762306a36Sopenharmony_ci return 0; 108862306a36Sopenharmony_ci } 108962306a36Sopenharmony_ci 109062306a36Sopenharmony_ci cp = call_path__findnew(cpr, ts->stack[ts->cnt - 2].cp, tsym, 109162306a36Sopenharmony_ci sample->addr, ts->kernel_start); 109262306a36Sopenharmony_ci if (!cp) 109362306a36Sopenharmony_ci return -ENOMEM; 109462306a36Sopenharmony_ci 109562306a36Sopenharmony_ci /* Replace the top-of-stack with the actual target */ 109662306a36Sopenharmony_ci ts->stack[ts->cnt - 1].cp = cp; 109762306a36Sopenharmony_ci 109862306a36Sopenharmony_ci return 0; 109962306a36Sopenharmony_ci} 110062306a36Sopenharmony_ci 110162306a36Sopenharmony_ciint thread_stack__process(struct thread *thread, struct comm *comm, 110262306a36Sopenharmony_ci struct perf_sample *sample, 110362306a36Sopenharmony_ci struct addr_location *from_al, 110462306a36Sopenharmony_ci struct addr_location *to_al, u64 ref, 110562306a36Sopenharmony_ci struct call_return_processor *crp) 110662306a36Sopenharmony_ci{ 110762306a36Sopenharmony_ci struct thread_stack *ts = thread__stack(thread, sample->cpu); 110862306a36Sopenharmony_ci enum retpoline_state_t rstate; 110962306a36Sopenharmony_ci int err = 0; 111062306a36Sopenharmony_ci 111162306a36Sopenharmony_ci if (ts && !ts->crp) { 111262306a36Sopenharmony_ci /* Supersede thread_stack__event() */ 111362306a36Sopenharmony_ci thread_stack__reset(thread, ts); 111462306a36Sopenharmony_ci ts = NULL; 111562306a36Sopenharmony_ci } 111662306a36Sopenharmony_ci 111762306a36Sopenharmony_ci if (!ts) { 111862306a36Sopenharmony_ci ts = thread_stack__new(thread, sample->cpu, crp, true, 0); 111962306a36Sopenharmony_ci if (!ts) 112062306a36Sopenharmony_ci return -ENOMEM; 112162306a36Sopenharmony_ci ts->comm = comm; 112262306a36Sopenharmony_ci } 112362306a36Sopenharmony_ci 112462306a36Sopenharmony_ci rstate = ts->rstate; 112562306a36Sopenharmony_ci if (rstate == X86_RETPOLINE_DETECTED) 112662306a36Sopenharmony_ci ts->rstate = X86_RETPOLINE_POSSIBLE; 112762306a36Sopenharmony_ci 112862306a36Sopenharmony_ci /* Flush stack on exec */ 112962306a36Sopenharmony_ci if (ts->comm != comm && thread__pid(thread) == thread__tid(thread)) { 113062306a36Sopenharmony_ci err = __thread_stack__flush(thread, ts); 113162306a36Sopenharmony_ci if (err) 113262306a36Sopenharmony_ci return err; 113362306a36Sopenharmony_ci ts->comm = comm; 113462306a36Sopenharmony_ci } 113562306a36Sopenharmony_ci 113662306a36Sopenharmony_ci /* If the stack is empty, put the current symbol on the stack */ 113762306a36Sopenharmony_ci if (!ts->cnt) { 113862306a36Sopenharmony_ci err = thread_stack__bottom(ts, sample, from_al, to_al, ref); 113962306a36Sopenharmony_ci if (err) 114062306a36Sopenharmony_ci return err; 114162306a36Sopenharmony_ci } 114262306a36Sopenharmony_ci 114362306a36Sopenharmony_ci ts->branch_count += 1; 114462306a36Sopenharmony_ci ts->insn_count += sample->insn_cnt; 114562306a36Sopenharmony_ci ts->cyc_count += sample->cyc_cnt; 114662306a36Sopenharmony_ci ts->last_time = sample->time; 114762306a36Sopenharmony_ci 114862306a36Sopenharmony_ci if (sample->flags & PERF_IP_FLAG_CALL) { 114962306a36Sopenharmony_ci bool trace_end = sample->flags & PERF_IP_FLAG_TRACE_END; 115062306a36Sopenharmony_ci struct call_path_root *cpr = ts->crp->cpr; 115162306a36Sopenharmony_ci struct call_path *cp; 115262306a36Sopenharmony_ci u64 ret_addr; 115362306a36Sopenharmony_ci 115462306a36Sopenharmony_ci if (!sample->ip || !sample->addr) 115562306a36Sopenharmony_ci return 0; 115662306a36Sopenharmony_ci 115762306a36Sopenharmony_ci ret_addr = sample->ip + sample->insn_len; 115862306a36Sopenharmony_ci if (ret_addr == sample->addr) 115962306a36Sopenharmony_ci return 0; /* Zero-length calls are excluded */ 116062306a36Sopenharmony_ci 116162306a36Sopenharmony_ci cp = call_path__findnew(cpr, ts->stack[ts->cnt - 1].cp, 116262306a36Sopenharmony_ci to_al->sym, sample->addr, 116362306a36Sopenharmony_ci ts->kernel_start); 116462306a36Sopenharmony_ci err = thread_stack__push_cp(ts, ret_addr, sample->time, ref, 116562306a36Sopenharmony_ci cp, false, trace_end); 116662306a36Sopenharmony_ci 116762306a36Sopenharmony_ci /* 116862306a36Sopenharmony_ci * A call to the same symbol but not the start of the symbol, 116962306a36Sopenharmony_ci * may be the start of a x86 retpoline. 117062306a36Sopenharmony_ci */ 117162306a36Sopenharmony_ci if (!err && rstate == X86_RETPOLINE_POSSIBLE && to_al->sym && 117262306a36Sopenharmony_ci from_al->sym == to_al->sym && 117362306a36Sopenharmony_ci to_al->addr != to_al->sym->start) 117462306a36Sopenharmony_ci ts->rstate = X86_RETPOLINE_DETECTED; 117562306a36Sopenharmony_ci 117662306a36Sopenharmony_ci } else if (sample->flags & PERF_IP_FLAG_RETURN) { 117762306a36Sopenharmony_ci if (!sample->addr) { 117862306a36Sopenharmony_ci u32 return_from_kernel = PERF_IP_FLAG_SYSCALLRET | 117962306a36Sopenharmony_ci PERF_IP_FLAG_INTERRUPT; 118062306a36Sopenharmony_ci 118162306a36Sopenharmony_ci if (!(sample->flags & return_from_kernel)) 118262306a36Sopenharmony_ci return 0; 118362306a36Sopenharmony_ci 118462306a36Sopenharmony_ci /* Pop kernel stack */ 118562306a36Sopenharmony_ci return thread_stack__pop_ks(thread, ts, sample, ref); 118662306a36Sopenharmony_ci } 118762306a36Sopenharmony_ci 118862306a36Sopenharmony_ci if (!sample->ip) 118962306a36Sopenharmony_ci return 0; 119062306a36Sopenharmony_ci 119162306a36Sopenharmony_ci /* x86 retpoline 'return' doesn't match the stack */ 119262306a36Sopenharmony_ci if (rstate == X86_RETPOLINE_DETECTED && ts->cnt > 2 && 119362306a36Sopenharmony_ci ts->stack[ts->cnt - 1].ret_addr != sample->addr) 119462306a36Sopenharmony_ci return thread_stack__x86_retpoline(ts, sample, to_al); 119562306a36Sopenharmony_ci 119662306a36Sopenharmony_ci err = thread_stack__pop_cp(thread, ts, sample->addr, 119762306a36Sopenharmony_ci sample->time, ref, from_al->sym); 119862306a36Sopenharmony_ci if (err) { 119962306a36Sopenharmony_ci if (err < 0) 120062306a36Sopenharmony_ci return err; 120162306a36Sopenharmony_ci err = thread_stack__no_call_return(thread, ts, sample, 120262306a36Sopenharmony_ci from_al, to_al, ref); 120362306a36Sopenharmony_ci } 120462306a36Sopenharmony_ci } else if (sample->flags & PERF_IP_FLAG_TRACE_BEGIN) { 120562306a36Sopenharmony_ci err = thread_stack__trace_begin(thread, ts, sample->time, ref); 120662306a36Sopenharmony_ci } else if (sample->flags & PERF_IP_FLAG_TRACE_END) { 120762306a36Sopenharmony_ci err = thread_stack__trace_end(ts, sample, ref); 120862306a36Sopenharmony_ci } else if (sample->flags & PERF_IP_FLAG_BRANCH && 120962306a36Sopenharmony_ci from_al->sym != to_al->sym && to_al->sym && 121062306a36Sopenharmony_ci to_al->addr == to_al->sym->start) { 121162306a36Sopenharmony_ci struct call_path_root *cpr = ts->crp->cpr; 121262306a36Sopenharmony_ci struct call_path *cp; 121362306a36Sopenharmony_ci 121462306a36Sopenharmony_ci /* 121562306a36Sopenharmony_ci * The compiler might optimize a call/ret combination by making 121662306a36Sopenharmony_ci * it a jmp. Make that visible by recording on the stack a 121762306a36Sopenharmony_ci * branch to the start of a different symbol. Note, that means 121862306a36Sopenharmony_ci * when a ret pops the stack, all jmps must be popped off first. 121962306a36Sopenharmony_ci */ 122062306a36Sopenharmony_ci cp = call_path__findnew(cpr, ts->stack[ts->cnt - 1].cp, 122162306a36Sopenharmony_ci to_al->sym, sample->addr, 122262306a36Sopenharmony_ci ts->kernel_start); 122362306a36Sopenharmony_ci err = thread_stack__push_cp(ts, 0, sample->time, ref, cp, false, 122462306a36Sopenharmony_ci false); 122562306a36Sopenharmony_ci if (!err) 122662306a36Sopenharmony_ci ts->stack[ts->cnt - 1].non_call = true; 122762306a36Sopenharmony_ci } 122862306a36Sopenharmony_ci 122962306a36Sopenharmony_ci return err; 123062306a36Sopenharmony_ci} 123162306a36Sopenharmony_ci 123262306a36Sopenharmony_cisize_t thread_stack__depth(struct thread *thread, int cpu) 123362306a36Sopenharmony_ci{ 123462306a36Sopenharmony_ci struct thread_stack *ts = thread__stack(thread, cpu); 123562306a36Sopenharmony_ci 123662306a36Sopenharmony_ci if (!ts) 123762306a36Sopenharmony_ci return 0; 123862306a36Sopenharmony_ci return ts->cnt; 123962306a36Sopenharmony_ci} 1240