162306a36Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0-only
262306a36Sopenharmony_ci/*
362306a36Sopenharmony_ci * thread-stack.c: Synthesize a thread's stack using call / return events
462306a36Sopenharmony_ci * Copyright (c) 2014, Intel Corporation.
562306a36Sopenharmony_ci */
662306a36Sopenharmony_ci
762306a36Sopenharmony_ci#include <linux/rbtree.h>
862306a36Sopenharmony_ci#include <linux/list.h>
962306a36Sopenharmony_ci#include <linux/log2.h>
1062306a36Sopenharmony_ci#include <linux/zalloc.h>
1162306a36Sopenharmony_ci#include <errno.h>
1262306a36Sopenharmony_ci#include <stdlib.h>
1362306a36Sopenharmony_ci#include <string.h>
1462306a36Sopenharmony_ci#include "thread.h"
1562306a36Sopenharmony_ci#include "event.h"
1662306a36Sopenharmony_ci#include "machine.h"
1762306a36Sopenharmony_ci#include "env.h"
1862306a36Sopenharmony_ci#include "debug.h"
1962306a36Sopenharmony_ci#include "symbol.h"
2062306a36Sopenharmony_ci#include "comm.h"
2162306a36Sopenharmony_ci#include "call-path.h"
2262306a36Sopenharmony_ci#include "thread-stack.h"
2362306a36Sopenharmony_ci
2462306a36Sopenharmony_ci#define STACK_GROWTH 2048
2562306a36Sopenharmony_ci
2662306a36Sopenharmony_ci/*
2762306a36Sopenharmony_ci * State of retpoline detection.
2862306a36Sopenharmony_ci *
2962306a36Sopenharmony_ci * RETPOLINE_NONE: no retpoline detection
3062306a36Sopenharmony_ci * X86_RETPOLINE_POSSIBLE: x86 retpoline possible
3162306a36Sopenharmony_ci * X86_RETPOLINE_DETECTED: x86 retpoline detected
3262306a36Sopenharmony_ci */
3362306a36Sopenharmony_cienum retpoline_state_t {
3462306a36Sopenharmony_ci	RETPOLINE_NONE,
3562306a36Sopenharmony_ci	X86_RETPOLINE_POSSIBLE,
3662306a36Sopenharmony_ci	X86_RETPOLINE_DETECTED,
3762306a36Sopenharmony_ci};
3862306a36Sopenharmony_ci
3962306a36Sopenharmony_ci/**
4062306a36Sopenharmony_ci * struct thread_stack_entry - thread stack entry.
4162306a36Sopenharmony_ci * @ret_addr: return address
4262306a36Sopenharmony_ci * @timestamp: timestamp (if known)
4362306a36Sopenharmony_ci * @ref: external reference (e.g. db_id of sample)
4462306a36Sopenharmony_ci * @branch_count: the branch count when the entry was created
4562306a36Sopenharmony_ci * @insn_count: the instruction count when the entry was created
4662306a36Sopenharmony_ci * @cyc_count the cycle count when the entry was created
4762306a36Sopenharmony_ci * @db_id: id used for db-export
4862306a36Sopenharmony_ci * @cp: call path
4962306a36Sopenharmony_ci * @no_call: a 'call' was not seen
5062306a36Sopenharmony_ci * @trace_end: a 'call' but trace ended
5162306a36Sopenharmony_ci * @non_call: a branch but not a 'call' to the start of a different symbol
5262306a36Sopenharmony_ci */
5362306a36Sopenharmony_cistruct thread_stack_entry {
5462306a36Sopenharmony_ci	u64 ret_addr;
5562306a36Sopenharmony_ci	u64 timestamp;
5662306a36Sopenharmony_ci	u64 ref;
5762306a36Sopenharmony_ci	u64 branch_count;
5862306a36Sopenharmony_ci	u64 insn_count;
5962306a36Sopenharmony_ci	u64 cyc_count;
6062306a36Sopenharmony_ci	u64 db_id;
6162306a36Sopenharmony_ci	struct call_path *cp;
6262306a36Sopenharmony_ci	bool no_call;
6362306a36Sopenharmony_ci	bool trace_end;
6462306a36Sopenharmony_ci	bool non_call;
6562306a36Sopenharmony_ci};
6662306a36Sopenharmony_ci
6762306a36Sopenharmony_ci/**
6862306a36Sopenharmony_ci * struct thread_stack - thread stack constructed from 'call' and 'return'
6962306a36Sopenharmony_ci *                       branch samples.
7062306a36Sopenharmony_ci * @stack: array that holds the stack
7162306a36Sopenharmony_ci * @cnt: number of entries in the stack
7262306a36Sopenharmony_ci * @sz: current maximum stack size
7362306a36Sopenharmony_ci * @trace_nr: current trace number
7462306a36Sopenharmony_ci * @branch_count: running branch count
7562306a36Sopenharmony_ci * @insn_count: running  instruction count
7662306a36Sopenharmony_ci * @cyc_count running  cycle count
7762306a36Sopenharmony_ci * @kernel_start: kernel start address
7862306a36Sopenharmony_ci * @last_time: last timestamp
7962306a36Sopenharmony_ci * @crp: call/return processor
8062306a36Sopenharmony_ci * @comm: current comm
8162306a36Sopenharmony_ci * @arr_sz: size of array if this is the first element of an array
8262306a36Sopenharmony_ci * @rstate: used to detect retpolines
8362306a36Sopenharmony_ci * @br_stack_rb: branch stack (ring buffer)
8462306a36Sopenharmony_ci * @br_stack_sz: maximum branch stack size
8562306a36Sopenharmony_ci * @br_stack_pos: current position in @br_stack_rb
8662306a36Sopenharmony_ci * @mispred_all: mark all branches as mispredicted
8762306a36Sopenharmony_ci */
8862306a36Sopenharmony_cistruct thread_stack {
8962306a36Sopenharmony_ci	struct thread_stack_entry *stack;
9062306a36Sopenharmony_ci	size_t cnt;
9162306a36Sopenharmony_ci	size_t sz;
9262306a36Sopenharmony_ci	u64 trace_nr;
9362306a36Sopenharmony_ci	u64 branch_count;
9462306a36Sopenharmony_ci	u64 insn_count;
9562306a36Sopenharmony_ci	u64 cyc_count;
9662306a36Sopenharmony_ci	u64 kernel_start;
9762306a36Sopenharmony_ci	u64 last_time;
9862306a36Sopenharmony_ci	struct call_return_processor *crp;
9962306a36Sopenharmony_ci	struct comm *comm;
10062306a36Sopenharmony_ci	unsigned int arr_sz;
10162306a36Sopenharmony_ci	enum retpoline_state_t rstate;
10262306a36Sopenharmony_ci	struct branch_stack *br_stack_rb;
10362306a36Sopenharmony_ci	unsigned int br_stack_sz;
10462306a36Sopenharmony_ci	unsigned int br_stack_pos;
10562306a36Sopenharmony_ci	bool mispred_all;
10662306a36Sopenharmony_ci};
10762306a36Sopenharmony_ci
10862306a36Sopenharmony_ci/*
10962306a36Sopenharmony_ci * Assume pid == tid == 0 identifies the idle task as defined by
11062306a36Sopenharmony_ci * perf_session__register_idle_thread(). The idle task is really 1 task per cpu,
11162306a36Sopenharmony_ci * and therefore requires a stack for each cpu.
11262306a36Sopenharmony_ci */
11362306a36Sopenharmony_cistatic inline bool thread_stack__per_cpu(struct thread *thread)
11462306a36Sopenharmony_ci{
11562306a36Sopenharmony_ci	return !(thread__tid(thread) || thread__pid(thread));
11662306a36Sopenharmony_ci}
11762306a36Sopenharmony_ci
11862306a36Sopenharmony_cistatic int thread_stack__grow(struct thread_stack *ts)
11962306a36Sopenharmony_ci{
12062306a36Sopenharmony_ci	struct thread_stack_entry *new_stack;
12162306a36Sopenharmony_ci	size_t sz, new_sz;
12262306a36Sopenharmony_ci
12362306a36Sopenharmony_ci	new_sz = ts->sz + STACK_GROWTH;
12462306a36Sopenharmony_ci	sz = new_sz * sizeof(struct thread_stack_entry);
12562306a36Sopenharmony_ci
12662306a36Sopenharmony_ci	new_stack = realloc(ts->stack, sz);
12762306a36Sopenharmony_ci	if (!new_stack)
12862306a36Sopenharmony_ci		return -ENOMEM;
12962306a36Sopenharmony_ci
13062306a36Sopenharmony_ci	ts->stack = new_stack;
13162306a36Sopenharmony_ci	ts->sz = new_sz;
13262306a36Sopenharmony_ci
13362306a36Sopenharmony_ci	return 0;
13462306a36Sopenharmony_ci}
13562306a36Sopenharmony_ci
13662306a36Sopenharmony_cistatic int thread_stack__init(struct thread_stack *ts, struct thread *thread,
13762306a36Sopenharmony_ci			      struct call_return_processor *crp,
13862306a36Sopenharmony_ci			      bool callstack, unsigned int br_stack_sz)
13962306a36Sopenharmony_ci{
14062306a36Sopenharmony_ci	int err;
14162306a36Sopenharmony_ci
14262306a36Sopenharmony_ci	if (callstack) {
14362306a36Sopenharmony_ci		err = thread_stack__grow(ts);
14462306a36Sopenharmony_ci		if (err)
14562306a36Sopenharmony_ci			return err;
14662306a36Sopenharmony_ci	}
14762306a36Sopenharmony_ci
14862306a36Sopenharmony_ci	if (br_stack_sz) {
14962306a36Sopenharmony_ci		size_t sz = sizeof(struct branch_stack);
15062306a36Sopenharmony_ci
15162306a36Sopenharmony_ci		sz += br_stack_sz * sizeof(struct branch_entry);
15262306a36Sopenharmony_ci		ts->br_stack_rb = zalloc(sz);
15362306a36Sopenharmony_ci		if (!ts->br_stack_rb)
15462306a36Sopenharmony_ci			return -ENOMEM;
15562306a36Sopenharmony_ci		ts->br_stack_sz = br_stack_sz;
15662306a36Sopenharmony_ci	}
15762306a36Sopenharmony_ci
15862306a36Sopenharmony_ci	if (thread__maps(thread) && maps__machine(thread__maps(thread))) {
15962306a36Sopenharmony_ci		struct machine *machine = maps__machine(thread__maps(thread));
16062306a36Sopenharmony_ci		const char *arch = perf_env__arch(machine->env);
16162306a36Sopenharmony_ci
16262306a36Sopenharmony_ci		ts->kernel_start = machine__kernel_start(machine);
16362306a36Sopenharmony_ci		if (!strcmp(arch, "x86"))
16462306a36Sopenharmony_ci			ts->rstate = X86_RETPOLINE_POSSIBLE;
16562306a36Sopenharmony_ci	} else {
16662306a36Sopenharmony_ci		ts->kernel_start = 1ULL << 63;
16762306a36Sopenharmony_ci	}
16862306a36Sopenharmony_ci	ts->crp = crp;
16962306a36Sopenharmony_ci
17062306a36Sopenharmony_ci	return 0;
17162306a36Sopenharmony_ci}
17262306a36Sopenharmony_ci
17362306a36Sopenharmony_cistatic struct thread_stack *thread_stack__new(struct thread *thread, int cpu,
17462306a36Sopenharmony_ci					      struct call_return_processor *crp,
17562306a36Sopenharmony_ci					      bool callstack,
17662306a36Sopenharmony_ci					      unsigned int br_stack_sz)
17762306a36Sopenharmony_ci{
17862306a36Sopenharmony_ci	struct thread_stack *ts = thread__ts(thread), *new_ts;
17962306a36Sopenharmony_ci	unsigned int old_sz = ts ? ts->arr_sz : 0;
18062306a36Sopenharmony_ci	unsigned int new_sz = 1;
18162306a36Sopenharmony_ci
18262306a36Sopenharmony_ci	if (thread_stack__per_cpu(thread) && cpu > 0)
18362306a36Sopenharmony_ci		new_sz = roundup_pow_of_two(cpu + 1);
18462306a36Sopenharmony_ci
18562306a36Sopenharmony_ci	if (!ts || new_sz > old_sz) {
18662306a36Sopenharmony_ci		new_ts = calloc(new_sz, sizeof(*ts));
18762306a36Sopenharmony_ci		if (!new_ts)
18862306a36Sopenharmony_ci			return NULL;
18962306a36Sopenharmony_ci		if (ts)
19062306a36Sopenharmony_ci			memcpy(new_ts, ts, old_sz * sizeof(*ts));
19162306a36Sopenharmony_ci		new_ts->arr_sz = new_sz;
19262306a36Sopenharmony_ci		free(thread__ts(thread));
19362306a36Sopenharmony_ci		thread__set_ts(thread, new_ts);
19462306a36Sopenharmony_ci		ts = new_ts;
19562306a36Sopenharmony_ci	}
19662306a36Sopenharmony_ci
19762306a36Sopenharmony_ci	if (thread_stack__per_cpu(thread) && cpu > 0 &&
19862306a36Sopenharmony_ci	    (unsigned int)cpu < ts->arr_sz)
19962306a36Sopenharmony_ci		ts += cpu;
20062306a36Sopenharmony_ci
20162306a36Sopenharmony_ci	if (!ts->stack &&
20262306a36Sopenharmony_ci	    thread_stack__init(ts, thread, crp, callstack, br_stack_sz))
20362306a36Sopenharmony_ci		return NULL;
20462306a36Sopenharmony_ci
20562306a36Sopenharmony_ci	return ts;
20662306a36Sopenharmony_ci}
20762306a36Sopenharmony_ci
20862306a36Sopenharmony_cistatic struct thread_stack *thread__cpu_stack(struct thread *thread, int cpu)
20962306a36Sopenharmony_ci{
21062306a36Sopenharmony_ci	struct thread_stack *ts = thread__ts(thread);
21162306a36Sopenharmony_ci
21262306a36Sopenharmony_ci	if (cpu < 0)
21362306a36Sopenharmony_ci		cpu = 0;
21462306a36Sopenharmony_ci
21562306a36Sopenharmony_ci	if (!ts || (unsigned int)cpu >= ts->arr_sz)
21662306a36Sopenharmony_ci		return NULL;
21762306a36Sopenharmony_ci
21862306a36Sopenharmony_ci	ts += cpu;
21962306a36Sopenharmony_ci
22062306a36Sopenharmony_ci	if (!ts->stack)
22162306a36Sopenharmony_ci		return NULL;
22262306a36Sopenharmony_ci
22362306a36Sopenharmony_ci	return ts;
22462306a36Sopenharmony_ci}
22562306a36Sopenharmony_ci
22662306a36Sopenharmony_cistatic inline struct thread_stack *thread__stack(struct thread *thread,
22762306a36Sopenharmony_ci						    int cpu)
22862306a36Sopenharmony_ci{
22962306a36Sopenharmony_ci	if (!thread)
23062306a36Sopenharmony_ci		return NULL;
23162306a36Sopenharmony_ci
23262306a36Sopenharmony_ci	if (thread_stack__per_cpu(thread))
23362306a36Sopenharmony_ci		return thread__cpu_stack(thread, cpu);
23462306a36Sopenharmony_ci
23562306a36Sopenharmony_ci	return thread__ts(thread);
23662306a36Sopenharmony_ci}
23762306a36Sopenharmony_ci
23862306a36Sopenharmony_cistatic int thread_stack__push(struct thread_stack *ts, u64 ret_addr,
23962306a36Sopenharmony_ci			      bool trace_end)
24062306a36Sopenharmony_ci{
24162306a36Sopenharmony_ci	int err = 0;
24262306a36Sopenharmony_ci
24362306a36Sopenharmony_ci	if (ts->cnt == ts->sz) {
24462306a36Sopenharmony_ci		err = thread_stack__grow(ts);
24562306a36Sopenharmony_ci		if (err) {
24662306a36Sopenharmony_ci			pr_warning("Out of memory: discarding thread stack\n");
24762306a36Sopenharmony_ci			ts->cnt = 0;
24862306a36Sopenharmony_ci		}
24962306a36Sopenharmony_ci	}
25062306a36Sopenharmony_ci
25162306a36Sopenharmony_ci	ts->stack[ts->cnt].trace_end = trace_end;
25262306a36Sopenharmony_ci	ts->stack[ts->cnt++].ret_addr = ret_addr;
25362306a36Sopenharmony_ci
25462306a36Sopenharmony_ci	return err;
25562306a36Sopenharmony_ci}
25662306a36Sopenharmony_ci
25762306a36Sopenharmony_cistatic void thread_stack__pop(struct thread_stack *ts, u64 ret_addr)
25862306a36Sopenharmony_ci{
25962306a36Sopenharmony_ci	size_t i;
26062306a36Sopenharmony_ci
26162306a36Sopenharmony_ci	/*
26262306a36Sopenharmony_ci	 * In some cases there may be functions which are not seen to return.
26362306a36Sopenharmony_ci	 * For example when setjmp / longjmp has been used.  Or the perf context
26462306a36Sopenharmony_ci	 * switch in the kernel which doesn't stop and start tracing in exactly
26562306a36Sopenharmony_ci	 * the same code path.  When that happens the return address will be
26662306a36Sopenharmony_ci	 * further down the stack.  If the return address is not found at all,
26762306a36Sopenharmony_ci	 * we assume the opposite (i.e. this is a return for a call that wasn't
26862306a36Sopenharmony_ci	 * seen for some reason) and leave the stack alone.
26962306a36Sopenharmony_ci	 */
27062306a36Sopenharmony_ci	for (i = ts->cnt; i; ) {
27162306a36Sopenharmony_ci		if (ts->stack[--i].ret_addr == ret_addr) {
27262306a36Sopenharmony_ci			ts->cnt = i;
27362306a36Sopenharmony_ci			return;
27462306a36Sopenharmony_ci		}
27562306a36Sopenharmony_ci	}
27662306a36Sopenharmony_ci}
27762306a36Sopenharmony_ci
27862306a36Sopenharmony_cistatic void thread_stack__pop_trace_end(struct thread_stack *ts)
27962306a36Sopenharmony_ci{
28062306a36Sopenharmony_ci	size_t i;
28162306a36Sopenharmony_ci
28262306a36Sopenharmony_ci	for (i = ts->cnt; i; ) {
28362306a36Sopenharmony_ci		if (ts->stack[--i].trace_end)
28462306a36Sopenharmony_ci			ts->cnt = i;
28562306a36Sopenharmony_ci		else
28662306a36Sopenharmony_ci			return;
28762306a36Sopenharmony_ci	}
28862306a36Sopenharmony_ci}
28962306a36Sopenharmony_ci
29062306a36Sopenharmony_cistatic bool thread_stack__in_kernel(struct thread_stack *ts)
29162306a36Sopenharmony_ci{
29262306a36Sopenharmony_ci	if (!ts->cnt)
29362306a36Sopenharmony_ci		return false;
29462306a36Sopenharmony_ci
29562306a36Sopenharmony_ci	return ts->stack[ts->cnt - 1].cp->in_kernel;
29662306a36Sopenharmony_ci}
29762306a36Sopenharmony_ci
29862306a36Sopenharmony_cistatic int thread_stack__call_return(struct thread *thread,
29962306a36Sopenharmony_ci				     struct thread_stack *ts, size_t idx,
30062306a36Sopenharmony_ci				     u64 timestamp, u64 ref, bool no_return)
30162306a36Sopenharmony_ci{
30262306a36Sopenharmony_ci	struct call_return_processor *crp = ts->crp;
30362306a36Sopenharmony_ci	struct thread_stack_entry *tse;
30462306a36Sopenharmony_ci	struct call_return cr = {
30562306a36Sopenharmony_ci		.thread = thread,
30662306a36Sopenharmony_ci		.comm = ts->comm,
30762306a36Sopenharmony_ci		.db_id = 0,
30862306a36Sopenharmony_ci	};
30962306a36Sopenharmony_ci	u64 *parent_db_id;
31062306a36Sopenharmony_ci
31162306a36Sopenharmony_ci	tse = &ts->stack[idx];
31262306a36Sopenharmony_ci	cr.cp = tse->cp;
31362306a36Sopenharmony_ci	cr.call_time = tse->timestamp;
31462306a36Sopenharmony_ci	cr.return_time = timestamp;
31562306a36Sopenharmony_ci	cr.branch_count = ts->branch_count - tse->branch_count;
31662306a36Sopenharmony_ci	cr.insn_count = ts->insn_count - tse->insn_count;
31762306a36Sopenharmony_ci	cr.cyc_count = ts->cyc_count - tse->cyc_count;
31862306a36Sopenharmony_ci	cr.db_id = tse->db_id;
31962306a36Sopenharmony_ci	cr.call_ref = tse->ref;
32062306a36Sopenharmony_ci	cr.return_ref = ref;
32162306a36Sopenharmony_ci	if (tse->no_call)
32262306a36Sopenharmony_ci		cr.flags |= CALL_RETURN_NO_CALL;
32362306a36Sopenharmony_ci	if (no_return)
32462306a36Sopenharmony_ci		cr.flags |= CALL_RETURN_NO_RETURN;
32562306a36Sopenharmony_ci	if (tse->non_call)
32662306a36Sopenharmony_ci		cr.flags |= CALL_RETURN_NON_CALL;
32762306a36Sopenharmony_ci
32862306a36Sopenharmony_ci	/*
32962306a36Sopenharmony_ci	 * The parent db_id must be assigned before exporting the child. Note
33062306a36Sopenharmony_ci	 * it is not possible to export the parent first because its information
33162306a36Sopenharmony_ci	 * is not yet complete because its 'return' has not yet been processed.
33262306a36Sopenharmony_ci	 */
33362306a36Sopenharmony_ci	parent_db_id = idx ? &(tse - 1)->db_id : NULL;
33462306a36Sopenharmony_ci
33562306a36Sopenharmony_ci	return crp->process(&cr, parent_db_id, crp->data);
33662306a36Sopenharmony_ci}
33762306a36Sopenharmony_ci
33862306a36Sopenharmony_cistatic int __thread_stack__flush(struct thread *thread, struct thread_stack *ts)
33962306a36Sopenharmony_ci{
34062306a36Sopenharmony_ci	struct call_return_processor *crp = ts->crp;
34162306a36Sopenharmony_ci	int err;
34262306a36Sopenharmony_ci
34362306a36Sopenharmony_ci	if (!crp) {
34462306a36Sopenharmony_ci		ts->cnt = 0;
34562306a36Sopenharmony_ci		ts->br_stack_pos = 0;
34662306a36Sopenharmony_ci		if (ts->br_stack_rb)
34762306a36Sopenharmony_ci			ts->br_stack_rb->nr = 0;
34862306a36Sopenharmony_ci		return 0;
34962306a36Sopenharmony_ci	}
35062306a36Sopenharmony_ci
35162306a36Sopenharmony_ci	while (ts->cnt) {
35262306a36Sopenharmony_ci		err = thread_stack__call_return(thread, ts, --ts->cnt,
35362306a36Sopenharmony_ci						ts->last_time, 0, true);
35462306a36Sopenharmony_ci		if (err) {
35562306a36Sopenharmony_ci			pr_err("Error flushing thread stack!\n");
35662306a36Sopenharmony_ci			ts->cnt = 0;
35762306a36Sopenharmony_ci			return err;
35862306a36Sopenharmony_ci		}
35962306a36Sopenharmony_ci	}
36062306a36Sopenharmony_ci
36162306a36Sopenharmony_ci	return 0;
36262306a36Sopenharmony_ci}
36362306a36Sopenharmony_ci
36462306a36Sopenharmony_ciint thread_stack__flush(struct thread *thread)
36562306a36Sopenharmony_ci{
36662306a36Sopenharmony_ci	struct thread_stack *ts = thread__ts(thread);
36762306a36Sopenharmony_ci	unsigned int pos;
36862306a36Sopenharmony_ci	int err = 0;
36962306a36Sopenharmony_ci
37062306a36Sopenharmony_ci	if (ts) {
37162306a36Sopenharmony_ci		for (pos = 0; pos < ts->arr_sz; pos++) {
37262306a36Sopenharmony_ci			int ret = __thread_stack__flush(thread, ts + pos);
37362306a36Sopenharmony_ci
37462306a36Sopenharmony_ci			if (ret)
37562306a36Sopenharmony_ci				err = ret;
37662306a36Sopenharmony_ci		}
37762306a36Sopenharmony_ci	}
37862306a36Sopenharmony_ci
37962306a36Sopenharmony_ci	return err;
38062306a36Sopenharmony_ci}
38162306a36Sopenharmony_ci
38262306a36Sopenharmony_cistatic void thread_stack__update_br_stack(struct thread_stack *ts, u32 flags,
38362306a36Sopenharmony_ci					  u64 from_ip, u64 to_ip)
38462306a36Sopenharmony_ci{
38562306a36Sopenharmony_ci	struct branch_stack *bs = ts->br_stack_rb;
38662306a36Sopenharmony_ci	struct branch_entry *be;
38762306a36Sopenharmony_ci
38862306a36Sopenharmony_ci	if (!ts->br_stack_pos)
38962306a36Sopenharmony_ci		ts->br_stack_pos = ts->br_stack_sz;
39062306a36Sopenharmony_ci
39162306a36Sopenharmony_ci	ts->br_stack_pos -= 1;
39262306a36Sopenharmony_ci
39362306a36Sopenharmony_ci	be              = &bs->entries[ts->br_stack_pos];
39462306a36Sopenharmony_ci	be->from        = from_ip;
39562306a36Sopenharmony_ci	be->to          = to_ip;
39662306a36Sopenharmony_ci	be->flags.value = 0;
39762306a36Sopenharmony_ci	be->flags.abort = !!(flags & PERF_IP_FLAG_TX_ABORT);
39862306a36Sopenharmony_ci	be->flags.in_tx = !!(flags & PERF_IP_FLAG_IN_TX);
39962306a36Sopenharmony_ci	/* No support for mispredict */
40062306a36Sopenharmony_ci	be->flags.mispred = ts->mispred_all;
40162306a36Sopenharmony_ci
40262306a36Sopenharmony_ci	if (bs->nr < ts->br_stack_sz)
40362306a36Sopenharmony_ci		bs->nr += 1;
40462306a36Sopenharmony_ci}
40562306a36Sopenharmony_ci
40662306a36Sopenharmony_ciint thread_stack__event(struct thread *thread, int cpu, u32 flags, u64 from_ip,
40762306a36Sopenharmony_ci			u64 to_ip, u16 insn_len, u64 trace_nr, bool callstack,
40862306a36Sopenharmony_ci			unsigned int br_stack_sz, bool mispred_all)
40962306a36Sopenharmony_ci{
41062306a36Sopenharmony_ci	struct thread_stack *ts = thread__stack(thread, cpu);
41162306a36Sopenharmony_ci
41262306a36Sopenharmony_ci	if (!thread)
41362306a36Sopenharmony_ci		return -EINVAL;
41462306a36Sopenharmony_ci
41562306a36Sopenharmony_ci	if (!ts) {
41662306a36Sopenharmony_ci		ts = thread_stack__new(thread, cpu, NULL, callstack, br_stack_sz);
41762306a36Sopenharmony_ci		if (!ts) {
41862306a36Sopenharmony_ci			pr_warning("Out of memory: no thread stack\n");
41962306a36Sopenharmony_ci			return -ENOMEM;
42062306a36Sopenharmony_ci		}
42162306a36Sopenharmony_ci		ts->trace_nr = trace_nr;
42262306a36Sopenharmony_ci		ts->mispred_all = mispred_all;
42362306a36Sopenharmony_ci	}
42462306a36Sopenharmony_ci
42562306a36Sopenharmony_ci	/*
42662306a36Sopenharmony_ci	 * When the trace is discontinuous, the trace_nr changes.  In that case
42762306a36Sopenharmony_ci	 * the stack might be completely invalid.  Better to report nothing than
42862306a36Sopenharmony_ci	 * to report something misleading, so flush the stack.
42962306a36Sopenharmony_ci	 */
43062306a36Sopenharmony_ci	if (trace_nr != ts->trace_nr) {
43162306a36Sopenharmony_ci		if (ts->trace_nr)
43262306a36Sopenharmony_ci			__thread_stack__flush(thread, ts);
43362306a36Sopenharmony_ci		ts->trace_nr = trace_nr;
43462306a36Sopenharmony_ci	}
43562306a36Sopenharmony_ci
43662306a36Sopenharmony_ci	if (br_stack_sz)
43762306a36Sopenharmony_ci		thread_stack__update_br_stack(ts, flags, from_ip, to_ip);
43862306a36Sopenharmony_ci
43962306a36Sopenharmony_ci	/*
44062306a36Sopenharmony_ci	 * Stop here if thread_stack__process() is in use, or not recording call
44162306a36Sopenharmony_ci	 * stack.
44262306a36Sopenharmony_ci	 */
44362306a36Sopenharmony_ci	if (ts->crp || !callstack)
44462306a36Sopenharmony_ci		return 0;
44562306a36Sopenharmony_ci
44662306a36Sopenharmony_ci	if (flags & PERF_IP_FLAG_CALL) {
44762306a36Sopenharmony_ci		u64 ret_addr;
44862306a36Sopenharmony_ci
44962306a36Sopenharmony_ci		if (!to_ip)
45062306a36Sopenharmony_ci			return 0;
45162306a36Sopenharmony_ci		ret_addr = from_ip + insn_len;
45262306a36Sopenharmony_ci		if (ret_addr == to_ip)
45362306a36Sopenharmony_ci			return 0; /* Zero-length calls are excluded */
45462306a36Sopenharmony_ci		return thread_stack__push(ts, ret_addr,
45562306a36Sopenharmony_ci					  flags & PERF_IP_FLAG_TRACE_END);
45662306a36Sopenharmony_ci	} else if (flags & PERF_IP_FLAG_TRACE_BEGIN) {
45762306a36Sopenharmony_ci		/*
45862306a36Sopenharmony_ci		 * If the caller did not change the trace number (which would
45962306a36Sopenharmony_ci		 * have flushed the stack) then try to make sense of the stack.
46062306a36Sopenharmony_ci		 * Possibly, tracing began after returning to the current
46162306a36Sopenharmony_ci		 * address, so try to pop that. Also, do not expect a call made
46262306a36Sopenharmony_ci		 * when the trace ended, to return, so pop that.
46362306a36Sopenharmony_ci		 */
46462306a36Sopenharmony_ci		thread_stack__pop(ts, to_ip);
46562306a36Sopenharmony_ci		thread_stack__pop_trace_end(ts);
46662306a36Sopenharmony_ci	} else if ((flags & PERF_IP_FLAG_RETURN) && from_ip) {
46762306a36Sopenharmony_ci		thread_stack__pop(ts, to_ip);
46862306a36Sopenharmony_ci	}
46962306a36Sopenharmony_ci
47062306a36Sopenharmony_ci	return 0;
47162306a36Sopenharmony_ci}
47262306a36Sopenharmony_ci
47362306a36Sopenharmony_civoid thread_stack__set_trace_nr(struct thread *thread, int cpu, u64 trace_nr)
47462306a36Sopenharmony_ci{
47562306a36Sopenharmony_ci	struct thread_stack *ts = thread__stack(thread, cpu);
47662306a36Sopenharmony_ci
47762306a36Sopenharmony_ci	if (!ts)
47862306a36Sopenharmony_ci		return;
47962306a36Sopenharmony_ci
48062306a36Sopenharmony_ci	if (trace_nr != ts->trace_nr) {
48162306a36Sopenharmony_ci		if (ts->trace_nr)
48262306a36Sopenharmony_ci			__thread_stack__flush(thread, ts);
48362306a36Sopenharmony_ci		ts->trace_nr = trace_nr;
48462306a36Sopenharmony_ci	}
48562306a36Sopenharmony_ci}
48662306a36Sopenharmony_ci
48762306a36Sopenharmony_cistatic void __thread_stack__free(struct thread *thread, struct thread_stack *ts)
48862306a36Sopenharmony_ci{
48962306a36Sopenharmony_ci	__thread_stack__flush(thread, ts);
49062306a36Sopenharmony_ci	zfree(&ts->stack);
49162306a36Sopenharmony_ci	zfree(&ts->br_stack_rb);
49262306a36Sopenharmony_ci}
49362306a36Sopenharmony_ci
49462306a36Sopenharmony_cistatic void thread_stack__reset(struct thread *thread, struct thread_stack *ts)
49562306a36Sopenharmony_ci{
49662306a36Sopenharmony_ci	unsigned int arr_sz = ts->arr_sz;
49762306a36Sopenharmony_ci
49862306a36Sopenharmony_ci	__thread_stack__free(thread, ts);
49962306a36Sopenharmony_ci	memset(ts, 0, sizeof(*ts));
50062306a36Sopenharmony_ci	ts->arr_sz = arr_sz;
50162306a36Sopenharmony_ci}
50262306a36Sopenharmony_ci
50362306a36Sopenharmony_civoid thread_stack__free(struct thread *thread)
50462306a36Sopenharmony_ci{
50562306a36Sopenharmony_ci	struct thread_stack *ts = thread__ts(thread);
50662306a36Sopenharmony_ci	unsigned int pos;
50762306a36Sopenharmony_ci
50862306a36Sopenharmony_ci	if (ts) {
50962306a36Sopenharmony_ci		for (pos = 0; pos < ts->arr_sz; pos++)
51062306a36Sopenharmony_ci			__thread_stack__free(thread, ts + pos);
51162306a36Sopenharmony_ci		free(thread__ts(thread));
51262306a36Sopenharmony_ci		thread__set_ts(thread, NULL);
51362306a36Sopenharmony_ci	}
51462306a36Sopenharmony_ci}
51562306a36Sopenharmony_ci
51662306a36Sopenharmony_cistatic inline u64 callchain_context(u64 ip, u64 kernel_start)
51762306a36Sopenharmony_ci{
51862306a36Sopenharmony_ci	return ip < kernel_start ? PERF_CONTEXT_USER : PERF_CONTEXT_KERNEL;
51962306a36Sopenharmony_ci}
52062306a36Sopenharmony_ci
52162306a36Sopenharmony_civoid thread_stack__sample(struct thread *thread, int cpu,
52262306a36Sopenharmony_ci			  struct ip_callchain *chain,
52362306a36Sopenharmony_ci			  size_t sz, u64 ip, u64 kernel_start)
52462306a36Sopenharmony_ci{
52562306a36Sopenharmony_ci	struct thread_stack *ts = thread__stack(thread, cpu);
52662306a36Sopenharmony_ci	u64 context = callchain_context(ip, kernel_start);
52762306a36Sopenharmony_ci	u64 last_context;
52862306a36Sopenharmony_ci	size_t i, j;
52962306a36Sopenharmony_ci
53062306a36Sopenharmony_ci	if (sz < 2) {
53162306a36Sopenharmony_ci		chain->nr = 0;
53262306a36Sopenharmony_ci		return;
53362306a36Sopenharmony_ci	}
53462306a36Sopenharmony_ci
53562306a36Sopenharmony_ci	chain->ips[0] = context;
53662306a36Sopenharmony_ci	chain->ips[1] = ip;
53762306a36Sopenharmony_ci
53862306a36Sopenharmony_ci	if (!ts) {
53962306a36Sopenharmony_ci		chain->nr = 2;
54062306a36Sopenharmony_ci		return;
54162306a36Sopenharmony_ci	}
54262306a36Sopenharmony_ci
54362306a36Sopenharmony_ci	last_context = context;
54462306a36Sopenharmony_ci
54562306a36Sopenharmony_ci	for (i = 2, j = 1; i < sz && j <= ts->cnt; i++, j++) {
54662306a36Sopenharmony_ci		ip = ts->stack[ts->cnt - j].ret_addr;
54762306a36Sopenharmony_ci		context = callchain_context(ip, kernel_start);
54862306a36Sopenharmony_ci		if (context != last_context) {
54962306a36Sopenharmony_ci			if (i >= sz - 1)
55062306a36Sopenharmony_ci				break;
55162306a36Sopenharmony_ci			chain->ips[i++] = context;
55262306a36Sopenharmony_ci			last_context = context;
55362306a36Sopenharmony_ci		}
55462306a36Sopenharmony_ci		chain->ips[i] = ip;
55562306a36Sopenharmony_ci	}
55662306a36Sopenharmony_ci
55762306a36Sopenharmony_ci	chain->nr = i;
55862306a36Sopenharmony_ci}
55962306a36Sopenharmony_ci
56062306a36Sopenharmony_ci/*
56162306a36Sopenharmony_ci * Hardware sample records, created some time after the event occurred, need to
56262306a36Sopenharmony_ci * have subsequent addresses removed from the call chain.
56362306a36Sopenharmony_ci */
56462306a36Sopenharmony_civoid thread_stack__sample_late(struct thread *thread, int cpu,
56562306a36Sopenharmony_ci			       struct ip_callchain *chain, size_t sz,
56662306a36Sopenharmony_ci			       u64 sample_ip, u64 kernel_start)
56762306a36Sopenharmony_ci{
56862306a36Sopenharmony_ci	struct thread_stack *ts = thread__stack(thread, cpu);
56962306a36Sopenharmony_ci	u64 sample_context = callchain_context(sample_ip, kernel_start);
57062306a36Sopenharmony_ci	u64 last_context, context, ip;
57162306a36Sopenharmony_ci	size_t nr = 0, j;
57262306a36Sopenharmony_ci
57362306a36Sopenharmony_ci	if (sz < 2) {
57462306a36Sopenharmony_ci		chain->nr = 0;
57562306a36Sopenharmony_ci		return;
57662306a36Sopenharmony_ci	}
57762306a36Sopenharmony_ci
57862306a36Sopenharmony_ci	if (!ts)
57962306a36Sopenharmony_ci		goto out;
58062306a36Sopenharmony_ci
58162306a36Sopenharmony_ci	/*
58262306a36Sopenharmony_ci	 * When tracing kernel space, kernel addresses occur at the top of the
58362306a36Sopenharmony_ci	 * call chain after the event occurred but before tracing stopped.
58462306a36Sopenharmony_ci	 * Skip them.
58562306a36Sopenharmony_ci	 */
58662306a36Sopenharmony_ci	for (j = 1; j <= ts->cnt; j++) {
58762306a36Sopenharmony_ci		ip = ts->stack[ts->cnt - j].ret_addr;
58862306a36Sopenharmony_ci		context = callchain_context(ip, kernel_start);
58962306a36Sopenharmony_ci		if (context == PERF_CONTEXT_USER ||
59062306a36Sopenharmony_ci		    (context == sample_context && ip == sample_ip))
59162306a36Sopenharmony_ci			break;
59262306a36Sopenharmony_ci	}
59362306a36Sopenharmony_ci
59462306a36Sopenharmony_ci	last_context = sample_ip; /* Use sample_ip as an invalid context */
59562306a36Sopenharmony_ci
59662306a36Sopenharmony_ci	for (; nr < sz && j <= ts->cnt; nr++, j++) {
59762306a36Sopenharmony_ci		ip = ts->stack[ts->cnt - j].ret_addr;
59862306a36Sopenharmony_ci		context = callchain_context(ip, kernel_start);
59962306a36Sopenharmony_ci		if (context != last_context) {
60062306a36Sopenharmony_ci			if (nr >= sz - 1)
60162306a36Sopenharmony_ci				break;
60262306a36Sopenharmony_ci			chain->ips[nr++] = context;
60362306a36Sopenharmony_ci			last_context = context;
60462306a36Sopenharmony_ci		}
60562306a36Sopenharmony_ci		chain->ips[nr] = ip;
60662306a36Sopenharmony_ci	}
60762306a36Sopenharmony_ciout:
60862306a36Sopenharmony_ci	if (nr) {
60962306a36Sopenharmony_ci		chain->nr = nr;
61062306a36Sopenharmony_ci	} else {
61162306a36Sopenharmony_ci		chain->ips[0] = sample_context;
61262306a36Sopenharmony_ci		chain->ips[1] = sample_ip;
61362306a36Sopenharmony_ci		chain->nr = 2;
61462306a36Sopenharmony_ci	}
61562306a36Sopenharmony_ci}
61662306a36Sopenharmony_ci
61762306a36Sopenharmony_civoid thread_stack__br_sample(struct thread *thread, int cpu,
61862306a36Sopenharmony_ci			     struct branch_stack *dst, unsigned int sz)
61962306a36Sopenharmony_ci{
62062306a36Sopenharmony_ci	struct thread_stack *ts = thread__stack(thread, cpu);
62162306a36Sopenharmony_ci	const size_t bsz = sizeof(struct branch_entry);
62262306a36Sopenharmony_ci	struct branch_stack *src;
62362306a36Sopenharmony_ci	struct branch_entry *be;
62462306a36Sopenharmony_ci	unsigned int nr;
62562306a36Sopenharmony_ci
62662306a36Sopenharmony_ci	dst->nr = 0;
62762306a36Sopenharmony_ci
62862306a36Sopenharmony_ci	if (!ts)
62962306a36Sopenharmony_ci		return;
63062306a36Sopenharmony_ci
63162306a36Sopenharmony_ci	src = ts->br_stack_rb;
63262306a36Sopenharmony_ci	if (!src->nr)
63362306a36Sopenharmony_ci		return;
63462306a36Sopenharmony_ci
63562306a36Sopenharmony_ci	dst->nr = min((unsigned int)src->nr, sz);
63662306a36Sopenharmony_ci
63762306a36Sopenharmony_ci	be = &dst->entries[0];
63862306a36Sopenharmony_ci	nr = min(ts->br_stack_sz - ts->br_stack_pos, (unsigned int)dst->nr);
63962306a36Sopenharmony_ci	memcpy(be, &src->entries[ts->br_stack_pos], bsz * nr);
64062306a36Sopenharmony_ci
64162306a36Sopenharmony_ci	if (src->nr >= ts->br_stack_sz) {
64262306a36Sopenharmony_ci		sz -= nr;
64362306a36Sopenharmony_ci		be = &dst->entries[nr];
64462306a36Sopenharmony_ci		nr = min(ts->br_stack_pos, sz);
64562306a36Sopenharmony_ci		memcpy(be, &src->entries[0], bsz * ts->br_stack_pos);
64662306a36Sopenharmony_ci	}
64762306a36Sopenharmony_ci}
64862306a36Sopenharmony_ci
64962306a36Sopenharmony_ci/* Start of user space branch entries */
65062306a36Sopenharmony_cistatic bool us_start(struct branch_entry *be, u64 kernel_start, bool *start)
65162306a36Sopenharmony_ci{
65262306a36Sopenharmony_ci	if (!*start)
65362306a36Sopenharmony_ci		*start = be->to && be->to < kernel_start;
65462306a36Sopenharmony_ci
65562306a36Sopenharmony_ci	return *start;
65662306a36Sopenharmony_ci}
65762306a36Sopenharmony_ci
65862306a36Sopenharmony_ci/*
65962306a36Sopenharmony_ci * Start of branch entries after the ip fell in between 2 branches, or user
66062306a36Sopenharmony_ci * space branch entries.
66162306a36Sopenharmony_ci */
66262306a36Sopenharmony_cistatic bool ks_start(struct branch_entry *be, u64 sample_ip, u64 kernel_start,
66362306a36Sopenharmony_ci		     bool *start, struct branch_entry *nb)
66462306a36Sopenharmony_ci{
66562306a36Sopenharmony_ci	if (!*start) {
66662306a36Sopenharmony_ci		*start = (nb && sample_ip >= be->to && sample_ip <= nb->from) ||
66762306a36Sopenharmony_ci			 be->from < kernel_start ||
66862306a36Sopenharmony_ci			 (be->to && be->to < kernel_start);
66962306a36Sopenharmony_ci	}
67062306a36Sopenharmony_ci
67162306a36Sopenharmony_ci	return *start;
67262306a36Sopenharmony_ci}
67362306a36Sopenharmony_ci
67462306a36Sopenharmony_ci/*
67562306a36Sopenharmony_ci * Hardware sample records, created some time after the event occurred, need to
67662306a36Sopenharmony_ci * have subsequent addresses removed from the branch stack.
67762306a36Sopenharmony_ci */
67862306a36Sopenharmony_civoid thread_stack__br_sample_late(struct thread *thread, int cpu,
67962306a36Sopenharmony_ci				  struct branch_stack *dst, unsigned int sz,
68062306a36Sopenharmony_ci				  u64 ip, u64 kernel_start)
68162306a36Sopenharmony_ci{
68262306a36Sopenharmony_ci	struct thread_stack *ts = thread__stack(thread, cpu);
68362306a36Sopenharmony_ci	struct branch_entry *d, *s, *spos, *ssz;
68462306a36Sopenharmony_ci	struct branch_stack *src;
68562306a36Sopenharmony_ci	unsigned int nr = 0;
68662306a36Sopenharmony_ci	bool start = false;
68762306a36Sopenharmony_ci
68862306a36Sopenharmony_ci	dst->nr = 0;
68962306a36Sopenharmony_ci
69062306a36Sopenharmony_ci	if (!ts)
69162306a36Sopenharmony_ci		return;
69262306a36Sopenharmony_ci
69362306a36Sopenharmony_ci	src = ts->br_stack_rb;
69462306a36Sopenharmony_ci	if (!src->nr)
69562306a36Sopenharmony_ci		return;
69662306a36Sopenharmony_ci
69762306a36Sopenharmony_ci	spos = &src->entries[ts->br_stack_pos];
69862306a36Sopenharmony_ci	ssz  = &src->entries[ts->br_stack_sz];
69962306a36Sopenharmony_ci
70062306a36Sopenharmony_ci	d = &dst->entries[0];
70162306a36Sopenharmony_ci	s = spos;
70262306a36Sopenharmony_ci
70362306a36Sopenharmony_ci	if (ip < kernel_start) {
70462306a36Sopenharmony_ci		/*
70562306a36Sopenharmony_ci		 * User space sample: start copying branch entries when the
70662306a36Sopenharmony_ci		 * branch is in user space.
70762306a36Sopenharmony_ci		 */
70862306a36Sopenharmony_ci		for (s = spos; s < ssz && nr < sz; s++) {
70962306a36Sopenharmony_ci			if (us_start(s, kernel_start, &start)) {
71062306a36Sopenharmony_ci				*d++ = *s;
71162306a36Sopenharmony_ci				nr += 1;
71262306a36Sopenharmony_ci			}
71362306a36Sopenharmony_ci		}
71462306a36Sopenharmony_ci
71562306a36Sopenharmony_ci		if (src->nr >= ts->br_stack_sz) {
71662306a36Sopenharmony_ci			for (s = &src->entries[0]; s < spos && nr < sz; s++) {
71762306a36Sopenharmony_ci				if (us_start(s, kernel_start, &start)) {
71862306a36Sopenharmony_ci					*d++ = *s;
71962306a36Sopenharmony_ci					nr += 1;
72062306a36Sopenharmony_ci				}
72162306a36Sopenharmony_ci			}
72262306a36Sopenharmony_ci		}
72362306a36Sopenharmony_ci	} else {
72462306a36Sopenharmony_ci		struct branch_entry *nb = NULL;
72562306a36Sopenharmony_ci
72662306a36Sopenharmony_ci		/*
72762306a36Sopenharmony_ci		 * Kernel space sample: start copying branch entries when the ip
72862306a36Sopenharmony_ci		 * falls in between 2 branches (or the branch is in user space
72962306a36Sopenharmony_ci		 * because then the start must have been missed).
73062306a36Sopenharmony_ci		 */
73162306a36Sopenharmony_ci		for (s = spos; s < ssz && nr < sz; s++) {
73262306a36Sopenharmony_ci			if (ks_start(s, ip, kernel_start, &start, nb)) {
73362306a36Sopenharmony_ci				*d++ = *s;
73462306a36Sopenharmony_ci				nr += 1;
73562306a36Sopenharmony_ci			}
73662306a36Sopenharmony_ci			nb = s;
73762306a36Sopenharmony_ci		}
73862306a36Sopenharmony_ci
73962306a36Sopenharmony_ci		if (src->nr >= ts->br_stack_sz) {
74062306a36Sopenharmony_ci			for (s = &src->entries[0]; s < spos && nr < sz; s++) {
74162306a36Sopenharmony_ci				if (ks_start(s, ip, kernel_start, &start, nb)) {
74262306a36Sopenharmony_ci					*d++ = *s;
74362306a36Sopenharmony_ci					nr += 1;
74462306a36Sopenharmony_ci				}
74562306a36Sopenharmony_ci				nb = s;
74662306a36Sopenharmony_ci			}
74762306a36Sopenharmony_ci		}
74862306a36Sopenharmony_ci	}
74962306a36Sopenharmony_ci
75062306a36Sopenharmony_ci	dst->nr = nr;
75162306a36Sopenharmony_ci}
75262306a36Sopenharmony_ci
75362306a36Sopenharmony_cistruct call_return_processor *
75462306a36Sopenharmony_cicall_return_processor__new(int (*process)(struct call_return *cr, u64 *parent_db_id, void *data),
75562306a36Sopenharmony_ci			   void *data)
75662306a36Sopenharmony_ci{
75762306a36Sopenharmony_ci	struct call_return_processor *crp;
75862306a36Sopenharmony_ci
75962306a36Sopenharmony_ci	crp = zalloc(sizeof(struct call_return_processor));
76062306a36Sopenharmony_ci	if (!crp)
76162306a36Sopenharmony_ci		return NULL;
76262306a36Sopenharmony_ci	crp->cpr = call_path_root__new();
76362306a36Sopenharmony_ci	if (!crp->cpr)
76462306a36Sopenharmony_ci		goto out_free;
76562306a36Sopenharmony_ci	crp->process = process;
76662306a36Sopenharmony_ci	crp->data = data;
76762306a36Sopenharmony_ci	return crp;
76862306a36Sopenharmony_ci
76962306a36Sopenharmony_ciout_free:
77062306a36Sopenharmony_ci	free(crp);
77162306a36Sopenharmony_ci	return NULL;
77262306a36Sopenharmony_ci}
77362306a36Sopenharmony_ci
77462306a36Sopenharmony_civoid call_return_processor__free(struct call_return_processor *crp)
77562306a36Sopenharmony_ci{
77662306a36Sopenharmony_ci	if (crp) {
77762306a36Sopenharmony_ci		call_path_root__free(crp->cpr);
77862306a36Sopenharmony_ci		free(crp);
77962306a36Sopenharmony_ci	}
78062306a36Sopenharmony_ci}
78162306a36Sopenharmony_ci
78262306a36Sopenharmony_cistatic int thread_stack__push_cp(struct thread_stack *ts, u64 ret_addr,
78362306a36Sopenharmony_ci				 u64 timestamp, u64 ref, struct call_path *cp,
78462306a36Sopenharmony_ci				 bool no_call, bool trace_end)
78562306a36Sopenharmony_ci{
78662306a36Sopenharmony_ci	struct thread_stack_entry *tse;
78762306a36Sopenharmony_ci	int err;
78862306a36Sopenharmony_ci
78962306a36Sopenharmony_ci	if (!cp)
79062306a36Sopenharmony_ci		return -ENOMEM;
79162306a36Sopenharmony_ci
79262306a36Sopenharmony_ci	if (ts->cnt == ts->sz) {
79362306a36Sopenharmony_ci		err = thread_stack__grow(ts);
79462306a36Sopenharmony_ci		if (err)
79562306a36Sopenharmony_ci			return err;
79662306a36Sopenharmony_ci	}
79762306a36Sopenharmony_ci
79862306a36Sopenharmony_ci	tse = &ts->stack[ts->cnt++];
79962306a36Sopenharmony_ci	tse->ret_addr = ret_addr;
80062306a36Sopenharmony_ci	tse->timestamp = timestamp;
80162306a36Sopenharmony_ci	tse->ref = ref;
80262306a36Sopenharmony_ci	tse->branch_count = ts->branch_count;
80362306a36Sopenharmony_ci	tse->insn_count = ts->insn_count;
80462306a36Sopenharmony_ci	tse->cyc_count = ts->cyc_count;
80562306a36Sopenharmony_ci	tse->cp = cp;
80662306a36Sopenharmony_ci	tse->no_call = no_call;
80762306a36Sopenharmony_ci	tse->trace_end = trace_end;
80862306a36Sopenharmony_ci	tse->non_call = false;
80962306a36Sopenharmony_ci	tse->db_id = 0;
81062306a36Sopenharmony_ci
81162306a36Sopenharmony_ci	return 0;
81262306a36Sopenharmony_ci}
81362306a36Sopenharmony_ci
81462306a36Sopenharmony_cistatic int thread_stack__pop_cp(struct thread *thread, struct thread_stack *ts,
81562306a36Sopenharmony_ci				u64 ret_addr, u64 timestamp, u64 ref,
81662306a36Sopenharmony_ci				struct symbol *sym)
81762306a36Sopenharmony_ci{
81862306a36Sopenharmony_ci	int err;
81962306a36Sopenharmony_ci
82062306a36Sopenharmony_ci	if (!ts->cnt)
82162306a36Sopenharmony_ci		return 1;
82262306a36Sopenharmony_ci
82362306a36Sopenharmony_ci	if (ts->cnt == 1) {
82462306a36Sopenharmony_ci		struct thread_stack_entry *tse = &ts->stack[0];
82562306a36Sopenharmony_ci
82662306a36Sopenharmony_ci		if (tse->cp->sym == sym)
82762306a36Sopenharmony_ci			return thread_stack__call_return(thread, ts, --ts->cnt,
82862306a36Sopenharmony_ci							 timestamp, ref, false);
82962306a36Sopenharmony_ci	}
83062306a36Sopenharmony_ci
83162306a36Sopenharmony_ci	if (ts->stack[ts->cnt - 1].ret_addr == ret_addr &&
83262306a36Sopenharmony_ci	    !ts->stack[ts->cnt - 1].non_call) {
83362306a36Sopenharmony_ci		return thread_stack__call_return(thread, ts, --ts->cnt,
83462306a36Sopenharmony_ci						 timestamp, ref, false);
83562306a36Sopenharmony_ci	} else {
83662306a36Sopenharmony_ci		size_t i = ts->cnt - 1;
83762306a36Sopenharmony_ci
83862306a36Sopenharmony_ci		while (i--) {
83962306a36Sopenharmony_ci			if (ts->stack[i].ret_addr != ret_addr ||
84062306a36Sopenharmony_ci			    ts->stack[i].non_call)
84162306a36Sopenharmony_ci				continue;
84262306a36Sopenharmony_ci			i += 1;
84362306a36Sopenharmony_ci			while (ts->cnt > i) {
84462306a36Sopenharmony_ci				err = thread_stack__call_return(thread, ts,
84562306a36Sopenharmony_ci								--ts->cnt,
84662306a36Sopenharmony_ci								timestamp, ref,
84762306a36Sopenharmony_ci								true);
84862306a36Sopenharmony_ci				if (err)
84962306a36Sopenharmony_ci					return err;
85062306a36Sopenharmony_ci			}
85162306a36Sopenharmony_ci			return thread_stack__call_return(thread, ts, --ts->cnt,
85262306a36Sopenharmony_ci							 timestamp, ref, false);
85362306a36Sopenharmony_ci		}
85462306a36Sopenharmony_ci	}
85562306a36Sopenharmony_ci
85662306a36Sopenharmony_ci	return 1;
85762306a36Sopenharmony_ci}
85862306a36Sopenharmony_ci
85962306a36Sopenharmony_cistatic int thread_stack__bottom(struct thread_stack *ts,
86062306a36Sopenharmony_ci				struct perf_sample *sample,
86162306a36Sopenharmony_ci				struct addr_location *from_al,
86262306a36Sopenharmony_ci				struct addr_location *to_al, u64 ref)
86362306a36Sopenharmony_ci{
86462306a36Sopenharmony_ci	struct call_path_root *cpr = ts->crp->cpr;
86562306a36Sopenharmony_ci	struct call_path *cp;
86662306a36Sopenharmony_ci	struct symbol *sym;
86762306a36Sopenharmony_ci	u64 ip;
86862306a36Sopenharmony_ci
86962306a36Sopenharmony_ci	if (sample->ip) {
87062306a36Sopenharmony_ci		ip = sample->ip;
87162306a36Sopenharmony_ci		sym = from_al->sym;
87262306a36Sopenharmony_ci	} else if (sample->addr) {
87362306a36Sopenharmony_ci		ip = sample->addr;
87462306a36Sopenharmony_ci		sym = to_al->sym;
87562306a36Sopenharmony_ci	} else {
87662306a36Sopenharmony_ci		return 0;
87762306a36Sopenharmony_ci	}
87862306a36Sopenharmony_ci
87962306a36Sopenharmony_ci	cp = call_path__findnew(cpr, &cpr->call_path, sym, ip,
88062306a36Sopenharmony_ci				ts->kernel_start);
88162306a36Sopenharmony_ci
88262306a36Sopenharmony_ci	return thread_stack__push_cp(ts, ip, sample->time, ref, cp,
88362306a36Sopenharmony_ci				     true, false);
88462306a36Sopenharmony_ci}
88562306a36Sopenharmony_ci
88662306a36Sopenharmony_cistatic int thread_stack__pop_ks(struct thread *thread, struct thread_stack *ts,
88762306a36Sopenharmony_ci				struct perf_sample *sample, u64 ref)
88862306a36Sopenharmony_ci{
88962306a36Sopenharmony_ci	u64 tm = sample->time;
89062306a36Sopenharmony_ci	int err;
89162306a36Sopenharmony_ci
89262306a36Sopenharmony_ci	/* Return to userspace, so pop all kernel addresses */
89362306a36Sopenharmony_ci	while (thread_stack__in_kernel(ts)) {
89462306a36Sopenharmony_ci		err = thread_stack__call_return(thread, ts, --ts->cnt,
89562306a36Sopenharmony_ci						tm, ref, true);
89662306a36Sopenharmony_ci		if (err)
89762306a36Sopenharmony_ci			return err;
89862306a36Sopenharmony_ci	}
89962306a36Sopenharmony_ci
90062306a36Sopenharmony_ci	return 0;
90162306a36Sopenharmony_ci}
90262306a36Sopenharmony_ci
90362306a36Sopenharmony_cistatic int thread_stack__no_call_return(struct thread *thread,
90462306a36Sopenharmony_ci					struct thread_stack *ts,
90562306a36Sopenharmony_ci					struct perf_sample *sample,
90662306a36Sopenharmony_ci					struct addr_location *from_al,
90762306a36Sopenharmony_ci					struct addr_location *to_al, u64 ref)
90862306a36Sopenharmony_ci{
90962306a36Sopenharmony_ci	struct call_path_root *cpr = ts->crp->cpr;
91062306a36Sopenharmony_ci	struct call_path *root = &cpr->call_path;
91162306a36Sopenharmony_ci	struct symbol *fsym = from_al->sym;
91262306a36Sopenharmony_ci	struct symbol *tsym = to_al->sym;
91362306a36Sopenharmony_ci	struct call_path *cp, *parent;
91462306a36Sopenharmony_ci	u64 ks = ts->kernel_start;
91562306a36Sopenharmony_ci	u64 addr = sample->addr;
91662306a36Sopenharmony_ci	u64 tm = sample->time;
91762306a36Sopenharmony_ci	u64 ip = sample->ip;
91862306a36Sopenharmony_ci	int err;
91962306a36Sopenharmony_ci
92062306a36Sopenharmony_ci	if (ip >= ks && addr < ks) {
92162306a36Sopenharmony_ci		/* Return to userspace, so pop all kernel addresses */
92262306a36Sopenharmony_ci		err = thread_stack__pop_ks(thread, ts, sample, ref);
92362306a36Sopenharmony_ci		if (err)
92462306a36Sopenharmony_ci			return err;
92562306a36Sopenharmony_ci
92662306a36Sopenharmony_ci		/* If the stack is empty, push the userspace address */
92762306a36Sopenharmony_ci		if (!ts->cnt) {
92862306a36Sopenharmony_ci			cp = call_path__findnew(cpr, root, tsym, addr, ks);
92962306a36Sopenharmony_ci			return thread_stack__push_cp(ts, 0, tm, ref, cp, true,
93062306a36Sopenharmony_ci						     false);
93162306a36Sopenharmony_ci		}
93262306a36Sopenharmony_ci	} else if (thread_stack__in_kernel(ts) && ip < ks) {
93362306a36Sopenharmony_ci		/* Return to userspace, so pop all kernel addresses */
93462306a36Sopenharmony_ci		err = thread_stack__pop_ks(thread, ts, sample, ref);
93562306a36Sopenharmony_ci		if (err)
93662306a36Sopenharmony_ci			return err;
93762306a36Sopenharmony_ci	}
93862306a36Sopenharmony_ci
93962306a36Sopenharmony_ci	if (ts->cnt)
94062306a36Sopenharmony_ci		parent = ts->stack[ts->cnt - 1].cp;
94162306a36Sopenharmony_ci	else
94262306a36Sopenharmony_ci		parent = root;
94362306a36Sopenharmony_ci
94462306a36Sopenharmony_ci	if (parent->sym == from_al->sym) {
94562306a36Sopenharmony_ci		/*
94662306a36Sopenharmony_ci		 * At the bottom of the stack, assume the missing 'call' was
94762306a36Sopenharmony_ci		 * before the trace started. So, pop the current symbol and push
94862306a36Sopenharmony_ci		 * the 'to' symbol.
94962306a36Sopenharmony_ci		 */
95062306a36Sopenharmony_ci		if (ts->cnt == 1) {
95162306a36Sopenharmony_ci			err = thread_stack__call_return(thread, ts, --ts->cnt,
95262306a36Sopenharmony_ci							tm, ref, false);
95362306a36Sopenharmony_ci			if (err)
95462306a36Sopenharmony_ci				return err;
95562306a36Sopenharmony_ci		}
95662306a36Sopenharmony_ci
95762306a36Sopenharmony_ci		if (!ts->cnt) {
95862306a36Sopenharmony_ci			cp = call_path__findnew(cpr, root, tsym, addr, ks);
95962306a36Sopenharmony_ci
96062306a36Sopenharmony_ci			return thread_stack__push_cp(ts, addr, tm, ref, cp,
96162306a36Sopenharmony_ci						     true, false);
96262306a36Sopenharmony_ci		}
96362306a36Sopenharmony_ci
96462306a36Sopenharmony_ci		/*
96562306a36Sopenharmony_ci		 * Otherwise assume the 'return' is being used as a jump (e.g.
96662306a36Sopenharmony_ci		 * retpoline) and just push the 'to' symbol.
96762306a36Sopenharmony_ci		 */
96862306a36Sopenharmony_ci		cp = call_path__findnew(cpr, parent, tsym, addr, ks);
96962306a36Sopenharmony_ci
97062306a36Sopenharmony_ci		err = thread_stack__push_cp(ts, 0, tm, ref, cp, true, false);
97162306a36Sopenharmony_ci		if (!err)
97262306a36Sopenharmony_ci			ts->stack[ts->cnt - 1].non_call = true;
97362306a36Sopenharmony_ci
97462306a36Sopenharmony_ci		return err;
97562306a36Sopenharmony_ci	}
97662306a36Sopenharmony_ci
97762306a36Sopenharmony_ci	/*
97862306a36Sopenharmony_ci	 * Assume 'parent' has not yet returned, so push 'to', and then push and
97962306a36Sopenharmony_ci	 * pop 'from'.
98062306a36Sopenharmony_ci	 */
98162306a36Sopenharmony_ci
98262306a36Sopenharmony_ci	cp = call_path__findnew(cpr, parent, tsym, addr, ks);
98362306a36Sopenharmony_ci
98462306a36Sopenharmony_ci	err = thread_stack__push_cp(ts, addr, tm, ref, cp, true, false);
98562306a36Sopenharmony_ci	if (err)
98662306a36Sopenharmony_ci		return err;
98762306a36Sopenharmony_ci
98862306a36Sopenharmony_ci	cp = call_path__findnew(cpr, cp, fsym, ip, ks);
98962306a36Sopenharmony_ci
99062306a36Sopenharmony_ci	err = thread_stack__push_cp(ts, ip, tm, ref, cp, true, false);
99162306a36Sopenharmony_ci	if (err)
99262306a36Sopenharmony_ci		return err;
99362306a36Sopenharmony_ci
99462306a36Sopenharmony_ci	return thread_stack__call_return(thread, ts, --ts->cnt, tm, ref, false);
99562306a36Sopenharmony_ci}
99662306a36Sopenharmony_ci
99762306a36Sopenharmony_cistatic int thread_stack__trace_begin(struct thread *thread,
99862306a36Sopenharmony_ci				     struct thread_stack *ts, u64 timestamp,
99962306a36Sopenharmony_ci				     u64 ref)
100062306a36Sopenharmony_ci{
100162306a36Sopenharmony_ci	struct thread_stack_entry *tse;
100262306a36Sopenharmony_ci	int err;
100362306a36Sopenharmony_ci
100462306a36Sopenharmony_ci	if (!ts->cnt)
100562306a36Sopenharmony_ci		return 0;
100662306a36Sopenharmony_ci
100762306a36Sopenharmony_ci	/* Pop trace end */
100862306a36Sopenharmony_ci	tse = &ts->stack[ts->cnt - 1];
100962306a36Sopenharmony_ci	if (tse->trace_end) {
101062306a36Sopenharmony_ci		err = thread_stack__call_return(thread, ts, --ts->cnt,
101162306a36Sopenharmony_ci						timestamp, ref, false);
101262306a36Sopenharmony_ci		if (err)
101362306a36Sopenharmony_ci			return err;
101462306a36Sopenharmony_ci	}
101562306a36Sopenharmony_ci
101662306a36Sopenharmony_ci	return 0;
101762306a36Sopenharmony_ci}
101862306a36Sopenharmony_ci
101962306a36Sopenharmony_cistatic int thread_stack__trace_end(struct thread_stack *ts,
102062306a36Sopenharmony_ci				   struct perf_sample *sample, u64 ref)
102162306a36Sopenharmony_ci{
102262306a36Sopenharmony_ci	struct call_path_root *cpr = ts->crp->cpr;
102362306a36Sopenharmony_ci	struct call_path *cp;
102462306a36Sopenharmony_ci	u64 ret_addr;
102562306a36Sopenharmony_ci
102662306a36Sopenharmony_ci	/* No point having 'trace end' on the bottom of the stack */
102762306a36Sopenharmony_ci	if (!ts->cnt || (ts->cnt == 1 && ts->stack[0].ref == ref))
102862306a36Sopenharmony_ci		return 0;
102962306a36Sopenharmony_ci
103062306a36Sopenharmony_ci	cp = call_path__findnew(cpr, ts->stack[ts->cnt - 1].cp, NULL, 0,
103162306a36Sopenharmony_ci				ts->kernel_start);
103262306a36Sopenharmony_ci
103362306a36Sopenharmony_ci	ret_addr = sample->ip + sample->insn_len;
103462306a36Sopenharmony_ci
103562306a36Sopenharmony_ci	return thread_stack__push_cp(ts, ret_addr, sample->time, ref, cp,
103662306a36Sopenharmony_ci				     false, true);
103762306a36Sopenharmony_ci}
103862306a36Sopenharmony_ci
103962306a36Sopenharmony_cistatic bool is_x86_retpoline(const char *name)
104062306a36Sopenharmony_ci{
104162306a36Sopenharmony_ci	return strstr(name, "__x86_indirect_thunk_") == name;
104262306a36Sopenharmony_ci}
104362306a36Sopenharmony_ci
104462306a36Sopenharmony_ci/*
104562306a36Sopenharmony_ci * x86 retpoline functions pollute the call graph. This function removes them.
104662306a36Sopenharmony_ci * This does not handle function return thunks, nor is there any improvement
104762306a36Sopenharmony_ci * for the handling of inline thunks or extern thunks.
104862306a36Sopenharmony_ci */
104962306a36Sopenharmony_cistatic int thread_stack__x86_retpoline(struct thread_stack *ts,
105062306a36Sopenharmony_ci				       struct perf_sample *sample,
105162306a36Sopenharmony_ci				       struct addr_location *to_al)
105262306a36Sopenharmony_ci{
105362306a36Sopenharmony_ci	struct thread_stack_entry *tse = &ts->stack[ts->cnt - 1];
105462306a36Sopenharmony_ci	struct call_path_root *cpr = ts->crp->cpr;
105562306a36Sopenharmony_ci	struct symbol *sym = tse->cp->sym;
105662306a36Sopenharmony_ci	struct symbol *tsym = to_al->sym;
105762306a36Sopenharmony_ci	struct call_path *cp;
105862306a36Sopenharmony_ci
105962306a36Sopenharmony_ci	if (sym && is_x86_retpoline(sym->name)) {
106062306a36Sopenharmony_ci		/*
106162306a36Sopenharmony_ci		 * This is a x86 retpoline fn. It pollutes the call graph by
106262306a36Sopenharmony_ci		 * showing up everywhere there is an indirect branch, but does
106362306a36Sopenharmony_ci		 * not itself mean anything. Here the top-of-stack is removed,
106462306a36Sopenharmony_ci		 * by decrementing the stack count, and then further down, the
106562306a36Sopenharmony_ci		 * resulting top-of-stack is replaced with the actual target.
106662306a36Sopenharmony_ci		 * The result is that the retpoline functions will no longer
106762306a36Sopenharmony_ci		 * appear in the call graph. Note this only affects the call
106862306a36Sopenharmony_ci		 * graph, since all the original branches are left unchanged.
106962306a36Sopenharmony_ci		 */
107062306a36Sopenharmony_ci		ts->cnt -= 1;
107162306a36Sopenharmony_ci		sym = ts->stack[ts->cnt - 2].cp->sym;
107262306a36Sopenharmony_ci		if (sym && sym == tsym && to_al->addr != tsym->start) {
107362306a36Sopenharmony_ci			/*
107462306a36Sopenharmony_ci			 * Target is back to the middle of the symbol we came
107562306a36Sopenharmony_ci			 * from so assume it is an indirect jmp and forget it
107662306a36Sopenharmony_ci			 * altogether.
107762306a36Sopenharmony_ci			 */
107862306a36Sopenharmony_ci			ts->cnt -= 1;
107962306a36Sopenharmony_ci			return 0;
108062306a36Sopenharmony_ci		}
108162306a36Sopenharmony_ci	} else if (sym && sym == tsym) {
108262306a36Sopenharmony_ci		/*
108362306a36Sopenharmony_ci		 * Target is back to the symbol we came from so assume it is an
108462306a36Sopenharmony_ci		 * indirect jmp and forget it altogether.
108562306a36Sopenharmony_ci		 */
108662306a36Sopenharmony_ci		ts->cnt -= 1;
108762306a36Sopenharmony_ci		return 0;
108862306a36Sopenharmony_ci	}
108962306a36Sopenharmony_ci
109062306a36Sopenharmony_ci	cp = call_path__findnew(cpr, ts->stack[ts->cnt - 2].cp, tsym,
109162306a36Sopenharmony_ci				sample->addr, ts->kernel_start);
109262306a36Sopenharmony_ci	if (!cp)
109362306a36Sopenharmony_ci		return -ENOMEM;
109462306a36Sopenharmony_ci
109562306a36Sopenharmony_ci	/* Replace the top-of-stack with the actual target */
109662306a36Sopenharmony_ci	ts->stack[ts->cnt - 1].cp = cp;
109762306a36Sopenharmony_ci
109862306a36Sopenharmony_ci	return 0;
109962306a36Sopenharmony_ci}
110062306a36Sopenharmony_ci
110162306a36Sopenharmony_ciint thread_stack__process(struct thread *thread, struct comm *comm,
110262306a36Sopenharmony_ci			  struct perf_sample *sample,
110362306a36Sopenharmony_ci			  struct addr_location *from_al,
110462306a36Sopenharmony_ci			  struct addr_location *to_al, u64 ref,
110562306a36Sopenharmony_ci			  struct call_return_processor *crp)
110662306a36Sopenharmony_ci{
110762306a36Sopenharmony_ci	struct thread_stack *ts = thread__stack(thread, sample->cpu);
110862306a36Sopenharmony_ci	enum retpoline_state_t rstate;
110962306a36Sopenharmony_ci	int err = 0;
111062306a36Sopenharmony_ci
111162306a36Sopenharmony_ci	if (ts && !ts->crp) {
111262306a36Sopenharmony_ci		/* Supersede thread_stack__event() */
111362306a36Sopenharmony_ci		thread_stack__reset(thread, ts);
111462306a36Sopenharmony_ci		ts = NULL;
111562306a36Sopenharmony_ci	}
111662306a36Sopenharmony_ci
111762306a36Sopenharmony_ci	if (!ts) {
111862306a36Sopenharmony_ci		ts = thread_stack__new(thread, sample->cpu, crp, true, 0);
111962306a36Sopenharmony_ci		if (!ts)
112062306a36Sopenharmony_ci			return -ENOMEM;
112162306a36Sopenharmony_ci		ts->comm = comm;
112262306a36Sopenharmony_ci	}
112362306a36Sopenharmony_ci
112462306a36Sopenharmony_ci	rstate = ts->rstate;
112562306a36Sopenharmony_ci	if (rstate == X86_RETPOLINE_DETECTED)
112662306a36Sopenharmony_ci		ts->rstate = X86_RETPOLINE_POSSIBLE;
112762306a36Sopenharmony_ci
112862306a36Sopenharmony_ci	/* Flush stack on exec */
112962306a36Sopenharmony_ci	if (ts->comm != comm && thread__pid(thread) == thread__tid(thread)) {
113062306a36Sopenharmony_ci		err = __thread_stack__flush(thread, ts);
113162306a36Sopenharmony_ci		if (err)
113262306a36Sopenharmony_ci			return err;
113362306a36Sopenharmony_ci		ts->comm = comm;
113462306a36Sopenharmony_ci	}
113562306a36Sopenharmony_ci
113662306a36Sopenharmony_ci	/* If the stack is empty, put the current symbol on the stack */
113762306a36Sopenharmony_ci	if (!ts->cnt) {
113862306a36Sopenharmony_ci		err = thread_stack__bottom(ts, sample, from_al, to_al, ref);
113962306a36Sopenharmony_ci		if (err)
114062306a36Sopenharmony_ci			return err;
114162306a36Sopenharmony_ci	}
114262306a36Sopenharmony_ci
114362306a36Sopenharmony_ci	ts->branch_count += 1;
114462306a36Sopenharmony_ci	ts->insn_count += sample->insn_cnt;
114562306a36Sopenharmony_ci	ts->cyc_count += sample->cyc_cnt;
114662306a36Sopenharmony_ci	ts->last_time = sample->time;
114762306a36Sopenharmony_ci
114862306a36Sopenharmony_ci	if (sample->flags & PERF_IP_FLAG_CALL) {
114962306a36Sopenharmony_ci		bool trace_end = sample->flags & PERF_IP_FLAG_TRACE_END;
115062306a36Sopenharmony_ci		struct call_path_root *cpr = ts->crp->cpr;
115162306a36Sopenharmony_ci		struct call_path *cp;
115262306a36Sopenharmony_ci		u64 ret_addr;
115362306a36Sopenharmony_ci
115462306a36Sopenharmony_ci		if (!sample->ip || !sample->addr)
115562306a36Sopenharmony_ci			return 0;
115662306a36Sopenharmony_ci
115762306a36Sopenharmony_ci		ret_addr = sample->ip + sample->insn_len;
115862306a36Sopenharmony_ci		if (ret_addr == sample->addr)
115962306a36Sopenharmony_ci			return 0; /* Zero-length calls are excluded */
116062306a36Sopenharmony_ci
116162306a36Sopenharmony_ci		cp = call_path__findnew(cpr, ts->stack[ts->cnt - 1].cp,
116262306a36Sopenharmony_ci					to_al->sym, sample->addr,
116362306a36Sopenharmony_ci					ts->kernel_start);
116462306a36Sopenharmony_ci		err = thread_stack__push_cp(ts, ret_addr, sample->time, ref,
116562306a36Sopenharmony_ci					    cp, false, trace_end);
116662306a36Sopenharmony_ci
116762306a36Sopenharmony_ci		/*
116862306a36Sopenharmony_ci		 * A call to the same symbol but not the start of the symbol,
116962306a36Sopenharmony_ci		 * may be the start of a x86 retpoline.
117062306a36Sopenharmony_ci		 */
117162306a36Sopenharmony_ci		if (!err && rstate == X86_RETPOLINE_POSSIBLE && to_al->sym &&
117262306a36Sopenharmony_ci		    from_al->sym == to_al->sym &&
117362306a36Sopenharmony_ci		    to_al->addr != to_al->sym->start)
117462306a36Sopenharmony_ci			ts->rstate = X86_RETPOLINE_DETECTED;
117562306a36Sopenharmony_ci
117662306a36Sopenharmony_ci	} else if (sample->flags & PERF_IP_FLAG_RETURN) {
117762306a36Sopenharmony_ci		if (!sample->addr) {
117862306a36Sopenharmony_ci			u32 return_from_kernel = PERF_IP_FLAG_SYSCALLRET |
117962306a36Sopenharmony_ci						 PERF_IP_FLAG_INTERRUPT;
118062306a36Sopenharmony_ci
118162306a36Sopenharmony_ci			if (!(sample->flags & return_from_kernel))
118262306a36Sopenharmony_ci				return 0;
118362306a36Sopenharmony_ci
118462306a36Sopenharmony_ci			/* Pop kernel stack */
118562306a36Sopenharmony_ci			return thread_stack__pop_ks(thread, ts, sample, ref);
118662306a36Sopenharmony_ci		}
118762306a36Sopenharmony_ci
118862306a36Sopenharmony_ci		if (!sample->ip)
118962306a36Sopenharmony_ci			return 0;
119062306a36Sopenharmony_ci
119162306a36Sopenharmony_ci		/* x86 retpoline 'return' doesn't match the stack */
119262306a36Sopenharmony_ci		if (rstate == X86_RETPOLINE_DETECTED && ts->cnt > 2 &&
119362306a36Sopenharmony_ci		    ts->stack[ts->cnt - 1].ret_addr != sample->addr)
119462306a36Sopenharmony_ci			return thread_stack__x86_retpoline(ts, sample, to_al);
119562306a36Sopenharmony_ci
119662306a36Sopenharmony_ci		err = thread_stack__pop_cp(thread, ts, sample->addr,
119762306a36Sopenharmony_ci					   sample->time, ref, from_al->sym);
119862306a36Sopenharmony_ci		if (err) {
119962306a36Sopenharmony_ci			if (err < 0)
120062306a36Sopenharmony_ci				return err;
120162306a36Sopenharmony_ci			err = thread_stack__no_call_return(thread, ts, sample,
120262306a36Sopenharmony_ci							   from_al, to_al, ref);
120362306a36Sopenharmony_ci		}
120462306a36Sopenharmony_ci	} else if (sample->flags & PERF_IP_FLAG_TRACE_BEGIN) {
120562306a36Sopenharmony_ci		err = thread_stack__trace_begin(thread, ts, sample->time, ref);
120662306a36Sopenharmony_ci	} else if (sample->flags & PERF_IP_FLAG_TRACE_END) {
120762306a36Sopenharmony_ci		err = thread_stack__trace_end(ts, sample, ref);
120862306a36Sopenharmony_ci	} else if (sample->flags & PERF_IP_FLAG_BRANCH &&
120962306a36Sopenharmony_ci		   from_al->sym != to_al->sym && to_al->sym &&
121062306a36Sopenharmony_ci		   to_al->addr == to_al->sym->start) {
121162306a36Sopenharmony_ci		struct call_path_root *cpr = ts->crp->cpr;
121262306a36Sopenharmony_ci		struct call_path *cp;
121362306a36Sopenharmony_ci
121462306a36Sopenharmony_ci		/*
121562306a36Sopenharmony_ci		 * The compiler might optimize a call/ret combination by making
121662306a36Sopenharmony_ci		 * it a jmp. Make that visible by recording on the stack a
121762306a36Sopenharmony_ci		 * branch to the start of a different symbol. Note, that means
121862306a36Sopenharmony_ci		 * when a ret pops the stack, all jmps must be popped off first.
121962306a36Sopenharmony_ci		 */
122062306a36Sopenharmony_ci		cp = call_path__findnew(cpr, ts->stack[ts->cnt - 1].cp,
122162306a36Sopenharmony_ci					to_al->sym, sample->addr,
122262306a36Sopenharmony_ci					ts->kernel_start);
122362306a36Sopenharmony_ci		err = thread_stack__push_cp(ts, 0, sample->time, ref, cp, false,
122462306a36Sopenharmony_ci					    false);
122562306a36Sopenharmony_ci		if (!err)
122662306a36Sopenharmony_ci			ts->stack[ts->cnt - 1].non_call = true;
122762306a36Sopenharmony_ci	}
122862306a36Sopenharmony_ci
122962306a36Sopenharmony_ci	return err;
123062306a36Sopenharmony_ci}
123162306a36Sopenharmony_ci
123262306a36Sopenharmony_cisize_t thread_stack__depth(struct thread *thread, int cpu)
123362306a36Sopenharmony_ci{
123462306a36Sopenharmony_ci	struct thread_stack *ts = thread__stack(thread, cpu);
123562306a36Sopenharmony_ci
123662306a36Sopenharmony_ci	if (!ts)
123762306a36Sopenharmony_ci		return 0;
123862306a36Sopenharmony_ci	return ts->cnt;
123962306a36Sopenharmony_ci}
1240