/* SPDX-License-Identifier: GPL-2.0 */
262306a36Sopenharmony_ci#ifndef __BPF_TCP_HELPERS_H
362306a36Sopenharmony_ci#define __BPF_TCP_HELPERS_H
462306a36Sopenharmony_ci
562306a36Sopenharmony_ci#include <stdbool.h>
662306a36Sopenharmony_ci#include <linux/types.h>
762306a36Sopenharmony_ci#include <bpf/bpf_helpers.h>
862306a36Sopenharmony_ci#include <bpf/bpf_core_read.h>
962306a36Sopenharmony_ci#include <bpf/bpf_tracing.h>
1062306a36Sopenharmony_ci
/*
 * BPF_STRUCT_OPS(name, args...) - declare a struct_ops BPF program.
 *
 * Expands to SEC("struct_ops/<name>") followed by BPF_PROG(name, args).
 * SEC and BPF_PROG are not defined in this header; they are expected to come
 * from the libbpf headers this file includes.
 */
#define BPF_STRUCT_OPS(name, args...)	\
	SEC("struct_ops/" #name)	\
	BPF_PROG(name, args)
1462306a36Sopenharmony_ci
/* Fallback definitions, used only when no earlier header supplied them. */
#if !defined(SOL_TCP)
#define SOL_TCP 6
#endif

/* Size of congestion-control name buffers and the bound used by tcp_cc_eq(). */
#if !defined(TCP_CA_NAME_MAX)
#define TCP_CA_NAME_MAX	16
#endif

/* bpf_jiffies64() truncated to 32 bits; the helper is called on every use. */
#define tcp_jiffies32 ((__u32)bpf_jiffies64())
2462306a36Sopenharmony_ci
/*
 * Subset of socket fields shared by struct sock and struct request_sock.
 * preserve_access_index asks clang to record field accesses as CO-RE
 * relocations (presumably so the real kernel layout is used at load time).
 */
struct sock_common {
	unsigned char skc_state;	/* reachable as sk->sk_state via struct sock */
	__u16 skc_num;
} __attribute__((preserve_access_index));
2962306a36Sopenharmony_ci
/* Values for sock::sk_pacing_status. */
enum sk_pacing {
	SK_PACING_NONE   = 0,
	SK_PACING_NEEDED = 1,
	SK_PACING_FQ     = 2,
};
3562306a36Sopenharmony_ci
3662306a36Sopenharmony_cistruct sock {
3762306a36Sopenharmony_ci	struct sock_common	__sk_common;
3862306a36Sopenharmony_ci#define sk_state		__sk_common.skc_state
3962306a36Sopenharmony_ci	unsigned long		sk_pacing_rate;
4062306a36Sopenharmony_ci	__u32			sk_pacing_status; /* see enum sk_pacing */
4162306a36Sopenharmony_ci} __attribute__((preserve_access_index));
4262306a36Sopenharmony_ci
4362306a36Sopenharmony_cistruct inet_sock {
4462306a36Sopenharmony_ci	struct sock		sk;
4562306a36Sopenharmony_ci} __attribute__((preserve_access_index));
4662306a36Sopenharmony_ci
4762306a36Sopenharmony_cistruct inet_connection_sock {
4862306a36Sopenharmony_ci	struct inet_sock	  icsk_inet;
4962306a36Sopenharmony_ci	__u8			  icsk_ca_state:6,
5062306a36Sopenharmony_ci				  icsk_ca_setsockopt:1,
5162306a36Sopenharmony_ci				  icsk_ca_dst_locked:1;
5262306a36Sopenharmony_ci	struct {
5362306a36Sopenharmony_ci		__u8		  pending;
5462306a36Sopenharmony_ci	} icsk_ack;
5562306a36Sopenharmony_ci	__u64			  icsk_ca_priv[104 / sizeof(__u64)];
5662306a36Sopenharmony_ci} __attribute__((preserve_access_index));
5762306a36Sopenharmony_ci
5862306a36Sopenharmony_cistruct request_sock {
5962306a36Sopenharmony_ci	struct sock_common		__req_common;
6062306a36Sopenharmony_ci} __attribute__((preserve_access_index));
6162306a36Sopenharmony_ci
6262306a36Sopenharmony_cistruct tcp_sock {
6362306a36Sopenharmony_ci	struct inet_connection_sock	inet_conn;
6462306a36Sopenharmony_ci
6562306a36Sopenharmony_ci	__u32	rcv_nxt;
6662306a36Sopenharmony_ci	__u32	snd_nxt;
6762306a36Sopenharmony_ci	__u32	snd_una;
6862306a36Sopenharmony_ci	__u32	window_clamp;
6962306a36Sopenharmony_ci	__u8	ecn_flags;
7062306a36Sopenharmony_ci	__u32	delivered;
7162306a36Sopenharmony_ci	__u32	delivered_ce;
7262306a36Sopenharmony_ci	__u32	snd_cwnd;
7362306a36Sopenharmony_ci	__u32	snd_cwnd_cnt;
7462306a36Sopenharmony_ci	__u32	snd_cwnd_clamp;
7562306a36Sopenharmony_ci	__u32	snd_ssthresh;
7662306a36Sopenharmony_ci	__u8	syn_data:1,	/* SYN includes data */
7762306a36Sopenharmony_ci		syn_fastopen:1,	/* SYN includes Fast Open option */
7862306a36Sopenharmony_ci		syn_fastopen_exp:1,/* SYN includes Fast Open exp. option */
7962306a36Sopenharmony_ci		syn_fastopen_ch:1, /* Active TFO re-enabling probe */
8062306a36Sopenharmony_ci		syn_data_acked:1,/* data in SYN is acked by SYN-ACK */
8162306a36Sopenharmony_ci		save_syn:1,	/* Save headers of SYN packet */
8262306a36Sopenharmony_ci		is_cwnd_limited:1,/* forward progress limited by snd_cwnd? */
8362306a36Sopenharmony_ci		syn_smc:1;	/* SYN includes SMC */
8462306a36Sopenharmony_ci	__u32	max_packets_out;
8562306a36Sopenharmony_ci	__u32	lsndtime;
8662306a36Sopenharmony_ci	__u32	prior_cwnd;
8762306a36Sopenharmony_ci	__u64	tcp_mstamp;	/* most recent packet received/sent */
8862306a36Sopenharmony_ci	bool	is_mptcp;
8962306a36Sopenharmony_ci} __attribute__((preserve_access_index));
9062306a36Sopenharmony_ci
9162306a36Sopenharmony_cistatic __always_inline struct inet_connection_sock *inet_csk(const struct sock *sk)
9262306a36Sopenharmony_ci{
9362306a36Sopenharmony_ci	return (struct inet_connection_sock *)sk;
9462306a36Sopenharmony_ci}
9562306a36Sopenharmony_ci
9662306a36Sopenharmony_cistatic __always_inline void *inet_csk_ca(const struct sock *sk)
9762306a36Sopenharmony_ci{
9862306a36Sopenharmony_ci	return (void *)inet_csk(sk)->icsk_ca_priv;
9962306a36Sopenharmony_ci}
10062306a36Sopenharmony_ci
10162306a36Sopenharmony_cistatic __always_inline struct tcp_sock *tcp_sk(const struct sock *sk)
10262306a36Sopenharmony_ci{
10362306a36Sopenharmony_ci	return (struct tcp_sock *)sk;
10462306a36Sopenharmony_ci}
10562306a36Sopenharmony_ci
/*
 * before() - wraparound-aware "seq1 comes before seq2" comparison.
 *
 * The unsigned difference seq1 - seq2 is reinterpreted as a signed 32-bit
 * value; a negative result means seq1 precedes seq2.  Equal values are not
 * "before" each other.
 */
static __always_inline bool before(__u32 seq1, __u32 seq2)
{
	__s32 delta = (__s32)(seq1 - seq2);

	return delta < 0;
}
/* after(a, b) is before(b, a). */
#define after(seq2, seq1)	before(seq1, seq2)
11162306a36Sopenharmony_ci
/* Distinct single-bit values (presumably for tcp_sock::ecn_flags - confirm). */
#define TCP_ECN_OK		0x1
#define TCP_ECN_QUEUE_CWR	0x2
#define TCP_ECN_DEMAND_CWR	0x4
#define TCP_ECN_SEEN		0x8
11662306a36Sopenharmony_ci
/* Single-bit ACK state values; each enumerator occupies its own bit. */
enum inet_csk_ack_state_t {
	ICSK_ACK_SCHED   = 1 << 0,
	ICSK_ACK_TIMER   = 1 << 1,
	ICSK_ACK_PUSHED  = 1 << 2,
	ICSK_ACK_PUSHED2 = 1 << 3,
	ICSK_ACK_NOW     = 1 << 4,	/* Send the next ACK immediately (once) */
};
12462306a36Sopenharmony_ci
/* Event codes passed to tcp_congestion_ops::cwnd_event(). */
enum tcp_ca_event {
	CA_EVENT_TX_START     = 0,
	CA_EVENT_CWND_RESTART = 1,
	CA_EVENT_COMPLETE_CWR = 2,
	CA_EVENT_LOSS         = 3,
	CA_EVENT_ECN_NO_CE    = 4,
	CA_EVENT_ECN_IS_CE    = 5,
};
13362306a36Sopenharmony_ci
/* Sample handed to tcp_congestion_ops::pkts_acked(). */
struct ack_sample {
	__u32	pkts_acked;
	__s32	rtt_us;		/* signed, unlike the two counters around it */
	__u32	in_flight;
} __attribute__((preserve_access_index));
13962306a36Sopenharmony_ci
/* Delivery-rate sample handed to tcp_congestion_ops::cong_control(). */
struct rate_sample {
	__u64	prior_mstamp;		/* timestamp at which the interval starts */
	__u32	prior_delivered;	/* tp->delivered as of "prior_mstamp" */
	__s32	delivered;		/* packets delivered during the interval */
	long	interval_us;		/* time tp->delivered took to grow by "delivered" */
	__u32	snd_interval_us;	/* send interval of the delivered packets */
	__u32	rcv_interval_us;	/* receive interval of the delivered packets */
	long	rtt_us;			/* RTT of the last (S)ACKed packet, or -1 */
	int	losses;			/* packets marked lost upon this ACK */
	__u32	acked_sacked;		/* packets newly (S)ACKed upon this ACK */
	__u32	prior_in_flight;	/* packets in flight before this ACK */
	bool	is_app_limited;		/* sample from a packet with a bubble in the pipe? */
	bool	is_retrans;		/* sample from a retransmission? */
	bool	is_ack_delayed;		/* (likely) a delayed ACK? */
} __attribute__((preserve_access_index));
15562306a36Sopenharmony_ci
/*
 * TCP_CA_NAME_MAX sizes tcp_congestion_ops::name.  Define it only when
 * nothing earlier (the guarded fallback near the top of this header, or
 * another include) has provided it, so the macro is never redefined here.
 */
#ifndef TCP_CA_NAME_MAX
#define TCP_CA_NAME_MAX		16
#endif

/* Presumably a bit for tcp_congestion_ops::flags - confirm against users. */
#define TCP_CONG_NEEDS_ECN	0x2
15862306a36Sopenharmony_ci
15962306a36Sopenharmony_cistruct tcp_congestion_ops {
16062306a36Sopenharmony_ci	char name[TCP_CA_NAME_MAX];
16162306a36Sopenharmony_ci	__u32 flags;
16262306a36Sopenharmony_ci
16362306a36Sopenharmony_ci	/* initialize private data (optional) */
16462306a36Sopenharmony_ci	void (*init)(struct sock *sk);
16562306a36Sopenharmony_ci	/* cleanup private data  (optional) */
16662306a36Sopenharmony_ci	void (*release)(struct sock *sk);
16762306a36Sopenharmony_ci
16862306a36Sopenharmony_ci	/* return slow start threshold (required) */
16962306a36Sopenharmony_ci	__u32 (*ssthresh)(struct sock *sk);
17062306a36Sopenharmony_ci	/* do new cwnd calculation (required) */
17162306a36Sopenharmony_ci	void (*cong_avoid)(struct sock *sk, __u32 ack, __u32 acked);
17262306a36Sopenharmony_ci	/* call before changing ca_state (optional) */
17362306a36Sopenharmony_ci	void (*set_state)(struct sock *sk, __u8 new_state);
17462306a36Sopenharmony_ci	/* call when cwnd event occurs (optional) */
17562306a36Sopenharmony_ci	void (*cwnd_event)(struct sock *sk, enum tcp_ca_event ev);
17662306a36Sopenharmony_ci	/* call when ack arrives (optional) */
17762306a36Sopenharmony_ci	void (*in_ack_event)(struct sock *sk, __u32 flags);
17862306a36Sopenharmony_ci	/* new value of cwnd after loss (required) */
17962306a36Sopenharmony_ci	__u32  (*undo_cwnd)(struct sock *sk);
18062306a36Sopenharmony_ci	/* hook for packet ack accounting (optional) */
18162306a36Sopenharmony_ci	void (*pkts_acked)(struct sock *sk, const struct ack_sample *sample);
18262306a36Sopenharmony_ci	/* override sysctl_tcp_min_tso_segs */
18362306a36Sopenharmony_ci	__u32 (*min_tso_segs)(struct sock *sk);
18462306a36Sopenharmony_ci	/* returns the multiplier used in tcp_sndbuf_expand (optional) */
18562306a36Sopenharmony_ci	__u32 (*sndbuf_expand)(struct sock *sk);
18662306a36Sopenharmony_ci	/* call when packets are delivered to update cwnd and pacing rate,
18762306a36Sopenharmony_ci	 * after all the ca_state processing. (optional)
18862306a36Sopenharmony_ci	 */
18962306a36Sopenharmony_ci	void (*cong_control)(struct sock *sk, const struct rate_sample *rs);
19062306a36Sopenharmony_ci	void *owner;
19162306a36Sopenharmony_ci};
19262306a36Sopenharmony_ci
/*
 * min(a, b) / max(a, b) - smaller / larger of two values.
 *
 * Each argument is evaluated exactly once, so expressions with side effects
 * (e.g. min(i++, n)) are safe.  The comparison and the result follow the
 * usual arithmetic conversions of the two argument types.
 *
 * These are GNU statement expressions: they cannot be used where a constant
 * expression is required, and the arguments cannot be bitfields because
 * __typeof__ is applied to them.
 */
#define min(a, b) ({				\
	__typeof__(a) __min_a = (a);		\
	__typeof__(b) __min_b = (b);		\
	__min_a < __min_b ? __min_a : __min_b; })
#define max(a, b) ({				\
	__typeof__(a) __max_a = (a);		\
	__typeof__(b) __max_b = (b);		\
	__max_a > __max_b ? __max_a : __max_b; })

/*
 * min_not_zero(x, y) - smaller of x and y, ignoring operands equal to zero.
 *
 * Yields y when x is zero, x when y is zero, and min(x, y) otherwise (so the
 * result is zero only when both are zero).  Arguments are evaluated once.
 */
#define min_not_zero(x, y) ({			\
	__typeof__(x) __x = (x);		\
	__typeof__(y) __y = (y);		\
	__x == 0 ? __y : ((__y == 0) ? __x : min(__x, __y)); })
19962306a36Sopenharmony_ci
20062306a36Sopenharmony_cistatic __always_inline bool tcp_in_slow_start(const struct tcp_sock *tp)
20162306a36Sopenharmony_ci{
20262306a36Sopenharmony_ci	return tp->snd_cwnd < tp->snd_ssthresh;
20362306a36Sopenharmony_ci}
20462306a36Sopenharmony_ci
20562306a36Sopenharmony_cistatic __always_inline bool tcp_is_cwnd_limited(const struct sock *sk)
20662306a36Sopenharmony_ci{
20762306a36Sopenharmony_ci	const struct tcp_sock *tp = tcp_sk(sk);
20862306a36Sopenharmony_ci
20962306a36Sopenharmony_ci	/* If in slow start, ensure cwnd grows to twice what was ACKed. */
21062306a36Sopenharmony_ci	if (tcp_in_slow_start(tp))
21162306a36Sopenharmony_ci		return tp->snd_cwnd < 2 * tp->max_packets_out;
21262306a36Sopenharmony_ci
21362306a36Sopenharmony_ci	return !!BPF_CORE_READ_BITFIELD(tp, is_cwnd_limited);
21462306a36Sopenharmony_ci}
21562306a36Sopenharmony_ci
21662306a36Sopenharmony_cistatic __always_inline bool tcp_cc_eq(const char *a, const char *b)
21762306a36Sopenharmony_ci{
21862306a36Sopenharmony_ci	int i;
21962306a36Sopenharmony_ci
22062306a36Sopenharmony_ci	for (i = 0; i < TCP_CA_NAME_MAX; i++) {
22162306a36Sopenharmony_ci		if (a[i] != b[i])
22262306a36Sopenharmony_ci			return false;
22362306a36Sopenharmony_ci		if (!a[i])
22462306a36Sopenharmony_ci			break;
22562306a36Sopenharmony_ci	}
22662306a36Sopenharmony_ci
22762306a36Sopenharmony_ci	return true;
22862306a36Sopenharmony_ci}
22962306a36Sopenharmony_ci
23062306a36Sopenharmony_ciextern __u32 tcp_slow_start(struct tcp_sock *tp, __u32 acked) __ksym;
23162306a36Sopenharmony_ciextern void tcp_cong_avoid_ai(struct tcp_sock *tp, __u32 w, __u32 acked) __ksym;
23262306a36Sopenharmony_ci
23362306a36Sopenharmony_cistruct mptcp_sock {
23462306a36Sopenharmony_ci	struct inet_connection_sock	sk;
23562306a36Sopenharmony_ci
23662306a36Sopenharmony_ci	__u32		token;
23762306a36Sopenharmony_ci	struct sock	*first;
23862306a36Sopenharmony_ci	char		ca_name[TCP_CA_NAME_MAX];
23962306a36Sopenharmony_ci} __attribute__((preserve_access_index));
24062306a36Sopenharmony_ci
24162306a36Sopenharmony_ci#endif
242