162306a36Sopenharmony_ci/* SPDX-License-Identifier: GPL-2.0 */ 262306a36Sopenharmony_ci#ifndef __BPF_TCP_HELPERS_H 362306a36Sopenharmony_ci#define __BPF_TCP_HELPERS_H 462306a36Sopenharmony_ci 562306a36Sopenharmony_ci#include <stdbool.h> 662306a36Sopenharmony_ci#include <linux/types.h> 762306a36Sopenharmony_ci#include <bpf/bpf_helpers.h> 862306a36Sopenharmony_ci#include <bpf/bpf_core_read.h> 962306a36Sopenharmony_ci#include <bpf/bpf_tracing.h> 1062306a36Sopenharmony_ci 1162306a36Sopenharmony_ci#define BPF_STRUCT_OPS(name, args...) \ 1262306a36Sopenharmony_ciSEC("struct_ops/"#name) \ 1362306a36Sopenharmony_ciBPF_PROG(name, args) 1462306a36Sopenharmony_ci 1562306a36Sopenharmony_ci#ifndef SOL_TCP 1662306a36Sopenharmony_ci#define SOL_TCP 6 1762306a36Sopenharmony_ci#endif 1862306a36Sopenharmony_ci 1962306a36Sopenharmony_ci#ifndef TCP_CA_NAME_MAX 2062306a36Sopenharmony_ci#define TCP_CA_NAME_MAX 16 2162306a36Sopenharmony_ci#endif 2262306a36Sopenharmony_ci 2362306a36Sopenharmony_ci#define tcp_jiffies32 ((__u32)bpf_jiffies64()) 2462306a36Sopenharmony_ci 2562306a36Sopenharmony_cistruct sock_common { 2662306a36Sopenharmony_ci unsigned char skc_state; 2762306a36Sopenharmony_ci __u16 skc_num; 2862306a36Sopenharmony_ci} __attribute__((preserve_access_index)); 2962306a36Sopenharmony_ci 3062306a36Sopenharmony_cienum sk_pacing { 3162306a36Sopenharmony_ci SK_PACING_NONE = 0, 3262306a36Sopenharmony_ci SK_PACING_NEEDED = 1, 3362306a36Sopenharmony_ci SK_PACING_FQ = 2, 3462306a36Sopenharmony_ci}; 3562306a36Sopenharmony_ci 3662306a36Sopenharmony_cistruct sock { 3762306a36Sopenharmony_ci struct sock_common __sk_common; 3862306a36Sopenharmony_ci#define sk_state __sk_common.skc_state 3962306a36Sopenharmony_ci unsigned long sk_pacing_rate; 4062306a36Sopenharmony_ci __u32 sk_pacing_status; /* see enum sk_pacing */ 4162306a36Sopenharmony_ci} __attribute__((preserve_access_index)); 4262306a36Sopenharmony_ci 4362306a36Sopenharmony_cistruct inet_sock { 4462306a36Sopenharmony_ci struct sock sk; 4562306a36Sopenharmony_ci} __attribute__((preserve_access_index)); 4662306a36Sopenharmony_ci 4762306a36Sopenharmony_cistruct inet_connection_sock { 4862306a36Sopenharmony_ci struct inet_sock icsk_inet; 4962306a36Sopenharmony_ci __u8 icsk_ca_state:6, 5062306a36Sopenharmony_ci icsk_ca_setsockopt:1, 5162306a36Sopenharmony_ci icsk_ca_dst_locked:1; 5262306a36Sopenharmony_ci struct { 5362306a36Sopenharmony_ci __u8 pending; 5462306a36Sopenharmony_ci } icsk_ack; 5562306a36Sopenharmony_ci __u64 icsk_ca_priv[104 / sizeof(__u64)]; 5662306a36Sopenharmony_ci} __attribute__((preserve_access_index)); 5762306a36Sopenharmony_ci 5862306a36Sopenharmony_cistruct request_sock { 5962306a36Sopenharmony_ci struct sock_common __req_common; 6062306a36Sopenharmony_ci} __attribute__((preserve_access_index)); 6162306a36Sopenharmony_ci 6262306a36Sopenharmony_cistruct tcp_sock { 6362306a36Sopenharmony_ci struct inet_connection_sock inet_conn; 6462306a36Sopenharmony_ci 6562306a36Sopenharmony_ci __u32 rcv_nxt; 6662306a36Sopenharmony_ci __u32 snd_nxt; 6762306a36Sopenharmony_ci __u32 snd_una; 6862306a36Sopenharmony_ci __u32 window_clamp; 6962306a36Sopenharmony_ci __u8 ecn_flags; 7062306a36Sopenharmony_ci __u32 delivered; 7162306a36Sopenharmony_ci __u32 delivered_ce; 7262306a36Sopenharmony_ci __u32 snd_cwnd; 7362306a36Sopenharmony_ci __u32 snd_cwnd_cnt; 7462306a36Sopenharmony_ci __u32 snd_cwnd_clamp; 7562306a36Sopenharmony_ci __u32 snd_ssthresh; 7662306a36Sopenharmony_ci __u8 syn_data:1, /* SYN includes data */ 7762306a36Sopenharmony_ci syn_fastopen:1, /* SYN includes Fast Open option */ 7862306a36Sopenharmony_ci syn_fastopen_exp:1,/* SYN includes Fast Open exp. option */ 7962306a36Sopenharmony_ci syn_fastopen_ch:1, /* Active TFO re-enabling probe */ 8062306a36Sopenharmony_ci syn_data_acked:1,/* data in SYN is acked by SYN-ACK */ 8162306a36Sopenharmony_ci save_syn:1, /* Save headers of SYN packet */ 8262306a36Sopenharmony_ci is_cwnd_limited:1,/* forward progress limited by snd_cwnd? */ 8362306a36Sopenharmony_ci syn_smc:1; /* SYN includes SMC */ 8462306a36Sopenharmony_ci __u32 max_packets_out; 8562306a36Sopenharmony_ci __u32 lsndtime; 8662306a36Sopenharmony_ci __u32 prior_cwnd; 8762306a36Sopenharmony_ci __u64 tcp_mstamp; /* most recent packet received/sent */ 8862306a36Sopenharmony_ci bool is_mptcp; 8962306a36Sopenharmony_ci} __attribute__((preserve_access_index)); 9062306a36Sopenharmony_ci 9162306a36Sopenharmony_cistatic __always_inline struct inet_connection_sock *inet_csk(const struct sock *sk) 9262306a36Sopenharmony_ci{ 9362306a36Sopenharmony_ci return (struct inet_connection_sock *)sk; 9462306a36Sopenharmony_ci} 9562306a36Sopenharmony_ci 9662306a36Sopenharmony_cistatic __always_inline void *inet_csk_ca(const struct sock *sk) 9762306a36Sopenharmony_ci{ 9862306a36Sopenharmony_ci return (void *)inet_csk(sk)->icsk_ca_priv; 9962306a36Sopenharmony_ci} 10062306a36Sopenharmony_ci 10162306a36Sopenharmony_cistatic __always_inline struct tcp_sock *tcp_sk(const struct sock *sk) 10262306a36Sopenharmony_ci{ 10362306a36Sopenharmony_ci return (struct tcp_sock *)sk; 10462306a36Sopenharmony_ci} 10562306a36Sopenharmony_ci 10662306a36Sopenharmony_cistatic __always_inline bool before(__u32 seq1, __u32 seq2) 10762306a36Sopenharmony_ci{ 10862306a36Sopenharmony_ci return (__s32)(seq1-seq2) < 0; 10962306a36Sopenharmony_ci} 11062306a36Sopenharmony_ci#define after(seq2, seq1) before(seq1, seq2) 11162306a36Sopenharmony_ci 11262306a36Sopenharmony_ci#define TCP_ECN_OK 1 11362306a36Sopenharmony_ci#define TCP_ECN_QUEUE_CWR 2 11462306a36Sopenharmony_ci#define TCP_ECN_DEMAND_CWR 4 11562306a36Sopenharmony_ci#define TCP_ECN_SEEN 8 11662306a36Sopenharmony_ci 11762306a36Sopenharmony_cienum inet_csk_ack_state_t { 11862306a36Sopenharmony_ci ICSK_ACK_SCHED = 1, 11962306a36Sopenharmony_ci ICSK_ACK_TIMER = 2, 12062306a36Sopenharmony_ci ICSK_ACK_PUSHED = 4, 12162306a36Sopenharmony_ci ICSK_ACK_PUSHED2 = 8, 12262306a36Sopenharmony_ci ICSK_ACK_NOW = 16 /* Send the next ACK immediately (once) */ 12362306a36Sopenharmony_ci}; 12462306a36Sopenharmony_ci 12562306a36Sopenharmony_cienum tcp_ca_event { 12662306a36Sopenharmony_ci CA_EVENT_TX_START = 0, 12762306a36Sopenharmony_ci CA_EVENT_CWND_RESTART = 1, 12862306a36Sopenharmony_ci CA_EVENT_COMPLETE_CWR = 2, 12962306a36Sopenharmony_ci CA_EVENT_LOSS = 3, 13062306a36Sopenharmony_ci CA_EVENT_ECN_NO_CE = 4, 13162306a36Sopenharmony_ci CA_EVENT_ECN_IS_CE = 5, 13262306a36Sopenharmony_ci}; 13362306a36Sopenharmony_ci 13462306a36Sopenharmony_cistruct ack_sample { 13562306a36Sopenharmony_ci __u32 pkts_acked; 13662306a36Sopenharmony_ci __s32 rtt_us; 13762306a36Sopenharmony_ci __u32 in_flight; 13862306a36Sopenharmony_ci} __attribute__((preserve_access_index)); 13962306a36Sopenharmony_ci 14062306a36Sopenharmony_cistruct rate_sample { 14162306a36Sopenharmony_ci __u64 prior_mstamp; /* starting timestamp for interval */ 14262306a36Sopenharmony_ci __u32 prior_delivered; /* tp->delivered at "prior_mstamp" */ 14362306a36Sopenharmony_ci __s32 delivered; /* number of packets delivered over interval */ 14462306a36Sopenharmony_ci long interval_us; /* time for tp->delivered to incr "delivered" */ 14562306a36Sopenharmony_ci __u32 snd_interval_us; /* snd interval for delivered packets */ 14662306a36Sopenharmony_ci __u32 rcv_interval_us; /* rcv interval for delivered packets */ 14762306a36Sopenharmony_ci long rtt_us; /* RTT of last (S)ACKed packet (or -1) */ 14862306a36Sopenharmony_ci int losses; /* number of packets marked lost upon ACK */ 14962306a36Sopenharmony_ci __u32 acked_sacked; /* number of packets newly (S)ACKed upon ACK */ 15062306a36Sopenharmony_ci __u32 prior_in_flight; /* in flight before this ACK */ 15162306a36Sopenharmony_ci bool is_app_limited; /* is sample from packet with bubble in pipe? */ 15262306a36Sopenharmony_ci bool is_retrans; /* is sample from retransmission? */ 15362306a36Sopenharmony_ci bool is_ack_delayed; /* is this (likely) a delayed ACK? */ 15462306a36Sopenharmony_ci} __attribute__((preserve_access_index)); 15562306a36Sopenharmony_ci 15662306a36Sopenharmony_ci#define TCP_CA_NAME_MAX 16 15762306a36Sopenharmony_ci#define TCP_CONG_NEEDS_ECN 0x2 15862306a36Sopenharmony_ci 15962306a36Sopenharmony_cistruct tcp_congestion_ops { 16062306a36Sopenharmony_ci char name[TCP_CA_NAME_MAX]; 16162306a36Sopenharmony_ci __u32 flags; 16262306a36Sopenharmony_ci 16362306a36Sopenharmony_ci /* initialize private data (optional) */ 16462306a36Sopenharmony_ci void (*init)(struct sock *sk); 16562306a36Sopenharmony_ci /* cleanup private data (optional) */ 16662306a36Sopenharmony_ci void (*release)(struct sock *sk); 16762306a36Sopenharmony_ci 16862306a36Sopenharmony_ci /* return slow start threshold (required) */ 16962306a36Sopenharmony_ci __u32 (*ssthresh)(struct sock *sk); 17062306a36Sopenharmony_ci /* do new cwnd calculation (required) */ 17162306a36Sopenharmony_ci void (*cong_avoid)(struct sock *sk, __u32 ack, __u32 acked); 17262306a36Sopenharmony_ci /* call before changing ca_state (optional) */ 17362306a36Sopenharmony_ci void (*set_state)(struct sock *sk, __u8 new_state); 17462306a36Sopenharmony_ci /* call when cwnd event occurs (optional) */ 17562306a36Sopenharmony_ci void (*cwnd_event)(struct sock *sk, enum tcp_ca_event ev); 17662306a36Sopenharmony_ci /* call when ack arrives (optional) */ 17762306a36Sopenharmony_ci void (*in_ack_event)(struct sock *sk, __u32 flags); 17862306a36Sopenharmony_ci /* new value of cwnd after loss (required) */ 17962306a36Sopenharmony_ci __u32 (*undo_cwnd)(struct sock *sk); 18062306a36Sopenharmony_ci /* hook for packet ack accounting (optional) */ 18162306a36Sopenharmony_ci void (*pkts_acked)(struct sock *sk, const struct ack_sample *sample); 18262306a36Sopenharmony_ci /* override sysctl_tcp_min_tso_segs */ 18362306a36Sopenharmony_ci __u32 (*min_tso_segs)(struct sock *sk); 18462306a36Sopenharmony_ci /* returns the multiplier used in tcp_sndbuf_expand (optional) */ 18562306a36Sopenharmony_ci __u32 (*sndbuf_expand)(struct sock *sk); 18662306a36Sopenharmony_ci /* call when packets are delivered to update cwnd and pacing rate, 18762306a36Sopenharmony_ci * after all the ca_state processing. (optional) 18862306a36Sopenharmony_ci */ 18962306a36Sopenharmony_ci void (*cong_control)(struct sock *sk, const struct rate_sample *rs); 19062306a36Sopenharmony_ci void *owner; 19162306a36Sopenharmony_ci}; 19262306a36Sopenharmony_ci 19362306a36Sopenharmony_ci#define min(a, b) ((a) < (b) ? (a) : (b)) 19462306a36Sopenharmony_ci#define max(a, b) ((a) > (b) ? (a) : (b)) 19562306a36Sopenharmony_ci#define min_not_zero(x, y) ({ \ 19662306a36Sopenharmony_ci typeof(x) __x = (x); \ 19762306a36Sopenharmony_ci typeof(y) __y = (y); \ 19862306a36Sopenharmony_ci __x == 0 ? __y : ((__y == 0) ? __x : min(__x, __y)); }) 19962306a36Sopenharmony_ci 20062306a36Sopenharmony_cistatic __always_inline bool tcp_in_slow_start(const struct tcp_sock *tp) 20162306a36Sopenharmony_ci{ 20262306a36Sopenharmony_ci return tp->snd_cwnd < tp->snd_ssthresh; 20362306a36Sopenharmony_ci} 20462306a36Sopenharmony_ci 20562306a36Sopenharmony_cistatic __always_inline bool tcp_is_cwnd_limited(const struct sock *sk) 20662306a36Sopenharmony_ci{ 20762306a36Sopenharmony_ci const struct tcp_sock *tp = tcp_sk(sk); 20862306a36Sopenharmony_ci 20962306a36Sopenharmony_ci /* If in slow start, ensure cwnd grows to twice what was ACKed. */ 21062306a36Sopenharmony_ci if (tcp_in_slow_start(tp)) 21162306a36Sopenharmony_ci return tp->snd_cwnd < 2 * tp->max_packets_out; 21262306a36Sopenharmony_ci 21362306a36Sopenharmony_ci return !!BPF_CORE_READ_BITFIELD(tp, is_cwnd_limited); 21462306a36Sopenharmony_ci} 21562306a36Sopenharmony_ci 21662306a36Sopenharmony_cistatic __always_inline bool tcp_cc_eq(const char *a, const char *b) 21762306a36Sopenharmony_ci{ 21862306a36Sopenharmony_ci int i; 21962306a36Sopenharmony_ci 22062306a36Sopenharmony_ci for (i = 0; i < TCP_CA_NAME_MAX; i++) { 22162306a36Sopenharmony_ci if (a[i] != b[i]) 22262306a36Sopenharmony_ci return false; 22362306a36Sopenharmony_ci if (!a[i]) 22462306a36Sopenharmony_ci break; 22562306a36Sopenharmony_ci } 22662306a36Sopenharmony_ci 22762306a36Sopenharmony_ci return true; 22862306a36Sopenharmony_ci} 22962306a36Sopenharmony_ci 23062306a36Sopenharmony_ciextern __u32 tcp_slow_start(struct tcp_sock *tp, __u32 acked) __ksym; 23162306a36Sopenharmony_ciextern void tcp_cong_avoid_ai(struct tcp_sock *tp, __u32 w, __u32 acked) __ksym; 23262306a36Sopenharmony_ci 23362306a36Sopenharmony_cistruct mptcp_sock { 23462306a36Sopenharmony_ci struct inet_connection_sock sk; 23562306a36Sopenharmony_ci 23662306a36Sopenharmony_ci __u32 token; 23762306a36Sopenharmony_ci struct sock *first; 23862306a36Sopenharmony_ci char ca_name[TCP_CA_NAME_MAX]; 23962306a36Sopenharmony_ci} __attribute__((preserve_access_index)); 24062306a36Sopenharmony_ci 24162306a36Sopenharmony_ci#endif 242