162306a36Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0 OR BSD-3-Clause
262306a36Sopenharmony_ci
362306a36Sopenharmony_ci/* COMMON Applications Kept Enhanced (CAKE) discipline
462306a36Sopenharmony_ci *
562306a36Sopenharmony_ci * Copyright (C) 2014-2018 Jonathan Morton <chromatix99@gmail.com>
662306a36Sopenharmony_ci * Copyright (C) 2015-2018 Toke Høiland-Jørgensen <toke@toke.dk>
762306a36Sopenharmony_ci * Copyright (C) 2014-2018 Dave Täht <dave.taht@gmail.com>
862306a36Sopenharmony_ci * Copyright (C) 2015-2018 Sebastian Moeller <moeller0@gmx.de>
962306a36Sopenharmony_ci * (C) 2015-2018 Kevin Darbyshire-Bryant <kevin@darbyshire-bryant.me.uk>
1062306a36Sopenharmony_ci * Copyright (C) 2017-2018 Ryan Mounce <ryan@mounce.com.au>
1162306a36Sopenharmony_ci *
1262306a36Sopenharmony_ci * The CAKE Principles:
1362306a36Sopenharmony_ci *		   (or, how to have your cake and eat it too)
1462306a36Sopenharmony_ci *
1562306a36Sopenharmony_ci * This is a combination of several shaping, AQM and FQ techniques into one
1662306a36Sopenharmony_ci * easy-to-use package:
1762306a36Sopenharmony_ci *
1862306a36Sopenharmony_ci * - An overall bandwidth shaper, to move the bottleneck away from dumb CPE
1962306a36Sopenharmony_ci *   equipment and bloated MACs.  This operates in deficit mode (as in sch_fq),
2062306a36Sopenharmony_ci *   eliminating the need for any sort of burst parameter (eg. token bucket
2162306a36Sopenharmony_ci *   depth).  Burst support is limited to that necessary to overcome scheduling
2262306a36Sopenharmony_ci *   latency.
2362306a36Sopenharmony_ci *
2462306a36Sopenharmony_ci * - A Diffserv-aware priority queue, giving more priority to certain classes,
2562306a36Sopenharmony_ci *   up to a specified fraction of bandwidth.  Above that bandwidth threshold,
2662306a36Sopenharmony_ci *   the priority is reduced to avoid starving other tins.
2762306a36Sopenharmony_ci *
2862306a36Sopenharmony_ci * - Each priority tin has a separate Flow Queue system, to isolate traffic
2962306a36Sopenharmony_ci *   flows from each other.  This prevents a burst on one flow from increasing
3062306a36Sopenharmony_ci *   the delay to another.  Flows are distributed to queues using a
3162306a36Sopenharmony_ci *   set-associative hash function.
3262306a36Sopenharmony_ci *
3362306a36Sopenharmony_ci * - Each queue is actively managed by Cobalt, which is a combination of the
3462306a36Sopenharmony_ci *   Codel and Blue AQM algorithms.  This serves flows fairly, and signals
3562306a36Sopenharmony_ci *   congestion early via ECN (if available) and/or packet drops, to keep
3662306a36Sopenharmony_ci *   latency low.  The codel parameters are auto-tuned based on the bandwidth
3762306a36Sopenharmony_ci *   setting, as is necessary at low bandwidths.
3862306a36Sopenharmony_ci *
3962306a36Sopenharmony_ci * The configuration parameters are kept deliberately simple for ease of use.
4062306a36Sopenharmony_ci * Everything has sane defaults.  Complete generality of configuration is *not*
4162306a36Sopenharmony_ci * a goal.
4262306a36Sopenharmony_ci *
4362306a36Sopenharmony_ci * The priority queue operates according to a weighted DRR scheme, combined with
4462306a36Sopenharmony_ci * a bandwidth tracker which reuses the shaper logic to detect which side of the
4562306a36Sopenharmony_ci * bandwidth sharing threshold the tin is operating.  This determines whether a
4662306a36Sopenharmony_ci * priority-based weight (high) or a bandwidth-based weight (low) is used for
4762306a36Sopenharmony_ci * that tin in the current pass.
4862306a36Sopenharmony_ci *
4962306a36Sopenharmony_ci * This qdisc was inspired by Eric Dumazet's fq_codel code, which he kindly
5062306a36Sopenharmony_ci * granted us permission to leverage.
5162306a36Sopenharmony_ci */
5262306a36Sopenharmony_ci
5362306a36Sopenharmony_ci#include <linux/module.h>
5462306a36Sopenharmony_ci#include <linux/types.h>
5562306a36Sopenharmony_ci#include <linux/kernel.h>
5662306a36Sopenharmony_ci#include <linux/jiffies.h>
5762306a36Sopenharmony_ci#include <linux/string.h>
5862306a36Sopenharmony_ci#include <linux/in.h>
5962306a36Sopenharmony_ci#include <linux/errno.h>
6062306a36Sopenharmony_ci#include <linux/init.h>
6162306a36Sopenharmony_ci#include <linux/skbuff.h>
6262306a36Sopenharmony_ci#include <linux/jhash.h>
6362306a36Sopenharmony_ci#include <linux/slab.h>
6462306a36Sopenharmony_ci#include <linux/vmalloc.h>
6562306a36Sopenharmony_ci#include <linux/reciprocal_div.h>
6662306a36Sopenharmony_ci#include <net/netlink.h>
6762306a36Sopenharmony_ci#include <linux/if_vlan.h>
6862306a36Sopenharmony_ci#include <net/gso.h>
6962306a36Sopenharmony_ci#include <net/pkt_sched.h>
7062306a36Sopenharmony_ci#include <net/pkt_cls.h>
7162306a36Sopenharmony_ci#include <net/tcp.h>
7262306a36Sopenharmony_ci#include <net/flow_dissector.h>
7362306a36Sopenharmony_ci
7462306a36Sopenharmony_ci#if IS_ENABLED(CONFIG_NF_CONNTRACK)
7562306a36Sopenharmony_ci#include <net/netfilter/nf_conntrack_core.h>
7662306a36Sopenharmony_ci#endif
7762306a36Sopenharmony_ci
7862306a36Sopenharmony_ci#define CAKE_SET_WAYS (8)
7962306a36Sopenharmony_ci#define CAKE_MAX_TINS (8)
8062306a36Sopenharmony_ci#define CAKE_QUEUES (1024)
8162306a36Sopenharmony_ci#define CAKE_FLOW_MASK 63
8262306a36Sopenharmony_ci#define CAKE_FLOW_NAT_FLAG 64
8362306a36Sopenharmony_ci
8462306a36Sopenharmony_ci/* struct cobalt_params - contains codel and blue parameters
8562306a36Sopenharmony_ci * @interval:	codel initial drop rate
8662306a36Sopenharmony_ci * @target:     maximum persistent sojourn time & blue update rate
8762306a36Sopenharmony_ci * @mtu_time:   serialisation delay of maximum-size packet
8862306a36Sopenharmony_ci * @p_inc:      increment of blue drop probability (0.32 fxp)
8962306a36Sopenharmony_ci * @p_dec:      decrement of blue drop probability (0.32 fxp)
9062306a36Sopenharmony_ci */
9162306a36Sopenharmony_cistruct cobalt_params {
9262306a36Sopenharmony_ci	u64	interval;
9362306a36Sopenharmony_ci	u64	target;
9462306a36Sopenharmony_ci	u64	mtu_time;
9562306a36Sopenharmony_ci	u32	p_inc;
9662306a36Sopenharmony_ci	u32	p_dec;
9762306a36Sopenharmony_ci};
9862306a36Sopenharmony_ci
9962306a36Sopenharmony_ci/* struct cobalt_vars - contains codel and blue variables
10062306a36Sopenharmony_ci * @count:		codel dropping frequency
10162306a36Sopenharmony_ci * @rec_inv_sqrt:	reciprocal value of sqrt(count) >> 1
10262306a36Sopenharmony_ci * @drop_next:		time to drop next packet, or when we dropped last
10362306a36Sopenharmony_ci * @blue_timer:		Blue time to next drop
10462306a36Sopenharmony_ci * @p_drop:		BLUE drop probability (0.32 fxp)
10562306a36Sopenharmony_ci * @dropping:		set if in dropping state
10662306a36Sopenharmony_ci * @ecn_marked:		set if marked
10762306a36Sopenharmony_ci */
10862306a36Sopenharmony_cistruct cobalt_vars {
10962306a36Sopenharmony_ci	u32	count;
11062306a36Sopenharmony_ci	u32	rec_inv_sqrt;
11162306a36Sopenharmony_ci	ktime_t	drop_next;
11262306a36Sopenharmony_ci	ktime_t	blue_timer;
11362306a36Sopenharmony_ci	u32     p_drop;
11462306a36Sopenharmony_ci	bool	dropping;
11562306a36Sopenharmony_ci	bool    ecn_marked;
11662306a36Sopenharmony_ci};
11762306a36Sopenharmony_ci
11862306a36Sopenharmony_cienum {
11962306a36Sopenharmony_ci	CAKE_SET_NONE = 0,
12062306a36Sopenharmony_ci	CAKE_SET_SPARSE,
12162306a36Sopenharmony_ci	CAKE_SET_SPARSE_WAIT, /* counted in SPARSE, actually in BULK */
12262306a36Sopenharmony_ci	CAKE_SET_BULK,
12362306a36Sopenharmony_ci	CAKE_SET_DECAYING
12462306a36Sopenharmony_ci};
12562306a36Sopenharmony_ci
12662306a36Sopenharmony_cistruct cake_flow {
12762306a36Sopenharmony_ci	/* this stuff is all needed per-flow at dequeue time */
12862306a36Sopenharmony_ci	struct sk_buff	  *head;
12962306a36Sopenharmony_ci	struct sk_buff	  *tail;
13062306a36Sopenharmony_ci	struct list_head  flowchain;
13162306a36Sopenharmony_ci	s32		  deficit;
13262306a36Sopenharmony_ci	u32		  dropped;
13362306a36Sopenharmony_ci	struct cobalt_vars cvars;
13462306a36Sopenharmony_ci	u16		  srchost; /* index into cake_host table */
13562306a36Sopenharmony_ci	u16		  dsthost;
13662306a36Sopenharmony_ci	u8		  set;
13762306a36Sopenharmony_ci}; /* please try to keep this structure <= 64 bytes */
13862306a36Sopenharmony_ci
13962306a36Sopenharmony_cistruct cake_host {
14062306a36Sopenharmony_ci	u32 srchost_tag;
14162306a36Sopenharmony_ci	u32 dsthost_tag;
14262306a36Sopenharmony_ci	u16 srchost_bulk_flow_count;
14362306a36Sopenharmony_ci	u16 dsthost_bulk_flow_count;
14462306a36Sopenharmony_ci};
14562306a36Sopenharmony_ci
14662306a36Sopenharmony_cistruct cake_heap_entry {
14762306a36Sopenharmony_ci	u16 t:3, b:10;
14862306a36Sopenharmony_ci};
14962306a36Sopenharmony_ci
15062306a36Sopenharmony_cistruct cake_tin_data {
15162306a36Sopenharmony_ci	struct cake_flow flows[CAKE_QUEUES];
15262306a36Sopenharmony_ci	u32	backlogs[CAKE_QUEUES];
15362306a36Sopenharmony_ci	u32	tags[CAKE_QUEUES]; /* for set association */
15462306a36Sopenharmony_ci	u16	overflow_idx[CAKE_QUEUES];
15562306a36Sopenharmony_ci	struct cake_host hosts[CAKE_QUEUES]; /* for triple isolation */
15662306a36Sopenharmony_ci	u16	flow_quantum;
15762306a36Sopenharmony_ci
15862306a36Sopenharmony_ci	struct cobalt_params cparams;
15962306a36Sopenharmony_ci	u32	drop_overlimit;
16062306a36Sopenharmony_ci	u16	bulk_flow_count;
16162306a36Sopenharmony_ci	u16	sparse_flow_count;
16262306a36Sopenharmony_ci	u16	decaying_flow_count;
16362306a36Sopenharmony_ci	u16	unresponsive_flow_count;
16462306a36Sopenharmony_ci
16562306a36Sopenharmony_ci	u32	max_skblen;
16662306a36Sopenharmony_ci
16762306a36Sopenharmony_ci	struct list_head new_flows;
16862306a36Sopenharmony_ci	struct list_head old_flows;
16962306a36Sopenharmony_ci	struct list_head decaying_flows;
17062306a36Sopenharmony_ci
17162306a36Sopenharmony_ci	/* time_next = time_this + ((len * rate_ns) >> rate_shft) */
17262306a36Sopenharmony_ci	ktime_t	time_next_packet;
17362306a36Sopenharmony_ci	u64	tin_rate_ns;
17462306a36Sopenharmony_ci	u64	tin_rate_bps;
17562306a36Sopenharmony_ci	u16	tin_rate_shft;
17662306a36Sopenharmony_ci
17762306a36Sopenharmony_ci	u16	tin_quantum;
17862306a36Sopenharmony_ci	s32	tin_deficit;
17962306a36Sopenharmony_ci	u32	tin_backlog;
18062306a36Sopenharmony_ci	u32	tin_dropped;
18162306a36Sopenharmony_ci	u32	tin_ecn_mark;
18262306a36Sopenharmony_ci
18362306a36Sopenharmony_ci	u32	packets;
18462306a36Sopenharmony_ci	u64	bytes;
18562306a36Sopenharmony_ci
18662306a36Sopenharmony_ci	u32	ack_drops;
18762306a36Sopenharmony_ci
18862306a36Sopenharmony_ci	/* moving averages */
18962306a36Sopenharmony_ci	u64 avge_delay;
19062306a36Sopenharmony_ci	u64 peak_delay;
19162306a36Sopenharmony_ci	u64 base_delay;
19262306a36Sopenharmony_ci
19362306a36Sopenharmony_ci	/* hash function stats */
19462306a36Sopenharmony_ci	u32	way_directs;
19562306a36Sopenharmony_ci	u32	way_hits;
19662306a36Sopenharmony_ci	u32	way_misses;
19762306a36Sopenharmony_ci	u32	way_collisions;
19862306a36Sopenharmony_ci}; /* number of tins is small, so size of this struct doesn't matter much */
19962306a36Sopenharmony_ci
20062306a36Sopenharmony_cistruct cake_sched_data {
20162306a36Sopenharmony_ci	struct tcf_proto __rcu *filter_list; /* optional external classifier */
20262306a36Sopenharmony_ci	struct tcf_block *block;
20362306a36Sopenharmony_ci	struct cake_tin_data *tins;
20462306a36Sopenharmony_ci
20562306a36Sopenharmony_ci	struct cake_heap_entry overflow_heap[CAKE_QUEUES * CAKE_MAX_TINS];
20662306a36Sopenharmony_ci	u16		overflow_timeout;
20762306a36Sopenharmony_ci
20862306a36Sopenharmony_ci	u16		tin_cnt;
20962306a36Sopenharmony_ci	u8		tin_mode;
21062306a36Sopenharmony_ci	u8		flow_mode;
21162306a36Sopenharmony_ci	u8		ack_filter;
21262306a36Sopenharmony_ci	u8		atm_mode;
21362306a36Sopenharmony_ci
21462306a36Sopenharmony_ci	u32		fwmark_mask;
21562306a36Sopenharmony_ci	u16		fwmark_shft;
21662306a36Sopenharmony_ci
21762306a36Sopenharmony_ci	/* time_next = time_this + ((len * rate_ns) >> rate_shft) */
21862306a36Sopenharmony_ci	u16		rate_shft;
21962306a36Sopenharmony_ci	ktime_t		time_next_packet;
22062306a36Sopenharmony_ci	ktime_t		failsafe_next_packet;
22162306a36Sopenharmony_ci	u64		rate_ns;
22262306a36Sopenharmony_ci	u64		rate_bps;
22362306a36Sopenharmony_ci	u16		rate_flags;
22462306a36Sopenharmony_ci	s16		rate_overhead;
22562306a36Sopenharmony_ci	u16		rate_mpu;
22662306a36Sopenharmony_ci	u64		interval;
22762306a36Sopenharmony_ci	u64		target;
22862306a36Sopenharmony_ci
22962306a36Sopenharmony_ci	/* resource tracking */
23062306a36Sopenharmony_ci	u32		buffer_used;
23162306a36Sopenharmony_ci	u32		buffer_max_used;
23262306a36Sopenharmony_ci	u32		buffer_limit;
23362306a36Sopenharmony_ci	u32		buffer_config_limit;
23462306a36Sopenharmony_ci
23562306a36Sopenharmony_ci	/* indices for dequeue */
23662306a36Sopenharmony_ci	u16		cur_tin;
23762306a36Sopenharmony_ci	u16		cur_flow;
23862306a36Sopenharmony_ci
23962306a36Sopenharmony_ci	struct qdisc_watchdog watchdog;
24062306a36Sopenharmony_ci	const u8	*tin_index;
24162306a36Sopenharmony_ci	const u8	*tin_order;
24262306a36Sopenharmony_ci
24362306a36Sopenharmony_ci	/* bandwidth capacity estimate */
24462306a36Sopenharmony_ci	ktime_t		last_packet_time;
24562306a36Sopenharmony_ci	ktime_t		avg_window_begin;
24662306a36Sopenharmony_ci	u64		avg_packet_interval;
24762306a36Sopenharmony_ci	u64		avg_window_bytes;
24862306a36Sopenharmony_ci	u64		avg_peak_bandwidth;
24962306a36Sopenharmony_ci	ktime_t		last_reconfig_time;
25062306a36Sopenharmony_ci
25162306a36Sopenharmony_ci	/* packet length stats */
25262306a36Sopenharmony_ci	u32		avg_netoff;
25362306a36Sopenharmony_ci	u16		max_netlen;
25462306a36Sopenharmony_ci	u16		max_adjlen;
25562306a36Sopenharmony_ci	u16		min_netlen;
25662306a36Sopenharmony_ci	u16		min_adjlen;
25762306a36Sopenharmony_ci};
25862306a36Sopenharmony_ci
25962306a36Sopenharmony_cienum {
26062306a36Sopenharmony_ci	CAKE_FLAG_OVERHEAD	   = BIT(0),
26162306a36Sopenharmony_ci	CAKE_FLAG_AUTORATE_INGRESS = BIT(1),
26262306a36Sopenharmony_ci	CAKE_FLAG_INGRESS	   = BIT(2),
26362306a36Sopenharmony_ci	CAKE_FLAG_WASH		   = BIT(3),
26462306a36Sopenharmony_ci	CAKE_FLAG_SPLIT_GSO	   = BIT(4)
26562306a36Sopenharmony_ci};
26662306a36Sopenharmony_ci
26762306a36Sopenharmony_ci/* COBALT operates the Codel and BLUE algorithms in parallel, in order to
26862306a36Sopenharmony_ci * obtain the best features of each.  Codel is excellent on flows which
26962306a36Sopenharmony_ci * respond to congestion signals in a TCP-like way.  BLUE is more effective on
27062306a36Sopenharmony_ci * unresponsive flows.
27162306a36Sopenharmony_ci */
27262306a36Sopenharmony_ci
27362306a36Sopenharmony_cistruct cobalt_skb_cb {
27462306a36Sopenharmony_ci	ktime_t enqueue_time;
27562306a36Sopenharmony_ci	u32     adjusted_len;
27662306a36Sopenharmony_ci};
27762306a36Sopenharmony_ci
27862306a36Sopenharmony_cistatic u64 us_to_ns(u64 us)
27962306a36Sopenharmony_ci{
28062306a36Sopenharmony_ci	return us * NSEC_PER_USEC;
28162306a36Sopenharmony_ci}
28262306a36Sopenharmony_ci
28362306a36Sopenharmony_cistatic struct cobalt_skb_cb *get_cobalt_cb(const struct sk_buff *skb)
28462306a36Sopenharmony_ci{
28562306a36Sopenharmony_ci	qdisc_cb_private_validate(skb, sizeof(struct cobalt_skb_cb));
28662306a36Sopenharmony_ci	return (struct cobalt_skb_cb *)qdisc_skb_cb(skb)->data;
28762306a36Sopenharmony_ci}
28862306a36Sopenharmony_ci
28962306a36Sopenharmony_cistatic ktime_t cobalt_get_enqueue_time(const struct sk_buff *skb)
29062306a36Sopenharmony_ci{
29162306a36Sopenharmony_ci	return get_cobalt_cb(skb)->enqueue_time;
29262306a36Sopenharmony_ci}
29362306a36Sopenharmony_ci
29462306a36Sopenharmony_cistatic void cobalt_set_enqueue_time(struct sk_buff *skb,
29562306a36Sopenharmony_ci				    ktime_t now)
29662306a36Sopenharmony_ci{
29762306a36Sopenharmony_ci	get_cobalt_cb(skb)->enqueue_time = now;
29862306a36Sopenharmony_ci}
29962306a36Sopenharmony_ci
30062306a36Sopenharmony_cistatic u16 quantum_div[CAKE_QUEUES + 1] = {0};
30162306a36Sopenharmony_ci
30262306a36Sopenharmony_ci/* Diffserv lookup tables */
30362306a36Sopenharmony_ci
30462306a36Sopenharmony_cistatic const u8 precedence[] = {
30562306a36Sopenharmony_ci	0, 0, 0, 0, 0, 0, 0, 0,
30662306a36Sopenharmony_ci	1, 1, 1, 1, 1, 1, 1, 1,
30762306a36Sopenharmony_ci	2, 2, 2, 2, 2, 2, 2, 2,
30862306a36Sopenharmony_ci	3, 3, 3, 3, 3, 3, 3, 3,
30962306a36Sopenharmony_ci	4, 4, 4, 4, 4, 4, 4, 4,
31062306a36Sopenharmony_ci	5, 5, 5, 5, 5, 5, 5, 5,
31162306a36Sopenharmony_ci	6, 6, 6, 6, 6, 6, 6, 6,
31262306a36Sopenharmony_ci	7, 7, 7, 7, 7, 7, 7, 7,
31362306a36Sopenharmony_ci};
31462306a36Sopenharmony_ci
31562306a36Sopenharmony_cistatic const u8 diffserv8[] = {
31662306a36Sopenharmony_ci	2, 0, 1, 2, 4, 2, 2, 2,
31762306a36Sopenharmony_ci	1, 2, 1, 2, 1, 2, 1, 2,
31862306a36Sopenharmony_ci	5, 2, 4, 2, 4, 2, 4, 2,
31962306a36Sopenharmony_ci	3, 2, 3, 2, 3, 2, 3, 2,
32062306a36Sopenharmony_ci	6, 2, 3, 2, 3, 2, 3, 2,
32162306a36Sopenharmony_ci	6, 2, 2, 2, 6, 2, 6, 2,
32262306a36Sopenharmony_ci	7, 2, 2, 2, 2, 2, 2, 2,
32362306a36Sopenharmony_ci	7, 2, 2, 2, 2, 2, 2, 2,
32462306a36Sopenharmony_ci};
32562306a36Sopenharmony_ci
32662306a36Sopenharmony_cistatic const u8 diffserv4[] = {
32762306a36Sopenharmony_ci	0, 1, 0, 0, 2, 0, 0, 0,
32862306a36Sopenharmony_ci	1, 0, 0, 0, 0, 0, 0, 0,
32962306a36Sopenharmony_ci	2, 0, 2, 0, 2, 0, 2, 0,
33062306a36Sopenharmony_ci	2, 0, 2, 0, 2, 0, 2, 0,
33162306a36Sopenharmony_ci	3, 0, 2, 0, 2, 0, 2, 0,
33262306a36Sopenharmony_ci	3, 0, 0, 0, 3, 0, 3, 0,
33362306a36Sopenharmony_ci	3, 0, 0, 0, 0, 0, 0, 0,
33462306a36Sopenharmony_ci	3, 0, 0, 0, 0, 0, 0, 0,
33562306a36Sopenharmony_ci};
33662306a36Sopenharmony_ci
33762306a36Sopenharmony_cistatic const u8 diffserv3[] = {
33862306a36Sopenharmony_ci	0, 1, 0, 0, 2, 0, 0, 0,
33962306a36Sopenharmony_ci	1, 0, 0, 0, 0, 0, 0, 0,
34062306a36Sopenharmony_ci	0, 0, 0, 0, 0, 0, 0, 0,
34162306a36Sopenharmony_ci	0, 0, 0, 0, 0, 0, 0, 0,
34262306a36Sopenharmony_ci	0, 0, 0, 0, 0, 0, 0, 0,
34362306a36Sopenharmony_ci	0, 0, 0, 0, 2, 0, 2, 0,
34462306a36Sopenharmony_ci	2, 0, 0, 0, 0, 0, 0, 0,
34562306a36Sopenharmony_ci	2, 0, 0, 0, 0, 0, 0, 0,
34662306a36Sopenharmony_ci};
34762306a36Sopenharmony_ci
34862306a36Sopenharmony_cistatic const u8 besteffort[] = {
34962306a36Sopenharmony_ci	0, 0, 0, 0, 0, 0, 0, 0,
35062306a36Sopenharmony_ci	0, 0, 0, 0, 0, 0, 0, 0,
35162306a36Sopenharmony_ci	0, 0, 0, 0, 0, 0, 0, 0,
35262306a36Sopenharmony_ci	0, 0, 0, 0, 0, 0, 0, 0,
35362306a36Sopenharmony_ci	0, 0, 0, 0, 0, 0, 0, 0,
35462306a36Sopenharmony_ci	0, 0, 0, 0, 0, 0, 0, 0,
35562306a36Sopenharmony_ci	0, 0, 0, 0, 0, 0, 0, 0,
35662306a36Sopenharmony_ci	0, 0, 0, 0, 0, 0, 0, 0,
35762306a36Sopenharmony_ci};
35862306a36Sopenharmony_ci
35962306a36Sopenharmony_ci/* tin priority order for stats dumping */
36062306a36Sopenharmony_ci
36162306a36Sopenharmony_cistatic const u8 normal_order[] = {0, 1, 2, 3, 4, 5, 6, 7};
36262306a36Sopenharmony_cistatic const u8 bulk_order[] = {1, 0, 2, 3};
36362306a36Sopenharmony_ci
36462306a36Sopenharmony_ci#define REC_INV_SQRT_CACHE (16)
36562306a36Sopenharmony_cistatic u32 cobalt_rec_inv_sqrt_cache[REC_INV_SQRT_CACHE] = {0};
36662306a36Sopenharmony_ci
36762306a36Sopenharmony_ci/* http://en.wikipedia.org/wiki/Methods_of_computing_square_roots
36862306a36Sopenharmony_ci * new_invsqrt = (invsqrt / 2) * (3 - count * invsqrt^2)
36962306a36Sopenharmony_ci *
37062306a36Sopenharmony_ci * Here, invsqrt is a fixed point number (< 1.0), 32bit mantissa, aka Q0.32
37162306a36Sopenharmony_ci */
37262306a36Sopenharmony_ci
37362306a36Sopenharmony_cistatic void cobalt_newton_step(struct cobalt_vars *vars)
37462306a36Sopenharmony_ci{
37562306a36Sopenharmony_ci	u32 invsqrt, invsqrt2;
37662306a36Sopenharmony_ci	u64 val;
37762306a36Sopenharmony_ci
37862306a36Sopenharmony_ci	invsqrt = vars->rec_inv_sqrt;
37962306a36Sopenharmony_ci	invsqrt2 = ((u64)invsqrt * invsqrt) >> 32;
38062306a36Sopenharmony_ci	val = (3LL << 32) - ((u64)vars->count * invsqrt2);
38162306a36Sopenharmony_ci
38262306a36Sopenharmony_ci	val >>= 2; /* avoid overflow in following multiply */
38362306a36Sopenharmony_ci	val = (val * invsqrt) >> (32 - 2 + 1);
38462306a36Sopenharmony_ci
38562306a36Sopenharmony_ci	vars->rec_inv_sqrt = val;
38662306a36Sopenharmony_ci}
38762306a36Sopenharmony_ci
38862306a36Sopenharmony_cistatic void cobalt_invsqrt(struct cobalt_vars *vars)
38962306a36Sopenharmony_ci{
39062306a36Sopenharmony_ci	if (vars->count < REC_INV_SQRT_CACHE)
39162306a36Sopenharmony_ci		vars->rec_inv_sqrt = cobalt_rec_inv_sqrt_cache[vars->count];
39262306a36Sopenharmony_ci	else
39362306a36Sopenharmony_ci		cobalt_newton_step(vars);
39462306a36Sopenharmony_ci}
39562306a36Sopenharmony_ci
39662306a36Sopenharmony_ci/* There is a big difference in timing between the accurate values placed in
39762306a36Sopenharmony_ci * the cache and the approximations given by a single Newton step for small
39862306a36Sopenharmony_ci * count values, particularly when stepping from count 1 to 2 or vice versa.
39962306a36Sopenharmony_ci * Above 16, a single Newton step gives sufficient accuracy in either
40062306a36Sopenharmony_ci * direction, given the precision stored.
40162306a36Sopenharmony_ci *
40262306a36Sopenharmony_ci * The magnitude of the error when stepping up to count 2 is such as to give
40362306a36Sopenharmony_ci * the value that *should* have been produced at count 4.
40462306a36Sopenharmony_ci */
40562306a36Sopenharmony_ci
40662306a36Sopenharmony_cistatic void cobalt_cache_init(void)
40762306a36Sopenharmony_ci{
40862306a36Sopenharmony_ci	struct cobalt_vars v;
40962306a36Sopenharmony_ci
41062306a36Sopenharmony_ci	memset(&v, 0, sizeof(v));
41162306a36Sopenharmony_ci	v.rec_inv_sqrt = ~0U;
41262306a36Sopenharmony_ci	cobalt_rec_inv_sqrt_cache[0] = v.rec_inv_sqrt;
41362306a36Sopenharmony_ci
41462306a36Sopenharmony_ci	for (v.count = 1; v.count < REC_INV_SQRT_CACHE; v.count++) {
41562306a36Sopenharmony_ci		cobalt_newton_step(&v);
41662306a36Sopenharmony_ci		cobalt_newton_step(&v);
41762306a36Sopenharmony_ci		cobalt_newton_step(&v);
41862306a36Sopenharmony_ci		cobalt_newton_step(&v);
41962306a36Sopenharmony_ci
42062306a36Sopenharmony_ci		cobalt_rec_inv_sqrt_cache[v.count] = v.rec_inv_sqrt;
42162306a36Sopenharmony_ci	}
42262306a36Sopenharmony_ci}
42362306a36Sopenharmony_ci
42462306a36Sopenharmony_cistatic void cobalt_vars_init(struct cobalt_vars *vars)
42562306a36Sopenharmony_ci{
42662306a36Sopenharmony_ci	memset(vars, 0, sizeof(*vars));
42762306a36Sopenharmony_ci
42862306a36Sopenharmony_ci	if (!cobalt_rec_inv_sqrt_cache[0]) {
42962306a36Sopenharmony_ci		cobalt_cache_init();
43062306a36Sopenharmony_ci		cobalt_rec_inv_sqrt_cache[0] = ~0;
43162306a36Sopenharmony_ci	}
43262306a36Sopenharmony_ci}
43362306a36Sopenharmony_ci
43462306a36Sopenharmony_ci/* CoDel control_law is t + interval/sqrt(count)
43562306a36Sopenharmony_ci * We maintain in rec_inv_sqrt the reciprocal value of sqrt(count) to avoid
43662306a36Sopenharmony_ci * both sqrt() and divide operation.
43762306a36Sopenharmony_ci */
43862306a36Sopenharmony_cistatic ktime_t cobalt_control(ktime_t t,
43962306a36Sopenharmony_ci			      u64 interval,
44062306a36Sopenharmony_ci			      u32 rec_inv_sqrt)
44162306a36Sopenharmony_ci{
44262306a36Sopenharmony_ci	return ktime_add_ns(t, reciprocal_scale(interval,
44362306a36Sopenharmony_ci						rec_inv_sqrt));
44462306a36Sopenharmony_ci}
44562306a36Sopenharmony_ci
44662306a36Sopenharmony_ci/* Call this when a packet had to be dropped due to queue overflow.  Returns
44762306a36Sopenharmony_ci * true if the BLUE state was quiescent before but active after this call.
44862306a36Sopenharmony_ci */
44962306a36Sopenharmony_cistatic bool cobalt_queue_full(struct cobalt_vars *vars,
45062306a36Sopenharmony_ci			      struct cobalt_params *p,
45162306a36Sopenharmony_ci			      ktime_t now)
45262306a36Sopenharmony_ci{
45362306a36Sopenharmony_ci	bool up = false;
45462306a36Sopenharmony_ci
45562306a36Sopenharmony_ci	if (ktime_to_ns(ktime_sub(now, vars->blue_timer)) > p->target) {
45662306a36Sopenharmony_ci		up = !vars->p_drop;
45762306a36Sopenharmony_ci		vars->p_drop += p->p_inc;
45862306a36Sopenharmony_ci		if (vars->p_drop < p->p_inc)
45962306a36Sopenharmony_ci			vars->p_drop = ~0;
46062306a36Sopenharmony_ci		vars->blue_timer = now;
46162306a36Sopenharmony_ci	}
46262306a36Sopenharmony_ci	vars->dropping = true;
46362306a36Sopenharmony_ci	vars->drop_next = now;
46462306a36Sopenharmony_ci	if (!vars->count)
46562306a36Sopenharmony_ci		vars->count = 1;
46662306a36Sopenharmony_ci
46762306a36Sopenharmony_ci	return up;
46862306a36Sopenharmony_ci}
46962306a36Sopenharmony_ci
47062306a36Sopenharmony_ci/* Call this when the queue was serviced but turned out to be empty.  Returns
47162306a36Sopenharmony_ci * true if the BLUE state was active before but quiescent after this call.
47262306a36Sopenharmony_ci */
47362306a36Sopenharmony_cistatic bool cobalt_queue_empty(struct cobalt_vars *vars,
47462306a36Sopenharmony_ci			       struct cobalt_params *p,
47562306a36Sopenharmony_ci			       ktime_t now)
47662306a36Sopenharmony_ci{
47762306a36Sopenharmony_ci	bool down = false;
47862306a36Sopenharmony_ci
47962306a36Sopenharmony_ci	if (vars->p_drop &&
48062306a36Sopenharmony_ci	    ktime_to_ns(ktime_sub(now, vars->blue_timer)) > p->target) {
48162306a36Sopenharmony_ci		if (vars->p_drop < p->p_dec)
48262306a36Sopenharmony_ci			vars->p_drop = 0;
48362306a36Sopenharmony_ci		else
48462306a36Sopenharmony_ci			vars->p_drop -= p->p_dec;
48562306a36Sopenharmony_ci		vars->blue_timer = now;
48662306a36Sopenharmony_ci		down = !vars->p_drop;
48762306a36Sopenharmony_ci	}
48862306a36Sopenharmony_ci	vars->dropping = false;
48962306a36Sopenharmony_ci
49062306a36Sopenharmony_ci	if (vars->count && ktime_to_ns(ktime_sub(now, vars->drop_next)) >= 0) {
49162306a36Sopenharmony_ci		vars->count--;
49262306a36Sopenharmony_ci		cobalt_invsqrt(vars);
49362306a36Sopenharmony_ci		vars->drop_next = cobalt_control(vars->drop_next,
49462306a36Sopenharmony_ci						 p->interval,
49562306a36Sopenharmony_ci						 vars->rec_inv_sqrt);
49662306a36Sopenharmony_ci	}
49762306a36Sopenharmony_ci
49862306a36Sopenharmony_ci	return down;
49962306a36Sopenharmony_ci}
50062306a36Sopenharmony_ci
50162306a36Sopenharmony_ci/* Call this with a freshly dequeued packet for possible congestion marking.
50262306a36Sopenharmony_ci * Returns true as an instruction to drop the packet, false for delivery.
50362306a36Sopenharmony_ci */
50462306a36Sopenharmony_cistatic bool cobalt_should_drop(struct cobalt_vars *vars,
50562306a36Sopenharmony_ci			       struct cobalt_params *p,
50662306a36Sopenharmony_ci			       ktime_t now,
50762306a36Sopenharmony_ci			       struct sk_buff *skb,
50862306a36Sopenharmony_ci			       u32 bulk_flows)
50962306a36Sopenharmony_ci{
51062306a36Sopenharmony_ci	bool next_due, over_target, drop = false;
51162306a36Sopenharmony_ci	ktime_t schedule;
51262306a36Sopenharmony_ci	u64 sojourn;
51362306a36Sopenharmony_ci
51462306a36Sopenharmony_ci/* The 'schedule' variable records, in its sign, whether 'now' is before or
51562306a36Sopenharmony_ci * after 'drop_next'.  This allows 'drop_next' to be updated before the next
51662306a36Sopenharmony_ci * scheduling decision is actually branched, without destroying that
51762306a36Sopenharmony_ci * information.  Similarly, the first 'schedule' value calculated is preserved
51862306a36Sopenharmony_ci * in the boolean 'next_due'.
51962306a36Sopenharmony_ci *
52062306a36Sopenharmony_ci * As for 'drop_next', we take advantage of the fact that 'interval' is both
52162306a36Sopenharmony_ci * the delay between first exceeding 'target' and the first signalling event,
52262306a36Sopenharmony_ci * *and* the scaling factor for the signalling frequency.  It's therefore very
52362306a36Sopenharmony_ci * natural to use a single mechanism for both purposes, and eliminates a
52462306a36Sopenharmony_ci * significant amount of reference Codel's spaghetti code.  To help with this,
52562306a36Sopenharmony_ci * both the '0' and '1' entries in the invsqrt cache are 0xFFFFFFFF, as close
52662306a36Sopenharmony_ci * as possible to 1.0 in fixed-point.
52762306a36Sopenharmony_ci */
52862306a36Sopenharmony_ci
52962306a36Sopenharmony_ci	sojourn = ktime_to_ns(ktime_sub(now, cobalt_get_enqueue_time(skb)));
53062306a36Sopenharmony_ci	schedule = ktime_sub(now, vars->drop_next);
53162306a36Sopenharmony_ci	over_target = sojourn > p->target &&
53262306a36Sopenharmony_ci		      sojourn > p->mtu_time * bulk_flows * 2 &&
53362306a36Sopenharmony_ci		      sojourn > p->mtu_time * 4;
53462306a36Sopenharmony_ci	next_due = vars->count && ktime_to_ns(schedule) >= 0;
53562306a36Sopenharmony_ci
53662306a36Sopenharmony_ci	vars->ecn_marked = false;
53762306a36Sopenharmony_ci
53862306a36Sopenharmony_ci	if (over_target) {
53962306a36Sopenharmony_ci		if (!vars->dropping) {
54062306a36Sopenharmony_ci			vars->dropping = true;
54162306a36Sopenharmony_ci			vars->drop_next = cobalt_control(now,
54262306a36Sopenharmony_ci							 p->interval,
54362306a36Sopenharmony_ci							 vars->rec_inv_sqrt);
54462306a36Sopenharmony_ci		}
54562306a36Sopenharmony_ci		if (!vars->count)
54662306a36Sopenharmony_ci			vars->count = 1;
54762306a36Sopenharmony_ci	} else if (vars->dropping) {
54862306a36Sopenharmony_ci		vars->dropping = false;
54962306a36Sopenharmony_ci	}
55062306a36Sopenharmony_ci
55162306a36Sopenharmony_ci	if (next_due && vars->dropping) {
55262306a36Sopenharmony_ci		/* Use ECN mark if possible, otherwise drop */
55362306a36Sopenharmony_ci		drop = !(vars->ecn_marked = INET_ECN_set_ce(skb));
55462306a36Sopenharmony_ci
55562306a36Sopenharmony_ci		vars->count++;
55662306a36Sopenharmony_ci		if (!vars->count)
55762306a36Sopenharmony_ci			vars->count--;
55862306a36Sopenharmony_ci		cobalt_invsqrt(vars);
55962306a36Sopenharmony_ci		vars->drop_next = cobalt_control(vars->drop_next,
56062306a36Sopenharmony_ci						 p->interval,
56162306a36Sopenharmony_ci						 vars->rec_inv_sqrt);
56262306a36Sopenharmony_ci		schedule = ktime_sub(now, vars->drop_next);
56362306a36Sopenharmony_ci	} else {
56462306a36Sopenharmony_ci		while (next_due) {
56562306a36Sopenharmony_ci			vars->count--;
56662306a36Sopenharmony_ci			cobalt_invsqrt(vars);
56762306a36Sopenharmony_ci			vars->drop_next = cobalt_control(vars->drop_next,
56862306a36Sopenharmony_ci							 p->interval,
56962306a36Sopenharmony_ci							 vars->rec_inv_sqrt);
57062306a36Sopenharmony_ci			schedule = ktime_sub(now, vars->drop_next);
57162306a36Sopenharmony_ci			next_due = vars->count && ktime_to_ns(schedule) >= 0;
57262306a36Sopenharmony_ci		}
57362306a36Sopenharmony_ci	}
57462306a36Sopenharmony_ci
57562306a36Sopenharmony_ci	/* Simple BLUE implementation.  Lack of ECN is deliberate. */
57662306a36Sopenharmony_ci	if (vars->p_drop)
57762306a36Sopenharmony_ci		drop |= (get_random_u32() < vars->p_drop);
57862306a36Sopenharmony_ci
57962306a36Sopenharmony_ci	/* Overload the drop_next field as an activity timeout */
58062306a36Sopenharmony_ci	if (!vars->count)
58162306a36Sopenharmony_ci		vars->drop_next = ktime_add_ns(now, p->interval);
58262306a36Sopenharmony_ci	else if (ktime_to_ns(schedule) > 0 && !drop)
58362306a36Sopenharmony_ci		vars->drop_next = now;
58462306a36Sopenharmony_ci
58562306a36Sopenharmony_ci	return drop;
58662306a36Sopenharmony_ci}
58762306a36Sopenharmony_ci
58862306a36Sopenharmony_cistatic bool cake_update_flowkeys(struct flow_keys *keys,
58962306a36Sopenharmony_ci				 const struct sk_buff *skb)
59062306a36Sopenharmony_ci{
59162306a36Sopenharmony_ci#if IS_ENABLED(CONFIG_NF_CONNTRACK)
59262306a36Sopenharmony_ci	struct nf_conntrack_tuple tuple = {};
59362306a36Sopenharmony_ci	bool rev = !skb->_nfct, upd = false;
59462306a36Sopenharmony_ci	__be32 ip;
59562306a36Sopenharmony_ci
59662306a36Sopenharmony_ci	if (skb_protocol(skb, true) != htons(ETH_P_IP))
59762306a36Sopenharmony_ci		return false;
59862306a36Sopenharmony_ci
59962306a36Sopenharmony_ci	if (!nf_ct_get_tuple_skb(&tuple, skb))
60062306a36Sopenharmony_ci		return false;
60162306a36Sopenharmony_ci
60262306a36Sopenharmony_ci	ip = rev ? tuple.dst.u3.ip : tuple.src.u3.ip;
60362306a36Sopenharmony_ci	if (ip != keys->addrs.v4addrs.src) {
60462306a36Sopenharmony_ci		keys->addrs.v4addrs.src = ip;
60562306a36Sopenharmony_ci		upd = true;
60662306a36Sopenharmony_ci	}
60762306a36Sopenharmony_ci	ip = rev ? tuple.src.u3.ip : tuple.dst.u3.ip;
60862306a36Sopenharmony_ci	if (ip != keys->addrs.v4addrs.dst) {
60962306a36Sopenharmony_ci		keys->addrs.v4addrs.dst = ip;
61062306a36Sopenharmony_ci		upd = true;
61162306a36Sopenharmony_ci	}
61262306a36Sopenharmony_ci
61362306a36Sopenharmony_ci	if (keys->ports.ports) {
61462306a36Sopenharmony_ci		__be16 port;
61562306a36Sopenharmony_ci
61662306a36Sopenharmony_ci		port = rev ? tuple.dst.u.all : tuple.src.u.all;
61762306a36Sopenharmony_ci		if (port != keys->ports.src) {
61862306a36Sopenharmony_ci			keys->ports.src = port;
61962306a36Sopenharmony_ci			upd = true;
62062306a36Sopenharmony_ci		}
62162306a36Sopenharmony_ci		port = rev ? tuple.src.u.all : tuple.dst.u.all;
62262306a36Sopenharmony_ci		if (port != keys->ports.dst) {
62362306a36Sopenharmony_ci			port = keys->ports.dst;
62462306a36Sopenharmony_ci			upd = true;
62562306a36Sopenharmony_ci		}
62662306a36Sopenharmony_ci	}
62762306a36Sopenharmony_ci	return upd;
62862306a36Sopenharmony_ci#else
62962306a36Sopenharmony_ci	return false;
63062306a36Sopenharmony_ci#endif
63162306a36Sopenharmony_ci}
63262306a36Sopenharmony_ci
63362306a36Sopenharmony_ci/* Cake has several subtle multiple bit settings. In these cases you
63462306a36Sopenharmony_ci *  would be matching triple isolate mode as well.
63562306a36Sopenharmony_ci */
63662306a36Sopenharmony_ci
63762306a36Sopenharmony_cistatic bool cake_dsrc(int flow_mode)
63862306a36Sopenharmony_ci{
63962306a36Sopenharmony_ci	return (flow_mode & CAKE_FLOW_DUAL_SRC) == CAKE_FLOW_DUAL_SRC;
64062306a36Sopenharmony_ci}
64162306a36Sopenharmony_ci
64262306a36Sopenharmony_cistatic bool cake_ddst(int flow_mode)
64362306a36Sopenharmony_ci{
64462306a36Sopenharmony_ci	return (flow_mode & CAKE_FLOW_DUAL_DST) == CAKE_FLOW_DUAL_DST;
64562306a36Sopenharmony_ci}
64662306a36Sopenharmony_ci
64762306a36Sopenharmony_cistatic u32 cake_hash(struct cake_tin_data *q, const struct sk_buff *skb,
64862306a36Sopenharmony_ci		     int flow_mode, u16 flow_override, u16 host_override)
64962306a36Sopenharmony_ci{
65062306a36Sopenharmony_ci	bool hash_flows = (!flow_override && !!(flow_mode & CAKE_FLOW_FLOWS));
65162306a36Sopenharmony_ci	bool hash_hosts = (!host_override && !!(flow_mode & CAKE_FLOW_HOSTS));
65262306a36Sopenharmony_ci	bool nat_enabled = !!(flow_mode & CAKE_FLOW_NAT_FLAG);
65362306a36Sopenharmony_ci	u32 flow_hash = 0, srchost_hash = 0, dsthost_hash = 0;
65462306a36Sopenharmony_ci	u16 reduced_hash, srchost_idx, dsthost_idx;
65562306a36Sopenharmony_ci	struct flow_keys keys, host_keys;
65662306a36Sopenharmony_ci	bool use_skbhash = skb->l4_hash;
65762306a36Sopenharmony_ci
65862306a36Sopenharmony_ci	if (unlikely(flow_mode == CAKE_FLOW_NONE))
65962306a36Sopenharmony_ci		return 0;
66062306a36Sopenharmony_ci
66162306a36Sopenharmony_ci	/* If both overrides are set, or we can use the SKB hash and nat mode is
66262306a36Sopenharmony_ci	 * disabled, we can skip packet dissection entirely. If nat mode is
66362306a36Sopenharmony_ci	 * enabled there's another check below after doing the conntrack lookup.
66462306a36Sopenharmony_ci	 */
66562306a36Sopenharmony_ci	if ((!hash_flows || (use_skbhash && !nat_enabled)) && !hash_hosts)
66662306a36Sopenharmony_ci		goto skip_hash;
66762306a36Sopenharmony_ci
66862306a36Sopenharmony_ci	skb_flow_dissect_flow_keys(skb, &keys,
66962306a36Sopenharmony_ci				   FLOW_DISSECTOR_F_STOP_AT_FLOW_LABEL);
67062306a36Sopenharmony_ci
67162306a36Sopenharmony_ci	/* Don't use the SKB hash if we change the lookup keys from conntrack */
67262306a36Sopenharmony_ci	if (nat_enabled && cake_update_flowkeys(&keys, skb))
67362306a36Sopenharmony_ci		use_skbhash = false;
67462306a36Sopenharmony_ci
67562306a36Sopenharmony_ci	/* If we can still use the SKB hash and don't need the host hash, we can
67662306a36Sopenharmony_ci	 * skip the rest of the hashing procedure
67762306a36Sopenharmony_ci	 */
67862306a36Sopenharmony_ci	if (use_skbhash && !hash_hosts)
67962306a36Sopenharmony_ci		goto skip_hash;
68062306a36Sopenharmony_ci
68162306a36Sopenharmony_ci	/* flow_hash_from_keys() sorts the addresses by value, so we have
68262306a36Sopenharmony_ci	 * to preserve their order in a separate data structure to treat
68362306a36Sopenharmony_ci	 * src and dst host addresses as independently selectable.
68462306a36Sopenharmony_ci	 */
68562306a36Sopenharmony_ci	host_keys = keys;
68662306a36Sopenharmony_ci	host_keys.ports.ports     = 0;
68762306a36Sopenharmony_ci	host_keys.basic.ip_proto  = 0;
68862306a36Sopenharmony_ci	host_keys.keyid.keyid     = 0;
68962306a36Sopenharmony_ci	host_keys.tags.flow_label = 0;
69062306a36Sopenharmony_ci
69162306a36Sopenharmony_ci	switch (host_keys.control.addr_type) {
69262306a36Sopenharmony_ci	case FLOW_DISSECTOR_KEY_IPV4_ADDRS:
69362306a36Sopenharmony_ci		host_keys.addrs.v4addrs.src = 0;
69462306a36Sopenharmony_ci		dsthost_hash = flow_hash_from_keys(&host_keys);
69562306a36Sopenharmony_ci		host_keys.addrs.v4addrs.src = keys.addrs.v4addrs.src;
69662306a36Sopenharmony_ci		host_keys.addrs.v4addrs.dst = 0;
69762306a36Sopenharmony_ci		srchost_hash = flow_hash_from_keys(&host_keys);
69862306a36Sopenharmony_ci		break;
69962306a36Sopenharmony_ci
70062306a36Sopenharmony_ci	case FLOW_DISSECTOR_KEY_IPV6_ADDRS:
70162306a36Sopenharmony_ci		memset(&host_keys.addrs.v6addrs.src, 0,
70262306a36Sopenharmony_ci		       sizeof(host_keys.addrs.v6addrs.src));
70362306a36Sopenharmony_ci		dsthost_hash = flow_hash_from_keys(&host_keys);
70462306a36Sopenharmony_ci		host_keys.addrs.v6addrs.src = keys.addrs.v6addrs.src;
70562306a36Sopenharmony_ci		memset(&host_keys.addrs.v6addrs.dst, 0,
70662306a36Sopenharmony_ci		       sizeof(host_keys.addrs.v6addrs.dst));
70762306a36Sopenharmony_ci		srchost_hash = flow_hash_from_keys(&host_keys);
70862306a36Sopenharmony_ci		break;
70962306a36Sopenharmony_ci
71062306a36Sopenharmony_ci	default:
71162306a36Sopenharmony_ci		dsthost_hash = 0;
71262306a36Sopenharmony_ci		srchost_hash = 0;
71362306a36Sopenharmony_ci	}
71462306a36Sopenharmony_ci
71562306a36Sopenharmony_ci	/* This *must* be after the above switch, since as a
71662306a36Sopenharmony_ci	 * side-effect it sorts the src and dst addresses.
71762306a36Sopenharmony_ci	 */
71862306a36Sopenharmony_ci	if (hash_flows && !use_skbhash)
71962306a36Sopenharmony_ci		flow_hash = flow_hash_from_keys(&keys);
72062306a36Sopenharmony_ci
72162306a36Sopenharmony_ciskip_hash:
72262306a36Sopenharmony_ci	if (flow_override)
72362306a36Sopenharmony_ci		flow_hash = flow_override - 1;
72462306a36Sopenharmony_ci	else if (use_skbhash && (flow_mode & CAKE_FLOW_FLOWS))
72562306a36Sopenharmony_ci		flow_hash = skb->hash;
72662306a36Sopenharmony_ci	if (host_override) {
72762306a36Sopenharmony_ci		dsthost_hash = host_override - 1;
72862306a36Sopenharmony_ci		srchost_hash = host_override - 1;
72962306a36Sopenharmony_ci	}
73062306a36Sopenharmony_ci
73162306a36Sopenharmony_ci	if (!(flow_mode & CAKE_FLOW_FLOWS)) {
73262306a36Sopenharmony_ci		if (flow_mode & CAKE_FLOW_SRC_IP)
73362306a36Sopenharmony_ci			flow_hash ^= srchost_hash;
73462306a36Sopenharmony_ci
73562306a36Sopenharmony_ci		if (flow_mode & CAKE_FLOW_DST_IP)
73662306a36Sopenharmony_ci			flow_hash ^= dsthost_hash;
73762306a36Sopenharmony_ci	}
73862306a36Sopenharmony_ci
73962306a36Sopenharmony_ci	reduced_hash = flow_hash % CAKE_QUEUES;
74062306a36Sopenharmony_ci
74162306a36Sopenharmony_ci	/* set-associative hashing */
74262306a36Sopenharmony_ci	/* fast path if no hash collision (direct lookup succeeds) */
74362306a36Sopenharmony_ci	if (likely(q->tags[reduced_hash] == flow_hash &&
74462306a36Sopenharmony_ci		   q->flows[reduced_hash].set)) {
74562306a36Sopenharmony_ci		q->way_directs++;
74662306a36Sopenharmony_ci	} else {
74762306a36Sopenharmony_ci		u32 inner_hash = reduced_hash % CAKE_SET_WAYS;
74862306a36Sopenharmony_ci		u32 outer_hash = reduced_hash - inner_hash;
74962306a36Sopenharmony_ci		bool allocate_src = false;
75062306a36Sopenharmony_ci		bool allocate_dst = false;
75162306a36Sopenharmony_ci		u32 i, k;
75262306a36Sopenharmony_ci
75362306a36Sopenharmony_ci		/* check if any active queue in the set is reserved for
75462306a36Sopenharmony_ci		 * this flow.
75562306a36Sopenharmony_ci		 */
75662306a36Sopenharmony_ci		for (i = 0, k = inner_hash; i < CAKE_SET_WAYS;
75762306a36Sopenharmony_ci		     i++, k = (k + 1) % CAKE_SET_WAYS) {
75862306a36Sopenharmony_ci			if (q->tags[outer_hash + k] == flow_hash) {
75962306a36Sopenharmony_ci				if (i)
76062306a36Sopenharmony_ci					q->way_hits++;
76162306a36Sopenharmony_ci
76262306a36Sopenharmony_ci				if (!q->flows[outer_hash + k].set) {
76362306a36Sopenharmony_ci					/* need to increment host refcnts */
76462306a36Sopenharmony_ci					allocate_src = cake_dsrc(flow_mode);
76562306a36Sopenharmony_ci					allocate_dst = cake_ddst(flow_mode);
76662306a36Sopenharmony_ci				}
76762306a36Sopenharmony_ci
76862306a36Sopenharmony_ci				goto found;
76962306a36Sopenharmony_ci			}
77062306a36Sopenharmony_ci		}
77162306a36Sopenharmony_ci
77262306a36Sopenharmony_ci		/* no queue is reserved for this flow, look for an
77362306a36Sopenharmony_ci		 * empty one.
77462306a36Sopenharmony_ci		 */
77562306a36Sopenharmony_ci		for (i = 0; i < CAKE_SET_WAYS;
77662306a36Sopenharmony_ci			 i++, k = (k + 1) % CAKE_SET_WAYS) {
77762306a36Sopenharmony_ci			if (!q->flows[outer_hash + k].set) {
77862306a36Sopenharmony_ci				q->way_misses++;
77962306a36Sopenharmony_ci				allocate_src = cake_dsrc(flow_mode);
78062306a36Sopenharmony_ci				allocate_dst = cake_ddst(flow_mode);
78162306a36Sopenharmony_ci				goto found;
78262306a36Sopenharmony_ci			}
78362306a36Sopenharmony_ci		}
78462306a36Sopenharmony_ci
78562306a36Sopenharmony_ci		/* With no empty queues, default to the original
78662306a36Sopenharmony_ci		 * queue, accept the collision, update the host tags.
78762306a36Sopenharmony_ci		 */
78862306a36Sopenharmony_ci		q->way_collisions++;
78962306a36Sopenharmony_ci		if (q->flows[outer_hash + k].set == CAKE_SET_BULK) {
79062306a36Sopenharmony_ci			q->hosts[q->flows[reduced_hash].srchost].srchost_bulk_flow_count--;
79162306a36Sopenharmony_ci			q->hosts[q->flows[reduced_hash].dsthost].dsthost_bulk_flow_count--;
79262306a36Sopenharmony_ci		}
79362306a36Sopenharmony_ci		allocate_src = cake_dsrc(flow_mode);
79462306a36Sopenharmony_ci		allocate_dst = cake_ddst(flow_mode);
79562306a36Sopenharmony_cifound:
79662306a36Sopenharmony_ci		/* reserve queue for future packets in same flow */
79762306a36Sopenharmony_ci		reduced_hash = outer_hash + k;
79862306a36Sopenharmony_ci		q->tags[reduced_hash] = flow_hash;
79962306a36Sopenharmony_ci
80062306a36Sopenharmony_ci		if (allocate_src) {
80162306a36Sopenharmony_ci			srchost_idx = srchost_hash % CAKE_QUEUES;
80262306a36Sopenharmony_ci			inner_hash = srchost_idx % CAKE_SET_WAYS;
80362306a36Sopenharmony_ci			outer_hash = srchost_idx - inner_hash;
80462306a36Sopenharmony_ci			for (i = 0, k = inner_hash; i < CAKE_SET_WAYS;
80562306a36Sopenharmony_ci				i++, k = (k + 1) % CAKE_SET_WAYS) {
80662306a36Sopenharmony_ci				if (q->hosts[outer_hash + k].srchost_tag ==
80762306a36Sopenharmony_ci				    srchost_hash)
80862306a36Sopenharmony_ci					goto found_src;
80962306a36Sopenharmony_ci			}
81062306a36Sopenharmony_ci			for (i = 0; i < CAKE_SET_WAYS;
81162306a36Sopenharmony_ci				i++, k = (k + 1) % CAKE_SET_WAYS) {
81262306a36Sopenharmony_ci				if (!q->hosts[outer_hash + k].srchost_bulk_flow_count)
81362306a36Sopenharmony_ci					break;
81462306a36Sopenharmony_ci			}
81562306a36Sopenharmony_ci			q->hosts[outer_hash + k].srchost_tag = srchost_hash;
81662306a36Sopenharmony_cifound_src:
81762306a36Sopenharmony_ci			srchost_idx = outer_hash + k;
81862306a36Sopenharmony_ci			if (q->flows[reduced_hash].set == CAKE_SET_BULK)
81962306a36Sopenharmony_ci				q->hosts[srchost_idx].srchost_bulk_flow_count++;
82062306a36Sopenharmony_ci			q->flows[reduced_hash].srchost = srchost_idx;
82162306a36Sopenharmony_ci		}
82262306a36Sopenharmony_ci
82362306a36Sopenharmony_ci		if (allocate_dst) {
82462306a36Sopenharmony_ci			dsthost_idx = dsthost_hash % CAKE_QUEUES;
82562306a36Sopenharmony_ci			inner_hash = dsthost_idx % CAKE_SET_WAYS;
82662306a36Sopenharmony_ci			outer_hash = dsthost_idx - inner_hash;
82762306a36Sopenharmony_ci			for (i = 0, k = inner_hash; i < CAKE_SET_WAYS;
82862306a36Sopenharmony_ci			     i++, k = (k + 1) % CAKE_SET_WAYS) {
82962306a36Sopenharmony_ci				if (q->hosts[outer_hash + k].dsthost_tag ==
83062306a36Sopenharmony_ci				    dsthost_hash)
83162306a36Sopenharmony_ci					goto found_dst;
83262306a36Sopenharmony_ci			}
83362306a36Sopenharmony_ci			for (i = 0; i < CAKE_SET_WAYS;
83462306a36Sopenharmony_ci			     i++, k = (k + 1) % CAKE_SET_WAYS) {
83562306a36Sopenharmony_ci				if (!q->hosts[outer_hash + k].dsthost_bulk_flow_count)
83662306a36Sopenharmony_ci					break;
83762306a36Sopenharmony_ci			}
83862306a36Sopenharmony_ci			q->hosts[outer_hash + k].dsthost_tag = dsthost_hash;
83962306a36Sopenharmony_cifound_dst:
84062306a36Sopenharmony_ci			dsthost_idx = outer_hash + k;
84162306a36Sopenharmony_ci			if (q->flows[reduced_hash].set == CAKE_SET_BULK)
84262306a36Sopenharmony_ci				q->hosts[dsthost_idx].dsthost_bulk_flow_count++;
84362306a36Sopenharmony_ci			q->flows[reduced_hash].dsthost = dsthost_idx;
84462306a36Sopenharmony_ci		}
84562306a36Sopenharmony_ci	}
84662306a36Sopenharmony_ci
84762306a36Sopenharmony_ci	return reduced_hash;
84862306a36Sopenharmony_ci}
84962306a36Sopenharmony_ci
85062306a36Sopenharmony_ci/* helper functions : might be changed when/if skb use a standard list_head */
85162306a36Sopenharmony_ci/* remove one skb from head of slot queue */
85262306a36Sopenharmony_ci
85362306a36Sopenharmony_cistatic struct sk_buff *dequeue_head(struct cake_flow *flow)
85462306a36Sopenharmony_ci{
85562306a36Sopenharmony_ci	struct sk_buff *skb = flow->head;
85662306a36Sopenharmony_ci
85762306a36Sopenharmony_ci	if (skb) {
85862306a36Sopenharmony_ci		flow->head = skb->next;
85962306a36Sopenharmony_ci		skb_mark_not_on_list(skb);
86062306a36Sopenharmony_ci	}
86162306a36Sopenharmony_ci
86262306a36Sopenharmony_ci	return skb;
86362306a36Sopenharmony_ci}
86462306a36Sopenharmony_ci
86562306a36Sopenharmony_ci/* add skb to flow queue (tail add) */
86662306a36Sopenharmony_ci
86762306a36Sopenharmony_cistatic void flow_queue_add(struct cake_flow *flow, struct sk_buff *skb)
86862306a36Sopenharmony_ci{
86962306a36Sopenharmony_ci	if (!flow->head)
87062306a36Sopenharmony_ci		flow->head = skb;
87162306a36Sopenharmony_ci	else
87262306a36Sopenharmony_ci		flow->tail->next = skb;
87362306a36Sopenharmony_ci	flow->tail = skb;
87462306a36Sopenharmony_ci	skb->next = NULL;
87562306a36Sopenharmony_ci}
87662306a36Sopenharmony_ci
87762306a36Sopenharmony_cistatic struct iphdr *cake_get_iphdr(const struct sk_buff *skb,
87862306a36Sopenharmony_ci				    struct ipv6hdr *buf)
87962306a36Sopenharmony_ci{
88062306a36Sopenharmony_ci	unsigned int offset = skb_network_offset(skb);
88162306a36Sopenharmony_ci	struct iphdr *iph;
88262306a36Sopenharmony_ci
88362306a36Sopenharmony_ci	iph = skb_header_pointer(skb, offset, sizeof(struct iphdr), buf);
88462306a36Sopenharmony_ci
88562306a36Sopenharmony_ci	if (!iph)
88662306a36Sopenharmony_ci		return NULL;
88762306a36Sopenharmony_ci
88862306a36Sopenharmony_ci	if (iph->version == 4 && iph->protocol == IPPROTO_IPV6)
88962306a36Sopenharmony_ci		return skb_header_pointer(skb, offset + iph->ihl * 4,
89062306a36Sopenharmony_ci					  sizeof(struct ipv6hdr), buf);
89162306a36Sopenharmony_ci
89262306a36Sopenharmony_ci	else if (iph->version == 4)
89362306a36Sopenharmony_ci		return iph;
89462306a36Sopenharmony_ci
89562306a36Sopenharmony_ci	else if (iph->version == 6)
89662306a36Sopenharmony_ci		return skb_header_pointer(skb, offset, sizeof(struct ipv6hdr),
89762306a36Sopenharmony_ci					  buf);
89862306a36Sopenharmony_ci
89962306a36Sopenharmony_ci	return NULL;
90062306a36Sopenharmony_ci}
90162306a36Sopenharmony_ci
90262306a36Sopenharmony_cistatic struct tcphdr *cake_get_tcphdr(const struct sk_buff *skb,
90362306a36Sopenharmony_ci				      void *buf, unsigned int bufsize)
90462306a36Sopenharmony_ci{
90562306a36Sopenharmony_ci	unsigned int offset = skb_network_offset(skb);
90662306a36Sopenharmony_ci	const struct ipv6hdr *ipv6h;
90762306a36Sopenharmony_ci	const struct tcphdr *tcph;
90862306a36Sopenharmony_ci	const struct iphdr *iph;
90962306a36Sopenharmony_ci	struct ipv6hdr _ipv6h;
91062306a36Sopenharmony_ci	struct tcphdr _tcph;
91162306a36Sopenharmony_ci
91262306a36Sopenharmony_ci	ipv6h = skb_header_pointer(skb, offset, sizeof(_ipv6h), &_ipv6h);
91362306a36Sopenharmony_ci
91462306a36Sopenharmony_ci	if (!ipv6h)
91562306a36Sopenharmony_ci		return NULL;
91662306a36Sopenharmony_ci
91762306a36Sopenharmony_ci	if (ipv6h->version == 4) {
91862306a36Sopenharmony_ci		iph = (struct iphdr *)ipv6h;
91962306a36Sopenharmony_ci		offset += iph->ihl * 4;
92062306a36Sopenharmony_ci
92162306a36Sopenharmony_ci		/* special-case 6in4 tunnelling, as that is a common way to get
92262306a36Sopenharmony_ci		 * v6 connectivity in the home
92362306a36Sopenharmony_ci		 */
92462306a36Sopenharmony_ci		if (iph->protocol == IPPROTO_IPV6) {
92562306a36Sopenharmony_ci			ipv6h = skb_header_pointer(skb, offset,
92662306a36Sopenharmony_ci						   sizeof(_ipv6h), &_ipv6h);
92762306a36Sopenharmony_ci
92862306a36Sopenharmony_ci			if (!ipv6h || ipv6h->nexthdr != IPPROTO_TCP)
92962306a36Sopenharmony_ci				return NULL;
93062306a36Sopenharmony_ci
93162306a36Sopenharmony_ci			offset += sizeof(struct ipv6hdr);
93262306a36Sopenharmony_ci
93362306a36Sopenharmony_ci		} else if (iph->protocol != IPPROTO_TCP) {
93462306a36Sopenharmony_ci			return NULL;
93562306a36Sopenharmony_ci		}
93662306a36Sopenharmony_ci
93762306a36Sopenharmony_ci	} else if (ipv6h->version == 6) {
93862306a36Sopenharmony_ci		if (ipv6h->nexthdr != IPPROTO_TCP)
93962306a36Sopenharmony_ci			return NULL;
94062306a36Sopenharmony_ci
94162306a36Sopenharmony_ci		offset += sizeof(struct ipv6hdr);
94262306a36Sopenharmony_ci	} else {
94362306a36Sopenharmony_ci		return NULL;
94462306a36Sopenharmony_ci	}
94562306a36Sopenharmony_ci
94662306a36Sopenharmony_ci	tcph = skb_header_pointer(skb, offset, sizeof(_tcph), &_tcph);
94762306a36Sopenharmony_ci	if (!tcph || tcph->doff < 5)
94862306a36Sopenharmony_ci		return NULL;
94962306a36Sopenharmony_ci
95062306a36Sopenharmony_ci	return skb_header_pointer(skb, offset,
95162306a36Sopenharmony_ci				  min(__tcp_hdrlen(tcph), bufsize), buf);
95262306a36Sopenharmony_ci}
95362306a36Sopenharmony_ci
95462306a36Sopenharmony_cistatic const void *cake_get_tcpopt(const struct tcphdr *tcph,
95562306a36Sopenharmony_ci				   int code, int *oplen)
95662306a36Sopenharmony_ci{
95762306a36Sopenharmony_ci	/* inspired by tcp_parse_options in tcp_input.c */
95862306a36Sopenharmony_ci	int length = __tcp_hdrlen(tcph) - sizeof(struct tcphdr);
95962306a36Sopenharmony_ci	const u8 *ptr = (const u8 *)(tcph + 1);
96062306a36Sopenharmony_ci
96162306a36Sopenharmony_ci	while (length > 0) {
96262306a36Sopenharmony_ci		int opcode = *ptr++;
96362306a36Sopenharmony_ci		int opsize;
96462306a36Sopenharmony_ci
96562306a36Sopenharmony_ci		if (opcode == TCPOPT_EOL)
96662306a36Sopenharmony_ci			break;
96762306a36Sopenharmony_ci		if (opcode == TCPOPT_NOP) {
96862306a36Sopenharmony_ci			length--;
96962306a36Sopenharmony_ci			continue;
97062306a36Sopenharmony_ci		}
97162306a36Sopenharmony_ci		if (length < 2)
97262306a36Sopenharmony_ci			break;
97362306a36Sopenharmony_ci		opsize = *ptr++;
97462306a36Sopenharmony_ci		if (opsize < 2 || opsize > length)
97562306a36Sopenharmony_ci			break;
97662306a36Sopenharmony_ci
97762306a36Sopenharmony_ci		if (opcode == code) {
97862306a36Sopenharmony_ci			*oplen = opsize;
97962306a36Sopenharmony_ci			return ptr;
98062306a36Sopenharmony_ci		}
98162306a36Sopenharmony_ci
98262306a36Sopenharmony_ci		ptr += opsize - 2;
98362306a36Sopenharmony_ci		length -= opsize;
98462306a36Sopenharmony_ci	}
98562306a36Sopenharmony_ci
98662306a36Sopenharmony_ci	return NULL;
98762306a36Sopenharmony_ci}
98862306a36Sopenharmony_ci
98962306a36Sopenharmony_ci/* Compare two SACK sequences. A sequence is considered greater if it SACKs more
99062306a36Sopenharmony_ci * bytes than the other. In the case where both sequences ACKs bytes that the
99162306a36Sopenharmony_ci * other doesn't, A is considered greater. DSACKs in A also makes A be
99262306a36Sopenharmony_ci * considered greater.
99362306a36Sopenharmony_ci *
99462306a36Sopenharmony_ci * @return -1, 0 or 1 as normal compare functions
99562306a36Sopenharmony_ci */
99662306a36Sopenharmony_cistatic int cake_tcph_sack_compare(const struct tcphdr *tcph_a,
99762306a36Sopenharmony_ci				  const struct tcphdr *tcph_b)
99862306a36Sopenharmony_ci{
99962306a36Sopenharmony_ci	const struct tcp_sack_block_wire *sack_a, *sack_b;
100062306a36Sopenharmony_ci	u32 ack_seq_a = ntohl(tcph_a->ack_seq);
100162306a36Sopenharmony_ci	u32 bytes_a = 0, bytes_b = 0;
100262306a36Sopenharmony_ci	int oplen_a, oplen_b;
100362306a36Sopenharmony_ci	bool first = true;
100462306a36Sopenharmony_ci
100562306a36Sopenharmony_ci	sack_a = cake_get_tcpopt(tcph_a, TCPOPT_SACK, &oplen_a);
100662306a36Sopenharmony_ci	sack_b = cake_get_tcpopt(tcph_b, TCPOPT_SACK, &oplen_b);
100762306a36Sopenharmony_ci
100862306a36Sopenharmony_ci	/* pointers point to option contents */
100962306a36Sopenharmony_ci	oplen_a -= TCPOLEN_SACK_BASE;
101062306a36Sopenharmony_ci	oplen_b -= TCPOLEN_SACK_BASE;
101162306a36Sopenharmony_ci
101262306a36Sopenharmony_ci	if (sack_a && oplen_a >= sizeof(*sack_a) &&
101362306a36Sopenharmony_ci	    (!sack_b || oplen_b < sizeof(*sack_b)))
101462306a36Sopenharmony_ci		return -1;
101562306a36Sopenharmony_ci	else if (sack_b && oplen_b >= sizeof(*sack_b) &&
101662306a36Sopenharmony_ci		 (!sack_a || oplen_a < sizeof(*sack_a)))
101762306a36Sopenharmony_ci		return 1;
101862306a36Sopenharmony_ci	else if ((!sack_a || oplen_a < sizeof(*sack_a)) &&
101962306a36Sopenharmony_ci		 (!sack_b || oplen_b < sizeof(*sack_b)))
102062306a36Sopenharmony_ci		return 0;
102162306a36Sopenharmony_ci
102262306a36Sopenharmony_ci	while (oplen_a >= sizeof(*sack_a)) {
102362306a36Sopenharmony_ci		const struct tcp_sack_block_wire *sack_tmp = sack_b;
102462306a36Sopenharmony_ci		u32 start_a = get_unaligned_be32(&sack_a->start_seq);
102562306a36Sopenharmony_ci		u32 end_a = get_unaligned_be32(&sack_a->end_seq);
102662306a36Sopenharmony_ci		int oplen_tmp = oplen_b;
102762306a36Sopenharmony_ci		bool found = false;
102862306a36Sopenharmony_ci
102962306a36Sopenharmony_ci		/* DSACK; always considered greater to prevent dropping */
103062306a36Sopenharmony_ci		if (before(start_a, ack_seq_a))
103162306a36Sopenharmony_ci			return -1;
103262306a36Sopenharmony_ci
103362306a36Sopenharmony_ci		bytes_a += end_a - start_a;
103462306a36Sopenharmony_ci
103562306a36Sopenharmony_ci		while (oplen_tmp >= sizeof(*sack_tmp)) {
103662306a36Sopenharmony_ci			u32 start_b = get_unaligned_be32(&sack_tmp->start_seq);
103762306a36Sopenharmony_ci			u32 end_b = get_unaligned_be32(&sack_tmp->end_seq);
103862306a36Sopenharmony_ci
103962306a36Sopenharmony_ci			/* first time through we count the total size */
104062306a36Sopenharmony_ci			if (first)
104162306a36Sopenharmony_ci				bytes_b += end_b - start_b;
104262306a36Sopenharmony_ci
104362306a36Sopenharmony_ci			if (!after(start_b, start_a) && !before(end_b, end_a)) {
104462306a36Sopenharmony_ci				found = true;
104562306a36Sopenharmony_ci				if (!first)
104662306a36Sopenharmony_ci					break;
104762306a36Sopenharmony_ci			}
104862306a36Sopenharmony_ci			oplen_tmp -= sizeof(*sack_tmp);
104962306a36Sopenharmony_ci			sack_tmp++;
105062306a36Sopenharmony_ci		}
105162306a36Sopenharmony_ci
105262306a36Sopenharmony_ci		if (!found)
105362306a36Sopenharmony_ci			return -1;
105462306a36Sopenharmony_ci
105562306a36Sopenharmony_ci		oplen_a -= sizeof(*sack_a);
105662306a36Sopenharmony_ci		sack_a++;
105762306a36Sopenharmony_ci		first = false;
105862306a36Sopenharmony_ci	}
105962306a36Sopenharmony_ci
106062306a36Sopenharmony_ci	/* If we made it this far, all ranges SACKed by A are covered by B, so
106162306a36Sopenharmony_ci	 * either the SACKs are equal, or B SACKs more bytes.
106262306a36Sopenharmony_ci	 */
106362306a36Sopenharmony_ci	return bytes_b > bytes_a ? 1 : 0;
106462306a36Sopenharmony_ci}
106562306a36Sopenharmony_ci
106662306a36Sopenharmony_cistatic void cake_tcph_get_tstamp(const struct tcphdr *tcph,
106762306a36Sopenharmony_ci				 u32 *tsval, u32 *tsecr)
106862306a36Sopenharmony_ci{
106962306a36Sopenharmony_ci	const u8 *ptr;
107062306a36Sopenharmony_ci	int opsize;
107162306a36Sopenharmony_ci
107262306a36Sopenharmony_ci	ptr = cake_get_tcpopt(tcph, TCPOPT_TIMESTAMP, &opsize);
107362306a36Sopenharmony_ci
107462306a36Sopenharmony_ci	if (ptr && opsize == TCPOLEN_TIMESTAMP) {
107562306a36Sopenharmony_ci		*tsval = get_unaligned_be32(ptr);
107662306a36Sopenharmony_ci		*tsecr = get_unaligned_be32(ptr + 4);
107762306a36Sopenharmony_ci	}
107862306a36Sopenharmony_ci}
107962306a36Sopenharmony_ci
108062306a36Sopenharmony_cistatic bool cake_tcph_may_drop(const struct tcphdr *tcph,
108162306a36Sopenharmony_ci			       u32 tstamp_new, u32 tsecr_new)
108262306a36Sopenharmony_ci{
108362306a36Sopenharmony_ci	/* inspired by tcp_parse_options in tcp_input.c */
108462306a36Sopenharmony_ci	int length = __tcp_hdrlen(tcph) - sizeof(struct tcphdr);
108562306a36Sopenharmony_ci	const u8 *ptr = (const u8 *)(tcph + 1);
108662306a36Sopenharmony_ci	u32 tstamp, tsecr;
108762306a36Sopenharmony_ci
108862306a36Sopenharmony_ci	/* 3 reserved flags must be unset to avoid future breakage
108962306a36Sopenharmony_ci	 * ACK must be set
109062306a36Sopenharmony_ci	 * ECE/CWR are handled separately
109162306a36Sopenharmony_ci	 * All other flags URG/PSH/RST/SYN/FIN must be unset
109262306a36Sopenharmony_ci	 * 0x0FFF0000 = all TCP flags (confirm ACK=1, others zero)
109362306a36Sopenharmony_ci	 * 0x00C00000 = CWR/ECE (handled separately)
109462306a36Sopenharmony_ci	 * 0x0F3F0000 = 0x0FFF0000 & ~0x00C00000
109562306a36Sopenharmony_ci	 */
109662306a36Sopenharmony_ci	if (((tcp_flag_word(tcph) &
109762306a36Sopenharmony_ci	      cpu_to_be32(0x0F3F0000)) != TCP_FLAG_ACK))
109862306a36Sopenharmony_ci		return false;
109962306a36Sopenharmony_ci
110062306a36Sopenharmony_ci	while (length > 0) {
110162306a36Sopenharmony_ci		int opcode = *ptr++;
110262306a36Sopenharmony_ci		int opsize;
110362306a36Sopenharmony_ci
110462306a36Sopenharmony_ci		if (opcode == TCPOPT_EOL)
110562306a36Sopenharmony_ci			break;
110662306a36Sopenharmony_ci		if (opcode == TCPOPT_NOP) {
110762306a36Sopenharmony_ci			length--;
110862306a36Sopenharmony_ci			continue;
110962306a36Sopenharmony_ci		}
111062306a36Sopenharmony_ci		if (length < 2)
111162306a36Sopenharmony_ci			break;
111262306a36Sopenharmony_ci		opsize = *ptr++;
111362306a36Sopenharmony_ci		if (opsize < 2 || opsize > length)
111462306a36Sopenharmony_ci			break;
111562306a36Sopenharmony_ci
111662306a36Sopenharmony_ci		switch (opcode) {
111762306a36Sopenharmony_ci		case TCPOPT_MD5SIG: /* doesn't influence state */
111862306a36Sopenharmony_ci			break;
111962306a36Sopenharmony_ci
112062306a36Sopenharmony_ci		case TCPOPT_SACK: /* stricter checking performed later */
112162306a36Sopenharmony_ci			if (opsize % 8 != 2)
112262306a36Sopenharmony_ci				return false;
112362306a36Sopenharmony_ci			break;
112462306a36Sopenharmony_ci
112562306a36Sopenharmony_ci		case TCPOPT_TIMESTAMP:
112662306a36Sopenharmony_ci			/* only drop timestamps lower than new */
112762306a36Sopenharmony_ci			if (opsize != TCPOLEN_TIMESTAMP)
112862306a36Sopenharmony_ci				return false;
112962306a36Sopenharmony_ci			tstamp = get_unaligned_be32(ptr);
113062306a36Sopenharmony_ci			tsecr = get_unaligned_be32(ptr + 4);
113162306a36Sopenharmony_ci			if (after(tstamp, tstamp_new) ||
113262306a36Sopenharmony_ci			    after(tsecr, tsecr_new))
113362306a36Sopenharmony_ci				return false;
113462306a36Sopenharmony_ci			break;
113562306a36Sopenharmony_ci
113662306a36Sopenharmony_ci		case TCPOPT_MSS:  /* these should only be set on SYN */
113762306a36Sopenharmony_ci		case TCPOPT_WINDOW:
113862306a36Sopenharmony_ci		case TCPOPT_SACK_PERM:
113962306a36Sopenharmony_ci		case TCPOPT_FASTOPEN:
114062306a36Sopenharmony_ci		case TCPOPT_EXP:
114162306a36Sopenharmony_ci		default: /* don't drop if any unknown options are present */
114262306a36Sopenharmony_ci			return false;
114362306a36Sopenharmony_ci		}
114462306a36Sopenharmony_ci
114562306a36Sopenharmony_ci		ptr += opsize - 2;
114662306a36Sopenharmony_ci		length -= opsize;
114762306a36Sopenharmony_ci	}
114862306a36Sopenharmony_ci
114962306a36Sopenharmony_ci	return true;
115062306a36Sopenharmony_ci}
115162306a36Sopenharmony_ci
115262306a36Sopenharmony_cistatic struct sk_buff *cake_ack_filter(struct cake_sched_data *q,
115362306a36Sopenharmony_ci				       struct cake_flow *flow)
115462306a36Sopenharmony_ci{
115562306a36Sopenharmony_ci	bool aggressive = q->ack_filter == CAKE_ACK_AGGRESSIVE;
115662306a36Sopenharmony_ci	struct sk_buff *elig_ack = NULL, *elig_ack_prev = NULL;
115762306a36Sopenharmony_ci	struct sk_buff *skb_check, *skb_prev = NULL;
115862306a36Sopenharmony_ci	const struct ipv6hdr *ipv6h, *ipv6h_check;
115962306a36Sopenharmony_ci	unsigned char _tcph[64], _tcph_check[64];
116062306a36Sopenharmony_ci	const struct tcphdr *tcph, *tcph_check;
116162306a36Sopenharmony_ci	const struct iphdr *iph, *iph_check;
116262306a36Sopenharmony_ci	struct ipv6hdr _iph, _iph_check;
116362306a36Sopenharmony_ci	const struct sk_buff *skb;
116462306a36Sopenharmony_ci	int seglen, num_found = 0;
116562306a36Sopenharmony_ci	u32 tstamp = 0, tsecr = 0;
116662306a36Sopenharmony_ci	__be32 elig_flags = 0;
116762306a36Sopenharmony_ci	int sack_comp;
116862306a36Sopenharmony_ci
116962306a36Sopenharmony_ci	/* no other possible ACKs to filter */
117062306a36Sopenharmony_ci	if (flow->head == flow->tail)
117162306a36Sopenharmony_ci		return NULL;
117262306a36Sopenharmony_ci
117362306a36Sopenharmony_ci	skb = flow->tail;
117462306a36Sopenharmony_ci	tcph = cake_get_tcphdr(skb, _tcph, sizeof(_tcph));
117562306a36Sopenharmony_ci	iph = cake_get_iphdr(skb, &_iph);
117662306a36Sopenharmony_ci	if (!tcph)
117762306a36Sopenharmony_ci		return NULL;
117862306a36Sopenharmony_ci
117962306a36Sopenharmony_ci	cake_tcph_get_tstamp(tcph, &tstamp, &tsecr);
118062306a36Sopenharmony_ci
118162306a36Sopenharmony_ci	/* the 'triggering' packet need only have the ACK flag set.
118262306a36Sopenharmony_ci	 * also check that SYN is not set, as there won't be any previous ACKs.
118362306a36Sopenharmony_ci	 */
118462306a36Sopenharmony_ci	if ((tcp_flag_word(tcph) &
118562306a36Sopenharmony_ci	     (TCP_FLAG_ACK | TCP_FLAG_SYN)) != TCP_FLAG_ACK)
118662306a36Sopenharmony_ci		return NULL;
118762306a36Sopenharmony_ci
118862306a36Sopenharmony_ci	/* the 'triggering' ACK is at the tail of the queue, we have already
118962306a36Sopenharmony_ci	 * returned if it is the only packet in the flow. loop through the rest
119062306a36Sopenharmony_ci	 * of the queue looking for pure ACKs with the same 5-tuple as the
119162306a36Sopenharmony_ci	 * triggering one.
119262306a36Sopenharmony_ci	 */
119362306a36Sopenharmony_ci	for (skb_check = flow->head;
119462306a36Sopenharmony_ci	     skb_check && skb_check != skb;
119562306a36Sopenharmony_ci	     skb_prev = skb_check, skb_check = skb_check->next) {
119662306a36Sopenharmony_ci		iph_check = cake_get_iphdr(skb_check, &_iph_check);
119762306a36Sopenharmony_ci		tcph_check = cake_get_tcphdr(skb_check, &_tcph_check,
119862306a36Sopenharmony_ci					     sizeof(_tcph_check));
119962306a36Sopenharmony_ci
120062306a36Sopenharmony_ci		/* only TCP packets with matching 5-tuple are eligible, and only
120162306a36Sopenharmony_ci		 * drop safe headers
120262306a36Sopenharmony_ci		 */
120362306a36Sopenharmony_ci		if (!tcph_check || iph->version != iph_check->version ||
120462306a36Sopenharmony_ci		    tcph_check->source != tcph->source ||
120562306a36Sopenharmony_ci		    tcph_check->dest != tcph->dest)
120662306a36Sopenharmony_ci			continue;
120762306a36Sopenharmony_ci
120862306a36Sopenharmony_ci		if (iph_check->version == 4) {
120962306a36Sopenharmony_ci			if (iph_check->saddr != iph->saddr ||
121062306a36Sopenharmony_ci			    iph_check->daddr != iph->daddr)
121162306a36Sopenharmony_ci				continue;
121262306a36Sopenharmony_ci
121362306a36Sopenharmony_ci			seglen = iph_totlen(skb, iph_check) -
121462306a36Sopenharmony_ci				       (4 * iph_check->ihl);
121562306a36Sopenharmony_ci		} else if (iph_check->version == 6) {
121662306a36Sopenharmony_ci			ipv6h = (struct ipv6hdr *)iph;
121762306a36Sopenharmony_ci			ipv6h_check = (struct ipv6hdr *)iph_check;
121862306a36Sopenharmony_ci
121962306a36Sopenharmony_ci			if (ipv6_addr_cmp(&ipv6h_check->saddr, &ipv6h->saddr) ||
122062306a36Sopenharmony_ci			    ipv6_addr_cmp(&ipv6h_check->daddr, &ipv6h->daddr))
122162306a36Sopenharmony_ci				continue;
122262306a36Sopenharmony_ci
122362306a36Sopenharmony_ci			seglen = ntohs(ipv6h_check->payload_len);
122462306a36Sopenharmony_ci		} else {
122562306a36Sopenharmony_ci			WARN_ON(1);  /* shouldn't happen */
122662306a36Sopenharmony_ci			continue;
122762306a36Sopenharmony_ci		}
122862306a36Sopenharmony_ci
122962306a36Sopenharmony_ci		/* If the ECE/CWR flags changed from the previous eligible
123062306a36Sopenharmony_ci		 * packet in the same flow, we should no longer be dropping that
123162306a36Sopenharmony_ci		 * previous packet as this would lose information.
123262306a36Sopenharmony_ci		 */
123362306a36Sopenharmony_ci		if (elig_ack && (tcp_flag_word(tcph_check) &
123462306a36Sopenharmony_ci				 (TCP_FLAG_ECE | TCP_FLAG_CWR)) != elig_flags) {
123562306a36Sopenharmony_ci			elig_ack = NULL;
123662306a36Sopenharmony_ci			elig_ack_prev = NULL;
123762306a36Sopenharmony_ci			num_found--;
123862306a36Sopenharmony_ci		}
123962306a36Sopenharmony_ci
124062306a36Sopenharmony_ci		/* Check TCP options and flags, don't drop ACKs with segment
124162306a36Sopenharmony_ci		 * data, and don't drop ACKs with a higher cumulative ACK
124262306a36Sopenharmony_ci		 * counter than the triggering packet. Check ACK seqno here to
124362306a36Sopenharmony_ci		 * avoid parsing SACK options of packets we are going to exclude
124462306a36Sopenharmony_ci		 * anyway.
124562306a36Sopenharmony_ci		 */
124662306a36Sopenharmony_ci		if (!cake_tcph_may_drop(tcph_check, tstamp, tsecr) ||
124762306a36Sopenharmony_ci		    (seglen - __tcp_hdrlen(tcph_check)) != 0 ||
124862306a36Sopenharmony_ci		    after(ntohl(tcph_check->ack_seq), ntohl(tcph->ack_seq)))
124962306a36Sopenharmony_ci			continue;
125062306a36Sopenharmony_ci
125162306a36Sopenharmony_ci		/* Check SACK options. The triggering packet must SACK more data
125262306a36Sopenharmony_ci		 * than the ACK under consideration, or SACK the same range but
125362306a36Sopenharmony_ci		 * have a larger cumulative ACK counter. The latter is a
125462306a36Sopenharmony_ci		 * pathological case, but is contained in the following check
125562306a36Sopenharmony_ci		 * anyway, just to be safe.
125662306a36Sopenharmony_ci		 */
125762306a36Sopenharmony_ci		sack_comp = cake_tcph_sack_compare(tcph_check, tcph);
125862306a36Sopenharmony_ci
125962306a36Sopenharmony_ci		if (sack_comp < 0 ||
126062306a36Sopenharmony_ci		    (ntohl(tcph_check->ack_seq) == ntohl(tcph->ack_seq) &&
126162306a36Sopenharmony_ci		     sack_comp == 0))
126262306a36Sopenharmony_ci			continue;
126362306a36Sopenharmony_ci
126462306a36Sopenharmony_ci		/* At this point we have found an eligible pure ACK to drop; if
126562306a36Sopenharmony_ci		 * we are in aggressive mode, we are done. Otherwise, keep
126662306a36Sopenharmony_ci		 * searching unless this is the second eligible ACK we
126762306a36Sopenharmony_ci		 * found.
126862306a36Sopenharmony_ci		 *
126962306a36Sopenharmony_ci		 * Since we want to drop ACK closest to the head of the queue,
127062306a36Sopenharmony_ci		 * save the first eligible ACK we find, even if we need to loop
127162306a36Sopenharmony_ci		 * again.
127262306a36Sopenharmony_ci		 */
127362306a36Sopenharmony_ci		if (!elig_ack) {
127462306a36Sopenharmony_ci			elig_ack = skb_check;
127562306a36Sopenharmony_ci			elig_ack_prev = skb_prev;
127662306a36Sopenharmony_ci			elig_flags = (tcp_flag_word(tcph_check)
127762306a36Sopenharmony_ci				      & (TCP_FLAG_ECE | TCP_FLAG_CWR));
127862306a36Sopenharmony_ci		}
127962306a36Sopenharmony_ci
128062306a36Sopenharmony_ci		if (num_found++ > 0)
128162306a36Sopenharmony_ci			goto found;
128262306a36Sopenharmony_ci	}
128362306a36Sopenharmony_ci
128462306a36Sopenharmony_ci	/* We made it through the queue without finding two eligible ACKs . If
128562306a36Sopenharmony_ci	 * we found a single eligible ACK we can drop it in aggressive mode if
128662306a36Sopenharmony_ci	 * we can guarantee that this does not interfere with ECN flag
128762306a36Sopenharmony_ci	 * information. We ensure this by dropping it only if the enqueued
128862306a36Sopenharmony_ci	 * packet is consecutive with the eligible ACK, and their flags match.
128962306a36Sopenharmony_ci	 */
129062306a36Sopenharmony_ci	if (elig_ack && aggressive && elig_ack->next == skb &&
129162306a36Sopenharmony_ci	    (elig_flags == (tcp_flag_word(tcph) &
129262306a36Sopenharmony_ci			    (TCP_FLAG_ECE | TCP_FLAG_CWR))))
129362306a36Sopenharmony_ci		goto found;
129462306a36Sopenharmony_ci
129562306a36Sopenharmony_ci	return NULL;
129662306a36Sopenharmony_ci
129762306a36Sopenharmony_cifound:
129862306a36Sopenharmony_ci	if (elig_ack_prev)
129962306a36Sopenharmony_ci		elig_ack_prev->next = elig_ack->next;
130062306a36Sopenharmony_ci	else
130162306a36Sopenharmony_ci		flow->head = elig_ack->next;
130262306a36Sopenharmony_ci
130362306a36Sopenharmony_ci	skb_mark_not_on_list(elig_ack);
130462306a36Sopenharmony_ci
130562306a36Sopenharmony_ci	return elig_ack;
130662306a36Sopenharmony_ci}
130762306a36Sopenharmony_ci
130862306a36Sopenharmony_cistatic u64 cake_ewma(u64 avg, u64 sample, u32 shift)
130962306a36Sopenharmony_ci{
131062306a36Sopenharmony_ci	avg -= avg >> shift;
131162306a36Sopenharmony_ci	avg += sample >> shift;
131262306a36Sopenharmony_ci	return avg;
131362306a36Sopenharmony_ci}
131462306a36Sopenharmony_ci
131562306a36Sopenharmony_cistatic u32 cake_calc_overhead(struct cake_sched_data *q, u32 len, u32 off)
131662306a36Sopenharmony_ci{
131762306a36Sopenharmony_ci	if (q->rate_flags & CAKE_FLAG_OVERHEAD)
131862306a36Sopenharmony_ci		len -= off;
131962306a36Sopenharmony_ci
132062306a36Sopenharmony_ci	if (q->max_netlen < len)
132162306a36Sopenharmony_ci		q->max_netlen = len;
132262306a36Sopenharmony_ci	if (q->min_netlen > len)
132362306a36Sopenharmony_ci		q->min_netlen = len;
132462306a36Sopenharmony_ci
132562306a36Sopenharmony_ci	len += q->rate_overhead;
132662306a36Sopenharmony_ci
132762306a36Sopenharmony_ci	if (len < q->rate_mpu)
132862306a36Sopenharmony_ci		len = q->rate_mpu;
132962306a36Sopenharmony_ci
133062306a36Sopenharmony_ci	if (q->atm_mode == CAKE_ATM_ATM) {
133162306a36Sopenharmony_ci		len += 47;
133262306a36Sopenharmony_ci		len /= 48;
133362306a36Sopenharmony_ci		len *= 53;
133462306a36Sopenharmony_ci	} else if (q->atm_mode == CAKE_ATM_PTM) {
133562306a36Sopenharmony_ci		/* Add one byte per 64 bytes or part thereof.
133662306a36Sopenharmony_ci		 * This is conservative and easier to calculate than the
133762306a36Sopenharmony_ci		 * precise value.
133862306a36Sopenharmony_ci		 */
133962306a36Sopenharmony_ci		len += (len + 63) / 64;
134062306a36Sopenharmony_ci	}
134162306a36Sopenharmony_ci
134262306a36Sopenharmony_ci	if (q->max_adjlen < len)
134362306a36Sopenharmony_ci		q->max_adjlen = len;
134462306a36Sopenharmony_ci	if (q->min_adjlen > len)
134562306a36Sopenharmony_ci		q->min_adjlen = len;
134662306a36Sopenharmony_ci
134762306a36Sopenharmony_ci	return len;
134862306a36Sopenharmony_ci}
134962306a36Sopenharmony_ci
135062306a36Sopenharmony_cistatic u32 cake_overhead(struct cake_sched_data *q, const struct sk_buff *skb)
135162306a36Sopenharmony_ci{
135262306a36Sopenharmony_ci	const struct skb_shared_info *shinfo = skb_shinfo(skb);
135362306a36Sopenharmony_ci	unsigned int hdr_len, last_len = 0;
135462306a36Sopenharmony_ci	u32 off = skb_network_offset(skb);
135562306a36Sopenharmony_ci	u32 len = qdisc_pkt_len(skb);
135662306a36Sopenharmony_ci	u16 segs = 1;
135762306a36Sopenharmony_ci
135862306a36Sopenharmony_ci	q->avg_netoff = cake_ewma(q->avg_netoff, off << 16, 8);
135962306a36Sopenharmony_ci
136062306a36Sopenharmony_ci	if (!shinfo->gso_size)
136162306a36Sopenharmony_ci		return cake_calc_overhead(q, len, off);
136262306a36Sopenharmony_ci
136362306a36Sopenharmony_ci	/* borrowed from qdisc_pkt_len_init() */
136462306a36Sopenharmony_ci	hdr_len = skb_transport_offset(skb);
136562306a36Sopenharmony_ci
136662306a36Sopenharmony_ci	/* + transport layer */
136762306a36Sopenharmony_ci	if (likely(shinfo->gso_type & (SKB_GSO_TCPV4 |
136862306a36Sopenharmony_ci						SKB_GSO_TCPV6))) {
136962306a36Sopenharmony_ci		const struct tcphdr *th;
137062306a36Sopenharmony_ci		struct tcphdr _tcphdr;
137162306a36Sopenharmony_ci
137262306a36Sopenharmony_ci		th = skb_header_pointer(skb, hdr_len,
137362306a36Sopenharmony_ci					sizeof(_tcphdr), &_tcphdr);
137462306a36Sopenharmony_ci		if (likely(th))
137562306a36Sopenharmony_ci			hdr_len += __tcp_hdrlen(th);
137662306a36Sopenharmony_ci	} else {
137762306a36Sopenharmony_ci		struct udphdr _udphdr;
137862306a36Sopenharmony_ci
137962306a36Sopenharmony_ci		if (skb_header_pointer(skb, hdr_len,
138062306a36Sopenharmony_ci				       sizeof(_udphdr), &_udphdr))
138162306a36Sopenharmony_ci			hdr_len += sizeof(struct udphdr);
138262306a36Sopenharmony_ci	}
138362306a36Sopenharmony_ci
138462306a36Sopenharmony_ci	if (unlikely(shinfo->gso_type & SKB_GSO_DODGY))
138562306a36Sopenharmony_ci		segs = DIV_ROUND_UP(skb->len - hdr_len,
138662306a36Sopenharmony_ci				    shinfo->gso_size);
138762306a36Sopenharmony_ci	else
138862306a36Sopenharmony_ci		segs = shinfo->gso_segs;
138962306a36Sopenharmony_ci
139062306a36Sopenharmony_ci	len = shinfo->gso_size + hdr_len;
139162306a36Sopenharmony_ci	last_len = skb->len - shinfo->gso_size * (segs - 1);
139262306a36Sopenharmony_ci
139362306a36Sopenharmony_ci	return (cake_calc_overhead(q, len, off) * (segs - 1) +
139462306a36Sopenharmony_ci		cake_calc_overhead(q, last_len, off));
139562306a36Sopenharmony_ci}
139662306a36Sopenharmony_ci
139762306a36Sopenharmony_cistatic void cake_heap_swap(struct cake_sched_data *q, u16 i, u16 j)
139862306a36Sopenharmony_ci{
139962306a36Sopenharmony_ci	struct cake_heap_entry ii = q->overflow_heap[i];
140062306a36Sopenharmony_ci	struct cake_heap_entry jj = q->overflow_heap[j];
140162306a36Sopenharmony_ci
140262306a36Sopenharmony_ci	q->overflow_heap[i] = jj;
140362306a36Sopenharmony_ci	q->overflow_heap[j] = ii;
140462306a36Sopenharmony_ci
140562306a36Sopenharmony_ci	q->tins[ii.t].overflow_idx[ii.b] = j;
140662306a36Sopenharmony_ci	q->tins[jj.t].overflow_idx[jj.b] = i;
140762306a36Sopenharmony_ci}
140862306a36Sopenharmony_ci
140962306a36Sopenharmony_cistatic u32 cake_heap_get_backlog(const struct cake_sched_data *q, u16 i)
141062306a36Sopenharmony_ci{
141162306a36Sopenharmony_ci	struct cake_heap_entry ii = q->overflow_heap[i];
141262306a36Sopenharmony_ci
141362306a36Sopenharmony_ci	return q->tins[ii.t].backlogs[ii.b];
141462306a36Sopenharmony_ci}
141562306a36Sopenharmony_ci
141662306a36Sopenharmony_cistatic void cake_heapify(struct cake_sched_data *q, u16 i)
141762306a36Sopenharmony_ci{
141862306a36Sopenharmony_ci	static const u32 a = CAKE_MAX_TINS * CAKE_QUEUES;
141962306a36Sopenharmony_ci	u32 mb = cake_heap_get_backlog(q, i);
142062306a36Sopenharmony_ci	u32 m = i;
142162306a36Sopenharmony_ci
142262306a36Sopenharmony_ci	while (m < a) {
142362306a36Sopenharmony_ci		u32 l = m + m + 1;
142462306a36Sopenharmony_ci		u32 r = l + 1;
142562306a36Sopenharmony_ci
142662306a36Sopenharmony_ci		if (l < a) {
142762306a36Sopenharmony_ci			u32 lb = cake_heap_get_backlog(q, l);
142862306a36Sopenharmony_ci
142962306a36Sopenharmony_ci			if (lb > mb) {
143062306a36Sopenharmony_ci				m  = l;
143162306a36Sopenharmony_ci				mb = lb;
143262306a36Sopenharmony_ci			}
143362306a36Sopenharmony_ci		}
143462306a36Sopenharmony_ci
143562306a36Sopenharmony_ci		if (r < a) {
143662306a36Sopenharmony_ci			u32 rb = cake_heap_get_backlog(q, r);
143762306a36Sopenharmony_ci
143862306a36Sopenharmony_ci			if (rb > mb) {
143962306a36Sopenharmony_ci				m  = r;
144062306a36Sopenharmony_ci				mb = rb;
144162306a36Sopenharmony_ci			}
144262306a36Sopenharmony_ci		}
144362306a36Sopenharmony_ci
144462306a36Sopenharmony_ci		if (m != i) {
144562306a36Sopenharmony_ci			cake_heap_swap(q, i, m);
144662306a36Sopenharmony_ci			i = m;
144762306a36Sopenharmony_ci		} else {
144862306a36Sopenharmony_ci			break;
144962306a36Sopenharmony_ci		}
145062306a36Sopenharmony_ci	}
145162306a36Sopenharmony_ci}
145262306a36Sopenharmony_ci
145362306a36Sopenharmony_cistatic void cake_heapify_up(struct cake_sched_data *q, u16 i)
145462306a36Sopenharmony_ci{
145562306a36Sopenharmony_ci	while (i > 0 && i < CAKE_MAX_TINS * CAKE_QUEUES) {
145662306a36Sopenharmony_ci		u16 p = (i - 1) >> 1;
145762306a36Sopenharmony_ci		u32 ib = cake_heap_get_backlog(q, i);
145862306a36Sopenharmony_ci		u32 pb = cake_heap_get_backlog(q, p);
145962306a36Sopenharmony_ci
146062306a36Sopenharmony_ci		if (ib > pb) {
146162306a36Sopenharmony_ci			cake_heap_swap(q, i, p);
146262306a36Sopenharmony_ci			i = p;
146362306a36Sopenharmony_ci		} else {
146462306a36Sopenharmony_ci			break;
146562306a36Sopenharmony_ci		}
146662306a36Sopenharmony_ci	}
146762306a36Sopenharmony_ci}
146862306a36Sopenharmony_ci
146962306a36Sopenharmony_cistatic int cake_advance_shaper(struct cake_sched_data *q,
147062306a36Sopenharmony_ci			       struct cake_tin_data *b,
147162306a36Sopenharmony_ci			       struct sk_buff *skb,
147262306a36Sopenharmony_ci			       ktime_t now, bool drop)
147362306a36Sopenharmony_ci{
147462306a36Sopenharmony_ci	u32 len = get_cobalt_cb(skb)->adjusted_len;
147562306a36Sopenharmony_ci
147662306a36Sopenharmony_ci	/* charge packet bandwidth to this tin
147762306a36Sopenharmony_ci	 * and to the global shaper.
147862306a36Sopenharmony_ci	 */
147962306a36Sopenharmony_ci	if (q->rate_ns) {
148062306a36Sopenharmony_ci		u64 tin_dur = (len * b->tin_rate_ns) >> b->tin_rate_shft;
148162306a36Sopenharmony_ci		u64 global_dur = (len * q->rate_ns) >> q->rate_shft;
148262306a36Sopenharmony_ci		u64 failsafe_dur = global_dur + (global_dur >> 1);
148362306a36Sopenharmony_ci
148462306a36Sopenharmony_ci		if (ktime_before(b->time_next_packet, now))
148562306a36Sopenharmony_ci			b->time_next_packet = ktime_add_ns(b->time_next_packet,
148662306a36Sopenharmony_ci							   tin_dur);
148762306a36Sopenharmony_ci
148862306a36Sopenharmony_ci		else if (ktime_before(b->time_next_packet,
148962306a36Sopenharmony_ci				      ktime_add_ns(now, tin_dur)))
149062306a36Sopenharmony_ci			b->time_next_packet = ktime_add_ns(now, tin_dur);
149162306a36Sopenharmony_ci
149262306a36Sopenharmony_ci		q->time_next_packet = ktime_add_ns(q->time_next_packet,
149362306a36Sopenharmony_ci						   global_dur);
149462306a36Sopenharmony_ci		if (!drop)
149562306a36Sopenharmony_ci			q->failsafe_next_packet = \
149662306a36Sopenharmony_ci				ktime_add_ns(q->failsafe_next_packet,
149762306a36Sopenharmony_ci					     failsafe_dur);
149862306a36Sopenharmony_ci	}
149962306a36Sopenharmony_ci	return len;
150062306a36Sopenharmony_ci}
150162306a36Sopenharmony_ci
150262306a36Sopenharmony_cistatic unsigned int cake_drop(struct Qdisc *sch, struct sk_buff **to_free)
150362306a36Sopenharmony_ci{
150462306a36Sopenharmony_ci	struct cake_sched_data *q = qdisc_priv(sch);
150562306a36Sopenharmony_ci	ktime_t now = ktime_get();
150662306a36Sopenharmony_ci	u32 idx = 0, tin = 0, len;
150762306a36Sopenharmony_ci	struct cake_heap_entry qq;
150862306a36Sopenharmony_ci	struct cake_tin_data *b;
150962306a36Sopenharmony_ci	struct cake_flow *flow;
151062306a36Sopenharmony_ci	struct sk_buff *skb;
151162306a36Sopenharmony_ci
151262306a36Sopenharmony_ci	if (!q->overflow_timeout) {
151362306a36Sopenharmony_ci		int i;
151462306a36Sopenharmony_ci		/* Build fresh max-heap */
151562306a36Sopenharmony_ci		for (i = CAKE_MAX_TINS * CAKE_QUEUES / 2; i >= 0; i--)
151662306a36Sopenharmony_ci			cake_heapify(q, i);
151762306a36Sopenharmony_ci	}
151862306a36Sopenharmony_ci	q->overflow_timeout = 65535;
151962306a36Sopenharmony_ci
152062306a36Sopenharmony_ci	/* select longest queue for pruning */
152162306a36Sopenharmony_ci	qq  = q->overflow_heap[0];
152262306a36Sopenharmony_ci	tin = qq.t;
152362306a36Sopenharmony_ci	idx = qq.b;
152462306a36Sopenharmony_ci
152562306a36Sopenharmony_ci	b = &q->tins[tin];
152662306a36Sopenharmony_ci	flow = &b->flows[idx];
152762306a36Sopenharmony_ci	skb = dequeue_head(flow);
152862306a36Sopenharmony_ci	if (unlikely(!skb)) {
152962306a36Sopenharmony_ci		/* heap has gone wrong, rebuild it next time */
153062306a36Sopenharmony_ci		q->overflow_timeout = 0;
153162306a36Sopenharmony_ci		return idx + (tin << 16);
153262306a36Sopenharmony_ci	}
153362306a36Sopenharmony_ci
153462306a36Sopenharmony_ci	if (cobalt_queue_full(&flow->cvars, &b->cparams, now))
153562306a36Sopenharmony_ci		b->unresponsive_flow_count++;
153662306a36Sopenharmony_ci
153762306a36Sopenharmony_ci	len = qdisc_pkt_len(skb);
153862306a36Sopenharmony_ci	q->buffer_used      -= skb->truesize;
153962306a36Sopenharmony_ci	b->backlogs[idx]    -= len;
154062306a36Sopenharmony_ci	b->tin_backlog      -= len;
154162306a36Sopenharmony_ci	sch->qstats.backlog -= len;
154262306a36Sopenharmony_ci	qdisc_tree_reduce_backlog(sch, 1, len);
154362306a36Sopenharmony_ci
154462306a36Sopenharmony_ci	flow->dropped++;
154562306a36Sopenharmony_ci	b->tin_dropped++;
154662306a36Sopenharmony_ci	sch->qstats.drops++;
154762306a36Sopenharmony_ci
154862306a36Sopenharmony_ci	if (q->rate_flags & CAKE_FLAG_INGRESS)
154962306a36Sopenharmony_ci		cake_advance_shaper(q, b, skb, now, true);
155062306a36Sopenharmony_ci
155162306a36Sopenharmony_ci	__qdisc_drop(skb, to_free);
155262306a36Sopenharmony_ci	sch->q.qlen--;
155362306a36Sopenharmony_ci
155462306a36Sopenharmony_ci	cake_heapify(q, 0);
155562306a36Sopenharmony_ci
155662306a36Sopenharmony_ci	return idx + (tin << 16);
155762306a36Sopenharmony_ci}
155862306a36Sopenharmony_ci
155962306a36Sopenharmony_cistatic u8 cake_handle_diffserv(struct sk_buff *skb, bool wash)
156062306a36Sopenharmony_ci{
156162306a36Sopenharmony_ci	const int offset = skb_network_offset(skb);
156262306a36Sopenharmony_ci	u16 *buf, buf_;
156362306a36Sopenharmony_ci	u8 dscp;
156462306a36Sopenharmony_ci
156562306a36Sopenharmony_ci	switch (skb_protocol(skb, true)) {
156662306a36Sopenharmony_ci	case htons(ETH_P_IP):
156762306a36Sopenharmony_ci		buf = skb_header_pointer(skb, offset, sizeof(buf_), &buf_);
156862306a36Sopenharmony_ci		if (unlikely(!buf))
156962306a36Sopenharmony_ci			return 0;
157062306a36Sopenharmony_ci
157162306a36Sopenharmony_ci		/* ToS is in the second byte of iphdr */
157262306a36Sopenharmony_ci		dscp = ipv4_get_dsfield((struct iphdr *)buf) >> 2;
157362306a36Sopenharmony_ci
157462306a36Sopenharmony_ci		if (wash && dscp) {
157562306a36Sopenharmony_ci			const int wlen = offset + sizeof(struct iphdr);
157662306a36Sopenharmony_ci
157762306a36Sopenharmony_ci			if (!pskb_may_pull(skb, wlen) ||
157862306a36Sopenharmony_ci			    skb_try_make_writable(skb, wlen))
157962306a36Sopenharmony_ci				return 0;
158062306a36Sopenharmony_ci
158162306a36Sopenharmony_ci			ipv4_change_dsfield(ip_hdr(skb), INET_ECN_MASK, 0);
158262306a36Sopenharmony_ci		}
158362306a36Sopenharmony_ci
158462306a36Sopenharmony_ci		return dscp;
158562306a36Sopenharmony_ci
158662306a36Sopenharmony_ci	case htons(ETH_P_IPV6):
158762306a36Sopenharmony_ci		buf = skb_header_pointer(skb, offset, sizeof(buf_), &buf_);
158862306a36Sopenharmony_ci		if (unlikely(!buf))
158962306a36Sopenharmony_ci			return 0;
159062306a36Sopenharmony_ci
159162306a36Sopenharmony_ci		/* Traffic class is in the first and second bytes of ipv6hdr */
159262306a36Sopenharmony_ci		dscp = ipv6_get_dsfield((struct ipv6hdr *)buf) >> 2;
159362306a36Sopenharmony_ci
159462306a36Sopenharmony_ci		if (wash && dscp) {
159562306a36Sopenharmony_ci			const int wlen = offset + sizeof(struct ipv6hdr);
159662306a36Sopenharmony_ci
159762306a36Sopenharmony_ci			if (!pskb_may_pull(skb, wlen) ||
159862306a36Sopenharmony_ci			    skb_try_make_writable(skb, wlen))
159962306a36Sopenharmony_ci				return 0;
160062306a36Sopenharmony_ci
160162306a36Sopenharmony_ci			ipv6_change_dsfield(ipv6_hdr(skb), INET_ECN_MASK, 0);
160262306a36Sopenharmony_ci		}
160362306a36Sopenharmony_ci
160462306a36Sopenharmony_ci		return dscp;
160562306a36Sopenharmony_ci
160662306a36Sopenharmony_ci	case htons(ETH_P_ARP):
160762306a36Sopenharmony_ci		return 0x38;  /* CS7 - Net Control */
160862306a36Sopenharmony_ci
160962306a36Sopenharmony_ci	default:
161062306a36Sopenharmony_ci		/* If there is no Diffserv field, treat as best-effort */
161162306a36Sopenharmony_ci		return 0;
161262306a36Sopenharmony_ci	}
161362306a36Sopenharmony_ci}
161462306a36Sopenharmony_ci
161562306a36Sopenharmony_cistatic struct cake_tin_data *cake_select_tin(struct Qdisc *sch,
161662306a36Sopenharmony_ci					     struct sk_buff *skb)
161762306a36Sopenharmony_ci{
161862306a36Sopenharmony_ci	struct cake_sched_data *q = qdisc_priv(sch);
161962306a36Sopenharmony_ci	u32 tin, mark;
162062306a36Sopenharmony_ci	bool wash;
162162306a36Sopenharmony_ci	u8 dscp;
162262306a36Sopenharmony_ci
162362306a36Sopenharmony_ci	/* Tin selection: Default to diffserv-based selection, allow overriding
162462306a36Sopenharmony_ci	 * using firewall marks or skb->priority. Call DSCP parsing early if
162562306a36Sopenharmony_ci	 * wash is enabled, otherwise defer to below to skip unneeded parsing.
162662306a36Sopenharmony_ci	 */
162762306a36Sopenharmony_ci	mark = (skb->mark & q->fwmark_mask) >> q->fwmark_shft;
162862306a36Sopenharmony_ci	wash = !!(q->rate_flags & CAKE_FLAG_WASH);
162962306a36Sopenharmony_ci	if (wash)
163062306a36Sopenharmony_ci		dscp = cake_handle_diffserv(skb, wash);
163162306a36Sopenharmony_ci
163262306a36Sopenharmony_ci	if (q->tin_mode == CAKE_DIFFSERV_BESTEFFORT)
163362306a36Sopenharmony_ci		tin = 0;
163462306a36Sopenharmony_ci
163562306a36Sopenharmony_ci	else if (mark && mark <= q->tin_cnt)
163662306a36Sopenharmony_ci		tin = q->tin_order[mark - 1];
163762306a36Sopenharmony_ci
163862306a36Sopenharmony_ci	else if (TC_H_MAJ(skb->priority) == sch->handle &&
163962306a36Sopenharmony_ci		 TC_H_MIN(skb->priority) > 0 &&
164062306a36Sopenharmony_ci		 TC_H_MIN(skb->priority) <= q->tin_cnt)
164162306a36Sopenharmony_ci		tin = q->tin_order[TC_H_MIN(skb->priority) - 1];
164262306a36Sopenharmony_ci
164362306a36Sopenharmony_ci	else {
164462306a36Sopenharmony_ci		if (!wash)
164562306a36Sopenharmony_ci			dscp = cake_handle_diffserv(skb, wash);
164662306a36Sopenharmony_ci		tin = q->tin_index[dscp];
164762306a36Sopenharmony_ci
164862306a36Sopenharmony_ci		if (unlikely(tin >= q->tin_cnt))
164962306a36Sopenharmony_ci			tin = 0;
165062306a36Sopenharmony_ci	}
165162306a36Sopenharmony_ci
165262306a36Sopenharmony_ci	return &q->tins[tin];
165362306a36Sopenharmony_ci}
165462306a36Sopenharmony_ci
165562306a36Sopenharmony_cistatic u32 cake_classify(struct Qdisc *sch, struct cake_tin_data **t,
165662306a36Sopenharmony_ci			 struct sk_buff *skb, int flow_mode, int *qerr)
165762306a36Sopenharmony_ci{
165862306a36Sopenharmony_ci	struct cake_sched_data *q = qdisc_priv(sch);
165962306a36Sopenharmony_ci	struct tcf_proto *filter;
166062306a36Sopenharmony_ci	struct tcf_result res;
166162306a36Sopenharmony_ci	u16 flow = 0, host = 0;
166262306a36Sopenharmony_ci	int result;
166362306a36Sopenharmony_ci
166462306a36Sopenharmony_ci	filter = rcu_dereference_bh(q->filter_list);
166562306a36Sopenharmony_ci	if (!filter)
166662306a36Sopenharmony_ci		goto hash;
166762306a36Sopenharmony_ci
166862306a36Sopenharmony_ci	*qerr = NET_XMIT_SUCCESS | __NET_XMIT_BYPASS;
166962306a36Sopenharmony_ci	result = tcf_classify(skb, NULL, filter, &res, false);
167062306a36Sopenharmony_ci
167162306a36Sopenharmony_ci	if (result >= 0) {
167262306a36Sopenharmony_ci#ifdef CONFIG_NET_CLS_ACT
167362306a36Sopenharmony_ci		switch (result) {
167462306a36Sopenharmony_ci		case TC_ACT_STOLEN:
167562306a36Sopenharmony_ci		case TC_ACT_QUEUED:
167662306a36Sopenharmony_ci		case TC_ACT_TRAP:
167762306a36Sopenharmony_ci			*qerr = NET_XMIT_SUCCESS | __NET_XMIT_STOLEN;
167862306a36Sopenharmony_ci			fallthrough;
167962306a36Sopenharmony_ci		case TC_ACT_SHOT:
168062306a36Sopenharmony_ci			return 0;
168162306a36Sopenharmony_ci		}
168262306a36Sopenharmony_ci#endif
168362306a36Sopenharmony_ci		if (TC_H_MIN(res.classid) <= CAKE_QUEUES)
168462306a36Sopenharmony_ci			flow = TC_H_MIN(res.classid);
168562306a36Sopenharmony_ci		if (TC_H_MAJ(res.classid) <= (CAKE_QUEUES << 16))
168662306a36Sopenharmony_ci			host = TC_H_MAJ(res.classid) >> 16;
168762306a36Sopenharmony_ci	}
168862306a36Sopenharmony_cihash:
168962306a36Sopenharmony_ci	*t = cake_select_tin(sch, skb);
169062306a36Sopenharmony_ci	return cake_hash(*t, skb, flow_mode, flow, host) + 1;
169162306a36Sopenharmony_ci}
169262306a36Sopenharmony_ci
169362306a36Sopenharmony_cistatic void cake_reconfigure(struct Qdisc *sch);
169462306a36Sopenharmony_ci
169562306a36Sopenharmony_cistatic s32 cake_enqueue(struct sk_buff *skb, struct Qdisc *sch,
169662306a36Sopenharmony_ci			struct sk_buff **to_free)
169762306a36Sopenharmony_ci{
169862306a36Sopenharmony_ci	struct cake_sched_data *q = qdisc_priv(sch);
169962306a36Sopenharmony_ci	int len = qdisc_pkt_len(skb);
170062306a36Sopenharmony_ci	int ret;
170162306a36Sopenharmony_ci	struct sk_buff *ack = NULL;
170262306a36Sopenharmony_ci	ktime_t now = ktime_get();
170362306a36Sopenharmony_ci	struct cake_tin_data *b;
170462306a36Sopenharmony_ci	struct cake_flow *flow;
170562306a36Sopenharmony_ci	u32 idx;
170662306a36Sopenharmony_ci
170762306a36Sopenharmony_ci	/* choose flow to insert into */
170862306a36Sopenharmony_ci	idx = cake_classify(sch, &b, skb, q->flow_mode, &ret);
170962306a36Sopenharmony_ci	if (idx == 0) {
171062306a36Sopenharmony_ci		if (ret & __NET_XMIT_BYPASS)
171162306a36Sopenharmony_ci			qdisc_qstats_drop(sch);
171262306a36Sopenharmony_ci		__qdisc_drop(skb, to_free);
171362306a36Sopenharmony_ci		return ret;
171462306a36Sopenharmony_ci	}
171562306a36Sopenharmony_ci	idx--;
171662306a36Sopenharmony_ci	flow = &b->flows[idx];
171762306a36Sopenharmony_ci
171862306a36Sopenharmony_ci	/* ensure shaper state isn't stale */
171962306a36Sopenharmony_ci	if (!b->tin_backlog) {
172062306a36Sopenharmony_ci		if (ktime_before(b->time_next_packet, now))
172162306a36Sopenharmony_ci			b->time_next_packet = now;
172262306a36Sopenharmony_ci
172362306a36Sopenharmony_ci		if (!sch->q.qlen) {
172462306a36Sopenharmony_ci			if (ktime_before(q->time_next_packet, now)) {
172562306a36Sopenharmony_ci				q->failsafe_next_packet = now;
172662306a36Sopenharmony_ci				q->time_next_packet = now;
172762306a36Sopenharmony_ci			} else if (ktime_after(q->time_next_packet, now) &&
172862306a36Sopenharmony_ci				   ktime_after(q->failsafe_next_packet, now)) {
172962306a36Sopenharmony_ci				u64 next = \
173062306a36Sopenharmony_ci					min(ktime_to_ns(q->time_next_packet),
173162306a36Sopenharmony_ci					    ktime_to_ns(
173262306a36Sopenharmony_ci						   q->failsafe_next_packet));
173362306a36Sopenharmony_ci				sch->qstats.overlimits++;
173462306a36Sopenharmony_ci				qdisc_watchdog_schedule_ns(&q->watchdog, next);
173562306a36Sopenharmony_ci			}
173662306a36Sopenharmony_ci		}
173762306a36Sopenharmony_ci	}
173862306a36Sopenharmony_ci
173962306a36Sopenharmony_ci	if (unlikely(len > b->max_skblen))
174062306a36Sopenharmony_ci		b->max_skblen = len;
174162306a36Sopenharmony_ci
174262306a36Sopenharmony_ci	if (skb_is_gso(skb) && q->rate_flags & CAKE_FLAG_SPLIT_GSO) {
174362306a36Sopenharmony_ci		struct sk_buff *segs, *nskb;
174462306a36Sopenharmony_ci		netdev_features_t features = netif_skb_features(skb);
174562306a36Sopenharmony_ci		unsigned int slen = 0, numsegs = 0;
174662306a36Sopenharmony_ci
174762306a36Sopenharmony_ci		segs = skb_gso_segment(skb, features & ~NETIF_F_GSO_MASK);
174862306a36Sopenharmony_ci		if (IS_ERR_OR_NULL(segs))
174962306a36Sopenharmony_ci			return qdisc_drop(skb, sch, to_free);
175062306a36Sopenharmony_ci
175162306a36Sopenharmony_ci		skb_list_walk_safe(segs, segs, nskb) {
175262306a36Sopenharmony_ci			skb_mark_not_on_list(segs);
175362306a36Sopenharmony_ci			qdisc_skb_cb(segs)->pkt_len = segs->len;
175462306a36Sopenharmony_ci			cobalt_set_enqueue_time(segs, now);
175562306a36Sopenharmony_ci			get_cobalt_cb(segs)->adjusted_len = cake_overhead(q,
175662306a36Sopenharmony_ci									  segs);
175762306a36Sopenharmony_ci			flow_queue_add(flow, segs);
175862306a36Sopenharmony_ci
175962306a36Sopenharmony_ci			sch->q.qlen++;
176062306a36Sopenharmony_ci			numsegs++;
176162306a36Sopenharmony_ci			slen += segs->len;
176262306a36Sopenharmony_ci			q->buffer_used += segs->truesize;
176362306a36Sopenharmony_ci			b->packets++;
176462306a36Sopenharmony_ci		}
176562306a36Sopenharmony_ci
176662306a36Sopenharmony_ci		/* stats */
176762306a36Sopenharmony_ci		b->bytes	    += slen;
176862306a36Sopenharmony_ci		b->backlogs[idx]    += slen;
176962306a36Sopenharmony_ci		b->tin_backlog      += slen;
177062306a36Sopenharmony_ci		sch->qstats.backlog += slen;
177162306a36Sopenharmony_ci		q->avg_window_bytes += slen;
177262306a36Sopenharmony_ci
177362306a36Sopenharmony_ci		qdisc_tree_reduce_backlog(sch, 1-numsegs, len-slen);
177462306a36Sopenharmony_ci		consume_skb(skb);
177562306a36Sopenharmony_ci	} else {
177662306a36Sopenharmony_ci		/* not splitting */
177762306a36Sopenharmony_ci		cobalt_set_enqueue_time(skb, now);
177862306a36Sopenharmony_ci		get_cobalt_cb(skb)->adjusted_len = cake_overhead(q, skb);
177962306a36Sopenharmony_ci		flow_queue_add(flow, skb);
178062306a36Sopenharmony_ci
178162306a36Sopenharmony_ci		if (q->ack_filter)
178262306a36Sopenharmony_ci			ack = cake_ack_filter(q, flow);
178362306a36Sopenharmony_ci
178462306a36Sopenharmony_ci		if (ack) {
178562306a36Sopenharmony_ci			b->ack_drops++;
178662306a36Sopenharmony_ci			sch->qstats.drops++;
178762306a36Sopenharmony_ci			b->bytes += qdisc_pkt_len(ack);
178862306a36Sopenharmony_ci			len -= qdisc_pkt_len(ack);
178962306a36Sopenharmony_ci			q->buffer_used += skb->truesize - ack->truesize;
179062306a36Sopenharmony_ci			if (q->rate_flags & CAKE_FLAG_INGRESS)
179162306a36Sopenharmony_ci				cake_advance_shaper(q, b, ack, now, true);
179262306a36Sopenharmony_ci
179362306a36Sopenharmony_ci			qdisc_tree_reduce_backlog(sch, 1, qdisc_pkt_len(ack));
179462306a36Sopenharmony_ci			consume_skb(ack);
179562306a36Sopenharmony_ci		} else {
179662306a36Sopenharmony_ci			sch->q.qlen++;
179762306a36Sopenharmony_ci			q->buffer_used      += skb->truesize;
179862306a36Sopenharmony_ci		}
179962306a36Sopenharmony_ci
180062306a36Sopenharmony_ci		/* stats */
180162306a36Sopenharmony_ci		b->packets++;
180262306a36Sopenharmony_ci		b->bytes	    += len;
180362306a36Sopenharmony_ci		b->backlogs[idx]    += len;
180462306a36Sopenharmony_ci		b->tin_backlog      += len;
180562306a36Sopenharmony_ci		sch->qstats.backlog += len;
180662306a36Sopenharmony_ci		q->avg_window_bytes += len;
180762306a36Sopenharmony_ci	}
180862306a36Sopenharmony_ci
180962306a36Sopenharmony_ci	if (q->overflow_timeout)
181062306a36Sopenharmony_ci		cake_heapify_up(q, b->overflow_idx[idx]);
181162306a36Sopenharmony_ci
181262306a36Sopenharmony_ci	/* incoming bandwidth capacity estimate */
181362306a36Sopenharmony_ci	if (q->rate_flags & CAKE_FLAG_AUTORATE_INGRESS) {
181462306a36Sopenharmony_ci		u64 packet_interval = \
181562306a36Sopenharmony_ci			ktime_to_ns(ktime_sub(now, q->last_packet_time));
181662306a36Sopenharmony_ci
181762306a36Sopenharmony_ci		if (packet_interval > NSEC_PER_SEC)
181862306a36Sopenharmony_ci			packet_interval = NSEC_PER_SEC;
181962306a36Sopenharmony_ci
182062306a36Sopenharmony_ci		/* filter out short-term bursts, eg. wifi aggregation */
182162306a36Sopenharmony_ci		q->avg_packet_interval = \
182262306a36Sopenharmony_ci			cake_ewma(q->avg_packet_interval,
182362306a36Sopenharmony_ci				  packet_interval,
182462306a36Sopenharmony_ci				  (packet_interval > q->avg_packet_interval ?
182562306a36Sopenharmony_ci					  2 : 8));
182662306a36Sopenharmony_ci
182762306a36Sopenharmony_ci		q->last_packet_time = now;
182862306a36Sopenharmony_ci
182962306a36Sopenharmony_ci		if (packet_interval > q->avg_packet_interval) {
183062306a36Sopenharmony_ci			u64 window_interval = \
183162306a36Sopenharmony_ci				ktime_to_ns(ktime_sub(now,
183262306a36Sopenharmony_ci						      q->avg_window_begin));
183362306a36Sopenharmony_ci			u64 b = q->avg_window_bytes * (u64)NSEC_PER_SEC;
183462306a36Sopenharmony_ci
183562306a36Sopenharmony_ci			b = div64_u64(b, window_interval);
183662306a36Sopenharmony_ci			q->avg_peak_bandwidth =
183762306a36Sopenharmony_ci				cake_ewma(q->avg_peak_bandwidth, b,
183862306a36Sopenharmony_ci					  b > q->avg_peak_bandwidth ? 2 : 8);
183962306a36Sopenharmony_ci			q->avg_window_bytes = 0;
184062306a36Sopenharmony_ci			q->avg_window_begin = now;
184162306a36Sopenharmony_ci
184262306a36Sopenharmony_ci			if (ktime_after(now,
184362306a36Sopenharmony_ci					ktime_add_ms(q->last_reconfig_time,
184462306a36Sopenharmony_ci						     250))) {
184562306a36Sopenharmony_ci				q->rate_bps = (q->avg_peak_bandwidth * 15) >> 4;
184662306a36Sopenharmony_ci				cake_reconfigure(sch);
184762306a36Sopenharmony_ci			}
184862306a36Sopenharmony_ci		}
184962306a36Sopenharmony_ci	} else {
185062306a36Sopenharmony_ci		q->avg_window_bytes = 0;
185162306a36Sopenharmony_ci		q->last_packet_time = now;
185262306a36Sopenharmony_ci	}
185362306a36Sopenharmony_ci
185462306a36Sopenharmony_ci	/* flowchain */
185562306a36Sopenharmony_ci	if (!flow->set || flow->set == CAKE_SET_DECAYING) {
185662306a36Sopenharmony_ci		struct cake_host *srchost = &b->hosts[flow->srchost];
185762306a36Sopenharmony_ci		struct cake_host *dsthost = &b->hosts[flow->dsthost];
185862306a36Sopenharmony_ci		u16 host_load = 1;
185962306a36Sopenharmony_ci
186062306a36Sopenharmony_ci		if (!flow->set) {
186162306a36Sopenharmony_ci			list_add_tail(&flow->flowchain, &b->new_flows);
186262306a36Sopenharmony_ci		} else {
186362306a36Sopenharmony_ci			b->decaying_flow_count--;
186462306a36Sopenharmony_ci			list_move_tail(&flow->flowchain, &b->new_flows);
186562306a36Sopenharmony_ci		}
186662306a36Sopenharmony_ci		flow->set = CAKE_SET_SPARSE;
186762306a36Sopenharmony_ci		b->sparse_flow_count++;
186862306a36Sopenharmony_ci
186962306a36Sopenharmony_ci		if (cake_dsrc(q->flow_mode))
187062306a36Sopenharmony_ci			host_load = max(host_load, srchost->srchost_bulk_flow_count);
187162306a36Sopenharmony_ci
187262306a36Sopenharmony_ci		if (cake_ddst(q->flow_mode))
187362306a36Sopenharmony_ci			host_load = max(host_load, dsthost->dsthost_bulk_flow_count);
187462306a36Sopenharmony_ci
187562306a36Sopenharmony_ci		flow->deficit = (b->flow_quantum *
187662306a36Sopenharmony_ci				 quantum_div[host_load]) >> 16;
187762306a36Sopenharmony_ci	} else if (flow->set == CAKE_SET_SPARSE_WAIT) {
187862306a36Sopenharmony_ci		struct cake_host *srchost = &b->hosts[flow->srchost];
187962306a36Sopenharmony_ci		struct cake_host *dsthost = &b->hosts[flow->dsthost];
188062306a36Sopenharmony_ci
188162306a36Sopenharmony_ci		/* this flow was empty, accounted as a sparse flow, but actually
188262306a36Sopenharmony_ci		 * in the bulk rotation.
188362306a36Sopenharmony_ci		 */
188462306a36Sopenharmony_ci		flow->set = CAKE_SET_BULK;
188562306a36Sopenharmony_ci		b->sparse_flow_count--;
188662306a36Sopenharmony_ci		b->bulk_flow_count++;
188762306a36Sopenharmony_ci
188862306a36Sopenharmony_ci		if (cake_dsrc(q->flow_mode))
188962306a36Sopenharmony_ci			srchost->srchost_bulk_flow_count++;
189062306a36Sopenharmony_ci
189162306a36Sopenharmony_ci		if (cake_ddst(q->flow_mode))
189262306a36Sopenharmony_ci			dsthost->dsthost_bulk_flow_count++;
189362306a36Sopenharmony_ci
189462306a36Sopenharmony_ci	}
189562306a36Sopenharmony_ci
189662306a36Sopenharmony_ci	if (q->buffer_used > q->buffer_max_used)
189762306a36Sopenharmony_ci		q->buffer_max_used = q->buffer_used;
189862306a36Sopenharmony_ci
189962306a36Sopenharmony_ci	if (q->buffer_used > q->buffer_limit) {
190062306a36Sopenharmony_ci		u32 dropped = 0;
190162306a36Sopenharmony_ci
190262306a36Sopenharmony_ci		while (q->buffer_used > q->buffer_limit) {
190362306a36Sopenharmony_ci			dropped++;
190462306a36Sopenharmony_ci			cake_drop(sch, to_free);
190562306a36Sopenharmony_ci		}
190662306a36Sopenharmony_ci		b->drop_overlimit += dropped;
190762306a36Sopenharmony_ci	}
190862306a36Sopenharmony_ci	return NET_XMIT_SUCCESS;
190962306a36Sopenharmony_ci}
191062306a36Sopenharmony_ci
191162306a36Sopenharmony_cistatic struct sk_buff *cake_dequeue_one(struct Qdisc *sch)
191262306a36Sopenharmony_ci{
191362306a36Sopenharmony_ci	struct cake_sched_data *q = qdisc_priv(sch);
191462306a36Sopenharmony_ci	struct cake_tin_data *b = &q->tins[q->cur_tin];
191562306a36Sopenharmony_ci	struct cake_flow *flow = &b->flows[q->cur_flow];
191662306a36Sopenharmony_ci	struct sk_buff *skb = NULL;
191762306a36Sopenharmony_ci	u32 len;
191862306a36Sopenharmony_ci
191962306a36Sopenharmony_ci	if (flow->head) {
192062306a36Sopenharmony_ci		skb = dequeue_head(flow);
192162306a36Sopenharmony_ci		len = qdisc_pkt_len(skb);
192262306a36Sopenharmony_ci		b->backlogs[q->cur_flow] -= len;
192362306a36Sopenharmony_ci		b->tin_backlog		 -= len;
192462306a36Sopenharmony_ci		sch->qstats.backlog      -= len;
192562306a36Sopenharmony_ci		q->buffer_used		 -= skb->truesize;
192662306a36Sopenharmony_ci		sch->q.qlen--;
192762306a36Sopenharmony_ci
192862306a36Sopenharmony_ci		if (q->overflow_timeout)
192962306a36Sopenharmony_ci			cake_heapify(q, b->overflow_idx[q->cur_flow]);
193062306a36Sopenharmony_ci	}
193162306a36Sopenharmony_ci	return skb;
193262306a36Sopenharmony_ci}
193362306a36Sopenharmony_ci
193462306a36Sopenharmony_ci/* Discard leftover packets from a tin no longer in use. */
193562306a36Sopenharmony_cistatic void cake_clear_tin(struct Qdisc *sch, u16 tin)
193662306a36Sopenharmony_ci{
193762306a36Sopenharmony_ci	struct cake_sched_data *q = qdisc_priv(sch);
193862306a36Sopenharmony_ci	struct sk_buff *skb;
193962306a36Sopenharmony_ci
194062306a36Sopenharmony_ci	q->cur_tin = tin;
194162306a36Sopenharmony_ci	for (q->cur_flow = 0; q->cur_flow < CAKE_QUEUES; q->cur_flow++)
194262306a36Sopenharmony_ci		while (!!(skb = cake_dequeue_one(sch)))
194362306a36Sopenharmony_ci			kfree_skb(skb);
194462306a36Sopenharmony_ci}
194562306a36Sopenharmony_ci
194662306a36Sopenharmony_cistatic struct sk_buff *cake_dequeue(struct Qdisc *sch)
194762306a36Sopenharmony_ci{
194862306a36Sopenharmony_ci	struct cake_sched_data *q = qdisc_priv(sch);
194962306a36Sopenharmony_ci	struct cake_tin_data *b = &q->tins[q->cur_tin];
195062306a36Sopenharmony_ci	struct cake_host *srchost, *dsthost;
195162306a36Sopenharmony_ci	ktime_t now = ktime_get();
195262306a36Sopenharmony_ci	struct cake_flow *flow;
195362306a36Sopenharmony_ci	struct list_head *head;
195462306a36Sopenharmony_ci	bool first_flow = true;
195562306a36Sopenharmony_ci	struct sk_buff *skb;
195662306a36Sopenharmony_ci	u16 host_load;
195762306a36Sopenharmony_ci	u64 delay;
195862306a36Sopenharmony_ci	u32 len;
195962306a36Sopenharmony_ci
196062306a36Sopenharmony_cibegin:
196162306a36Sopenharmony_ci	if (!sch->q.qlen)
196262306a36Sopenharmony_ci		return NULL;
196362306a36Sopenharmony_ci
196462306a36Sopenharmony_ci	/* global hard shaper */
196562306a36Sopenharmony_ci	if (ktime_after(q->time_next_packet, now) &&
196662306a36Sopenharmony_ci	    ktime_after(q->failsafe_next_packet, now)) {
196762306a36Sopenharmony_ci		u64 next = min(ktime_to_ns(q->time_next_packet),
196862306a36Sopenharmony_ci			       ktime_to_ns(q->failsafe_next_packet));
196962306a36Sopenharmony_ci
197062306a36Sopenharmony_ci		sch->qstats.overlimits++;
197162306a36Sopenharmony_ci		qdisc_watchdog_schedule_ns(&q->watchdog, next);
197262306a36Sopenharmony_ci		return NULL;
197362306a36Sopenharmony_ci	}
197462306a36Sopenharmony_ci
197562306a36Sopenharmony_ci	/* Choose a class to work on. */
197662306a36Sopenharmony_ci	if (!q->rate_ns) {
197762306a36Sopenharmony_ci		/* In unlimited mode, can't rely on shaper timings, just balance
197862306a36Sopenharmony_ci		 * with DRR
197962306a36Sopenharmony_ci		 */
198062306a36Sopenharmony_ci		bool wrapped = false, empty = true;
198162306a36Sopenharmony_ci
198262306a36Sopenharmony_ci		while (b->tin_deficit < 0 ||
198362306a36Sopenharmony_ci		       !(b->sparse_flow_count + b->bulk_flow_count)) {
198462306a36Sopenharmony_ci			if (b->tin_deficit <= 0)
198562306a36Sopenharmony_ci				b->tin_deficit += b->tin_quantum;
198662306a36Sopenharmony_ci			if (b->sparse_flow_count + b->bulk_flow_count)
198762306a36Sopenharmony_ci				empty = false;
198862306a36Sopenharmony_ci
198962306a36Sopenharmony_ci			q->cur_tin++;
199062306a36Sopenharmony_ci			b++;
199162306a36Sopenharmony_ci			if (q->cur_tin >= q->tin_cnt) {
199262306a36Sopenharmony_ci				q->cur_tin = 0;
199362306a36Sopenharmony_ci				b = q->tins;
199462306a36Sopenharmony_ci
199562306a36Sopenharmony_ci				if (wrapped) {
199662306a36Sopenharmony_ci					/* It's possible for q->qlen to be
199762306a36Sopenharmony_ci					 * nonzero when we actually have no
199862306a36Sopenharmony_ci					 * packets anywhere.
199962306a36Sopenharmony_ci					 */
200062306a36Sopenharmony_ci					if (empty)
200162306a36Sopenharmony_ci						return NULL;
200262306a36Sopenharmony_ci				} else {
200362306a36Sopenharmony_ci					wrapped = true;
200462306a36Sopenharmony_ci				}
200562306a36Sopenharmony_ci			}
200662306a36Sopenharmony_ci		}
200762306a36Sopenharmony_ci	} else {
200862306a36Sopenharmony_ci		/* In shaped mode, choose:
200962306a36Sopenharmony_ci		 * - Highest-priority tin with queue and meeting schedule, or
201062306a36Sopenharmony_ci		 * - The earliest-scheduled tin with queue.
201162306a36Sopenharmony_ci		 */
201262306a36Sopenharmony_ci		ktime_t best_time = KTIME_MAX;
201362306a36Sopenharmony_ci		int tin, best_tin = 0;
201462306a36Sopenharmony_ci
201562306a36Sopenharmony_ci		for (tin = 0; tin < q->tin_cnt; tin++) {
201662306a36Sopenharmony_ci			b = q->tins + tin;
201762306a36Sopenharmony_ci			if ((b->sparse_flow_count + b->bulk_flow_count) > 0) {
201862306a36Sopenharmony_ci				ktime_t time_to_pkt = \
201962306a36Sopenharmony_ci					ktime_sub(b->time_next_packet, now);
202062306a36Sopenharmony_ci
202162306a36Sopenharmony_ci				if (ktime_to_ns(time_to_pkt) <= 0 ||
202262306a36Sopenharmony_ci				    ktime_compare(time_to_pkt,
202362306a36Sopenharmony_ci						  best_time) <= 0) {
202462306a36Sopenharmony_ci					best_time = time_to_pkt;
202562306a36Sopenharmony_ci					best_tin = tin;
202662306a36Sopenharmony_ci				}
202762306a36Sopenharmony_ci			}
202862306a36Sopenharmony_ci		}
202962306a36Sopenharmony_ci
203062306a36Sopenharmony_ci		q->cur_tin = best_tin;
203162306a36Sopenharmony_ci		b = q->tins + best_tin;
203262306a36Sopenharmony_ci
203362306a36Sopenharmony_ci		/* No point in going further if no packets to deliver. */
203462306a36Sopenharmony_ci		if (unlikely(!(b->sparse_flow_count + b->bulk_flow_count)))
203562306a36Sopenharmony_ci			return NULL;
203662306a36Sopenharmony_ci	}
203762306a36Sopenharmony_ci
203862306a36Sopenharmony_ciretry:
203962306a36Sopenharmony_ci	/* service this class */
204062306a36Sopenharmony_ci	head = &b->decaying_flows;
204162306a36Sopenharmony_ci	if (!first_flow || list_empty(head)) {
204262306a36Sopenharmony_ci		head = &b->new_flows;
204362306a36Sopenharmony_ci		if (list_empty(head)) {
204462306a36Sopenharmony_ci			head = &b->old_flows;
204562306a36Sopenharmony_ci			if (unlikely(list_empty(head))) {
204662306a36Sopenharmony_ci				head = &b->decaying_flows;
204762306a36Sopenharmony_ci				if (unlikely(list_empty(head)))
204862306a36Sopenharmony_ci					goto begin;
204962306a36Sopenharmony_ci			}
205062306a36Sopenharmony_ci		}
205162306a36Sopenharmony_ci	}
205262306a36Sopenharmony_ci	flow = list_first_entry(head, struct cake_flow, flowchain);
205362306a36Sopenharmony_ci	q->cur_flow = flow - b->flows;
205462306a36Sopenharmony_ci	first_flow = false;
205562306a36Sopenharmony_ci
205662306a36Sopenharmony_ci	/* triple isolation (modified DRR++) */
205762306a36Sopenharmony_ci	srchost = &b->hosts[flow->srchost];
205862306a36Sopenharmony_ci	dsthost = &b->hosts[flow->dsthost];
205962306a36Sopenharmony_ci	host_load = 1;
206062306a36Sopenharmony_ci
206162306a36Sopenharmony_ci	/* flow isolation (DRR++) */
206262306a36Sopenharmony_ci	if (flow->deficit <= 0) {
206362306a36Sopenharmony_ci		/* Keep all flows with deficits out of the sparse and decaying
206462306a36Sopenharmony_ci		 * rotations.  No non-empty flow can go into the decaying
206562306a36Sopenharmony_ci		 * rotation, so they can't get deficits
206662306a36Sopenharmony_ci		 */
206762306a36Sopenharmony_ci		if (flow->set == CAKE_SET_SPARSE) {
206862306a36Sopenharmony_ci			if (flow->head) {
206962306a36Sopenharmony_ci				b->sparse_flow_count--;
207062306a36Sopenharmony_ci				b->bulk_flow_count++;
207162306a36Sopenharmony_ci
207262306a36Sopenharmony_ci				if (cake_dsrc(q->flow_mode))
207362306a36Sopenharmony_ci					srchost->srchost_bulk_flow_count++;
207462306a36Sopenharmony_ci
207562306a36Sopenharmony_ci				if (cake_ddst(q->flow_mode))
207662306a36Sopenharmony_ci					dsthost->dsthost_bulk_flow_count++;
207762306a36Sopenharmony_ci
207862306a36Sopenharmony_ci				flow->set = CAKE_SET_BULK;
207962306a36Sopenharmony_ci			} else {
208062306a36Sopenharmony_ci				/* we've moved it to the bulk rotation for
208162306a36Sopenharmony_ci				 * correct deficit accounting but we still want
208262306a36Sopenharmony_ci				 * to count it as a sparse flow, not a bulk one.
208362306a36Sopenharmony_ci				 */
208462306a36Sopenharmony_ci				flow->set = CAKE_SET_SPARSE_WAIT;
208562306a36Sopenharmony_ci			}
208662306a36Sopenharmony_ci		}
208762306a36Sopenharmony_ci
208862306a36Sopenharmony_ci		if (cake_dsrc(q->flow_mode))
208962306a36Sopenharmony_ci			host_load = max(host_load, srchost->srchost_bulk_flow_count);
209062306a36Sopenharmony_ci
209162306a36Sopenharmony_ci		if (cake_ddst(q->flow_mode))
209262306a36Sopenharmony_ci			host_load = max(host_load, dsthost->dsthost_bulk_flow_count);
209362306a36Sopenharmony_ci
209462306a36Sopenharmony_ci		WARN_ON(host_load > CAKE_QUEUES);
209562306a36Sopenharmony_ci
209662306a36Sopenharmony_ci		/* The get_random_u16() is a way to apply dithering to avoid
209762306a36Sopenharmony_ci		 * accumulating roundoff errors
209862306a36Sopenharmony_ci		 */
209962306a36Sopenharmony_ci		flow->deficit += (b->flow_quantum * quantum_div[host_load] +
210062306a36Sopenharmony_ci				  get_random_u16()) >> 16;
210162306a36Sopenharmony_ci		list_move_tail(&flow->flowchain, &b->old_flows);
210262306a36Sopenharmony_ci
210362306a36Sopenharmony_ci		goto retry;
210462306a36Sopenharmony_ci	}
210562306a36Sopenharmony_ci
210662306a36Sopenharmony_ci	/* Retrieve a packet via the AQM */
210762306a36Sopenharmony_ci	while (1) {
210862306a36Sopenharmony_ci		skb = cake_dequeue_one(sch);
210962306a36Sopenharmony_ci		if (!skb) {
211062306a36Sopenharmony_ci			/* this queue was actually empty */
211162306a36Sopenharmony_ci			if (cobalt_queue_empty(&flow->cvars, &b->cparams, now))
211262306a36Sopenharmony_ci				b->unresponsive_flow_count--;
211362306a36Sopenharmony_ci
211462306a36Sopenharmony_ci			if (flow->cvars.p_drop || flow->cvars.count ||
211562306a36Sopenharmony_ci			    ktime_before(now, flow->cvars.drop_next)) {
211662306a36Sopenharmony_ci				/* keep in the flowchain until the state has
211762306a36Sopenharmony_ci				 * decayed to rest
211862306a36Sopenharmony_ci				 */
211962306a36Sopenharmony_ci				list_move_tail(&flow->flowchain,
212062306a36Sopenharmony_ci					       &b->decaying_flows);
212162306a36Sopenharmony_ci				if (flow->set == CAKE_SET_BULK) {
212262306a36Sopenharmony_ci					b->bulk_flow_count--;
212362306a36Sopenharmony_ci
212462306a36Sopenharmony_ci					if (cake_dsrc(q->flow_mode))
212562306a36Sopenharmony_ci						srchost->srchost_bulk_flow_count--;
212662306a36Sopenharmony_ci
212762306a36Sopenharmony_ci					if (cake_ddst(q->flow_mode))
212862306a36Sopenharmony_ci						dsthost->dsthost_bulk_flow_count--;
212962306a36Sopenharmony_ci
213062306a36Sopenharmony_ci					b->decaying_flow_count++;
213162306a36Sopenharmony_ci				} else if (flow->set == CAKE_SET_SPARSE ||
213262306a36Sopenharmony_ci					   flow->set == CAKE_SET_SPARSE_WAIT) {
213362306a36Sopenharmony_ci					b->sparse_flow_count--;
213462306a36Sopenharmony_ci					b->decaying_flow_count++;
213562306a36Sopenharmony_ci				}
213662306a36Sopenharmony_ci				flow->set = CAKE_SET_DECAYING;
213762306a36Sopenharmony_ci			} else {
213862306a36Sopenharmony_ci				/* remove empty queue from the flowchain */
213962306a36Sopenharmony_ci				list_del_init(&flow->flowchain);
214062306a36Sopenharmony_ci				if (flow->set == CAKE_SET_SPARSE ||
214162306a36Sopenharmony_ci				    flow->set == CAKE_SET_SPARSE_WAIT)
214262306a36Sopenharmony_ci					b->sparse_flow_count--;
214362306a36Sopenharmony_ci				else if (flow->set == CAKE_SET_BULK) {
214462306a36Sopenharmony_ci					b->bulk_flow_count--;
214562306a36Sopenharmony_ci
214662306a36Sopenharmony_ci					if (cake_dsrc(q->flow_mode))
214762306a36Sopenharmony_ci						srchost->srchost_bulk_flow_count--;
214862306a36Sopenharmony_ci
214962306a36Sopenharmony_ci					if (cake_ddst(q->flow_mode))
215062306a36Sopenharmony_ci						dsthost->dsthost_bulk_flow_count--;
215162306a36Sopenharmony_ci
215262306a36Sopenharmony_ci				} else
215362306a36Sopenharmony_ci					b->decaying_flow_count--;
215462306a36Sopenharmony_ci
215562306a36Sopenharmony_ci				flow->set = CAKE_SET_NONE;
215662306a36Sopenharmony_ci			}
215762306a36Sopenharmony_ci			goto begin;
215862306a36Sopenharmony_ci		}
215962306a36Sopenharmony_ci
216062306a36Sopenharmony_ci		/* Last packet in queue may be marked, shouldn't be dropped */
216162306a36Sopenharmony_ci		if (!cobalt_should_drop(&flow->cvars, &b->cparams, now, skb,
216262306a36Sopenharmony_ci					(b->bulk_flow_count *
216362306a36Sopenharmony_ci					 !!(q->rate_flags &
216462306a36Sopenharmony_ci					    CAKE_FLAG_INGRESS))) ||
216562306a36Sopenharmony_ci		    !flow->head)
216662306a36Sopenharmony_ci			break;
216762306a36Sopenharmony_ci
216862306a36Sopenharmony_ci		/* drop this packet, get another one */
216962306a36Sopenharmony_ci		if (q->rate_flags & CAKE_FLAG_INGRESS) {
217062306a36Sopenharmony_ci			len = cake_advance_shaper(q, b, skb,
217162306a36Sopenharmony_ci						  now, true);
217262306a36Sopenharmony_ci			flow->deficit -= len;
217362306a36Sopenharmony_ci			b->tin_deficit -= len;
217462306a36Sopenharmony_ci		}
217562306a36Sopenharmony_ci		flow->dropped++;
217662306a36Sopenharmony_ci		b->tin_dropped++;
217762306a36Sopenharmony_ci		qdisc_tree_reduce_backlog(sch, 1, qdisc_pkt_len(skb));
217862306a36Sopenharmony_ci		qdisc_qstats_drop(sch);
217962306a36Sopenharmony_ci		kfree_skb(skb);
218062306a36Sopenharmony_ci		if (q->rate_flags & CAKE_FLAG_INGRESS)
218162306a36Sopenharmony_ci			goto retry;
218262306a36Sopenharmony_ci	}
218362306a36Sopenharmony_ci
218462306a36Sopenharmony_ci	b->tin_ecn_mark += !!flow->cvars.ecn_marked;
218562306a36Sopenharmony_ci	qdisc_bstats_update(sch, skb);
218662306a36Sopenharmony_ci
218762306a36Sopenharmony_ci	/* collect delay stats */
218862306a36Sopenharmony_ci	delay = ktime_to_ns(ktime_sub(now, cobalt_get_enqueue_time(skb)));
218962306a36Sopenharmony_ci	b->avge_delay = cake_ewma(b->avge_delay, delay, 8);
219062306a36Sopenharmony_ci	b->peak_delay = cake_ewma(b->peak_delay, delay,
219162306a36Sopenharmony_ci				  delay > b->peak_delay ? 2 : 8);
219262306a36Sopenharmony_ci	b->base_delay = cake_ewma(b->base_delay, delay,
219362306a36Sopenharmony_ci				  delay < b->base_delay ? 2 : 8);
219462306a36Sopenharmony_ci
219562306a36Sopenharmony_ci	len = cake_advance_shaper(q, b, skb, now, false);
219662306a36Sopenharmony_ci	flow->deficit -= len;
219762306a36Sopenharmony_ci	b->tin_deficit -= len;
219862306a36Sopenharmony_ci
219962306a36Sopenharmony_ci	if (ktime_after(q->time_next_packet, now) && sch->q.qlen) {
220062306a36Sopenharmony_ci		u64 next = min(ktime_to_ns(q->time_next_packet),
220162306a36Sopenharmony_ci			       ktime_to_ns(q->failsafe_next_packet));
220262306a36Sopenharmony_ci
220362306a36Sopenharmony_ci		qdisc_watchdog_schedule_ns(&q->watchdog, next);
220462306a36Sopenharmony_ci	} else if (!sch->q.qlen) {
220562306a36Sopenharmony_ci		int i;
220662306a36Sopenharmony_ci
220762306a36Sopenharmony_ci		for (i = 0; i < q->tin_cnt; i++) {
220862306a36Sopenharmony_ci			if (q->tins[i].decaying_flow_count) {
220962306a36Sopenharmony_ci				ktime_t next = \
221062306a36Sopenharmony_ci					ktime_add_ns(now,
221162306a36Sopenharmony_ci						     q->tins[i].cparams.target);
221262306a36Sopenharmony_ci
221362306a36Sopenharmony_ci				qdisc_watchdog_schedule_ns(&q->watchdog,
221462306a36Sopenharmony_ci							   ktime_to_ns(next));
221562306a36Sopenharmony_ci				break;
221662306a36Sopenharmony_ci			}
221762306a36Sopenharmony_ci		}
221862306a36Sopenharmony_ci	}
221962306a36Sopenharmony_ci
222062306a36Sopenharmony_ci	if (q->overflow_timeout)
222162306a36Sopenharmony_ci		q->overflow_timeout--;
222262306a36Sopenharmony_ci
222362306a36Sopenharmony_ci	return skb;
222462306a36Sopenharmony_ci}
222562306a36Sopenharmony_ci
222662306a36Sopenharmony_cistatic void cake_reset(struct Qdisc *sch)
222762306a36Sopenharmony_ci{
222862306a36Sopenharmony_ci	struct cake_sched_data *q = qdisc_priv(sch);
222962306a36Sopenharmony_ci	u32 c;
223062306a36Sopenharmony_ci
223162306a36Sopenharmony_ci	if (!q->tins)
223262306a36Sopenharmony_ci		return;
223362306a36Sopenharmony_ci
223462306a36Sopenharmony_ci	for (c = 0; c < CAKE_MAX_TINS; c++)
223562306a36Sopenharmony_ci		cake_clear_tin(sch, c);
223662306a36Sopenharmony_ci}
223762306a36Sopenharmony_ci
223862306a36Sopenharmony_cistatic const struct nla_policy cake_policy[TCA_CAKE_MAX + 1] = {
223962306a36Sopenharmony_ci	[TCA_CAKE_BASE_RATE64]   = { .type = NLA_U64 },
224062306a36Sopenharmony_ci	[TCA_CAKE_DIFFSERV_MODE] = { .type = NLA_U32 },
224162306a36Sopenharmony_ci	[TCA_CAKE_ATM]		 = { .type = NLA_U32 },
224262306a36Sopenharmony_ci	[TCA_CAKE_FLOW_MODE]     = { .type = NLA_U32 },
224362306a36Sopenharmony_ci	[TCA_CAKE_OVERHEAD]      = { .type = NLA_S32 },
224462306a36Sopenharmony_ci	[TCA_CAKE_RTT]		 = { .type = NLA_U32 },
224562306a36Sopenharmony_ci	[TCA_CAKE_TARGET]	 = { .type = NLA_U32 },
224662306a36Sopenharmony_ci	[TCA_CAKE_AUTORATE]      = { .type = NLA_U32 },
224762306a36Sopenharmony_ci	[TCA_CAKE_MEMORY]	 = { .type = NLA_U32 },
224862306a36Sopenharmony_ci	[TCA_CAKE_NAT]		 = { .type = NLA_U32 },
224962306a36Sopenharmony_ci	[TCA_CAKE_RAW]		 = { .type = NLA_U32 },
225062306a36Sopenharmony_ci	[TCA_CAKE_WASH]		 = { .type = NLA_U32 },
225162306a36Sopenharmony_ci	[TCA_CAKE_MPU]		 = { .type = NLA_U32 },
225262306a36Sopenharmony_ci	[TCA_CAKE_INGRESS]	 = { .type = NLA_U32 },
225362306a36Sopenharmony_ci	[TCA_CAKE_ACK_FILTER]	 = { .type = NLA_U32 },
225462306a36Sopenharmony_ci	[TCA_CAKE_SPLIT_GSO]	 = { .type = NLA_U32 },
225562306a36Sopenharmony_ci	[TCA_CAKE_FWMARK]	 = { .type = NLA_U32 },
225662306a36Sopenharmony_ci};
225762306a36Sopenharmony_ci
225862306a36Sopenharmony_cistatic void cake_set_rate(struct cake_tin_data *b, u64 rate, u32 mtu,
225962306a36Sopenharmony_ci			  u64 target_ns, u64 rtt_est_ns)
226062306a36Sopenharmony_ci{
226162306a36Sopenharmony_ci	/* convert byte-rate into time-per-byte
226262306a36Sopenharmony_ci	 * so it will always unwedge in reasonable time.
226362306a36Sopenharmony_ci	 */
226462306a36Sopenharmony_ci	static const u64 MIN_RATE = 64;
226562306a36Sopenharmony_ci	u32 byte_target = mtu;
226662306a36Sopenharmony_ci	u64 byte_target_ns;
226762306a36Sopenharmony_ci	u8  rate_shft = 0;
226862306a36Sopenharmony_ci	u64 rate_ns = 0;
226962306a36Sopenharmony_ci
227062306a36Sopenharmony_ci	b->flow_quantum = 1514;
227162306a36Sopenharmony_ci	if (rate) {
227262306a36Sopenharmony_ci		b->flow_quantum = max(min(rate >> 12, 1514ULL), 300ULL);
227362306a36Sopenharmony_ci		rate_shft = 34;
227462306a36Sopenharmony_ci		rate_ns = ((u64)NSEC_PER_SEC) << rate_shft;
227562306a36Sopenharmony_ci		rate_ns = div64_u64(rate_ns, max(MIN_RATE, rate));
227662306a36Sopenharmony_ci		while (!!(rate_ns >> 34)) {
227762306a36Sopenharmony_ci			rate_ns >>= 1;
227862306a36Sopenharmony_ci			rate_shft--;
227962306a36Sopenharmony_ci		}
228062306a36Sopenharmony_ci	} /* else unlimited, ie. zero delay */
228162306a36Sopenharmony_ci
228262306a36Sopenharmony_ci	b->tin_rate_bps  = rate;
228362306a36Sopenharmony_ci	b->tin_rate_ns   = rate_ns;
228462306a36Sopenharmony_ci	b->tin_rate_shft = rate_shft;
228562306a36Sopenharmony_ci
228662306a36Sopenharmony_ci	byte_target_ns = (byte_target * rate_ns) >> rate_shft;
228762306a36Sopenharmony_ci
228862306a36Sopenharmony_ci	b->cparams.target = max((byte_target_ns * 3) / 2, target_ns);
228962306a36Sopenharmony_ci	b->cparams.interval = max(rtt_est_ns +
229062306a36Sopenharmony_ci				     b->cparams.target - target_ns,
229162306a36Sopenharmony_ci				     b->cparams.target * 2);
229262306a36Sopenharmony_ci	b->cparams.mtu_time = byte_target_ns;
229362306a36Sopenharmony_ci	b->cparams.p_inc = 1 << 24; /* 1/256 */
229462306a36Sopenharmony_ci	b->cparams.p_dec = 1 << 20; /* 1/4096 */
229562306a36Sopenharmony_ci}
229662306a36Sopenharmony_ci
229762306a36Sopenharmony_cistatic int cake_config_besteffort(struct Qdisc *sch)
229862306a36Sopenharmony_ci{
229962306a36Sopenharmony_ci	struct cake_sched_data *q = qdisc_priv(sch);
230062306a36Sopenharmony_ci	struct cake_tin_data *b = &q->tins[0];
230162306a36Sopenharmony_ci	u32 mtu = psched_mtu(qdisc_dev(sch));
230262306a36Sopenharmony_ci	u64 rate = q->rate_bps;
230362306a36Sopenharmony_ci
230462306a36Sopenharmony_ci	q->tin_cnt = 1;
230562306a36Sopenharmony_ci
230662306a36Sopenharmony_ci	q->tin_index = besteffort;
230762306a36Sopenharmony_ci	q->tin_order = normal_order;
230862306a36Sopenharmony_ci
230962306a36Sopenharmony_ci	cake_set_rate(b, rate, mtu,
231062306a36Sopenharmony_ci		      us_to_ns(q->target), us_to_ns(q->interval));
231162306a36Sopenharmony_ci	b->tin_quantum = 65535;
231262306a36Sopenharmony_ci
231362306a36Sopenharmony_ci	return 0;
231462306a36Sopenharmony_ci}
231562306a36Sopenharmony_ci
231662306a36Sopenharmony_cistatic int cake_config_precedence(struct Qdisc *sch)
231762306a36Sopenharmony_ci{
231862306a36Sopenharmony_ci	/* convert high-level (user visible) parameters into internal format */
231962306a36Sopenharmony_ci	struct cake_sched_data *q = qdisc_priv(sch);
232062306a36Sopenharmony_ci	u32 mtu = psched_mtu(qdisc_dev(sch));
232162306a36Sopenharmony_ci	u64 rate = q->rate_bps;
232262306a36Sopenharmony_ci	u32 quantum = 256;
232362306a36Sopenharmony_ci	u32 i;
232462306a36Sopenharmony_ci
232562306a36Sopenharmony_ci	q->tin_cnt = 8;
232662306a36Sopenharmony_ci	q->tin_index = precedence;
232762306a36Sopenharmony_ci	q->tin_order = normal_order;
232862306a36Sopenharmony_ci
232962306a36Sopenharmony_ci	for (i = 0; i < q->tin_cnt; i++) {
233062306a36Sopenharmony_ci		struct cake_tin_data *b = &q->tins[i];
233162306a36Sopenharmony_ci
233262306a36Sopenharmony_ci		cake_set_rate(b, rate, mtu, us_to_ns(q->target),
233362306a36Sopenharmony_ci			      us_to_ns(q->interval));
233462306a36Sopenharmony_ci
233562306a36Sopenharmony_ci		b->tin_quantum = max_t(u16, 1U, quantum);
233662306a36Sopenharmony_ci
233762306a36Sopenharmony_ci		/* calculate next class's parameters */
233862306a36Sopenharmony_ci		rate  *= 7;
233962306a36Sopenharmony_ci		rate >>= 3;
234062306a36Sopenharmony_ci
234162306a36Sopenharmony_ci		quantum  *= 7;
234262306a36Sopenharmony_ci		quantum >>= 3;
234362306a36Sopenharmony_ci	}
234462306a36Sopenharmony_ci
234562306a36Sopenharmony_ci	return 0;
234662306a36Sopenharmony_ci}
234762306a36Sopenharmony_ci
234862306a36Sopenharmony_ci/*	List of known Diffserv codepoints:
234962306a36Sopenharmony_ci *
235062306a36Sopenharmony_ci *	Default Forwarding (DF/CS0) - Best Effort
235162306a36Sopenharmony_ci *	Max Throughput (TOS2)
235262306a36Sopenharmony_ci *	Min Delay (TOS4)
235362306a36Sopenharmony_ci *	LLT "La" (TOS5)
235462306a36Sopenharmony_ci *	Assured Forwarding 1 (AF1x) - x3
235562306a36Sopenharmony_ci *	Assured Forwarding 2 (AF2x) - x3
235662306a36Sopenharmony_ci *	Assured Forwarding 3 (AF3x) - x3
235762306a36Sopenharmony_ci *	Assured Forwarding 4 (AF4x) - x3
235862306a36Sopenharmony_ci *	Precedence Class 1 (CS1)
235962306a36Sopenharmony_ci *	Precedence Class 2 (CS2)
236062306a36Sopenharmony_ci *	Precedence Class 3 (CS3)
236162306a36Sopenharmony_ci *	Precedence Class 4 (CS4)
236262306a36Sopenharmony_ci *	Precedence Class 5 (CS5)
236362306a36Sopenharmony_ci *	Precedence Class 6 (CS6)
236462306a36Sopenharmony_ci *	Precedence Class 7 (CS7)
236562306a36Sopenharmony_ci *	Voice Admit (VA)
236662306a36Sopenharmony_ci *	Expedited Forwarding (EF)
236762306a36Sopenharmony_ci *	Lower Effort (LE)
236862306a36Sopenharmony_ci *
236962306a36Sopenharmony_ci *	Total 26 codepoints.
237062306a36Sopenharmony_ci */
237162306a36Sopenharmony_ci
237262306a36Sopenharmony_ci/*	List of traffic classes in RFC 4594, updated by RFC 8622:
237362306a36Sopenharmony_ci *		(roughly descending order of contended priority)
237462306a36Sopenharmony_ci *		(roughly ascending order of uncontended throughput)
237562306a36Sopenharmony_ci *
237662306a36Sopenharmony_ci *	Network Control (CS6,CS7)      - routing traffic
237762306a36Sopenharmony_ci *	Telephony (EF,VA)         - aka. VoIP streams
237862306a36Sopenharmony_ci *	Signalling (CS5)               - VoIP setup
237962306a36Sopenharmony_ci *	Multimedia Conferencing (AF4x) - aka. video calls
238062306a36Sopenharmony_ci *	Realtime Interactive (CS4)     - eg. games
238162306a36Sopenharmony_ci *	Multimedia Streaming (AF3x)    - eg. YouTube, NetFlix, Twitch
238262306a36Sopenharmony_ci *	Broadcast Video (CS3)
238362306a36Sopenharmony_ci *	Low-Latency Data (AF2x,TOS4)      - eg. database
238462306a36Sopenharmony_ci *	Ops, Admin, Management (CS2)      - eg. ssh
238562306a36Sopenharmony_ci *	Standard Service (DF & unrecognised codepoints)
238662306a36Sopenharmony_ci *	High-Throughput Data (AF1x,TOS2)  - eg. web traffic
238762306a36Sopenharmony_ci *	Low-Priority Data (LE,CS1)        - eg. BitTorrent
238862306a36Sopenharmony_ci *
238962306a36Sopenharmony_ci *	Total 12 traffic classes.
239062306a36Sopenharmony_ci */
239162306a36Sopenharmony_ci
239262306a36Sopenharmony_cistatic int cake_config_diffserv8(struct Qdisc *sch)
239362306a36Sopenharmony_ci{
239462306a36Sopenharmony_ci/*	Pruned list of traffic classes for typical applications:
239562306a36Sopenharmony_ci *
239662306a36Sopenharmony_ci *		Network Control          (CS6, CS7)
239762306a36Sopenharmony_ci *		Minimum Latency          (EF, VA, CS5, CS4)
239862306a36Sopenharmony_ci *		Interactive Shell        (CS2)
239962306a36Sopenharmony_ci *		Low Latency Transactions (AF2x, TOS4)
240062306a36Sopenharmony_ci *		Video Streaming          (AF4x, AF3x, CS3)
240162306a36Sopenharmony_ci *		Bog Standard             (DF etc.)
240262306a36Sopenharmony_ci *		High Throughput          (AF1x, TOS2, CS1)
240362306a36Sopenharmony_ci *		Background Traffic       (LE)
240462306a36Sopenharmony_ci *
240562306a36Sopenharmony_ci *		Total 8 traffic classes.
240662306a36Sopenharmony_ci */
240762306a36Sopenharmony_ci
240862306a36Sopenharmony_ci	struct cake_sched_data *q = qdisc_priv(sch);
240962306a36Sopenharmony_ci	u32 mtu = psched_mtu(qdisc_dev(sch));
241062306a36Sopenharmony_ci	u64 rate = q->rate_bps;
241162306a36Sopenharmony_ci	u32 quantum = 256;
241262306a36Sopenharmony_ci	u32 i;
241362306a36Sopenharmony_ci
241462306a36Sopenharmony_ci	q->tin_cnt = 8;
241562306a36Sopenharmony_ci
241662306a36Sopenharmony_ci	/* codepoint to class mapping */
241762306a36Sopenharmony_ci	q->tin_index = diffserv8;
241862306a36Sopenharmony_ci	q->tin_order = normal_order;
241962306a36Sopenharmony_ci
242062306a36Sopenharmony_ci	/* class characteristics */
242162306a36Sopenharmony_ci	for (i = 0; i < q->tin_cnt; i++) {
242262306a36Sopenharmony_ci		struct cake_tin_data *b = &q->tins[i];
242362306a36Sopenharmony_ci
242462306a36Sopenharmony_ci		cake_set_rate(b, rate, mtu, us_to_ns(q->target),
242562306a36Sopenharmony_ci			      us_to_ns(q->interval));
242662306a36Sopenharmony_ci
242762306a36Sopenharmony_ci		b->tin_quantum = max_t(u16, 1U, quantum);
242862306a36Sopenharmony_ci
242962306a36Sopenharmony_ci		/* calculate next class's parameters */
243062306a36Sopenharmony_ci		rate  *= 7;
243162306a36Sopenharmony_ci		rate >>= 3;
243262306a36Sopenharmony_ci
243362306a36Sopenharmony_ci		quantum  *= 7;
243462306a36Sopenharmony_ci		quantum >>= 3;
243562306a36Sopenharmony_ci	}
243662306a36Sopenharmony_ci
243762306a36Sopenharmony_ci	return 0;
243862306a36Sopenharmony_ci}
243962306a36Sopenharmony_ci
244062306a36Sopenharmony_cistatic int cake_config_diffserv4(struct Qdisc *sch)
244162306a36Sopenharmony_ci{
244262306a36Sopenharmony_ci/*  Further pruned list of traffic classes for four-class system:
244362306a36Sopenharmony_ci *
244462306a36Sopenharmony_ci *	    Latency Sensitive  (CS7, CS6, EF, VA, CS5, CS4)
244562306a36Sopenharmony_ci *	    Streaming Media    (AF4x, AF3x, CS3, AF2x, TOS4, CS2)
244662306a36Sopenharmony_ci *	    Best Effort        (DF, AF1x, TOS2, and those not specified)
244762306a36Sopenharmony_ci *	    Background Traffic (LE, CS1)
244862306a36Sopenharmony_ci *
244962306a36Sopenharmony_ci *		Total 4 traffic classes.
245062306a36Sopenharmony_ci */
245162306a36Sopenharmony_ci
245262306a36Sopenharmony_ci	struct cake_sched_data *q = qdisc_priv(sch);
245362306a36Sopenharmony_ci	u32 mtu = psched_mtu(qdisc_dev(sch));
245462306a36Sopenharmony_ci	u64 rate = q->rate_bps;
245562306a36Sopenharmony_ci	u32 quantum = 1024;
245662306a36Sopenharmony_ci
245762306a36Sopenharmony_ci	q->tin_cnt = 4;
245862306a36Sopenharmony_ci
245962306a36Sopenharmony_ci	/* codepoint to class mapping */
246062306a36Sopenharmony_ci	q->tin_index = diffserv4;
246162306a36Sopenharmony_ci	q->tin_order = bulk_order;
246262306a36Sopenharmony_ci
246362306a36Sopenharmony_ci	/* class characteristics */
246462306a36Sopenharmony_ci	cake_set_rate(&q->tins[0], rate, mtu,
246562306a36Sopenharmony_ci		      us_to_ns(q->target), us_to_ns(q->interval));
246662306a36Sopenharmony_ci	cake_set_rate(&q->tins[1], rate >> 4, mtu,
246762306a36Sopenharmony_ci		      us_to_ns(q->target), us_to_ns(q->interval));
246862306a36Sopenharmony_ci	cake_set_rate(&q->tins[2], rate >> 1, mtu,
246962306a36Sopenharmony_ci		      us_to_ns(q->target), us_to_ns(q->interval));
247062306a36Sopenharmony_ci	cake_set_rate(&q->tins[3], rate >> 2, mtu,
247162306a36Sopenharmony_ci		      us_to_ns(q->target), us_to_ns(q->interval));
247262306a36Sopenharmony_ci
247362306a36Sopenharmony_ci	/* bandwidth-sharing weights */
247462306a36Sopenharmony_ci	q->tins[0].tin_quantum = quantum;
247562306a36Sopenharmony_ci	q->tins[1].tin_quantum = quantum >> 4;
247662306a36Sopenharmony_ci	q->tins[2].tin_quantum = quantum >> 1;
247762306a36Sopenharmony_ci	q->tins[3].tin_quantum = quantum >> 2;
247862306a36Sopenharmony_ci
247962306a36Sopenharmony_ci	return 0;
248062306a36Sopenharmony_ci}
248162306a36Sopenharmony_ci
248262306a36Sopenharmony_cistatic int cake_config_diffserv3(struct Qdisc *sch)
248362306a36Sopenharmony_ci{
248462306a36Sopenharmony_ci/*  Simplified Diffserv structure with 3 tins.
248562306a36Sopenharmony_ci *		Latency Sensitive	(CS7, CS6, EF, VA, TOS4)
248662306a36Sopenharmony_ci *		Best Effort
248762306a36Sopenharmony_ci *		Low Priority		(LE, CS1)
248862306a36Sopenharmony_ci */
248962306a36Sopenharmony_ci	struct cake_sched_data *q = qdisc_priv(sch);
249062306a36Sopenharmony_ci	u32 mtu = psched_mtu(qdisc_dev(sch));
249162306a36Sopenharmony_ci	u64 rate = q->rate_bps;
249262306a36Sopenharmony_ci	u32 quantum = 1024;
249362306a36Sopenharmony_ci
249462306a36Sopenharmony_ci	q->tin_cnt = 3;
249562306a36Sopenharmony_ci
249662306a36Sopenharmony_ci	/* codepoint to class mapping */
249762306a36Sopenharmony_ci	q->tin_index = diffserv3;
249862306a36Sopenharmony_ci	q->tin_order = bulk_order;
249962306a36Sopenharmony_ci
250062306a36Sopenharmony_ci	/* class characteristics */
250162306a36Sopenharmony_ci	cake_set_rate(&q->tins[0], rate, mtu,
250262306a36Sopenharmony_ci		      us_to_ns(q->target), us_to_ns(q->interval));
250362306a36Sopenharmony_ci	cake_set_rate(&q->tins[1], rate >> 4, mtu,
250462306a36Sopenharmony_ci		      us_to_ns(q->target), us_to_ns(q->interval));
250562306a36Sopenharmony_ci	cake_set_rate(&q->tins[2], rate >> 2, mtu,
250662306a36Sopenharmony_ci		      us_to_ns(q->target), us_to_ns(q->interval));
250762306a36Sopenharmony_ci
250862306a36Sopenharmony_ci	/* bandwidth-sharing weights */
250962306a36Sopenharmony_ci	q->tins[0].tin_quantum = quantum;
251062306a36Sopenharmony_ci	q->tins[1].tin_quantum = quantum >> 4;
251162306a36Sopenharmony_ci	q->tins[2].tin_quantum = quantum >> 2;
251262306a36Sopenharmony_ci
251362306a36Sopenharmony_ci	return 0;
251462306a36Sopenharmony_ci}
251562306a36Sopenharmony_ci
251662306a36Sopenharmony_cistatic void cake_reconfigure(struct Qdisc *sch)
251762306a36Sopenharmony_ci{
251862306a36Sopenharmony_ci	struct cake_sched_data *q = qdisc_priv(sch);
251962306a36Sopenharmony_ci	int c, ft;
252062306a36Sopenharmony_ci
252162306a36Sopenharmony_ci	switch (q->tin_mode) {
252262306a36Sopenharmony_ci	case CAKE_DIFFSERV_BESTEFFORT:
252362306a36Sopenharmony_ci		ft = cake_config_besteffort(sch);
252462306a36Sopenharmony_ci		break;
252562306a36Sopenharmony_ci
252662306a36Sopenharmony_ci	case CAKE_DIFFSERV_PRECEDENCE:
252762306a36Sopenharmony_ci		ft = cake_config_precedence(sch);
252862306a36Sopenharmony_ci		break;
252962306a36Sopenharmony_ci
253062306a36Sopenharmony_ci	case CAKE_DIFFSERV_DIFFSERV8:
253162306a36Sopenharmony_ci		ft = cake_config_diffserv8(sch);
253262306a36Sopenharmony_ci		break;
253362306a36Sopenharmony_ci
253462306a36Sopenharmony_ci	case CAKE_DIFFSERV_DIFFSERV4:
253562306a36Sopenharmony_ci		ft = cake_config_diffserv4(sch);
253662306a36Sopenharmony_ci		break;
253762306a36Sopenharmony_ci
253862306a36Sopenharmony_ci	case CAKE_DIFFSERV_DIFFSERV3:
253962306a36Sopenharmony_ci	default:
254062306a36Sopenharmony_ci		ft = cake_config_diffserv3(sch);
254162306a36Sopenharmony_ci		break;
254262306a36Sopenharmony_ci	}
254362306a36Sopenharmony_ci
254462306a36Sopenharmony_ci	for (c = q->tin_cnt; c < CAKE_MAX_TINS; c++) {
254562306a36Sopenharmony_ci		cake_clear_tin(sch, c);
254662306a36Sopenharmony_ci		q->tins[c].cparams.mtu_time = q->tins[ft].cparams.mtu_time;
254762306a36Sopenharmony_ci	}
254862306a36Sopenharmony_ci
254962306a36Sopenharmony_ci	q->rate_ns   = q->tins[ft].tin_rate_ns;
255062306a36Sopenharmony_ci	q->rate_shft = q->tins[ft].tin_rate_shft;
255162306a36Sopenharmony_ci
255262306a36Sopenharmony_ci	if (q->buffer_config_limit) {
255362306a36Sopenharmony_ci		q->buffer_limit = q->buffer_config_limit;
255462306a36Sopenharmony_ci	} else if (q->rate_bps) {
255562306a36Sopenharmony_ci		u64 t = q->rate_bps * q->interval;
255662306a36Sopenharmony_ci
255762306a36Sopenharmony_ci		do_div(t, USEC_PER_SEC / 4);
255862306a36Sopenharmony_ci		q->buffer_limit = max_t(u32, t, 4U << 20);
255962306a36Sopenharmony_ci	} else {
256062306a36Sopenharmony_ci		q->buffer_limit = ~0;
256162306a36Sopenharmony_ci	}
256262306a36Sopenharmony_ci
256362306a36Sopenharmony_ci	sch->flags &= ~TCQ_F_CAN_BYPASS;
256462306a36Sopenharmony_ci
256562306a36Sopenharmony_ci	q->buffer_limit = min(q->buffer_limit,
256662306a36Sopenharmony_ci			      max(sch->limit * psched_mtu(qdisc_dev(sch)),
256762306a36Sopenharmony_ci				  q->buffer_config_limit));
256862306a36Sopenharmony_ci}
256962306a36Sopenharmony_ci
257062306a36Sopenharmony_cistatic int cake_change(struct Qdisc *sch, struct nlattr *opt,
257162306a36Sopenharmony_ci		       struct netlink_ext_ack *extack)
257262306a36Sopenharmony_ci{
257362306a36Sopenharmony_ci	struct cake_sched_data *q = qdisc_priv(sch);
257462306a36Sopenharmony_ci	struct nlattr *tb[TCA_CAKE_MAX + 1];
257562306a36Sopenharmony_ci	int err;
257662306a36Sopenharmony_ci
257762306a36Sopenharmony_ci	err = nla_parse_nested_deprecated(tb, TCA_CAKE_MAX, opt, cake_policy,
257862306a36Sopenharmony_ci					  extack);
257962306a36Sopenharmony_ci	if (err < 0)
258062306a36Sopenharmony_ci		return err;
258162306a36Sopenharmony_ci
258262306a36Sopenharmony_ci	if (tb[TCA_CAKE_NAT]) {
258362306a36Sopenharmony_ci#if IS_ENABLED(CONFIG_NF_CONNTRACK)
258462306a36Sopenharmony_ci		q->flow_mode &= ~CAKE_FLOW_NAT_FLAG;
258562306a36Sopenharmony_ci		q->flow_mode |= CAKE_FLOW_NAT_FLAG *
258662306a36Sopenharmony_ci			!!nla_get_u32(tb[TCA_CAKE_NAT]);
258762306a36Sopenharmony_ci#else
258862306a36Sopenharmony_ci		NL_SET_ERR_MSG_ATTR(extack, tb[TCA_CAKE_NAT],
258962306a36Sopenharmony_ci				    "No conntrack support in kernel");
259062306a36Sopenharmony_ci		return -EOPNOTSUPP;
259162306a36Sopenharmony_ci#endif
259262306a36Sopenharmony_ci	}
259362306a36Sopenharmony_ci
259462306a36Sopenharmony_ci	if (tb[TCA_CAKE_BASE_RATE64])
259562306a36Sopenharmony_ci		q->rate_bps = nla_get_u64(tb[TCA_CAKE_BASE_RATE64]);
259662306a36Sopenharmony_ci
259762306a36Sopenharmony_ci	if (tb[TCA_CAKE_DIFFSERV_MODE])
259862306a36Sopenharmony_ci		q->tin_mode = nla_get_u32(tb[TCA_CAKE_DIFFSERV_MODE]);
259962306a36Sopenharmony_ci
260062306a36Sopenharmony_ci	if (tb[TCA_CAKE_WASH]) {
260162306a36Sopenharmony_ci		if (!!nla_get_u32(tb[TCA_CAKE_WASH]))
260262306a36Sopenharmony_ci			q->rate_flags |= CAKE_FLAG_WASH;
260362306a36Sopenharmony_ci		else
260462306a36Sopenharmony_ci			q->rate_flags &= ~CAKE_FLAG_WASH;
260562306a36Sopenharmony_ci	}
260662306a36Sopenharmony_ci
260762306a36Sopenharmony_ci	if (tb[TCA_CAKE_FLOW_MODE])
260862306a36Sopenharmony_ci		q->flow_mode = ((q->flow_mode & CAKE_FLOW_NAT_FLAG) |
260962306a36Sopenharmony_ci				(nla_get_u32(tb[TCA_CAKE_FLOW_MODE]) &
261062306a36Sopenharmony_ci					CAKE_FLOW_MASK));
261162306a36Sopenharmony_ci
261262306a36Sopenharmony_ci	if (tb[TCA_CAKE_ATM])
261362306a36Sopenharmony_ci		q->atm_mode = nla_get_u32(tb[TCA_CAKE_ATM]);
261462306a36Sopenharmony_ci
261562306a36Sopenharmony_ci	if (tb[TCA_CAKE_OVERHEAD]) {
261662306a36Sopenharmony_ci		q->rate_overhead = nla_get_s32(tb[TCA_CAKE_OVERHEAD]);
261762306a36Sopenharmony_ci		q->rate_flags |= CAKE_FLAG_OVERHEAD;
261862306a36Sopenharmony_ci
261962306a36Sopenharmony_ci		q->max_netlen = 0;
262062306a36Sopenharmony_ci		q->max_adjlen = 0;
262162306a36Sopenharmony_ci		q->min_netlen = ~0;
262262306a36Sopenharmony_ci		q->min_adjlen = ~0;
262362306a36Sopenharmony_ci	}
262462306a36Sopenharmony_ci
262562306a36Sopenharmony_ci	if (tb[TCA_CAKE_RAW]) {
262662306a36Sopenharmony_ci		q->rate_flags &= ~CAKE_FLAG_OVERHEAD;
262762306a36Sopenharmony_ci
262862306a36Sopenharmony_ci		q->max_netlen = 0;
262962306a36Sopenharmony_ci		q->max_adjlen = 0;
263062306a36Sopenharmony_ci		q->min_netlen = ~0;
263162306a36Sopenharmony_ci		q->min_adjlen = ~0;
263262306a36Sopenharmony_ci	}
263362306a36Sopenharmony_ci
263462306a36Sopenharmony_ci	if (tb[TCA_CAKE_MPU])
263562306a36Sopenharmony_ci		q->rate_mpu = nla_get_u32(tb[TCA_CAKE_MPU]);
263662306a36Sopenharmony_ci
263762306a36Sopenharmony_ci	if (tb[TCA_CAKE_RTT]) {
263862306a36Sopenharmony_ci		q->interval = nla_get_u32(tb[TCA_CAKE_RTT]);
263962306a36Sopenharmony_ci
264062306a36Sopenharmony_ci		if (!q->interval)
264162306a36Sopenharmony_ci			q->interval = 1;
264262306a36Sopenharmony_ci	}
264362306a36Sopenharmony_ci
264462306a36Sopenharmony_ci	if (tb[TCA_CAKE_TARGET]) {
264562306a36Sopenharmony_ci		q->target = nla_get_u32(tb[TCA_CAKE_TARGET]);
264662306a36Sopenharmony_ci
264762306a36Sopenharmony_ci		if (!q->target)
264862306a36Sopenharmony_ci			q->target = 1;
264962306a36Sopenharmony_ci	}
265062306a36Sopenharmony_ci
265162306a36Sopenharmony_ci	if (tb[TCA_CAKE_AUTORATE]) {
265262306a36Sopenharmony_ci		if (!!nla_get_u32(tb[TCA_CAKE_AUTORATE]))
265362306a36Sopenharmony_ci			q->rate_flags |= CAKE_FLAG_AUTORATE_INGRESS;
265462306a36Sopenharmony_ci		else
265562306a36Sopenharmony_ci			q->rate_flags &= ~CAKE_FLAG_AUTORATE_INGRESS;
265662306a36Sopenharmony_ci	}
265762306a36Sopenharmony_ci
265862306a36Sopenharmony_ci	if (tb[TCA_CAKE_INGRESS]) {
265962306a36Sopenharmony_ci		if (!!nla_get_u32(tb[TCA_CAKE_INGRESS]))
266062306a36Sopenharmony_ci			q->rate_flags |= CAKE_FLAG_INGRESS;
266162306a36Sopenharmony_ci		else
266262306a36Sopenharmony_ci			q->rate_flags &= ~CAKE_FLAG_INGRESS;
266362306a36Sopenharmony_ci	}
266462306a36Sopenharmony_ci
266562306a36Sopenharmony_ci	if (tb[TCA_CAKE_ACK_FILTER])
266662306a36Sopenharmony_ci		q->ack_filter = nla_get_u32(tb[TCA_CAKE_ACK_FILTER]);
266762306a36Sopenharmony_ci
266862306a36Sopenharmony_ci	if (tb[TCA_CAKE_MEMORY])
266962306a36Sopenharmony_ci		q->buffer_config_limit = nla_get_u32(tb[TCA_CAKE_MEMORY]);
267062306a36Sopenharmony_ci
267162306a36Sopenharmony_ci	if (tb[TCA_CAKE_SPLIT_GSO]) {
267262306a36Sopenharmony_ci		if (!!nla_get_u32(tb[TCA_CAKE_SPLIT_GSO]))
267362306a36Sopenharmony_ci			q->rate_flags |= CAKE_FLAG_SPLIT_GSO;
267462306a36Sopenharmony_ci		else
267562306a36Sopenharmony_ci			q->rate_flags &= ~CAKE_FLAG_SPLIT_GSO;
267662306a36Sopenharmony_ci	}
267762306a36Sopenharmony_ci
267862306a36Sopenharmony_ci	if (tb[TCA_CAKE_FWMARK]) {
267962306a36Sopenharmony_ci		q->fwmark_mask = nla_get_u32(tb[TCA_CAKE_FWMARK]);
268062306a36Sopenharmony_ci		q->fwmark_shft = q->fwmark_mask ? __ffs(q->fwmark_mask) : 0;
268162306a36Sopenharmony_ci	}
268262306a36Sopenharmony_ci
268362306a36Sopenharmony_ci	if (q->tins) {
268462306a36Sopenharmony_ci		sch_tree_lock(sch);
268562306a36Sopenharmony_ci		cake_reconfigure(sch);
268662306a36Sopenharmony_ci		sch_tree_unlock(sch);
268762306a36Sopenharmony_ci	}
268862306a36Sopenharmony_ci
268962306a36Sopenharmony_ci	return 0;
269062306a36Sopenharmony_ci}
269162306a36Sopenharmony_ci
269262306a36Sopenharmony_cistatic void cake_destroy(struct Qdisc *sch)
269362306a36Sopenharmony_ci{
269462306a36Sopenharmony_ci	struct cake_sched_data *q = qdisc_priv(sch);
269562306a36Sopenharmony_ci
269662306a36Sopenharmony_ci	qdisc_watchdog_cancel(&q->watchdog);
269762306a36Sopenharmony_ci	tcf_block_put(q->block);
269862306a36Sopenharmony_ci	kvfree(q->tins);
269962306a36Sopenharmony_ci}
270062306a36Sopenharmony_ci
270162306a36Sopenharmony_cistatic int cake_init(struct Qdisc *sch, struct nlattr *opt,
270262306a36Sopenharmony_ci		     struct netlink_ext_ack *extack)
270362306a36Sopenharmony_ci{
270462306a36Sopenharmony_ci	struct cake_sched_data *q = qdisc_priv(sch);
270562306a36Sopenharmony_ci	int i, j, err;
270662306a36Sopenharmony_ci
270762306a36Sopenharmony_ci	sch->limit = 10240;
270862306a36Sopenharmony_ci	q->tin_mode = CAKE_DIFFSERV_DIFFSERV3;
270962306a36Sopenharmony_ci	q->flow_mode  = CAKE_FLOW_TRIPLE;
271062306a36Sopenharmony_ci
271162306a36Sopenharmony_ci	q->rate_bps = 0; /* unlimited by default */
271262306a36Sopenharmony_ci
271362306a36Sopenharmony_ci	q->interval = 100000; /* 100ms default */
271462306a36Sopenharmony_ci	q->target   =   5000; /* 5ms: codel RFC argues
271562306a36Sopenharmony_ci			       * for 5 to 10% of interval
271662306a36Sopenharmony_ci			       */
271762306a36Sopenharmony_ci	q->rate_flags |= CAKE_FLAG_SPLIT_GSO;
271862306a36Sopenharmony_ci	q->cur_tin = 0;
271962306a36Sopenharmony_ci	q->cur_flow  = 0;
272062306a36Sopenharmony_ci
272162306a36Sopenharmony_ci	qdisc_watchdog_init(&q->watchdog, sch);
272262306a36Sopenharmony_ci
272362306a36Sopenharmony_ci	if (opt) {
272462306a36Sopenharmony_ci		err = cake_change(sch, opt, extack);
272562306a36Sopenharmony_ci
272662306a36Sopenharmony_ci		if (err)
272762306a36Sopenharmony_ci			return err;
272862306a36Sopenharmony_ci	}
272962306a36Sopenharmony_ci
273062306a36Sopenharmony_ci	err = tcf_block_get(&q->block, &q->filter_list, sch, extack);
273162306a36Sopenharmony_ci	if (err)
273262306a36Sopenharmony_ci		return err;
273362306a36Sopenharmony_ci
273462306a36Sopenharmony_ci	quantum_div[0] = ~0;
273562306a36Sopenharmony_ci	for (i = 1; i <= CAKE_QUEUES; i++)
273662306a36Sopenharmony_ci		quantum_div[i] = 65535 / i;
273762306a36Sopenharmony_ci
273862306a36Sopenharmony_ci	q->tins = kvcalloc(CAKE_MAX_TINS, sizeof(struct cake_tin_data),
273962306a36Sopenharmony_ci			   GFP_KERNEL);
274062306a36Sopenharmony_ci	if (!q->tins)
274162306a36Sopenharmony_ci		return -ENOMEM;
274262306a36Sopenharmony_ci
274362306a36Sopenharmony_ci	for (i = 0; i < CAKE_MAX_TINS; i++) {
274462306a36Sopenharmony_ci		struct cake_tin_data *b = q->tins + i;
274562306a36Sopenharmony_ci
274662306a36Sopenharmony_ci		INIT_LIST_HEAD(&b->new_flows);
274762306a36Sopenharmony_ci		INIT_LIST_HEAD(&b->old_flows);
274862306a36Sopenharmony_ci		INIT_LIST_HEAD(&b->decaying_flows);
274962306a36Sopenharmony_ci		b->sparse_flow_count = 0;
275062306a36Sopenharmony_ci		b->bulk_flow_count = 0;
275162306a36Sopenharmony_ci		b->decaying_flow_count = 0;
275262306a36Sopenharmony_ci
275362306a36Sopenharmony_ci		for (j = 0; j < CAKE_QUEUES; j++) {
275462306a36Sopenharmony_ci			struct cake_flow *flow = b->flows + j;
275562306a36Sopenharmony_ci			u32 k = j * CAKE_MAX_TINS + i;
275662306a36Sopenharmony_ci
275762306a36Sopenharmony_ci			INIT_LIST_HEAD(&flow->flowchain);
275862306a36Sopenharmony_ci			cobalt_vars_init(&flow->cvars);
275962306a36Sopenharmony_ci
276062306a36Sopenharmony_ci			q->overflow_heap[k].t = i;
276162306a36Sopenharmony_ci			q->overflow_heap[k].b = j;
276262306a36Sopenharmony_ci			b->overflow_idx[j] = k;
276362306a36Sopenharmony_ci		}
276462306a36Sopenharmony_ci	}
276562306a36Sopenharmony_ci
276662306a36Sopenharmony_ci	cake_reconfigure(sch);
276762306a36Sopenharmony_ci	q->avg_peak_bandwidth = q->rate_bps;
276862306a36Sopenharmony_ci	q->min_netlen = ~0;
276962306a36Sopenharmony_ci	q->min_adjlen = ~0;
277062306a36Sopenharmony_ci	return 0;
277162306a36Sopenharmony_ci}
277262306a36Sopenharmony_ci
277362306a36Sopenharmony_cistatic int cake_dump(struct Qdisc *sch, struct sk_buff *skb)
277462306a36Sopenharmony_ci{
277562306a36Sopenharmony_ci	struct cake_sched_data *q = qdisc_priv(sch);
277662306a36Sopenharmony_ci	struct nlattr *opts;
277762306a36Sopenharmony_ci
277862306a36Sopenharmony_ci	opts = nla_nest_start_noflag(skb, TCA_OPTIONS);
277962306a36Sopenharmony_ci	if (!opts)
278062306a36Sopenharmony_ci		goto nla_put_failure;
278162306a36Sopenharmony_ci
278262306a36Sopenharmony_ci	if (nla_put_u64_64bit(skb, TCA_CAKE_BASE_RATE64, q->rate_bps,
278362306a36Sopenharmony_ci			      TCA_CAKE_PAD))
278462306a36Sopenharmony_ci		goto nla_put_failure;
278562306a36Sopenharmony_ci
278662306a36Sopenharmony_ci	if (nla_put_u32(skb, TCA_CAKE_FLOW_MODE,
278762306a36Sopenharmony_ci			q->flow_mode & CAKE_FLOW_MASK))
278862306a36Sopenharmony_ci		goto nla_put_failure;
278962306a36Sopenharmony_ci
279062306a36Sopenharmony_ci	if (nla_put_u32(skb, TCA_CAKE_RTT, q->interval))
279162306a36Sopenharmony_ci		goto nla_put_failure;
279262306a36Sopenharmony_ci
279362306a36Sopenharmony_ci	if (nla_put_u32(skb, TCA_CAKE_TARGET, q->target))
279462306a36Sopenharmony_ci		goto nla_put_failure;
279562306a36Sopenharmony_ci
279662306a36Sopenharmony_ci	if (nla_put_u32(skb, TCA_CAKE_MEMORY, q->buffer_config_limit))
279762306a36Sopenharmony_ci		goto nla_put_failure;
279862306a36Sopenharmony_ci
279962306a36Sopenharmony_ci	if (nla_put_u32(skb, TCA_CAKE_AUTORATE,
280062306a36Sopenharmony_ci			!!(q->rate_flags & CAKE_FLAG_AUTORATE_INGRESS)))
280162306a36Sopenharmony_ci		goto nla_put_failure;
280262306a36Sopenharmony_ci
280362306a36Sopenharmony_ci	if (nla_put_u32(skb, TCA_CAKE_INGRESS,
280462306a36Sopenharmony_ci			!!(q->rate_flags & CAKE_FLAG_INGRESS)))
280562306a36Sopenharmony_ci		goto nla_put_failure;
280662306a36Sopenharmony_ci
280762306a36Sopenharmony_ci	if (nla_put_u32(skb, TCA_CAKE_ACK_FILTER, q->ack_filter))
280862306a36Sopenharmony_ci		goto nla_put_failure;
280962306a36Sopenharmony_ci
281062306a36Sopenharmony_ci	if (nla_put_u32(skb, TCA_CAKE_NAT,
281162306a36Sopenharmony_ci			!!(q->flow_mode & CAKE_FLOW_NAT_FLAG)))
281262306a36Sopenharmony_ci		goto nla_put_failure;
281362306a36Sopenharmony_ci
281462306a36Sopenharmony_ci	if (nla_put_u32(skb, TCA_CAKE_DIFFSERV_MODE, q->tin_mode))
281562306a36Sopenharmony_ci		goto nla_put_failure;
281662306a36Sopenharmony_ci
281762306a36Sopenharmony_ci	if (nla_put_u32(skb, TCA_CAKE_WASH,
281862306a36Sopenharmony_ci			!!(q->rate_flags & CAKE_FLAG_WASH)))
281962306a36Sopenharmony_ci		goto nla_put_failure;
282062306a36Sopenharmony_ci
282162306a36Sopenharmony_ci	if (nla_put_u32(skb, TCA_CAKE_OVERHEAD, q->rate_overhead))
282262306a36Sopenharmony_ci		goto nla_put_failure;
282362306a36Sopenharmony_ci
282462306a36Sopenharmony_ci	if (!(q->rate_flags & CAKE_FLAG_OVERHEAD))
282562306a36Sopenharmony_ci		if (nla_put_u32(skb, TCA_CAKE_RAW, 0))
282662306a36Sopenharmony_ci			goto nla_put_failure;
282762306a36Sopenharmony_ci
282862306a36Sopenharmony_ci	if (nla_put_u32(skb, TCA_CAKE_ATM, q->atm_mode))
282962306a36Sopenharmony_ci		goto nla_put_failure;
283062306a36Sopenharmony_ci
283162306a36Sopenharmony_ci	if (nla_put_u32(skb, TCA_CAKE_MPU, q->rate_mpu))
283262306a36Sopenharmony_ci		goto nla_put_failure;
283362306a36Sopenharmony_ci
283462306a36Sopenharmony_ci	if (nla_put_u32(skb, TCA_CAKE_SPLIT_GSO,
283562306a36Sopenharmony_ci			!!(q->rate_flags & CAKE_FLAG_SPLIT_GSO)))
283662306a36Sopenharmony_ci		goto nla_put_failure;
283762306a36Sopenharmony_ci
283862306a36Sopenharmony_ci	if (nla_put_u32(skb, TCA_CAKE_FWMARK, q->fwmark_mask))
283962306a36Sopenharmony_ci		goto nla_put_failure;
284062306a36Sopenharmony_ci
284162306a36Sopenharmony_ci	return nla_nest_end(skb, opts);
284262306a36Sopenharmony_ci
284362306a36Sopenharmony_cinla_put_failure:
284462306a36Sopenharmony_ci	return -1;
284562306a36Sopenharmony_ci}
284662306a36Sopenharmony_ci
284762306a36Sopenharmony_cistatic int cake_dump_stats(struct Qdisc *sch, struct gnet_dump *d)
284862306a36Sopenharmony_ci{
284962306a36Sopenharmony_ci	struct nlattr *stats = nla_nest_start_noflag(d->skb, TCA_STATS_APP);
285062306a36Sopenharmony_ci	struct cake_sched_data *q = qdisc_priv(sch);
285162306a36Sopenharmony_ci	struct nlattr *tstats, *ts;
285262306a36Sopenharmony_ci	int i;
285362306a36Sopenharmony_ci
285462306a36Sopenharmony_ci	if (!stats)
285562306a36Sopenharmony_ci		return -1;
285662306a36Sopenharmony_ci
285762306a36Sopenharmony_ci#define PUT_STAT_U32(attr, data) do {				       \
285862306a36Sopenharmony_ci		if (nla_put_u32(d->skb, TCA_CAKE_STATS_ ## attr, data)) \
285962306a36Sopenharmony_ci			goto nla_put_failure;			       \
286062306a36Sopenharmony_ci	} while (0)
286162306a36Sopenharmony_ci#define PUT_STAT_U64(attr, data) do {				       \
286262306a36Sopenharmony_ci		if (nla_put_u64_64bit(d->skb, TCA_CAKE_STATS_ ## attr, \
286362306a36Sopenharmony_ci					data, TCA_CAKE_STATS_PAD)) \
286462306a36Sopenharmony_ci			goto nla_put_failure;			       \
286562306a36Sopenharmony_ci	} while (0)
286662306a36Sopenharmony_ci
286762306a36Sopenharmony_ci	PUT_STAT_U64(CAPACITY_ESTIMATE64, q->avg_peak_bandwidth);
286862306a36Sopenharmony_ci	PUT_STAT_U32(MEMORY_LIMIT, q->buffer_limit);
286962306a36Sopenharmony_ci	PUT_STAT_U32(MEMORY_USED, q->buffer_max_used);
287062306a36Sopenharmony_ci	PUT_STAT_U32(AVG_NETOFF, ((q->avg_netoff + 0x8000) >> 16));
287162306a36Sopenharmony_ci	PUT_STAT_U32(MAX_NETLEN, q->max_netlen);
287262306a36Sopenharmony_ci	PUT_STAT_U32(MAX_ADJLEN, q->max_adjlen);
287362306a36Sopenharmony_ci	PUT_STAT_U32(MIN_NETLEN, q->min_netlen);
287462306a36Sopenharmony_ci	PUT_STAT_U32(MIN_ADJLEN, q->min_adjlen);
287562306a36Sopenharmony_ci
287662306a36Sopenharmony_ci#undef PUT_STAT_U32
287762306a36Sopenharmony_ci#undef PUT_STAT_U64
287862306a36Sopenharmony_ci
287962306a36Sopenharmony_ci	tstats = nla_nest_start_noflag(d->skb, TCA_CAKE_STATS_TIN_STATS);
288062306a36Sopenharmony_ci	if (!tstats)
288162306a36Sopenharmony_ci		goto nla_put_failure;
288262306a36Sopenharmony_ci
288362306a36Sopenharmony_ci#define PUT_TSTAT_U32(attr, data) do {					\
288462306a36Sopenharmony_ci		if (nla_put_u32(d->skb, TCA_CAKE_TIN_STATS_ ## attr, data)) \
288562306a36Sopenharmony_ci			goto nla_put_failure;				\
288662306a36Sopenharmony_ci	} while (0)
288762306a36Sopenharmony_ci#define PUT_TSTAT_U64(attr, data) do {					\
288862306a36Sopenharmony_ci		if (nla_put_u64_64bit(d->skb, TCA_CAKE_TIN_STATS_ ## attr, \
288962306a36Sopenharmony_ci					data, TCA_CAKE_TIN_STATS_PAD))	\
289062306a36Sopenharmony_ci			goto nla_put_failure;				\
289162306a36Sopenharmony_ci	} while (0)
289262306a36Sopenharmony_ci
289362306a36Sopenharmony_ci	for (i = 0; i < q->tin_cnt; i++) {
289462306a36Sopenharmony_ci		struct cake_tin_data *b = &q->tins[q->tin_order[i]];
289562306a36Sopenharmony_ci
289662306a36Sopenharmony_ci		ts = nla_nest_start_noflag(d->skb, i + 1);
289762306a36Sopenharmony_ci		if (!ts)
289862306a36Sopenharmony_ci			goto nla_put_failure;
289962306a36Sopenharmony_ci
290062306a36Sopenharmony_ci		PUT_TSTAT_U64(THRESHOLD_RATE64, b->tin_rate_bps);
290162306a36Sopenharmony_ci		PUT_TSTAT_U64(SENT_BYTES64, b->bytes);
290262306a36Sopenharmony_ci		PUT_TSTAT_U32(BACKLOG_BYTES, b->tin_backlog);
290362306a36Sopenharmony_ci
290462306a36Sopenharmony_ci		PUT_TSTAT_U32(TARGET_US,
290562306a36Sopenharmony_ci			      ktime_to_us(ns_to_ktime(b->cparams.target)));
290662306a36Sopenharmony_ci		PUT_TSTAT_U32(INTERVAL_US,
290762306a36Sopenharmony_ci			      ktime_to_us(ns_to_ktime(b->cparams.interval)));
290862306a36Sopenharmony_ci
290962306a36Sopenharmony_ci		PUT_TSTAT_U32(SENT_PACKETS, b->packets);
291062306a36Sopenharmony_ci		PUT_TSTAT_U32(DROPPED_PACKETS, b->tin_dropped);
291162306a36Sopenharmony_ci		PUT_TSTAT_U32(ECN_MARKED_PACKETS, b->tin_ecn_mark);
291262306a36Sopenharmony_ci		PUT_TSTAT_U32(ACKS_DROPPED_PACKETS, b->ack_drops);
291362306a36Sopenharmony_ci
291462306a36Sopenharmony_ci		PUT_TSTAT_U32(PEAK_DELAY_US,
291562306a36Sopenharmony_ci			      ktime_to_us(ns_to_ktime(b->peak_delay)));
291662306a36Sopenharmony_ci		PUT_TSTAT_U32(AVG_DELAY_US,
291762306a36Sopenharmony_ci			      ktime_to_us(ns_to_ktime(b->avge_delay)));
291862306a36Sopenharmony_ci		PUT_TSTAT_U32(BASE_DELAY_US,
291962306a36Sopenharmony_ci			      ktime_to_us(ns_to_ktime(b->base_delay)));
292062306a36Sopenharmony_ci
292162306a36Sopenharmony_ci		PUT_TSTAT_U32(WAY_INDIRECT_HITS, b->way_hits);
292262306a36Sopenharmony_ci		PUT_TSTAT_U32(WAY_MISSES, b->way_misses);
292362306a36Sopenharmony_ci		PUT_TSTAT_U32(WAY_COLLISIONS, b->way_collisions);
292462306a36Sopenharmony_ci
292562306a36Sopenharmony_ci		PUT_TSTAT_U32(SPARSE_FLOWS, b->sparse_flow_count +
292662306a36Sopenharmony_ci					    b->decaying_flow_count);
292762306a36Sopenharmony_ci		PUT_TSTAT_U32(BULK_FLOWS, b->bulk_flow_count);
292862306a36Sopenharmony_ci		PUT_TSTAT_U32(UNRESPONSIVE_FLOWS, b->unresponsive_flow_count);
292962306a36Sopenharmony_ci		PUT_TSTAT_U32(MAX_SKBLEN, b->max_skblen);
293062306a36Sopenharmony_ci
293162306a36Sopenharmony_ci		PUT_TSTAT_U32(FLOW_QUANTUM, b->flow_quantum);
293262306a36Sopenharmony_ci		nla_nest_end(d->skb, ts);
293362306a36Sopenharmony_ci	}
293462306a36Sopenharmony_ci
293562306a36Sopenharmony_ci#undef PUT_TSTAT_U32
293662306a36Sopenharmony_ci#undef PUT_TSTAT_U64
293762306a36Sopenharmony_ci
293862306a36Sopenharmony_ci	nla_nest_end(d->skb, tstats);
293962306a36Sopenharmony_ci	return nla_nest_end(d->skb, stats);
294062306a36Sopenharmony_ci
294162306a36Sopenharmony_cinla_put_failure:
294262306a36Sopenharmony_ci	nla_nest_cancel(d->skb, stats);
294362306a36Sopenharmony_ci	return -1;
294462306a36Sopenharmony_ci}
294562306a36Sopenharmony_ci
294662306a36Sopenharmony_cistatic struct Qdisc *cake_leaf(struct Qdisc *sch, unsigned long arg)
294762306a36Sopenharmony_ci{
294862306a36Sopenharmony_ci	return NULL;
294962306a36Sopenharmony_ci}
295062306a36Sopenharmony_ci
295162306a36Sopenharmony_cistatic unsigned long cake_find(struct Qdisc *sch, u32 classid)
295262306a36Sopenharmony_ci{
295362306a36Sopenharmony_ci	return 0;
295462306a36Sopenharmony_ci}
295562306a36Sopenharmony_ci
295662306a36Sopenharmony_cistatic unsigned long cake_bind(struct Qdisc *sch, unsigned long parent,
295762306a36Sopenharmony_ci			       u32 classid)
295862306a36Sopenharmony_ci{
295962306a36Sopenharmony_ci	return 0;
296062306a36Sopenharmony_ci}
296162306a36Sopenharmony_ci
296262306a36Sopenharmony_cistatic void cake_unbind(struct Qdisc *q, unsigned long cl)
296362306a36Sopenharmony_ci{
296462306a36Sopenharmony_ci}
296562306a36Sopenharmony_ci
296662306a36Sopenharmony_cistatic struct tcf_block *cake_tcf_block(struct Qdisc *sch, unsigned long cl,
296762306a36Sopenharmony_ci					struct netlink_ext_ack *extack)
296862306a36Sopenharmony_ci{
296962306a36Sopenharmony_ci	struct cake_sched_data *q = qdisc_priv(sch);
297062306a36Sopenharmony_ci
297162306a36Sopenharmony_ci	if (cl)
297262306a36Sopenharmony_ci		return NULL;
297362306a36Sopenharmony_ci	return q->block;
297462306a36Sopenharmony_ci}
297562306a36Sopenharmony_ci
297662306a36Sopenharmony_cistatic int cake_dump_class(struct Qdisc *sch, unsigned long cl,
297762306a36Sopenharmony_ci			   struct sk_buff *skb, struct tcmsg *tcm)
297862306a36Sopenharmony_ci{
297962306a36Sopenharmony_ci	tcm->tcm_handle |= TC_H_MIN(cl);
298062306a36Sopenharmony_ci	return 0;
298162306a36Sopenharmony_ci}
298262306a36Sopenharmony_ci
298362306a36Sopenharmony_cistatic int cake_dump_class_stats(struct Qdisc *sch, unsigned long cl,
298462306a36Sopenharmony_ci				 struct gnet_dump *d)
298562306a36Sopenharmony_ci{
298662306a36Sopenharmony_ci	struct cake_sched_data *q = qdisc_priv(sch);
298762306a36Sopenharmony_ci	const struct cake_flow *flow = NULL;
298862306a36Sopenharmony_ci	struct gnet_stats_queue qs = { 0 };
298962306a36Sopenharmony_ci	struct nlattr *stats;
299062306a36Sopenharmony_ci	u32 idx = cl - 1;
299162306a36Sopenharmony_ci
299262306a36Sopenharmony_ci	if (idx < CAKE_QUEUES * q->tin_cnt) {
299362306a36Sopenharmony_ci		const struct cake_tin_data *b = \
299462306a36Sopenharmony_ci			&q->tins[q->tin_order[idx / CAKE_QUEUES]];
299562306a36Sopenharmony_ci		const struct sk_buff *skb;
299662306a36Sopenharmony_ci
299762306a36Sopenharmony_ci		flow = &b->flows[idx % CAKE_QUEUES];
299862306a36Sopenharmony_ci
299962306a36Sopenharmony_ci		if (flow->head) {
300062306a36Sopenharmony_ci			sch_tree_lock(sch);
300162306a36Sopenharmony_ci			skb = flow->head;
300262306a36Sopenharmony_ci			while (skb) {
300362306a36Sopenharmony_ci				qs.qlen++;
300462306a36Sopenharmony_ci				skb = skb->next;
300562306a36Sopenharmony_ci			}
300662306a36Sopenharmony_ci			sch_tree_unlock(sch);
300762306a36Sopenharmony_ci		}
300862306a36Sopenharmony_ci		qs.backlog = b->backlogs[idx % CAKE_QUEUES];
300962306a36Sopenharmony_ci		qs.drops = flow->dropped;
301062306a36Sopenharmony_ci	}
301162306a36Sopenharmony_ci	if (gnet_stats_copy_queue(d, NULL, &qs, qs.qlen) < 0)
301262306a36Sopenharmony_ci		return -1;
301362306a36Sopenharmony_ci	if (flow) {
301462306a36Sopenharmony_ci		ktime_t now = ktime_get();
301562306a36Sopenharmony_ci
301662306a36Sopenharmony_ci		stats = nla_nest_start_noflag(d->skb, TCA_STATS_APP);
301762306a36Sopenharmony_ci		if (!stats)
301862306a36Sopenharmony_ci			return -1;
301962306a36Sopenharmony_ci
302062306a36Sopenharmony_ci#define PUT_STAT_U32(attr, data) do {				       \
302162306a36Sopenharmony_ci		if (nla_put_u32(d->skb, TCA_CAKE_STATS_ ## attr, data)) \
302262306a36Sopenharmony_ci			goto nla_put_failure;			       \
302362306a36Sopenharmony_ci	} while (0)
302462306a36Sopenharmony_ci#define PUT_STAT_S32(attr, data) do {				       \
302562306a36Sopenharmony_ci		if (nla_put_s32(d->skb, TCA_CAKE_STATS_ ## attr, data)) \
302662306a36Sopenharmony_ci			goto nla_put_failure;			       \
302762306a36Sopenharmony_ci	} while (0)
302862306a36Sopenharmony_ci
302962306a36Sopenharmony_ci		PUT_STAT_S32(DEFICIT, flow->deficit);
303062306a36Sopenharmony_ci		PUT_STAT_U32(DROPPING, flow->cvars.dropping);
303162306a36Sopenharmony_ci		PUT_STAT_U32(COBALT_COUNT, flow->cvars.count);
303262306a36Sopenharmony_ci		PUT_STAT_U32(P_DROP, flow->cvars.p_drop);
303362306a36Sopenharmony_ci		if (flow->cvars.p_drop) {
303462306a36Sopenharmony_ci			PUT_STAT_S32(BLUE_TIMER_US,
303562306a36Sopenharmony_ci				     ktime_to_us(
303662306a36Sopenharmony_ci					     ktime_sub(now,
303762306a36Sopenharmony_ci						       flow->cvars.blue_timer)));
303862306a36Sopenharmony_ci		}
303962306a36Sopenharmony_ci		if (flow->cvars.dropping) {
304062306a36Sopenharmony_ci			PUT_STAT_S32(DROP_NEXT_US,
304162306a36Sopenharmony_ci				     ktime_to_us(
304262306a36Sopenharmony_ci					     ktime_sub(now,
304362306a36Sopenharmony_ci						       flow->cvars.drop_next)));
304462306a36Sopenharmony_ci		}
304562306a36Sopenharmony_ci
304662306a36Sopenharmony_ci		if (nla_nest_end(d->skb, stats) < 0)
304762306a36Sopenharmony_ci			return -1;
304862306a36Sopenharmony_ci	}
304962306a36Sopenharmony_ci
305062306a36Sopenharmony_ci	return 0;
305162306a36Sopenharmony_ci
305262306a36Sopenharmony_cinla_put_failure:
305362306a36Sopenharmony_ci	nla_nest_cancel(d->skb, stats);
305462306a36Sopenharmony_ci	return -1;
305562306a36Sopenharmony_ci}
305662306a36Sopenharmony_ci
305762306a36Sopenharmony_cistatic void cake_walk(struct Qdisc *sch, struct qdisc_walker *arg)
305862306a36Sopenharmony_ci{
305962306a36Sopenharmony_ci	struct cake_sched_data *q = qdisc_priv(sch);
306062306a36Sopenharmony_ci	unsigned int i, j;
306162306a36Sopenharmony_ci
306262306a36Sopenharmony_ci	if (arg->stop)
306362306a36Sopenharmony_ci		return;
306462306a36Sopenharmony_ci
306562306a36Sopenharmony_ci	for (i = 0; i < q->tin_cnt; i++) {
306662306a36Sopenharmony_ci		struct cake_tin_data *b = &q->tins[q->tin_order[i]];
306762306a36Sopenharmony_ci
306862306a36Sopenharmony_ci		for (j = 0; j < CAKE_QUEUES; j++) {
306962306a36Sopenharmony_ci			if (list_empty(&b->flows[j].flowchain)) {
307062306a36Sopenharmony_ci				arg->count++;
307162306a36Sopenharmony_ci				continue;
307262306a36Sopenharmony_ci			}
307362306a36Sopenharmony_ci			if (!tc_qdisc_stats_dump(sch, i * CAKE_QUEUES + j + 1,
307462306a36Sopenharmony_ci						 arg))
307562306a36Sopenharmony_ci				break;
307662306a36Sopenharmony_ci		}
307762306a36Sopenharmony_ci	}
307862306a36Sopenharmony_ci}
307962306a36Sopenharmony_ci
308062306a36Sopenharmony_cistatic const struct Qdisc_class_ops cake_class_ops = {
308162306a36Sopenharmony_ci	.leaf		=	cake_leaf,
308262306a36Sopenharmony_ci	.find		=	cake_find,
308362306a36Sopenharmony_ci	.tcf_block	=	cake_tcf_block,
308462306a36Sopenharmony_ci	.bind_tcf	=	cake_bind,
308562306a36Sopenharmony_ci	.unbind_tcf	=	cake_unbind,
308662306a36Sopenharmony_ci	.dump		=	cake_dump_class,
308762306a36Sopenharmony_ci	.dump_stats	=	cake_dump_class_stats,
308862306a36Sopenharmony_ci	.walk		=	cake_walk,
308962306a36Sopenharmony_ci};
309062306a36Sopenharmony_ci
309162306a36Sopenharmony_cistatic struct Qdisc_ops cake_qdisc_ops __read_mostly = {
309262306a36Sopenharmony_ci	.cl_ops		=	&cake_class_ops,
309362306a36Sopenharmony_ci	.id		=	"cake",
309462306a36Sopenharmony_ci	.priv_size	=	sizeof(struct cake_sched_data),
309562306a36Sopenharmony_ci	.enqueue	=	cake_enqueue,
309662306a36Sopenharmony_ci	.dequeue	=	cake_dequeue,
309762306a36Sopenharmony_ci	.peek		=	qdisc_peek_dequeued,
309862306a36Sopenharmony_ci	.init		=	cake_init,
309962306a36Sopenharmony_ci	.reset		=	cake_reset,
310062306a36Sopenharmony_ci	.destroy	=	cake_destroy,
310162306a36Sopenharmony_ci	.change		=	cake_change,
310262306a36Sopenharmony_ci	.dump		=	cake_dump,
310362306a36Sopenharmony_ci	.dump_stats	=	cake_dump_stats,
310462306a36Sopenharmony_ci	.owner		=	THIS_MODULE,
310562306a36Sopenharmony_ci};
310662306a36Sopenharmony_ci
310762306a36Sopenharmony_cistatic int __init cake_module_init(void)
310862306a36Sopenharmony_ci{
310962306a36Sopenharmony_ci	return register_qdisc(&cake_qdisc_ops);
311062306a36Sopenharmony_ci}
311162306a36Sopenharmony_ci
311262306a36Sopenharmony_cistatic void __exit cake_module_exit(void)
311362306a36Sopenharmony_ci{
311462306a36Sopenharmony_ci	unregister_qdisc(&cake_qdisc_ops);
311562306a36Sopenharmony_ci}
311662306a36Sopenharmony_ci
311762306a36Sopenharmony_cimodule_init(cake_module_init)
311862306a36Sopenharmony_cimodule_exit(cake_module_exit)
311962306a36Sopenharmony_ciMODULE_AUTHOR("Jonathan Morton");
312062306a36Sopenharmony_ciMODULE_LICENSE("Dual BSD/GPL");
312162306a36Sopenharmony_ciMODULE_DESCRIPTION("The CAKE shaper.");
3122