162306a36Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0-only
262306a36Sopenharmony_ci/*
362306a36Sopenharmony_ci * net/sched/sch_mq.c		Classful multiqueue dummy scheduler
462306a36Sopenharmony_ci *
562306a36Sopenharmony_ci * Copyright (c) 2009 Patrick McHardy <kaber@trash.net>
662306a36Sopenharmony_ci */
762306a36Sopenharmony_ci
862306a36Sopenharmony_ci#include <linux/types.h>
962306a36Sopenharmony_ci#include <linux/slab.h>
1062306a36Sopenharmony_ci#include <linux/kernel.h>
1162306a36Sopenharmony_ci#include <linux/export.h>
1262306a36Sopenharmony_ci#include <linux/string.h>
1362306a36Sopenharmony_ci#include <linux/errno.h>
1462306a36Sopenharmony_ci#include <linux/skbuff.h>
1562306a36Sopenharmony_ci#include <net/netlink.h>
1662306a36Sopenharmony_ci#include <net/pkt_cls.h>
1762306a36Sopenharmony_ci#include <net/pkt_sched.h>
1862306a36Sopenharmony_ci#include <net/sch_generic.h>
1962306a36Sopenharmony_ci
/*
 * Private data of an mq root qdisc.
 *
 * @qdiscs: array with one child qdisc pointer per device TX queue.  It is
 *          allocated by mq_init(), handed over and freed by mq_attach()
 *          (which then resets the pointer to NULL), and otherwise released
 *          by mq_destroy().
 */
struct mq_sched {
	struct Qdisc **qdiscs;
};
2362306a36Sopenharmony_ci
2462306a36Sopenharmony_cistatic int mq_offload(struct Qdisc *sch, enum tc_mq_command cmd)
2562306a36Sopenharmony_ci{
2662306a36Sopenharmony_ci	struct net_device *dev = qdisc_dev(sch);
2762306a36Sopenharmony_ci	struct tc_mq_qopt_offload opt = {
2862306a36Sopenharmony_ci		.command = cmd,
2962306a36Sopenharmony_ci		.handle = sch->handle,
3062306a36Sopenharmony_ci	};
3162306a36Sopenharmony_ci
3262306a36Sopenharmony_ci	if (!tc_can_offload(dev) || !dev->netdev_ops->ndo_setup_tc)
3362306a36Sopenharmony_ci		return -EOPNOTSUPP;
3462306a36Sopenharmony_ci
3562306a36Sopenharmony_ci	return dev->netdev_ops->ndo_setup_tc(dev, TC_SETUP_QDISC_MQ, &opt);
3662306a36Sopenharmony_ci}
3762306a36Sopenharmony_ci
3862306a36Sopenharmony_cistatic int mq_offload_stats(struct Qdisc *sch)
3962306a36Sopenharmony_ci{
4062306a36Sopenharmony_ci	struct tc_mq_qopt_offload opt = {
4162306a36Sopenharmony_ci		.command = TC_MQ_STATS,
4262306a36Sopenharmony_ci		.handle = sch->handle,
4362306a36Sopenharmony_ci		.stats = {
4462306a36Sopenharmony_ci			.bstats = &sch->bstats,
4562306a36Sopenharmony_ci			.qstats = &sch->qstats,
4662306a36Sopenharmony_ci		},
4762306a36Sopenharmony_ci	};
4862306a36Sopenharmony_ci
4962306a36Sopenharmony_ci	return qdisc_offload_dump_helper(sch, TC_SETUP_QDISC_MQ, &opt);
5062306a36Sopenharmony_ci}
5162306a36Sopenharmony_ci
5262306a36Sopenharmony_cistatic void mq_destroy(struct Qdisc *sch)
5362306a36Sopenharmony_ci{
5462306a36Sopenharmony_ci	struct net_device *dev = qdisc_dev(sch);
5562306a36Sopenharmony_ci	struct mq_sched *priv = qdisc_priv(sch);
5662306a36Sopenharmony_ci	unsigned int ntx;
5762306a36Sopenharmony_ci
5862306a36Sopenharmony_ci	mq_offload(sch, TC_MQ_DESTROY);
5962306a36Sopenharmony_ci
6062306a36Sopenharmony_ci	if (!priv->qdiscs)
6162306a36Sopenharmony_ci		return;
6262306a36Sopenharmony_ci	for (ntx = 0; ntx < dev->num_tx_queues && priv->qdiscs[ntx]; ntx++)
6362306a36Sopenharmony_ci		qdisc_put(priv->qdiscs[ntx]);
6462306a36Sopenharmony_ci	kfree(priv->qdiscs);
6562306a36Sopenharmony_ci}
6662306a36Sopenharmony_ci
6762306a36Sopenharmony_cistatic int mq_init(struct Qdisc *sch, struct nlattr *opt,
6862306a36Sopenharmony_ci		   struct netlink_ext_ack *extack)
6962306a36Sopenharmony_ci{
7062306a36Sopenharmony_ci	struct net_device *dev = qdisc_dev(sch);
7162306a36Sopenharmony_ci	struct mq_sched *priv = qdisc_priv(sch);
7262306a36Sopenharmony_ci	struct netdev_queue *dev_queue;
7362306a36Sopenharmony_ci	struct Qdisc *qdisc;
7462306a36Sopenharmony_ci	unsigned int ntx;
7562306a36Sopenharmony_ci
7662306a36Sopenharmony_ci	if (sch->parent != TC_H_ROOT)
7762306a36Sopenharmony_ci		return -EOPNOTSUPP;
7862306a36Sopenharmony_ci
7962306a36Sopenharmony_ci	if (!netif_is_multiqueue(dev))
8062306a36Sopenharmony_ci		return -EOPNOTSUPP;
8162306a36Sopenharmony_ci
8262306a36Sopenharmony_ci	/* pre-allocate qdiscs, attachment can't fail */
8362306a36Sopenharmony_ci	priv->qdiscs = kcalloc(dev->num_tx_queues, sizeof(priv->qdiscs[0]),
8462306a36Sopenharmony_ci			       GFP_KERNEL);
8562306a36Sopenharmony_ci	if (!priv->qdiscs)
8662306a36Sopenharmony_ci		return -ENOMEM;
8762306a36Sopenharmony_ci
8862306a36Sopenharmony_ci	for (ntx = 0; ntx < dev->num_tx_queues; ntx++) {
8962306a36Sopenharmony_ci		dev_queue = netdev_get_tx_queue(dev, ntx);
9062306a36Sopenharmony_ci		qdisc = qdisc_create_dflt(dev_queue, get_default_qdisc_ops(dev, ntx),
9162306a36Sopenharmony_ci					  TC_H_MAKE(TC_H_MAJ(sch->handle),
9262306a36Sopenharmony_ci						    TC_H_MIN(ntx + 1)),
9362306a36Sopenharmony_ci					  extack);
9462306a36Sopenharmony_ci		if (!qdisc)
9562306a36Sopenharmony_ci			return -ENOMEM;
9662306a36Sopenharmony_ci		priv->qdiscs[ntx] = qdisc;
9762306a36Sopenharmony_ci		qdisc->flags |= TCQ_F_ONETXQUEUE | TCQ_F_NOPARENT;
9862306a36Sopenharmony_ci	}
9962306a36Sopenharmony_ci
10062306a36Sopenharmony_ci	sch->flags |= TCQ_F_MQROOT;
10162306a36Sopenharmony_ci
10262306a36Sopenharmony_ci	mq_offload(sch, TC_MQ_CREATE);
10362306a36Sopenharmony_ci	return 0;
10462306a36Sopenharmony_ci}
10562306a36Sopenharmony_ci
10662306a36Sopenharmony_cistatic void mq_attach(struct Qdisc *sch)
10762306a36Sopenharmony_ci{
10862306a36Sopenharmony_ci	struct net_device *dev = qdisc_dev(sch);
10962306a36Sopenharmony_ci	struct mq_sched *priv = qdisc_priv(sch);
11062306a36Sopenharmony_ci	struct Qdisc *qdisc, *old;
11162306a36Sopenharmony_ci	unsigned int ntx;
11262306a36Sopenharmony_ci
11362306a36Sopenharmony_ci	for (ntx = 0; ntx < dev->num_tx_queues; ntx++) {
11462306a36Sopenharmony_ci		qdisc = priv->qdiscs[ntx];
11562306a36Sopenharmony_ci		old = dev_graft_qdisc(qdisc->dev_queue, qdisc);
11662306a36Sopenharmony_ci		if (old)
11762306a36Sopenharmony_ci			qdisc_put(old);
11862306a36Sopenharmony_ci#ifdef CONFIG_NET_SCHED
11962306a36Sopenharmony_ci		if (ntx < dev->real_num_tx_queues)
12062306a36Sopenharmony_ci			qdisc_hash_add(qdisc, false);
12162306a36Sopenharmony_ci#endif
12262306a36Sopenharmony_ci
12362306a36Sopenharmony_ci	}
12462306a36Sopenharmony_ci	kfree(priv->qdiscs);
12562306a36Sopenharmony_ci	priv->qdiscs = NULL;
12662306a36Sopenharmony_ci}
12762306a36Sopenharmony_ci
12862306a36Sopenharmony_cistatic int mq_dump(struct Qdisc *sch, struct sk_buff *skb)
12962306a36Sopenharmony_ci{
13062306a36Sopenharmony_ci	struct net_device *dev = qdisc_dev(sch);
13162306a36Sopenharmony_ci	struct Qdisc *qdisc;
13262306a36Sopenharmony_ci	unsigned int ntx;
13362306a36Sopenharmony_ci
13462306a36Sopenharmony_ci	sch->q.qlen = 0;
13562306a36Sopenharmony_ci	gnet_stats_basic_sync_init(&sch->bstats);
13662306a36Sopenharmony_ci	memset(&sch->qstats, 0, sizeof(sch->qstats));
13762306a36Sopenharmony_ci
13862306a36Sopenharmony_ci	/* MQ supports lockless qdiscs. However, statistics accounting needs
13962306a36Sopenharmony_ci	 * to account for all, none, or a mix of locked and unlocked child
14062306a36Sopenharmony_ci	 * qdiscs. Percpu stats are added to counters in-band and locking
14162306a36Sopenharmony_ci	 * qdisc totals are added at end.
14262306a36Sopenharmony_ci	 */
14362306a36Sopenharmony_ci	for (ntx = 0; ntx < dev->num_tx_queues; ntx++) {
14462306a36Sopenharmony_ci		qdisc = rtnl_dereference(netdev_get_tx_queue(dev, ntx)->qdisc_sleeping);
14562306a36Sopenharmony_ci		spin_lock_bh(qdisc_lock(qdisc));
14662306a36Sopenharmony_ci
14762306a36Sopenharmony_ci		gnet_stats_add_basic(&sch->bstats, qdisc->cpu_bstats,
14862306a36Sopenharmony_ci				     &qdisc->bstats, false);
14962306a36Sopenharmony_ci		gnet_stats_add_queue(&sch->qstats, qdisc->cpu_qstats,
15062306a36Sopenharmony_ci				     &qdisc->qstats);
15162306a36Sopenharmony_ci		sch->q.qlen += qdisc_qlen(qdisc);
15262306a36Sopenharmony_ci
15362306a36Sopenharmony_ci		spin_unlock_bh(qdisc_lock(qdisc));
15462306a36Sopenharmony_ci	}
15562306a36Sopenharmony_ci
15662306a36Sopenharmony_ci	return mq_offload_stats(sch);
15762306a36Sopenharmony_ci}
15862306a36Sopenharmony_ci
15962306a36Sopenharmony_cistatic struct netdev_queue *mq_queue_get(struct Qdisc *sch, unsigned long cl)
16062306a36Sopenharmony_ci{
16162306a36Sopenharmony_ci	struct net_device *dev = qdisc_dev(sch);
16262306a36Sopenharmony_ci	unsigned long ntx = cl - 1;
16362306a36Sopenharmony_ci
16462306a36Sopenharmony_ci	if (ntx >= dev->num_tx_queues)
16562306a36Sopenharmony_ci		return NULL;
16662306a36Sopenharmony_ci	return netdev_get_tx_queue(dev, ntx);
16762306a36Sopenharmony_ci}
16862306a36Sopenharmony_ci
16962306a36Sopenharmony_cistatic struct netdev_queue *mq_select_queue(struct Qdisc *sch,
17062306a36Sopenharmony_ci					    struct tcmsg *tcm)
17162306a36Sopenharmony_ci{
17262306a36Sopenharmony_ci	return mq_queue_get(sch, TC_H_MIN(tcm->tcm_parent));
17362306a36Sopenharmony_ci}
17462306a36Sopenharmony_ci
17562306a36Sopenharmony_cistatic int mq_graft(struct Qdisc *sch, unsigned long cl, struct Qdisc *new,
17662306a36Sopenharmony_ci		    struct Qdisc **old, struct netlink_ext_ack *extack)
17762306a36Sopenharmony_ci{
17862306a36Sopenharmony_ci	struct netdev_queue *dev_queue = mq_queue_get(sch, cl);
17962306a36Sopenharmony_ci	struct tc_mq_qopt_offload graft_offload;
18062306a36Sopenharmony_ci	struct net_device *dev = qdisc_dev(sch);
18162306a36Sopenharmony_ci
18262306a36Sopenharmony_ci	if (dev->flags & IFF_UP)
18362306a36Sopenharmony_ci		dev_deactivate(dev);
18462306a36Sopenharmony_ci
18562306a36Sopenharmony_ci	*old = dev_graft_qdisc(dev_queue, new);
18662306a36Sopenharmony_ci	if (new)
18762306a36Sopenharmony_ci		new->flags |= TCQ_F_ONETXQUEUE | TCQ_F_NOPARENT;
18862306a36Sopenharmony_ci	if (dev->flags & IFF_UP)
18962306a36Sopenharmony_ci		dev_activate(dev);
19062306a36Sopenharmony_ci
19162306a36Sopenharmony_ci	graft_offload.handle = sch->handle;
19262306a36Sopenharmony_ci	graft_offload.graft_params.queue = cl - 1;
19362306a36Sopenharmony_ci	graft_offload.graft_params.child_handle = new ? new->handle : 0;
19462306a36Sopenharmony_ci	graft_offload.command = TC_MQ_GRAFT;
19562306a36Sopenharmony_ci
19662306a36Sopenharmony_ci	qdisc_offload_graft_helper(qdisc_dev(sch), sch, new, *old,
19762306a36Sopenharmony_ci				   TC_SETUP_QDISC_MQ, &graft_offload, extack);
19862306a36Sopenharmony_ci	return 0;
19962306a36Sopenharmony_ci}
20062306a36Sopenharmony_ci
20162306a36Sopenharmony_cistatic struct Qdisc *mq_leaf(struct Qdisc *sch, unsigned long cl)
20262306a36Sopenharmony_ci{
20362306a36Sopenharmony_ci	struct netdev_queue *dev_queue = mq_queue_get(sch, cl);
20462306a36Sopenharmony_ci
20562306a36Sopenharmony_ci	return rtnl_dereference(dev_queue->qdisc_sleeping);
20662306a36Sopenharmony_ci}
20762306a36Sopenharmony_ci
20862306a36Sopenharmony_cistatic unsigned long mq_find(struct Qdisc *sch, u32 classid)
20962306a36Sopenharmony_ci{
21062306a36Sopenharmony_ci	unsigned int ntx = TC_H_MIN(classid);
21162306a36Sopenharmony_ci
21262306a36Sopenharmony_ci	if (!mq_queue_get(sch, ntx))
21362306a36Sopenharmony_ci		return 0;
21462306a36Sopenharmony_ci	return ntx;
21562306a36Sopenharmony_ci}
21662306a36Sopenharmony_ci
21762306a36Sopenharmony_cistatic int mq_dump_class(struct Qdisc *sch, unsigned long cl,
21862306a36Sopenharmony_ci			 struct sk_buff *skb, struct tcmsg *tcm)
21962306a36Sopenharmony_ci{
22062306a36Sopenharmony_ci	struct netdev_queue *dev_queue = mq_queue_get(sch, cl);
22162306a36Sopenharmony_ci
22262306a36Sopenharmony_ci	tcm->tcm_parent = TC_H_ROOT;
22362306a36Sopenharmony_ci	tcm->tcm_handle |= TC_H_MIN(cl);
22462306a36Sopenharmony_ci	tcm->tcm_info = rtnl_dereference(dev_queue->qdisc_sleeping)->handle;
22562306a36Sopenharmony_ci	return 0;
22662306a36Sopenharmony_ci}
22762306a36Sopenharmony_ci
22862306a36Sopenharmony_cistatic int mq_dump_class_stats(struct Qdisc *sch, unsigned long cl,
22962306a36Sopenharmony_ci			       struct gnet_dump *d)
23062306a36Sopenharmony_ci{
23162306a36Sopenharmony_ci	struct netdev_queue *dev_queue = mq_queue_get(sch, cl);
23262306a36Sopenharmony_ci
23362306a36Sopenharmony_ci	sch = rtnl_dereference(dev_queue->qdisc_sleeping);
23462306a36Sopenharmony_ci	if (gnet_stats_copy_basic(d, sch->cpu_bstats, &sch->bstats, true) < 0 ||
23562306a36Sopenharmony_ci	    qdisc_qstats_copy(d, sch) < 0)
23662306a36Sopenharmony_ci		return -1;
23762306a36Sopenharmony_ci	return 0;
23862306a36Sopenharmony_ci}
23962306a36Sopenharmony_ci
24062306a36Sopenharmony_cistatic void mq_walk(struct Qdisc *sch, struct qdisc_walker *arg)
24162306a36Sopenharmony_ci{
24262306a36Sopenharmony_ci	struct net_device *dev = qdisc_dev(sch);
24362306a36Sopenharmony_ci	unsigned int ntx;
24462306a36Sopenharmony_ci
24562306a36Sopenharmony_ci	if (arg->stop)
24662306a36Sopenharmony_ci		return;
24762306a36Sopenharmony_ci
24862306a36Sopenharmony_ci	arg->count = arg->skip;
24962306a36Sopenharmony_ci	for (ntx = arg->skip; ntx < dev->num_tx_queues; ntx++) {
25062306a36Sopenharmony_ci		if (!tc_qdisc_stats_dump(sch, ntx + 1, arg))
25162306a36Sopenharmony_ci			break;
25262306a36Sopenharmony_ci	}
25362306a36Sopenharmony_ci}
25462306a36Sopenharmony_ci
25562306a36Sopenharmony_cistatic const struct Qdisc_class_ops mq_class_ops = {
25662306a36Sopenharmony_ci	.select_queue	= mq_select_queue,
25762306a36Sopenharmony_ci	.graft		= mq_graft,
25862306a36Sopenharmony_ci	.leaf		= mq_leaf,
25962306a36Sopenharmony_ci	.find		= mq_find,
26062306a36Sopenharmony_ci	.walk		= mq_walk,
26162306a36Sopenharmony_ci	.dump		= mq_dump_class,
26262306a36Sopenharmony_ci	.dump_stats	= mq_dump_class_stats,
26362306a36Sopenharmony_ci};
26462306a36Sopenharmony_ci
26562306a36Sopenharmony_cistruct Qdisc_ops mq_qdisc_ops __read_mostly = {
26662306a36Sopenharmony_ci	.cl_ops		= &mq_class_ops,
26762306a36Sopenharmony_ci	.id		= "mq",
26862306a36Sopenharmony_ci	.priv_size	= sizeof(struct mq_sched),
26962306a36Sopenharmony_ci	.init		= mq_init,
27062306a36Sopenharmony_ci	.destroy	= mq_destroy,
27162306a36Sopenharmony_ci	.attach		= mq_attach,
27262306a36Sopenharmony_ci	.change_real_num_tx = mq_change_real_num_tx,
27362306a36Sopenharmony_ci	.dump		= mq_dump,
27462306a36Sopenharmony_ci	.owner		= THIS_MODULE,
27562306a36Sopenharmony_ci};
276