xref: /openbmc/linux/net/sched/sch_mqprio.c (revision 4e8b86c062695454df0b76f3fee4fab8dc4bb716)
1b8970f0bSJohn Fastabend /*
2b8970f0bSJohn Fastabend  * net/sched/sch_mqprio.c
3b8970f0bSJohn Fastabend  *
4b8970f0bSJohn Fastabend  * Copyright (c) 2010 John Fastabend <john.r.fastabend@intel.com>
5b8970f0bSJohn Fastabend  *
6b8970f0bSJohn Fastabend  * This program is free software; you can redistribute it and/or
7b8970f0bSJohn Fastabend  * modify it under the terms of the GNU General Public License
8b8970f0bSJohn Fastabend  * version 2 as published by the Free Software Foundation.
9b8970f0bSJohn Fastabend  */
10b8970f0bSJohn Fastabend 
11b8970f0bSJohn Fastabend #include <linux/types.h>
12b8970f0bSJohn Fastabend #include <linux/slab.h>
13b8970f0bSJohn Fastabend #include <linux/kernel.h>
14b8970f0bSJohn Fastabend #include <linux/string.h>
15b8970f0bSJohn Fastabend #include <linux/errno.h>
16b8970f0bSJohn Fastabend #include <linux/skbuff.h>
173a9a231dSPaul Gortmaker #include <linux/module.h>
18b8970f0bSJohn Fastabend #include <net/netlink.h>
19b8970f0bSJohn Fastabend #include <net/pkt_sched.h>
20b8970f0bSJohn Fastabend #include <net/sch_generic.h>
21*4e8b86c0SAmritha Nambiar #include <net/pkt_cls.h>
22b8970f0bSJohn Fastabend 
23b8970f0bSJohn Fastabend struct mqprio_sched {
24b8970f0bSJohn Fastabend 	struct Qdisc		**qdiscs;
25*4e8b86c0SAmritha Nambiar 	u16 mode;
26*4e8b86c0SAmritha Nambiar 	u16 shaper;
272026fecfSAlexander Duyck 	int hw_offload;
28*4e8b86c0SAmritha Nambiar 	u32 flags;
29*4e8b86c0SAmritha Nambiar 	u64 min_rate[TC_QOPT_MAX_QUEUE];
30*4e8b86c0SAmritha Nambiar 	u64 max_rate[TC_QOPT_MAX_QUEUE];
31b8970f0bSJohn Fastabend };
32b8970f0bSJohn Fastabend 
33b8970f0bSJohn Fastabend static void mqprio_destroy(struct Qdisc *sch)
34b8970f0bSJohn Fastabend {
35b8970f0bSJohn Fastabend 	struct net_device *dev = qdisc_dev(sch);
36b8970f0bSJohn Fastabend 	struct mqprio_sched *priv = qdisc_priv(sch);
37b8970f0bSJohn Fastabend 	unsigned int ntx;
38b8970f0bSJohn Fastabend 
39ac7100baSBen Hutchings 	if (priv->qdiscs) {
40ac7100baSBen Hutchings 		for (ntx = 0;
41ac7100baSBen Hutchings 		     ntx < dev->num_tx_queues && priv->qdiscs[ntx];
42ac7100baSBen Hutchings 		     ntx++)
43b8970f0bSJohn Fastabend 			qdisc_destroy(priv->qdiscs[ntx]);
44ac7100baSBen Hutchings 		kfree(priv->qdiscs);
45ac7100baSBen Hutchings 	}
46b8970f0bSJohn Fastabend 
4756f36acdSAmritha Nambiar 	if (priv->hw_offload && dev->netdev_ops->ndo_setup_tc) {
48*4e8b86c0SAmritha Nambiar 		struct tc_mqprio_qopt_offload mqprio = { { 0 } };
4956f36acdSAmritha Nambiar 
50*4e8b86c0SAmritha Nambiar 		switch (priv->mode) {
51*4e8b86c0SAmritha Nambiar 		case TC_MQPRIO_MODE_DCB:
52*4e8b86c0SAmritha Nambiar 		case TC_MQPRIO_MODE_CHANNEL:
53*4e8b86c0SAmritha Nambiar 			dev->netdev_ops->ndo_setup_tc(dev, TC_SETUP_MQPRIO,
54*4e8b86c0SAmritha Nambiar 						      &mqprio);
55*4e8b86c0SAmritha Nambiar 			break;
56*4e8b86c0SAmritha Nambiar 		default:
57*4e8b86c0SAmritha Nambiar 			return;
58*4e8b86c0SAmritha Nambiar 		}
5956f36acdSAmritha Nambiar 	} else {
60b8970f0bSJohn Fastabend 		netdev_set_num_tc(dev, 0);
61b8970f0bSJohn Fastabend 	}
6256f36acdSAmritha Nambiar }
63b8970f0bSJohn Fastabend 
64b8970f0bSJohn Fastabend static int mqprio_parse_opt(struct net_device *dev, struct tc_mqprio_qopt *qopt)
65b8970f0bSJohn Fastabend {
66b8970f0bSJohn Fastabend 	int i, j;
67b8970f0bSJohn Fastabend 
68b8970f0bSJohn Fastabend 	/* Verify num_tc is not out of max range */
69b8970f0bSJohn Fastabend 	if (qopt->num_tc > TC_MAX_QUEUE)
70b8970f0bSJohn Fastabend 		return -EINVAL;
71b8970f0bSJohn Fastabend 
72b8970f0bSJohn Fastabend 	/* Verify priority mapping uses valid tcs */
73b8970f0bSJohn Fastabend 	for (i = 0; i < TC_BITMASK + 1; i++) {
74b8970f0bSJohn Fastabend 		if (qopt->prio_tc_map[i] >= qopt->num_tc)
75b8970f0bSJohn Fastabend 			return -EINVAL;
76b8970f0bSJohn Fastabend 	}
77b8970f0bSJohn Fastabend 
782026fecfSAlexander Duyck 	/* Limit qopt->hw to maximum supported offload value.  Drivers have
792026fecfSAlexander Duyck 	 * the option of overriding this later if they don't support the a
802026fecfSAlexander Duyck 	 * given offload type.
812026fecfSAlexander Duyck 	 */
822026fecfSAlexander Duyck 	if (qopt->hw > TC_MQPRIO_HW_OFFLOAD_MAX)
832026fecfSAlexander Duyck 		qopt->hw = TC_MQPRIO_HW_OFFLOAD_MAX;
84b8970f0bSJohn Fastabend 
852026fecfSAlexander Duyck 	/* If hardware offload is requested we will leave it to the device
862026fecfSAlexander Duyck 	 * to either populate the queue counts itself or to validate the
872026fecfSAlexander Duyck 	 * provided queue counts.  If ndo_setup_tc is not present then
882026fecfSAlexander Duyck 	 * hardware doesn't support offload and we should return an error.
89b8970f0bSJohn Fastabend 	 */
90b8970f0bSJohn Fastabend 	if (qopt->hw)
912026fecfSAlexander Duyck 		return dev->netdev_ops->ndo_setup_tc ? 0 : -EINVAL;
92b8970f0bSJohn Fastabend 
93b8970f0bSJohn Fastabend 	for (i = 0; i < qopt->num_tc; i++) {
94b8970f0bSJohn Fastabend 		unsigned int last = qopt->offset[i] + qopt->count[i];
95b8970f0bSJohn Fastabend 
96b8970f0bSJohn Fastabend 		/* Verify the queue count is in tx range being equal to the
97b8970f0bSJohn Fastabend 		 * real_num_tx_queues indicates the last queue is in use.
98b8970f0bSJohn Fastabend 		 */
99b8970f0bSJohn Fastabend 		if (qopt->offset[i] >= dev->real_num_tx_queues ||
100b8970f0bSJohn Fastabend 		    !qopt->count[i] ||
101b8970f0bSJohn Fastabend 		    last > dev->real_num_tx_queues)
102b8970f0bSJohn Fastabend 			return -EINVAL;
103b8970f0bSJohn Fastabend 
104b8970f0bSJohn Fastabend 		/* Verify that the offset and counts do not overlap */
105b8970f0bSJohn Fastabend 		for (j = i + 1; j < qopt->num_tc; j++) {
106b8970f0bSJohn Fastabend 			if (last > qopt->offset[j])
107b8970f0bSJohn Fastabend 				return -EINVAL;
108b8970f0bSJohn Fastabend 		}
109b8970f0bSJohn Fastabend 	}
110b8970f0bSJohn Fastabend 
111b8970f0bSJohn Fastabend 	return 0;
112b8970f0bSJohn Fastabend }
113b8970f0bSJohn Fastabend 
114*4e8b86c0SAmritha Nambiar static const struct nla_policy mqprio_policy[TCA_MQPRIO_MAX + 1] = {
115*4e8b86c0SAmritha Nambiar 	[TCA_MQPRIO_MODE]	= { .len = sizeof(u16) },
116*4e8b86c0SAmritha Nambiar 	[TCA_MQPRIO_SHAPER]	= { .len = sizeof(u16) },
117*4e8b86c0SAmritha Nambiar 	[TCA_MQPRIO_MIN_RATE64]	= { .type = NLA_NESTED },
118*4e8b86c0SAmritha Nambiar 	[TCA_MQPRIO_MAX_RATE64]	= { .type = NLA_NESTED },
119*4e8b86c0SAmritha Nambiar };
120*4e8b86c0SAmritha Nambiar 
121*4e8b86c0SAmritha Nambiar static int parse_attr(struct nlattr *tb[], int maxtype, struct nlattr *nla,
122*4e8b86c0SAmritha Nambiar 		      const struct nla_policy *policy, int len)
123*4e8b86c0SAmritha Nambiar {
124*4e8b86c0SAmritha Nambiar 	int nested_len = nla_len(nla) - NLA_ALIGN(len);
125*4e8b86c0SAmritha Nambiar 
126*4e8b86c0SAmritha Nambiar 	if (nested_len >= nla_attr_size(0))
127*4e8b86c0SAmritha Nambiar 		return nla_parse(tb, maxtype, nla_data(nla) + NLA_ALIGN(len),
128*4e8b86c0SAmritha Nambiar 				 nested_len, policy, NULL);
129*4e8b86c0SAmritha Nambiar 
130*4e8b86c0SAmritha Nambiar 	memset(tb, 0, sizeof(struct nlattr *) * (maxtype + 1));
131*4e8b86c0SAmritha Nambiar 	return 0;
132*4e8b86c0SAmritha Nambiar }
133*4e8b86c0SAmritha Nambiar 
134b8970f0bSJohn Fastabend static int mqprio_init(struct Qdisc *sch, struct nlattr *opt)
135b8970f0bSJohn Fastabend {
136b8970f0bSJohn Fastabend 	struct net_device *dev = qdisc_dev(sch);
137b8970f0bSJohn Fastabend 	struct mqprio_sched *priv = qdisc_priv(sch);
138b8970f0bSJohn Fastabend 	struct netdev_queue *dev_queue;
139b8970f0bSJohn Fastabend 	struct Qdisc *qdisc;
140b8970f0bSJohn Fastabend 	int i, err = -EOPNOTSUPP;
141b8970f0bSJohn Fastabend 	struct tc_mqprio_qopt *qopt = NULL;
142*4e8b86c0SAmritha Nambiar 	struct nlattr *tb[TCA_MQPRIO_MAX + 1];
143*4e8b86c0SAmritha Nambiar 	struct nlattr *attr;
144*4e8b86c0SAmritha Nambiar 	int rem;
145*4e8b86c0SAmritha Nambiar 	int len = nla_len(opt) - NLA_ALIGN(sizeof(*qopt));
146b8970f0bSJohn Fastabend 
147b8970f0bSJohn Fastabend 	BUILD_BUG_ON(TC_MAX_QUEUE != TC_QOPT_MAX_QUEUE);
148b8970f0bSJohn Fastabend 	BUILD_BUG_ON(TC_BITMASK != TC_QOPT_BITMASK);
149b8970f0bSJohn Fastabend 
150b8970f0bSJohn Fastabend 	if (sch->parent != TC_H_ROOT)
151b8970f0bSJohn Fastabend 		return -EOPNOTSUPP;
152b8970f0bSJohn Fastabend 
153b8970f0bSJohn Fastabend 	if (!netif_is_multiqueue(dev))
154b8970f0bSJohn Fastabend 		return -EOPNOTSUPP;
155b8970f0bSJohn Fastabend 
1567838f2ceSThomas Graf 	if (!opt || nla_len(opt) < sizeof(*qopt))
157b8970f0bSJohn Fastabend 		return -EINVAL;
158b8970f0bSJohn Fastabend 
159b8970f0bSJohn Fastabend 	qopt = nla_data(opt);
160b8970f0bSJohn Fastabend 	if (mqprio_parse_opt(dev, qopt))
161b8970f0bSJohn Fastabend 		return -EINVAL;
162b8970f0bSJohn Fastabend 
163*4e8b86c0SAmritha Nambiar 	if (len > 0) {
164*4e8b86c0SAmritha Nambiar 		err = parse_attr(tb, TCA_MQPRIO_MAX, opt, mqprio_policy,
165*4e8b86c0SAmritha Nambiar 				 sizeof(*qopt));
166*4e8b86c0SAmritha Nambiar 		if (err < 0)
167*4e8b86c0SAmritha Nambiar 			return err;
168*4e8b86c0SAmritha Nambiar 
169*4e8b86c0SAmritha Nambiar 		if (!qopt->hw)
170*4e8b86c0SAmritha Nambiar 			return -EINVAL;
171*4e8b86c0SAmritha Nambiar 
172*4e8b86c0SAmritha Nambiar 		if (tb[TCA_MQPRIO_MODE]) {
173*4e8b86c0SAmritha Nambiar 			priv->flags |= TC_MQPRIO_F_MODE;
174*4e8b86c0SAmritha Nambiar 			priv->mode = *(u16 *)nla_data(tb[TCA_MQPRIO_MODE]);
175*4e8b86c0SAmritha Nambiar 		}
176*4e8b86c0SAmritha Nambiar 
177*4e8b86c0SAmritha Nambiar 		if (tb[TCA_MQPRIO_SHAPER]) {
178*4e8b86c0SAmritha Nambiar 			priv->flags |= TC_MQPRIO_F_SHAPER;
179*4e8b86c0SAmritha Nambiar 			priv->shaper = *(u16 *)nla_data(tb[TCA_MQPRIO_SHAPER]);
180*4e8b86c0SAmritha Nambiar 		}
181*4e8b86c0SAmritha Nambiar 
182*4e8b86c0SAmritha Nambiar 		if (tb[TCA_MQPRIO_MIN_RATE64]) {
183*4e8b86c0SAmritha Nambiar 			if (priv->shaper != TC_MQPRIO_SHAPER_BW_RATE)
184*4e8b86c0SAmritha Nambiar 				return -EINVAL;
185*4e8b86c0SAmritha Nambiar 			i = 0;
186*4e8b86c0SAmritha Nambiar 			nla_for_each_nested(attr, tb[TCA_MQPRIO_MIN_RATE64],
187*4e8b86c0SAmritha Nambiar 					    rem) {
188*4e8b86c0SAmritha Nambiar 				if (nla_type(attr) != TCA_MQPRIO_MIN_RATE64)
189*4e8b86c0SAmritha Nambiar 					return -EINVAL;
190*4e8b86c0SAmritha Nambiar 				if (i >= qopt->num_tc)
191*4e8b86c0SAmritha Nambiar 					break;
192*4e8b86c0SAmritha Nambiar 				priv->min_rate[i] = *(u64 *)nla_data(attr);
193*4e8b86c0SAmritha Nambiar 				i++;
194*4e8b86c0SAmritha Nambiar 			}
195*4e8b86c0SAmritha Nambiar 			priv->flags |= TC_MQPRIO_F_MIN_RATE;
196*4e8b86c0SAmritha Nambiar 		}
197*4e8b86c0SAmritha Nambiar 
198*4e8b86c0SAmritha Nambiar 		if (tb[TCA_MQPRIO_MAX_RATE64]) {
199*4e8b86c0SAmritha Nambiar 			if (priv->shaper != TC_MQPRIO_SHAPER_BW_RATE)
200*4e8b86c0SAmritha Nambiar 				return -EINVAL;
201*4e8b86c0SAmritha Nambiar 			i = 0;
202*4e8b86c0SAmritha Nambiar 			nla_for_each_nested(attr, tb[TCA_MQPRIO_MAX_RATE64],
203*4e8b86c0SAmritha Nambiar 					    rem) {
204*4e8b86c0SAmritha Nambiar 				if (nla_type(attr) != TCA_MQPRIO_MAX_RATE64)
205*4e8b86c0SAmritha Nambiar 					return -EINVAL;
206*4e8b86c0SAmritha Nambiar 				if (i >= qopt->num_tc)
207*4e8b86c0SAmritha Nambiar 					break;
208*4e8b86c0SAmritha Nambiar 				priv->max_rate[i] = *(u64 *)nla_data(attr);
209*4e8b86c0SAmritha Nambiar 				i++;
210*4e8b86c0SAmritha Nambiar 			}
211*4e8b86c0SAmritha Nambiar 			priv->flags |= TC_MQPRIO_F_MAX_RATE;
212*4e8b86c0SAmritha Nambiar 		}
213*4e8b86c0SAmritha Nambiar 	}
214*4e8b86c0SAmritha Nambiar 
215b8970f0bSJohn Fastabend 	/* pre-allocate qdisc, attachment can't fail */
216b8970f0bSJohn Fastabend 	priv->qdiscs = kcalloc(dev->num_tx_queues, sizeof(priv->qdiscs[0]),
217b8970f0bSJohn Fastabend 			       GFP_KERNEL);
21887b60cfaSEric Dumazet 	if (!priv->qdiscs)
21987b60cfaSEric Dumazet 		return -ENOMEM;
220b8970f0bSJohn Fastabend 
221b8970f0bSJohn Fastabend 	for (i = 0; i < dev->num_tx_queues; i++) {
222b8970f0bSJohn Fastabend 		dev_queue = netdev_get_tx_queue(dev, i);
2231f27cde3SEric Dumazet 		qdisc = qdisc_create_dflt(dev_queue,
2241f27cde3SEric Dumazet 					  get_default_qdisc_ops(dev, i),
225b8970f0bSJohn Fastabend 					  TC_H_MAKE(TC_H_MAJ(sch->handle),
226b8970f0bSJohn Fastabend 						    TC_H_MIN(i + 1)));
22787b60cfaSEric Dumazet 		if (!qdisc)
22887b60cfaSEric Dumazet 			return -ENOMEM;
22987b60cfaSEric Dumazet 
230b8970f0bSJohn Fastabend 		priv->qdiscs[i] = qdisc;
2314eaf3b84SEric Dumazet 		qdisc->flags |= TCQ_F_ONETXQUEUE | TCQ_F_NOPARENT;
232b8970f0bSJohn Fastabend 	}
233b8970f0bSJohn Fastabend 
234b8970f0bSJohn Fastabend 	/* If the mqprio options indicate that hardware should own
235b8970f0bSJohn Fastabend 	 * the queue mapping then run ndo_setup_tc otherwise use the
236b8970f0bSJohn Fastabend 	 * supplied and verified mapping
237b8970f0bSJohn Fastabend 	 */
238b8970f0bSJohn Fastabend 	if (qopt->hw) {
239*4e8b86c0SAmritha Nambiar 		struct tc_mqprio_qopt_offload mqprio = {.qopt = *qopt};
24016e5cc64SJohn Fastabend 
241*4e8b86c0SAmritha Nambiar 		switch (priv->mode) {
242*4e8b86c0SAmritha Nambiar 		case TC_MQPRIO_MODE_DCB:
243*4e8b86c0SAmritha Nambiar 			if (priv->shaper != TC_MQPRIO_SHAPER_DCB)
244*4e8b86c0SAmritha Nambiar 				return -EINVAL;
245*4e8b86c0SAmritha Nambiar 			break;
246*4e8b86c0SAmritha Nambiar 		case TC_MQPRIO_MODE_CHANNEL:
247*4e8b86c0SAmritha Nambiar 			mqprio.flags = priv->flags;
248*4e8b86c0SAmritha Nambiar 			if (priv->flags & TC_MQPRIO_F_MODE)
249*4e8b86c0SAmritha Nambiar 				mqprio.mode = priv->mode;
250*4e8b86c0SAmritha Nambiar 			if (priv->flags & TC_MQPRIO_F_SHAPER)
251*4e8b86c0SAmritha Nambiar 				mqprio.shaper = priv->shaper;
252*4e8b86c0SAmritha Nambiar 			if (priv->flags & TC_MQPRIO_F_MIN_RATE)
253*4e8b86c0SAmritha Nambiar 				for (i = 0; i < mqprio.qopt.num_tc; i++)
254*4e8b86c0SAmritha Nambiar 					mqprio.min_rate[i] = priv->min_rate[i];
255*4e8b86c0SAmritha Nambiar 			if (priv->flags & TC_MQPRIO_F_MAX_RATE)
256*4e8b86c0SAmritha Nambiar 				for (i = 0; i < mqprio.qopt.num_tc; i++)
257*4e8b86c0SAmritha Nambiar 					mqprio.max_rate[i] = priv->max_rate[i];
258*4e8b86c0SAmritha Nambiar 			break;
259*4e8b86c0SAmritha Nambiar 		default:
260*4e8b86c0SAmritha Nambiar 			return -EINVAL;
261*4e8b86c0SAmritha Nambiar 		}
262*4e8b86c0SAmritha Nambiar 		err = dev->netdev_ops->ndo_setup_tc(dev,
263*4e8b86c0SAmritha Nambiar 						    TC_SETUP_MQPRIO,
264de4784caSJiri Pirko 						    &mqprio);
265b8970f0bSJohn Fastabend 		if (err)
26687b60cfaSEric Dumazet 			return err;
2672026fecfSAlexander Duyck 
268*4e8b86c0SAmritha Nambiar 		priv->hw_offload = mqprio.qopt.hw;
269b8970f0bSJohn Fastabend 	} else {
270b8970f0bSJohn Fastabend 		netdev_set_num_tc(dev, qopt->num_tc);
271b8970f0bSJohn Fastabend 		for (i = 0; i < qopt->num_tc; i++)
272b8970f0bSJohn Fastabend 			netdev_set_tc_queue(dev, i,
273b8970f0bSJohn Fastabend 					    qopt->count[i], qopt->offset[i]);
274b8970f0bSJohn Fastabend 	}
275b8970f0bSJohn Fastabend 
276b8970f0bSJohn Fastabend 	/* Always use supplied priority mappings */
277b8970f0bSJohn Fastabend 	for (i = 0; i < TC_BITMASK + 1; i++)
278b8970f0bSJohn Fastabend 		netdev_set_prio_tc_map(dev, i, qopt->prio_tc_map[i]);
279b8970f0bSJohn Fastabend 
280b8970f0bSJohn Fastabend 	sch->flags |= TCQ_F_MQROOT;
281b8970f0bSJohn Fastabend 	return 0;
282b8970f0bSJohn Fastabend }
283b8970f0bSJohn Fastabend 
284b8970f0bSJohn Fastabend static void mqprio_attach(struct Qdisc *sch)
285b8970f0bSJohn Fastabend {
286b8970f0bSJohn Fastabend 	struct net_device *dev = qdisc_dev(sch);
287b8970f0bSJohn Fastabend 	struct mqprio_sched *priv = qdisc_priv(sch);
28895dc1929SEric Dumazet 	struct Qdisc *qdisc, *old;
289b8970f0bSJohn Fastabend 	unsigned int ntx;
290b8970f0bSJohn Fastabend 
291b8970f0bSJohn Fastabend 	/* Attach underlying qdisc */
292b8970f0bSJohn Fastabend 	for (ntx = 0; ntx < dev->num_tx_queues; ntx++) {
293b8970f0bSJohn Fastabend 		qdisc = priv->qdiscs[ntx];
29495dc1929SEric Dumazet 		old = dev_graft_qdisc(qdisc->dev_queue, qdisc);
29595dc1929SEric Dumazet 		if (old)
29695dc1929SEric Dumazet 			qdisc_destroy(old);
29795dc1929SEric Dumazet 		if (ntx < dev->real_num_tx_queues)
29849b49971SJiri Kosina 			qdisc_hash_add(qdisc, false);
299b8970f0bSJohn Fastabend 	}
300b8970f0bSJohn Fastabend 	kfree(priv->qdiscs);
301b8970f0bSJohn Fastabend 	priv->qdiscs = NULL;
302b8970f0bSJohn Fastabend }
303b8970f0bSJohn Fastabend 
304b8970f0bSJohn Fastabend static struct netdev_queue *mqprio_queue_get(struct Qdisc *sch,
305b8970f0bSJohn Fastabend 					     unsigned long cl)
306b8970f0bSJohn Fastabend {
307b8970f0bSJohn Fastabend 	struct net_device *dev = qdisc_dev(sch);
308b8970f0bSJohn Fastabend 	unsigned long ntx = cl - 1 - netdev_get_num_tc(dev);
309b8970f0bSJohn Fastabend 
310b8970f0bSJohn Fastabend 	if (ntx >= dev->num_tx_queues)
311b8970f0bSJohn Fastabend 		return NULL;
312b8970f0bSJohn Fastabend 	return netdev_get_tx_queue(dev, ntx);
313b8970f0bSJohn Fastabend }
314b8970f0bSJohn Fastabend 
315b8970f0bSJohn Fastabend static int mqprio_graft(struct Qdisc *sch, unsigned long cl, struct Qdisc *new,
316b8970f0bSJohn Fastabend 		    struct Qdisc **old)
317b8970f0bSJohn Fastabend {
318b8970f0bSJohn Fastabend 	struct net_device *dev = qdisc_dev(sch);
319b8970f0bSJohn Fastabend 	struct netdev_queue *dev_queue = mqprio_queue_get(sch, cl);
320b8970f0bSJohn Fastabend 
321b8970f0bSJohn Fastabend 	if (!dev_queue)
322b8970f0bSJohn Fastabend 		return -EINVAL;
323b8970f0bSJohn Fastabend 
324b8970f0bSJohn Fastabend 	if (dev->flags & IFF_UP)
325b8970f0bSJohn Fastabend 		dev_deactivate(dev);
326b8970f0bSJohn Fastabend 
327b8970f0bSJohn Fastabend 	*old = dev_graft_qdisc(dev_queue, new);
328b8970f0bSJohn Fastabend 
3291abbe139SEric Dumazet 	if (new)
3304eaf3b84SEric Dumazet 		new->flags |= TCQ_F_ONETXQUEUE | TCQ_F_NOPARENT;
3311abbe139SEric Dumazet 
332b8970f0bSJohn Fastabend 	if (dev->flags & IFF_UP)
333b8970f0bSJohn Fastabend 		dev_activate(dev);
334b8970f0bSJohn Fastabend 
335b8970f0bSJohn Fastabend 	return 0;
336b8970f0bSJohn Fastabend }
337b8970f0bSJohn Fastabend 
338*4e8b86c0SAmritha Nambiar static int dump_rates(struct mqprio_sched *priv,
339*4e8b86c0SAmritha Nambiar 		      struct tc_mqprio_qopt *opt, struct sk_buff *skb)
340*4e8b86c0SAmritha Nambiar {
341*4e8b86c0SAmritha Nambiar 	struct nlattr *nest;
342*4e8b86c0SAmritha Nambiar 	int i;
343*4e8b86c0SAmritha Nambiar 
344*4e8b86c0SAmritha Nambiar 	if (priv->flags & TC_MQPRIO_F_MIN_RATE) {
345*4e8b86c0SAmritha Nambiar 		nest = nla_nest_start(skb, TCA_MQPRIO_MIN_RATE64);
346*4e8b86c0SAmritha Nambiar 		if (!nest)
347*4e8b86c0SAmritha Nambiar 			goto nla_put_failure;
348*4e8b86c0SAmritha Nambiar 
349*4e8b86c0SAmritha Nambiar 		for (i = 0; i < opt->num_tc; i++) {
350*4e8b86c0SAmritha Nambiar 			if (nla_put(skb, TCA_MQPRIO_MIN_RATE64,
351*4e8b86c0SAmritha Nambiar 				    sizeof(priv->min_rate[i]),
352*4e8b86c0SAmritha Nambiar 				    &priv->min_rate[i]))
353*4e8b86c0SAmritha Nambiar 				goto nla_put_failure;
354*4e8b86c0SAmritha Nambiar 		}
355*4e8b86c0SAmritha Nambiar 		nla_nest_end(skb, nest);
356*4e8b86c0SAmritha Nambiar 	}
357*4e8b86c0SAmritha Nambiar 
358*4e8b86c0SAmritha Nambiar 	if (priv->flags & TC_MQPRIO_F_MAX_RATE) {
359*4e8b86c0SAmritha Nambiar 		nest = nla_nest_start(skb, TCA_MQPRIO_MAX_RATE64);
360*4e8b86c0SAmritha Nambiar 		if (!nest)
361*4e8b86c0SAmritha Nambiar 			goto nla_put_failure;
362*4e8b86c0SAmritha Nambiar 
363*4e8b86c0SAmritha Nambiar 		for (i = 0; i < opt->num_tc; i++) {
364*4e8b86c0SAmritha Nambiar 			if (nla_put(skb, TCA_MQPRIO_MAX_RATE64,
365*4e8b86c0SAmritha Nambiar 				    sizeof(priv->max_rate[i]),
366*4e8b86c0SAmritha Nambiar 				    &priv->max_rate[i]))
367*4e8b86c0SAmritha Nambiar 				goto nla_put_failure;
368*4e8b86c0SAmritha Nambiar 		}
369*4e8b86c0SAmritha Nambiar 		nla_nest_end(skb, nest);
370*4e8b86c0SAmritha Nambiar 	}
371*4e8b86c0SAmritha Nambiar 	return 0;
372*4e8b86c0SAmritha Nambiar 
373*4e8b86c0SAmritha Nambiar nla_put_failure:
374*4e8b86c0SAmritha Nambiar 	nla_nest_cancel(skb, nest);
375*4e8b86c0SAmritha Nambiar 	return -1;
376*4e8b86c0SAmritha Nambiar }
377*4e8b86c0SAmritha Nambiar 
378b8970f0bSJohn Fastabend static int mqprio_dump(struct Qdisc *sch, struct sk_buff *skb)
379b8970f0bSJohn Fastabend {
380b8970f0bSJohn Fastabend 	struct net_device *dev = qdisc_dev(sch);
381b8970f0bSJohn Fastabend 	struct mqprio_sched *priv = qdisc_priv(sch);
382*4e8b86c0SAmritha Nambiar 	struct nlattr *nla = (struct nlattr *)skb_tail_pointer(skb);
383144ce879SEric Dumazet 	struct tc_mqprio_qopt opt = { 0 };
384b8970f0bSJohn Fastabend 	struct Qdisc *qdisc;
385b8970f0bSJohn Fastabend 	unsigned int i;
386b8970f0bSJohn Fastabend 
387b8970f0bSJohn Fastabend 	sch->q.qlen = 0;
388b8970f0bSJohn Fastabend 	memset(&sch->bstats, 0, sizeof(sch->bstats));
389b8970f0bSJohn Fastabend 	memset(&sch->qstats, 0, sizeof(sch->qstats));
390b8970f0bSJohn Fastabend 
391b8970f0bSJohn Fastabend 	for (i = 0; i < dev->num_tx_queues; i++) {
39246e5da40SJohn Fastabend 		qdisc = rtnl_dereference(netdev_get_tx_queue(dev, i)->qdisc);
393b8970f0bSJohn Fastabend 		spin_lock_bh(qdisc_lock(qdisc));
394b8970f0bSJohn Fastabend 		sch->q.qlen		+= qdisc->q.qlen;
395b8970f0bSJohn Fastabend 		sch->bstats.bytes	+= qdisc->bstats.bytes;
396b8970f0bSJohn Fastabend 		sch->bstats.packets	+= qdisc->bstats.packets;
397b8970f0bSJohn Fastabend 		sch->qstats.backlog	+= qdisc->qstats.backlog;
398b8970f0bSJohn Fastabend 		sch->qstats.drops	+= qdisc->qstats.drops;
399b8970f0bSJohn Fastabend 		sch->qstats.requeues	+= qdisc->qstats.requeues;
400b8970f0bSJohn Fastabend 		sch->qstats.overlimits	+= qdisc->qstats.overlimits;
401b8970f0bSJohn Fastabend 		spin_unlock_bh(qdisc_lock(qdisc));
402b8970f0bSJohn Fastabend 	}
403b8970f0bSJohn Fastabend 
404b8970f0bSJohn Fastabend 	opt.num_tc = netdev_get_num_tc(dev);
405b8970f0bSJohn Fastabend 	memcpy(opt.prio_tc_map, dev->prio_tc_map, sizeof(opt.prio_tc_map));
4062026fecfSAlexander Duyck 	opt.hw = priv->hw_offload;
407b8970f0bSJohn Fastabend 
408b8970f0bSJohn Fastabend 	for (i = 0; i < netdev_get_num_tc(dev); i++) {
409b8970f0bSJohn Fastabend 		opt.count[i] = dev->tc_to_txq[i].count;
410b8970f0bSJohn Fastabend 		opt.offset[i] = dev->tc_to_txq[i].offset;
411b8970f0bSJohn Fastabend 	}
412b8970f0bSJohn Fastabend 
413*4e8b86c0SAmritha Nambiar 	if (nla_put(skb, TCA_OPTIONS, NLA_ALIGN(sizeof(opt)), &opt))
4141b34ec43SDavid S. Miller 		goto nla_put_failure;
415b8970f0bSJohn Fastabend 
416*4e8b86c0SAmritha Nambiar 	if ((priv->flags & TC_MQPRIO_F_MODE) &&
417*4e8b86c0SAmritha Nambiar 	    nla_put_u16(skb, TCA_MQPRIO_MODE, priv->mode))
418*4e8b86c0SAmritha Nambiar 		goto nla_put_failure;
419*4e8b86c0SAmritha Nambiar 
420*4e8b86c0SAmritha Nambiar 	if ((priv->flags & TC_MQPRIO_F_SHAPER) &&
421*4e8b86c0SAmritha Nambiar 	    nla_put_u16(skb, TCA_MQPRIO_SHAPER, priv->shaper))
422*4e8b86c0SAmritha Nambiar 		goto nla_put_failure;
423*4e8b86c0SAmritha Nambiar 
424*4e8b86c0SAmritha Nambiar 	if ((priv->flags & TC_MQPRIO_F_MIN_RATE ||
425*4e8b86c0SAmritha Nambiar 	     priv->flags & TC_MQPRIO_F_MAX_RATE) &&
426*4e8b86c0SAmritha Nambiar 	    (dump_rates(priv, &opt, skb) != 0))
427*4e8b86c0SAmritha Nambiar 		goto nla_put_failure;
428*4e8b86c0SAmritha Nambiar 
429*4e8b86c0SAmritha Nambiar 	return nla_nest_end(skb, nla);
430b8970f0bSJohn Fastabend nla_put_failure:
431*4e8b86c0SAmritha Nambiar 	nlmsg_trim(skb, nla);
432b8970f0bSJohn Fastabend 	return -1;
433b8970f0bSJohn Fastabend }
434b8970f0bSJohn Fastabend 
435b8970f0bSJohn Fastabend static struct Qdisc *mqprio_leaf(struct Qdisc *sch, unsigned long cl)
436b8970f0bSJohn Fastabend {
437b8970f0bSJohn Fastabend 	struct netdev_queue *dev_queue = mqprio_queue_get(sch, cl);
438b8970f0bSJohn Fastabend 
439b8970f0bSJohn Fastabend 	if (!dev_queue)
440b8970f0bSJohn Fastabend 		return NULL;
441b8970f0bSJohn Fastabend 
442b8970f0bSJohn Fastabend 	return dev_queue->qdisc_sleeping;
443b8970f0bSJohn Fastabend }
444b8970f0bSJohn Fastabend 
445143976ceSWANG Cong static unsigned long mqprio_find(struct Qdisc *sch, u32 classid)
446b8970f0bSJohn Fastabend {
447b8970f0bSJohn Fastabend 	struct net_device *dev = qdisc_dev(sch);
448b8970f0bSJohn Fastabend 	unsigned int ntx = TC_H_MIN(classid);
449b8970f0bSJohn Fastabend 
450b8970f0bSJohn Fastabend 	if (ntx > dev->num_tx_queues + netdev_get_num_tc(dev))
451b8970f0bSJohn Fastabend 		return 0;
452b8970f0bSJohn Fastabend 	return ntx;
453b8970f0bSJohn Fastabend }
454b8970f0bSJohn Fastabend 
455b8970f0bSJohn Fastabend static int mqprio_dump_class(struct Qdisc *sch, unsigned long cl,
456b8970f0bSJohn Fastabend 			 struct sk_buff *skb, struct tcmsg *tcm)
457b8970f0bSJohn Fastabend {
458b8970f0bSJohn Fastabend 	struct net_device *dev = qdisc_dev(sch);
459b8970f0bSJohn Fastabend 
460b8970f0bSJohn Fastabend 	if (cl <= netdev_get_num_tc(dev)) {
461b8970f0bSJohn Fastabend 		tcm->tcm_parent = TC_H_ROOT;
462b8970f0bSJohn Fastabend 		tcm->tcm_info = 0;
463b8970f0bSJohn Fastabend 	} else {
464b8970f0bSJohn Fastabend 		int i;
465b8970f0bSJohn Fastabend 		struct netdev_queue *dev_queue;
466b8970f0bSJohn Fastabend 
467b8970f0bSJohn Fastabend 		dev_queue = mqprio_queue_get(sch, cl);
468b8970f0bSJohn Fastabend 		tcm->tcm_parent = 0;
469b8970f0bSJohn Fastabend 		for (i = 0; i < netdev_get_num_tc(dev); i++) {
470b8970f0bSJohn Fastabend 			struct netdev_tc_txq tc = dev->tc_to_txq[i];
471b8970f0bSJohn Fastabend 			int q_idx = cl - netdev_get_num_tc(dev);
472b8970f0bSJohn Fastabend 
473b8970f0bSJohn Fastabend 			if (q_idx > tc.offset &&
474b8970f0bSJohn Fastabend 			    q_idx <= tc.offset + tc.count) {
475b8970f0bSJohn Fastabend 				tcm->tcm_parent =
476b8970f0bSJohn Fastabend 					TC_H_MAKE(TC_H_MAJ(sch->handle),
477b8970f0bSJohn Fastabend 						  TC_H_MIN(i + 1));
478b8970f0bSJohn Fastabend 				break;
479b8970f0bSJohn Fastabend 			}
480b8970f0bSJohn Fastabend 		}
481b8970f0bSJohn Fastabend 		tcm->tcm_info = dev_queue->qdisc_sleeping->handle;
482b8970f0bSJohn Fastabend 	}
483b8970f0bSJohn Fastabend 	tcm->tcm_handle |= TC_H_MIN(cl);
484b8970f0bSJohn Fastabend 	return 0;
485b8970f0bSJohn Fastabend }
486b8970f0bSJohn Fastabend 
487b8970f0bSJohn Fastabend static int mqprio_dump_class_stats(struct Qdisc *sch, unsigned long cl,
488b8970f0bSJohn Fastabend 				   struct gnet_dump *d)
489ea18fd95Sstephen hemminger 	__releases(d->lock)
490ea18fd95Sstephen hemminger 	__acquires(d->lock)
491b8970f0bSJohn Fastabend {
492b8970f0bSJohn Fastabend 	struct net_device *dev = qdisc_dev(sch);
493b8970f0bSJohn Fastabend 
494b8970f0bSJohn Fastabend 	if (cl <= netdev_get_num_tc(dev)) {
495b8970f0bSJohn Fastabend 		int i;
49664015853SJohn Fastabend 		__u32 qlen = 0;
497b8970f0bSJohn Fastabend 		struct Qdisc *qdisc;
498b8970f0bSJohn Fastabend 		struct gnet_stats_queue qstats = {0};
499b8970f0bSJohn Fastabend 		struct gnet_stats_basic_packed bstats = {0};
500b8970f0bSJohn Fastabend 		struct netdev_tc_txq tc = dev->tc_to_txq[cl - 1];
501b8970f0bSJohn Fastabend 
502b8970f0bSJohn Fastabend 		/* Drop lock here it will be reclaimed before touching
503b8970f0bSJohn Fastabend 		 * statistics this is required because the d->lock we
504b8970f0bSJohn Fastabend 		 * hold here is the look on dev_queue->qdisc_sleeping
505b8970f0bSJohn Fastabend 		 * also acquired below.
506b8970f0bSJohn Fastabend 		 */
507edb09eb1SEric Dumazet 		if (d->lock)
508b8970f0bSJohn Fastabend 			spin_unlock_bh(d->lock);
509b8970f0bSJohn Fastabend 
510b8970f0bSJohn Fastabend 		for (i = tc.offset; i < tc.offset + tc.count; i++) {
51146e5da40SJohn Fastabend 			struct netdev_queue *q = netdev_get_tx_queue(dev, i);
51246e5da40SJohn Fastabend 
51346e5da40SJohn Fastabend 			qdisc = rtnl_dereference(q->qdisc);
514b8970f0bSJohn Fastabend 			spin_lock_bh(qdisc_lock(qdisc));
51564015853SJohn Fastabend 			qlen		  += qdisc->q.qlen;
516b8970f0bSJohn Fastabend 			bstats.bytes      += qdisc->bstats.bytes;
517b8970f0bSJohn Fastabend 			bstats.packets    += qdisc->bstats.packets;
518b8970f0bSJohn Fastabend 			qstats.backlog    += qdisc->qstats.backlog;
519b8970f0bSJohn Fastabend 			qstats.drops      += qdisc->qstats.drops;
520b8970f0bSJohn Fastabend 			qstats.requeues   += qdisc->qstats.requeues;
521b8970f0bSJohn Fastabend 			qstats.overlimits += qdisc->qstats.overlimits;
522b8970f0bSJohn Fastabend 			spin_unlock_bh(qdisc_lock(qdisc));
523b8970f0bSJohn Fastabend 		}
524b8970f0bSJohn Fastabend 		/* Reclaim root sleeping lock before completing stats */
525edb09eb1SEric Dumazet 		if (d->lock)
526b8970f0bSJohn Fastabend 			spin_lock_bh(d->lock);
527edb09eb1SEric Dumazet 		if (gnet_stats_copy_basic(NULL, d, NULL, &bstats) < 0 ||
528b0ab6f92SJohn Fastabend 		    gnet_stats_copy_queue(d, NULL, &qstats, qlen) < 0)
529b8970f0bSJohn Fastabend 			return -1;
530b8970f0bSJohn Fastabend 	} else {
531b8970f0bSJohn Fastabend 		struct netdev_queue *dev_queue = mqprio_queue_get(sch, cl);
532b8970f0bSJohn Fastabend 
533b8970f0bSJohn Fastabend 		sch = dev_queue->qdisc_sleeping;
534edb09eb1SEric Dumazet 		if (gnet_stats_copy_basic(qdisc_root_sleeping_running(sch),
535edb09eb1SEric Dumazet 					  d, NULL, &sch->bstats) < 0 ||
536b0ab6f92SJohn Fastabend 		    gnet_stats_copy_queue(d, NULL,
537b0ab6f92SJohn Fastabend 					  &sch->qstats, sch->q.qlen) < 0)
538b8970f0bSJohn Fastabend 			return -1;
539b8970f0bSJohn Fastabend 	}
540b8970f0bSJohn Fastabend 	return 0;
541b8970f0bSJohn Fastabend }
542b8970f0bSJohn Fastabend 
543b8970f0bSJohn Fastabend static void mqprio_walk(struct Qdisc *sch, struct qdisc_walker *arg)
544b8970f0bSJohn Fastabend {
545b8970f0bSJohn Fastabend 	struct net_device *dev = qdisc_dev(sch);
546b8970f0bSJohn Fastabend 	unsigned long ntx;
547b8970f0bSJohn Fastabend 
548b8970f0bSJohn Fastabend 	if (arg->stop)
549b8970f0bSJohn Fastabend 		return;
550b8970f0bSJohn Fastabend 
551b8970f0bSJohn Fastabend 	/* Walk hierarchy with a virtual class per tc */
552b8970f0bSJohn Fastabend 	arg->count = arg->skip;
553b8970f0bSJohn Fastabend 	for (ntx = arg->skip;
554b8970f0bSJohn Fastabend 	     ntx < dev->num_tx_queues + netdev_get_num_tc(dev);
555b8970f0bSJohn Fastabend 	     ntx++) {
556b8970f0bSJohn Fastabend 		if (arg->fn(sch, ntx + 1, arg) < 0) {
557b8970f0bSJohn Fastabend 			arg->stop = 1;
558b8970f0bSJohn Fastabend 			break;
559b8970f0bSJohn Fastabend 		}
560b8970f0bSJohn Fastabend 		arg->count++;
561b8970f0bSJohn Fastabend 	}
562b8970f0bSJohn Fastabend }
563b8970f0bSJohn Fastabend 
564b8970f0bSJohn Fastabend static const struct Qdisc_class_ops mqprio_class_ops = {
565b8970f0bSJohn Fastabend 	.graft		= mqprio_graft,
566b8970f0bSJohn Fastabend 	.leaf		= mqprio_leaf,
567143976ceSWANG Cong 	.find		= mqprio_find,
568b8970f0bSJohn Fastabend 	.walk		= mqprio_walk,
569b8970f0bSJohn Fastabend 	.dump		= mqprio_dump_class,
570b8970f0bSJohn Fastabend 	.dump_stats	= mqprio_dump_class_stats,
571b8970f0bSJohn Fastabend };
572b8970f0bSJohn Fastabend 
573ea18fd95Sstephen hemminger static struct Qdisc_ops mqprio_qdisc_ops __read_mostly = {
574b8970f0bSJohn Fastabend 	.cl_ops		= &mqprio_class_ops,
575b8970f0bSJohn Fastabend 	.id		= "mqprio",
576b8970f0bSJohn Fastabend 	.priv_size	= sizeof(struct mqprio_sched),
577b8970f0bSJohn Fastabend 	.init		= mqprio_init,
578b8970f0bSJohn Fastabend 	.destroy	= mqprio_destroy,
579b8970f0bSJohn Fastabend 	.attach		= mqprio_attach,
580b8970f0bSJohn Fastabend 	.dump		= mqprio_dump,
581b8970f0bSJohn Fastabend 	.owner		= THIS_MODULE,
582b8970f0bSJohn Fastabend };
583b8970f0bSJohn Fastabend 
584b8970f0bSJohn Fastabend static int __init mqprio_module_init(void)
585b8970f0bSJohn Fastabend {
586b8970f0bSJohn Fastabend 	return register_qdisc(&mqprio_qdisc_ops);
587b8970f0bSJohn Fastabend }
588b8970f0bSJohn Fastabend 
589b8970f0bSJohn Fastabend static void __exit mqprio_module_exit(void)
590b8970f0bSJohn Fastabend {
591b8970f0bSJohn Fastabend 	unregister_qdisc(&mqprio_qdisc_ops);
592b8970f0bSJohn Fastabend }
593b8970f0bSJohn Fastabend 
594b8970f0bSJohn Fastabend module_init(mqprio_module_init);
595b8970f0bSJohn Fastabend module_exit(mqprio_module_exit);
596b8970f0bSJohn Fastabend 
597b8970f0bSJohn Fastabend MODULE_LICENSE("GPL");
598