15a781ccbSVinicius Costa Gomes // SPDX-License-Identifier: GPL-2.0 25a781ccbSVinicius Costa Gomes 35a781ccbSVinicius Costa Gomes /* net/sched/sch_taprio.c Time Aware Priority Scheduler 45a781ccbSVinicius Costa Gomes * 55a781ccbSVinicius Costa Gomes * Authors: Vinicius Costa Gomes <vinicius.gomes@intel.com> 65a781ccbSVinicius Costa Gomes * 75a781ccbSVinicius Costa Gomes */ 85a781ccbSVinicius Costa Gomes 95a781ccbSVinicius Costa Gomes #include <linux/types.h> 105a781ccbSVinicius Costa Gomes #include <linux/slab.h> 115a781ccbSVinicius Costa Gomes #include <linux/kernel.h> 125a781ccbSVinicius Costa Gomes #include <linux/string.h> 135a781ccbSVinicius Costa Gomes #include <linux/list.h> 145a781ccbSVinicius Costa Gomes #include <linux/errno.h> 155a781ccbSVinicius Costa Gomes #include <linux/skbuff.h> 165a781ccbSVinicius Costa Gomes #include <linux/module.h> 175a781ccbSVinicius Costa Gomes #include <linux/spinlock.h> 185a781ccbSVinicius Costa Gomes #include <net/netlink.h> 195a781ccbSVinicius Costa Gomes #include <net/pkt_sched.h> 205a781ccbSVinicius Costa Gomes #include <net/pkt_cls.h> 215a781ccbSVinicius Costa Gomes #include <net/sch_generic.h> 225a781ccbSVinicius Costa Gomes 235a781ccbSVinicius Costa Gomes #define TAPRIO_ALL_GATES_OPEN -1 245a781ccbSVinicius Costa Gomes 255a781ccbSVinicius Costa Gomes struct sched_entry { 265a781ccbSVinicius Costa Gomes struct list_head list; 275a781ccbSVinicius Costa Gomes 285a781ccbSVinicius Costa Gomes /* The instant that this entry "closes" and the next one 295a781ccbSVinicius Costa Gomes * should open, the qdisc will make some effort so that no 305a781ccbSVinicius Costa Gomes * packet leaves after this time. 315a781ccbSVinicius Costa Gomes */ 325a781ccbSVinicius Costa Gomes ktime_t close_time; 335a781ccbSVinicius Costa Gomes atomic_t budget; 345a781ccbSVinicius Costa Gomes int index; 355a781ccbSVinicius Costa Gomes u32 gate_mask; 365a781ccbSVinicius Costa Gomes u32 interval; 375a781ccbSVinicius Costa Gomes u8 command; 385a781ccbSVinicius Costa Gomes }; 395a781ccbSVinicius Costa Gomes 405a781ccbSVinicius Costa Gomes struct taprio_sched { 415a781ccbSVinicius Costa Gomes struct Qdisc **qdiscs; 425a781ccbSVinicius Costa Gomes struct Qdisc *root; 435a781ccbSVinicius Costa Gomes s64 base_time; 445a781ccbSVinicius Costa Gomes int clockid; 455a781ccbSVinicius Costa Gomes int picos_per_byte; /* Using picoseconds because for 10Gbps+ 465a781ccbSVinicius Costa Gomes * speeds it's sub-nanoseconds per byte 475a781ccbSVinicius Costa Gomes */ 485a781ccbSVinicius Costa Gomes size_t num_entries; 495a781ccbSVinicius Costa Gomes 505a781ccbSVinicius Costa Gomes /* Protects the update side of the RCU protected current_entry */ 515a781ccbSVinicius Costa Gomes spinlock_t current_entry_lock; 525a781ccbSVinicius Costa Gomes struct sched_entry __rcu *current_entry; 535a781ccbSVinicius Costa Gomes struct list_head entries; 545a781ccbSVinicius Costa Gomes ktime_t (*get_time)(void); 555a781ccbSVinicius Costa Gomes struct hrtimer advance_timer; 565a781ccbSVinicius Costa Gomes }; 575a781ccbSVinicius Costa Gomes 585a781ccbSVinicius Costa Gomes static int taprio_enqueue(struct sk_buff *skb, struct Qdisc *sch, 595a781ccbSVinicius Costa Gomes struct sk_buff **to_free) 605a781ccbSVinicius Costa Gomes { 615a781ccbSVinicius Costa Gomes struct taprio_sched *q = qdisc_priv(sch); 625a781ccbSVinicius Costa Gomes struct Qdisc *child; 635a781ccbSVinicius Costa Gomes int queue; 645a781ccbSVinicius Costa Gomes 655a781ccbSVinicius Costa Gomes queue = skb_get_queue_mapping(skb); 665a781ccbSVinicius Costa Gomes 675a781ccbSVinicius Costa Gomes child = q->qdiscs[queue]; 685a781ccbSVinicius Costa Gomes if (unlikely(!child)) 695a781ccbSVinicius Costa Gomes return qdisc_drop(skb, sch, to_free); 705a781ccbSVinicius Costa Gomes 715a781ccbSVinicius Costa Gomes qdisc_qstats_backlog_inc(sch, skb); 725a781ccbSVinicius Costa Gomes sch->q.qlen++; 735a781ccbSVinicius Costa Gomes 745a781ccbSVinicius Costa Gomes return qdisc_enqueue(skb, child, to_free); 755a781ccbSVinicius Costa Gomes } 765a781ccbSVinicius Costa Gomes 775a781ccbSVinicius Costa Gomes static struct sk_buff *taprio_peek(struct Qdisc *sch) 785a781ccbSVinicius Costa Gomes { 795a781ccbSVinicius Costa Gomes struct taprio_sched *q = qdisc_priv(sch); 805a781ccbSVinicius Costa Gomes struct net_device *dev = qdisc_dev(sch); 815a781ccbSVinicius Costa Gomes struct sched_entry *entry; 825a781ccbSVinicius Costa Gomes struct sk_buff *skb; 835a781ccbSVinicius Costa Gomes u32 gate_mask; 845a781ccbSVinicius Costa Gomes int i; 855a781ccbSVinicius Costa Gomes 865a781ccbSVinicius Costa Gomes rcu_read_lock(); 875a781ccbSVinicius Costa Gomes entry = rcu_dereference(q->current_entry); 885a781ccbSVinicius Costa Gomes gate_mask = entry ? entry->gate_mask : -1; 895a781ccbSVinicius Costa Gomes rcu_read_unlock(); 905a781ccbSVinicius Costa Gomes 915a781ccbSVinicius Costa Gomes if (!gate_mask) 925a781ccbSVinicius Costa Gomes return NULL; 935a781ccbSVinicius Costa Gomes 945a781ccbSVinicius Costa Gomes for (i = 0; i < dev->num_tx_queues; i++) { 955a781ccbSVinicius Costa Gomes struct Qdisc *child = q->qdiscs[i]; 965a781ccbSVinicius Costa Gomes int prio; 975a781ccbSVinicius Costa Gomes u8 tc; 985a781ccbSVinicius Costa Gomes 995a781ccbSVinicius Costa Gomes if (unlikely(!child)) 1005a781ccbSVinicius Costa Gomes continue; 1015a781ccbSVinicius Costa Gomes 1025a781ccbSVinicius Costa Gomes skb = child->ops->peek(child); 1035a781ccbSVinicius Costa Gomes if (!skb) 1045a781ccbSVinicius Costa Gomes continue; 1055a781ccbSVinicius Costa Gomes 1065a781ccbSVinicius Costa Gomes prio = skb->priority; 1075a781ccbSVinicius Costa Gomes tc = netdev_get_prio_tc_map(dev, prio); 1085a781ccbSVinicius Costa Gomes 1095a781ccbSVinicius Costa Gomes if (!(gate_mask & BIT(tc))) 1105a781ccbSVinicius Costa Gomes return NULL; 1115a781ccbSVinicius Costa Gomes 1125a781ccbSVinicius Costa Gomes return skb; 1135a781ccbSVinicius Costa Gomes } 1145a781ccbSVinicius Costa Gomes 1155a781ccbSVinicius Costa Gomes return NULL; 1165a781ccbSVinicius Costa Gomes } 1175a781ccbSVinicius Costa Gomes 1185a781ccbSVinicius Costa Gomes static inline int length_to_duration(struct taprio_sched *q, int len) 1195a781ccbSVinicius Costa Gomes { 1205a781ccbSVinicius Costa Gomes return (len * q->picos_per_byte) / 1000; 1215a781ccbSVinicius Costa Gomes } 1225a781ccbSVinicius Costa Gomes 1235a781ccbSVinicius Costa Gomes static struct sk_buff *taprio_dequeue(struct Qdisc *sch) 1245a781ccbSVinicius Costa Gomes { 1255a781ccbSVinicius Costa Gomes struct taprio_sched *q = qdisc_priv(sch); 1265a781ccbSVinicius Costa Gomes struct net_device *dev = qdisc_dev(sch); 1275a781ccbSVinicius Costa Gomes struct sched_entry *entry; 1285a781ccbSVinicius Costa Gomes struct sk_buff *skb; 1295a781ccbSVinicius Costa Gomes u32 gate_mask; 1305a781ccbSVinicius Costa Gomes int i; 1315a781ccbSVinicius Costa Gomes 1325a781ccbSVinicius Costa Gomes rcu_read_lock(); 1335a781ccbSVinicius Costa Gomes entry = rcu_dereference(q->current_entry); 1345a781ccbSVinicius Costa Gomes /* if there's no entry, it means that the schedule didn't 1355a781ccbSVinicius Costa Gomes * start yet, so force all gates to be open, this is in 1365a781ccbSVinicius Costa Gomes * accordance to IEEE 802.1Qbv-2015 Section 8.6.9.4.5 1375a781ccbSVinicius Costa Gomes * "AdminGateSates" 1385a781ccbSVinicius Costa Gomes */ 1395a781ccbSVinicius Costa Gomes gate_mask = entry ? entry->gate_mask : TAPRIO_ALL_GATES_OPEN; 1405a781ccbSVinicius Costa Gomes rcu_read_unlock(); 1415a781ccbSVinicius Costa Gomes 1425a781ccbSVinicius Costa Gomes if (!gate_mask) 1435a781ccbSVinicius Costa Gomes return NULL; 1445a781ccbSVinicius Costa Gomes 1455a781ccbSVinicius Costa Gomes for (i = 0; i < dev->num_tx_queues; i++) { 1465a781ccbSVinicius Costa Gomes struct Qdisc *child = q->qdiscs[i]; 1475a781ccbSVinicius Costa Gomes ktime_t guard; 1485a781ccbSVinicius Costa Gomes int prio; 1495a781ccbSVinicius Costa Gomes int len; 1505a781ccbSVinicius Costa Gomes u8 tc; 1515a781ccbSVinicius Costa Gomes 1525a781ccbSVinicius Costa Gomes if (unlikely(!child)) 1535a781ccbSVinicius Costa Gomes continue; 1545a781ccbSVinicius Costa Gomes 1555a781ccbSVinicius Costa Gomes skb = child->ops->peek(child); 1565a781ccbSVinicius Costa Gomes if (!skb) 1575a781ccbSVinicius Costa Gomes continue; 1585a781ccbSVinicius Costa Gomes 1595a781ccbSVinicius Costa Gomes prio = skb->priority; 1605a781ccbSVinicius Costa Gomes tc = netdev_get_prio_tc_map(dev, prio); 1615a781ccbSVinicius Costa Gomes 1625a781ccbSVinicius Costa Gomes if (!(gate_mask & BIT(tc))) 1635a781ccbSVinicius Costa Gomes continue; 1645a781ccbSVinicius Costa Gomes 1655a781ccbSVinicius Costa Gomes len = qdisc_pkt_len(skb); 1665a781ccbSVinicius Costa Gomes guard = ktime_add_ns(q->get_time(), 1675a781ccbSVinicius Costa Gomes length_to_duration(q, len)); 1685a781ccbSVinicius Costa Gomes 1695a781ccbSVinicius Costa Gomes /* In the case that there's no gate entry, there's no 1705a781ccbSVinicius Costa Gomes * guard band ... 1715a781ccbSVinicius Costa Gomes */ 1725a781ccbSVinicius Costa Gomes if (gate_mask != TAPRIO_ALL_GATES_OPEN && 1735a781ccbSVinicius Costa Gomes ktime_after(guard, entry->close_time)) 1745a781ccbSVinicius Costa Gomes return NULL; 1755a781ccbSVinicius Costa Gomes 1765a781ccbSVinicius Costa Gomes /* ... and no budget. */ 1775a781ccbSVinicius Costa Gomes if (gate_mask != TAPRIO_ALL_GATES_OPEN && 1785a781ccbSVinicius Costa Gomes atomic_sub_return(len, &entry->budget) < 0) 1795a781ccbSVinicius Costa Gomes return NULL; 1805a781ccbSVinicius Costa Gomes 1815a781ccbSVinicius Costa Gomes skb = child->ops->dequeue(child); 1825a781ccbSVinicius Costa Gomes if (unlikely(!skb)) 1835a781ccbSVinicius Costa Gomes return NULL; 1845a781ccbSVinicius Costa Gomes 1855a781ccbSVinicius Costa Gomes qdisc_bstats_update(sch, skb); 1865a781ccbSVinicius Costa Gomes qdisc_qstats_backlog_dec(sch, skb); 1875a781ccbSVinicius Costa Gomes sch->q.qlen--; 1885a781ccbSVinicius Costa Gomes 1895a781ccbSVinicius Costa Gomes return skb; 1905a781ccbSVinicius Costa Gomes } 1915a781ccbSVinicius Costa Gomes 1925a781ccbSVinicius Costa Gomes return NULL; 1935a781ccbSVinicius Costa Gomes } 1945a781ccbSVinicius Costa Gomes 1955a781ccbSVinicius Costa Gomes static bool should_restart_cycle(const struct taprio_sched *q, 1965a781ccbSVinicius Costa Gomes const struct sched_entry *entry) 1975a781ccbSVinicius Costa Gomes { 1985a781ccbSVinicius Costa Gomes WARN_ON(!entry); 1995a781ccbSVinicius Costa Gomes 2005a781ccbSVinicius Costa Gomes return list_is_last(&entry->list, &q->entries); 2015a781ccbSVinicius Costa Gomes } 2025a781ccbSVinicius Costa Gomes 2035a781ccbSVinicius Costa Gomes static enum hrtimer_restart advance_sched(struct hrtimer *timer) 2045a781ccbSVinicius Costa Gomes { 2055a781ccbSVinicius Costa Gomes struct taprio_sched *q = container_of(timer, struct taprio_sched, 2065a781ccbSVinicius Costa Gomes advance_timer); 2075a781ccbSVinicius Costa Gomes struct sched_entry *entry, *next; 2085a781ccbSVinicius Costa Gomes struct Qdisc *sch = q->root; 2095a781ccbSVinicius Costa Gomes ktime_t close_time; 2105a781ccbSVinicius Costa Gomes 2115a781ccbSVinicius Costa Gomes spin_lock(&q->current_entry_lock); 2125a781ccbSVinicius Costa Gomes entry = rcu_dereference_protected(q->current_entry, 2135a781ccbSVinicius Costa Gomes lockdep_is_held(&q->current_entry_lock)); 2145a781ccbSVinicius Costa Gomes 2155a781ccbSVinicius Costa Gomes /* This is the case that it's the first time that the schedule 2165a781ccbSVinicius Costa Gomes * runs, so it only happens once per schedule. The first entry 2175a781ccbSVinicius Costa Gomes * is pre-calculated during the schedule initialization. 2185a781ccbSVinicius Costa Gomes */ 2195a781ccbSVinicius Costa Gomes if (unlikely(!entry)) { 2205a781ccbSVinicius Costa Gomes next = list_first_entry(&q->entries, struct sched_entry, 2215a781ccbSVinicius Costa Gomes list); 2225a781ccbSVinicius Costa Gomes close_time = next->close_time; 2235a781ccbSVinicius Costa Gomes goto first_run; 2245a781ccbSVinicius Costa Gomes } 2255a781ccbSVinicius Costa Gomes 2265a781ccbSVinicius Costa Gomes if (should_restart_cycle(q, entry)) 2275a781ccbSVinicius Costa Gomes next = list_first_entry(&q->entries, struct sched_entry, 2285a781ccbSVinicius Costa Gomes list); 2295a781ccbSVinicius Costa Gomes else 2305a781ccbSVinicius Costa Gomes next = list_next_entry(entry, list); 2315a781ccbSVinicius Costa Gomes 2325a781ccbSVinicius Costa Gomes close_time = ktime_add_ns(entry->close_time, next->interval); 2335a781ccbSVinicius Costa Gomes 2345a781ccbSVinicius Costa Gomes next->close_time = close_time; 2355a781ccbSVinicius Costa Gomes atomic_set(&next->budget, 2365a781ccbSVinicius Costa Gomes (next->interval * 1000) / q->picos_per_byte); 2375a781ccbSVinicius Costa Gomes 2385a781ccbSVinicius Costa Gomes first_run: 2395a781ccbSVinicius Costa Gomes rcu_assign_pointer(q->current_entry, next); 2405a781ccbSVinicius Costa Gomes spin_unlock(&q->current_entry_lock); 2415a781ccbSVinicius Costa Gomes 2425a781ccbSVinicius Costa Gomes hrtimer_set_expires(&q->advance_timer, close_time); 2435a781ccbSVinicius Costa Gomes 2445a781ccbSVinicius Costa Gomes rcu_read_lock(); 2455a781ccbSVinicius Costa Gomes __netif_schedule(sch); 2465a781ccbSVinicius Costa Gomes rcu_read_unlock(); 2475a781ccbSVinicius Costa Gomes 2485a781ccbSVinicius Costa Gomes return HRTIMER_RESTART; 2495a781ccbSVinicius Costa Gomes } 2505a781ccbSVinicius Costa Gomes 2515a781ccbSVinicius Costa Gomes static const struct nla_policy entry_policy[TCA_TAPRIO_SCHED_ENTRY_MAX + 1] = { 2525a781ccbSVinicius Costa Gomes [TCA_TAPRIO_SCHED_ENTRY_INDEX] = { .type = NLA_U32 }, 2535a781ccbSVinicius Costa Gomes [TCA_TAPRIO_SCHED_ENTRY_CMD] = { .type = NLA_U8 }, 2545a781ccbSVinicius Costa Gomes [TCA_TAPRIO_SCHED_ENTRY_GATE_MASK] = { .type = NLA_U32 }, 2555a781ccbSVinicius Costa Gomes [TCA_TAPRIO_SCHED_ENTRY_INTERVAL] = { .type = NLA_U32 }, 2565a781ccbSVinicius Costa Gomes }; 2575a781ccbSVinicius Costa Gomes 2585a781ccbSVinicius Costa Gomes static const struct nla_policy entry_list_policy[TCA_TAPRIO_SCHED_MAX + 1] = { 2595a781ccbSVinicius Costa Gomes [TCA_TAPRIO_SCHED_ENTRY] = { .type = NLA_NESTED }, 2605a781ccbSVinicius Costa Gomes }; 2615a781ccbSVinicius Costa Gomes 2625a781ccbSVinicius Costa Gomes static const struct nla_policy taprio_policy[TCA_TAPRIO_ATTR_MAX + 1] = { 2635a781ccbSVinicius Costa Gomes [TCA_TAPRIO_ATTR_PRIOMAP] = { 2645a781ccbSVinicius Costa Gomes .len = sizeof(struct tc_mqprio_qopt) 2655a781ccbSVinicius Costa Gomes }, 2665a781ccbSVinicius Costa Gomes [TCA_TAPRIO_ATTR_SCHED_ENTRY_LIST] = { .type = NLA_NESTED }, 2675a781ccbSVinicius Costa Gomes [TCA_TAPRIO_ATTR_SCHED_BASE_TIME] = { .type = NLA_S64 }, 2685a781ccbSVinicius Costa Gomes [TCA_TAPRIO_ATTR_SCHED_SINGLE_ENTRY] = { .type = NLA_NESTED }, 2695a781ccbSVinicius Costa Gomes [TCA_TAPRIO_ATTR_SCHED_CLOCKID] = { .type = NLA_S32 }, 2705a781ccbSVinicius Costa Gomes }; 2715a781ccbSVinicius Costa Gomes 2725a781ccbSVinicius Costa Gomes static int fill_sched_entry(struct nlattr **tb, struct sched_entry *entry, 2735a781ccbSVinicius Costa Gomes struct netlink_ext_ack *extack) 2745a781ccbSVinicius Costa Gomes { 2755a781ccbSVinicius Costa Gomes u32 interval = 0; 2765a781ccbSVinicius Costa Gomes 2775a781ccbSVinicius Costa Gomes if (tb[TCA_TAPRIO_SCHED_ENTRY_CMD]) 2785a781ccbSVinicius Costa Gomes entry->command = nla_get_u8( 2795a781ccbSVinicius Costa Gomes tb[TCA_TAPRIO_SCHED_ENTRY_CMD]); 2805a781ccbSVinicius Costa Gomes 2815a781ccbSVinicius Costa Gomes if (tb[TCA_TAPRIO_SCHED_ENTRY_GATE_MASK]) 2825a781ccbSVinicius Costa Gomes entry->gate_mask = nla_get_u32( 2835a781ccbSVinicius Costa Gomes tb[TCA_TAPRIO_SCHED_ENTRY_GATE_MASK]); 2845a781ccbSVinicius Costa Gomes 2855a781ccbSVinicius Costa Gomes if (tb[TCA_TAPRIO_SCHED_ENTRY_INTERVAL]) 2865a781ccbSVinicius Costa Gomes interval = nla_get_u32( 2875a781ccbSVinicius Costa Gomes tb[TCA_TAPRIO_SCHED_ENTRY_INTERVAL]); 2885a781ccbSVinicius Costa Gomes 2895a781ccbSVinicius Costa Gomes if (interval == 0) { 2905a781ccbSVinicius Costa Gomes NL_SET_ERR_MSG(extack, "Invalid interval for schedule entry"); 2915a781ccbSVinicius Costa Gomes return -EINVAL; 2925a781ccbSVinicius Costa Gomes } 2935a781ccbSVinicius Costa Gomes 2945a781ccbSVinicius Costa Gomes entry->interval = interval; 2955a781ccbSVinicius Costa Gomes 2965a781ccbSVinicius Costa Gomes return 0; 2975a781ccbSVinicius Costa Gomes } 2985a781ccbSVinicius Costa Gomes 2995a781ccbSVinicius Costa Gomes static int parse_sched_entry(struct nlattr *n, struct sched_entry *entry, 3005a781ccbSVinicius Costa Gomes int index, struct netlink_ext_ack *extack) 3015a781ccbSVinicius Costa Gomes { 3025a781ccbSVinicius Costa Gomes struct nlattr *tb[TCA_TAPRIO_SCHED_ENTRY_MAX + 1] = { }; 3035a781ccbSVinicius Costa Gomes int err; 3045a781ccbSVinicius Costa Gomes 3055a781ccbSVinicius Costa Gomes err = nla_parse_nested(tb, TCA_TAPRIO_SCHED_ENTRY_MAX, n, 3065a781ccbSVinicius Costa Gomes entry_policy, NULL); 3075a781ccbSVinicius Costa Gomes if (err < 0) { 3085a781ccbSVinicius Costa Gomes NL_SET_ERR_MSG(extack, "Could not parse nested entry"); 3095a781ccbSVinicius Costa Gomes return -EINVAL; 3105a781ccbSVinicius Costa Gomes } 3115a781ccbSVinicius Costa Gomes 3125a781ccbSVinicius Costa Gomes entry->index = index; 3135a781ccbSVinicius Costa Gomes 3145a781ccbSVinicius Costa Gomes return fill_sched_entry(tb, entry, extack); 3155a781ccbSVinicius Costa Gomes } 3165a781ccbSVinicius Costa Gomes 3175a781ccbSVinicius Costa Gomes /* Returns the number of entries in case of success */ 3185a781ccbSVinicius Costa Gomes static int parse_sched_single_entry(struct nlattr *n, 3195a781ccbSVinicius Costa Gomes struct taprio_sched *q, 3205a781ccbSVinicius Costa Gomes struct netlink_ext_ack *extack) 3215a781ccbSVinicius Costa Gomes { 3225a781ccbSVinicius Costa Gomes struct nlattr *tb_entry[TCA_TAPRIO_SCHED_ENTRY_MAX + 1] = { }; 3235a781ccbSVinicius Costa Gomes struct nlattr *tb_list[TCA_TAPRIO_SCHED_MAX + 1] = { }; 3245a781ccbSVinicius Costa Gomes struct sched_entry *entry; 3255a781ccbSVinicius Costa Gomes bool found = false; 3265a781ccbSVinicius Costa Gomes u32 index; 3275a781ccbSVinicius Costa Gomes int err; 3285a781ccbSVinicius Costa Gomes 3295a781ccbSVinicius Costa Gomes err = nla_parse_nested(tb_list, TCA_TAPRIO_SCHED_MAX, 3305a781ccbSVinicius Costa Gomes n, entry_list_policy, NULL); 3315a781ccbSVinicius Costa Gomes if (err < 0) { 3325a781ccbSVinicius Costa Gomes NL_SET_ERR_MSG(extack, "Could not parse nested entry"); 3335a781ccbSVinicius Costa Gomes return -EINVAL; 3345a781ccbSVinicius Costa Gomes } 3355a781ccbSVinicius Costa Gomes 3365a781ccbSVinicius Costa Gomes if (!tb_list[TCA_TAPRIO_SCHED_ENTRY]) { 3375a781ccbSVinicius Costa Gomes NL_SET_ERR_MSG(extack, "Single-entry must include an entry"); 3385a781ccbSVinicius Costa Gomes return -EINVAL; 3395a781ccbSVinicius Costa Gomes } 3405a781ccbSVinicius Costa Gomes 3415a781ccbSVinicius Costa Gomes err = nla_parse_nested(tb_entry, TCA_TAPRIO_SCHED_ENTRY_MAX, 3425a781ccbSVinicius Costa Gomes tb_list[TCA_TAPRIO_SCHED_ENTRY], 3435a781ccbSVinicius Costa Gomes entry_policy, NULL); 3445a781ccbSVinicius Costa Gomes if (err < 0) { 3455a781ccbSVinicius Costa Gomes NL_SET_ERR_MSG(extack, "Could not parse nested entry"); 3465a781ccbSVinicius Costa Gomes return -EINVAL; 3475a781ccbSVinicius Costa Gomes } 3485a781ccbSVinicius Costa Gomes 3495a781ccbSVinicius Costa Gomes if (!tb_entry[TCA_TAPRIO_SCHED_ENTRY_INDEX]) { 3505a781ccbSVinicius Costa Gomes NL_SET_ERR_MSG(extack, "Entry must specify an index\n"); 3515a781ccbSVinicius Costa Gomes return -EINVAL; 3525a781ccbSVinicius Costa Gomes } 3535a781ccbSVinicius Costa Gomes 3545a781ccbSVinicius Costa Gomes index = nla_get_u32(tb_entry[TCA_TAPRIO_SCHED_ENTRY_INDEX]); 3555a781ccbSVinicius Costa Gomes if (index >= q->num_entries) { 3565a781ccbSVinicius Costa Gomes NL_SET_ERR_MSG(extack, "Index for single entry exceeds number of entries in schedule"); 3575a781ccbSVinicius Costa Gomes return -EINVAL; 3585a781ccbSVinicius Costa Gomes } 3595a781ccbSVinicius Costa Gomes 3605a781ccbSVinicius Costa Gomes list_for_each_entry(entry, &q->entries, list) { 3615a781ccbSVinicius Costa Gomes if (entry->index == index) { 3625a781ccbSVinicius Costa Gomes found = true; 3635a781ccbSVinicius Costa Gomes break; 3645a781ccbSVinicius Costa Gomes } 3655a781ccbSVinicius Costa Gomes } 3665a781ccbSVinicius Costa Gomes 3675a781ccbSVinicius Costa Gomes if (!found) { 3685a781ccbSVinicius Costa Gomes NL_SET_ERR_MSG(extack, "Could not find entry"); 3695a781ccbSVinicius Costa Gomes return -ENOENT; 3705a781ccbSVinicius Costa Gomes } 3715a781ccbSVinicius Costa Gomes 3725a781ccbSVinicius Costa Gomes err = fill_sched_entry(tb_entry, entry, extack); 3735a781ccbSVinicius Costa Gomes if (err < 0) 3745a781ccbSVinicius Costa Gomes return err; 3755a781ccbSVinicius Costa Gomes 3765a781ccbSVinicius Costa Gomes return q->num_entries; 3775a781ccbSVinicius Costa Gomes } 3785a781ccbSVinicius Costa Gomes 3795a781ccbSVinicius Costa Gomes static int parse_sched_list(struct nlattr *list, 3805a781ccbSVinicius Costa Gomes struct taprio_sched *q, 3815a781ccbSVinicius Costa Gomes struct netlink_ext_ack *extack) 3825a781ccbSVinicius Costa Gomes { 3835a781ccbSVinicius Costa Gomes struct nlattr *n; 3845a781ccbSVinicius Costa Gomes int err, rem; 3855a781ccbSVinicius Costa Gomes int i = 0; 3865a781ccbSVinicius Costa Gomes 3875a781ccbSVinicius Costa Gomes if (!list) 3885a781ccbSVinicius Costa Gomes return -EINVAL; 3895a781ccbSVinicius Costa Gomes 3905a781ccbSVinicius Costa Gomes nla_for_each_nested(n, list, rem) { 3915a781ccbSVinicius Costa Gomes struct sched_entry *entry; 3925a781ccbSVinicius Costa Gomes 3935a781ccbSVinicius Costa Gomes if (nla_type(n) != TCA_TAPRIO_SCHED_ENTRY) { 3945a781ccbSVinicius Costa Gomes NL_SET_ERR_MSG(extack, "Attribute is not of type 'entry'"); 3955a781ccbSVinicius Costa Gomes continue; 3965a781ccbSVinicius Costa Gomes } 3975a781ccbSVinicius Costa Gomes 3985a781ccbSVinicius Costa Gomes entry = kzalloc(sizeof(*entry), GFP_KERNEL); 3995a781ccbSVinicius Costa Gomes if (!entry) { 4005a781ccbSVinicius Costa Gomes NL_SET_ERR_MSG(extack, "Not enough memory for entry"); 4015a781ccbSVinicius Costa Gomes return -ENOMEM; 4025a781ccbSVinicius Costa Gomes } 4035a781ccbSVinicius Costa Gomes 4045a781ccbSVinicius Costa Gomes err = parse_sched_entry(n, entry, i, extack); 4055a781ccbSVinicius Costa Gomes if (err < 0) { 4065a781ccbSVinicius Costa Gomes kfree(entry); 4075a781ccbSVinicius Costa Gomes return err; 4085a781ccbSVinicius Costa Gomes } 4095a781ccbSVinicius Costa Gomes 4105a781ccbSVinicius Costa Gomes list_add_tail(&entry->list, &q->entries); 4115a781ccbSVinicius Costa Gomes i++; 4125a781ccbSVinicius Costa Gomes } 4135a781ccbSVinicius Costa Gomes 4145a781ccbSVinicius Costa Gomes q->num_entries = i; 4155a781ccbSVinicius Costa Gomes 4165a781ccbSVinicius Costa Gomes return i; 4175a781ccbSVinicius Costa Gomes } 4185a781ccbSVinicius Costa Gomes 4195a781ccbSVinicius Costa Gomes /* Returns the number of entries in case of success */ 4205a781ccbSVinicius Costa Gomes static int parse_taprio_opt(struct nlattr **tb, struct taprio_sched *q, 4215a781ccbSVinicius Costa Gomes struct netlink_ext_ack *extack) 4225a781ccbSVinicius Costa Gomes { 4235a781ccbSVinicius Costa Gomes int err = 0; 4245a781ccbSVinicius Costa Gomes int clockid; 4255a781ccbSVinicius Costa Gomes 4265a781ccbSVinicius Costa Gomes if (tb[TCA_TAPRIO_ATTR_SCHED_ENTRY_LIST] && 4275a781ccbSVinicius Costa Gomes tb[TCA_TAPRIO_ATTR_SCHED_SINGLE_ENTRY]) 4285a781ccbSVinicius Costa Gomes return -EINVAL; 4295a781ccbSVinicius Costa Gomes 4305a781ccbSVinicius Costa Gomes if (tb[TCA_TAPRIO_ATTR_SCHED_SINGLE_ENTRY] && q->num_entries == 0) 4315a781ccbSVinicius Costa Gomes return -EINVAL; 4325a781ccbSVinicius Costa Gomes 4335a781ccbSVinicius Costa Gomes if (q->clockid == -1 && !tb[TCA_TAPRIO_ATTR_SCHED_CLOCKID]) 4345a781ccbSVinicius Costa Gomes return -EINVAL; 4355a781ccbSVinicius Costa Gomes 4365a781ccbSVinicius Costa Gomes if (tb[TCA_TAPRIO_ATTR_SCHED_BASE_TIME]) 4375a781ccbSVinicius Costa Gomes q->base_time = nla_get_s64( 4385a781ccbSVinicius Costa Gomes tb[TCA_TAPRIO_ATTR_SCHED_BASE_TIME]); 4395a781ccbSVinicius Costa Gomes 4405a781ccbSVinicius Costa Gomes if (tb[TCA_TAPRIO_ATTR_SCHED_CLOCKID]) { 4415a781ccbSVinicius Costa Gomes clockid = nla_get_s32(tb[TCA_TAPRIO_ATTR_SCHED_CLOCKID]); 4425a781ccbSVinicius Costa Gomes 4435a781ccbSVinicius Costa Gomes /* We only support static clockids and we don't allow 4445a781ccbSVinicius Costa Gomes * for it to be modified after the first init. 4455a781ccbSVinicius Costa Gomes */ 4465a781ccbSVinicius Costa Gomes if (clockid < 0 || (q->clockid != -1 && q->clockid != clockid)) 4475a781ccbSVinicius Costa Gomes return -EINVAL; 4485a781ccbSVinicius Costa Gomes 4495a781ccbSVinicius Costa Gomes q->clockid = clockid; 4505a781ccbSVinicius Costa Gomes } 4515a781ccbSVinicius Costa Gomes 4525a781ccbSVinicius Costa Gomes if (tb[TCA_TAPRIO_ATTR_SCHED_ENTRY_LIST]) 4535a781ccbSVinicius Costa Gomes err = parse_sched_list( 4545a781ccbSVinicius Costa Gomes tb[TCA_TAPRIO_ATTR_SCHED_ENTRY_LIST], q, extack); 4555a781ccbSVinicius Costa Gomes else if (tb[TCA_TAPRIO_ATTR_SCHED_SINGLE_ENTRY]) 4565a781ccbSVinicius Costa Gomes err = parse_sched_single_entry( 4575a781ccbSVinicius Costa Gomes tb[TCA_TAPRIO_ATTR_SCHED_SINGLE_ENTRY], q, extack); 4585a781ccbSVinicius Costa Gomes 4595a781ccbSVinicius Costa Gomes /* parse_sched_* return the number of entries in the schedule, 4605a781ccbSVinicius Costa Gomes * a schedule with zero entries is an error. 4615a781ccbSVinicius Costa Gomes */ 4625a781ccbSVinicius Costa Gomes if (err == 0) { 4635a781ccbSVinicius Costa Gomes NL_SET_ERR_MSG(extack, "The schedule should contain at least one entry"); 4645a781ccbSVinicius Costa Gomes return -EINVAL; 4655a781ccbSVinicius Costa Gomes } 4665a781ccbSVinicius Costa Gomes 4675a781ccbSVinicius Costa Gomes return err; 4685a781ccbSVinicius Costa Gomes } 4695a781ccbSVinicius Costa Gomes 4705a781ccbSVinicius Costa Gomes static int taprio_parse_mqprio_opt(struct net_device *dev, 4715a781ccbSVinicius Costa Gomes struct tc_mqprio_qopt *qopt, 4725a781ccbSVinicius Costa Gomes struct netlink_ext_ack *extack) 4735a781ccbSVinicius Costa Gomes { 4745a781ccbSVinicius Costa Gomes int i, j; 4755a781ccbSVinicius Costa Gomes 4765a781ccbSVinicius Costa Gomes if (!qopt) { 4775a781ccbSVinicius Costa Gomes NL_SET_ERR_MSG(extack, "'mqprio' configuration is necessary"); 4785a781ccbSVinicius Costa Gomes return -EINVAL; 4795a781ccbSVinicius Costa Gomes } 4805a781ccbSVinicius Costa Gomes 4815a781ccbSVinicius Costa Gomes /* Verify num_tc is not out of max range */ 4825a781ccbSVinicius Costa Gomes if (qopt->num_tc > TC_MAX_QUEUE) { 4835a781ccbSVinicius Costa Gomes NL_SET_ERR_MSG(extack, "Number of traffic classes is outside valid range"); 4845a781ccbSVinicius Costa Gomes return -EINVAL; 4855a781ccbSVinicius Costa Gomes } 4865a781ccbSVinicius Costa Gomes 4875a781ccbSVinicius Costa Gomes /* taprio imposes that traffic classes map 1:n to tx queues */ 4885a781ccbSVinicius Costa Gomes if (qopt->num_tc > dev->num_tx_queues) { 4895a781ccbSVinicius Costa Gomes NL_SET_ERR_MSG(extack, "Number of traffic classes is greater than number of HW queues"); 4905a781ccbSVinicius Costa Gomes return -EINVAL; 4915a781ccbSVinicius Costa Gomes } 4925a781ccbSVinicius Costa Gomes 4935a781ccbSVinicius Costa Gomes /* Verify priority mapping uses valid tcs */ 4945a781ccbSVinicius Costa Gomes for (i = 0; i < TC_BITMASK + 1; i++) { 4955a781ccbSVinicius Costa Gomes if (qopt->prio_tc_map[i] >= qopt->num_tc) { 4965a781ccbSVinicius Costa Gomes NL_SET_ERR_MSG(extack, "Invalid traffic class in priority to traffic class mapping"); 4975a781ccbSVinicius Costa Gomes return -EINVAL; 4985a781ccbSVinicius Costa Gomes } 4995a781ccbSVinicius Costa Gomes } 5005a781ccbSVinicius Costa Gomes 5015a781ccbSVinicius Costa Gomes for (i = 0; i < qopt->num_tc; i++) { 5025a781ccbSVinicius Costa Gomes unsigned int last = qopt->offset[i] + qopt->count[i]; 5035a781ccbSVinicius Costa Gomes 5045a781ccbSVinicius Costa Gomes /* Verify the queue count is in tx range being equal to the 5055a781ccbSVinicius Costa Gomes * real_num_tx_queues indicates the last queue is in use. 5065a781ccbSVinicius Costa Gomes */ 5075a781ccbSVinicius Costa Gomes if (qopt->offset[i] >= dev->num_tx_queues || 5085a781ccbSVinicius Costa Gomes !qopt->count[i] || 5095a781ccbSVinicius Costa Gomes last > dev->real_num_tx_queues) { 5105a781ccbSVinicius Costa Gomes NL_SET_ERR_MSG(extack, "Invalid queue in traffic class to queue mapping"); 5115a781ccbSVinicius Costa Gomes return -EINVAL; 5125a781ccbSVinicius Costa Gomes } 5135a781ccbSVinicius Costa Gomes 5145a781ccbSVinicius Costa Gomes /* Verify that the offset and counts do not overlap */ 5155a781ccbSVinicius Costa Gomes for (j = i + 1; j < qopt->num_tc; j++) { 5165a781ccbSVinicius Costa Gomes if (last > qopt->offset[j]) { 5175a781ccbSVinicius Costa Gomes NL_SET_ERR_MSG(extack, "Detected overlap in the traffic class to queue mapping"); 5185a781ccbSVinicius Costa Gomes return -EINVAL; 5195a781ccbSVinicius Costa Gomes } 5205a781ccbSVinicius Costa Gomes } 5215a781ccbSVinicius Costa Gomes } 5225a781ccbSVinicius Costa Gomes 5235a781ccbSVinicius Costa Gomes return 0; 5245a781ccbSVinicius Costa Gomes } 5255a781ccbSVinicius Costa Gomes 5265a781ccbSVinicius Costa Gomes static ktime_t taprio_get_start_time(struct Qdisc *sch) 5275a781ccbSVinicius Costa Gomes { 5285a781ccbSVinicius Costa Gomes struct taprio_sched *q = qdisc_priv(sch); 5295a781ccbSVinicius Costa Gomes struct sched_entry *entry; 5305a781ccbSVinicius Costa Gomes ktime_t now, base, cycle; 5315a781ccbSVinicius Costa Gomes s64 n; 5325a781ccbSVinicius Costa Gomes 5335a781ccbSVinicius Costa Gomes base = ns_to_ktime(q->base_time); 5345a781ccbSVinicius Costa Gomes cycle = 0; 5355a781ccbSVinicius Costa Gomes 5365a781ccbSVinicius Costa Gomes /* Calculate the cycle_time, by summing all the intervals. 5375a781ccbSVinicius Costa Gomes */ 5385a781ccbSVinicius Costa Gomes list_for_each_entry(entry, &q->entries, list) 5395a781ccbSVinicius Costa Gomes cycle = ktime_add_ns(cycle, entry->interval); 5405a781ccbSVinicius Costa Gomes 5415a781ccbSVinicius Costa Gomes if (!cycle) 5425a781ccbSVinicius Costa Gomes return base; 5435a781ccbSVinicius Costa Gomes 5445a781ccbSVinicius Costa Gomes now = q->get_time(); 5455a781ccbSVinicius Costa Gomes 5465a781ccbSVinicius Costa Gomes if (ktime_after(base, now)) 5475a781ccbSVinicius Costa Gomes return base; 5485a781ccbSVinicius Costa Gomes 5495a781ccbSVinicius Costa Gomes /* Schedule the start time for the beginning of the next 5505a781ccbSVinicius Costa Gomes * cycle. 5515a781ccbSVinicius Costa Gomes */ 5525a781ccbSVinicius Costa Gomes n = div64_s64(ktime_sub_ns(now, base), cycle); 5535a781ccbSVinicius Costa Gomes 5545a781ccbSVinicius Costa Gomes return ktime_add_ns(base, (n + 1) * cycle); 5555a781ccbSVinicius Costa Gomes } 5565a781ccbSVinicius Costa Gomes 5575a781ccbSVinicius Costa Gomes static void taprio_start_sched(struct Qdisc *sch, ktime_t start) 5585a781ccbSVinicius Costa Gomes { 5595a781ccbSVinicius Costa Gomes struct taprio_sched *q = qdisc_priv(sch); 5605a781ccbSVinicius Costa Gomes struct sched_entry *first; 5615a781ccbSVinicius Costa Gomes unsigned long flags; 5625a781ccbSVinicius Costa Gomes 5635a781ccbSVinicius Costa Gomes spin_lock_irqsave(&q->current_entry_lock, flags); 5645a781ccbSVinicius Costa Gomes 5655a781ccbSVinicius Costa Gomes first = list_first_entry(&q->entries, struct sched_entry, 5665a781ccbSVinicius Costa Gomes list); 5675a781ccbSVinicius Costa Gomes 5685a781ccbSVinicius Costa Gomes first->close_time = ktime_add_ns(start, first->interval); 5695a781ccbSVinicius Costa Gomes atomic_set(&first->budget, 5705a781ccbSVinicius Costa Gomes (first->interval * 1000) / q->picos_per_byte); 5715a781ccbSVinicius Costa Gomes rcu_assign_pointer(q->current_entry, NULL); 5725a781ccbSVinicius Costa Gomes 5735a781ccbSVinicius Costa Gomes spin_unlock_irqrestore(&q->current_entry_lock, flags); 5745a781ccbSVinicius Costa Gomes 5755a781ccbSVinicius Costa Gomes hrtimer_start(&q->advance_timer, start, HRTIMER_MODE_ABS); 5765a781ccbSVinicius Costa Gomes } 5775a781ccbSVinicius Costa Gomes 5785a781ccbSVinicius Costa Gomes static int taprio_change(struct Qdisc *sch, struct nlattr *opt, 5795a781ccbSVinicius Costa Gomes struct netlink_ext_ack *extack) 5805a781ccbSVinicius Costa Gomes { 5815a781ccbSVinicius Costa Gomes struct nlattr *tb[TCA_TAPRIO_ATTR_MAX + 1] = { }; 5825a781ccbSVinicius Costa Gomes struct taprio_sched *q = qdisc_priv(sch); 5835a781ccbSVinicius Costa Gomes struct net_device *dev = qdisc_dev(sch); 5845a781ccbSVinicius Costa Gomes struct tc_mqprio_qopt *mqprio = NULL; 5855a781ccbSVinicius Costa Gomes struct ethtool_link_ksettings ecmd; 5865a781ccbSVinicius Costa Gomes int i, err, size; 5875a781ccbSVinicius Costa Gomes s64 link_speed; 5885a781ccbSVinicius Costa Gomes ktime_t start; 5895a781ccbSVinicius Costa Gomes 5905a781ccbSVinicius Costa Gomes err = nla_parse_nested(tb, TCA_TAPRIO_ATTR_MAX, opt, 5915a781ccbSVinicius Costa Gomes taprio_policy, extack); 5925a781ccbSVinicius Costa Gomes if (err < 0) 5935a781ccbSVinicius Costa Gomes return err; 5945a781ccbSVinicius Costa Gomes 5955a781ccbSVinicius Costa Gomes err = -EINVAL; 5965a781ccbSVinicius Costa Gomes if (tb[TCA_TAPRIO_ATTR_PRIOMAP]) 5975a781ccbSVinicius Costa Gomes mqprio = nla_data(tb[TCA_TAPRIO_ATTR_PRIOMAP]); 5985a781ccbSVinicius Costa Gomes 5995a781ccbSVinicius Costa Gomes err = taprio_parse_mqprio_opt(dev, mqprio, extack); 6005a781ccbSVinicius Costa Gomes if (err < 0) 6015a781ccbSVinicius Costa Gomes return err; 6025a781ccbSVinicius Costa Gomes 6035a781ccbSVinicius Costa Gomes /* A schedule with less than one entry is an error */ 6045a781ccbSVinicius Costa Gomes size = parse_taprio_opt(tb, q, extack); 6055a781ccbSVinicius Costa Gomes if (size < 0) 6065a781ccbSVinicius Costa Gomes return size; 6075a781ccbSVinicius Costa Gomes 6085a781ccbSVinicius Costa Gomes hrtimer_init(&q->advance_timer, q->clockid, HRTIMER_MODE_ABS); 6095a781ccbSVinicius Costa Gomes q->advance_timer.function = advance_sched; 6105a781ccbSVinicius Costa Gomes 6115a781ccbSVinicius Costa Gomes switch (q->clockid) { 6125a781ccbSVinicius Costa Gomes case CLOCK_REALTIME: 6135a781ccbSVinicius Costa Gomes q->get_time = ktime_get_real; 6145a781ccbSVinicius Costa Gomes break; 6155a781ccbSVinicius Costa Gomes case CLOCK_MONOTONIC: 6165a781ccbSVinicius Costa Gomes q->get_time = ktime_get; 6175a781ccbSVinicius Costa Gomes break; 6185a781ccbSVinicius Costa Gomes case CLOCK_BOOTTIME: 6195a781ccbSVinicius Costa Gomes q->get_time = ktime_get_boottime; 6205a781ccbSVinicius Costa Gomes break; 6215a781ccbSVinicius Costa Gomes case CLOCK_TAI: 6225a781ccbSVinicius Costa Gomes q->get_time = ktime_get_clocktai; 6235a781ccbSVinicius Costa Gomes break; 6245a781ccbSVinicius Costa Gomes default: 6255a781ccbSVinicius Costa Gomes return -ENOTSUPP; 6265a781ccbSVinicius Costa Gomes } 6275a781ccbSVinicius Costa Gomes 6285a781ccbSVinicius Costa Gomes for (i = 0; i < dev->num_tx_queues; i++) { 6295a781ccbSVinicius Costa Gomes struct netdev_queue *dev_queue; 6305a781ccbSVinicius Costa Gomes struct Qdisc *qdisc; 6315a781ccbSVinicius Costa Gomes 6325a781ccbSVinicius Costa Gomes dev_queue = netdev_get_tx_queue(dev, i); 6335a781ccbSVinicius Costa Gomes qdisc = qdisc_create_dflt(dev_queue, 6345a781ccbSVinicius Costa Gomes &pfifo_qdisc_ops, 6355a781ccbSVinicius Costa Gomes TC_H_MAKE(TC_H_MAJ(sch->handle), 6365a781ccbSVinicius Costa Gomes TC_H_MIN(i + 1)), 6375a781ccbSVinicius Costa Gomes extack); 6385a781ccbSVinicius Costa Gomes if (!qdisc) 6395a781ccbSVinicius Costa Gomes return -ENOMEM; 6405a781ccbSVinicius Costa Gomes 6415a781ccbSVinicius Costa Gomes if (i < dev->real_num_tx_queues) 6425a781ccbSVinicius Costa Gomes qdisc_hash_add(qdisc, false); 6435a781ccbSVinicius Costa Gomes 6445a781ccbSVinicius Costa Gomes q->qdiscs[i] = qdisc; 6455a781ccbSVinicius Costa Gomes } 6465a781ccbSVinicius Costa Gomes 6475a781ccbSVinicius Costa Gomes if (mqprio) { 6485a781ccbSVinicius Costa Gomes netdev_set_num_tc(dev, mqprio->num_tc); 6495a781ccbSVinicius Costa Gomes for (i = 0; i < mqprio->num_tc; i++) 6505a781ccbSVinicius Costa Gomes netdev_set_tc_queue(dev, i, 6515a781ccbSVinicius Costa Gomes mqprio->count[i], 6525a781ccbSVinicius Costa Gomes mqprio->offset[i]); 6535a781ccbSVinicius Costa Gomes 6545a781ccbSVinicius Costa Gomes /* Always use supplied priority mappings */ 6555a781ccbSVinicius Costa Gomes for (i = 0; i < TC_BITMASK + 1; i++) 6565a781ccbSVinicius Costa Gomes netdev_set_prio_tc_map(dev, i, 6575a781ccbSVinicius Costa Gomes mqprio->prio_tc_map[i]); 6585a781ccbSVinicius Costa Gomes } 6595a781ccbSVinicius Costa Gomes 6605a781ccbSVinicius Costa Gomes if (!__ethtool_get_link_ksettings(dev, &ecmd)) 6615a781ccbSVinicius Costa Gomes link_speed = ecmd.base.speed; 6625a781ccbSVinicius Costa Gomes else 6635a781ccbSVinicius Costa Gomes link_speed = SPEED_1000; 6645a781ccbSVinicius Costa Gomes 6655a781ccbSVinicius Costa Gomes q->picos_per_byte = div64_s64(NSEC_PER_SEC * 1000LL * 8, 6665a781ccbSVinicius Costa Gomes link_speed * 1000 * 1000); 6675a781ccbSVinicius Costa Gomes 6685a781ccbSVinicius Costa Gomes start = taprio_get_start_time(sch); 6695a781ccbSVinicius Costa Gomes if (!start) 6705a781ccbSVinicius Costa Gomes return 0; 6715a781ccbSVinicius Costa Gomes 6725a781ccbSVinicius Costa Gomes taprio_start_sched(sch, start); 6735a781ccbSVinicius Costa Gomes 6745a781ccbSVinicius Costa Gomes return 0; 6755a781ccbSVinicius Costa Gomes } 6765a781ccbSVinicius Costa Gomes 6775a781ccbSVinicius Costa Gomes static void taprio_destroy(struct Qdisc *sch) 6785a781ccbSVinicius Costa Gomes { 6795a781ccbSVinicius Costa Gomes struct taprio_sched *q = qdisc_priv(sch); 6805a781ccbSVinicius Costa Gomes struct net_device *dev = qdisc_dev(sch); 6815a781ccbSVinicius Costa Gomes struct sched_entry *entry, *n; 6825a781ccbSVinicius Costa Gomes unsigned int i; 6835a781ccbSVinicius Costa Gomes 6845a781ccbSVinicius Costa Gomes hrtimer_cancel(&q->advance_timer); 6855a781ccbSVinicius Costa Gomes 6865a781ccbSVinicius Costa Gomes if (q->qdiscs) { 6875a781ccbSVinicius Costa Gomes for (i = 0; i < dev->num_tx_queues && q->qdiscs[i]; i++) 6885a781ccbSVinicius Costa Gomes qdisc_put(q->qdiscs[i]); 6895a781ccbSVinicius Costa Gomes 6905a781ccbSVinicius Costa Gomes kfree(q->qdiscs); 6915a781ccbSVinicius Costa Gomes } 6925a781ccbSVinicius Costa Gomes q->qdiscs = NULL; 6935a781ccbSVinicius Costa Gomes 6945a781ccbSVinicius Costa Gomes netdev_set_num_tc(dev, 0); 6955a781ccbSVinicius Costa Gomes 6965a781ccbSVinicius Costa Gomes list_for_each_entry_safe(entry, n, &q->entries, list) { 6975a781ccbSVinicius Costa Gomes list_del(&entry->list); 6985a781ccbSVinicius Costa Gomes kfree(entry); 6995a781ccbSVinicius Costa Gomes } 7005a781ccbSVinicius Costa Gomes } 7015a781ccbSVinicius Costa Gomes 7025a781ccbSVinicius Costa Gomes static int taprio_init(struct Qdisc *sch, struct nlattr *opt, 7035a781ccbSVinicius Costa Gomes struct netlink_ext_ack *extack) 7045a781ccbSVinicius Costa Gomes { 7055a781ccbSVinicius Costa Gomes struct taprio_sched *q = qdisc_priv(sch); 7065a781ccbSVinicius Costa Gomes struct net_device *dev = qdisc_dev(sch); 7075a781ccbSVinicius Costa Gomes 7085a781ccbSVinicius Costa Gomes INIT_LIST_HEAD(&q->entries); 7095a781ccbSVinicius Costa Gomes spin_lock_init(&q->current_entry_lock); 7105a781ccbSVinicius Costa Gomes 7115a781ccbSVinicius Costa Gomes /* We may overwrite the configuration later */ 7125a781ccbSVinicius Costa Gomes hrtimer_init(&q->advance_timer, CLOCK_TAI, HRTIMER_MODE_ABS); 7135a781ccbSVinicius Costa Gomes 7145a781ccbSVinicius Costa Gomes q->root = sch; 7155a781ccbSVinicius Costa Gomes 7165a781ccbSVinicius Costa Gomes /* We only support static clockids. Use an invalid value as default 7175a781ccbSVinicius Costa Gomes * and get the valid one on taprio_change(). 7185a781ccbSVinicius Costa Gomes */ 7195a781ccbSVinicius Costa Gomes q->clockid = -1; 7205a781ccbSVinicius Costa Gomes 7215a781ccbSVinicius Costa Gomes if (sch->parent != TC_H_ROOT) 7225a781ccbSVinicius Costa Gomes return -EOPNOTSUPP; 7235a781ccbSVinicius Costa Gomes 7245a781ccbSVinicius Costa Gomes if (!netif_is_multiqueue(dev)) 7255a781ccbSVinicius Costa Gomes return -EOPNOTSUPP; 7265a781ccbSVinicius Costa Gomes 7275a781ccbSVinicius Costa Gomes /* pre-allocate qdisc, attachment can't fail */ 7285a781ccbSVinicius Costa Gomes q->qdiscs = kcalloc(dev->num_tx_queues, 7295a781ccbSVinicius Costa Gomes sizeof(q->qdiscs[0]), 7305a781ccbSVinicius Costa Gomes GFP_KERNEL); 7315a781ccbSVinicius Costa Gomes 7325a781ccbSVinicius Costa Gomes if (!q->qdiscs) 7335a781ccbSVinicius Costa Gomes return -ENOMEM; 7345a781ccbSVinicius Costa Gomes 7355a781ccbSVinicius Costa Gomes if (!opt) 7365a781ccbSVinicius Costa Gomes return -EINVAL; 7375a781ccbSVinicius Costa Gomes 7385a781ccbSVinicius Costa Gomes return taprio_change(sch, opt, extack); 7395a781ccbSVinicius Costa Gomes } 7405a781ccbSVinicius Costa Gomes 7415a781ccbSVinicius Costa Gomes static struct netdev_queue *taprio_queue_get(struct Qdisc *sch, 7425a781ccbSVinicius Costa Gomes unsigned long cl) 7435a781ccbSVinicius Costa Gomes { 7445a781ccbSVinicius Costa Gomes struct net_device *dev = qdisc_dev(sch); 7455a781ccbSVinicius Costa Gomes unsigned long ntx = cl - 1; 7465a781ccbSVinicius Costa Gomes 7475a781ccbSVinicius Costa Gomes if (ntx >= dev->num_tx_queues) 7485a781ccbSVinicius Costa Gomes return NULL; 7495a781ccbSVinicius Costa Gomes 7505a781ccbSVinicius Costa Gomes return netdev_get_tx_queue(dev, ntx); 7515a781ccbSVinicius Costa Gomes } 7525a781ccbSVinicius Costa Gomes 7535a781ccbSVinicius Costa Gomes static int taprio_graft(struct Qdisc *sch, unsigned long cl, 7545a781ccbSVinicius Costa Gomes struct Qdisc *new, struct Qdisc **old, 7555a781ccbSVinicius Costa Gomes struct netlink_ext_ack *extack) 7565a781ccbSVinicius Costa Gomes { 7575a781ccbSVinicius Costa Gomes struct taprio_sched *q = qdisc_priv(sch); 7585a781ccbSVinicius Costa Gomes struct net_device *dev = qdisc_dev(sch); 7595a781ccbSVinicius Costa Gomes struct netdev_queue *dev_queue = taprio_queue_get(sch, cl); 7605a781ccbSVinicius Costa Gomes 7615a781ccbSVinicius Costa Gomes if (!dev_queue) 7625a781ccbSVinicius Costa Gomes return -EINVAL; 7635a781ccbSVinicius Costa Gomes 7645a781ccbSVinicius Costa Gomes if (dev->flags & IFF_UP) 7655a781ccbSVinicius Costa Gomes dev_deactivate(dev); 7665a781ccbSVinicius Costa Gomes 7675a781ccbSVinicius Costa Gomes *old = q->qdiscs[cl - 1]; 7685a781ccbSVinicius Costa Gomes q->qdiscs[cl - 1] = new; 7695a781ccbSVinicius Costa Gomes 7705a781ccbSVinicius Costa Gomes if (new) 7715a781ccbSVinicius Costa Gomes new->flags |= TCQ_F_ONETXQUEUE | TCQ_F_NOPARENT; 7725a781ccbSVinicius Costa Gomes 7735a781ccbSVinicius Costa Gomes if (dev->flags & IFF_UP) 7745a781ccbSVinicius Costa Gomes dev_activate(dev); 7755a781ccbSVinicius Costa Gomes 7765a781ccbSVinicius Costa Gomes return 0; 7775a781ccbSVinicius Costa Gomes } 7785a781ccbSVinicius Costa Gomes 7795a781ccbSVinicius Costa Gomes static int dump_entry(struct sk_buff *msg, 7805a781ccbSVinicius Costa Gomes const struct sched_entry *entry) 7815a781ccbSVinicius Costa Gomes { 7825a781ccbSVinicius Costa Gomes struct nlattr *item; 7835a781ccbSVinicius Costa Gomes 7845a781ccbSVinicius Costa Gomes item = nla_nest_start(msg, TCA_TAPRIO_SCHED_ENTRY); 7855a781ccbSVinicius Costa Gomes if (!item) 7865a781ccbSVinicius Costa Gomes return -ENOSPC; 7875a781ccbSVinicius Costa Gomes 7885a781ccbSVinicius Costa Gomes if (nla_put_u32(msg, TCA_TAPRIO_SCHED_ENTRY_INDEX, entry->index)) 7895a781ccbSVinicius Costa Gomes goto nla_put_failure; 7905a781ccbSVinicius Costa Gomes 7915a781ccbSVinicius Costa Gomes if (nla_put_u8(msg, TCA_TAPRIO_SCHED_ENTRY_CMD, entry->command)) 7925a781ccbSVinicius Costa Gomes goto nla_put_failure; 7935a781ccbSVinicius Costa Gomes 7945a781ccbSVinicius Costa Gomes if (nla_put_u32(msg, TCA_TAPRIO_SCHED_ENTRY_GATE_MASK, 7955a781ccbSVinicius Costa Gomes entry->gate_mask)) 7965a781ccbSVinicius Costa Gomes goto nla_put_failure; 7975a781ccbSVinicius Costa Gomes 7985a781ccbSVinicius Costa Gomes if (nla_put_u32(msg, TCA_TAPRIO_SCHED_ENTRY_INTERVAL, 7995a781ccbSVinicius Costa Gomes entry->interval)) 8005a781ccbSVinicius Costa Gomes goto nla_put_failure; 8015a781ccbSVinicius Costa Gomes 8025a781ccbSVinicius Costa Gomes return nla_nest_end(msg, item); 8035a781ccbSVinicius Costa Gomes 8045a781ccbSVinicius Costa Gomes nla_put_failure: 8055a781ccbSVinicius Costa Gomes nla_nest_cancel(msg, item); 8065a781ccbSVinicius Costa Gomes return -1; 8075a781ccbSVinicius Costa Gomes } 8085a781ccbSVinicius Costa Gomes 8095a781ccbSVinicius Costa Gomes static int taprio_dump(struct Qdisc *sch, struct sk_buff *skb) 8105a781ccbSVinicius Costa Gomes { 8115a781ccbSVinicius Costa Gomes struct taprio_sched *q = qdisc_priv(sch); 8125a781ccbSVinicius Costa Gomes struct net_device *dev = qdisc_dev(sch); 8135a781ccbSVinicius Costa Gomes struct tc_mqprio_qopt opt = { 0 }; 8145a781ccbSVinicius Costa Gomes struct nlattr *nest, *entry_list; 8155a781ccbSVinicius Costa Gomes struct sched_entry *entry; 8165a781ccbSVinicius Costa Gomes unsigned int i; 8175a781ccbSVinicius Costa Gomes 8185a781ccbSVinicius Costa Gomes opt.num_tc = netdev_get_num_tc(dev); 8195a781ccbSVinicius Costa Gomes memcpy(opt.prio_tc_map, dev->prio_tc_map, sizeof(opt.prio_tc_map)); 8205a781ccbSVinicius Costa Gomes 8215a781ccbSVinicius Costa Gomes for (i = 0; i < netdev_get_num_tc(dev); i++) { 8225a781ccbSVinicius Costa Gomes opt.count[i] = dev->tc_to_txq[i].count; 8235a781ccbSVinicius Costa Gomes opt.offset[i] = dev->tc_to_txq[i].offset; 8245a781ccbSVinicius Costa Gomes } 8255a781ccbSVinicius Costa Gomes 8265a781ccbSVinicius Costa Gomes nest = nla_nest_start(skb, TCA_OPTIONS); 8275a781ccbSVinicius Costa Gomes if (!nest) 8285a781ccbSVinicius Costa Gomes return -ENOSPC; 8295a781ccbSVinicius Costa Gomes 8305a781ccbSVinicius Costa Gomes if (nla_put(skb, TCA_TAPRIO_ATTR_PRIOMAP, sizeof(opt), &opt)) 8315a781ccbSVinicius Costa Gomes goto options_error; 8325a781ccbSVinicius Costa Gomes 8335a781ccbSVinicius Costa Gomes if (nla_put_s64(skb, TCA_TAPRIO_ATTR_SCHED_BASE_TIME, 8345a781ccbSVinicius Costa Gomes q->base_time, TCA_TAPRIO_PAD)) 8355a781ccbSVinicius Costa Gomes goto options_error; 8365a781ccbSVinicius Costa Gomes 8375a781ccbSVinicius Costa Gomes if (nla_put_s32(skb, TCA_TAPRIO_ATTR_SCHED_CLOCKID, q->clockid)) 8385a781ccbSVinicius Costa Gomes goto options_error; 8395a781ccbSVinicius Costa Gomes 8405a781ccbSVinicius Costa Gomes entry_list = nla_nest_start(skb, TCA_TAPRIO_ATTR_SCHED_ENTRY_LIST); 8415a781ccbSVinicius Costa Gomes if (!entry_list) 8425a781ccbSVinicius Costa Gomes goto options_error; 8435a781ccbSVinicius Costa Gomes 8445a781ccbSVinicius Costa Gomes list_for_each_entry(entry, &q->entries, list) { 8455a781ccbSVinicius Costa Gomes if (dump_entry(skb, entry) < 0) 8465a781ccbSVinicius Costa Gomes goto options_error; 8475a781ccbSVinicius Costa Gomes } 8485a781ccbSVinicius Costa Gomes 8495a781ccbSVinicius Costa Gomes nla_nest_end(skb, entry_list); 8505a781ccbSVinicius Costa Gomes 8515a781ccbSVinicius Costa Gomes return nla_nest_end(skb, nest); 8525a781ccbSVinicius Costa Gomes 8535a781ccbSVinicius Costa Gomes options_error: 8545a781ccbSVinicius Costa Gomes nla_nest_cancel(skb, nest); 8555a781ccbSVinicius Costa Gomes return -1; 8565a781ccbSVinicius Costa Gomes } 8575a781ccbSVinicius Costa Gomes 8585a781ccbSVinicius Costa Gomes static struct Qdisc *taprio_leaf(struct Qdisc *sch, unsigned long cl) 8595a781ccbSVinicius Costa Gomes { 8605a781ccbSVinicius Costa Gomes struct netdev_queue *dev_queue = taprio_queue_get(sch, cl); 8615a781ccbSVinicius Costa Gomes 8625a781ccbSVinicius Costa Gomes if (!dev_queue) 8635a781ccbSVinicius Costa Gomes return NULL; 8645a781ccbSVinicius Costa Gomes 8655a781ccbSVinicius Costa Gomes return dev_queue->qdisc_sleeping; 8665a781ccbSVinicius Costa Gomes } 8675a781ccbSVinicius Costa Gomes 8685a781ccbSVinicius Costa Gomes static unsigned long taprio_find(struct Qdisc *sch, u32 classid) 8695a781ccbSVinicius Costa Gomes { 8705a781ccbSVinicius Costa Gomes unsigned int ntx = TC_H_MIN(classid); 8715a781ccbSVinicius Costa Gomes 8725a781ccbSVinicius Costa Gomes if (!taprio_queue_get(sch, ntx)) 8735a781ccbSVinicius Costa Gomes return 0; 8745a781ccbSVinicius Costa Gomes return ntx; 8755a781ccbSVinicius Costa Gomes } 8765a781ccbSVinicius Costa Gomes 8775a781ccbSVinicius Costa Gomes static int taprio_dump_class(struct Qdisc *sch, unsigned long cl, 8785a781ccbSVinicius Costa Gomes struct sk_buff *skb, struct tcmsg *tcm) 8795a781ccbSVinicius Costa Gomes { 8805a781ccbSVinicius Costa Gomes struct netdev_queue *dev_queue = taprio_queue_get(sch, cl); 8815a781ccbSVinicius Costa Gomes 8825a781ccbSVinicius Costa Gomes tcm->tcm_parent = TC_H_ROOT; 8835a781ccbSVinicius Costa Gomes tcm->tcm_handle |= TC_H_MIN(cl); 8845a781ccbSVinicius Costa Gomes tcm->tcm_info = dev_queue->qdisc_sleeping->handle; 8855a781ccbSVinicius Costa Gomes 8865a781ccbSVinicius Costa Gomes return 0; 8875a781ccbSVinicius Costa Gomes } 8885a781ccbSVinicius Costa Gomes 8895a781ccbSVinicius Costa Gomes static int taprio_dump_class_stats(struct Qdisc *sch, unsigned long cl, 8905a781ccbSVinicius Costa Gomes struct gnet_dump *d) 8915a781ccbSVinicius Costa Gomes __releases(d->lock) 8925a781ccbSVinicius Costa Gomes __acquires(d->lock) 8935a781ccbSVinicius Costa Gomes { 8945a781ccbSVinicius Costa Gomes struct netdev_queue *dev_queue = taprio_queue_get(sch, cl); 8955a781ccbSVinicius Costa Gomes 8965a781ccbSVinicius Costa Gomes sch = dev_queue->qdisc_sleeping; 8975a781ccbSVinicius Costa Gomes if (gnet_stats_copy_basic(&sch->running, d, NULL, &sch->bstats) < 0 || 898*5dd431b6SPaolo Abeni qdisc_qstats_copy(d, sch) < 0) 8995a781ccbSVinicius Costa Gomes return -1; 9005a781ccbSVinicius Costa Gomes return 0; 9015a781ccbSVinicius Costa Gomes } 9025a781ccbSVinicius Costa Gomes 9035a781ccbSVinicius Costa Gomes static void taprio_walk(struct Qdisc *sch, struct qdisc_walker *arg) 9045a781ccbSVinicius Costa Gomes { 9055a781ccbSVinicius Costa Gomes struct net_device *dev = qdisc_dev(sch); 9065a781ccbSVinicius Costa Gomes unsigned long ntx; 9075a781ccbSVinicius Costa Gomes 9085a781ccbSVinicius Costa Gomes if (arg->stop) 9095a781ccbSVinicius Costa Gomes return; 9105a781ccbSVinicius Costa Gomes 9115a781ccbSVinicius Costa Gomes arg->count = arg->skip; 9125a781ccbSVinicius Costa Gomes for (ntx = arg->skip; ntx < dev->num_tx_queues; ntx++) { 9135a781ccbSVinicius Costa Gomes if (arg->fn(sch, ntx + 1, arg) < 0) { 9145a781ccbSVinicius Costa Gomes arg->stop = 1; 9155a781ccbSVinicius Costa Gomes break; 9165a781ccbSVinicius Costa Gomes } 9175a781ccbSVinicius Costa Gomes arg->count++; 9185a781ccbSVinicius Costa Gomes } 9195a781ccbSVinicius Costa Gomes } 9205a781ccbSVinicius Costa Gomes 9215a781ccbSVinicius Costa Gomes static struct netdev_queue *taprio_select_queue(struct Qdisc *sch, 9225a781ccbSVinicius Costa Gomes struct tcmsg *tcm) 9235a781ccbSVinicius Costa Gomes { 9245a781ccbSVinicius Costa Gomes return taprio_queue_get(sch, TC_H_MIN(tcm->tcm_parent)); 9255a781ccbSVinicius Costa Gomes } 9265a781ccbSVinicius Costa Gomes 9275a781ccbSVinicius Costa Gomes static const struct Qdisc_class_ops taprio_class_ops = { 9285a781ccbSVinicius Costa Gomes .graft = taprio_graft, 9295a781ccbSVinicius Costa Gomes .leaf = taprio_leaf, 9305a781ccbSVinicius Costa Gomes .find = taprio_find, 9315a781ccbSVinicius Costa Gomes .walk = taprio_walk, 9325a781ccbSVinicius Costa Gomes .dump = taprio_dump_class, 9335a781ccbSVinicius Costa Gomes .dump_stats = taprio_dump_class_stats, 9345a781ccbSVinicius Costa Gomes .select_queue = taprio_select_queue, 9355a781ccbSVinicius Costa Gomes }; 9365a781ccbSVinicius Costa Gomes 9375a781ccbSVinicius Costa Gomes static struct Qdisc_ops taprio_qdisc_ops __read_mostly = { 9385a781ccbSVinicius Costa Gomes .cl_ops = &taprio_class_ops, 9395a781ccbSVinicius Costa Gomes .id = "taprio", 9405a781ccbSVinicius Costa Gomes .priv_size = sizeof(struct taprio_sched), 9415a781ccbSVinicius Costa Gomes .init = taprio_init, 9425a781ccbSVinicius Costa Gomes .destroy = taprio_destroy, 9435a781ccbSVinicius Costa Gomes .peek = taprio_peek, 9445a781ccbSVinicius Costa Gomes .dequeue = taprio_dequeue, 9455a781ccbSVinicius Costa Gomes .enqueue = taprio_enqueue, 9465a781ccbSVinicius Costa Gomes .dump = taprio_dump, 9475a781ccbSVinicius Costa Gomes .owner = THIS_MODULE, 9485a781ccbSVinicius Costa Gomes }; 9495a781ccbSVinicius Costa Gomes 9505a781ccbSVinicius Costa Gomes static int __init taprio_module_init(void) 9515a781ccbSVinicius Costa Gomes { 9525a781ccbSVinicius Costa Gomes return register_qdisc(&taprio_qdisc_ops); 9535a781ccbSVinicius Costa Gomes } 9545a781ccbSVinicius Costa Gomes 9555a781ccbSVinicius Costa Gomes static void __exit taprio_module_exit(void) 9565a781ccbSVinicius Costa Gomes { 9575a781ccbSVinicius Costa Gomes unregister_qdisc(&taprio_qdisc_ops); 9585a781ccbSVinicius Costa Gomes } 9595a781ccbSVinicius Costa Gomes 9605a781ccbSVinicius Costa Gomes module_init(taprio_module_init); 9615a781ccbSVinicius Costa Gomes module_exit(taprio_module_exit); 9625a781ccbSVinicius Costa Gomes MODULE_LICENSE("GPL"); 963