1 // SPDX-License-Identifier: GPL-2.0-or-later 2 /* 3 * net/sched/cls_flower.c Flower classifier 4 * 5 * Copyright (c) 2015 Jiri Pirko <jiri@resnulli.us> 6 */ 7 8 #include <linux/kernel.h> 9 #include <linux/init.h> 10 #include <linux/module.h> 11 #include <linux/rhashtable.h> 12 #include <linux/workqueue.h> 13 #include <linux/refcount.h> 14 15 #include <linux/if_ether.h> 16 #include <linux/in6.h> 17 #include <linux/ip.h> 18 #include <linux/mpls.h> 19 20 #include <net/sch_generic.h> 21 #include <net/pkt_cls.h> 22 #include <net/ip.h> 23 #include <net/flow_dissector.h> 24 #include <net/geneve.h> 25 #include <net/vxlan.h> 26 #include <net/erspan.h> 27 28 #include <net/dst.h> 29 #include <net/dst_metadata.h> 30 31 #include <uapi/linux/netfilter/nf_conntrack_common.h> 32 33 #define TCA_FLOWER_KEY_CT_FLAGS_MAX \ 34 ((__TCA_FLOWER_KEY_CT_FLAGS_MAX - 1) << 1) 35 #define TCA_FLOWER_KEY_CT_FLAGS_MASK \ 36 (TCA_FLOWER_KEY_CT_FLAGS_MAX - 1) 37 38 struct fl_flow_key { 39 struct flow_dissector_key_meta meta; 40 struct flow_dissector_key_control control; 41 struct flow_dissector_key_control enc_control; 42 struct flow_dissector_key_basic basic; 43 struct flow_dissector_key_eth_addrs eth; 44 struct flow_dissector_key_vlan vlan; 45 struct flow_dissector_key_vlan cvlan; 46 union { 47 struct flow_dissector_key_ipv4_addrs ipv4; 48 struct flow_dissector_key_ipv6_addrs ipv6; 49 }; 50 struct flow_dissector_key_ports tp; 51 struct flow_dissector_key_icmp icmp; 52 struct flow_dissector_key_arp arp; 53 struct flow_dissector_key_keyid enc_key_id; 54 union { 55 struct flow_dissector_key_ipv4_addrs enc_ipv4; 56 struct flow_dissector_key_ipv6_addrs enc_ipv6; 57 }; 58 struct flow_dissector_key_ports enc_tp; 59 struct flow_dissector_key_mpls mpls; 60 struct flow_dissector_key_tcp tcp; 61 struct flow_dissector_key_ip ip; 62 struct flow_dissector_key_ip enc_ip; 63 struct flow_dissector_key_enc_opts enc_opts; 64 union { 65 struct flow_dissector_key_ports tp; 66 struct { 67 struct 
flow_dissector_key_ports tp_min; 68 struct flow_dissector_key_ports tp_max; 69 }; 70 } tp_range; 71 struct flow_dissector_key_ct ct; 72 struct flow_dissector_key_hash hash; 73 } __aligned(BITS_PER_LONG / 8); /* Ensure that we can do comparisons as longs. */ 74 75 struct fl_flow_mask_range { 76 unsigned short int start; 77 unsigned short int end; 78 }; 79 80 struct fl_flow_mask { 81 struct fl_flow_key key; 82 struct fl_flow_mask_range range; 83 u32 flags; 84 struct rhash_head ht_node; 85 struct rhashtable ht; 86 struct rhashtable_params filter_ht_params; 87 struct flow_dissector dissector; 88 struct list_head filters; 89 struct rcu_work rwork; 90 struct list_head list; 91 refcount_t refcnt; 92 }; 93 94 struct fl_flow_tmplt { 95 struct fl_flow_key dummy_key; 96 struct fl_flow_key mask; 97 struct flow_dissector dissector; 98 struct tcf_chain *chain; 99 }; 100 101 struct cls_fl_head { 102 struct rhashtable ht; 103 spinlock_t masks_lock; /* Protect masks list */ 104 struct list_head masks; 105 struct list_head hw_filters; 106 struct rcu_work rwork; 107 struct idr handle_idr; 108 }; 109 110 struct cls_fl_filter { 111 struct fl_flow_mask *mask; 112 struct rhash_head ht_node; 113 struct fl_flow_key mkey; 114 struct tcf_exts exts; 115 struct tcf_result res; 116 struct fl_flow_key key; 117 struct list_head list; 118 struct list_head hw_list; 119 u32 handle; 120 u32 flags; 121 u32 in_hw_count; 122 struct rcu_work rwork; 123 struct net_device *hw_dev; 124 /* Flower classifier is unlocked, which means that its reference counter 125 * can be changed concurrently without any kind of external 126 * synchronization. Use atomic reference counter to be concurrency-safe. 
127 */ 128 refcount_t refcnt; 129 bool deleted; 130 }; 131 132 static const struct rhashtable_params mask_ht_params = { 133 .key_offset = offsetof(struct fl_flow_mask, key), 134 .key_len = sizeof(struct fl_flow_key), 135 .head_offset = offsetof(struct fl_flow_mask, ht_node), 136 .automatic_shrinking = true, 137 }; 138 139 static unsigned short int fl_mask_range(const struct fl_flow_mask *mask) 140 { 141 return mask->range.end - mask->range.start; 142 } 143 144 static void fl_mask_update_range(struct fl_flow_mask *mask) 145 { 146 const u8 *bytes = (const u8 *) &mask->key; 147 size_t size = sizeof(mask->key); 148 size_t i, first = 0, last; 149 150 for (i = 0; i < size; i++) { 151 if (bytes[i]) { 152 first = i; 153 break; 154 } 155 } 156 last = first; 157 for (i = size - 1; i != first; i--) { 158 if (bytes[i]) { 159 last = i; 160 break; 161 } 162 } 163 mask->range.start = rounddown(first, sizeof(long)); 164 mask->range.end = roundup(last + 1, sizeof(long)); 165 } 166 167 static void *fl_key_get_start(struct fl_flow_key *key, 168 const struct fl_flow_mask *mask) 169 { 170 return (u8 *) key + mask->range.start; 171 } 172 173 static void fl_set_masked_key(struct fl_flow_key *mkey, struct fl_flow_key *key, 174 struct fl_flow_mask *mask) 175 { 176 const long *lkey = fl_key_get_start(key, mask); 177 const long *lmask = fl_key_get_start(&mask->key, mask); 178 long *lmkey = fl_key_get_start(mkey, mask); 179 int i; 180 181 for (i = 0; i < fl_mask_range(mask); i += sizeof(long)) 182 *lmkey++ = *lkey++ & *lmask++; 183 } 184 185 static bool fl_mask_fits_tmplt(struct fl_flow_tmplt *tmplt, 186 struct fl_flow_mask *mask) 187 { 188 const long *lmask = fl_key_get_start(&mask->key, mask); 189 const long *ltmplt; 190 int i; 191 192 if (!tmplt) 193 return true; 194 ltmplt = fl_key_get_start(&tmplt->mask, mask); 195 for (i = 0; i < fl_mask_range(mask); i += sizeof(long)) { 196 if (~*ltmplt++ & *lmask++) 197 return false; 198 } 199 return true; 200 } 201 202 static void 
fl_clear_masked_range(struct fl_flow_key *key, 203 struct fl_flow_mask *mask) 204 { 205 memset(fl_key_get_start(key, mask), 0, fl_mask_range(mask)); 206 } 207 208 static bool fl_range_port_dst_cmp(struct cls_fl_filter *filter, 209 struct fl_flow_key *key, 210 struct fl_flow_key *mkey) 211 { 212 u16 min_mask, max_mask, min_val, max_val; 213 214 min_mask = ntohs(filter->mask->key.tp_range.tp_min.dst); 215 max_mask = ntohs(filter->mask->key.tp_range.tp_max.dst); 216 min_val = ntohs(filter->key.tp_range.tp_min.dst); 217 max_val = ntohs(filter->key.tp_range.tp_max.dst); 218 219 if (min_mask && max_mask) { 220 if (ntohs(key->tp_range.tp.dst) < min_val || 221 ntohs(key->tp_range.tp.dst) > max_val) 222 return false; 223 224 /* skb does not have min and max values */ 225 mkey->tp_range.tp_min.dst = filter->mkey.tp_range.tp_min.dst; 226 mkey->tp_range.tp_max.dst = filter->mkey.tp_range.tp_max.dst; 227 } 228 return true; 229 } 230 231 static bool fl_range_port_src_cmp(struct cls_fl_filter *filter, 232 struct fl_flow_key *key, 233 struct fl_flow_key *mkey) 234 { 235 u16 min_mask, max_mask, min_val, max_val; 236 237 min_mask = ntohs(filter->mask->key.tp_range.tp_min.src); 238 max_mask = ntohs(filter->mask->key.tp_range.tp_max.src); 239 min_val = ntohs(filter->key.tp_range.tp_min.src); 240 max_val = ntohs(filter->key.tp_range.tp_max.src); 241 242 if (min_mask && max_mask) { 243 if (ntohs(key->tp_range.tp.src) < min_val || 244 ntohs(key->tp_range.tp.src) > max_val) 245 return false; 246 247 /* skb does not have min and max values */ 248 mkey->tp_range.tp_min.src = filter->mkey.tp_range.tp_min.src; 249 mkey->tp_range.tp_max.src = filter->mkey.tp_range.tp_max.src; 250 } 251 return true; 252 } 253 254 static struct cls_fl_filter *__fl_lookup(struct fl_flow_mask *mask, 255 struct fl_flow_key *mkey) 256 { 257 return rhashtable_lookup_fast(&mask->ht, fl_key_get_start(mkey, mask), 258 mask->filter_ht_params); 259 } 260 261 static struct cls_fl_filter *fl_lookup_range(struct fl_flow_mask 
*mask, 262 struct fl_flow_key *mkey, 263 struct fl_flow_key *key) 264 { 265 struct cls_fl_filter *filter, *f; 266 267 list_for_each_entry_rcu(filter, &mask->filters, list) { 268 if (!fl_range_port_dst_cmp(filter, key, mkey)) 269 continue; 270 271 if (!fl_range_port_src_cmp(filter, key, mkey)) 272 continue; 273 274 f = __fl_lookup(mask, mkey); 275 if (f) 276 return f; 277 } 278 return NULL; 279 } 280 281 static noinline_for_stack 282 struct cls_fl_filter *fl_mask_lookup(struct fl_flow_mask *mask, struct fl_flow_key *key) 283 { 284 struct fl_flow_key mkey; 285 286 fl_set_masked_key(&mkey, key, mask); 287 if ((mask->flags & TCA_FLOWER_MASK_FLAGS_RANGE)) 288 return fl_lookup_range(mask, &mkey, key); 289 290 return __fl_lookup(mask, &mkey); 291 } 292 293 static u16 fl_ct_info_to_flower_map[] = { 294 [IP_CT_ESTABLISHED] = TCA_FLOWER_KEY_CT_FLAGS_TRACKED | 295 TCA_FLOWER_KEY_CT_FLAGS_ESTABLISHED, 296 [IP_CT_RELATED] = TCA_FLOWER_KEY_CT_FLAGS_TRACKED | 297 TCA_FLOWER_KEY_CT_FLAGS_RELATED, 298 [IP_CT_ESTABLISHED_REPLY] = TCA_FLOWER_KEY_CT_FLAGS_TRACKED | 299 TCA_FLOWER_KEY_CT_FLAGS_ESTABLISHED | 300 TCA_FLOWER_KEY_CT_FLAGS_REPLY, 301 [IP_CT_RELATED_REPLY] = TCA_FLOWER_KEY_CT_FLAGS_TRACKED | 302 TCA_FLOWER_KEY_CT_FLAGS_RELATED | 303 TCA_FLOWER_KEY_CT_FLAGS_REPLY, 304 [IP_CT_NEW] = TCA_FLOWER_KEY_CT_FLAGS_TRACKED | 305 TCA_FLOWER_KEY_CT_FLAGS_NEW, 306 }; 307 308 static int fl_classify(struct sk_buff *skb, const struct tcf_proto *tp, 309 struct tcf_result *res) 310 { 311 struct cls_fl_head *head = rcu_dereference_bh(tp->root); 312 bool post_ct = qdisc_skb_cb(skb)->post_ct; 313 struct fl_flow_key skb_key; 314 struct fl_flow_mask *mask; 315 struct cls_fl_filter *f; 316 317 list_for_each_entry_rcu(mask, &head->masks, list) { 318 flow_dissector_init_keys(&skb_key.control, &skb_key.basic); 319 fl_clear_masked_range(&skb_key, mask); 320 321 skb_flow_dissect_meta(skb, &mask->dissector, &skb_key); 322 /* skb_flow_dissect() does not set n_proto in case an unknown 323 * protocol, so do 
it rather here. 324 */ 325 skb_key.basic.n_proto = skb_protocol(skb, false); 326 skb_flow_dissect_tunnel_info(skb, &mask->dissector, &skb_key); 327 skb_flow_dissect_ct(skb, &mask->dissector, &skb_key, 328 fl_ct_info_to_flower_map, 329 ARRAY_SIZE(fl_ct_info_to_flower_map), 330 post_ct); 331 skb_flow_dissect_hash(skb, &mask->dissector, &skb_key); 332 skb_flow_dissect(skb, &mask->dissector, &skb_key, 0); 333 334 f = fl_mask_lookup(mask, &skb_key); 335 if (f && !tc_skip_sw(f->flags)) { 336 *res = f->res; 337 return tcf_exts_exec(skb, &f->exts, res); 338 } 339 } 340 return -1; 341 } 342 343 static int fl_init(struct tcf_proto *tp) 344 { 345 struct cls_fl_head *head; 346 347 head = kzalloc(sizeof(*head), GFP_KERNEL); 348 if (!head) 349 return -ENOBUFS; 350 351 spin_lock_init(&head->masks_lock); 352 INIT_LIST_HEAD_RCU(&head->masks); 353 INIT_LIST_HEAD(&head->hw_filters); 354 rcu_assign_pointer(tp->root, head); 355 idr_init(&head->handle_idr); 356 357 return rhashtable_init(&head->ht, &mask_ht_params); 358 } 359 360 static void fl_mask_free(struct fl_flow_mask *mask, bool mask_init_done) 361 { 362 /* temporary masks don't have their filters list and ht initialized */ 363 if (mask_init_done) { 364 WARN_ON(!list_empty(&mask->filters)); 365 rhashtable_destroy(&mask->ht); 366 } 367 kfree(mask); 368 } 369 370 static void fl_mask_free_work(struct work_struct *work) 371 { 372 struct fl_flow_mask *mask = container_of(to_rcu_work(work), 373 struct fl_flow_mask, rwork); 374 375 fl_mask_free(mask, true); 376 } 377 378 static void fl_uninit_mask_free_work(struct work_struct *work) 379 { 380 struct fl_flow_mask *mask = container_of(to_rcu_work(work), 381 struct fl_flow_mask, rwork); 382 383 fl_mask_free(mask, false); 384 } 385 386 static bool fl_mask_put(struct cls_fl_head *head, struct fl_flow_mask *mask) 387 { 388 if (!refcount_dec_and_test(&mask->refcnt)) 389 return false; 390 391 rhashtable_remove_fast(&head->ht, &mask->ht_node, mask_ht_params); 392 393 
spin_lock(&head->masks_lock); 394 list_del_rcu(&mask->list); 395 spin_unlock(&head->masks_lock); 396 397 tcf_queue_work(&mask->rwork, fl_mask_free_work); 398 399 return true; 400 } 401 402 static struct cls_fl_head *fl_head_dereference(struct tcf_proto *tp) 403 { 404 /* Flower classifier only changes root pointer during init and destroy. 405 * Users must obtain reference to tcf_proto instance before calling its 406 * API, so tp->root pointer is protected from concurrent call to 407 * fl_destroy() by reference counting. 408 */ 409 return rcu_dereference_raw(tp->root); 410 } 411 412 static void __fl_destroy_filter(struct cls_fl_filter *f) 413 { 414 tcf_exts_destroy(&f->exts); 415 tcf_exts_put_net(&f->exts); 416 kfree(f); 417 } 418 419 static void fl_destroy_filter_work(struct work_struct *work) 420 { 421 struct cls_fl_filter *f = container_of(to_rcu_work(work), 422 struct cls_fl_filter, rwork); 423 424 __fl_destroy_filter(f); 425 } 426 427 static void fl_hw_destroy_filter(struct tcf_proto *tp, struct cls_fl_filter *f, 428 bool rtnl_held, struct netlink_ext_ack *extack) 429 { 430 struct tcf_block *block = tp->chain->block; 431 struct flow_cls_offload cls_flower = {}; 432 433 tc_cls_common_offload_init(&cls_flower.common, tp, f->flags, extack); 434 cls_flower.command = FLOW_CLS_DESTROY; 435 cls_flower.cookie = (unsigned long) f; 436 437 tc_setup_cb_destroy(block, tp, TC_SETUP_CLSFLOWER, &cls_flower, false, 438 &f->flags, &f->in_hw_count, rtnl_held); 439 440 } 441 442 static int fl_hw_replace_filter(struct tcf_proto *tp, 443 struct cls_fl_filter *f, bool rtnl_held, 444 struct netlink_ext_ack *extack) 445 { 446 struct tcf_block *block = tp->chain->block; 447 struct flow_cls_offload cls_flower = {}; 448 bool skip_sw = tc_skip_sw(f->flags); 449 int err = 0; 450 451 cls_flower.rule = flow_rule_alloc(tcf_exts_num_actions(&f->exts)); 452 if (!cls_flower.rule) 453 return -ENOMEM; 454 455 tc_cls_common_offload_init(&cls_flower.common, tp, f->flags, extack); 456 
cls_flower.command = FLOW_CLS_REPLACE; 457 cls_flower.cookie = (unsigned long) f; 458 cls_flower.rule->match.dissector = &f->mask->dissector; 459 cls_flower.rule->match.mask = &f->mask->key; 460 cls_flower.rule->match.key = &f->mkey; 461 cls_flower.classid = f->res.classid; 462 463 err = tc_setup_flow_action(&cls_flower.rule->action, &f->exts); 464 if (err) { 465 kfree(cls_flower.rule); 466 if (skip_sw) { 467 NL_SET_ERR_MSG_MOD(extack, "Failed to setup flow action"); 468 return err; 469 } 470 return 0; 471 } 472 473 err = tc_setup_cb_add(block, tp, TC_SETUP_CLSFLOWER, &cls_flower, 474 skip_sw, &f->flags, &f->in_hw_count, rtnl_held); 475 tc_cleanup_flow_action(&cls_flower.rule->action); 476 kfree(cls_flower.rule); 477 478 if (err) { 479 fl_hw_destroy_filter(tp, f, rtnl_held, NULL); 480 return err; 481 } 482 483 if (skip_sw && !(f->flags & TCA_CLS_FLAGS_IN_HW)) 484 return -EINVAL; 485 486 return 0; 487 } 488 489 static void fl_hw_update_stats(struct tcf_proto *tp, struct cls_fl_filter *f, 490 bool rtnl_held) 491 { 492 struct tcf_block *block = tp->chain->block; 493 struct flow_cls_offload cls_flower = {}; 494 495 tc_cls_common_offload_init(&cls_flower.common, tp, f->flags, NULL); 496 cls_flower.command = FLOW_CLS_STATS; 497 cls_flower.cookie = (unsigned long) f; 498 cls_flower.classid = f->res.classid; 499 500 tc_setup_cb_call(block, TC_SETUP_CLSFLOWER, &cls_flower, false, 501 rtnl_held); 502 503 tcf_exts_stats_update(&f->exts, cls_flower.stats.bytes, 504 cls_flower.stats.pkts, 505 cls_flower.stats.drops, 506 cls_flower.stats.lastused, 507 cls_flower.stats.used_hw_stats, 508 cls_flower.stats.used_hw_stats_valid); 509 } 510 511 static void __fl_put(struct cls_fl_filter *f) 512 { 513 if (!refcount_dec_and_test(&f->refcnt)) 514 return; 515 516 if (tcf_exts_get_net(&f->exts)) 517 tcf_queue_work(&f->rwork, fl_destroy_filter_work); 518 else 519 __fl_destroy_filter(f); 520 } 521 522 static struct cls_fl_filter *__fl_get(struct cls_fl_head *head, u32 handle) 523 { 524 struct 
cls_fl_filter *f; 525 526 rcu_read_lock(); 527 f = idr_find(&head->handle_idr, handle); 528 if (f && !refcount_inc_not_zero(&f->refcnt)) 529 f = NULL; 530 rcu_read_unlock(); 531 532 return f; 533 } 534 535 static int __fl_delete(struct tcf_proto *tp, struct cls_fl_filter *f, 536 bool *last, bool rtnl_held, 537 struct netlink_ext_ack *extack) 538 { 539 struct cls_fl_head *head = fl_head_dereference(tp); 540 541 *last = false; 542 543 spin_lock(&tp->lock); 544 if (f->deleted) { 545 spin_unlock(&tp->lock); 546 return -ENOENT; 547 } 548 549 f->deleted = true; 550 rhashtable_remove_fast(&f->mask->ht, &f->ht_node, 551 f->mask->filter_ht_params); 552 idr_remove(&head->handle_idr, f->handle); 553 list_del_rcu(&f->list); 554 spin_unlock(&tp->lock); 555 556 *last = fl_mask_put(head, f->mask); 557 if (!tc_skip_hw(f->flags)) 558 fl_hw_destroy_filter(tp, f, rtnl_held, extack); 559 tcf_unbind_filter(tp, &f->res); 560 __fl_put(f); 561 562 return 0; 563 } 564 565 static void fl_destroy_sleepable(struct work_struct *work) 566 { 567 struct cls_fl_head *head = container_of(to_rcu_work(work), 568 struct cls_fl_head, 569 rwork); 570 571 rhashtable_destroy(&head->ht); 572 kfree(head); 573 module_put(THIS_MODULE); 574 } 575 576 static void fl_destroy(struct tcf_proto *tp, bool rtnl_held, 577 struct netlink_ext_ack *extack) 578 { 579 struct cls_fl_head *head = fl_head_dereference(tp); 580 struct fl_flow_mask *mask, *next_mask; 581 struct cls_fl_filter *f, *next; 582 bool last; 583 584 list_for_each_entry_safe(mask, next_mask, &head->masks, list) { 585 list_for_each_entry_safe(f, next, &mask->filters, list) { 586 __fl_delete(tp, f, &last, rtnl_held, extack); 587 if (last) 588 break; 589 } 590 } 591 idr_destroy(&head->handle_idr); 592 593 __module_get(THIS_MODULE); 594 tcf_queue_work(&head->rwork, fl_destroy_sleepable); 595 } 596 597 static void fl_put(struct tcf_proto *tp, void *arg) 598 { 599 struct cls_fl_filter *f = arg; 600 601 __fl_put(f); 602 } 603 604 static void *fl_get(struct 
tcf_proto *tp, u32 handle) 605 { 606 struct cls_fl_head *head = fl_head_dereference(tp); 607 608 return __fl_get(head, handle); 609 } 610 611 static const struct nla_policy fl_policy[TCA_FLOWER_MAX + 1] = { 612 [TCA_FLOWER_UNSPEC] = { .type = NLA_UNSPEC }, 613 [TCA_FLOWER_CLASSID] = { .type = NLA_U32 }, 614 [TCA_FLOWER_INDEV] = { .type = NLA_STRING, 615 .len = IFNAMSIZ }, 616 [TCA_FLOWER_KEY_ETH_DST] = { .len = ETH_ALEN }, 617 [TCA_FLOWER_KEY_ETH_DST_MASK] = { .len = ETH_ALEN }, 618 [TCA_FLOWER_KEY_ETH_SRC] = { .len = ETH_ALEN }, 619 [TCA_FLOWER_KEY_ETH_SRC_MASK] = { .len = ETH_ALEN }, 620 [TCA_FLOWER_KEY_ETH_TYPE] = { .type = NLA_U16 }, 621 [TCA_FLOWER_KEY_IP_PROTO] = { .type = NLA_U8 }, 622 [TCA_FLOWER_KEY_IPV4_SRC] = { .type = NLA_U32 }, 623 [TCA_FLOWER_KEY_IPV4_SRC_MASK] = { .type = NLA_U32 }, 624 [TCA_FLOWER_KEY_IPV4_DST] = { .type = NLA_U32 }, 625 [TCA_FLOWER_KEY_IPV4_DST_MASK] = { .type = NLA_U32 }, 626 [TCA_FLOWER_KEY_IPV6_SRC] = { .len = sizeof(struct in6_addr) }, 627 [TCA_FLOWER_KEY_IPV6_SRC_MASK] = { .len = sizeof(struct in6_addr) }, 628 [TCA_FLOWER_KEY_IPV6_DST] = { .len = sizeof(struct in6_addr) }, 629 [TCA_FLOWER_KEY_IPV6_DST_MASK] = { .len = sizeof(struct in6_addr) }, 630 [TCA_FLOWER_KEY_TCP_SRC] = { .type = NLA_U16 }, 631 [TCA_FLOWER_KEY_TCP_DST] = { .type = NLA_U16 }, 632 [TCA_FLOWER_KEY_UDP_SRC] = { .type = NLA_U16 }, 633 [TCA_FLOWER_KEY_UDP_DST] = { .type = NLA_U16 }, 634 [TCA_FLOWER_KEY_VLAN_ID] = { .type = NLA_U16 }, 635 [TCA_FLOWER_KEY_VLAN_PRIO] = { .type = NLA_U8 }, 636 [TCA_FLOWER_KEY_VLAN_ETH_TYPE] = { .type = NLA_U16 }, 637 [TCA_FLOWER_KEY_ENC_KEY_ID] = { .type = NLA_U32 }, 638 [TCA_FLOWER_KEY_ENC_IPV4_SRC] = { .type = NLA_U32 }, 639 [TCA_FLOWER_KEY_ENC_IPV4_SRC_MASK] = { .type = NLA_U32 }, 640 [TCA_FLOWER_KEY_ENC_IPV4_DST] = { .type = NLA_U32 }, 641 [TCA_FLOWER_KEY_ENC_IPV4_DST_MASK] = { .type = NLA_U32 }, 642 [TCA_FLOWER_KEY_ENC_IPV6_SRC] = { .len = sizeof(struct in6_addr) }, 643 [TCA_FLOWER_KEY_ENC_IPV6_SRC_MASK] = { .len = 
sizeof(struct in6_addr) }, 644 [TCA_FLOWER_KEY_ENC_IPV6_DST] = { .len = sizeof(struct in6_addr) }, 645 [TCA_FLOWER_KEY_ENC_IPV6_DST_MASK] = { .len = sizeof(struct in6_addr) }, 646 [TCA_FLOWER_KEY_TCP_SRC_MASK] = { .type = NLA_U16 }, 647 [TCA_FLOWER_KEY_TCP_DST_MASK] = { .type = NLA_U16 }, 648 [TCA_FLOWER_KEY_UDP_SRC_MASK] = { .type = NLA_U16 }, 649 [TCA_FLOWER_KEY_UDP_DST_MASK] = { .type = NLA_U16 }, 650 [TCA_FLOWER_KEY_SCTP_SRC_MASK] = { .type = NLA_U16 }, 651 [TCA_FLOWER_KEY_SCTP_DST_MASK] = { .type = NLA_U16 }, 652 [TCA_FLOWER_KEY_SCTP_SRC] = { .type = NLA_U16 }, 653 [TCA_FLOWER_KEY_SCTP_DST] = { .type = NLA_U16 }, 654 [TCA_FLOWER_KEY_ENC_UDP_SRC_PORT] = { .type = NLA_U16 }, 655 [TCA_FLOWER_KEY_ENC_UDP_SRC_PORT_MASK] = { .type = NLA_U16 }, 656 [TCA_FLOWER_KEY_ENC_UDP_DST_PORT] = { .type = NLA_U16 }, 657 [TCA_FLOWER_KEY_ENC_UDP_DST_PORT_MASK] = { .type = NLA_U16 }, 658 [TCA_FLOWER_KEY_FLAGS] = { .type = NLA_U32 }, 659 [TCA_FLOWER_KEY_FLAGS_MASK] = { .type = NLA_U32 }, 660 [TCA_FLOWER_KEY_ICMPV4_TYPE] = { .type = NLA_U8 }, 661 [TCA_FLOWER_KEY_ICMPV4_TYPE_MASK] = { .type = NLA_U8 }, 662 [TCA_FLOWER_KEY_ICMPV4_CODE] = { .type = NLA_U8 }, 663 [TCA_FLOWER_KEY_ICMPV4_CODE_MASK] = { .type = NLA_U8 }, 664 [TCA_FLOWER_KEY_ICMPV6_TYPE] = { .type = NLA_U8 }, 665 [TCA_FLOWER_KEY_ICMPV6_TYPE_MASK] = { .type = NLA_U8 }, 666 [TCA_FLOWER_KEY_ICMPV6_CODE] = { .type = NLA_U8 }, 667 [TCA_FLOWER_KEY_ICMPV6_CODE_MASK] = { .type = NLA_U8 }, 668 [TCA_FLOWER_KEY_ARP_SIP] = { .type = NLA_U32 }, 669 [TCA_FLOWER_KEY_ARP_SIP_MASK] = { .type = NLA_U32 }, 670 [TCA_FLOWER_KEY_ARP_TIP] = { .type = NLA_U32 }, 671 [TCA_FLOWER_KEY_ARP_TIP_MASK] = { .type = NLA_U32 }, 672 [TCA_FLOWER_KEY_ARP_OP] = { .type = NLA_U8 }, 673 [TCA_FLOWER_KEY_ARP_OP_MASK] = { .type = NLA_U8 }, 674 [TCA_FLOWER_KEY_ARP_SHA] = { .len = ETH_ALEN }, 675 [TCA_FLOWER_KEY_ARP_SHA_MASK] = { .len = ETH_ALEN }, 676 [TCA_FLOWER_KEY_ARP_THA] = { .len = ETH_ALEN }, 677 [TCA_FLOWER_KEY_ARP_THA_MASK] = { .len = ETH_ALEN }, 678 
[TCA_FLOWER_KEY_MPLS_TTL] = { .type = NLA_U8 }, 679 [TCA_FLOWER_KEY_MPLS_BOS] = { .type = NLA_U8 }, 680 [TCA_FLOWER_KEY_MPLS_TC] = { .type = NLA_U8 }, 681 [TCA_FLOWER_KEY_MPLS_LABEL] = { .type = NLA_U32 }, 682 [TCA_FLOWER_KEY_MPLS_OPTS] = { .type = NLA_NESTED }, 683 [TCA_FLOWER_KEY_TCP_FLAGS] = { .type = NLA_U16 }, 684 [TCA_FLOWER_KEY_TCP_FLAGS_MASK] = { .type = NLA_U16 }, 685 [TCA_FLOWER_KEY_IP_TOS] = { .type = NLA_U8 }, 686 [TCA_FLOWER_KEY_IP_TOS_MASK] = { .type = NLA_U8 }, 687 [TCA_FLOWER_KEY_IP_TTL] = { .type = NLA_U8 }, 688 [TCA_FLOWER_KEY_IP_TTL_MASK] = { .type = NLA_U8 }, 689 [TCA_FLOWER_KEY_CVLAN_ID] = { .type = NLA_U16 }, 690 [TCA_FLOWER_KEY_CVLAN_PRIO] = { .type = NLA_U8 }, 691 [TCA_FLOWER_KEY_CVLAN_ETH_TYPE] = { .type = NLA_U16 }, 692 [TCA_FLOWER_KEY_ENC_IP_TOS] = { .type = NLA_U8 }, 693 [TCA_FLOWER_KEY_ENC_IP_TOS_MASK] = { .type = NLA_U8 }, 694 [TCA_FLOWER_KEY_ENC_IP_TTL] = { .type = NLA_U8 }, 695 [TCA_FLOWER_KEY_ENC_IP_TTL_MASK] = { .type = NLA_U8 }, 696 [TCA_FLOWER_KEY_ENC_OPTS] = { .type = NLA_NESTED }, 697 [TCA_FLOWER_KEY_ENC_OPTS_MASK] = { .type = NLA_NESTED }, 698 [TCA_FLOWER_KEY_CT_STATE] = 699 NLA_POLICY_MASK(NLA_U16, TCA_FLOWER_KEY_CT_FLAGS_MASK), 700 [TCA_FLOWER_KEY_CT_STATE_MASK] = 701 NLA_POLICY_MASK(NLA_U16, TCA_FLOWER_KEY_CT_FLAGS_MASK), 702 [TCA_FLOWER_KEY_CT_ZONE] = { .type = NLA_U16 }, 703 [TCA_FLOWER_KEY_CT_ZONE_MASK] = { .type = NLA_U16 }, 704 [TCA_FLOWER_KEY_CT_MARK] = { .type = NLA_U32 }, 705 [TCA_FLOWER_KEY_CT_MARK_MASK] = { .type = NLA_U32 }, 706 [TCA_FLOWER_KEY_CT_LABELS] = { .type = NLA_BINARY, 707 .len = 128 / BITS_PER_BYTE }, 708 [TCA_FLOWER_KEY_CT_LABELS_MASK] = { .type = NLA_BINARY, 709 .len = 128 / BITS_PER_BYTE }, 710 [TCA_FLOWER_FLAGS] = { .type = NLA_U32 }, 711 [TCA_FLOWER_KEY_HASH] = { .type = NLA_U32 }, 712 [TCA_FLOWER_KEY_HASH_MASK] = { .type = NLA_U32 }, 713 714 }; 715 716 static const struct nla_policy 717 enc_opts_policy[TCA_FLOWER_KEY_ENC_OPTS_MAX + 1] = { 718 [TCA_FLOWER_KEY_ENC_OPTS_UNSPEC] = { 719 
.strict_start_type = TCA_FLOWER_KEY_ENC_OPTS_VXLAN }, 720 [TCA_FLOWER_KEY_ENC_OPTS_GENEVE] = { .type = NLA_NESTED }, 721 [TCA_FLOWER_KEY_ENC_OPTS_VXLAN] = { .type = NLA_NESTED }, 722 [TCA_FLOWER_KEY_ENC_OPTS_ERSPAN] = { .type = NLA_NESTED }, 723 }; 724 725 static const struct nla_policy 726 geneve_opt_policy[TCA_FLOWER_KEY_ENC_OPT_GENEVE_MAX + 1] = { 727 [TCA_FLOWER_KEY_ENC_OPT_GENEVE_CLASS] = { .type = NLA_U16 }, 728 [TCA_FLOWER_KEY_ENC_OPT_GENEVE_TYPE] = { .type = NLA_U8 }, 729 [TCA_FLOWER_KEY_ENC_OPT_GENEVE_DATA] = { .type = NLA_BINARY, 730 .len = 128 }, 731 }; 732 733 static const struct nla_policy 734 vxlan_opt_policy[TCA_FLOWER_KEY_ENC_OPT_VXLAN_MAX + 1] = { 735 [TCA_FLOWER_KEY_ENC_OPT_VXLAN_GBP] = { .type = NLA_U32 }, 736 }; 737 738 static const struct nla_policy 739 erspan_opt_policy[TCA_FLOWER_KEY_ENC_OPT_ERSPAN_MAX + 1] = { 740 [TCA_FLOWER_KEY_ENC_OPT_ERSPAN_VER] = { .type = NLA_U8 }, 741 [TCA_FLOWER_KEY_ENC_OPT_ERSPAN_INDEX] = { .type = NLA_U32 }, 742 [TCA_FLOWER_KEY_ENC_OPT_ERSPAN_DIR] = { .type = NLA_U8 }, 743 [TCA_FLOWER_KEY_ENC_OPT_ERSPAN_HWID] = { .type = NLA_U8 }, 744 }; 745 746 static const struct nla_policy 747 mpls_stack_entry_policy[TCA_FLOWER_KEY_MPLS_OPT_LSE_MAX + 1] = { 748 [TCA_FLOWER_KEY_MPLS_OPT_LSE_DEPTH] = { .type = NLA_U8 }, 749 [TCA_FLOWER_KEY_MPLS_OPT_LSE_TTL] = { .type = NLA_U8 }, 750 [TCA_FLOWER_KEY_MPLS_OPT_LSE_BOS] = { .type = NLA_U8 }, 751 [TCA_FLOWER_KEY_MPLS_OPT_LSE_TC] = { .type = NLA_U8 }, 752 [TCA_FLOWER_KEY_MPLS_OPT_LSE_LABEL] = { .type = NLA_U32 }, 753 }; 754 755 static void fl_set_key_val(struct nlattr **tb, 756 void *val, int val_type, 757 void *mask, int mask_type, int len) 758 { 759 if (!tb[val_type]) 760 return; 761 nla_memcpy(val, tb[val_type], len); 762 if (mask_type == TCA_FLOWER_UNSPEC || !tb[mask_type]) 763 memset(mask, 0xff, len); 764 else 765 nla_memcpy(mask, tb[mask_type], len); 766 } 767 768 static int fl_set_key_port_range(struct nlattr **tb, struct fl_flow_key *key, 769 struct fl_flow_key *mask, 770 struct 
netlink_ext_ack *extack) 771 { 772 fl_set_key_val(tb, &key->tp_range.tp_min.dst, 773 TCA_FLOWER_KEY_PORT_DST_MIN, &mask->tp_range.tp_min.dst, 774 TCA_FLOWER_UNSPEC, sizeof(key->tp_range.tp_min.dst)); 775 fl_set_key_val(tb, &key->tp_range.tp_max.dst, 776 TCA_FLOWER_KEY_PORT_DST_MAX, &mask->tp_range.tp_max.dst, 777 TCA_FLOWER_UNSPEC, sizeof(key->tp_range.tp_max.dst)); 778 fl_set_key_val(tb, &key->tp_range.tp_min.src, 779 TCA_FLOWER_KEY_PORT_SRC_MIN, &mask->tp_range.tp_min.src, 780 TCA_FLOWER_UNSPEC, sizeof(key->tp_range.tp_min.src)); 781 fl_set_key_val(tb, &key->tp_range.tp_max.src, 782 TCA_FLOWER_KEY_PORT_SRC_MAX, &mask->tp_range.tp_max.src, 783 TCA_FLOWER_UNSPEC, sizeof(key->tp_range.tp_max.src)); 784 785 if (mask->tp_range.tp_min.dst && mask->tp_range.tp_max.dst && 786 ntohs(key->tp_range.tp_max.dst) <= 787 ntohs(key->tp_range.tp_min.dst)) { 788 NL_SET_ERR_MSG_ATTR(extack, 789 tb[TCA_FLOWER_KEY_PORT_DST_MIN], 790 "Invalid destination port range (min must be strictly smaller than max)"); 791 return -EINVAL; 792 } 793 if (mask->tp_range.tp_min.src && mask->tp_range.tp_max.src && 794 ntohs(key->tp_range.tp_max.src) <= 795 ntohs(key->tp_range.tp_min.src)) { 796 NL_SET_ERR_MSG_ATTR(extack, 797 tb[TCA_FLOWER_KEY_PORT_SRC_MIN], 798 "Invalid source port range (min must be strictly smaller than max)"); 799 return -EINVAL; 800 } 801 802 return 0; 803 } 804 805 static int fl_set_key_mpls_lse(const struct nlattr *nla_lse, 806 struct flow_dissector_key_mpls *key_val, 807 struct flow_dissector_key_mpls *key_mask, 808 struct netlink_ext_ack *extack) 809 { 810 struct nlattr *tb[TCA_FLOWER_KEY_MPLS_OPT_LSE_MAX + 1]; 811 struct flow_dissector_mpls_lse *lse_mask; 812 struct flow_dissector_mpls_lse *lse_val; 813 u8 lse_index; 814 u8 depth; 815 int err; 816 817 err = nla_parse_nested(tb, TCA_FLOWER_KEY_MPLS_OPT_LSE_MAX, nla_lse, 818 mpls_stack_entry_policy, extack); 819 if (err < 0) 820 return err; 821 822 if (!tb[TCA_FLOWER_KEY_MPLS_OPT_LSE_DEPTH]) { 823 NL_SET_ERR_MSG(extack, 
"Missing MPLS option \"depth\""); 824 return -EINVAL; 825 } 826 827 depth = nla_get_u8(tb[TCA_FLOWER_KEY_MPLS_OPT_LSE_DEPTH]); 828 829 /* LSE depth starts at 1, for consistency with terminology used by 830 * RFC 3031 (section 3.9), where depth 0 refers to unlabeled packets. 831 */ 832 if (depth < 1 || depth > FLOW_DIS_MPLS_MAX) { 833 NL_SET_ERR_MSG_ATTR(extack, 834 tb[TCA_FLOWER_KEY_MPLS_OPT_LSE_DEPTH], 835 "Invalid MPLS depth"); 836 return -EINVAL; 837 } 838 lse_index = depth - 1; 839 840 dissector_set_mpls_lse(key_val, lse_index); 841 dissector_set_mpls_lse(key_mask, lse_index); 842 843 lse_val = &key_val->ls[lse_index]; 844 lse_mask = &key_mask->ls[lse_index]; 845 846 if (tb[TCA_FLOWER_KEY_MPLS_OPT_LSE_TTL]) { 847 lse_val->mpls_ttl = nla_get_u8(tb[TCA_FLOWER_KEY_MPLS_OPT_LSE_TTL]); 848 lse_mask->mpls_ttl = MPLS_TTL_MASK; 849 } 850 if (tb[TCA_FLOWER_KEY_MPLS_OPT_LSE_BOS]) { 851 u8 bos = nla_get_u8(tb[TCA_FLOWER_KEY_MPLS_OPT_LSE_BOS]); 852 853 if (bos & ~MPLS_BOS_MASK) { 854 NL_SET_ERR_MSG_ATTR(extack, 855 tb[TCA_FLOWER_KEY_MPLS_OPT_LSE_BOS], 856 "Bottom Of Stack (BOS) must be 0 or 1"); 857 return -EINVAL; 858 } 859 lse_val->mpls_bos = bos; 860 lse_mask->mpls_bos = MPLS_BOS_MASK; 861 } 862 if (tb[TCA_FLOWER_KEY_MPLS_OPT_LSE_TC]) { 863 u8 tc = nla_get_u8(tb[TCA_FLOWER_KEY_MPLS_OPT_LSE_TC]); 864 865 if (tc & ~MPLS_TC_MASK) { 866 NL_SET_ERR_MSG_ATTR(extack, 867 tb[TCA_FLOWER_KEY_MPLS_OPT_LSE_TC], 868 "Traffic Class (TC) must be between 0 and 7"); 869 return -EINVAL; 870 } 871 lse_val->mpls_tc = tc; 872 lse_mask->mpls_tc = MPLS_TC_MASK; 873 } 874 if (tb[TCA_FLOWER_KEY_MPLS_OPT_LSE_LABEL]) { 875 u32 label = nla_get_u32(tb[TCA_FLOWER_KEY_MPLS_OPT_LSE_LABEL]); 876 877 if (label & ~MPLS_LABEL_MASK) { 878 NL_SET_ERR_MSG_ATTR(extack, 879 tb[TCA_FLOWER_KEY_MPLS_OPT_LSE_LABEL], 880 "Label must be between 0 and 1048575"); 881 return -EINVAL; 882 } 883 lse_val->mpls_label = label; 884 lse_mask->mpls_label = MPLS_LABEL_MASK; 885 } 886 887 return 0; 888 } 889 890 static int 
fl_set_key_mpls_opts(const struct nlattr *nla_mpls_opts, 891 struct flow_dissector_key_mpls *key_val, 892 struct flow_dissector_key_mpls *key_mask, 893 struct netlink_ext_ack *extack) 894 { 895 struct nlattr *nla_lse; 896 int rem; 897 int err; 898 899 if (!(nla_mpls_opts->nla_type & NLA_F_NESTED)) { 900 NL_SET_ERR_MSG_ATTR(extack, nla_mpls_opts, 901 "NLA_F_NESTED is missing"); 902 return -EINVAL; 903 } 904 905 nla_for_each_nested(nla_lse, nla_mpls_opts, rem) { 906 if (nla_type(nla_lse) != TCA_FLOWER_KEY_MPLS_OPTS_LSE) { 907 NL_SET_ERR_MSG_ATTR(extack, nla_lse, 908 "Invalid MPLS option type"); 909 return -EINVAL; 910 } 911 912 err = fl_set_key_mpls_lse(nla_lse, key_val, key_mask, extack); 913 if (err < 0) 914 return err; 915 } 916 if (rem) { 917 NL_SET_ERR_MSG(extack, 918 "Bytes leftover after parsing MPLS options"); 919 return -EINVAL; 920 } 921 922 return 0; 923 } 924 925 static int fl_set_key_mpls(struct nlattr **tb, 926 struct flow_dissector_key_mpls *key_val, 927 struct flow_dissector_key_mpls *key_mask, 928 struct netlink_ext_ack *extack) 929 { 930 struct flow_dissector_mpls_lse *lse_mask; 931 struct flow_dissector_mpls_lse *lse_val; 932 933 if (tb[TCA_FLOWER_KEY_MPLS_OPTS]) { 934 if (tb[TCA_FLOWER_KEY_MPLS_TTL] || 935 tb[TCA_FLOWER_KEY_MPLS_BOS] || 936 tb[TCA_FLOWER_KEY_MPLS_TC] || 937 tb[TCA_FLOWER_KEY_MPLS_LABEL]) { 938 NL_SET_ERR_MSG_ATTR(extack, 939 tb[TCA_FLOWER_KEY_MPLS_OPTS], 940 "MPLS label, Traffic Class, Bottom Of Stack and Time To Live must be encapsulated in the MPLS options attribute"); 941 return -EBADMSG; 942 } 943 944 return fl_set_key_mpls_opts(tb[TCA_FLOWER_KEY_MPLS_OPTS], 945 key_val, key_mask, extack); 946 } 947 948 lse_val = &key_val->ls[0]; 949 lse_mask = &key_mask->ls[0]; 950 951 if (tb[TCA_FLOWER_KEY_MPLS_TTL]) { 952 lse_val->mpls_ttl = nla_get_u8(tb[TCA_FLOWER_KEY_MPLS_TTL]); 953 lse_mask->mpls_ttl = MPLS_TTL_MASK; 954 dissector_set_mpls_lse(key_val, 0); 955 dissector_set_mpls_lse(key_mask, 0); 956 } 957 if 
(tb[TCA_FLOWER_KEY_MPLS_BOS]) { 958 u8 bos = nla_get_u8(tb[TCA_FLOWER_KEY_MPLS_BOS]); 959 960 if (bos & ~MPLS_BOS_MASK) { 961 NL_SET_ERR_MSG_ATTR(extack, 962 tb[TCA_FLOWER_KEY_MPLS_BOS], 963 "Bottom Of Stack (BOS) must be 0 or 1"); 964 return -EINVAL; 965 } 966 lse_val->mpls_bos = bos; 967 lse_mask->mpls_bos = MPLS_BOS_MASK; 968 dissector_set_mpls_lse(key_val, 0); 969 dissector_set_mpls_lse(key_mask, 0); 970 } 971 if (tb[TCA_FLOWER_KEY_MPLS_TC]) { 972 u8 tc = nla_get_u8(tb[TCA_FLOWER_KEY_MPLS_TC]); 973 974 if (tc & ~MPLS_TC_MASK) { 975 NL_SET_ERR_MSG_ATTR(extack, 976 tb[TCA_FLOWER_KEY_MPLS_TC], 977 "Traffic Class (TC) must be between 0 and 7"); 978 return -EINVAL; 979 } 980 lse_val->mpls_tc = tc; 981 lse_mask->mpls_tc = MPLS_TC_MASK; 982 dissector_set_mpls_lse(key_val, 0); 983 dissector_set_mpls_lse(key_mask, 0); 984 } 985 if (tb[TCA_FLOWER_KEY_MPLS_LABEL]) { 986 u32 label = nla_get_u32(tb[TCA_FLOWER_KEY_MPLS_LABEL]); 987 988 if (label & ~MPLS_LABEL_MASK) { 989 NL_SET_ERR_MSG_ATTR(extack, 990 tb[TCA_FLOWER_KEY_MPLS_LABEL], 991 "Label must be between 0 and 1048575"); 992 return -EINVAL; 993 } 994 lse_val->mpls_label = label; 995 lse_mask->mpls_label = MPLS_LABEL_MASK; 996 dissector_set_mpls_lse(key_val, 0); 997 dissector_set_mpls_lse(key_mask, 0); 998 } 999 return 0; 1000 } 1001 1002 static void fl_set_key_vlan(struct nlattr **tb, 1003 __be16 ethertype, 1004 int vlan_id_key, int vlan_prio_key, 1005 struct flow_dissector_key_vlan *key_val, 1006 struct flow_dissector_key_vlan *key_mask) 1007 { 1008 #define VLAN_PRIORITY_MASK 0x7 1009 1010 if (tb[vlan_id_key]) { 1011 key_val->vlan_id = 1012 nla_get_u16(tb[vlan_id_key]) & VLAN_VID_MASK; 1013 key_mask->vlan_id = VLAN_VID_MASK; 1014 } 1015 if (tb[vlan_prio_key]) { 1016 key_val->vlan_priority = 1017 nla_get_u8(tb[vlan_prio_key]) & 1018 VLAN_PRIORITY_MASK; 1019 key_mask->vlan_priority = VLAN_PRIORITY_MASK; 1020 } 1021 key_val->vlan_tpid = ethertype; 1022 key_mask->vlan_tpid = cpu_to_be16(~0); 1023 } 1024 1025 static void 
/* Translate a single flower flag into its flow dissector counterpart.
 *
 * Nothing happens unless @flower_flag_bit is set in @flower_mask.  When it
 * is, @dissector_flag_bit is added to *@dissector_mask, and also to
 * *@dissector_key if the flag is set in @flower_key.
 */
static void fl_set_key_flag(u32 flower_key, u32 flower_mask,
			    u32 *dissector_key, u32 *dissector_mask,
			    u32 flower_flag_bit, u32 dissector_flag_bit)
{
	if (!(flower_mask & flower_flag_bit))
		return;

	*dissector_mask |= dissector_flag_bit;
	if (flower_key & flower_flag_bit)
		*dissector_key |= dissector_flag_bit;
}

/* Convert TCA_FLOWER_KEY_FLAGS / TCA_FLOWER_KEY_FLAGS_MASK into flow
 * dissector control flags.
 *
 * tb[TCA_FLOWER_KEY_FLAGS] is read unconditionally, so the caller has to
 * make sure it is present.  *@flags_key and *@flags_mask are only written
 * on success.
 *
 * Return: 0 on success, -EINVAL if the mask attribute is missing.
 */
static int fl_set_key_flags(struct nlattr **tb, u32 *flags_key,
			    u32 *flags_mask, struct netlink_ext_ack *extack)
{
	const struct nlattr *mask_attr = tb[TCA_FLOWER_KEY_FLAGS_MASK];
	u32 flower_key, flower_mask;
	u32 dis_key = 0;
	u32 dis_mask = 0;

	/* mask is mandatory for flags */
	if (!mask_attr) {
		NL_SET_ERR_MSG(extack, "Missing flags mask");
		return -EINVAL;
	}

	flower_key = be32_to_cpu(nla_get_be32(tb[TCA_FLOWER_KEY_FLAGS]));
	flower_mask = be32_to_cpu(nla_get_be32(mask_attr));

	fl_set_key_flag(flower_key, flower_mask, &dis_key, &dis_mask,
			TCA_FLOWER_KEY_FLAGS_IS_FRAGMENT, FLOW_DIS_IS_FRAGMENT);
	fl_set_key_flag(flower_key, flower_mask, &dis_key, &dis_mask,
			TCA_FLOWER_KEY_FLAGS_FRAG_IS_FIRST,
			FLOW_DIS_FIRST_FRAG);

	*flags_key = dis_key;
	*flags_mask = dis_mask;

	return 0;
}
TCA_FLOWER_KEY_ENC_IP_TTL_MASK : TCA_FLOWER_KEY_IP_TTL_MASK; 1070 1071 fl_set_key_val(tb, &key->tos, tos_key, &mask->tos, tos_mask, sizeof(key->tos)); 1072 fl_set_key_val(tb, &key->ttl, ttl_key, &mask->ttl, ttl_mask, sizeof(key->ttl)); 1073 } 1074 1075 static int fl_set_geneve_opt(const struct nlattr *nla, struct fl_flow_key *key, 1076 int depth, int option_len, 1077 struct netlink_ext_ack *extack) 1078 { 1079 struct nlattr *tb[TCA_FLOWER_KEY_ENC_OPT_GENEVE_MAX + 1]; 1080 struct nlattr *class = NULL, *type = NULL, *data = NULL; 1081 struct geneve_opt *opt; 1082 int err, data_len = 0; 1083 1084 if (option_len > sizeof(struct geneve_opt)) 1085 data_len = option_len - sizeof(struct geneve_opt); 1086 1087 opt = (struct geneve_opt *)&key->enc_opts.data[key->enc_opts.len]; 1088 memset(opt, 0xff, option_len); 1089 opt->length = data_len / 4; 1090 opt->r1 = 0; 1091 opt->r2 = 0; 1092 opt->r3 = 0; 1093 1094 /* If no mask has been prodived we assume an exact match. */ 1095 if (!depth) 1096 return sizeof(struct geneve_opt) + data_len; 1097 1098 if (nla_type(nla) != TCA_FLOWER_KEY_ENC_OPTS_GENEVE) { 1099 NL_SET_ERR_MSG(extack, "Non-geneve option type for mask"); 1100 return -EINVAL; 1101 } 1102 1103 err = nla_parse_nested_deprecated(tb, 1104 TCA_FLOWER_KEY_ENC_OPT_GENEVE_MAX, 1105 nla, geneve_opt_policy, extack); 1106 if (err < 0) 1107 return err; 1108 1109 /* We are not allowed to omit any of CLASS, TYPE or DATA 1110 * fields from the key. 1111 */ 1112 if (!option_len && 1113 (!tb[TCA_FLOWER_KEY_ENC_OPT_GENEVE_CLASS] || 1114 !tb[TCA_FLOWER_KEY_ENC_OPT_GENEVE_TYPE] || 1115 !tb[TCA_FLOWER_KEY_ENC_OPT_GENEVE_DATA])) { 1116 NL_SET_ERR_MSG(extack, "Missing tunnel key geneve option class, type or data"); 1117 return -EINVAL; 1118 } 1119 1120 /* Omitting any of CLASS, TYPE or DATA fields is allowed 1121 * for the mask. 
1122 */ 1123 if (tb[TCA_FLOWER_KEY_ENC_OPT_GENEVE_DATA]) { 1124 int new_len = key->enc_opts.len; 1125 1126 data = tb[TCA_FLOWER_KEY_ENC_OPT_GENEVE_DATA]; 1127 data_len = nla_len(data); 1128 if (data_len < 4) { 1129 NL_SET_ERR_MSG(extack, "Tunnel key geneve option data is less than 4 bytes long"); 1130 return -ERANGE; 1131 } 1132 if (data_len % 4) { 1133 NL_SET_ERR_MSG(extack, "Tunnel key geneve option data is not a multiple of 4 bytes long"); 1134 return -ERANGE; 1135 } 1136 1137 new_len += sizeof(struct geneve_opt) + data_len; 1138 BUILD_BUG_ON(FLOW_DIS_TUN_OPTS_MAX != IP_TUNNEL_OPTS_MAX); 1139 if (new_len > FLOW_DIS_TUN_OPTS_MAX) { 1140 NL_SET_ERR_MSG(extack, "Tunnel options exceeds max size"); 1141 return -ERANGE; 1142 } 1143 opt->length = data_len / 4; 1144 memcpy(opt->opt_data, nla_data(data), data_len); 1145 } 1146 1147 if (tb[TCA_FLOWER_KEY_ENC_OPT_GENEVE_CLASS]) { 1148 class = tb[TCA_FLOWER_KEY_ENC_OPT_GENEVE_CLASS]; 1149 opt->opt_class = nla_get_be16(class); 1150 } 1151 1152 if (tb[TCA_FLOWER_KEY_ENC_OPT_GENEVE_TYPE]) { 1153 type = tb[TCA_FLOWER_KEY_ENC_OPT_GENEVE_TYPE]; 1154 opt->type = nla_get_u8(type); 1155 } 1156 1157 return sizeof(struct geneve_opt) + data_len; 1158 } 1159 1160 static int fl_set_vxlan_opt(const struct nlattr *nla, struct fl_flow_key *key, 1161 int depth, int option_len, 1162 struct netlink_ext_ack *extack) 1163 { 1164 struct nlattr *tb[TCA_FLOWER_KEY_ENC_OPT_VXLAN_MAX + 1]; 1165 struct vxlan_metadata *md; 1166 int err; 1167 1168 md = (struct vxlan_metadata *)&key->enc_opts.data[key->enc_opts.len]; 1169 memset(md, 0xff, sizeof(*md)); 1170 1171 if (!depth) 1172 return sizeof(*md); 1173 1174 if (nla_type(nla) != TCA_FLOWER_KEY_ENC_OPTS_VXLAN) { 1175 NL_SET_ERR_MSG(extack, "Non-vxlan option type for mask"); 1176 return -EINVAL; 1177 } 1178 1179 err = nla_parse_nested(tb, TCA_FLOWER_KEY_ENC_OPT_VXLAN_MAX, nla, 1180 vxlan_opt_policy, extack); 1181 if (err < 0) 1182 return err; 1183 1184 if (!option_len && 
!tb[TCA_FLOWER_KEY_ENC_OPT_VXLAN_GBP]) { 1185 NL_SET_ERR_MSG(extack, "Missing tunnel key vxlan option gbp"); 1186 return -EINVAL; 1187 } 1188 1189 if (tb[TCA_FLOWER_KEY_ENC_OPT_VXLAN_GBP]) { 1190 md->gbp = nla_get_u32(tb[TCA_FLOWER_KEY_ENC_OPT_VXLAN_GBP]); 1191 md->gbp &= VXLAN_GBP_MASK; 1192 } 1193 1194 return sizeof(*md); 1195 } 1196 1197 static int fl_set_erspan_opt(const struct nlattr *nla, struct fl_flow_key *key, 1198 int depth, int option_len, 1199 struct netlink_ext_ack *extack) 1200 { 1201 struct nlattr *tb[TCA_FLOWER_KEY_ENC_OPT_ERSPAN_MAX + 1]; 1202 struct erspan_metadata *md; 1203 int err; 1204 1205 md = (struct erspan_metadata *)&key->enc_opts.data[key->enc_opts.len]; 1206 memset(md, 0xff, sizeof(*md)); 1207 md->version = 1; 1208 1209 if (!depth) 1210 return sizeof(*md); 1211 1212 if (nla_type(nla) != TCA_FLOWER_KEY_ENC_OPTS_ERSPAN) { 1213 NL_SET_ERR_MSG(extack, "Non-erspan option type for mask"); 1214 return -EINVAL; 1215 } 1216 1217 err = nla_parse_nested(tb, TCA_FLOWER_KEY_ENC_OPT_ERSPAN_MAX, nla, 1218 erspan_opt_policy, extack); 1219 if (err < 0) 1220 return err; 1221 1222 if (!option_len && !tb[TCA_FLOWER_KEY_ENC_OPT_ERSPAN_VER]) { 1223 NL_SET_ERR_MSG(extack, "Missing tunnel key erspan option ver"); 1224 return -EINVAL; 1225 } 1226 1227 if (tb[TCA_FLOWER_KEY_ENC_OPT_ERSPAN_VER]) 1228 md->version = nla_get_u8(tb[TCA_FLOWER_KEY_ENC_OPT_ERSPAN_VER]); 1229 1230 if (md->version == 1) { 1231 if (!option_len && !tb[TCA_FLOWER_KEY_ENC_OPT_ERSPAN_INDEX]) { 1232 NL_SET_ERR_MSG(extack, "Missing tunnel key erspan option index"); 1233 return -EINVAL; 1234 } 1235 if (tb[TCA_FLOWER_KEY_ENC_OPT_ERSPAN_INDEX]) { 1236 nla = tb[TCA_FLOWER_KEY_ENC_OPT_ERSPAN_INDEX]; 1237 memset(&md->u, 0x00, sizeof(md->u)); 1238 md->u.index = nla_get_be32(nla); 1239 } 1240 } else if (md->version == 2) { 1241 if (!option_len && (!tb[TCA_FLOWER_KEY_ENC_OPT_ERSPAN_DIR] || 1242 !tb[TCA_FLOWER_KEY_ENC_OPT_ERSPAN_HWID])) { 1243 NL_SET_ERR_MSG(extack, "Missing tunnel key erspan option dir 
or hwid"); 1244 return -EINVAL; 1245 } 1246 if (tb[TCA_FLOWER_KEY_ENC_OPT_ERSPAN_DIR]) { 1247 nla = tb[TCA_FLOWER_KEY_ENC_OPT_ERSPAN_DIR]; 1248 md->u.md2.dir = nla_get_u8(nla); 1249 } 1250 if (tb[TCA_FLOWER_KEY_ENC_OPT_ERSPAN_HWID]) { 1251 nla = tb[TCA_FLOWER_KEY_ENC_OPT_ERSPAN_HWID]; 1252 set_hwid(&md->u.md2, nla_get_u8(nla)); 1253 } 1254 } else { 1255 NL_SET_ERR_MSG(extack, "Tunnel key erspan option ver is incorrect"); 1256 return -EINVAL; 1257 } 1258 1259 return sizeof(*md); 1260 } 1261 1262 static int fl_set_enc_opt(struct nlattr **tb, struct fl_flow_key *key, 1263 struct fl_flow_key *mask, 1264 struct netlink_ext_ack *extack) 1265 { 1266 const struct nlattr *nla_enc_key, *nla_opt_key, *nla_opt_msk = NULL; 1267 int err, option_len, key_depth, msk_depth = 0; 1268 1269 err = nla_validate_nested_deprecated(tb[TCA_FLOWER_KEY_ENC_OPTS], 1270 TCA_FLOWER_KEY_ENC_OPTS_MAX, 1271 enc_opts_policy, extack); 1272 if (err) 1273 return err; 1274 1275 nla_enc_key = nla_data(tb[TCA_FLOWER_KEY_ENC_OPTS]); 1276 1277 if (tb[TCA_FLOWER_KEY_ENC_OPTS_MASK]) { 1278 err = nla_validate_nested_deprecated(tb[TCA_FLOWER_KEY_ENC_OPTS_MASK], 1279 TCA_FLOWER_KEY_ENC_OPTS_MAX, 1280 enc_opts_policy, extack); 1281 if (err) 1282 return err; 1283 1284 nla_opt_msk = nla_data(tb[TCA_FLOWER_KEY_ENC_OPTS_MASK]); 1285 msk_depth = nla_len(tb[TCA_FLOWER_KEY_ENC_OPTS_MASK]); 1286 if (!nla_ok(nla_opt_msk, msk_depth)) { 1287 NL_SET_ERR_MSG(extack, "Invalid nested attribute for masks"); 1288 return -EINVAL; 1289 } 1290 } 1291 1292 nla_for_each_attr(nla_opt_key, nla_enc_key, 1293 nla_len(tb[TCA_FLOWER_KEY_ENC_OPTS]), key_depth) { 1294 switch (nla_type(nla_opt_key)) { 1295 case TCA_FLOWER_KEY_ENC_OPTS_GENEVE: 1296 if (key->enc_opts.dst_opt_type && 1297 key->enc_opts.dst_opt_type != TUNNEL_GENEVE_OPT) { 1298 NL_SET_ERR_MSG(extack, "Duplicate type for geneve options"); 1299 return -EINVAL; 1300 } 1301 option_len = 0; 1302 key->enc_opts.dst_opt_type = TUNNEL_GENEVE_OPT; 1303 option_len = 
fl_set_geneve_opt(nla_opt_key, key, 1304 key_depth, option_len, 1305 extack); 1306 if (option_len < 0) 1307 return option_len; 1308 1309 key->enc_opts.len += option_len; 1310 /* At the same time we need to parse through the mask 1311 * in order to verify exact and mask attribute lengths. 1312 */ 1313 mask->enc_opts.dst_opt_type = TUNNEL_GENEVE_OPT; 1314 option_len = fl_set_geneve_opt(nla_opt_msk, mask, 1315 msk_depth, option_len, 1316 extack); 1317 if (option_len < 0) 1318 return option_len; 1319 1320 mask->enc_opts.len += option_len; 1321 if (key->enc_opts.len != mask->enc_opts.len) { 1322 NL_SET_ERR_MSG(extack, "Key and mask miss aligned"); 1323 return -EINVAL; 1324 } 1325 break; 1326 case TCA_FLOWER_KEY_ENC_OPTS_VXLAN: 1327 if (key->enc_opts.dst_opt_type) { 1328 NL_SET_ERR_MSG(extack, "Duplicate type for vxlan options"); 1329 return -EINVAL; 1330 } 1331 option_len = 0; 1332 key->enc_opts.dst_opt_type = TUNNEL_VXLAN_OPT; 1333 option_len = fl_set_vxlan_opt(nla_opt_key, key, 1334 key_depth, option_len, 1335 extack); 1336 if (option_len < 0) 1337 return option_len; 1338 1339 key->enc_opts.len += option_len; 1340 /* At the same time we need to parse through the mask 1341 * in order to verify exact and mask attribute lengths. 
1342 */ 1343 mask->enc_opts.dst_opt_type = TUNNEL_VXLAN_OPT; 1344 option_len = fl_set_vxlan_opt(nla_opt_msk, mask, 1345 msk_depth, option_len, 1346 extack); 1347 if (option_len < 0) 1348 return option_len; 1349 1350 mask->enc_opts.len += option_len; 1351 if (key->enc_opts.len != mask->enc_opts.len) { 1352 NL_SET_ERR_MSG(extack, "Key and mask miss aligned"); 1353 return -EINVAL; 1354 } 1355 break; 1356 case TCA_FLOWER_KEY_ENC_OPTS_ERSPAN: 1357 if (key->enc_opts.dst_opt_type) { 1358 NL_SET_ERR_MSG(extack, "Duplicate type for erspan options"); 1359 return -EINVAL; 1360 } 1361 option_len = 0; 1362 key->enc_opts.dst_opt_type = TUNNEL_ERSPAN_OPT; 1363 option_len = fl_set_erspan_opt(nla_opt_key, key, 1364 key_depth, option_len, 1365 extack); 1366 if (option_len < 0) 1367 return option_len; 1368 1369 key->enc_opts.len += option_len; 1370 /* At the same time we need to parse through the mask 1371 * in order to verify exact and mask attribute lengths. 1372 */ 1373 mask->enc_opts.dst_opt_type = TUNNEL_ERSPAN_OPT; 1374 option_len = fl_set_erspan_opt(nla_opt_msk, mask, 1375 msk_depth, option_len, 1376 extack); 1377 if (option_len < 0) 1378 return option_len; 1379 1380 mask->enc_opts.len += option_len; 1381 if (key->enc_opts.len != mask->enc_opts.len) { 1382 NL_SET_ERR_MSG(extack, "Key and mask miss aligned"); 1383 return -EINVAL; 1384 } 1385 break; 1386 default: 1387 NL_SET_ERR_MSG(extack, "Unknown tunnel option type"); 1388 return -EINVAL; 1389 } 1390 1391 if (!msk_depth) 1392 continue; 1393 1394 if (!nla_ok(nla_opt_msk, msk_depth)) { 1395 NL_SET_ERR_MSG(extack, "A mask attribute is invalid"); 1396 return -EINVAL; 1397 } 1398 nla_opt_msk = nla_next(nla_opt_msk, &msk_depth); 1399 } 1400 1401 return 0; 1402 } 1403 1404 static int fl_validate_ct_state(u16 state, struct nlattr *tb, 1405 struct netlink_ext_ack *extack) 1406 { 1407 if (state && !(state & TCA_FLOWER_KEY_CT_FLAGS_TRACKED)) { 1408 NL_SET_ERR_MSG_ATTR(extack, tb, 1409 "no trk, so no other flag can be set"); 1410 return 
-EINVAL; 1411 } 1412 1413 if (state & TCA_FLOWER_KEY_CT_FLAGS_NEW && 1414 state & TCA_FLOWER_KEY_CT_FLAGS_ESTABLISHED) { 1415 NL_SET_ERR_MSG_ATTR(extack, tb, 1416 "new and est are mutually exclusive"); 1417 return -EINVAL; 1418 } 1419 1420 if (state & TCA_FLOWER_KEY_CT_FLAGS_INVALID && 1421 state & ~(TCA_FLOWER_KEY_CT_FLAGS_TRACKED | 1422 TCA_FLOWER_KEY_CT_FLAGS_INVALID)) { 1423 NL_SET_ERR_MSG_ATTR(extack, tb, 1424 "when inv is set, only trk may be set"); 1425 return -EINVAL; 1426 } 1427 1428 if (state & TCA_FLOWER_KEY_CT_FLAGS_NEW && 1429 state & TCA_FLOWER_KEY_CT_FLAGS_REPLY) { 1430 NL_SET_ERR_MSG_ATTR(extack, tb, 1431 "new and rpl are mutually exclusive"); 1432 return -EINVAL; 1433 } 1434 1435 return 0; 1436 } 1437 1438 static int fl_set_key_ct(struct nlattr **tb, 1439 struct flow_dissector_key_ct *key, 1440 struct flow_dissector_key_ct *mask, 1441 struct netlink_ext_ack *extack) 1442 { 1443 if (tb[TCA_FLOWER_KEY_CT_STATE]) { 1444 int err; 1445 1446 if (!IS_ENABLED(CONFIG_NF_CONNTRACK)) { 1447 NL_SET_ERR_MSG(extack, "Conntrack isn't enabled"); 1448 return -EOPNOTSUPP; 1449 } 1450 fl_set_key_val(tb, &key->ct_state, TCA_FLOWER_KEY_CT_STATE, 1451 &mask->ct_state, TCA_FLOWER_KEY_CT_STATE_MASK, 1452 sizeof(key->ct_state)); 1453 1454 err = fl_validate_ct_state(key->ct_state & mask->ct_state, 1455 tb[TCA_FLOWER_KEY_CT_STATE_MASK], 1456 extack); 1457 if (err) 1458 return err; 1459 1460 } 1461 if (tb[TCA_FLOWER_KEY_CT_ZONE]) { 1462 if (!IS_ENABLED(CONFIG_NF_CONNTRACK_ZONES)) { 1463 NL_SET_ERR_MSG(extack, "Conntrack zones isn't enabled"); 1464 return -EOPNOTSUPP; 1465 } 1466 fl_set_key_val(tb, &key->ct_zone, TCA_FLOWER_KEY_CT_ZONE, 1467 &mask->ct_zone, TCA_FLOWER_KEY_CT_ZONE_MASK, 1468 sizeof(key->ct_zone)); 1469 } 1470 if (tb[TCA_FLOWER_KEY_CT_MARK]) { 1471 if (!IS_ENABLED(CONFIG_NF_CONNTRACK_MARK)) { 1472 NL_SET_ERR_MSG(extack, "Conntrack mark isn't enabled"); 1473 return -EOPNOTSUPP; 1474 } 1475 fl_set_key_val(tb, &key->ct_mark, TCA_FLOWER_KEY_CT_MARK, 1476 
&mask->ct_mark, TCA_FLOWER_KEY_CT_MARK_MASK, 1477 sizeof(key->ct_mark)); 1478 } 1479 if (tb[TCA_FLOWER_KEY_CT_LABELS]) { 1480 if (!IS_ENABLED(CONFIG_NF_CONNTRACK_LABELS)) { 1481 NL_SET_ERR_MSG(extack, "Conntrack labels aren't enabled"); 1482 return -EOPNOTSUPP; 1483 } 1484 fl_set_key_val(tb, key->ct_labels, TCA_FLOWER_KEY_CT_LABELS, 1485 mask->ct_labels, TCA_FLOWER_KEY_CT_LABELS_MASK, 1486 sizeof(key->ct_labels)); 1487 } 1488 1489 return 0; 1490 } 1491 1492 static int fl_set_key(struct net *net, struct nlattr **tb, 1493 struct fl_flow_key *key, struct fl_flow_key *mask, 1494 struct netlink_ext_ack *extack) 1495 { 1496 __be16 ethertype; 1497 int ret = 0; 1498 1499 if (tb[TCA_FLOWER_INDEV]) { 1500 int err = tcf_change_indev(net, tb[TCA_FLOWER_INDEV], extack); 1501 if (err < 0) 1502 return err; 1503 key->meta.ingress_ifindex = err; 1504 mask->meta.ingress_ifindex = 0xffffffff; 1505 } 1506 1507 fl_set_key_val(tb, key->eth.dst, TCA_FLOWER_KEY_ETH_DST, 1508 mask->eth.dst, TCA_FLOWER_KEY_ETH_DST_MASK, 1509 sizeof(key->eth.dst)); 1510 fl_set_key_val(tb, key->eth.src, TCA_FLOWER_KEY_ETH_SRC, 1511 mask->eth.src, TCA_FLOWER_KEY_ETH_SRC_MASK, 1512 sizeof(key->eth.src)); 1513 1514 if (tb[TCA_FLOWER_KEY_ETH_TYPE]) { 1515 ethertype = nla_get_be16(tb[TCA_FLOWER_KEY_ETH_TYPE]); 1516 1517 if (eth_type_vlan(ethertype)) { 1518 fl_set_key_vlan(tb, ethertype, TCA_FLOWER_KEY_VLAN_ID, 1519 TCA_FLOWER_KEY_VLAN_PRIO, &key->vlan, 1520 &mask->vlan); 1521 1522 if (tb[TCA_FLOWER_KEY_VLAN_ETH_TYPE]) { 1523 ethertype = nla_get_be16(tb[TCA_FLOWER_KEY_VLAN_ETH_TYPE]); 1524 if (eth_type_vlan(ethertype)) { 1525 fl_set_key_vlan(tb, ethertype, 1526 TCA_FLOWER_KEY_CVLAN_ID, 1527 TCA_FLOWER_KEY_CVLAN_PRIO, 1528 &key->cvlan, &mask->cvlan); 1529 fl_set_key_val(tb, &key->basic.n_proto, 1530 TCA_FLOWER_KEY_CVLAN_ETH_TYPE, 1531 &mask->basic.n_proto, 1532 TCA_FLOWER_UNSPEC, 1533 sizeof(key->basic.n_proto)); 1534 mask->basic.n_proto = cpu_to_be16(0); 1535 } else { 1536 key->basic.n_proto = ethertype; 1537 } 
1538 } 1539 } else { 1540 key->basic.n_proto = ethertype; 1541 } 1542 } 1543 1544 if (key->basic.n_proto == htons(ETH_P_IP) || 1545 key->basic.n_proto == htons(ETH_P_IPV6)) { 1546 fl_set_key_val(tb, &key->basic.ip_proto, TCA_FLOWER_KEY_IP_PROTO, 1547 &mask->basic.ip_proto, TCA_FLOWER_UNSPEC, 1548 sizeof(key->basic.ip_proto)); 1549 fl_set_key_ip(tb, false, &key->ip, &mask->ip); 1550 } 1551 1552 if (tb[TCA_FLOWER_KEY_IPV4_SRC] || tb[TCA_FLOWER_KEY_IPV4_DST]) { 1553 key->control.addr_type = FLOW_DISSECTOR_KEY_IPV4_ADDRS; 1554 mask->control.addr_type = ~0; 1555 fl_set_key_val(tb, &key->ipv4.src, TCA_FLOWER_KEY_IPV4_SRC, 1556 &mask->ipv4.src, TCA_FLOWER_KEY_IPV4_SRC_MASK, 1557 sizeof(key->ipv4.src)); 1558 fl_set_key_val(tb, &key->ipv4.dst, TCA_FLOWER_KEY_IPV4_DST, 1559 &mask->ipv4.dst, TCA_FLOWER_KEY_IPV4_DST_MASK, 1560 sizeof(key->ipv4.dst)); 1561 } else if (tb[TCA_FLOWER_KEY_IPV6_SRC] || tb[TCA_FLOWER_KEY_IPV6_DST]) { 1562 key->control.addr_type = FLOW_DISSECTOR_KEY_IPV6_ADDRS; 1563 mask->control.addr_type = ~0; 1564 fl_set_key_val(tb, &key->ipv6.src, TCA_FLOWER_KEY_IPV6_SRC, 1565 &mask->ipv6.src, TCA_FLOWER_KEY_IPV6_SRC_MASK, 1566 sizeof(key->ipv6.src)); 1567 fl_set_key_val(tb, &key->ipv6.dst, TCA_FLOWER_KEY_IPV6_DST, 1568 &mask->ipv6.dst, TCA_FLOWER_KEY_IPV6_DST_MASK, 1569 sizeof(key->ipv6.dst)); 1570 } 1571 1572 if (key->basic.ip_proto == IPPROTO_TCP) { 1573 fl_set_key_val(tb, &key->tp.src, TCA_FLOWER_KEY_TCP_SRC, 1574 &mask->tp.src, TCA_FLOWER_KEY_TCP_SRC_MASK, 1575 sizeof(key->tp.src)); 1576 fl_set_key_val(tb, &key->tp.dst, TCA_FLOWER_KEY_TCP_DST, 1577 &mask->tp.dst, TCA_FLOWER_KEY_TCP_DST_MASK, 1578 sizeof(key->tp.dst)); 1579 fl_set_key_val(tb, &key->tcp.flags, TCA_FLOWER_KEY_TCP_FLAGS, 1580 &mask->tcp.flags, TCA_FLOWER_KEY_TCP_FLAGS_MASK, 1581 sizeof(key->tcp.flags)); 1582 } else if (key->basic.ip_proto == IPPROTO_UDP) { 1583 fl_set_key_val(tb, &key->tp.src, TCA_FLOWER_KEY_UDP_SRC, 1584 &mask->tp.src, TCA_FLOWER_KEY_UDP_SRC_MASK, 1585 sizeof(key->tp.src)); 1586 
fl_set_key_val(tb, &key->tp.dst, TCA_FLOWER_KEY_UDP_DST, 1587 &mask->tp.dst, TCA_FLOWER_KEY_UDP_DST_MASK, 1588 sizeof(key->tp.dst)); 1589 } else if (key->basic.ip_proto == IPPROTO_SCTP) { 1590 fl_set_key_val(tb, &key->tp.src, TCA_FLOWER_KEY_SCTP_SRC, 1591 &mask->tp.src, TCA_FLOWER_KEY_SCTP_SRC_MASK, 1592 sizeof(key->tp.src)); 1593 fl_set_key_val(tb, &key->tp.dst, TCA_FLOWER_KEY_SCTP_DST, 1594 &mask->tp.dst, TCA_FLOWER_KEY_SCTP_DST_MASK, 1595 sizeof(key->tp.dst)); 1596 } else if (key->basic.n_proto == htons(ETH_P_IP) && 1597 key->basic.ip_proto == IPPROTO_ICMP) { 1598 fl_set_key_val(tb, &key->icmp.type, TCA_FLOWER_KEY_ICMPV4_TYPE, 1599 &mask->icmp.type, 1600 TCA_FLOWER_KEY_ICMPV4_TYPE_MASK, 1601 sizeof(key->icmp.type)); 1602 fl_set_key_val(tb, &key->icmp.code, TCA_FLOWER_KEY_ICMPV4_CODE, 1603 &mask->icmp.code, 1604 TCA_FLOWER_KEY_ICMPV4_CODE_MASK, 1605 sizeof(key->icmp.code)); 1606 } else if (key->basic.n_proto == htons(ETH_P_IPV6) && 1607 key->basic.ip_proto == IPPROTO_ICMPV6) { 1608 fl_set_key_val(tb, &key->icmp.type, TCA_FLOWER_KEY_ICMPV6_TYPE, 1609 &mask->icmp.type, 1610 TCA_FLOWER_KEY_ICMPV6_TYPE_MASK, 1611 sizeof(key->icmp.type)); 1612 fl_set_key_val(tb, &key->icmp.code, TCA_FLOWER_KEY_ICMPV6_CODE, 1613 &mask->icmp.code, 1614 TCA_FLOWER_KEY_ICMPV6_CODE_MASK, 1615 sizeof(key->icmp.code)); 1616 } else if (key->basic.n_proto == htons(ETH_P_MPLS_UC) || 1617 key->basic.n_proto == htons(ETH_P_MPLS_MC)) { 1618 ret = fl_set_key_mpls(tb, &key->mpls, &mask->mpls, extack); 1619 if (ret) 1620 return ret; 1621 } else if (key->basic.n_proto == htons(ETH_P_ARP) || 1622 key->basic.n_proto == htons(ETH_P_RARP)) { 1623 fl_set_key_val(tb, &key->arp.sip, TCA_FLOWER_KEY_ARP_SIP, 1624 &mask->arp.sip, TCA_FLOWER_KEY_ARP_SIP_MASK, 1625 sizeof(key->arp.sip)); 1626 fl_set_key_val(tb, &key->arp.tip, TCA_FLOWER_KEY_ARP_TIP, 1627 &mask->arp.tip, TCA_FLOWER_KEY_ARP_TIP_MASK, 1628 sizeof(key->arp.tip)); 1629 fl_set_key_val(tb, &key->arp.op, TCA_FLOWER_KEY_ARP_OP, 1630 &mask->arp.op, 
TCA_FLOWER_KEY_ARP_OP_MASK, 1631 sizeof(key->arp.op)); 1632 fl_set_key_val(tb, key->arp.sha, TCA_FLOWER_KEY_ARP_SHA, 1633 mask->arp.sha, TCA_FLOWER_KEY_ARP_SHA_MASK, 1634 sizeof(key->arp.sha)); 1635 fl_set_key_val(tb, key->arp.tha, TCA_FLOWER_KEY_ARP_THA, 1636 mask->arp.tha, TCA_FLOWER_KEY_ARP_THA_MASK, 1637 sizeof(key->arp.tha)); 1638 } 1639 1640 if (key->basic.ip_proto == IPPROTO_TCP || 1641 key->basic.ip_proto == IPPROTO_UDP || 1642 key->basic.ip_proto == IPPROTO_SCTP) { 1643 ret = fl_set_key_port_range(tb, key, mask, extack); 1644 if (ret) 1645 return ret; 1646 } 1647 1648 if (tb[TCA_FLOWER_KEY_ENC_IPV4_SRC] || 1649 tb[TCA_FLOWER_KEY_ENC_IPV4_DST]) { 1650 key->enc_control.addr_type = FLOW_DISSECTOR_KEY_IPV4_ADDRS; 1651 mask->enc_control.addr_type = ~0; 1652 fl_set_key_val(tb, &key->enc_ipv4.src, 1653 TCA_FLOWER_KEY_ENC_IPV4_SRC, 1654 &mask->enc_ipv4.src, 1655 TCA_FLOWER_KEY_ENC_IPV4_SRC_MASK, 1656 sizeof(key->enc_ipv4.src)); 1657 fl_set_key_val(tb, &key->enc_ipv4.dst, 1658 TCA_FLOWER_KEY_ENC_IPV4_DST, 1659 &mask->enc_ipv4.dst, 1660 TCA_FLOWER_KEY_ENC_IPV4_DST_MASK, 1661 sizeof(key->enc_ipv4.dst)); 1662 } 1663 1664 if (tb[TCA_FLOWER_KEY_ENC_IPV6_SRC] || 1665 tb[TCA_FLOWER_KEY_ENC_IPV6_DST]) { 1666 key->enc_control.addr_type = FLOW_DISSECTOR_KEY_IPV6_ADDRS; 1667 mask->enc_control.addr_type = ~0; 1668 fl_set_key_val(tb, &key->enc_ipv6.src, 1669 TCA_FLOWER_KEY_ENC_IPV6_SRC, 1670 &mask->enc_ipv6.src, 1671 TCA_FLOWER_KEY_ENC_IPV6_SRC_MASK, 1672 sizeof(key->enc_ipv6.src)); 1673 fl_set_key_val(tb, &key->enc_ipv6.dst, 1674 TCA_FLOWER_KEY_ENC_IPV6_DST, 1675 &mask->enc_ipv6.dst, 1676 TCA_FLOWER_KEY_ENC_IPV6_DST_MASK, 1677 sizeof(key->enc_ipv6.dst)); 1678 } 1679 1680 fl_set_key_val(tb, &key->enc_key_id.keyid, TCA_FLOWER_KEY_ENC_KEY_ID, 1681 &mask->enc_key_id.keyid, TCA_FLOWER_UNSPEC, 1682 sizeof(key->enc_key_id.keyid)); 1683 1684 fl_set_key_val(tb, &key->enc_tp.src, TCA_FLOWER_KEY_ENC_UDP_SRC_PORT, 1685 &mask->enc_tp.src, TCA_FLOWER_KEY_ENC_UDP_SRC_PORT_MASK, 1686 
sizeof(key->enc_tp.src)); 1687 1688 fl_set_key_val(tb, &key->enc_tp.dst, TCA_FLOWER_KEY_ENC_UDP_DST_PORT, 1689 &mask->enc_tp.dst, TCA_FLOWER_KEY_ENC_UDP_DST_PORT_MASK, 1690 sizeof(key->enc_tp.dst)); 1691 1692 fl_set_key_ip(tb, true, &key->enc_ip, &mask->enc_ip); 1693 1694 fl_set_key_val(tb, &key->hash.hash, TCA_FLOWER_KEY_HASH, 1695 &mask->hash.hash, TCA_FLOWER_KEY_HASH_MASK, 1696 sizeof(key->hash.hash)); 1697 1698 if (tb[TCA_FLOWER_KEY_ENC_OPTS]) { 1699 ret = fl_set_enc_opt(tb, key, mask, extack); 1700 if (ret) 1701 return ret; 1702 } 1703 1704 ret = fl_set_key_ct(tb, &key->ct, &mask->ct, extack); 1705 if (ret) 1706 return ret; 1707 1708 if (tb[TCA_FLOWER_KEY_FLAGS]) 1709 ret = fl_set_key_flags(tb, &key->control.flags, 1710 &mask->control.flags, extack); 1711 1712 return ret; 1713 } 1714 1715 static void fl_mask_copy(struct fl_flow_mask *dst, 1716 struct fl_flow_mask *src) 1717 { 1718 const void *psrc = fl_key_get_start(&src->key, src); 1719 void *pdst = fl_key_get_start(&dst->key, src); 1720 1721 memcpy(pdst, psrc, fl_mask_range(src)); 1722 dst->range = src->range; 1723 } 1724 1725 static const struct rhashtable_params fl_ht_params = { 1726 .key_offset = offsetof(struct cls_fl_filter, mkey), /* base offset */ 1727 .head_offset = offsetof(struct cls_fl_filter, ht_node), 1728 .automatic_shrinking = true, 1729 }; 1730 1731 static int fl_init_mask_hashtable(struct fl_flow_mask *mask) 1732 { 1733 mask->filter_ht_params = fl_ht_params; 1734 mask->filter_ht_params.key_len = fl_mask_range(mask); 1735 mask->filter_ht_params.key_offset += mask->range.start; 1736 1737 return rhashtable_init(&mask->ht, &mask->filter_ht_params); 1738 } 1739 1740 #define FL_KEY_MEMBER_OFFSET(member) offsetof(struct fl_flow_key, member) 1741 #define FL_KEY_MEMBER_SIZE(member) sizeof_field(struct fl_flow_key, member) 1742 1743 #define FL_KEY_IS_MASKED(mask, member) \ 1744 memchr_inv(((char *)mask) + FL_KEY_MEMBER_OFFSET(member), \ 1745 0, FL_KEY_MEMBER_SIZE(member)) \ 1746 1747 #define 
FL_KEY_SET(keys, cnt, id, member) \ 1748 do { \ 1749 keys[cnt].key_id = id; \ 1750 keys[cnt].offset = FL_KEY_MEMBER_OFFSET(member); \ 1751 cnt++; \ 1752 } while(0); 1753 1754 #define FL_KEY_SET_IF_MASKED(mask, keys, cnt, id, member) \ 1755 do { \ 1756 if (FL_KEY_IS_MASKED(mask, member)) \ 1757 FL_KEY_SET(keys, cnt, id, member); \ 1758 } while(0); 1759 1760 static void fl_init_dissector(struct flow_dissector *dissector, 1761 struct fl_flow_key *mask) 1762 { 1763 struct flow_dissector_key keys[FLOW_DISSECTOR_KEY_MAX]; 1764 size_t cnt = 0; 1765 1766 FL_KEY_SET_IF_MASKED(mask, keys, cnt, 1767 FLOW_DISSECTOR_KEY_META, meta); 1768 FL_KEY_SET(keys, cnt, FLOW_DISSECTOR_KEY_CONTROL, control); 1769 FL_KEY_SET(keys, cnt, FLOW_DISSECTOR_KEY_BASIC, basic); 1770 FL_KEY_SET_IF_MASKED(mask, keys, cnt, 1771 FLOW_DISSECTOR_KEY_ETH_ADDRS, eth); 1772 FL_KEY_SET_IF_MASKED(mask, keys, cnt, 1773 FLOW_DISSECTOR_KEY_IPV4_ADDRS, ipv4); 1774 FL_KEY_SET_IF_MASKED(mask, keys, cnt, 1775 FLOW_DISSECTOR_KEY_IPV6_ADDRS, ipv6); 1776 FL_KEY_SET_IF_MASKED(mask, keys, cnt, 1777 FLOW_DISSECTOR_KEY_PORTS, tp); 1778 FL_KEY_SET_IF_MASKED(mask, keys, cnt, 1779 FLOW_DISSECTOR_KEY_PORTS_RANGE, tp_range); 1780 FL_KEY_SET_IF_MASKED(mask, keys, cnt, 1781 FLOW_DISSECTOR_KEY_IP, ip); 1782 FL_KEY_SET_IF_MASKED(mask, keys, cnt, 1783 FLOW_DISSECTOR_KEY_TCP, tcp); 1784 FL_KEY_SET_IF_MASKED(mask, keys, cnt, 1785 FLOW_DISSECTOR_KEY_ICMP, icmp); 1786 FL_KEY_SET_IF_MASKED(mask, keys, cnt, 1787 FLOW_DISSECTOR_KEY_ARP, arp); 1788 FL_KEY_SET_IF_MASKED(mask, keys, cnt, 1789 FLOW_DISSECTOR_KEY_MPLS, mpls); 1790 FL_KEY_SET_IF_MASKED(mask, keys, cnt, 1791 FLOW_DISSECTOR_KEY_VLAN, vlan); 1792 FL_KEY_SET_IF_MASKED(mask, keys, cnt, 1793 FLOW_DISSECTOR_KEY_CVLAN, cvlan); 1794 FL_KEY_SET_IF_MASKED(mask, keys, cnt, 1795 FLOW_DISSECTOR_KEY_ENC_KEYID, enc_key_id); 1796 FL_KEY_SET_IF_MASKED(mask, keys, cnt, 1797 FLOW_DISSECTOR_KEY_ENC_IPV4_ADDRS, enc_ipv4); 1798 FL_KEY_SET_IF_MASKED(mask, keys, cnt, 1799 
FLOW_DISSECTOR_KEY_ENC_IPV6_ADDRS, enc_ipv6); 1800 if (FL_KEY_IS_MASKED(mask, enc_ipv4) || 1801 FL_KEY_IS_MASKED(mask, enc_ipv6)) 1802 FL_KEY_SET(keys, cnt, FLOW_DISSECTOR_KEY_ENC_CONTROL, 1803 enc_control); 1804 FL_KEY_SET_IF_MASKED(mask, keys, cnt, 1805 FLOW_DISSECTOR_KEY_ENC_PORTS, enc_tp); 1806 FL_KEY_SET_IF_MASKED(mask, keys, cnt, 1807 FLOW_DISSECTOR_KEY_ENC_IP, enc_ip); 1808 FL_KEY_SET_IF_MASKED(mask, keys, cnt, 1809 FLOW_DISSECTOR_KEY_ENC_OPTS, enc_opts); 1810 FL_KEY_SET_IF_MASKED(mask, keys, cnt, 1811 FLOW_DISSECTOR_KEY_CT, ct); 1812 FL_KEY_SET_IF_MASKED(mask, keys, cnt, 1813 FLOW_DISSECTOR_KEY_HASH, hash); 1814 1815 skb_flow_dissector_init(dissector, keys, cnt); 1816 } 1817 1818 static struct fl_flow_mask *fl_create_new_mask(struct cls_fl_head *head, 1819 struct fl_flow_mask *mask) 1820 { 1821 struct fl_flow_mask *newmask; 1822 int err; 1823 1824 newmask = kzalloc(sizeof(*newmask), GFP_KERNEL); 1825 if (!newmask) 1826 return ERR_PTR(-ENOMEM); 1827 1828 fl_mask_copy(newmask, mask); 1829 1830 if ((newmask->key.tp_range.tp_min.dst && 1831 newmask->key.tp_range.tp_max.dst) || 1832 (newmask->key.tp_range.tp_min.src && 1833 newmask->key.tp_range.tp_max.src)) 1834 newmask->flags |= TCA_FLOWER_MASK_FLAGS_RANGE; 1835 1836 err = fl_init_mask_hashtable(newmask); 1837 if (err) 1838 goto errout_free; 1839 1840 fl_init_dissector(&newmask->dissector, &newmask->key); 1841 1842 INIT_LIST_HEAD_RCU(&newmask->filters); 1843 1844 refcount_set(&newmask->refcnt, 1); 1845 err = rhashtable_replace_fast(&head->ht, &mask->ht_node, 1846 &newmask->ht_node, mask_ht_params); 1847 if (err) 1848 goto errout_destroy; 1849 1850 spin_lock(&head->masks_lock); 1851 list_add_tail_rcu(&newmask->list, &head->masks); 1852 spin_unlock(&head->masks_lock); 1853 1854 return newmask; 1855 1856 errout_destroy: 1857 rhashtable_destroy(&newmask->ht); 1858 errout_free: 1859 kfree(newmask); 1860 1861 return ERR_PTR(err); 1862 } 1863 1864 static int fl_check_assign_mask(struct cls_fl_head *head, 1865 struct 
cls_fl_filter *fnew, 1866 struct cls_fl_filter *fold, 1867 struct fl_flow_mask *mask) 1868 { 1869 struct fl_flow_mask *newmask; 1870 int ret = 0; 1871 1872 rcu_read_lock(); 1873 1874 /* Insert mask as temporary node to prevent concurrent creation of mask 1875 * with same key. Any concurrent lookups with same key will return 1876 * -EAGAIN because mask's refcnt is zero. 1877 */ 1878 fnew->mask = rhashtable_lookup_get_insert_fast(&head->ht, 1879 &mask->ht_node, 1880 mask_ht_params); 1881 if (!fnew->mask) { 1882 rcu_read_unlock(); 1883 1884 if (fold) { 1885 ret = -EINVAL; 1886 goto errout_cleanup; 1887 } 1888 1889 newmask = fl_create_new_mask(head, mask); 1890 if (IS_ERR(newmask)) { 1891 ret = PTR_ERR(newmask); 1892 goto errout_cleanup; 1893 } 1894 1895 fnew->mask = newmask; 1896 return 0; 1897 } else if (IS_ERR(fnew->mask)) { 1898 ret = PTR_ERR(fnew->mask); 1899 } else if (fold && fold->mask != fnew->mask) { 1900 ret = -EINVAL; 1901 } else if (!refcount_inc_not_zero(&fnew->mask->refcnt)) { 1902 /* Mask was deleted concurrently, try again */ 1903 ret = -EAGAIN; 1904 } 1905 rcu_read_unlock(); 1906 return ret; 1907 1908 errout_cleanup: 1909 rhashtable_remove_fast(&head->ht, &mask->ht_node, 1910 mask_ht_params); 1911 return ret; 1912 } 1913 1914 static int fl_set_parms(struct net *net, struct tcf_proto *tp, 1915 struct cls_fl_filter *f, struct fl_flow_mask *mask, 1916 unsigned long base, struct nlattr **tb, 1917 struct nlattr *est, bool ovr, 1918 struct fl_flow_tmplt *tmplt, bool rtnl_held, 1919 struct netlink_ext_ack *extack) 1920 { 1921 int err; 1922 1923 err = tcf_exts_validate(net, tp, tb, est, &f->exts, ovr, rtnl_held, 1924 extack); 1925 if (err < 0) 1926 return err; 1927 1928 if (tb[TCA_FLOWER_CLASSID]) { 1929 f->res.classid = nla_get_u32(tb[TCA_FLOWER_CLASSID]); 1930 if (!rtnl_held) 1931 rtnl_lock(); 1932 tcf_bind_filter(tp, &f->res, base); 1933 if (!rtnl_held) 1934 rtnl_unlock(); 1935 } 1936 1937 err = fl_set_key(net, tb, &f->key, &mask->key, extack); 1938 if 
(err) 1939 return err; 1940 1941 fl_mask_update_range(mask); 1942 fl_set_masked_key(&f->mkey, &f->key, mask); 1943 1944 if (!fl_mask_fits_tmplt(tmplt, mask)) { 1945 NL_SET_ERR_MSG_MOD(extack, "Mask does not fit the template"); 1946 return -EINVAL; 1947 } 1948 1949 return 0; 1950 } 1951 1952 static int fl_ht_insert_unique(struct cls_fl_filter *fnew, 1953 struct cls_fl_filter *fold, 1954 bool *in_ht) 1955 { 1956 struct fl_flow_mask *mask = fnew->mask; 1957 int err; 1958 1959 err = rhashtable_lookup_insert_fast(&mask->ht, 1960 &fnew->ht_node, 1961 mask->filter_ht_params); 1962 if (err) { 1963 *in_ht = false; 1964 /* It is okay if filter with same key exists when 1965 * overwriting. 1966 */ 1967 return fold && err == -EEXIST ? 0 : err; 1968 } 1969 1970 *in_ht = true; 1971 return 0; 1972 } 1973 1974 static int fl_change(struct net *net, struct sk_buff *in_skb, 1975 struct tcf_proto *tp, unsigned long base, 1976 u32 handle, struct nlattr **tca, 1977 void **arg, bool ovr, bool rtnl_held, 1978 struct netlink_ext_ack *extack) 1979 { 1980 struct cls_fl_head *head = fl_head_dereference(tp); 1981 struct cls_fl_filter *fold = *arg; 1982 struct cls_fl_filter *fnew; 1983 struct fl_flow_mask *mask; 1984 struct nlattr **tb; 1985 bool in_ht; 1986 int err; 1987 1988 if (!tca[TCA_OPTIONS]) { 1989 err = -EINVAL; 1990 goto errout_fold; 1991 } 1992 1993 mask = kzalloc(sizeof(struct fl_flow_mask), GFP_KERNEL); 1994 if (!mask) { 1995 err = -ENOBUFS; 1996 goto errout_fold; 1997 } 1998 1999 tb = kcalloc(TCA_FLOWER_MAX + 1, sizeof(struct nlattr *), GFP_KERNEL); 2000 if (!tb) { 2001 err = -ENOBUFS; 2002 goto errout_mask_alloc; 2003 } 2004 2005 err = nla_parse_nested_deprecated(tb, TCA_FLOWER_MAX, 2006 tca[TCA_OPTIONS], fl_policy, NULL); 2007 if (err < 0) 2008 goto errout_tb; 2009 2010 if (fold && handle && fold->handle != handle) { 2011 err = -EINVAL; 2012 goto errout_tb; 2013 } 2014 2015 fnew = kzalloc(sizeof(*fnew), GFP_KERNEL); 2016 if (!fnew) { 2017 err = -ENOBUFS; 2018 goto errout_tb; 
2019 } 2020 INIT_LIST_HEAD(&fnew->hw_list); 2021 refcount_set(&fnew->refcnt, 1); 2022 2023 err = tcf_exts_init(&fnew->exts, net, TCA_FLOWER_ACT, 0); 2024 if (err < 0) 2025 goto errout; 2026 2027 if (tb[TCA_FLOWER_FLAGS]) { 2028 fnew->flags = nla_get_u32(tb[TCA_FLOWER_FLAGS]); 2029 2030 if (!tc_flags_valid(fnew->flags)) { 2031 err = -EINVAL; 2032 goto errout; 2033 } 2034 } 2035 2036 err = fl_set_parms(net, tp, fnew, mask, base, tb, tca[TCA_RATE], ovr, 2037 tp->chain->tmplt_priv, rtnl_held, extack); 2038 if (err) 2039 goto errout; 2040 2041 err = fl_check_assign_mask(head, fnew, fold, mask); 2042 if (err) 2043 goto errout; 2044 2045 err = fl_ht_insert_unique(fnew, fold, &in_ht); 2046 if (err) 2047 goto errout_mask; 2048 2049 if (!tc_skip_hw(fnew->flags)) { 2050 err = fl_hw_replace_filter(tp, fnew, rtnl_held, extack); 2051 if (err) 2052 goto errout_ht; 2053 } 2054 2055 if (!tc_in_hw(fnew->flags)) 2056 fnew->flags |= TCA_CLS_FLAGS_NOT_IN_HW; 2057 2058 spin_lock(&tp->lock); 2059 2060 /* tp was deleted concurrently. -EAGAIN will cause caller to lookup 2061 * proto again or create new one, if necessary. 2062 */ 2063 if (tp->deleting) { 2064 err = -EAGAIN; 2065 goto errout_hw; 2066 } 2067 2068 if (fold) { 2069 /* Fold filter was deleted concurrently. Retry lookup. 
*/ 2070 if (fold->deleted) { 2071 err = -EAGAIN; 2072 goto errout_hw; 2073 } 2074 2075 fnew->handle = handle; 2076 2077 if (!in_ht) { 2078 struct rhashtable_params params = 2079 fnew->mask->filter_ht_params; 2080 2081 err = rhashtable_insert_fast(&fnew->mask->ht, 2082 &fnew->ht_node, 2083 params); 2084 if (err) 2085 goto errout_hw; 2086 in_ht = true; 2087 } 2088 2089 refcount_inc(&fnew->refcnt); 2090 rhashtable_remove_fast(&fold->mask->ht, 2091 &fold->ht_node, 2092 fold->mask->filter_ht_params); 2093 idr_replace(&head->handle_idr, fnew, fnew->handle); 2094 list_replace_rcu(&fold->list, &fnew->list); 2095 fold->deleted = true; 2096 2097 spin_unlock(&tp->lock); 2098 2099 fl_mask_put(head, fold->mask); 2100 if (!tc_skip_hw(fold->flags)) 2101 fl_hw_destroy_filter(tp, fold, rtnl_held, NULL); 2102 tcf_unbind_filter(tp, &fold->res); 2103 /* Caller holds reference to fold, so refcnt is always > 0 2104 * after this. 2105 */ 2106 refcount_dec(&fold->refcnt); 2107 __fl_put(fold); 2108 } else { 2109 if (handle) { 2110 /* user specifies a handle and it doesn't exist */ 2111 err = idr_alloc_u32(&head->handle_idr, fnew, &handle, 2112 handle, GFP_ATOMIC); 2113 2114 /* Filter with specified handle was concurrently 2115 * inserted after initial check in cls_api. This is not 2116 * necessarily an error if NLM_F_EXCL is not set in 2117 * message flags. Returning EAGAIN will cause cls_api to 2118 * try to update concurrently inserted rule. 
2119 */ 2120 if (err == -ENOSPC) 2121 err = -EAGAIN; 2122 } else { 2123 handle = 1; 2124 err = idr_alloc_u32(&head->handle_idr, fnew, &handle, 2125 INT_MAX, GFP_ATOMIC); 2126 } 2127 if (err) 2128 goto errout_hw; 2129 2130 refcount_inc(&fnew->refcnt); 2131 fnew->handle = handle; 2132 list_add_tail_rcu(&fnew->list, &fnew->mask->filters); 2133 spin_unlock(&tp->lock); 2134 } 2135 2136 *arg = fnew; 2137 2138 kfree(tb); 2139 tcf_queue_work(&mask->rwork, fl_uninit_mask_free_work); 2140 return 0; 2141 2142 errout_ht: 2143 spin_lock(&tp->lock); 2144 errout_hw: 2145 fnew->deleted = true; 2146 spin_unlock(&tp->lock); 2147 if (!tc_skip_hw(fnew->flags)) 2148 fl_hw_destroy_filter(tp, fnew, rtnl_held, NULL); 2149 if (in_ht) 2150 rhashtable_remove_fast(&fnew->mask->ht, &fnew->ht_node, 2151 fnew->mask->filter_ht_params); 2152 errout_mask: 2153 fl_mask_put(head, fnew->mask); 2154 errout: 2155 __fl_put(fnew); 2156 errout_tb: 2157 kfree(tb); 2158 errout_mask_alloc: 2159 tcf_queue_work(&mask->rwork, fl_uninit_mask_free_work); 2160 errout_fold: 2161 if (fold) 2162 __fl_put(fold); 2163 return err; 2164 } 2165 2166 static int fl_delete(struct tcf_proto *tp, void *arg, bool *last, 2167 bool rtnl_held, struct netlink_ext_ack *extack) 2168 { 2169 struct cls_fl_head *head = fl_head_dereference(tp); 2170 struct cls_fl_filter *f = arg; 2171 bool last_on_mask; 2172 int err = 0; 2173 2174 err = __fl_delete(tp, f, &last_on_mask, rtnl_held, extack); 2175 *last = list_empty(&head->masks); 2176 __fl_put(f); 2177 2178 return err; 2179 } 2180 2181 static void fl_walk(struct tcf_proto *tp, struct tcf_walker *arg, 2182 bool rtnl_held) 2183 { 2184 struct cls_fl_head *head = fl_head_dereference(tp); 2185 unsigned long id = arg->cookie, tmp; 2186 struct cls_fl_filter *f; 2187 2188 arg->count = arg->skip; 2189 2190 idr_for_each_entry_continue_ul(&head->handle_idr, f, tmp, id) { 2191 /* don't return filters that are being deleted */ 2192 if (!refcount_inc_not_zero(&f->refcnt)) 2193 continue; 2194 if 
(arg->fn(tp, f, arg) < 0) { 2195 __fl_put(f); 2196 arg->stop = 1; 2197 break; 2198 } 2199 __fl_put(f); 2200 arg->count++; 2201 } 2202 arg->cookie = id; 2203 } 2204 2205 static struct cls_fl_filter * 2206 fl_get_next_hw_filter(struct tcf_proto *tp, struct cls_fl_filter *f, bool add) 2207 { 2208 struct cls_fl_head *head = fl_head_dereference(tp); 2209 2210 spin_lock(&tp->lock); 2211 if (list_empty(&head->hw_filters)) { 2212 spin_unlock(&tp->lock); 2213 return NULL; 2214 } 2215 2216 if (!f) 2217 f = list_entry(&head->hw_filters, struct cls_fl_filter, 2218 hw_list); 2219 list_for_each_entry_continue(f, &head->hw_filters, hw_list) { 2220 if (!(add && f->deleted) && refcount_inc_not_zero(&f->refcnt)) { 2221 spin_unlock(&tp->lock); 2222 return f; 2223 } 2224 } 2225 2226 spin_unlock(&tp->lock); 2227 return NULL; 2228 } 2229 2230 static int fl_reoffload(struct tcf_proto *tp, bool add, flow_setup_cb_t *cb, 2231 void *cb_priv, struct netlink_ext_ack *extack) 2232 { 2233 struct tcf_block *block = tp->chain->block; 2234 struct flow_cls_offload cls_flower = {}; 2235 struct cls_fl_filter *f = NULL; 2236 int err; 2237 2238 /* hw_filters list can only be changed by hw offload functions after 2239 * obtaining rtnl lock. Make sure it is not changed while reoffload is 2240 * iterating it. 2241 */ 2242 ASSERT_RTNL(); 2243 2244 while ((f = fl_get_next_hw_filter(tp, f, add))) { 2245 cls_flower.rule = 2246 flow_rule_alloc(tcf_exts_num_actions(&f->exts)); 2247 if (!cls_flower.rule) { 2248 __fl_put(f); 2249 return -ENOMEM; 2250 } 2251 2252 tc_cls_common_offload_init(&cls_flower.common, tp, f->flags, 2253 extack); 2254 cls_flower.command = add ? 
2255 FLOW_CLS_REPLACE : FLOW_CLS_DESTROY; 2256 cls_flower.cookie = (unsigned long)f; 2257 cls_flower.rule->match.dissector = &f->mask->dissector; 2258 cls_flower.rule->match.mask = &f->mask->key; 2259 cls_flower.rule->match.key = &f->mkey; 2260 2261 err = tc_setup_flow_action(&cls_flower.rule->action, &f->exts); 2262 if (err) { 2263 kfree(cls_flower.rule); 2264 if (tc_skip_sw(f->flags)) { 2265 NL_SET_ERR_MSG_MOD(extack, "Failed to setup flow action"); 2266 __fl_put(f); 2267 return err; 2268 } 2269 goto next_flow; 2270 } 2271 2272 cls_flower.classid = f->res.classid; 2273 2274 err = tc_setup_cb_reoffload(block, tp, add, cb, 2275 TC_SETUP_CLSFLOWER, &cls_flower, 2276 cb_priv, &f->flags, 2277 &f->in_hw_count); 2278 tc_cleanup_flow_action(&cls_flower.rule->action); 2279 kfree(cls_flower.rule); 2280 2281 if (err) { 2282 __fl_put(f); 2283 return err; 2284 } 2285 next_flow: 2286 __fl_put(f); 2287 } 2288 2289 return 0; 2290 } 2291 2292 static void fl_hw_add(struct tcf_proto *tp, void *type_data) 2293 { 2294 struct flow_cls_offload *cls_flower = type_data; 2295 struct cls_fl_filter *f = 2296 (struct cls_fl_filter *) cls_flower->cookie; 2297 struct cls_fl_head *head = fl_head_dereference(tp); 2298 2299 spin_lock(&tp->lock); 2300 list_add(&f->hw_list, &head->hw_filters); 2301 spin_unlock(&tp->lock); 2302 } 2303 2304 static void fl_hw_del(struct tcf_proto *tp, void *type_data) 2305 { 2306 struct flow_cls_offload *cls_flower = type_data; 2307 struct cls_fl_filter *f = 2308 (struct cls_fl_filter *) cls_flower->cookie; 2309 2310 spin_lock(&tp->lock); 2311 if (!list_empty(&f->hw_list)) 2312 list_del_init(&f->hw_list); 2313 spin_unlock(&tp->lock); 2314 } 2315 2316 static int fl_hw_create_tmplt(struct tcf_chain *chain, 2317 struct fl_flow_tmplt *tmplt) 2318 { 2319 struct flow_cls_offload cls_flower = {}; 2320 struct tcf_block *block = chain->block; 2321 2322 cls_flower.rule = flow_rule_alloc(0); 2323 if (!cls_flower.rule) 2324 return -ENOMEM; 2325 2326 cls_flower.common.chain_index 
= chain->index; 2327 cls_flower.command = FLOW_CLS_TMPLT_CREATE; 2328 cls_flower.cookie = (unsigned long) tmplt; 2329 cls_flower.rule->match.dissector = &tmplt->dissector; 2330 cls_flower.rule->match.mask = &tmplt->mask; 2331 cls_flower.rule->match.key = &tmplt->dummy_key; 2332 2333 /* We don't care if driver (any of them) fails to handle this 2334 * call. It serves just as a hint for it. 2335 */ 2336 tc_setup_cb_call(block, TC_SETUP_CLSFLOWER, &cls_flower, false, true); 2337 kfree(cls_flower.rule); 2338 2339 return 0; 2340 } 2341 2342 static void fl_hw_destroy_tmplt(struct tcf_chain *chain, 2343 struct fl_flow_tmplt *tmplt) 2344 { 2345 struct flow_cls_offload cls_flower = {}; 2346 struct tcf_block *block = chain->block; 2347 2348 cls_flower.common.chain_index = chain->index; 2349 cls_flower.command = FLOW_CLS_TMPLT_DESTROY; 2350 cls_flower.cookie = (unsigned long) tmplt; 2351 2352 tc_setup_cb_call(block, TC_SETUP_CLSFLOWER, &cls_flower, false, true); 2353 } 2354 2355 static void *fl_tmplt_create(struct net *net, struct tcf_chain *chain, 2356 struct nlattr **tca, 2357 struct netlink_ext_ack *extack) 2358 { 2359 struct fl_flow_tmplt *tmplt; 2360 struct nlattr **tb; 2361 int err; 2362 2363 if (!tca[TCA_OPTIONS]) 2364 return ERR_PTR(-EINVAL); 2365 2366 tb = kcalloc(TCA_FLOWER_MAX + 1, sizeof(struct nlattr *), GFP_KERNEL); 2367 if (!tb) 2368 return ERR_PTR(-ENOBUFS); 2369 err = nla_parse_nested_deprecated(tb, TCA_FLOWER_MAX, 2370 tca[TCA_OPTIONS], fl_policy, NULL); 2371 if (err) 2372 goto errout_tb; 2373 2374 tmplt = kzalloc(sizeof(*tmplt), GFP_KERNEL); 2375 if (!tmplt) { 2376 err = -ENOMEM; 2377 goto errout_tb; 2378 } 2379 tmplt->chain = chain; 2380 err = fl_set_key(net, tb, &tmplt->dummy_key, &tmplt->mask, extack); 2381 if (err) 2382 goto errout_tmplt; 2383 2384 fl_init_dissector(&tmplt->dissector, &tmplt->mask); 2385 2386 err = fl_hw_create_tmplt(chain, tmplt); 2387 if (err) 2388 goto errout_tmplt; 2389 2390 kfree(tb); 2391 return tmplt; 2392 2393 errout_tmplt: 2394 
kfree(tmplt); 2395 errout_tb: 2396 kfree(tb); 2397 return ERR_PTR(err); 2398 } 2399 2400 static void fl_tmplt_destroy(void *tmplt_priv) 2401 { 2402 struct fl_flow_tmplt *tmplt = tmplt_priv; 2403 2404 fl_hw_destroy_tmplt(tmplt->chain, tmplt); 2405 kfree(tmplt); 2406 } 2407 2408 static int fl_dump_key_val(struct sk_buff *skb, 2409 void *val, int val_type, 2410 void *mask, int mask_type, int len) 2411 { 2412 int err; 2413 2414 if (!memchr_inv(mask, 0, len)) 2415 return 0; 2416 err = nla_put(skb, val_type, len, val); 2417 if (err) 2418 return err; 2419 if (mask_type != TCA_FLOWER_UNSPEC) { 2420 err = nla_put(skb, mask_type, len, mask); 2421 if (err) 2422 return err; 2423 } 2424 return 0; 2425 } 2426 2427 static int fl_dump_key_port_range(struct sk_buff *skb, struct fl_flow_key *key, 2428 struct fl_flow_key *mask) 2429 { 2430 if (fl_dump_key_val(skb, &key->tp_range.tp_min.dst, 2431 TCA_FLOWER_KEY_PORT_DST_MIN, 2432 &mask->tp_range.tp_min.dst, TCA_FLOWER_UNSPEC, 2433 sizeof(key->tp_range.tp_min.dst)) || 2434 fl_dump_key_val(skb, &key->tp_range.tp_max.dst, 2435 TCA_FLOWER_KEY_PORT_DST_MAX, 2436 &mask->tp_range.tp_max.dst, TCA_FLOWER_UNSPEC, 2437 sizeof(key->tp_range.tp_max.dst)) || 2438 fl_dump_key_val(skb, &key->tp_range.tp_min.src, 2439 TCA_FLOWER_KEY_PORT_SRC_MIN, 2440 &mask->tp_range.tp_min.src, TCA_FLOWER_UNSPEC, 2441 sizeof(key->tp_range.tp_min.src)) || 2442 fl_dump_key_val(skb, &key->tp_range.tp_max.src, 2443 TCA_FLOWER_KEY_PORT_SRC_MAX, 2444 &mask->tp_range.tp_max.src, TCA_FLOWER_UNSPEC, 2445 sizeof(key->tp_range.tp_max.src))) 2446 return -1; 2447 2448 return 0; 2449 } 2450 2451 static int fl_dump_key_mpls_opt_lse(struct sk_buff *skb, 2452 struct flow_dissector_key_mpls *mpls_key, 2453 struct flow_dissector_key_mpls *mpls_mask, 2454 u8 lse_index) 2455 { 2456 struct flow_dissector_mpls_lse *lse_mask = &mpls_mask->ls[lse_index]; 2457 struct flow_dissector_mpls_lse *lse_key = &mpls_key->ls[lse_index]; 2458 int err; 2459 2460 err = nla_put_u8(skb, 
TCA_FLOWER_KEY_MPLS_OPT_LSE_DEPTH, 2461 lse_index + 1); 2462 if (err) 2463 return err; 2464 2465 if (lse_mask->mpls_ttl) { 2466 err = nla_put_u8(skb, TCA_FLOWER_KEY_MPLS_OPT_LSE_TTL, 2467 lse_key->mpls_ttl); 2468 if (err) 2469 return err; 2470 } 2471 if (lse_mask->mpls_bos) { 2472 err = nla_put_u8(skb, TCA_FLOWER_KEY_MPLS_OPT_LSE_BOS, 2473 lse_key->mpls_bos); 2474 if (err) 2475 return err; 2476 } 2477 if (lse_mask->mpls_tc) { 2478 err = nla_put_u8(skb, TCA_FLOWER_KEY_MPLS_OPT_LSE_TC, 2479 lse_key->mpls_tc); 2480 if (err) 2481 return err; 2482 } 2483 if (lse_mask->mpls_label) { 2484 err = nla_put_u32(skb, TCA_FLOWER_KEY_MPLS_OPT_LSE_LABEL, 2485 lse_key->mpls_label); 2486 if (err) 2487 return err; 2488 } 2489 2490 return 0; 2491 } 2492 2493 static int fl_dump_key_mpls_opts(struct sk_buff *skb, 2494 struct flow_dissector_key_mpls *mpls_key, 2495 struct flow_dissector_key_mpls *mpls_mask) 2496 { 2497 struct nlattr *opts; 2498 struct nlattr *lse; 2499 u8 lse_index; 2500 int err; 2501 2502 opts = nla_nest_start(skb, TCA_FLOWER_KEY_MPLS_OPTS); 2503 if (!opts) 2504 return -EMSGSIZE; 2505 2506 for (lse_index = 0; lse_index < FLOW_DIS_MPLS_MAX; lse_index++) { 2507 if (!(mpls_mask->used_lses & 1 << lse_index)) 2508 continue; 2509 2510 lse = nla_nest_start(skb, TCA_FLOWER_KEY_MPLS_OPTS_LSE); 2511 if (!lse) { 2512 err = -EMSGSIZE; 2513 goto err_opts; 2514 } 2515 2516 err = fl_dump_key_mpls_opt_lse(skb, mpls_key, mpls_mask, 2517 lse_index); 2518 if (err) 2519 goto err_opts_lse; 2520 nla_nest_end(skb, lse); 2521 } 2522 nla_nest_end(skb, opts); 2523 2524 return 0; 2525 2526 err_opts_lse: 2527 nla_nest_cancel(skb, lse); 2528 err_opts: 2529 nla_nest_cancel(skb, opts); 2530 2531 return err; 2532 } 2533 2534 static int fl_dump_key_mpls(struct sk_buff *skb, 2535 struct flow_dissector_key_mpls *mpls_key, 2536 struct flow_dissector_key_mpls *mpls_mask) 2537 { 2538 struct flow_dissector_mpls_lse *lse_mask; 2539 struct flow_dissector_mpls_lse *lse_key; 2540 int err; 2541 2542 if 
(!mpls_mask->used_lses) 2543 return 0; 2544 2545 lse_mask = &mpls_mask->ls[0]; 2546 lse_key = &mpls_key->ls[0]; 2547 2548 /* For backward compatibility, don't use the MPLS nested attributes if 2549 * the rule can be expressed using the old attributes. 2550 */ 2551 if (mpls_mask->used_lses & ~1 || 2552 (!lse_mask->mpls_ttl && !lse_mask->mpls_bos && 2553 !lse_mask->mpls_tc && !lse_mask->mpls_label)) 2554 return fl_dump_key_mpls_opts(skb, mpls_key, mpls_mask); 2555 2556 if (lse_mask->mpls_ttl) { 2557 err = nla_put_u8(skb, TCA_FLOWER_KEY_MPLS_TTL, 2558 lse_key->mpls_ttl); 2559 if (err) 2560 return err; 2561 } 2562 if (lse_mask->mpls_tc) { 2563 err = nla_put_u8(skb, TCA_FLOWER_KEY_MPLS_TC, 2564 lse_key->mpls_tc); 2565 if (err) 2566 return err; 2567 } 2568 if (lse_mask->mpls_label) { 2569 err = nla_put_u32(skb, TCA_FLOWER_KEY_MPLS_LABEL, 2570 lse_key->mpls_label); 2571 if (err) 2572 return err; 2573 } 2574 if (lse_mask->mpls_bos) { 2575 err = nla_put_u8(skb, TCA_FLOWER_KEY_MPLS_BOS, 2576 lse_key->mpls_bos); 2577 if (err) 2578 return err; 2579 } 2580 return 0; 2581 } 2582 2583 static int fl_dump_key_ip(struct sk_buff *skb, bool encap, 2584 struct flow_dissector_key_ip *key, 2585 struct flow_dissector_key_ip *mask) 2586 { 2587 int tos_key = encap ? TCA_FLOWER_KEY_ENC_IP_TOS : TCA_FLOWER_KEY_IP_TOS; 2588 int ttl_key = encap ? TCA_FLOWER_KEY_ENC_IP_TTL : TCA_FLOWER_KEY_IP_TTL; 2589 int tos_mask = encap ? TCA_FLOWER_KEY_ENC_IP_TOS_MASK : TCA_FLOWER_KEY_IP_TOS_MASK; 2590 int ttl_mask = encap ? 
TCA_FLOWER_KEY_ENC_IP_TTL_MASK : TCA_FLOWER_KEY_IP_TTL_MASK; 2591 2592 if (fl_dump_key_val(skb, &key->tos, tos_key, &mask->tos, tos_mask, sizeof(key->tos)) || 2593 fl_dump_key_val(skb, &key->ttl, ttl_key, &mask->ttl, ttl_mask, sizeof(key->ttl))) 2594 return -1; 2595 2596 return 0; 2597 } 2598 2599 static int fl_dump_key_vlan(struct sk_buff *skb, 2600 int vlan_id_key, int vlan_prio_key, 2601 struct flow_dissector_key_vlan *vlan_key, 2602 struct flow_dissector_key_vlan *vlan_mask) 2603 { 2604 int err; 2605 2606 if (!memchr_inv(vlan_mask, 0, sizeof(*vlan_mask))) 2607 return 0; 2608 if (vlan_mask->vlan_id) { 2609 err = nla_put_u16(skb, vlan_id_key, 2610 vlan_key->vlan_id); 2611 if (err) 2612 return err; 2613 } 2614 if (vlan_mask->vlan_priority) { 2615 err = nla_put_u8(skb, vlan_prio_key, 2616 vlan_key->vlan_priority); 2617 if (err) 2618 return err; 2619 } 2620 return 0; 2621 } 2622 2623 static void fl_get_key_flag(u32 dissector_key, u32 dissector_mask, 2624 u32 *flower_key, u32 *flower_mask, 2625 u32 flower_flag_bit, u32 dissector_flag_bit) 2626 { 2627 if (dissector_mask & dissector_flag_bit) { 2628 *flower_mask |= flower_flag_bit; 2629 if (dissector_key & dissector_flag_bit) 2630 *flower_key |= flower_flag_bit; 2631 } 2632 } 2633 2634 static int fl_dump_key_flags(struct sk_buff *skb, u32 flags_key, u32 flags_mask) 2635 { 2636 u32 key, mask; 2637 __be32 _key, _mask; 2638 int err; 2639 2640 if (!memchr_inv(&flags_mask, 0, sizeof(flags_mask))) 2641 return 0; 2642 2643 key = 0; 2644 mask = 0; 2645 2646 fl_get_key_flag(flags_key, flags_mask, &key, &mask, 2647 TCA_FLOWER_KEY_FLAGS_IS_FRAGMENT, FLOW_DIS_IS_FRAGMENT); 2648 fl_get_key_flag(flags_key, flags_mask, &key, &mask, 2649 TCA_FLOWER_KEY_FLAGS_FRAG_IS_FIRST, 2650 FLOW_DIS_FIRST_FRAG); 2651 2652 _key = cpu_to_be32(key); 2653 _mask = cpu_to_be32(mask); 2654 2655 err = nla_put(skb, TCA_FLOWER_KEY_FLAGS, 4, &_key); 2656 if (err) 2657 return err; 2658 2659 return nla_put(skb, TCA_FLOWER_KEY_FLAGS_MASK, 4, &_mask); 2660 } 
2661 2662 static int fl_dump_key_geneve_opt(struct sk_buff *skb, 2663 struct flow_dissector_key_enc_opts *enc_opts) 2664 { 2665 struct geneve_opt *opt; 2666 struct nlattr *nest; 2667 int opt_off = 0; 2668 2669 nest = nla_nest_start_noflag(skb, TCA_FLOWER_KEY_ENC_OPTS_GENEVE); 2670 if (!nest) 2671 goto nla_put_failure; 2672 2673 while (enc_opts->len > opt_off) { 2674 opt = (struct geneve_opt *)&enc_opts->data[opt_off]; 2675 2676 if (nla_put_be16(skb, TCA_FLOWER_KEY_ENC_OPT_GENEVE_CLASS, 2677 opt->opt_class)) 2678 goto nla_put_failure; 2679 if (nla_put_u8(skb, TCA_FLOWER_KEY_ENC_OPT_GENEVE_TYPE, 2680 opt->type)) 2681 goto nla_put_failure; 2682 if (nla_put(skb, TCA_FLOWER_KEY_ENC_OPT_GENEVE_DATA, 2683 opt->length * 4, opt->opt_data)) 2684 goto nla_put_failure; 2685 2686 opt_off += sizeof(struct geneve_opt) + opt->length * 4; 2687 } 2688 nla_nest_end(skb, nest); 2689 return 0; 2690 2691 nla_put_failure: 2692 nla_nest_cancel(skb, nest); 2693 return -EMSGSIZE; 2694 } 2695 2696 static int fl_dump_key_vxlan_opt(struct sk_buff *skb, 2697 struct flow_dissector_key_enc_opts *enc_opts) 2698 { 2699 struct vxlan_metadata *md; 2700 struct nlattr *nest; 2701 2702 nest = nla_nest_start_noflag(skb, TCA_FLOWER_KEY_ENC_OPTS_VXLAN); 2703 if (!nest) 2704 goto nla_put_failure; 2705 2706 md = (struct vxlan_metadata *)&enc_opts->data[0]; 2707 if (nla_put_u32(skb, TCA_FLOWER_KEY_ENC_OPT_VXLAN_GBP, md->gbp)) 2708 goto nla_put_failure; 2709 2710 nla_nest_end(skb, nest); 2711 return 0; 2712 2713 nla_put_failure: 2714 nla_nest_cancel(skb, nest); 2715 return -EMSGSIZE; 2716 } 2717 2718 static int fl_dump_key_erspan_opt(struct sk_buff *skb, 2719 struct flow_dissector_key_enc_opts *enc_opts) 2720 { 2721 struct erspan_metadata *md; 2722 struct nlattr *nest; 2723 2724 nest = nla_nest_start_noflag(skb, TCA_FLOWER_KEY_ENC_OPTS_ERSPAN); 2725 if (!nest) 2726 goto nla_put_failure; 2727 2728 md = (struct erspan_metadata *)&enc_opts->data[0]; 2729 if (nla_put_u8(skb, TCA_FLOWER_KEY_ENC_OPT_ERSPAN_VER, 
md->version)) 2730 goto nla_put_failure; 2731 2732 if (md->version == 1 && 2733 nla_put_be32(skb, TCA_FLOWER_KEY_ENC_OPT_ERSPAN_INDEX, md->u.index)) 2734 goto nla_put_failure; 2735 2736 if (md->version == 2 && 2737 (nla_put_u8(skb, TCA_FLOWER_KEY_ENC_OPT_ERSPAN_DIR, 2738 md->u.md2.dir) || 2739 nla_put_u8(skb, TCA_FLOWER_KEY_ENC_OPT_ERSPAN_HWID, 2740 get_hwid(&md->u.md2)))) 2741 goto nla_put_failure; 2742 2743 nla_nest_end(skb, nest); 2744 return 0; 2745 2746 nla_put_failure: 2747 nla_nest_cancel(skb, nest); 2748 return -EMSGSIZE; 2749 } 2750 2751 static int fl_dump_key_ct(struct sk_buff *skb, 2752 struct flow_dissector_key_ct *key, 2753 struct flow_dissector_key_ct *mask) 2754 { 2755 if (IS_ENABLED(CONFIG_NF_CONNTRACK) && 2756 fl_dump_key_val(skb, &key->ct_state, TCA_FLOWER_KEY_CT_STATE, 2757 &mask->ct_state, TCA_FLOWER_KEY_CT_STATE_MASK, 2758 sizeof(key->ct_state))) 2759 goto nla_put_failure; 2760 2761 if (IS_ENABLED(CONFIG_NF_CONNTRACK_ZONES) && 2762 fl_dump_key_val(skb, &key->ct_zone, TCA_FLOWER_KEY_CT_ZONE, 2763 &mask->ct_zone, TCA_FLOWER_KEY_CT_ZONE_MASK, 2764 sizeof(key->ct_zone))) 2765 goto nla_put_failure; 2766 2767 if (IS_ENABLED(CONFIG_NF_CONNTRACK_MARK) && 2768 fl_dump_key_val(skb, &key->ct_mark, TCA_FLOWER_KEY_CT_MARK, 2769 &mask->ct_mark, TCA_FLOWER_KEY_CT_MARK_MASK, 2770 sizeof(key->ct_mark))) 2771 goto nla_put_failure; 2772 2773 if (IS_ENABLED(CONFIG_NF_CONNTRACK_LABELS) && 2774 fl_dump_key_val(skb, &key->ct_labels, TCA_FLOWER_KEY_CT_LABELS, 2775 &mask->ct_labels, TCA_FLOWER_KEY_CT_LABELS_MASK, 2776 sizeof(key->ct_labels))) 2777 goto nla_put_failure; 2778 2779 return 0; 2780 2781 nla_put_failure: 2782 return -EMSGSIZE; 2783 } 2784 2785 static int fl_dump_key_options(struct sk_buff *skb, int enc_opt_type, 2786 struct flow_dissector_key_enc_opts *enc_opts) 2787 { 2788 struct nlattr *nest; 2789 int err; 2790 2791 if (!enc_opts->len) 2792 return 0; 2793 2794 nest = nla_nest_start_noflag(skb, enc_opt_type); 2795 if (!nest) 2796 goto nla_put_failure; 2797 
/* Dump a flower key/mask pair into @skb as TCA_FLOWER_* netlink attributes.
 *
 * Most fields go through fl_dump_key_val(), which writes nothing when the
 * field's mask is all zero. Which protocol-specific groups are attempted is
 * decided from values in @key (n_proto, ip_proto, addr_type), not from @mask.
 *
 * Returns 0 on success. Any failure of a helper or nla_put*() call is
 * reported as -EMSGSIZE, whatever value the helper itself returned.
 */
static int fl_dump_key(struct sk_buff *skb, struct net *net,
		       struct fl_flow_key *key, struct fl_flow_key *mask)
{
	/* Ingress device is dumped by name; a device that can no longer be
	 * found is silently omitted.
	 * NOTE(review): __dev_get_by_index() presumably expects RTNL to be
	 * held by the caller - confirm.
	 */
	if (mask->meta.ingress_ifindex) {
		struct net_device *dev;

		dev = __dev_get_by_index(net, key->meta.ingress_ifindex);
		if (dev && nla_put_string(skb, TCA_FLOWER_INDEV, dev->name))
			goto nla_put_failure;
	}

	/* Ethernet addresses and ethertype (the latter has no mask attribute). */
	if (fl_dump_key_val(skb, key->eth.dst, TCA_FLOWER_KEY_ETH_DST,
			    mask->eth.dst, TCA_FLOWER_KEY_ETH_DST_MASK,
			    sizeof(key->eth.dst)) ||
	    fl_dump_key_val(skb, key->eth.src, TCA_FLOWER_KEY_ETH_SRC,
			    mask->eth.src, TCA_FLOWER_KEY_ETH_SRC_MASK,
			    sizeof(key->eth.src)) ||
	    fl_dump_key_val(skb, &key->basic.n_proto, TCA_FLOWER_KEY_ETH_TYPE,
			    &mask->basic.n_proto, TCA_FLOWER_UNSPEC,
			    sizeof(key->basic.n_proto)))
		goto nla_put_failure;

	if (fl_dump_key_mpls(skb, &key->mpls, &mask->mpls))
		goto nla_put_failure;

	/* Outer VLAN tag. */
	if (fl_dump_key_vlan(skb, TCA_FLOWER_KEY_VLAN_ID,
			     TCA_FLOWER_KEY_VLAN_PRIO, &key->vlan, &mask->vlan))
		goto nla_put_failure;

	/* Inner (customer) VLAN tag; when it is matched, its TPID is reported
	 * through TCA_FLOWER_KEY_VLAN_ETH_TYPE.
	 */
	if (fl_dump_key_vlan(skb, TCA_FLOWER_KEY_CVLAN_ID,
			     TCA_FLOWER_KEY_CVLAN_PRIO,
			     &key->cvlan, &mask->cvlan) ||
	    (mask->cvlan.vlan_tpid &&
	     nla_put_be16(skb, TCA_FLOWER_KEY_VLAN_ETH_TYPE,
			  key->cvlan.vlan_tpid)))
		goto nla_put_failure;

	/* With VLAN tags present, n_proto is additionally reported as the
	 * ethertype of the innermost matched tag level.
	 */
	if (mask->basic.n_proto) {
		if (mask->cvlan.vlan_tpid) {
			if (nla_put_be16(skb, TCA_FLOWER_KEY_CVLAN_ETH_TYPE,
					 key->basic.n_proto))
				goto nla_put_failure;
		} else if (mask->vlan.vlan_tpid) {
			if (nla_put_be16(skb, TCA_FLOWER_KEY_VLAN_ETH_TYPE,
					 key->basic.n_proto))
				goto nla_put_failure;
		}
	}

	/* IP protocol number and TOS/TTL, for IPv4 and IPv6 keys only. */
	if ((key->basic.n_proto == htons(ETH_P_IP) ||
	     key->basic.n_proto == htons(ETH_P_IPV6)) &&
	    (fl_dump_key_val(skb, &key->basic.ip_proto, TCA_FLOWER_KEY_IP_PROTO,
			    &mask->basic.ip_proto, TCA_FLOWER_UNSPEC,
			    sizeof(key->basic.ip_proto)) ||
	    fl_dump_key_ip(skb, false, &key->ip, &mask->ip)))
		goto nla_put_failure;

	/* Source/destination addresses, selected by the control addr_type. */
	if (key->control.addr_type == FLOW_DISSECTOR_KEY_IPV4_ADDRS &&
	    (fl_dump_key_val(skb, &key->ipv4.src, TCA_FLOWER_KEY_IPV4_SRC,
			     &mask->ipv4.src, TCA_FLOWER_KEY_IPV4_SRC_MASK,
			     sizeof(key->ipv4.src)) ||
	     fl_dump_key_val(skb, &key->ipv4.dst, TCA_FLOWER_KEY_IPV4_DST,
			     &mask->ipv4.dst, TCA_FLOWER_KEY_IPV4_DST_MASK,
			     sizeof(key->ipv4.dst))))
		goto nla_put_failure;
	else if (key->control.addr_type == FLOW_DISSECTOR_KEY_IPV6_ADDRS &&
		 (fl_dump_key_val(skb, &key->ipv6.src, TCA_FLOWER_KEY_IPV6_SRC,
				  &mask->ipv6.src, TCA_FLOWER_KEY_IPV6_SRC_MASK,
				  sizeof(key->ipv6.src)) ||
		  fl_dump_key_val(skb, &key->ipv6.dst, TCA_FLOWER_KEY_IPV6_DST,
				  &mask->ipv6.dst, TCA_FLOWER_KEY_IPV6_DST_MASK,
				  sizeof(key->ipv6.dst))))
		goto nla_put_failure;

	/* Exactly one protocol-specific group is attempted: TCP, UDP, SCTP,
	 * ICMPv4, ICMPv6 or ARP/RARP. Each branch jumps to the failure label
	 * only if one of its dumps fails; otherwise the chain simply ends.
	 */
	if (key->basic.ip_proto == IPPROTO_TCP &&
	    (fl_dump_key_val(skb, &key->tp.src, TCA_FLOWER_KEY_TCP_SRC,
			     &mask->tp.src, TCA_FLOWER_KEY_TCP_SRC_MASK,
			     sizeof(key->tp.src)) ||
	     fl_dump_key_val(skb, &key->tp.dst, TCA_FLOWER_KEY_TCP_DST,
			     &mask->tp.dst, TCA_FLOWER_KEY_TCP_DST_MASK,
			     sizeof(key->tp.dst)) ||
	     fl_dump_key_val(skb, &key->tcp.flags, TCA_FLOWER_KEY_TCP_FLAGS,
			     &mask->tcp.flags, TCA_FLOWER_KEY_TCP_FLAGS_MASK,
			     sizeof(key->tcp.flags))))
		goto nla_put_failure;
	else if (key->basic.ip_proto == IPPROTO_UDP &&
		 (fl_dump_key_val(skb, &key->tp.src, TCA_FLOWER_KEY_UDP_SRC,
				  &mask->tp.src, TCA_FLOWER_KEY_UDP_SRC_MASK,
				  sizeof(key->tp.src)) ||
		  fl_dump_key_val(skb, &key->tp.dst, TCA_FLOWER_KEY_UDP_DST,
				  &mask->tp.dst, TCA_FLOWER_KEY_UDP_DST_MASK,
				  sizeof(key->tp.dst))))
		goto nla_put_failure;
	else if (key->basic.ip_proto == IPPROTO_SCTP &&
		 (fl_dump_key_val(skb, &key->tp.src, TCA_FLOWER_KEY_SCTP_SRC,
				  &mask->tp.src, TCA_FLOWER_KEY_SCTP_SRC_MASK,
				  sizeof(key->tp.src)) ||
		  fl_dump_key_val(skb, &key->tp.dst, TCA_FLOWER_KEY_SCTP_DST,
				  &mask->tp.dst, TCA_FLOWER_KEY_SCTP_DST_MASK,
				  sizeof(key->tp.dst))))
		goto nla_put_failure;
	else if (key->basic.n_proto == htons(ETH_P_IP) &&
		 key->basic.ip_proto == IPPROTO_ICMP &&
		 (fl_dump_key_val(skb, &key->icmp.type,
				  TCA_FLOWER_KEY_ICMPV4_TYPE, &mask->icmp.type,
				  TCA_FLOWER_KEY_ICMPV4_TYPE_MASK,
				  sizeof(key->icmp.type)) ||
		  fl_dump_key_val(skb, &key->icmp.code,
				  TCA_FLOWER_KEY_ICMPV4_CODE, &mask->icmp.code,
				  TCA_FLOWER_KEY_ICMPV4_CODE_MASK,
				  sizeof(key->icmp.code))))
		goto nla_put_failure;
	else if (key->basic.n_proto == htons(ETH_P_IPV6) &&
		 key->basic.ip_proto == IPPROTO_ICMPV6 &&
		 (fl_dump_key_val(skb, &key->icmp.type,
				  TCA_FLOWER_KEY_ICMPV6_TYPE, &mask->icmp.type,
				  TCA_FLOWER_KEY_ICMPV6_TYPE_MASK,
				  sizeof(key->icmp.type)) ||
		  fl_dump_key_val(skb, &key->icmp.code,
				  TCA_FLOWER_KEY_ICMPV6_CODE, &mask->icmp.code,
				  TCA_FLOWER_KEY_ICMPV6_CODE_MASK,
				  sizeof(key->icmp.code))))
		goto nla_put_failure;
	else if ((key->basic.n_proto == htons(ETH_P_ARP) ||
		  key->basic.n_proto == htons(ETH_P_RARP)) &&
		 (fl_dump_key_val(skb, &key->arp.sip,
				  TCA_FLOWER_KEY_ARP_SIP, &mask->arp.sip,
				  TCA_FLOWER_KEY_ARP_SIP_MASK,
				  sizeof(key->arp.sip)) ||
		  fl_dump_key_val(skb, &key->arp.tip,
				  TCA_FLOWER_KEY_ARP_TIP, &mask->arp.tip,
				  TCA_FLOWER_KEY_ARP_TIP_MASK,
				  sizeof(key->arp.tip)) ||
		  fl_dump_key_val(skb, &key->arp.op,
				  TCA_FLOWER_KEY_ARP_OP, &mask->arp.op,
				  TCA_FLOWER_KEY_ARP_OP_MASK,
				  sizeof(key->arp.op)) ||
		  fl_dump_key_val(skb, key->arp.sha, TCA_FLOWER_KEY_ARP_SHA,
				  mask->arp.sha, TCA_FLOWER_KEY_ARP_SHA_MASK,
				  sizeof(key->arp.sha)) ||
		  fl_dump_key_val(skb, key->arp.tha, TCA_FLOWER_KEY_ARP_THA,
				  mask->arp.tha, TCA_FLOWER_KEY_ARP_THA_MASK,
				  sizeof(key->arp.tha))))
		goto nla_put_failure;

	/* Port ranges are dumped in addition to the exact ports above. */
	if ((key->basic.ip_proto == IPPROTO_TCP ||
	     key->basic.ip_proto == IPPROTO_UDP ||
	     key->basic.ip_proto == IPPROTO_SCTP) &&
	     fl_dump_key_port_range(skb, key, mask))
		goto nla_put_failure;

	/* Tunnel (encapsulation) addresses, selected by enc_control addr_type. */
	if (key->enc_control.addr_type == FLOW_DISSECTOR_KEY_IPV4_ADDRS &&
	    (fl_dump_key_val(skb, &key->enc_ipv4.src,
			    TCA_FLOWER_KEY_ENC_IPV4_SRC, &mask->enc_ipv4.src,
			    TCA_FLOWER_KEY_ENC_IPV4_SRC_MASK,
			    sizeof(key->enc_ipv4.src)) ||
	     fl_dump_key_val(skb, &key->enc_ipv4.dst,
			     TCA_FLOWER_KEY_ENC_IPV4_DST, &mask->enc_ipv4.dst,
			     TCA_FLOWER_KEY_ENC_IPV4_DST_MASK,
			     sizeof(key->enc_ipv4.dst))))
		goto nla_put_failure;
	else if (key->enc_control.addr_type == FLOW_DISSECTOR_KEY_IPV6_ADDRS &&
		 (fl_dump_key_val(skb, &key->enc_ipv6.src,
			    TCA_FLOWER_KEY_ENC_IPV6_SRC, &mask->enc_ipv6.src,
			    TCA_FLOWER_KEY_ENC_IPV6_SRC_MASK,
			    sizeof(key->enc_ipv6.src)) ||
		 fl_dump_key_val(skb, &key->enc_ipv6.dst,
				 TCA_FLOWER_KEY_ENC_IPV6_DST,
				 &mask->enc_ipv6.dst,
				 TCA_FLOWER_KEY_ENC_IPV6_DST_MASK,
			    sizeof(key->enc_ipv6.dst))))
		goto nla_put_failure;

	/* Remaining tunnel fields: key id, UDP ports, TOS/TTL and options. */
	if (fl_dump_key_val(skb, &key->enc_key_id, TCA_FLOWER_KEY_ENC_KEY_ID,
			    &mask->enc_key_id, TCA_FLOWER_UNSPEC,
			    sizeof(key->enc_key_id)) ||
	    fl_dump_key_val(skb, &key->enc_tp.src,
			    TCA_FLOWER_KEY_ENC_UDP_SRC_PORT,
			    &mask->enc_tp.src,
			    TCA_FLOWER_KEY_ENC_UDP_SRC_PORT_MASK,
			    sizeof(key->enc_tp.src)) ||
	    fl_dump_key_val(skb, &key->enc_tp.dst,
			    TCA_FLOWER_KEY_ENC_UDP_DST_PORT,
			    &mask->enc_tp.dst,
			    TCA_FLOWER_KEY_ENC_UDP_DST_PORT_MASK,
			    sizeof(key->enc_tp.dst)) ||
	    fl_dump_key_ip(skb, true, &key->enc_ip, &mask->enc_ip) ||
	    fl_dump_key_enc_opt(skb, &key->enc_opts, &mask->enc_opts))
		goto nla_put_failure;

	if (fl_dump_key_ct(skb, &key->ct, &mask->ct))
		goto nla_put_failure;

	if (fl_dump_key_flags(skb, key->control.flags, mask->control.flags))
		goto nla_put_failure;

	if (fl_dump_key_val(skb, &key->hash.hash, TCA_FLOWER_KEY_HASH,
			     &mask->hash.hash, TCA_FLOWER_KEY_HASH_MASK,
			     sizeof(key->hash.hash)))
		goto nla_put_failure;

	return 0;

nla_put_failure:
	return -EMSGSIZE;
}
nla_put_failure_locked; 3077 3078 spin_unlock(&tp->lock); 3079 3080 if (!skip_hw) 3081 fl_hw_update_stats(tp, f, rtnl_held); 3082 3083 if (nla_put_u32(skb, TCA_FLOWER_IN_HW_COUNT, f->in_hw_count)) 3084 goto nla_put_failure; 3085 3086 if (tcf_exts_dump(skb, &f->exts)) 3087 goto nla_put_failure; 3088 3089 nla_nest_end(skb, nest); 3090 3091 if (tcf_exts_dump_stats(skb, &f->exts) < 0) 3092 goto nla_put_failure; 3093 3094 return skb->len; 3095 3096 nla_put_failure_locked: 3097 spin_unlock(&tp->lock); 3098 nla_put_failure: 3099 nla_nest_cancel(skb, nest); 3100 return -1; 3101 } 3102 3103 static int fl_terse_dump(struct net *net, struct tcf_proto *tp, void *fh, 3104 struct sk_buff *skb, struct tcmsg *t, bool rtnl_held) 3105 { 3106 struct cls_fl_filter *f = fh; 3107 struct nlattr *nest; 3108 bool skip_hw; 3109 3110 if (!f) 3111 return skb->len; 3112 3113 t->tcm_handle = f->handle; 3114 3115 nest = nla_nest_start_noflag(skb, TCA_OPTIONS); 3116 if (!nest) 3117 goto nla_put_failure; 3118 3119 spin_lock(&tp->lock); 3120 3121 skip_hw = tc_skip_hw(f->flags); 3122 3123 if (f->flags && nla_put_u32(skb, TCA_FLOWER_FLAGS, f->flags)) 3124 goto nla_put_failure_locked; 3125 3126 spin_unlock(&tp->lock); 3127 3128 if (!skip_hw) 3129 fl_hw_update_stats(tp, f, rtnl_held); 3130 3131 if (tcf_exts_terse_dump(skb, &f->exts)) 3132 goto nla_put_failure; 3133 3134 nla_nest_end(skb, nest); 3135 3136 return skb->len; 3137 3138 nla_put_failure_locked: 3139 spin_unlock(&tp->lock); 3140 nla_put_failure: 3141 nla_nest_cancel(skb, nest); 3142 return -1; 3143 } 3144 3145 static int fl_tmplt_dump(struct sk_buff *skb, struct net *net, void *tmplt_priv) 3146 { 3147 struct fl_flow_tmplt *tmplt = tmplt_priv; 3148 struct fl_flow_key *key, *mask; 3149 struct nlattr *nest; 3150 3151 nest = nla_nest_start_noflag(skb, TCA_OPTIONS); 3152 if (!nest) 3153 goto nla_put_failure; 3154 3155 key = &tmplt->dummy_key; 3156 mask = &tmplt->mask; 3157 3158 if (fl_dump_key(skb, net, key, mask)) 3159 goto nla_put_failure; 3160 
3161 nla_nest_end(skb, nest); 3162 3163 return skb->len; 3164 3165 nla_put_failure: 3166 nla_nest_cancel(skb, nest); 3167 return -EMSGSIZE; 3168 } 3169 3170 static void fl_bind_class(void *fh, u32 classid, unsigned long cl, void *q, 3171 unsigned long base) 3172 { 3173 struct cls_fl_filter *f = fh; 3174 3175 if (f && f->res.classid == classid) { 3176 if (cl) 3177 __tcf_bind_filter(q, &f->res, base); 3178 else 3179 __tcf_unbind_filter(q, &f->res); 3180 } 3181 } 3182 3183 static bool fl_delete_empty(struct tcf_proto *tp) 3184 { 3185 struct cls_fl_head *head = fl_head_dereference(tp); 3186 3187 spin_lock(&tp->lock); 3188 tp->deleting = idr_is_empty(&head->handle_idr); 3189 spin_unlock(&tp->lock); 3190 3191 return tp->deleting; 3192 } 3193 3194 static struct tcf_proto_ops cls_fl_ops __read_mostly = { 3195 .kind = "flower", 3196 .classify = fl_classify, 3197 .init = fl_init, 3198 .destroy = fl_destroy, 3199 .get = fl_get, 3200 .put = fl_put, 3201 .change = fl_change, 3202 .delete = fl_delete, 3203 .delete_empty = fl_delete_empty, 3204 .walk = fl_walk, 3205 .reoffload = fl_reoffload, 3206 .hw_add = fl_hw_add, 3207 .hw_del = fl_hw_del, 3208 .dump = fl_dump, 3209 .terse_dump = fl_terse_dump, 3210 .bind_class = fl_bind_class, 3211 .tmplt_create = fl_tmplt_create, 3212 .tmplt_destroy = fl_tmplt_destroy, 3213 .tmplt_dump = fl_tmplt_dump, 3214 .owner = THIS_MODULE, 3215 .flags = TCF_PROTO_OPS_DOIT_UNLOCKED, 3216 }; 3217 3218 static int __init cls_fl_init(void) 3219 { 3220 return register_tcf_proto_ops(&cls_fl_ops); 3221 } 3222 3223 static void __exit cls_fl_exit(void) 3224 { 3225 unregister_tcf_proto_ops(&cls_fl_ops); 3226 } 3227 3228 module_init(cls_fl_init); 3229 module_exit(cls_fl_exit); 3230 3231 MODULE_AUTHOR("Jiri Pirko <jiri@resnulli.us>"); 3232 MODULE_DESCRIPTION("Flower classifier"); 3233 MODULE_LICENSE("GPL v2"); 3234