1 /* Broadcom NetXtreme-C/E network driver.
2 *
3 * Copyright (c) 2017 Broadcom Limited
4 *
5 * This program is free software; you can redistribute it and/or modify
6 * it under the terms of the GNU General Public License as published by
7 * the Free Software Foundation.
8 */
9
10 #include <linux/netdevice.h>
11 #include <linux/inetdevice.h>
12 #include <linux/if_vlan.h>
13 #include <net/flow_dissector.h>
14 #include <net/pkt_cls.h>
15 #include <net/tc_act/tc_gact.h>
16 #include <net/tc_act/tc_skbedit.h>
17 #include <net/tc_act/tc_mirred.h>
18 #include <net/tc_act/tc_vlan.h>
19 #include <net/tc_act/tc_pedit.h>
20 #include <net/tc_act/tc_tunnel_key.h>
21 #include <net/vxlan.h>
22
23 #include "bnxt_hsi.h"
24 #include "bnxt.h"
25 #include "bnxt_hwrm.h"
26 #include "bnxt_sriov.h"
27 #include "bnxt_tc.h"
28 #include "bnxt_vfr.h"
29
30 #define BNXT_FID_INVALID 0xffff
31 #define VLAN_TCI(vid, prio) ((vid) | ((prio) << VLAN_PRIO_SHIFT))
32
33 #define is_vlan_pcp_wildcarded(vlan_tci_mask) \
34 ((ntohs(vlan_tci_mask) & VLAN_PRIO_MASK) == 0x0000)
35 #define is_vlan_pcp_exactmatch(vlan_tci_mask) \
36 ((ntohs(vlan_tci_mask) & VLAN_PRIO_MASK) == VLAN_PRIO_MASK)
37 #define is_vlan_pcp_zero(vlan_tci) \
38 ((ntohs(vlan_tci) & VLAN_PRIO_MASK) == 0x0000)
39 #define is_vid_exactmatch(vlan_tci_mask) \
40 ((ntohs(vlan_tci_mask) & VLAN_VID_MASK) == VLAN_VID_MASK)
41
42 static bool is_wildcard(void *mask, int len);
43 static bool is_exactmatch(void *mask, int len);
44 /* Return the dst fid of the func for flow forwarding
45 * For PFs: src_fid is the fid of the PF
46 * For VF-reps: src_fid the fid of the VF
47 */
bnxt_flow_get_dst_fid(struct bnxt * pf_bp,struct net_device * dev)48 static u16 bnxt_flow_get_dst_fid(struct bnxt *pf_bp, struct net_device *dev)
49 {
50 struct bnxt *bp;
51
52 /* check if dev belongs to the same switch */
53 if (!netdev_port_same_parent_id(pf_bp->dev, dev)) {
54 netdev_info(pf_bp->dev, "dev(ifindex=%d) not on same switch\n",
55 dev->ifindex);
56 return BNXT_FID_INVALID;
57 }
58
59 /* Is dev a VF-rep? */
60 if (bnxt_dev_is_vf_rep(dev))
61 return bnxt_vf_rep_get_fid(dev);
62
63 bp = netdev_priv(dev);
64 return bp->pf.fw_fid;
65 }
66
bnxt_tc_parse_redir(struct bnxt * bp,struct bnxt_tc_actions * actions,const struct flow_action_entry * act)67 static int bnxt_tc_parse_redir(struct bnxt *bp,
68 struct bnxt_tc_actions *actions,
69 const struct flow_action_entry *act)
70 {
71 struct net_device *dev = act->dev;
72
73 if (!dev) {
74 netdev_info(bp->dev, "no dev in mirred action\n");
75 return -EINVAL;
76 }
77
78 actions->flags |= BNXT_TC_ACTION_FLAG_FWD;
79 actions->dst_dev = dev;
80 return 0;
81 }
82
bnxt_tc_parse_vlan(struct bnxt * bp,struct bnxt_tc_actions * actions,const struct flow_action_entry * act)83 static int bnxt_tc_parse_vlan(struct bnxt *bp,
84 struct bnxt_tc_actions *actions,
85 const struct flow_action_entry *act)
86 {
87 switch (act->id) {
88 case FLOW_ACTION_VLAN_POP:
89 actions->flags |= BNXT_TC_ACTION_FLAG_POP_VLAN;
90 break;
91 case FLOW_ACTION_VLAN_PUSH:
92 actions->flags |= BNXT_TC_ACTION_FLAG_PUSH_VLAN;
93 actions->push_vlan_tci = htons(act->vlan.vid);
94 actions->push_vlan_tpid = act->vlan.proto;
95 break;
96 default:
97 return -EOPNOTSUPP;
98 }
99 return 0;
100 }
101
bnxt_tc_parse_tunnel_set(struct bnxt * bp,struct bnxt_tc_actions * actions,const struct flow_action_entry * act)102 static int bnxt_tc_parse_tunnel_set(struct bnxt *bp,
103 struct bnxt_tc_actions *actions,
104 const struct flow_action_entry *act)
105 {
106 const struct ip_tunnel_info *tun_info = act->tunnel;
107 const struct ip_tunnel_key *tun_key = &tun_info->key;
108
109 if (ip_tunnel_info_af(tun_info) != AF_INET) {
110 netdev_info(bp->dev, "only IPv4 tunnel-encap is supported\n");
111 return -EOPNOTSUPP;
112 }
113
114 actions->tun_encap_key = *tun_key;
115 actions->flags |= BNXT_TC_ACTION_FLAG_TUNNEL_ENCAP;
116 return 0;
117 }
118
119 /* Key & Mask from the stack comes unaligned in multiple iterations of 4 bytes
120 * each(u32).
121 * This routine consolidates such multiple unaligned values into one
122 * field each for Key & Mask (for src and dst macs separately)
123 * For example,
124 * Mask/Key Offset Iteration
125 * ========== ====== =========
126 * dst mac 0xffffffff 0 1
127 * dst mac 0x0000ffff 4 2
128 *
129 * src mac 0xffff0000 4 1
130 * src mac 0xffffffff 8 2
131 *
132 * The above combination coming from the stack will be consolidated as
133 * Mask/Key
134 * ==============
135 * src mac: 0xffffffffffff
136 * dst mac: 0xffffffffffff
137 */
bnxt_set_l2_key_mask(u32 part_key,u32 part_mask,u8 * actual_key,u8 * actual_mask)138 static void bnxt_set_l2_key_mask(u32 part_key, u32 part_mask,
139 u8 *actual_key, u8 *actual_mask)
140 {
141 u32 key = get_unaligned((u32 *)actual_key);
142 u32 mask = get_unaligned((u32 *)actual_mask);
143
144 part_key &= part_mask;
145 part_key |= key & ~part_mask;
146
147 put_unaligned(mask | part_mask, (u32 *)actual_mask);
148 put_unaligned(part_key, (u32 *)actual_key);
149 }
150
151 static int
bnxt_fill_l2_rewrite_fields(struct bnxt_tc_actions * actions,u16 * eth_addr,u16 * eth_addr_mask)152 bnxt_fill_l2_rewrite_fields(struct bnxt_tc_actions *actions,
153 u16 *eth_addr, u16 *eth_addr_mask)
154 {
155 u16 *p;
156 int j;
157
158 if (unlikely(bnxt_eth_addr_key_mask_invalid(eth_addr, eth_addr_mask)))
159 return -EINVAL;
160
161 if (!is_wildcard(ð_addr_mask[0], ETH_ALEN)) {
162 if (!is_exactmatch(ð_addr_mask[0], ETH_ALEN))
163 return -EINVAL;
164 /* FW expects dmac to be in u16 array format */
165 p = eth_addr;
166 for (j = 0; j < 3; j++)
167 actions->l2_rewrite_dmac[j] = cpu_to_be16(*(p + j));
168 }
169
170 if (!is_wildcard(ð_addr_mask[ETH_ALEN / 2], ETH_ALEN)) {
171 if (!is_exactmatch(ð_addr_mask[ETH_ALEN / 2], ETH_ALEN))
172 return -EINVAL;
173 /* FW expects smac to be in u16 array format */
174 p = ð_addr[ETH_ALEN / 2];
175 for (j = 0; j < 3; j++)
176 actions->l2_rewrite_smac[j] = cpu_to_be16(*(p + j));
177 }
178
179 return 0;
180 }
181
182 static int
bnxt_tc_parse_pedit(struct bnxt * bp,struct bnxt_tc_actions * actions,struct flow_action_entry * act,int act_idx,u8 * eth_addr,u8 * eth_addr_mask)183 bnxt_tc_parse_pedit(struct bnxt *bp, struct bnxt_tc_actions *actions,
184 struct flow_action_entry *act, int act_idx, u8 *eth_addr,
185 u8 *eth_addr_mask)
186 {
187 size_t offset_of_ip6_daddr = offsetof(struct ipv6hdr, daddr);
188 size_t offset_of_ip6_saddr = offsetof(struct ipv6hdr, saddr);
189 u32 mask, val, offset, idx;
190 u8 htype;
191
192 offset = act->mangle.offset;
193 htype = act->mangle.htype;
194 mask = ~act->mangle.mask;
195 val = act->mangle.val;
196
197 switch (htype) {
198 case FLOW_ACT_MANGLE_HDR_TYPE_ETH:
199 if (offset > PEDIT_OFFSET_SMAC_LAST_4_BYTES) {
200 netdev_err(bp->dev,
201 "%s: eth_hdr: Invalid pedit field\n",
202 __func__);
203 return -EINVAL;
204 }
205 actions->flags |= BNXT_TC_ACTION_FLAG_L2_REWRITE;
206
207 bnxt_set_l2_key_mask(val, mask, ð_addr[offset],
208 ð_addr_mask[offset]);
209 break;
210 case FLOW_ACT_MANGLE_HDR_TYPE_IP4:
211 actions->flags |= BNXT_TC_ACTION_FLAG_NAT_XLATE;
212 actions->nat.l3_is_ipv4 = true;
213 if (offset == offsetof(struct iphdr, saddr)) {
214 actions->nat.src_xlate = true;
215 actions->nat.l3.ipv4.saddr.s_addr = htonl(val);
216 } else if (offset == offsetof(struct iphdr, daddr)) {
217 actions->nat.src_xlate = false;
218 actions->nat.l3.ipv4.daddr.s_addr = htonl(val);
219 } else {
220 netdev_err(bp->dev,
221 "%s: IPv4_hdr: Invalid pedit field\n",
222 __func__);
223 return -EINVAL;
224 }
225
226 netdev_dbg(bp->dev, "nat.src_xlate = %d src IP: %pI4 dst ip : %pI4\n",
227 actions->nat.src_xlate, &actions->nat.l3.ipv4.saddr,
228 &actions->nat.l3.ipv4.daddr);
229 break;
230
231 case FLOW_ACT_MANGLE_HDR_TYPE_IP6:
232 actions->flags |= BNXT_TC_ACTION_FLAG_NAT_XLATE;
233 actions->nat.l3_is_ipv4 = false;
234 if (offset >= offsetof(struct ipv6hdr, saddr) &&
235 offset < offset_of_ip6_daddr) {
236 /* 16 byte IPv6 address comes in 4 iterations of
237 * 4byte chunks each
238 */
239 actions->nat.src_xlate = true;
240 idx = (offset - offset_of_ip6_saddr) / 4;
241 /* First 4bytes will be copied to idx 0 and so on */
242 actions->nat.l3.ipv6.saddr.s6_addr32[idx] = htonl(val);
243 } else if (offset >= offset_of_ip6_daddr &&
244 offset < offset_of_ip6_daddr + 16) {
245 actions->nat.src_xlate = false;
246 idx = (offset - offset_of_ip6_daddr) / 4;
247 actions->nat.l3.ipv6.saddr.s6_addr32[idx] = htonl(val);
248 } else {
249 netdev_err(bp->dev,
250 "%s: IPv6_hdr: Invalid pedit field\n",
251 __func__);
252 return -EINVAL;
253 }
254 break;
255 case FLOW_ACT_MANGLE_HDR_TYPE_TCP:
256 case FLOW_ACT_MANGLE_HDR_TYPE_UDP:
257 /* HW does not support L4 rewrite alone without L3
258 * rewrite
259 */
260 if (!(actions->flags & BNXT_TC_ACTION_FLAG_NAT_XLATE)) {
261 netdev_err(bp->dev,
262 "Need to specify L3 rewrite as well\n");
263 return -EINVAL;
264 }
265 if (actions->nat.src_xlate)
266 actions->nat.l4.ports.sport = htons(val);
267 else
268 actions->nat.l4.ports.dport = htons(val);
269 netdev_dbg(bp->dev, "actions->nat.sport = %d dport = %d\n",
270 actions->nat.l4.ports.sport,
271 actions->nat.l4.ports.dport);
272 break;
273 default:
274 netdev_err(bp->dev, "%s: Unsupported pedit hdr type\n",
275 __func__);
276 return -EINVAL;
277 }
278 return 0;
279 }
280
bnxt_tc_parse_actions(struct bnxt * bp,struct bnxt_tc_actions * actions,struct flow_action * flow_action,struct netlink_ext_ack * extack)281 static int bnxt_tc_parse_actions(struct bnxt *bp,
282 struct bnxt_tc_actions *actions,
283 struct flow_action *flow_action,
284 struct netlink_ext_ack *extack)
285 {
286 /* Used to store the L2 rewrite mask for dmac (6 bytes) followed by
287 * smac (6 bytes) if rewrite of both is specified, otherwise either
288 * dmac or smac
289 */
290 u16 eth_addr_mask[ETH_ALEN] = { 0 };
291 /* Used to store the L2 rewrite key for dmac (6 bytes) followed by
292 * smac (6 bytes) if rewrite of both is specified, otherwise either
293 * dmac or smac
294 */
295 u16 eth_addr[ETH_ALEN] = { 0 };
296 struct flow_action_entry *act;
297 int i, rc;
298
299 if (!flow_action_has_entries(flow_action)) {
300 netdev_info(bp->dev, "no actions\n");
301 return -EINVAL;
302 }
303
304 if (!flow_action_basic_hw_stats_check(flow_action, extack))
305 return -EOPNOTSUPP;
306
307 flow_action_for_each(i, act, flow_action) {
308 switch (act->id) {
309 case FLOW_ACTION_DROP:
310 actions->flags |= BNXT_TC_ACTION_FLAG_DROP;
311 return 0; /* don't bother with other actions */
312 case FLOW_ACTION_REDIRECT:
313 rc = bnxt_tc_parse_redir(bp, actions, act);
314 if (rc)
315 return rc;
316 break;
317 case FLOW_ACTION_VLAN_POP:
318 case FLOW_ACTION_VLAN_PUSH:
319 case FLOW_ACTION_VLAN_MANGLE:
320 rc = bnxt_tc_parse_vlan(bp, actions, act);
321 if (rc)
322 return rc;
323 break;
324 case FLOW_ACTION_TUNNEL_ENCAP:
325 rc = bnxt_tc_parse_tunnel_set(bp, actions, act);
326 if (rc)
327 return rc;
328 break;
329 case FLOW_ACTION_TUNNEL_DECAP:
330 actions->flags |= BNXT_TC_ACTION_FLAG_TUNNEL_DECAP;
331 break;
332 /* Packet edit: L2 rewrite, NAT, NAPT */
333 case FLOW_ACTION_MANGLE:
334 rc = bnxt_tc_parse_pedit(bp, actions, act, i,
335 (u8 *)eth_addr,
336 (u8 *)eth_addr_mask);
337 if (rc)
338 return rc;
339 break;
340 default:
341 break;
342 }
343 }
344
345 if (actions->flags & BNXT_TC_ACTION_FLAG_L2_REWRITE) {
346 rc = bnxt_fill_l2_rewrite_fields(actions, eth_addr,
347 eth_addr_mask);
348 if (rc)
349 return rc;
350 }
351
352 if (actions->flags & BNXT_TC_ACTION_FLAG_FWD) {
353 if (actions->flags & BNXT_TC_ACTION_FLAG_TUNNEL_ENCAP) {
354 /* dst_fid is PF's fid */
355 actions->dst_fid = bp->pf.fw_fid;
356 } else {
357 /* find the FID from dst_dev */
358 actions->dst_fid =
359 bnxt_flow_get_dst_fid(bp, actions->dst_dev);
360 if (actions->dst_fid == BNXT_FID_INVALID)
361 return -EINVAL;
362 }
363 }
364
365 return 0;
366 }
367
bnxt_tc_parse_flow(struct bnxt * bp,struct flow_cls_offload * tc_flow_cmd,struct bnxt_tc_flow * flow)368 static int bnxt_tc_parse_flow(struct bnxt *bp,
369 struct flow_cls_offload *tc_flow_cmd,
370 struct bnxt_tc_flow *flow)
371 {
372 struct flow_rule *rule = flow_cls_offload_flow_rule(tc_flow_cmd);
373 struct flow_dissector *dissector = rule->match.dissector;
374
375 /* KEY_CONTROL and KEY_BASIC are needed for forming a meaningful key */
376 if ((dissector->used_keys & BIT_ULL(FLOW_DISSECTOR_KEY_CONTROL)) == 0 ||
377 (dissector->used_keys & BIT_ULL(FLOW_DISSECTOR_KEY_BASIC)) == 0) {
378 netdev_info(bp->dev, "cannot form TC key: used_keys = 0x%llx\n",
379 dissector->used_keys);
380 return -EOPNOTSUPP;
381 }
382
383 if (flow_rule_match_key(rule, FLOW_DISSECTOR_KEY_BASIC)) {
384 struct flow_match_basic match;
385
386 flow_rule_match_basic(rule, &match);
387 flow->l2_key.ether_type = match.key->n_proto;
388 flow->l2_mask.ether_type = match.mask->n_proto;
389
390 if (match.key->n_proto == htons(ETH_P_IP) ||
391 match.key->n_proto == htons(ETH_P_IPV6)) {
392 flow->l4_key.ip_proto = match.key->ip_proto;
393 flow->l4_mask.ip_proto = match.mask->ip_proto;
394 }
395 }
396
397 if (flow_rule_match_key(rule, FLOW_DISSECTOR_KEY_ETH_ADDRS)) {
398 struct flow_match_eth_addrs match;
399
400 flow_rule_match_eth_addrs(rule, &match);
401 flow->flags |= BNXT_TC_FLOW_FLAGS_ETH_ADDRS;
402 ether_addr_copy(flow->l2_key.dmac, match.key->dst);
403 ether_addr_copy(flow->l2_mask.dmac, match.mask->dst);
404 ether_addr_copy(flow->l2_key.smac, match.key->src);
405 ether_addr_copy(flow->l2_mask.smac, match.mask->src);
406 }
407
408 if (flow_rule_match_key(rule, FLOW_DISSECTOR_KEY_VLAN)) {
409 struct flow_match_vlan match;
410
411 flow_rule_match_vlan(rule, &match);
412 flow->l2_key.inner_vlan_tci =
413 cpu_to_be16(VLAN_TCI(match.key->vlan_id,
414 match.key->vlan_priority));
415 flow->l2_mask.inner_vlan_tci =
416 cpu_to_be16((VLAN_TCI(match.mask->vlan_id,
417 match.mask->vlan_priority)));
418 flow->l2_key.inner_vlan_tpid = htons(ETH_P_8021Q);
419 flow->l2_mask.inner_vlan_tpid = htons(0xffff);
420 flow->l2_key.num_vlans = 1;
421 }
422
423 if (flow_rule_match_key(rule, FLOW_DISSECTOR_KEY_IPV4_ADDRS)) {
424 struct flow_match_ipv4_addrs match;
425
426 flow_rule_match_ipv4_addrs(rule, &match);
427 flow->flags |= BNXT_TC_FLOW_FLAGS_IPV4_ADDRS;
428 flow->l3_key.ipv4.daddr.s_addr = match.key->dst;
429 flow->l3_mask.ipv4.daddr.s_addr = match.mask->dst;
430 flow->l3_key.ipv4.saddr.s_addr = match.key->src;
431 flow->l3_mask.ipv4.saddr.s_addr = match.mask->src;
432 } else if (flow_rule_match_key(rule, FLOW_DISSECTOR_KEY_IPV6_ADDRS)) {
433 struct flow_match_ipv6_addrs match;
434
435 flow_rule_match_ipv6_addrs(rule, &match);
436 flow->flags |= BNXT_TC_FLOW_FLAGS_IPV6_ADDRS;
437 flow->l3_key.ipv6.daddr = match.key->dst;
438 flow->l3_mask.ipv6.daddr = match.mask->dst;
439 flow->l3_key.ipv6.saddr = match.key->src;
440 flow->l3_mask.ipv6.saddr = match.mask->src;
441 }
442
443 if (flow_rule_match_key(rule, FLOW_DISSECTOR_KEY_PORTS)) {
444 struct flow_match_ports match;
445
446 flow_rule_match_ports(rule, &match);
447 flow->flags |= BNXT_TC_FLOW_FLAGS_PORTS;
448 flow->l4_key.ports.dport = match.key->dst;
449 flow->l4_mask.ports.dport = match.mask->dst;
450 flow->l4_key.ports.sport = match.key->src;
451 flow->l4_mask.ports.sport = match.mask->src;
452 }
453
454 if (flow_rule_match_key(rule, FLOW_DISSECTOR_KEY_ICMP)) {
455 struct flow_match_icmp match;
456
457 flow_rule_match_icmp(rule, &match);
458 flow->flags |= BNXT_TC_FLOW_FLAGS_ICMP;
459 flow->l4_key.icmp.type = match.key->type;
460 flow->l4_key.icmp.code = match.key->code;
461 flow->l4_mask.icmp.type = match.mask->type;
462 flow->l4_mask.icmp.code = match.mask->code;
463 }
464
465 if (flow_rule_match_key(rule, FLOW_DISSECTOR_KEY_ENC_IPV4_ADDRS)) {
466 struct flow_match_ipv4_addrs match;
467
468 flow_rule_match_enc_ipv4_addrs(rule, &match);
469 flow->flags |= BNXT_TC_FLOW_FLAGS_TUNL_IPV4_ADDRS;
470 flow->tun_key.u.ipv4.dst = match.key->dst;
471 flow->tun_mask.u.ipv4.dst = match.mask->dst;
472 flow->tun_key.u.ipv4.src = match.key->src;
473 flow->tun_mask.u.ipv4.src = match.mask->src;
474 } else if (flow_rule_match_key(rule,
475 FLOW_DISSECTOR_KEY_ENC_IPV6_ADDRS)) {
476 return -EOPNOTSUPP;
477 }
478
479 if (flow_rule_match_key(rule, FLOW_DISSECTOR_KEY_ENC_KEYID)) {
480 struct flow_match_enc_keyid match;
481
482 flow_rule_match_enc_keyid(rule, &match);
483 flow->flags |= BNXT_TC_FLOW_FLAGS_TUNL_ID;
484 flow->tun_key.tun_id = key32_to_tunnel_id(match.key->keyid);
485 flow->tun_mask.tun_id = key32_to_tunnel_id(match.mask->keyid);
486 }
487
488 if (flow_rule_match_key(rule, FLOW_DISSECTOR_KEY_ENC_PORTS)) {
489 struct flow_match_ports match;
490
491 flow_rule_match_enc_ports(rule, &match);
492 flow->flags |= BNXT_TC_FLOW_FLAGS_TUNL_PORTS;
493 flow->tun_key.tp_dst = match.key->dst;
494 flow->tun_mask.tp_dst = match.mask->dst;
495 flow->tun_key.tp_src = match.key->src;
496 flow->tun_mask.tp_src = match.mask->src;
497 }
498
499 return bnxt_tc_parse_actions(bp, &flow->actions, &rule->action,
500 tc_flow_cmd->common.extack);
501 }
502
bnxt_hwrm_cfa_flow_free(struct bnxt * bp,struct bnxt_tc_flow_node * flow_node)503 static int bnxt_hwrm_cfa_flow_free(struct bnxt *bp,
504 struct bnxt_tc_flow_node *flow_node)
505 {
506 struct hwrm_cfa_flow_free_input *req;
507 int rc;
508
509 rc = hwrm_req_init(bp, req, HWRM_CFA_FLOW_FREE);
510 if (!rc) {
511 if (bp->fw_cap & BNXT_FW_CAP_OVS_64BIT_HANDLE)
512 req->ext_flow_handle = flow_node->ext_flow_handle;
513 else
514 req->flow_handle = flow_node->flow_handle;
515
516 rc = hwrm_req_send(bp, req);
517 }
518 if (rc)
519 netdev_info(bp->dev, "%s: Error rc=%d\n", __func__, rc);
520
521 return rc;
522 }
523
ipv6_mask_len(struct in6_addr * mask)524 static int ipv6_mask_len(struct in6_addr *mask)
525 {
526 int mask_len = 0, i;
527
528 for (i = 0; i < 4; i++)
529 mask_len += inet_mask_len(mask->s6_addr32[i]);
530
531 return mask_len;
532 }
533
is_wildcard(void * mask,int len)534 static bool is_wildcard(void *mask, int len)
535 {
536 const u8 *p = mask;
537 int i;
538
539 for (i = 0; i < len; i++) {
540 if (p[i] != 0)
541 return false;
542 }
543 return true;
544 }
545
is_exactmatch(void * mask,int len)546 static bool is_exactmatch(void *mask, int len)
547 {
548 const u8 *p = mask;
549 int i;
550
551 for (i = 0; i < len; i++)
552 if (p[i] != 0xff)
553 return false;
554
555 return true;
556 }
557
is_vlan_tci_allowed(__be16 vlan_tci_mask,__be16 vlan_tci)558 static bool is_vlan_tci_allowed(__be16 vlan_tci_mask,
559 __be16 vlan_tci)
560 {
561 /* VLAN priority must be either exactly zero or fully wildcarded and
562 * VLAN id must be exact match.
563 */
564 if (is_vid_exactmatch(vlan_tci_mask) &&
565 ((is_vlan_pcp_exactmatch(vlan_tci_mask) &&
566 is_vlan_pcp_zero(vlan_tci)) ||
567 is_vlan_pcp_wildcarded(vlan_tci_mask)))
568 return true;
569
570 return false;
571 }
572
bits_set(void * key,int len)573 static bool bits_set(void *key, int len)
574 {
575 const u8 *p = key;
576 int i;
577
578 for (i = 0; i < len; i++)
579 if (p[i] != 0)
580 return true;
581
582 return false;
583 }
584
bnxt_hwrm_cfa_flow_alloc(struct bnxt * bp,struct bnxt_tc_flow * flow,__le16 ref_flow_handle,__le32 tunnel_handle,struct bnxt_tc_flow_node * flow_node)585 static int bnxt_hwrm_cfa_flow_alloc(struct bnxt *bp, struct bnxt_tc_flow *flow,
586 __le16 ref_flow_handle,
587 __le32 tunnel_handle,
588 struct bnxt_tc_flow_node *flow_node)
589 {
590 struct bnxt_tc_actions *actions = &flow->actions;
591 struct bnxt_tc_l3_key *l3_mask = &flow->l3_mask;
592 struct bnxt_tc_l3_key *l3_key = &flow->l3_key;
593 struct hwrm_cfa_flow_alloc_output *resp;
594 struct hwrm_cfa_flow_alloc_input *req;
595 u16 flow_flags = 0, action_flags = 0;
596 int rc;
597
598 rc = hwrm_req_init(bp, req, HWRM_CFA_FLOW_ALLOC);
599 if (rc)
600 return rc;
601
602 req->src_fid = cpu_to_le16(flow->src_fid);
603 req->ref_flow_handle = ref_flow_handle;
604
605 if (actions->flags & BNXT_TC_ACTION_FLAG_L2_REWRITE) {
606 memcpy(req->l2_rewrite_dmac, actions->l2_rewrite_dmac,
607 ETH_ALEN);
608 memcpy(req->l2_rewrite_smac, actions->l2_rewrite_smac,
609 ETH_ALEN);
610 action_flags |=
611 CFA_FLOW_ALLOC_REQ_ACTION_FLAGS_L2_HEADER_REWRITE;
612 }
613
614 if (actions->flags & BNXT_TC_ACTION_FLAG_NAT_XLATE) {
615 if (actions->nat.l3_is_ipv4) {
616 action_flags |=
617 CFA_FLOW_ALLOC_REQ_ACTION_FLAGS_NAT_IPV4_ADDRESS;
618
619 if (actions->nat.src_xlate) {
620 action_flags |=
621 CFA_FLOW_ALLOC_REQ_ACTION_FLAGS_NAT_SRC;
622 /* L3 source rewrite */
623 req->nat_ip_address[0] =
624 actions->nat.l3.ipv4.saddr.s_addr;
625 /* L4 source port */
626 if (actions->nat.l4.ports.sport)
627 req->nat_port =
628 actions->nat.l4.ports.sport;
629 } else {
630 action_flags |=
631 CFA_FLOW_ALLOC_REQ_ACTION_FLAGS_NAT_DEST;
632 /* L3 destination rewrite */
633 req->nat_ip_address[0] =
634 actions->nat.l3.ipv4.daddr.s_addr;
635 /* L4 destination port */
636 if (actions->nat.l4.ports.dport)
637 req->nat_port =
638 actions->nat.l4.ports.dport;
639 }
640 netdev_dbg(bp->dev,
641 "req->nat_ip_address: %pI4 src_xlate: %d req->nat_port: %x\n",
642 req->nat_ip_address, actions->nat.src_xlate,
643 req->nat_port);
644 } else {
645 if (actions->nat.src_xlate) {
646 action_flags |=
647 CFA_FLOW_ALLOC_REQ_ACTION_FLAGS_NAT_SRC;
648 /* L3 source rewrite */
649 memcpy(req->nat_ip_address,
650 actions->nat.l3.ipv6.saddr.s6_addr32,
651 sizeof(req->nat_ip_address));
652 /* L4 source port */
653 if (actions->nat.l4.ports.sport)
654 req->nat_port =
655 actions->nat.l4.ports.sport;
656 } else {
657 action_flags |=
658 CFA_FLOW_ALLOC_REQ_ACTION_FLAGS_NAT_DEST;
659 /* L3 destination rewrite */
660 memcpy(req->nat_ip_address,
661 actions->nat.l3.ipv6.daddr.s6_addr32,
662 sizeof(req->nat_ip_address));
663 /* L4 destination port */
664 if (actions->nat.l4.ports.dport)
665 req->nat_port =
666 actions->nat.l4.ports.dport;
667 }
668 netdev_dbg(bp->dev,
669 "req->nat_ip_address: %pI6 src_xlate: %d req->nat_port: %x\n",
670 req->nat_ip_address, actions->nat.src_xlate,
671 req->nat_port);
672 }
673 }
674
675 if (actions->flags & BNXT_TC_ACTION_FLAG_TUNNEL_DECAP ||
676 actions->flags & BNXT_TC_ACTION_FLAG_TUNNEL_ENCAP) {
677 req->tunnel_handle = tunnel_handle;
678 flow_flags |= CFA_FLOW_ALLOC_REQ_FLAGS_TUNNEL;
679 action_flags |= CFA_FLOW_ALLOC_REQ_ACTION_FLAGS_TUNNEL;
680 }
681
682 req->ethertype = flow->l2_key.ether_type;
683 req->ip_proto = flow->l4_key.ip_proto;
684
685 if (flow->flags & BNXT_TC_FLOW_FLAGS_ETH_ADDRS) {
686 memcpy(req->dmac, flow->l2_key.dmac, ETH_ALEN);
687 memcpy(req->smac, flow->l2_key.smac, ETH_ALEN);
688 }
689
690 if (flow->l2_key.num_vlans > 0) {
691 flow_flags |= CFA_FLOW_ALLOC_REQ_FLAGS_NUM_VLAN_ONE;
692 /* FW expects the inner_vlan_tci value to be set
693 * in outer_vlan_tci when num_vlans is 1 (which is
694 * always the case in TC.)
695 */
696 req->outer_vlan_tci = flow->l2_key.inner_vlan_tci;
697 }
698
699 /* If all IP and L4 fields are wildcarded then this is an L2 flow */
700 if (is_wildcard(l3_mask, sizeof(*l3_mask)) &&
701 is_wildcard(&flow->l4_mask, sizeof(flow->l4_mask))) {
702 flow_flags |= CFA_FLOW_ALLOC_REQ_FLAGS_FLOWTYPE_L2;
703 } else {
704 flow_flags |= flow->l2_key.ether_type == htons(ETH_P_IP) ?
705 CFA_FLOW_ALLOC_REQ_FLAGS_FLOWTYPE_IPV4 :
706 CFA_FLOW_ALLOC_REQ_FLAGS_FLOWTYPE_IPV6;
707
708 if (flow->flags & BNXT_TC_FLOW_FLAGS_IPV4_ADDRS) {
709 req->ip_dst[0] = l3_key->ipv4.daddr.s_addr;
710 req->ip_dst_mask_len =
711 inet_mask_len(l3_mask->ipv4.daddr.s_addr);
712 req->ip_src[0] = l3_key->ipv4.saddr.s_addr;
713 req->ip_src_mask_len =
714 inet_mask_len(l3_mask->ipv4.saddr.s_addr);
715 } else if (flow->flags & BNXT_TC_FLOW_FLAGS_IPV6_ADDRS) {
716 memcpy(req->ip_dst, l3_key->ipv6.daddr.s6_addr32,
717 sizeof(req->ip_dst));
718 req->ip_dst_mask_len =
719 ipv6_mask_len(&l3_mask->ipv6.daddr);
720 memcpy(req->ip_src, l3_key->ipv6.saddr.s6_addr32,
721 sizeof(req->ip_src));
722 req->ip_src_mask_len =
723 ipv6_mask_len(&l3_mask->ipv6.saddr);
724 }
725 }
726
727 if (flow->flags & BNXT_TC_FLOW_FLAGS_PORTS) {
728 req->l4_src_port = flow->l4_key.ports.sport;
729 req->l4_src_port_mask = flow->l4_mask.ports.sport;
730 req->l4_dst_port = flow->l4_key.ports.dport;
731 req->l4_dst_port_mask = flow->l4_mask.ports.dport;
732 } else if (flow->flags & BNXT_TC_FLOW_FLAGS_ICMP) {
733 /* l4 ports serve as type/code when ip_proto is ICMP */
734 req->l4_src_port = htons(flow->l4_key.icmp.type);
735 req->l4_src_port_mask = htons(flow->l4_mask.icmp.type);
736 req->l4_dst_port = htons(flow->l4_key.icmp.code);
737 req->l4_dst_port_mask = htons(flow->l4_mask.icmp.code);
738 }
739 req->flags = cpu_to_le16(flow_flags);
740
741 if (actions->flags & BNXT_TC_ACTION_FLAG_DROP) {
742 action_flags |= CFA_FLOW_ALLOC_REQ_ACTION_FLAGS_DROP;
743 } else {
744 if (actions->flags & BNXT_TC_ACTION_FLAG_FWD) {
745 action_flags |= CFA_FLOW_ALLOC_REQ_ACTION_FLAGS_FWD;
746 req->dst_fid = cpu_to_le16(actions->dst_fid);
747 }
748 if (actions->flags & BNXT_TC_ACTION_FLAG_PUSH_VLAN) {
749 action_flags |=
750 CFA_FLOW_ALLOC_REQ_ACTION_FLAGS_L2_HEADER_REWRITE;
751 req->l2_rewrite_vlan_tpid = actions->push_vlan_tpid;
752 req->l2_rewrite_vlan_tci = actions->push_vlan_tci;
753 memcpy(&req->l2_rewrite_dmac, &req->dmac, ETH_ALEN);
754 memcpy(&req->l2_rewrite_smac, &req->smac, ETH_ALEN);
755 }
756 if (actions->flags & BNXT_TC_ACTION_FLAG_POP_VLAN) {
757 action_flags |=
758 CFA_FLOW_ALLOC_REQ_ACTION_FLAGS_L2_HEADER_REWRITE;
759 /* Rewrite config with tpid = 0 implies vlan pop */
760 req->l2_rewrite_vlan_tpid = 0;
761 memcpy(&req->l2_rewrite_dmac, &req->dmac, ETH_ALEN);
762 memcpy(&req->l2_rewrite_smac, &req->smac, ETH_ALEN);
763 }
764 }
765 req->action_flags = cpu_to_le16(action_flags);
766
767 resp = hwrm_req_hold(bp, req);
768 rc = hwrm_req_send_silent(bp, req);
769 if (!rc) {
770 /* CFA_FLOW_ALLOC response interpretation:
771 * fw with fw with
772 * 16-bit 64-bit
773 * flow handle flow handle
774 * =========== ===========
775 * flow_handle flow handle flow context id
776 * ext_flow_handle INVALID flow handle
777 * flow_id INVALID flow counter id
778 */
779 flow_node->flow_handle = resp->flow_handle;
780 if (bp->fw_cap & BNXT_FW_CAP_OVS_64BIT_HANDLE) {
781 flow_node->ext_flow_handle = resp->ext_flow_handle;
782 flow_node->flow_id = resp->flow_id;
783 }
784 }
785 hwrm_req_drop(bp, req);
786 return rc;
787 }
788
hwrm_cfa_decap_filter_alloc(struct bnxt * bp,struct bnxt_tc_flow * flow,struct bnxt_tc_l2_key * l2_info,__le32 ref_decap_handle,__le32 * decap_filter_handle)789 static int hwrm_cfa_decap_filter_alloc(struct bnxt *bp,
790 struct bnxt_tc_flow *flow,
791 struct bnxt_tc_l2_key *l2_info,
792 __le32 ref_decap_handle,
793 __le32 *decap_filter_handle)
794 {
795 struct hwrm_cfa_decap_filter_alloc_output *resp;
796 struct ip_tunnel_key *tun_key = &flow->tun_key;
797 struct hwrm_cfa_decap_filter_alloc_input *req;
798 u32 enables = 0;
799 int rc;
800
801 rc = hwrm_req_init(bp, req, HWRM_CFA_DECAP_FILTER_ALLOC);
802 if (rc)
803 goto exit;
804
805 req->flags = cpu_to_le32(CFA_DECAP_FILTER_ALLOC_REQ_FLAGS_OVS_TUNNEL);
806 enables |= CFA_DECAP_FILTER_ALLOC_REQ_ENABLES_TUNNEL_TYPE |
807 CFA_DECAP_FILTER_ALLOC_REQ_ENABLES_IP_PROTOCOL;
808 req->tunnel_type = CFA_DECAP_FILTER_ALLOC_REQ_TUNNEL_TYPE_VXLAN;
809 req->ip_protocol = CFA_DECAP_FILTER_ALLOC_REQ_IP_PROTOCOL_UDP;
810
811 if (flow->flags & BNXT_TC_FLOW_FLAGS_TUNL_ID) {
812 enables |= CFA_DECAP_FILTER_ALLOC_REQ_ENABLES_TUNNEL_ID;
813 /* tunnel_id is wrongly defined in hsi defn. as __le32 */
814 req->tunnel_id = tunnel_id_to_key32(tun_key->tun_id);
815 }
816
817 if (flow->flags & BNXT_TC_FLOW_FLAGS_TUNL_ETH_ADDRS) {
818 enables |= CFA_DECAP_FILTER_ALLOC_REQ_ENABLES_DST_MACADDR;
819 ether_addr_copy(req->dst_macaddr, l2_info->dmac);
820 }
821 if (l2_info->num_vlans) {
822 enables |= CFA_DECAP_FILTER_ALLOC_REQ_ENABLES_T_IVLAN_VID;
823 req->t_ivlan_vid = l2_info->inner_vlan_tci;
824 }
825
826 enables |= CFA_DECAP_FILTER_ALLOC_REQ_ENABLES_ETHERTYPE;
827 req->ethertype = htons(ETH_P_IP);
828
829 if (flow->flags & BNXT_TC_FLOW_FLAGS_TUNL_IPV4_ADDRS) {
830 enables |= CFA_DECAP_FILTER_ALLOC_REQ_ENABLES_SRC_IPADDR |
831 CFA_DECAP_FILTER_ALLOC_REQ_ENABLES_DST_IPADDR |
832 CFA_DECAP_FILTER_ALLOC_REQ_ENABLES_IPADDR_TYPE;
833 req->ip_addr_type =
834 CFA_DECAP_FILTER_ALLOC_REQ_IP_ADDR_TYPE_IPV4;
835 req->dst_ipaddr[0] = tun_key->u.ipv4.dst;
836 req->src_ipaddr[0] = tun_key->u.ipv4.src;
837 }
838
839 if (flow->flags & BNXT_TC_FLOW_FLAGS_TUNL_PORTS) {
840 enables |= CFA_DECAP_FILTER_ALLOC_REQ_ENABLES_DST_PORT;
841 req->dst_port = tun_key->tp_dst;
842 }
843
844 /* Eventhough the decap_handle returned by hwrm_cfa_decap_filter_alloc
845 * is defined as __le32, l2_ctxt_ref_id is defined in HSI as __le16.
846 */
847 req->l2_ctxt_ref_id = (__force __le16)ref_decap_handle;
848 req->enables = cpu_to_le32(enables);
849
850 resp = hwrm_req_hold(bp, req);
851 rc = hwrm_req_send_silent(bp, req);
852 if (!rc)
853 *decap_filter_handle = resp->decap_filter_id;
854 hwrm_req_drop(bp, req);
855 exit:
856 if (rc)
857 netdev_info(bp->dev, "%s: Error rc=%d\n", __func__, rc);
858
859 return rc;
860 }
861
hwrm_cfa_decap_filter_free(struct bnxt * bp,__le32 decap_filter_handle)862 static int hwrm_cfa_decap_filter_free(struct bnxt *bp,
863 __le32 decap_filter_handle)
864 {
865 struct hwrm_cfa_decap_filter_free_input *req;
866 int rc;
867
868 rc = hwrm_req_init(bp, req, HWRM_CFA_DECAP_FILTER_FREE);
869 if (!rc) {
870 req->decap_filter_id = decap_filter_handle;
871 rc = hwrm_req_send(bp, req);
872 }
873 if (rc)
874 netdev_info(bp->dev, "%s: Error rc=%d\n", __func__, rc);
875
876 return rc;
877 }
878
hwrm_cfa_encap_record_alloc(struct bnxt * bp,struct ip_tunnel_key * encap_key,struct bnxt_tc_l2_key * l2_info,__le32 * encap_record_handle)879 static int hwrm_cfa_encap_record_alloc(struct bnxt *bp,
880 struct ip_tunnel_key *encap_key,
881 struct bnxt_tc_l2_key *l2_info,
882 __le32 *encap_record_handle)
883 {
884 struct hwrm_cfa_encap_record_alloc_output *resp;
885 struct hwrm_cfa_encap_record_alloc_input *req;
886 struct hwrm_cfa_encap_data_vxlan *encap;
887 struct hwrm_vxlan_ipv4_hdr *encap_ipv4;
888 int rc;
889
890 rc = hwrm_req_init(bp, req, HWRM_CFA_ENCAP_RECORD_ALLOC);
891 if (rc)
892 goto exit;
893
894 encap = (struct hwrm_cfa_encap_data_vxlan *)&req->encap_data;
895 req->encap_type = CFA_ENCAP_RECORD_ALLOC_REQ_ENCAP_TYPE_VXLAN;
896 ether_addr_copy(encap->dst_mac_addr, l2_info->dmac);
897 ether_addr_copy(encap->src_mac_addr, l2_info->smac);
898 if (l2_info->num_vlans) {
899 encap->num_vlan_tags = l2_info->num_vlans;
900 encap->ovlan_tci = l2_info->inner_vlan_tci;
901 encap->ovlan_tpid = l2_info->inner_vlan_tpid;
902 }
903
904 encap_ipv4 = (struct hwrm_vxlan_ipv4_hdr *)encap->l3;
905 encap_ipv4->ver_hlen = 4 << VXLAN_IPV4_HDR_VER_HLEN_VERSION_SFT;
906 encap_ipv4->ver_hlen |= 5 << VXLAN_IPV4_HDR_VER_HLEN_HEADER_LENGTH_SFT;
907 encap_ipv4->ttl = encap_key->ttl;
908
909 encap_ipv4->dest_ip_addr = encap_key->u.ipv4.dst;
910 encap_ipv4->src_ip_addr = encap_key->u.ipv4.src;
911 encap_ipv4->protocol = IPPROTO_UDP;
912
913 encap->dst_port = encap_key->tp_dst;
914 encap->vni = tunnel_id_to_key32(encap_key->tun_id);
915
916 resp = hwrm_req_hold(bp, req);
917 rc = hwrm_req_send_silent(bp, req);
918 if (!rc)
919 *encap_record_handle = resp->encap_record_id;
920 hwrm_req_drop(bp, req);
921 exit:
922 if (rc)
923 netdev_info(bp->dev, "%s: Error rc=%d\n", __func__, rc);
924
925 return rc;
926 }
927
hwrm_cfa_encap_record_free(struct bnxt * bp,__le32 encap_record_handle)928 static int hwrm_cfa_encap_record_free(struct bnxt *bp,
929 __le32 encap_record_handle)
930 {
931 struct hwrm_cfa_encap_record_free_input *req;
932 int rc;
933
934 rc = hwrm_req_init(bp, req, HWRM_CFA_ENCAP_RECORD_FREE);
935 if (!rc) {
936 req->encap_record_id = encap_record_handle;
937 rc = hwrm_req_send(bp, req);
938 }
939 if (rc)
940 netdev_info(bp->dev, "%s: Error rc=%d\n", __func__, rc);
941
942 return rc;
943 }
944
bnxt_tc_put_l2_node(struct bnxt * bp,struct bnxt_tc_flow_node * flow_node)945 static int bnxt_tc_put_l2_node(struct bnxt *bp,
946 struct bnxt_tc_flow_node *flow_node)
947 {
948 struct bnxt_tc_l2_node *l2_node = flow_node->l2_node;
949 struct bnxt_tc_info *tc_info = bp->tc_info;
950 int rc;
951
952 /* remove flow_node from the L2 shared flow list */
953 list_del(&flow_node->l2_list_node);
954 if (--l2_node->refcount == 0) {
955 rc = rhashtable_remove_fast(&tc_info->l2_table, &l2_node->node,
956 tc_info->l2_ht_params);
957 if (rc)
958 netdev_err(bp->dev,
959 "Error: %s: rhashtable_remove_fast: %d\n",
960 __func__, rc);
961 kfree_rcu(l2_node, rcu);
962 }
963 return 0;
964 }
965
966 static struct bnxt_tc_l2_node *
bnxt_tc_get_l2_node(struct bnxt * bp,struct rhashtable * l2_table,struct rhashtable_params ht_params,struct bnxt_tc_l2_key * l2_key)967 bnxt_tc_get_l2_node(struct bnxt *bp, struct rhashtable *l2_table,
968 struct rhashtable_params ht_params,
969 struct bnxt_tc_l2_key *l2_key)
970 {
971 struct bnxt_tc_l2_node *l2_node;
972 int rc;
973
974 l2_node = rhashtable_lookup_fast(l2_table, l2_key, ht_params);
975 if (!l2_node) {
976 l2_node = kzalloc(sizeof(*l2_node), GFP_KERNEL);
977 if (!l2_node) {
978 rc = -ENOMEM;
979 return NULL;
980 }
981
982 l2_node->key = *l2_key;
983 rc = rhashtable_insert_fast(l2_table, &l2_node->node,
984 ht_params);
985 if (rc) {
986 kfree_rcu(l2_node, rcu);
987 netdev_err(bp->dev,
988 "Error: %s: rhashtable_insert_fast: %d\n",
989 __func__, rc);
990 return NULL;
991 }
992 INIT_LIST_HEAD(&l2_node->common_l2_flows);
993 }
994 return l2_node;
995 }
996
997 /* Get the ref_flow_handle for a flow by checking if there are any other
998 * flows that share the same L2 key as this flow.
999 */
1000 static int
bnxt_tc_get_ref_flow_handle(struct bnxt * bp,struct bnxt_tc_flow * flow,struct bnxt_tc_flow_node * flow_node,__le16 * ref_flow_handle)1001 bnxt_tc_get_ref_flow_handle(struct bnxt *bp, struct bnxt_tc_flow *flow,
1002 struct bnxt_tc_flow_node *flow_node,
1003 __le16 *ref_flow_handle)
1004 {
1005 struct bnxt_tc_info *tc_info = bp->tc_info;
1006 struct bnxt_tc_flow_node *ref_flow_node;
1007 struct bnxt_tc_l2_node *l2_node;
1008
1009 l2_node = bnxt_tc_get_l2_node(bp, &tc_info->l2_table,
1010 tc_info->l2_ht_params,
1011 &flow->l2_key);
1012 if (!l2_node)
1013 return -1;
1014
1015 /* If any other flow is using this l2_node, use it's flow_handle
1016 * as the ref_flow_handle
1017 */
1018 if (l2_node->refcount > 0) {
1019 ref_flow_node = list_first_entry(&l2_node->common_l2_flows,
1020 struct bnxt_tc_flow_node,
1021 l2_list_node);
1022 *ref_flow_handle = ref_flow_node->flow_handle;
1023 } else {
1024 *ref_flow_handle = cpu_to_le16(0xffff);
1025 }
1026
1027 /* Insert the l2_node into the flow_node so that subsequent flows
1028 * with a matching l2 key can use the flow_handle of this flow
1029 * as their ref_flow_handle
1030 */
1031 flow_node->l2_node = l2_node;
1032 list_add(&flow_node->l2_list_node, &l2_node->common_l2_flows);
1033 l2_node->refcount++;
1034 return 0;
1035 }
1036
1037 /* After the flow parsing is done, this routine is used for checking
1038 * if there are any aspects of the flow that prevent it from being
1039 * offloaded.
1040 */
bnxt_tc_can_offload(struct bnxt * bp,struct bnxt_tc_flow * flow)1041 static bool bnxt_tc_can_offload(struct bnxt *bp, struct bnxt_tc_flow *flow)
1042 {
1043 /* If L4 ports are specified then ip_proto must be TCP or UDP */
1044 if ((flow->flags & BNXT_TC_FLOW_FLAGS_PORTS) &&
1045 (flow->l4_key.ip_proto != IPPROTO_TCP &&
1046 flow->l4_key.ip_proto != IPPROTO_UDP)) {
1047 netdev_info(bp->dev, "Cannot offload non-TCP/UDP (%d) ports\n",
1048 flow->l4_key.ip_proto);
1049 return false;
1050 }
1051
1052 /* Currently source/dest MAC cannot be partial wildcard */
1053 if (bits_set(&flow->l2_key.smac, sizeof(flow->l2_key.smac)) &&
1054 !is_exactmatch(flow->l2_mask.smac, sizeof(flow->l2_mask.smac))) {
1055 netdev_info(bp->dev, "Wildcard match unsupported for Source MAC\n");
1056 return false;
1057 }
1058 if (bits_set(&flow->l2_key.dmac, sizeof(flow->l2_key.dmac)) &&
1059 !is_exactmatch(&flow->l2_mask.dmac, sizeof(flow->l2_mask.dmac))) {
1060 netdev_info(bp->dev, "Wildcard match unsupported for Dest MAC\n");
1061 return false;
1062 }
1063
1064 /* Currently VLAN fields cannot be partial wildcard */
1065 if (bits_set(&flow->l2_key.inner_vlan_tci,
1066 sizeof(flow->l2_key.inner_vlan_tci)) &&
1067 !is_vlan_tci_allowed(flow->l2_mask.inner_vlan_tci,
1068 flow->l2_key.inner_vlan_tci)) {
1069 netdev_info(bp->dev, "Unsupported VLAN TCI\n");
1070 return false;
1071 }
1072 if (bits_set(&flow->l2_key.inner_vlan_tpid,
1073 sizeof(flow->l2_key.inner_vlan_tpid)) &&
1074 !is_exactmatch(&flow->l2_mask.inner_vlan_tpid,
1075 sizeof(flow->l2_mask.inner_vlan_tpid))) {
1076 netdev_info(bp->dev, "Wildcard match unsupported for VLAN TPID\n");
1077 return false;
1078 }
1079
1080 /* Currently Ethertype must be set */
1081 if (!is_exactmatch(&flow->l2_mask.ether_type,
1082 sizeof(flow->l2_mask.ether_type))) {
1083 netdev_info(bp->dev, "Wildcard match unsupported for Ethertype\n");
1084 return false;
1085 }
1086
1087 return true;
1088 }
1089
1090 /* Returns the final refcount of the node on success
1091 * or a -ve error code on failure
1092 */
bnxt_tc_put_tunnel_node(struct bnxt * bp,struct rhashtable * tunnel_table,struct rhashtable_params * ht_params,struct bnxt_tc_tunnel_node * tunnel_node)1093 static int bnxt_tc_put_tunnel_node(struct bnxt *bp,
1094 struct rhashtable *tunnel_table,
1095 struct rhashtable_params *ht_params,
1096 struct bnxt_tc_tunnel_node *tunnel_node)
1097 {
1098 int rc;
1099
1100 if (--tunnel_node->refcount == 0) {
1101 rc = rhashtable_remove_fast(tunnel_table, &tunnel_node->node,
1102 *ht_params);
1103 if (rc) {
1104 netdev_err(bp->dev, "rhashtable_remove_fast rc=%d\n", rc);
1105 rc = -1;
1106 }
1107 kfree_rcu(tunnel_node, rcu);
1108 return rc;
1109 } else {
1110 return tunnel_node->refcount;
1111 }
1112 }
1113
1114 /* Get (or add) either encap or decap tunnel node from/to the supplied
1115 * hash table.
1116 */
1117 static struct bnxt_tc_tunnel_node *
bnxt_tc_get_tunnel_node(struct bnxt * bp,struct rhashtable * tunnel_table,struct rhashtable_params * ht_params,struct ip_tunnel_key * tun_key)1118 bnxt_tc_get_tunnel_node(struct bnxt *bp, struct rhashtable *tunnel_table,
1119 struct rhashtable_params *ht_params,
1120 struct ip_tunnel_key *tun_key)
1121 {
1122 struct bnxt_tc_tunnel_node *tunnel_node;
1123 int rc;
1124
1125 tunnel_node = rhashtable_lookup_fast(tunnel_table, tun_key, *ht_params);
1126 if (!tunnel_node) {
1127 tunnel_node = kzalloc(sizeof(*tunnel_node), GFP_KERNEL);
1128 if (!tunnel_node) {
1129 rc = -ENOMEM;
1130 goto err;
1131 }
1132
1133 tunnel_node->key = *tun_key;
1134 tunnel_node->tunnel_handle = INVALID_TUNNEL_HANDLE;
1135 rc = rhashtable_insert_fast(tunnel_table, &tunnel_node->node,
1136 *ht_params);
1137 if (rc) {
1138 kfree_rcu(tunnel_node, rcu);
1139 goto err;
1140 }
1141 }
1142 tunnel_node->refcount++;
1143 return tunnel_node;
1144 err:
1145 netdev_info(bp->dev, "error rc=%d\n", rc);
1146 return NULL;
1147 }
1148
bnxt_tc_get_ref_decap_handle(struct bnxt * bp,struct bnxt_tc_flow * flow,struct bnxt_tc_l2_key * l2_key,struct bnxt_tc_flow_node * flow_node,__le32 * ref_decap_handle)1149 static int bnxt_tc_get_ref_decap_handle(struct bnxt *bp,
1150 struct bnxt_tc_flow *flow,
1151 struct bnxt_tc_l2_key *l2_key,
1152 struct bnxt_tc_flow_node *flow_node,
1153 __le32 *ref_decap_handle)
1154 {
1155 struct bnxt_tc_info *tc_info = bp->tc_info;
1156 struct bnxt_tc_flow_node *ref_flow_node;
1157 struct bnxt_tc_l2_node *decap_l2_node;
1158
1159 decap_l2_node = bnxt_tc_get_l2_node(bp, &tc_info->decap_l2_table,
1160 tc_info->decap_l2_ht_params,
1161 l2_key);
1162 if (!decap_l2_node)
1163 return -1;
1164
1165 /* If any other flow is using this decap_l2_node, use it's decap_handle
1166 * as the ref_decap_handle
1167 */
1168 if (decap_l2_node->refcount > 0) {
1169 ref_flow_node =
1170 list_first_entry(&decap_l2_node->common_l2_flows,
1171 struct bnxt_tc_flow_node,
1172 decap_l2_list_node);
1173 *ref_decap_handle = ref_flow_node->decap_node->tunnel_handle;
1174 } else {
1175 *ref_decap_handle = INVALID_TUNNEL_HANDLE;
1176 }
1177
1178 /* Insert the l2_node into the flow_node so that subsequent flows
1179 * with a matching decap l2 key can use the decap_filter_handle of
1180 * this flow as their ref_decap_handle
1181 */
1182 flow_node->decap_l2_node = decap_l2_node;
1183 list_add(&flow_node->decap_l2_list_node,
1184 &decap_l2_node->common_l2_flows);
1185 decap_l2_node->refcount++;
1186 return 0;
1187 }
1188
bnxt_tc_put_decap_l2_node(struct bnxt * bp,struct bnxt_tc_flow_node * flow_node)1189 static void bnxt_tc_put_decap_l2_node(struct bnxt *bp,
1190 struct bnxt_tc_flow_node *flow_node)
1191 {
1192 struct bnxt_tc_l2_node *decap_l2_node = flow_node->decap_l2_node;
1193 struct bnxt_tc_info *tc_info = bp->tc_info;
1194 int rc;
1195
1196 /* remove flow_node from the decap L2 sharing flow list */
1197 list_del(&flow_node->decap_l2_list_node);
1198 if (--decap_l2_node->refcount == 0) {
1199 rc = rhashtable_remove_fast(&tc_info->decap_l2_table,
1200 &decap_l2_node->node,
1201 tc_info->decap_l2_ht_params);
1202 if (rc)
1203 netdev_err(bp->dev, "rhashtable_remove_fast rc=%d\n", rc);
1204 kfree_rcu(decap_l2_node, rcu);
1205 }
1206 }
1207
bnxt_tc_put_decap_handle(struct bnxt * bp,struct bnxt_tc_flow_node * flow_node)1208 static void bnxt_tc_put_decap_handle(struct bnxt *bp,
1209 struct bnxt_tc_flow_node *flow_node)
1210 {
1211 __le32 decap_handle = flow_node->decap_node->tunnel_handle;
1212 struct bnxt_tc_info *tc_info = bp->tc_info;
1213 int rc;
1214
1215 if (flow_node->decap_l2_node)
1216 bnxt_tc_put_decap_l2_node(bp, flow_node);
1217
1218 rc = bnxt_tc_put_tunnel_node(bp, &tc_info->decap_table,
1219 &tc_info->decap_ht_params,
1220 flow_node->decap_node);
1221 if (!rc && decap_handle != INVALID_TUNNEL_HANDLE)
1222 hwrm_cfa_decap_filter_free(bp, decap_handle);
1223 }
1224
bnxt_tc_resolve_tunnel_hdrs(struct bnxt * bp,struct ip_tunnel_key * tun_key,struct bnxt_tc_l2_key * l2_info)1225 static int bnxt_tc_resolve_tunnel_hdrs(struct bnxt *bp,
1226 struct ip_tunnel_key *tun_key,
1227 struct bnxt_tc_l2_key *l2_info)
1228 {
1229 #ifdef CONFIG_INET
1230 struct net_device *real_dst_dev = bp->dev;
1231 struct flowi4 flow = { {0} };
1232 struct net_device *dst_dev;
1233 struct neighbour *nbr;
1234 struct rtable *rt;
1235 int rc;
1236
1237 flow.flowi4_proto = IPPROTO_UDP;
1238 flow.fl4_dport = tun_key->tp_dst;
1239 flow.daddr = tun_key->u.ipv4.dst;
1240
1241 rt = ip_route_output_key(dev_net(real_dst_dev), &flow);
1242 if (IS_ERR(rt)) {
1243 netdev_info(bp->dev, "no route to %pI4b\n", &flow.daddr);
1244 return -EOPNOTSUPP;
1245 }
1246
1247 /* The route must either point to the real_dst_dev or a dst_dev that
1248 * uses the real_dst_dev.
1249 */
1250 dst_dev = rt->dst.dev;
1251 if (is_vlan_dev(dst_dev)) {
1252 #if IS_ENABLED(CONFIG_VLAN_8021Q)
1253 struct vlan_dev_priv *vlan = vlan_dev_priv(dst_dev);
1254
1255 if (vlan->real_dev != real_dst_dev) {
1256 netdev_info(bp->dev,
1257 "dst_dev(%s) doesn't use PF-if(%s)\n",
1258 netdev_name(dst_dev),
1259 netdev_name(real_dst_dev));
1260 rc = -EOPNOTSUPP;
1261 goto put_rt;
1262 }
1263 l2_info->inner_vlan_tci = htons(vlan->vlan_id);
1264 l2_info->inner_vlan_tpid = vlan->vlan_proto;
1265 l2_info->num_vlans = 1;
1266 #endif
1267 } else if (dst_dev != real_dst_dev) {
1268 netdev_info(bp->dev,
1269 "dst_dev(%s) for %pI4b is not PF-if(%s)\n",
1270 netdev_name(dst_dev), &flow.daddr,
1271 netdev_name(real_dst_dev));
1272 rc = -EOPNOTSUPP;
1273 goto put_rt;
1274 }
1275
1276 nbr = dst_neigh_lookup(&rt->dst, &flow.daddr);
1277 if (!nbr) {
1278 netdev_info(bp->dev, "can't lookup neighbor for %pI4b\n",
1279 &flow.daddr);
1280 rc = -EOPNOTSUPP;
1281 goto put_rt;
1282 }
1283
1284 tun_key->u.ipv4.src = flow.saddr;
1285 tun_key->ttl = ip4_dst_hoplimit(&rt->dst);
1286 neigh_ha_snapshot(l2_info->dmac, nbr, dst_dev);
1287 ether_addr_copy(l2_info->smac, dst_dev->dev_addr);
1288 neigh_release(nbr);
1289 ip_rt_put(rt);
1290
1291 return 0;
1292 put_rt:
1293 ip_rt_put(rt);
1294 return rc;
1295 #else
1296 return -EOPNOTSUPP;
1297 #endif
1298 }
1299
bnxt_tc_get_decap_handle(struct bnxt * bp,struct bnxt_tc_flow * flow,struct bnxt_tc_flow_node * flow_node,__le32 * decap_filter_handle)1300 static int bnxt_tc_get_decap_handle(struct bnxt *bp, struct bnxt_tc_flow *flow,
1301 struct bnxt_tc_flow_node *flow_node,
1302 __le32 *decap_filter_handle)
1303 {
1304 struct ip_tunnel_key *decap_key = &flow->tun_key;
1305 struct bnxt_tc_info *tc_info = bp->tc_info;
1306 struct bnxt_tc_l2_key l2_info = { {0} };
1307 struct bnxt_tc_tunnel_node *decap_node;
1308 struct ip_tunnel_key tun_key = { 0 };
1309 struct bnxt_tc_l2_key *decap_l2_info;
1310 __le32 ref_decap_handle;
1311 int rc;
1312
1313 /* Check if there's another flow using the same tunnel decap.
1314 * If not, add this tunnel to the table and resolve the other
1315 * tunnel header fileds. Ignore src_port in the tunnel_key,
1316 * since it is not required for decap filters.
1317 */
1318 decap_key->tp_src = 0;
1319 decap_node = bnxt_tc_get_tunnel_node(bp, &tc_info->decap_table,
1320 &tc_info->decap_ht_params,
1321 decap_key);
1322 if (!decap_node)
1323 return -ENOMEM;
1324
1325 flow_node->decap_node = decap_node;
1326
1327 if (decap_node->tunnel_handle != INVALID_TUNNEL_HANDLE)
1328 goto done;
1329
1330 /* Resolve the L2 fields for tunnel decap
1331 * Resolve the route for remote vtep (saddr) of the decap key
1332 * Find it's next-hop mac addrs
1333 */
1334 tun_key.u.ipv4.dst = flow->tun_key.u.ipv4.src;
1335 tun_key.tp_dst = flow->tun_key.tp_dst;
1336 rc = bnxt_tc_resolve_tunnel_hdrs(bp, &tun_key, &l2_info);
1337 if (rc)
1338 goto put_decap;
1339
1340 decap_l2_info = &decap_node->l2_info;
1341 /* decap smac is wildcarded */
1342 ether_addr_copy(decap_l2_info->dmac, l2_info.smac);
1343 if (l2_info.num_vlans) {
1344 decap_l2_info->num_vlans = l2_info.num_vlans;
1345 decap_l2_info->inner_vlan_tpid = l2_info.inner_vlan_tpid;
1346 decap_l2_info->inner_vlan_tci = l2_info.inner_vlan_tci;
1347 }
1348 flow->flags |= BNXT_TC_FLOW_FLAGS_TUNL_ETH_ADDRS;
1349
1350 /* For getting a decap_filter_handle we first need to check if
1351 * there are any other decap flows that share the same tunnel L2
1352 * key and if so, pass that flow's decap_filter_handle as the
1353 * ref_decap_handle for this flow.
1354 */
1355 rc = bnxt_tc_get_ref_decap_handle(bp, flow, decap_l2_info, flow_node,
1356 &ref_decap_handle);
1357 if (rc)
1358 goto put_decap;
1359
1360 /* Issue the hwrm cmd to allocate a decap filter handle */
1361 rc = hwrm_cfa_decap_filter_alloc(bp, flow, decap_l2_info,
1362 ref_decap_handle,
1363 &decap_node->tunnel_handle);
1364 if (rc)
1365 goto put_decap_l2;
1366
1367 done:
1368 *decap_filter_handle = decap_node->tunnel_handle;
1369 return 0;
1370
1371 put_decap_l2:
1372 bnxt_tc_put_decap_l2_node(bp, flow_node);
1373 put_decap:
1374 bnxt_tc_put_tunnel_node(bp, &tc_info->decap_table,
1375 &tc_info->decap_ht_params,
1376 flow_node->decap_node);
1377 return rc;
1378 }
1379
bnxt_tc_put_encap_handle(struct bnxt * bp,struct bnxt_tc_tunnel_node * encap_node)1380 static void bnxt_tc_put_encap_handle(struct bnxt *bp,
1381 struct bnxt_tc_tunnel_node *encap_node)
1382 {
1383 __le32 encap_handle = encap_node->tunnel_handle;
1384 struct bnxt_tc_info *tc_info = bp->tc_info;
1385 int rc;
1386
1387 rc = bnxt_tc_put_tunnel_node(bp, &tc_info->encap_table,
1388 &tc_info->encap_ht_params, encap_node);
1389 if (!rc && encap_handle != INVALID_TUNNEL_HANDLE)
1390 hwrm_cfa_encap_record_free(bp, encap_handle);
1391 }
1392
1393 /* Lookup the tunnel encap table and check if there's an encap_handle
1394 * alloc'd already.
1395 * If not, query L2 info via a route lookup and issue an encap_record_alloc
1396 * cmd to FW.
1397 */
bnxt_tc_get_encap_handle(struct bnxt * bp,struct bnxt_tc_flow * flow,struct bnxt_tc_flow_node * flow_node,__le32 * encap_handle)1398 static int bnxt_tc_get_encap_handle(struct bnxt *bp, struct bnxt_tc_flow *flow,
1399 struct bnxt_tc_flow_node *flow_node,
1400 __le32 *encap_handle)
1401 {
1402 struct ip_tunnel_key *encap_key = &flow->actions.tun_encap_key;
1403 struct bnxt_tc_info *tc_info = bp->tc_info;
1404 struct bnxt_tc_tunnel_node *encap_node;
1405 int rc;
1406
1407 /* Check if there's another flow using the same tunnel encap.
1408 * If not, add this tunnel to the table and resolve the other
1409 * tunnel header fileds
1410 */
1411 encap_node = bnxt_tc_get_tunnel_node(bp, &tc_info->encap_table,
1412 &tc_info->encap_ht_params,
1413 encap_key);
1414 if (!encap_node)
1415 return -ENOMEM;
1416
1417 flow_node->encap_node = encap_node;
1418
1419 if (encap_node->tunnel_handle != INVALID_TUNNEL_HANDLE)
1420 goto done;
1421
1422 rc = bnxt_tc_resolve_tunnel_hdrs(bp, encap_key, &encap_node->l2_info);
1423 if (rc)
1424 goto put_encap;
1425
1426 /* Allocate a new tunnel encap record */
1427 rc = hwrm_cfa_encap_record_alloc(bp, encap_key, &encap_node->l2_info,
1428 &encap_node->tunnel_handle);
1429 if (rc)
1430 goto put_encap;
1431
1432 done:
1433 *encap_handle = encap_node->tunnel_handle;
1434 return 0;
1435
1436 put_encap:
1437 bnxt_tc_put_tunnel_node(bp, &tc_info->encap_table,
1438 &tc_info->encap_ht_params, encap_node);
1439 return rc;
1440 }
1441
bnxt_tc_put_tunnel_handle(struct bnxt * bp,struct bnxt_tc_flow * flow,struct bnxt_tc_flow_node * flow_node)1442 static void bnxt_tc_put_tunnel_handle(struct bnxt *bp,
1443 struct bnxt_tc_flow *flow,
1444 struct bnxt_tc_flow_node *flow_node)
1445 {
1446 if (flow->actions.flags & BNXT_TC_ACTION_FLAG_TUNNEL_DECAP)
1447 bnxt_tc_put_decap_handle(bp, flow_node);
1448 else if (flow->actions.flags & BNXT_TC_ACTION_FLAG_TUNNEL_ENCAP)
1449 bnxt_tc_put_encap_handle(bp, flow_node->encap_node);
1450 }
1451
bnxt_tc_get_tunnel_handle(struct bnxt * bp,struct bnxt_tc_flow * flow,struct bnxt_tc_flow_node * flow_node,__le32 * tunnel_handle)1452 static int bnxt_tc_get_tunnel_handle(struct bnxt *bp,
1453 struct bnxt_tc_flow *flow,
1454 struct bnxt_tc_flow_node *flow_node,
1455 __le32 *tunnel_handle)
1456 {
1457 if (flow->actions.flags & BNXT_TC_ACTION_FLAG_TUNNEL_DECAP)
1458 return bnxt_tc_get_decap_handle(bp, flow, flow_node,
1459 tunnel_handle);
1460 else if (flow->actions.flags & BNXT_TC_ACTION_FLAG_TUNNEL_ENCAP)
1461 return bnxt_tc_get_encap_handle(bp, flow, flow_node,
1462 tunnel_handle);
1463 else
1464 return 0;
1465 }
__bnxt_tc_del_flow(struct bnxt * bp,struct bnxt_tc_flow_node * flow_node)1466 static int __bnxt_tc_del_flow(struct bnxt *bp,
1467 struct bnxt_tc_flow_node *flow_node)
1468 {
1469 struct bnxt_tc_info *tc_info = bp->tc_info;
1470 int rc;
1471
1472 /* send HWRM cmd to free the flow-id */
1473 bnxt_hwrm_cfa_flow_free(bp, flow_node);
1474
1475 mutex_lock(&tc_info->lock);
1476
1477 /* release references to any tunnel encap/decap nodes */
1478 bnxt_tc_put_tunnel_handle(bp, &flow_node->flow, flow_node);
1479
1480 /* release reference to l2 node */
1481 bnxt_tc_put_l2_node(bp, flow_node);
1482
1483 mutex_unlock(&tc_info->lock);
1484
1485 rc = rhashtable_remove_fast(&tc_info->flow_table, &flow_node->node,
1486 tc_info->flow_ht_params);
1487 if (rc)
1488 netdev_err(bp->dev, "Error: %s: rhashtable_remove_fast rc=%d\n",
1489 __func__, rc);
1490
1491 kfree_rcu(flow_node, rcu);
1492 return 0;
1493 }
1494
bnxt_tc_set_flow_dir(struct bnxt * bp,struct bnxt_tc_flow * flow,u16 src_fid)1495 static void bnxt_tc_set_flow_dir(struct bnxt *bp, struct bnxt_tc_flow *flow,
1496 u16 src_fid)
1497 {
1498 flow->l2_key.dir = (bp->pf.fw_fid == src_fid) ? BNXT_DIR_RX : BNXT_DIR_TX;
1499 }
1500
bnxt_tc_set_src_fid(struct bnxt * bp,struct bnxt_tc_flow * flow,u16 src_fid)1501 static void bnxt_tc_set_src_fid(struct bnxt *bp, struct bnxt_tc_flow *flow,
1502 u16 src_fid)
1503 {
1504 if (flow->actions.flags & BNXT_TC_ACTION_FLAG_TUNNEL_DECAP)
1505 flow->src_fid = bp->pf.fw_fid;
1506 else
1507 flow->src_fid = src_fid;
1508 }
1509
1510 /* Add a new flow or replace an existing flow.
1511 * Notes on locking:
1512 * There are essentially two critical sections here.
1513 * 1. while adding a new flow
1514 * a) lookup l2-key
1515 * b) issue HWRM cmd and get flow_handle
1516 * c) link l2-key with flow
1517 * 2. while deleting a flow
1518 * a) unlinking l2-key from flow
1519 * A lock is needed to protect these two critical sections.
1520 *
1521 * The hash-tables are already protected by the rhashtable API.
1522 */
bnxt_tc_add_flow(struct bnxt * bp,u16 src_fid,struct flow_cls_offload * tc_flow_cmd)1523 static int bnxt_tc_add_flow(struct bnxt *bp, u16 src_fid,
1524 struct flow_cls_offload *tc_flow_cmd)
1525 {
1526 struct bnxt_tc_flow_node *new_node, *old_node;
1527 struct bnxt_tc_info *tc_info = bp->tc_info;
1528 struct bnxt_tc_flow *flow;
1529 __le32 tunnel_handle = 0;
1530 __le16 ref_flow_handle;
1531 int rc;
1532
1533 /* allocate memory for the new flow and it's node */
1534 new_node = kzalloc(sizeof(*new_node), GFP_KERNEL);
1535 if (!new_node) {
1536 rc = -ENOMEM;
1537 goto done;
1538 }
1539 new_node->cookie = tc_flow_cmd->cookie;
1540 flow = &new_node->flow;
1541
1542 rc = bnxt_tc_parse_flow(bp, tc_flow_cmd, flow);
1543 if (rc)
1544 goto free_node;
1545
1546 bnxt_tc_set_src_fid(bp, flow, src_fid);
1547 bnxt_tc_set_flow_dir(bp, flow, flow->src_fid);
1548
1549 if (!bnxt_tc_can_offload(bp, flow)) {
1550 rc = -EOPNOTSUPP;
1551 kfree_rcu(new_node, rcu);
1552 return rc;
1553 }
1554
1555 /* If a flow exists with the same cookie, delete it */
1556 old_node = rhashtable_lookup_fast(&tc_info->flow_table,
1557 &tc_flow_cmd->cookie,
1558 tc_info->flow_ht_params);
1559 if (old_node)
1560 __bnxt_tc_del_flow(bp, old_node);
1561
1562 /* Check if the L2 part of the flow has been offloaded already.
1563 * If so, bump up it's refcnt and get it's reference handle.
1564 */
1565 mutex_lock(&tc_info->lock);
1566 rc = bnxt_tc_get_ref_flow_handle(bp, flow, new_node, &ref_flow_handle);
1567 if (rc)
1568 goto unlock;
1569
1570 /* If the flow involves tunnel encap/decap, get tunnel_handle */
1571 rc = bnxt_tc_get_tunnel_handle(bp, flow, new_node, &tunnel_handle);
1572 if (rc)
1573 goto put_l2;
1574
1575 /* send HWRM cmd to alloc the flow */
1576 rc = bnxt_hwrm_cfa_flow_alloc(bp, flow, ref_flow_handle,
1577 tunnel_handle, new_node);
1578 if (rc)
1579 goto put_tunnel;
1580
1581 flow->lastused = jiffies;
1582 spin_lock_init(&flow->stats_lock);
1583 /* add new flow to flow-table */
1584 rc = rhashtable_insert_fast(&tc_info->flow_table, &new_node->node,
1585 tc_info->flow_ht_params);
1586 if (rc)
1587 goto hwrm_flow_free;
1588
1589 mutex_unlock(&tc_info->lock);
1590 return 0;
1591
1592 hwrm_flow_free:
1593 bnxt_hwrm_cfa_flow_free(bp, new_node);
1594 put_tunnel:
1595 bnxt_tc_put_tunnel_handle(bp, flow, new_node);
1596 put_l2:
1597 bnxt_tc_put_l2_node(bp, new_node);
1598 unlock:
1599 mutex_unlock(&tc_info->lock);
1600 free_node:
1601 kfree_rcu(new_node, rcu);
1602 done:
1603 netdev_err(bp->dev, "Error: %s: cookie=0x%lx error=%d\n",
1604 __func__, tc_flow_cmd->cookie, rc);
1605 return rc;
1606 }
1607
bnxt_tc_del_flow(struct bnxt * bp,struct flow_cls_offload * tc_flow_cmd)1608 static int bnxt_tc_del_flow(struct bnxt *bp,
1609 struct flow_cls_offload *tc_flow_cmd)
1610 {
1611 struct bnxt_tc_info *tc_info = bp->tc_info;
1612 struct bnxt_tc_flow_node *flow_node;
1613
1614 flow_node = rhashtable_lookup_fast(&tc_info->flow_table,
1615 &tc_flow_cmd->cookie,
1616 tc_info->flow_ht_params);
1617 if (!flow_node)
1618 return -EINVAL;
1619
1620 return __bnxt_tc_del_flow(bp, flow_node);
1621 }
1622
bnxt_tc_get_flow_stats(struct bnxt * bp,struct flow_cls_offload * tc_flow_cmd)1623 static int bnxt_tc_get_flow_stats(struct bnxt *bp,
1624 struct flow_cls_offload *tc_flow_cmd)
1625 {
1626 struct bnxt_tc_flow_stats stats, *curr_stats, *prev_stats;
1627 struct bnxt_tc_info *tc_info = bp->tc_info;
1628 struct bnxt_tc_flow_node *flow_node;
1629 struct bnxt_tc_flow *flow;
1630 unsigned long lastused;
1631
1632 flow_node = rhashtable_lookup_fast(&tc_info->flow_table,
1633 &tc_flow_cmd->cookie,
1634 tc_info->flow_ht_params);
1635 if (!flow_node)
1636 return -1;
1637
1638 flow = &flow_node->flow;
1639 curr_stats = &flow->stats;
1640 prev_stats = &flow->prev_stats;
1641
1642 spin_lock(&flow->stats_lock);
1643 stats.packets = curr_stats->packets - prev_stats->packets;
1644 stats.bytes = curr_stats->bytes - prev_stats->bytes;
1645 *prev_stats = *curr_stats;
1646 lastused = flow->lastused;
1647 spin_unlock(&flow->stats_lock);
1648
1649 flow_stats_update(&tc_flow_cmd->stats, stats.bytes, stats.packets, 0,
1650 lastused, FLOW_ACTION_HW_STATS_DELAYED);
1651 return 0;
1652 }
1653
bnxt_fill_cfa_stats_req(struct bnxt * bp,struct bnxt_tc_flow_node * flow_node,__le16 * flow_handle,__le32 * flow_id)1654 static void bnxt_fill_cfa_stats_req(struct bnxt *bp,
1655 struct bnxt_tc_flow_node *flow_node,
1656 __le16 *flow_handle, __le32 *flow_id)
1657 {
1658 u16 handle;
1659
1660 if (bp->fw_cap & BNXT_FW_CAP_OVS_64BIT_HANDLE) {
1661 *flow_id = flow_node->flow_id;
1662
1663 /* If flow_id is used to fetch flow stats then:
1664 * 1. lower 12 bits of flow_handle must be set to all 1s.
1665 * 2. 15th bit of flow_handle must specify the flow
1666 * direction (TX/RX).
1667 */
1668 if (flow_node->flow.l2_key.dir == BNXT_DIR_RX)
1669 handle = CFA_FLOW_INFO_REQ_FLOW_HANDLE_DIR_RX |
1670 CFA_FLOW_INFO_REQ_FLOW_HANDLE_MAX_MASK;
1671 else
1672 handle = CFA_FLOW_INFO_REQ_FLOW_HANDLE_MAX_MASK;
1673
1674 *flow_handle = cpu_to_le16(handle);
1675 } else {
1676 *flow_handle = flow_node->flow_handle;
1677 }
1678 }
1679
1680 static int
bnxt_hwrm_cfa_flow_stats_get(struct bnxt * bp,int num_flows,struct bnxt_tc_stats_batch stats_batch[])1681 bnxt_hwrm_cfa_flow_stats_get(struct bnxt *bp, int num_flows,
1682 struct bnxt_tc_stats_batch stats_batch[])
1683 {
1684 struct hwrm_cfa_flow_stats_output *resp;
1685 struct hwrm_cfa_flow_stats_input *req;
1686 __le16 *req_flow_handles;
1687 __le32 *req_flow_ids;
1688 int rc, i;
1689
1690 rc = hwrm_req_init(bp, req, HWRM_CFA_FLOW_STATS);
1691 if (rc)
1692 goto exit;
1693
1694 req_flow_handles = &req->flow_handle_0;
1695 req_flow_ids = &req->flow_id_0;
1696
1697 req->num_flows = cpu_to_le16(num_flows);
1698 for (i = 0; i < num_flows; i++) {
1699 struct bnxt_tc_flow_node *flow_node = stats_batch[i].flow_node;
1700
1701 bnxt_fill_cfa_stats_req(bp, flow_node,
1702 &req_flow_handles[i], &req_flow_ids[i]);
1703 }
1704
1705 resp = hwrm_req_hold(bp, req);
1706 rc = hwrm_req_send(bp, req);
1707 if (!rc) {
1708 __le64 *resp_packets;
1709 __le64 *resp_bytes;
1710
1711 resp_packets = &resp->packet_0;
1712 resp_bytes = &resp->byte_0;
1713
1714 for (i = 0; i < num_flows; i++) {
1715 stats_batch[i].hw_stats.packets =
1716 le64_to_cpu(resp_packets[i]);
1717 stats_batch[i].hw_stats.bytes =
1718 le64_to_cpu(resp_bytes[i]);
1719 }
1720 }
1721 hwrm_req_drop(bp, req);
1722 exit:
1723 if (rc)
1724 netdev_info(bp->dev, "error rc=%d\n", rc);
1725
1726 return rc;
1727 }
1728
1729 /* Add val to accum while handling a possible wraparound
1730 * of val. Eventhough val is of type u64, its actual width
1731 * is denoted by mask and will wrap-around beyond that width.
1732 */
accumulate_val(u64 * accum,u64 val,u64 mask)1733 static void accumulate_val(u64 *accum, u64 val, u64 mask)
1734 {
1735 #define low_bits(x, mask) ((x) & (mask))
1736 #define high_bits(x, mask) ((x) & ~(mask))
1737 bool wrapped = val < low_bits(*accum, mask);
1738
1739 *accum = high_bits(*accum, mask) + val;
1740 if (wrapped)
1741 *accum += (mask + 1);
1742 }
1743
1744 /* The HW counters' width is much less than 64bits.
1745 * Handle possible wrap-around while updating the stat counters
1746 */
bnxt_flow_stats_accum(struct bnxt_tc_info * tc_info,struct bnxt_tc_flow_stats * acc_stats,struct bnxt_tc_flow_stats * hw_stats)1747 static void bnxt_flow_stats_accum(struct bnxt_tc_info *tc_info,
1748 struct bnxt_tc_flow_stats *acc_stats,
1749 struct bnxt_tc_flow_stats *hw_stats)
1750 {
1751 accumulate_val(&acc_stats->bytes, hw_stats->bytes, tc_info->bytes_mask);
1752 accumulate_val(&acc_stats->packets, hw_stats->packets,
1753 tc_info->packets_mask);
1754 }
1755
1756 static int
bnxt_tc_flow_stats_batch_update(struct bnxt * bp,int num_flows,struct bnxt_tc_stats_batch stats_batch[])1757 bnxt_tc_flow_stats_batch_update(struct bnxt *bp, int num_flows,
1758 struct bnxt_tc_stats_batch stats_batch[])
1759 {
1760 struct bnxt_tc_info *tc_info = bp->tc_info;
1761 int rc, i;
1762
1763 rc = bnxt_hwrm_cfa_flow_stats_get(bp, num_flows, stats_batch);
1764 if (rc)
1765 return rc;
1766
1767 for (i = 0; i < num_flows; i++) {
1768 struct bnxt_tc_flow_node *flow_node = stats_batch[i].flow_node;
1769 struct bnxt_tc_flow *flow = &flow_node->flow;
1770
1771 spin_lock(&flow->stats_lock);
1772 bnxt_flow_stats_accum(tc_info, &flow->stats,
1773 &stats_batch[i].hw_stats);
1774 if (flow->stats.packets != flow->prev_stats.packets)
1775 flow->lastused = jiffies;
1776 spin_unlock(&flow->stats_lock);
1777 }
1778
1779 return 0;
1780 }
1781
1782 static int
bnxt_tc_flow_stats_batch_prep(struct bnxt * bp,struct bnxt_tc_stats_batch stats_batch[],int * num_flows)1783 bnxt_tc_flow_stats_batch_prep(struct bnxt *bp,
1784 struct bnxt_tc_stats_batch stats_batch[],
1785 int *num_flows)
1786 {
1787 struct bnxt_tc_info *tc_info = bp->tc_info;
1788 struct rhashtable_iter *iter = &tc_info->iter;
1789 void *flow_node;
1790 int rc, i;
1791
1792 rhashtable_walk_start(iter);
1793
1794 rc = 0;
1795 for (i = 0; i < BNXT_FLOW_STATS_BATCH_MAX; i++) {
1796 flow_node = rhashtable_walk_next(iter);
1797 if (IS_ERR(flow_node)) {
1798 i = 0;
1799 if (PTR_ERR(flow_node) == -EAGAIN) {
1800 continue;
1801 } else {
1802 rc = PTR_ERR(flow_node);
1803 goto done;
1804 }
1805 }
1806
1807 /* No more flows */
1808 if (!flow_node)
1809 goto done;
1810
1811 stats_batch[i].flow_node = flow_node;
1812 }
1813 done:
1814 rhashtable_walk_stop(iter);
1815 *num_flows = i;
1816 return rc;
1817 }
1818
bnxt_tc_flow_stats_work(struct bnxt * bp)1819 void bnxt_tc_flow_stats_work(struct bnxt *bp)
1820 {
1821 struct bnxt_tc_info *tc_info = bp->tc_info;
1822 int num_flows, rc;
1823
1824 num_flows = atomic_read(&tc_info->flow_table.nelems);
1825 if (!num_flows)
1826 return;
1827
1828 rhashtable_walk_enter(&tc_info->flow_table, &tc_info->iter);
1829
1830 for (;;) {
1831 rc = bnxt_tc_flow_stats_batch_prep(bp, tc_info->stats_batch,
1832 &num_flows);
1833 if (rc) {
1834 if (rc == -EAGAIN)
1835 continue;
1836 break;
1837 }
1838
1839 if (!num_flows)
1840 break;
1841
1842 bnxt_tc_flow_stats_batch_update(bp, num_flows,
1843 tc_info->stats_batch);
1844 }
1845
1846 rhashtable_walk_exit(&tc_info->iter);
1847 }
1848
bnxt_tc_setup_flower(struct bnxt * bp,u16 src_fid,struct flow_cls_offload * cls_flower)1849 int bnxt_tc_setup_flower(struct bnxt *bp, u16 src_fid,
1850 struct flow_cls_offload *cls_flower)
1851 {
1852 switch (cls_flower->command) {
1853 case FLOW_CLS_REPLACE:
1854 return bnxt_tc_add_flow(bp, src_fid, cls_flower);
1855 case FLOW_CLS_DESTROY:
1856 return bnxt_tc_del_flow(bp, cls_flower);
1857 case FLOW_CLS_STATS:
1858 return bnxt_tc_get_flow_stats(bp, cls_flower);
1859 default:
1860 return -EOPNOTSUPP;
1861 }
1862 }
1863
bnxt_tc_setup_indr_block_cb(enum tc_setup_type type,void * type_data,void * cb_priv)1864 static int bnxt_tc_setup_indr_block_cb(enum tc_setup_type type,
1865 void *type_data, void *cb_priv)
1866 {
1867 struct bnxt_flower_indr_block_cb_priv *priv = cb_priv;
1868 struct flow_cls_offload *flower = type_data;
1869 struct bnxt *bp = priv->bp;
1870
1871 if (!tc_cls_can_offload_and_chain0(bp->dev, type_data))
1872 return -EOPNOTSUPP;
1873
1874 switch (type) {
1875 case TC_SETUP_CLSFLOWER:
1876 return bnxt_tc_setup_flower(bp, bp->pf.fw_fid, flower);
1877 default:
1878 return -EOPNOTSUPP;
1879 }
1880 }
1881
1882 static struct bnxt_flower_indr_block_cb_priv *
bnxt_tc_indr_block_cb_lookup(struct bnxt * bp,struct net_device * netdev)1883 bnxt_tc_indr_block_cb_lookup(struct bnxt *bp, struct net_device *netdev)
1884 {
1885 struct bnxt_flower_indr_block_cb_priv *cb_priv;
1886
1887 list_for_each_entry(cb_priv, &bp->tc_indr_block_list, list)
1888 if (cb_priv->tunnel_netdev == netdev)
1889 return cb_priv;
1890
1891 return NULL;
1892 }
1893
bnxt_tc_setup_indr_rel(void * cb_priv)1894 static void bnxt_tc_setup_indr_rel(void *cb_priv)
1895 {
1896 struct bnxt_flower_indr_block_cb_priv *priv = cb_priv;
1897
1898 list_del(&priv->list);
1899 kfree(priv);
1900 }
1901
bnxt_tc_setup_indr_block(struct net_device * netdev,struct Qdisc * sch,struct bnxt * bp,struct flow_block_offload * f,void * data,void (* cleanup)(struct flow_block_cb * block_cb))1902 static int bnxt_tc_setup_indr_block(struct net_device *netdev, struct Qdisc *sch, struct bnxt *bp,
1903 struct flow_block_offload *f, void *data,
1904 void (*cleanup)(struct flow_block_cb *block_cb))
1905 {
1906 struct bnxt_flower_indr_block_cb_priv *cb_priv;
1907 struct flow_block_cb *block_cb;
1908
1909 if (f->binder_type != FLOW_BLOCK_BINDER_TYPE_CLSACT_INGRESS)
1910 return -EOPNOTSUPP;
1911
1912 switch (f->command) {
1913 case FLOW_BLOCK_BIND:
1914 cb_priv = kmalloc(sizeof(*cb_priv), GFP_KERNEL);
1915 if (!cb_priv)
1916 return -ENOMEM;
1917
1918 cb_priv->tunnel_netdev = netdev;
1919 cb_priv->bp = bp;
1920 list_add(&cb_priv->list, &bp->tc_indr_block_list);
1921
1922 block_cb = flow_indr_block_cb_alloc(bnxt_tc_setup_indr_block_cb,
1923 cb_priv, cb_priv,
1924 bnxt_tc_setup_indr_rel, f,
1925 netdev, sch, data, bp, cleanup);
1926 if (IS_ERR(block_cb)) {
1927 list_del(&cb_priv->list);
1928 kfree(cb_priv);
1929 return PTR_ERR(block_cb);
1930 }
1931
1932 flow_block_cb_add(block_cb, f);
1933 list_add_tail(&block_cb->driver_list, &bnxt_block_cb_list);
1934 break;
1935 case FLOW_BLOCK_UNBIND:
1936 cb_priv = bnxt_tc_indr_block_cb_lookup(bp, netdev);
1937 if (!cb_priv)
1938 return -ENOENT;
1939
1940 block_cb = flow_block_cb_lookup(f->block,
1941 bnxt_tc_setup_indr_block_cb,
1942 cb_priv);
1943 if (!block_cb)
1944 return -ENOENT;
1945
1946 flow_indr_block_cb_remove(block_cb, f);
1947 list_del(&block_cb->driver_list);
1948 break;
1949 default:
1950 return -EOPNOTSUPP;
1951 }
1952 return 0;
1953 }
1954
bnxt_is_netdev_indr_offload(struct net_device * netdev)1955 static bool bnxt_is_netdev_indr_offload(struct net_device *netdev)
1956 {
1957 return netif_is_vxlan(netdev);
1958 }
1959
bnxt_tc_setup_indr_cb(struct net_device * netdev,struct Qdisc * sch,void * cb_priv,enum tc_setup_type type,void * type_data,void * data,void (* cleanup)(struct flow_block_cb * block_cb))1960 static int bnxt_tc_setup_indr_cb(struct net_device *netdev, struct Qdisc *sch, void *cb_priv,
1961 enum tc_setup_type type, void *type_data,
1962 void *data,
1963 void (*cleanup)(struct flow_block_cb *block_cb))
1964 {
1965 if (!netdev || !bnxt_is_netdev_indr_offload(netdev))
1966 return -EOPNOTSUPP;
1967
1968 switch (type) {
1969 case TC_SETUP_BLOCK:
1970 return bnxt_tc_setup_indr_block(netdev, sch, cb_priv, type_data, data, cleanup);
1971 default:
1972 break;
1973 }
1974
1975 return -EOPNOTSUPP;
1976 }
1977
1978 static const struct rhashtable_params bnxt_tc_flow_ht_params = {
1979 .head_offset = offsetof(struct bnxt_tc_flow_node, node),
1980 .key_offset = offsetof(struct bnxt_tc_flow_node, cookie),
1981 .key_len = sizeof(((struct bnxt_tc_flow_node *)0)->cookie),
1982 .automatic_shrinking = true
1983 };
1984
1985 static const struct rhashtable_params bnxt_tc_l2_ht_params = {
1986 .head_offset = offsetof(struct bnxt_tc_l2_node, node),
1987 .key_offset = offsetof(struct bnxt_tc_l2_node, key),
1988 .key_len = BNXT_TC_L2_KEY_LEN,
1989 .automatic_shrinking = true
1990 };
1991
1992 static const struct rhashtable_params bnxt_tc_decap_l2_ht_params = {
1993 .head_offset = offsetof(struct bnxt_tc_l2_node, node),
1994 .key_offset = offsetof(struct bnxt_tc_l2_node, key),
1995 .key_len = BNXT_TC_L2_KEY_LEN,
1996 .automatic_shrinking = true
1997 };
1998
1999 static const struct rhashtable_params bnxt_tc_tunnel_ht_params = {
2000 .head_offset = offsetof(struct bnxt_tc_tunnel_node, node),
2001 .key_offset = offsetof(struct bnxt_tc_tunnel_node, key),
2002 .key_len = sizeof(struct ip_tunnel_key),
2003 .automatic_shrinking = true
2004 };
2005
2006 /* convert counter width in bits to a mask */
2007 #define mask(width) ((u64)~0 >> (64 - (width)))
2008
bnxt_init_tc(struct bnxt * bp)2009 int bnxt_init_tc(struct bnxt *bp)
2010 {
2011 struct bnxt_tc_info *tc_info;
2012 int rc;
2013
2014 if (bp->hwrm_spec_code < 0x10803)
2015 return 0;
2016
2017 tc_info = kzalloc(sizeof(*tc_info), GFP_KERNEL);
2018 if (!tc_info)
2019 return -ENOMEM;
2020 mutex_init(&tc_info->lock);
2021
2022 /* Counter widths are programmed by FW */
2023 tc_info->bytes_mask = mask(36);
2024 tc_info->packets_mask = mask(28);
2025
2026 tc_info->flow_ht_params = bnxt_tc_flow_ht_params;
2027 rc = rhashtable_init(&tc_info->flow_table, &tc_info->flow_ht_params);
2028 if (rc)
2029 goto free_tc_info;
2030
2031 tc_info->l2_ht_params = bnxt_tc_l2_ht_params;
2032 rc = rhashtable_init(&tc_info->l2_table, &tc_info->l2_ht_params);
2033 if (rc)
2034 goto destroy_flow_table;
2035
2036 tc_info->decap_l2_ht_params = bnxt_tc_decap_l2_ht_params;
2037 rc = rhashtable_init(&tc_info->decap_l2_table,
2038 &tc_info->decap_l2_ht_params);
2039 if (rc)
2040 goto destroy_l2_table;
2041
2042 tc_info->decap_ht_params = bnxt_tc_tunnel_ht_params;
2043 rc = rhashtable_init(&tc_info->decap_table,
2044 &tc_info->decap_ht_params);
2045 if (rc)
2046 goto destroy_decap_l2_table;
2047
2048 tc_info->encap_ht_params = bnxt_tc_tunnel_ht_params;
2049 rc = rhashtable_init(&tc_info->encap_table,
2050 &tc_info->encap_ht_params);
2051 if (rc)
2052 goto destroy_decap_table;
2053
2054 tc_info->enabled = true;
2055 bp->dev->hw_features |= NETIF_F_HW_TC;
2056 bp->dev->features |= NETIF_F_HW_TC;
2057 bp->tc_info = tc_info;
2058
2059 /* init indirect block notifications */
2060 INIT_LIST_HEAD(&bp->tc_indr_block_list);
2061
2062 rc = flow_indr_dev_register(bnxt_tc_setup_indr_cb, bp);
2063 if (!rc)
2064 return 0;
2065
2066 rhashtable_destroy(&tc_info->encap_table);
2067
2068 destroy_decap_table:
2069 rhashtable_destroy(&tc_info->decap_table);
2070 destroy_decap_l2_table:
2071 rhashtable_destroy(&tc_info->decap_l2_table);
2072 destroy_l2_table:
2073 rhashtable_destroy(&tc_info->l2_table);
2074 destroy_flow_table:
2075 rhashtable_destroy(&tc_info->flow_table);
2076 free_tc_info:
2077 kfree(tc_info);
2078 bp->tc_info = NULL;
2079 return rc;
2080 }
2081
bnxt_shutdown_tc(struct bnxt * bp)2082 void bnxt_shutdown_tc(struct bnxt *bp)
2083 {
2084 struct bnxt_tc_info *tc_info = bp->tc_info;
2085
2086 if (!bnxt_tc_flower_enabled(bp))
2087 return;
2088
2089 flow_indr_dev_unregister(bnxt_tc_setup_indr_cb, bp,
2090 bnxt_tc_setup_indr_rel);
2091 rhashtable_destroy(&tc_info->flow_table);
2092 rhashtable_destroy(&tc_info->l2_table);
2093 rhashtable_destroy(&tc_info->decap_l2_table);
2094 rhashtable_destroy(&tc_info->decap_table);
2095 rhashtable_destroy(&tc_info->encap_table);
2096 kfree(tc_info);
2097 bp->tc_info = NULL;
2098 }
2099