1 /* 2 * Copyright (c) 2007 Mellanox Technologies. All rights reserved. 3 * 4 * This software is available to you under a choice of one of two 5 * licenses. You may choose to be licensed under the terms of the GNU 6 * General Public License (GPL) Version 2, available from the file 7 * COPYING in the main directory of this source tree, or the 8 * OpenIB.org BSD license below: 9 * 10 * Redistribution and use in source and binary forms, with or 11 * without modification, are permitted provided that the following 12 * conditions are met: 13 * 14 * - Redistributions of source code must retain the above 15 * copyright notice, this list of conditions and the following 16 * disclaimer. 17 * 18 * - Redistributions in binary form must reproduce the above 19 * copyright notice, this list of conditions and the following 20 * disclaimer in the documentation and/or other materials 21 * provided with the distribution. 22 * 23 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, 24 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF 25 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND 26 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS 27 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN 28 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN 29 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE 30 * SOFTWARE. 31 * 32 */ 33 34 #include <linux/etherdevice.h> 35 #include <linux/tcp.h> 36 #include <linux/if_vlan.h> 37 #include <linux/delay.h> 38 #include <linux/slab.h> 39 #include <linux/hash.h> 40 #include <net/ip.h> 41 #include <net/busy_poll.h> 42 #include <net/vxlan.h> 43 44 #include <linux/mlx4/driver.h> 45 #include <linux/mlx4/device.h> 46 #include <linux/mlx4/cmd.h> 47 #include <linux/mlx4/cq.h> 48 49 #include "mlx4_en.h" 50 #include "en_port.h" 51 52 int mlx4_en_setup_tc(struct net_device *dev, u8 up) 53 { 54 struct mlx4_en_priv *priv = netdev_priv(dev); 55 int i; 56 unsigned int offset = 0; 57 58 if (up && up != MLX4_EN_NUM_UP) 59 return -EINVAL; 60 61 netdev_set_num_tc(dev, up); 62 63 /* Partition Tx queues evenly amongst UP's */ 64 for (i = 0; i < up; i++) { 65 netdev_set_tc_queue(dev, i, priv->num_tx_rings_p_up, offset); 66 offset += priv->num_tx_rings_p_up; 67 } 68 69 return 0; 70 } 71 72 #ifdef CONFIG_NET_RX_BUSY_POLL 73 /* must be called with local_bh_disable()d */ 74 static int mlx4_en_low_latency_recv(struct napi_struct *napi) 75 { 76 struct mlx4_en_cq *cq = container_of(napi, struct mlx4_en_cq, napi); 77 struct net_device *dev = cq->dev; 78 struct mlx4_en_priv *priv = netdev_priv(dev); 79 struct mlx4_en_rx_ring *rx_ring = priv->rx_ring[cq->ring]; 80 int done; 81 82 if (!priv->port_up) 83 return LL_FLUSH_FAILED; 84 85 if (!mlx4_en_cq_lock_poll(cq)) 86 return LL_FLUSH_BUSY; 87 88 done = mlx4_en_process_rx_cq(dev, cq, 4); 89 if (likely(done)) 90 rx_ring->cleaned += done; 91 else 92 rx_ring->misses++; 93 94 mlx4_en_cq_unlock_poll(cq); 95 96 return done; 97 } 98 #endif /* CONFIG_NET_RX_BUSY_POLL */ 99 100 #ifdef CONFIG_RFS_ACCEL 101 102 struct mlx4_en_filter { 103 struct list_head next; 104 struct work_struct work; 105 106 u8 ip_proto; 107 __be32 src_ip; 108 __be32 dst_ip; 109 __be16 src_port; 110 __be16 dst_port; 111 112 int rxq_index; 113 struct mlx4_en_priv *priv; 114 u32 flow_id; /* RFS infrastructure id */ 115 int id; /* mlx4_en driver id */ 116 u64 reg_id; /* Flow steering API id */ 117 u8 activated; /* Used to prevent expiry before filter 118 * is attached 119 */ 120 struct hlist_node filter_chain; 121 }; 122 123 static void mlx4_en_filter_rfs_expire(struct mlx4_en_priv *priv); 124 125 static enum mlx4_net_trans_rule_id mlx4_ip_proto_to_trans_rule_id(u8 ip_proto) 126 { 127 switch (ip_proto) { 128 case IPPROTO_UDP: 129 return MLX4_NET_TRANS_RULE_ID_UDP; 130 case IPPROTO_TCP: 131 return MLX4_NET_TRANS_RULE_ID_TCP; 132 default: 133 return MLX4_NET_TRANS_RULE_NUM; 134 } 135 }; 136 137 static void mlx4_en_filter_work(struct work_struct *work) 138 { 139 struct mlx4_en_filter *filter = container_of(work, 140 struct mlx4_en_filter, 141 work); 142 struct mlx4_en_priv *priv = filter->priv; 143 struct mlx4_spec_list spec_tcp_udp = { 144 .id = mlx4_ip_proto_to_trans_rule_id(filter->ip_proto), 145 { 146 .tcp_udp = { 147 .dst_port = filter->dst_port, 148 .dst_port_msk = (__force __be16)-1, 149 .src_port = filter->src_port, 150 .src_port_msk = (__force __be16)-1, 151 }, 152 }, 153 }; 154 struct mlx4_spec_list spec_ip = { 155 .id = MLX4_NET_TRANS_RULE_ID_IPV4, 156 { 157 .ipv4 = { 158 .dst_ip = filter->dst_ip, 159 .dst_ip_msk = (__force __be32)-1, 160 .src_ip = filter->src_ip, 161 .src_ip_msk = (__force __be32)-1, 162 }, 163 }, 164 }; 165 struct mlx4_spec_list spec_eth = { 166 .id = MLX4_NET_TRANS_RULE_ID_ETH, 167 }; 168 struct mlx4_net_trans_rule rule = { 169 .list = LIST_HEAD_INIT(rule.list), 170 .queue_mode = MLX4_NET_TRANS_Q_LIFO, 171 .exclusive = 1, 172 .allow_loopback = 1, 173 .promisc_mode = MLX4_FS_REGULAR, 174 .port = priv->port, 175 .priority = MLX4_DOMAIN_RFS, 176 }; 177 int rc; 178 __be64 mac_mask = cpu_to_be64(MLX4_MAC_MASK << 16); 179 180 if (spec_tcp_udp.id >= MLX4_NET_TRANS_RULE_NUM) { 181 en_warn(priv, "RFS: ignoring unsupported ip protocol (%d)\n", 182 filter->ip_proto); 183 goto ignore; 184 } 185 list_add_tail(&spec_eth.list, &rule.list); 186 list_add_tail(&spec_ip.list, &rule.list); 187 list_add_tail(&spec_tcp_udp.list, &rule.list); 188 189 rule.qpn = priv->rss_map.qps[filter->rxq_index].qpn; 190 memcpy(spec_eth.eth.dst_mac, priv->dev->dev_addr, ETH_ALEN); 191 memcpy(spec_eth.eth.dst_mac_msk, &mac_mask, ETH_ALEN); 192 193 filter->activated = 0; 194 195 if (filter->reg_id) { 196 rc = mlx4_flow_detach(priv->mdev->dev, filter->reg_id); 197 if (rc && rc != -ENOENT) 198 en_err(priv, "Error detaching flow. rc = %d\n", rc); 199 } 200 201 rc = mlx4_flow_attach(priv->mdev->dev, &rule, &filter->reg_id); 202 if (rc) 203 en_err(priv, "Error attaching flow. err = %d\n", rc); 204 205 ignore: 206 mlx4_en_filter_rfs_expire(priv); 207 208 filter->activated = 1; 209 } 210 211 static inline struct hlist_head * 212 filter_hash_bucket(struct mlx4_en_priv *priv, __be32 src_ip, __be32 dst_ip, 213 __be16 src_port, __be16 dst_port) 214 { 215 unsigned long l; 216 int bucket_idx; 217 218 l = (__force unsigned long)src_port | 219 ((__force unsigned long)dst_port << 2); 220 l ^= (__force unsigned long)(src_ip ^ dst_ip); 221 222 bucket_idx = hash_long(l, MLX4_EN_FILTER_HASH_SHIFT); 223 224 return &priv->filter_hash[bucket_idx]; 225 } 226 227 static struct mlx4_en_filter * 228 mlx4_en_filter_alloc(struct mlx4_en_priv *priv, int rxq_index, __be32 src_ip, 229 __be32 dst_ip, u8 ip_proto, __be16 src_port, 230 __be16 dst_port, u32 flow_id) 231 { 232 struct mlx4_en_filter *filter = NULL; 233 234 filter = kzalloc(sizeof(struct mlx4_en_filter), GFP_ATOMIC); 235 if (!filter) 236 return NULL; 237 238 filter->priv = priv; 239 filter->rxq_index = rxq_index; 240 INIT_WORK(&filter->work, mlx4_en_filter_work); 241 242 filter->src_ip = src_ip; 243 filter->dst_ip = dst_ip; 244 filter->ip_proto = ip_proto; 245 filter->src_port = src_port; 246 filter->dst_port = dst_port; 247 248 filter->flow_id = flow_id; 249 250 filter->id = priv->last_filter_id++ % RPS_NO_FILTER; 251 252 list_add_tail(&filter->next, &priv->filters); 253 hlist_add_head(&filter->filter_chain, 254 filter_hash_bucket(priv, src_ip, dst_ip, src_port, 255 dst_port)); 256 257 return filter; 258 } 259 260 static void mlx4_en_filter_free(struct mlx4_en_filter *filter) 261 { 262 struct mlx4_en_priv *priv = filter->priv; 263 int rc; 264 265 list_del(&filter->next); 266 267 rc = mlx4_flow_detach(priv->mdev->dev, filter->reg_id); 268 if (rc && rc != -ENOENT) 269 en_err(priv, "Error detaching flow. rc = %d\n", rc); 270 271 kfree(filter); 272 } 273 274 static inline struct mlx4_en_filter * 275 mlx4_en_filter_find(struct mlx4_en_priv *priv, __be32 src_ip, __be32 dst_ip, 276 u8 ip_proto, __be16 src_port, __be16 dst_port) 277 { 278 struct mlx4_en_filter *filter; 279 struct mlx4_en_filter *ret = NULL; 280 281 hlist_for_each_entry(filter, 282 filter_hash_bucket(priv, src_ip, dst_ip, 283 src_port, dst_port), 284 filter_chain) { 285 if (filter->src_ip == src_ip && 286 filter->dst_ip == dst_ip && 287 filter->ip_proto == ip_proto && 288 filter->src_port == src_port && 289 filter->dst_port == dst_port) { 290 ret = filter; 291 break; 292 } 293 } 294 295 return ret; 296 } 297 298 static int 299 mlx4_en_filter_rfs(struct net_device *net_dev, const struct sk_buff *skb, 300 u16 rxq_index, u32 flow_id) 301 { 302 struct mlx4_en_priv *priv = netdev_priv(net_dev); 303 struct mlx4_en_filter *filter; 304 const struct iphdr *ip; 305 const __be16 *ports; 306 u8 ip_proto; 307 __be32 src_ip; 308 __be32 dst_ip; 309 __be16 src_port; 310 __be16 dst_port; 311 int nhoff = skb_network_offset(skb); 312 int ret = 0; 313 314 if (skb->protocol != htons(ETH_P_IP)) 315 return -EPROTONOSUPPORT; 316 317 ip = (const struct iphdr *)(skb->data + nhoff); 318 if (ip_is_fragment(ip)) 319 return -EPROTONOSUPPORT; 320 321 if ((ip->protocol != IPPROTO_TCP) && (ip->protocol != IPPROTO_UDP)) 322 return -EPROTONOSUPPORT; 323 ports = (const __be16 *)(skb->data + nhoff + 4 * ip->ihl); 324 325 ip_proto = ip->protocol; 326 src_ip = ip->saddr; 327 dst_ip = ip->daddr; 328 src_port = ports[0]; 329 dst_port = ports[1]; 330 331 spin_lock_bh(&priv->filters_lock); 332 filter = mlx4_en_filter_find(priv, src_ip, dst_ip, ip_proto, 333 src_port, dst_port); 334 if (filter) { 335 if (filter->rxq_index == rxq_index) 336 goto out; 337 338 filter->rxq_index = rxq_index; 339 } else { 340 filter = mlx4_en_filter_alloc(priv, rxq_index, 341 src_ip, dst_ip, ip_proto, 342 src_port, dst_port, flow_id); 343 if (!filter) { 344 ret = -ENOMEM; 345 goto err; 346 } 347 } 348 349 queue_work(priv->mdev->workqueue, &filter->work); 350 351 out: 352 ret = filter->id; 353 err: 354 spin_unlock_bh(&priv->filters_lock); 355 356 return ret; 357 } 358 359 void mlx4_en_cleanup_filters(struct mlx4_en_priv *priv) 360 { 361 struct mlx4_en_filter *filter, *tmp; 362 LIST_HEAD(del_list); 363 364 spin_lock_bh(&priv->filters_lock); 365 list_for_each_entry_safe(filter, tmp, &priv->filters, next) { 366 list_move(&filter->next, &del_list); 367 hlist_del(&filter->filter_chain); 368 } 369 spin_unlock_bh(&priv->filters_lock); 370 371 list_for_each_entry_safe(filter, tmp, &del_list, next) { 372 cancel_work_sync(&filter->work); 373 mlx4_en_filter_free(filter); 374 } 375 } 376 377 static void mlx4_en_filter_rfs_expire(struct mlx4_en_priv *priv) 378 { 379 struct mlx4_en_filter *filter = NULL, *tmp, *last_filter = NULL; 380 LIST_HEAD(del_list); 381 int i = 0; 382 383 spin_lock_bh(&priv->filters_lock); 384 list_for_each_entry_safe(filter, tmp, &priv->filters, next) { 385 if (i > MLX4_EN_FILTER_EXPIRY_QUOTA) 386 break; 387 388 if (filter->activated && 389 !work_pending(&filter->work) && 390 rps_may_expire_flow(priv->dev, 391 filter->rxq_index, filter->flow_id, 392 filter->id)) { 393 list_move(&filter->next, &del_list); 394 hlist_del(&filter->filter_chain); 395 } else 396 last_filter = filter; 397 398 i++; 399 } 400 401 if (last_filter && (&last_filter->next != priv->filters.next)) 402 list_move(&priv->filters, &last_filter->next); 403 404 spin_unlock_bh(&priv->filters_lock); 405 406 list_for_each_entry_safe(filter, tmp, &del_list, next) 407 mlx4_en_filter_free(filter); 408 } 409 #endif 410 411 static int mlx4_en_vlan_rx_add_vid(struct net_device *dev, 412 __be16 proto, u16 vid) 413 { 414 struct mlx4_en_priv *priv = netdev_priv(dev); 415 struct mlx4_en_dev *mdev = priv->mdev; 416 int err; 417 int idx; 418 419 en_dbg(HW, priv, "adding VLAN:%d\n", vid); 420 421 set_bit(vid, priv->active_vlans); 422 423 /* Add VID to port VLAN filter */ 424 mutex_lock(&mdev->state_lock); 425 if (mdev->device_up && priv->port_up) { 426 err = mlx4_SET_VLAN_FLTR(mdev->dev, priv); 427 if (err) 428 en_err(priv, "Failed configuring VLAN filter\n"); 429 } 430 if (mlx4_register_vlan(mdev->dev, priv->port, vid, &idx)) 431 en_dbg(HW, priv, "failed adding vlan %d\n", vid); 432 mutex_unlock(&mdev->state_lock); 433 434 return 0; 435 } 436 437 static int mlx4_en_vlan_rx_kill_vid(struct net_device *dev, 438 __be16 proto, u16 vid) 439 { 440 struct mlx4_en_priv *priv = netdev_priv(dev); 441 struct mlx4_en_dev *mdev = priv->mdev; 442 int err; 443 444 en_dbg(HW, priv, "Killing VID:%d\n", vid); 445 446 clear_bit(vid, priv->active_vlans); 447 448 /* Remove VID from port VLAN filter */ 449 mutex_lock(&mdev->state_lock); 450 mlx4_unregister_vlan(mdev->dev, priv->port, vid); 451 452 if (mdev->device_up && priv->port_up) { 453 err = mlx4_SET_VLAN_FLTR(mdev->dev, priv); 454 if (err) 455 en_err(priv, "Failed configuring VLAN filter\n"); 456 } 457 mutex_unlock(&mdev->state_lock); 458 459 return 0; 460 } 461 462 static void mlx4_en_u64_to_mac(unsigned char dst_mac[ETH_ALEN + 2], u64 src_mac) 463 { 464 int i; 465 for (i = ETH_ALEN - 1; i >= 0; --i) { 466 dst_mac[i] = src_mac & 0xff; 467 src_mac >>= 8; 468 } 469 memset(&dst_mac[ETH_ALEN], 0, 2); 470 } 471 472 473 static int mlx4_en_tunnel_steer_add(struct mlx4_en_priv *priv, unsigned char *addr, 474 int qpn, u64 *reg_id) 475 { 476 int err; 477 478 if (priv->mdev->dev->caps.tunnel_offload_mode != MLX4_TUNNEL_OFFLOAD_MODE_VXLAN || 479 priv->mdev->dev->caps.dmfs_high_steer_mode == MLX4_STEERING_DMFS_A0_STATIC) 480 return 0; /* do nothing */ 481 482 err = mlx4_tunnel_steer_add(priv->mdev->dev, addr, priv->port, qpn, 483 MLX4_DOMAIN_NIC, reg_id); 484 if (err) { 485 en_err(priv, "failed to add vxlan steering rule, err %d\n", err); 486 return err; 487 } 488 en_dbg(DRV, priv, "added vxlan steering rule, mac %pM reg_id %llx\n", addr, *reg_id); 489 return 0; 490 } 491 492 493 static int mlx4_en_uc_steer_add(struct mlx4_en_priv *priv, 494 unsigned char *mac, int *qpn, u64 *reg_id) 495 { 496 struct mlx4_en_dev *mdev = priv->mdev; 497 struct mlx4_dev *dev = mdev->dev; 498 int err; 499 500 switch (dev->caps.steering_mode) { 501 case MLX4_STEERING_MODE_B0: { 502 struct mlx4_qp qp; 503 u8 gid[16] = {0}; 504 505 qp.qpn = *qpn; 506 memcpy(&gid[10], mac, ETH_ALEN); 507 gid[5] = priv->port; 508 509 err = mlx4_unicast_attach(dev, &qp, gid, 0, MLX4_PROT_ETH); 510 break; 511 } 512 case MLX4_STEERING_MODE_DEVICE_MANAGED: { 513 struct mlx4_spec_list spec_eth = { {NULL} }; 514 __be64 mac_mask = cpu_to_be64(MLX4_MAC_MASK << 16); 515 516 struct mlx4_net_trans_rule rule = { 517 .queue_mode = MLX4_NET_TRANS_Q_FIFO, 518 .exclusive = 0, 519 .allow_loopback = 1, 520 .promisc_mode = MLX4_FS_REGULAR, 521 .priority = MLX4_DOMAIN_NIC, 522 }; 523 524 rule.port = priv->port; 525 rule.qpn = *qpn; 526 INIT_LIST_HEAD(&rule.list); 527 528 spec_eth.id = MLX4_NET_TRANS_RULE_ID_ETH; 529 memcpy(spec_eth.eth.dst_mac, mac, ETH_ALEN); 530 memcpy(spec_eth.eth.dst_mac_msk, &mac_mask, ETH_ALEN); 531 list_add_tail(&spec_eth.list, &rule.list); 532 533 err = mlx4_flow_attach(dev, &rule, reg_id); 534 break; 535 } 536 default: 537 return -EINVAL; 538 } 539 if (err) 540 en_warn(priv, "Failed Attaching Unicast\n"); 541 542 return err; 543 } 544 545 static void mlx4_en_uc_steer_release(struct mlx4_en_priv *priv, 546 unsigned char *mac, int qpn, u64 reg_id) 547 { 548 struct mlx4_en_dev *mdev = priv->mdev; 549 struct mlx4_dev *dev = mdev->dev; 550 551 switch (dev->caps.steering_mode) { 552 case MLX4_STEERING_MODE_B0: { 553 struct mlx4_qp qp; 554 u8 gid[16] = {0}; 555 556 qp.qpn = qpn; 557 memcpy(&gid[10], mac, ETH_ALEN); 558 gid[5] = priv->port; 559 560 mlx4_unicast_detach(dev, &qp, gid, MLX4_PROT_ETH); 561 break; 562 } 563 case MLX4_STEERING_MODE_DEVICE_MANAGED: { 564 mlx4_flow_detach(dev, reg_id); 565 break; 566 } 567 default: 568 en_err(priv, "Invalid steering mode.\n"); 569 } 570 } 571 572 static int mlx4_en_get_qp(struct mlx4_en_priv *priv) 573 { 574 struct mlx4_en_dev *mdev = priv->mdev; 575 struct mlx4_dev *dev = mdev->dev; 576 struct mlx4_mac_entry *entry; 577 int index = 0; 578 int err = 0; 579 u64 reg_id = 0; 580 int *qpn = &priv->base_qpn; 581 u64 mac = mlx4_mac_to_u64(priv->dev->dev_addr); 582 583 en_dbg(DRV, priv, "Registering MAC: %pM for adding\n", 584 priv->dev->dev_addr); 585 index = mlx4_register_mac(dev, priv->port, mac); 586 if (index < 0) { 587 err = index; 588 en_err(priv, "Failed adding MAC: %pM\n", 589 priv->dev->dev_addr); 590 return err; 591 } 592 593 if (dev->caps.steering_mode == MLX4_STEERING_MODE_A0) { 594 int base_qpn = mlx4_get_base_qpn(dev, priv->port); 595 *qpn = base_qpn + index; 596 return 0; 597 } 598 599 err = mlx4_qp_reserve_range(dev, 1, 1, qpn, MLX4_RESERVE_A0_QP); 600 en_dbg(DRV, priv, "Reserved qp %d\n", *qpn); 601 if (err) { 602 en_err(priv, "Failed to reserve qp for mac registration\n"); 603 goto qp_err; 604 } 605 606 err = mlx4_en_uc_steer_add(priv, priv->dev->dev_addr, qpn, ®_id); 607 if (err) 608 goto steer_err; 609 610 err = mlx4_en_tunnel_steer_add(priv, priv->dev->dev_addr, *qpn, 611 &priv->tunnel_reg_id); 612 if (err) 613 goto tunnel_err; 614 615 entry = kmalloc(sizeof(*entry), GFP_KERNEL); 616 if (!entry) { 617 err = -ENOMEM; 618 goto alloc_err; 619 } 620 memcpy(entry->mac, priv->dev->dev_addr, sizeof(entry->mac)); 621 memcpy(priv->current_mac, entry->mac, sizeof(priv->current_mac)); 622 entry->reg_id = reg_id; 623 624 hlist_add_head_rcu(&entry->hlist, 625 &priv->mac_hash[entry->mac[MLX4_EN_MAC_HASH_IDX]]); 626 627 return 0; 628 629 alloc_err: 630 if (priv->tunnel_reg_id) 631 mlx4_flow_detach(priv->mdev->dev, priv->tunnel_reg_id); 632 tunnel_err: 633 mlx4_en_uc_steer_release(priv, priv->dev->dev_addr, *qpn, reg_id); 634 635 steer_err: 636 mlx4_qp_release_range(dev, *qpn, 1); 637 638 qp_err: 639 mlx4_unregister_mac(dev, priv->port, mac); 640 return err; 641 } 642 643 static void mlx4_en_put_qp(struct mlx4_en_priv *priv) 644 { 645 struct mlx4_en_dev *mdev = priv->mdev; 646 struct mlx4_dev *dev = mdev->dev; 647 int qpn = priv->base_qpn; 648 u64 mac; 649 650 if (dev->caps.steering_mode == MLX4_STEERING_MODE_A0) { 651 mac = mlx4_mac_to_u64(priv->dev->dev_addr); 652 en_dbg(DRV, priv, "Registering MAC: %pM for deleting\n", 653 priv->dev->dev_addr); 654 mlx4_unregister_mac(dev, priv->port, mac); 655 } else { 656 struct mlx4_mac_entry *entry; 657 struct hlist_node *tmp; 658 struct hlist_head *bucket; 659 unsigned int i; 660 661 for (i = 0; i < MLX4_EN_MAC_HASH_SIZE; ++i) { 662 bucket = &priv->mac_hash[i]; 663 hlist_for_each_entry_safe(entry, tmp, bucket, hlist) { 664 mac = mlx4_mac_to_u64(entry->mac); 665 en_dbg(DRV, priv, "Registering MAC: %pM for deleting\n", 666 entry->mac); 667 mlx4_en_uc_steer_release(priv, entry->mac, 668 qpn, entry->reg_id); 669 670 mlx4_unregister_mac(dev, priv->port, mac); 671 hlist_del_rcu(&entry->hlist); 672 kfree_rcu(entry, rcu); 673 } 674 } 675 676 if (priv->tunnel_reg_id) { 677 mlx4_flow_detach(priv->mdev->dev, priv->tunnel_reg_id); 678 priv->tunnel_reg_id = 0; 679 } 680 681 en_dbg(DRV, priv, "Releasing qp: port %d, qpn %d\n", 682 priv->port, qpn); 683 mlx4_qp_release_range(dev, qpn, 1); 684 priv->flags &= ~MLX4_EN_FLAG_FORCE_PROMISC; 685 } 686 } 687 688 static int mlx4_en_replace_mac(struct mlx4_en_priv *priv, int qpn, 689 unsigned char *new_mac, unsigned char *prev_mac) 690 { 691 struct mlx4_en_dev *mdev = priv->mdev; 692 struct mlx4_dev *dev = mdev->dev; 693 int err = 0; 694 u64 new_mac_u64 = mlx4_mac_to_u64(new_mac); 695 696 if (dev->caps.steering_mode != MLX4_STEERING_MODE_A0) { 697 struct hlist_head *bucket; 698 unsigned int mac_hash; 699 struct mlx4_mac_entry *entry; 700 struct hlist_node *tmp; 701 u64 prev_mac_u64 = mlx4_mac_to_u64(prev_mac); 702 703 bucket = &priv->mac_hash[prev_mac[MLX4_EN_MAC_HASH_IDX]]; 704 hlist_for_each_entry_safe(entry, tmp, bucket, hlist) { 705 if (ether_addr_equal_64bits(entry->mac, prev_mac)) { 706 mlx4_en_uc_steer_release(priv, entry->mac, 707 qpn, entry->reg_id); 708 mlx4_unregister_mac(dev, priv->port, 709 prev_mac_u64); 710 hlist_del_rcu(&entry->hlist); 711 synchronize_rcu(); 712 memcpy(entry->mac, new_mac, ETH_ALEN); 713 entry->reg_id = 0; 714 mac_hash = new_mac[MLX4_EN_MAC_HASH_IDX]; 715 hlist_add_head_rcu(&entry->hlist, 716 &priv->mac_hash[mac_hash]); 717 mlx4_register_mac(dev, priv->port, new_mac_u64); 718 err = mlx4_en_uc_steer_add(priv, new_mac, 719 &qpn, 720 &entry->reg_id); 721 if (err) 722 return err; 723 if (priv->tunnel_reg_id) { 724 mlx4_flow_detach(priv->mdev->dev, priv->tunnel_reg_id); 725 priv->tunnel_reg_id = 0; 726 } 727 err = mlx4_en_tunnel_steer_add(priv, new_mac, qpn, 728 &priv->tunnel_reg_id); 729 return err; 730 } 731 } 732 return -EINVAL; 733 } 734 735 return __mlx4_replace_mac(dev, priv->port, qpn, new_mac_u64); 736 } 737 738 static int mlx4_en_do_set_mac(struct mlx4_en_priv *priv, 739 unsigned char new_mac[ETH_ALEN + 2]) 740 { 741 int err = 0; 742 743 if (priv->port_up) { 744 /* Remove old MAC and insert the new one */ 745 err = mlx4_en_replace_mac(priv, priv->base_qpn, 746 new_mac, priv->current_mac); 747 if (err) 748 en_err(priv, "Failed changing HW MAC address\n"); 749 } else 750 en_dbg(HW, priv, "Port is down while registering mac, exiting...\n"); 751 752 if (!err) 753 memcpy(priv->current_mac, new_mac, sizeof(priv->current_mac)); 754 755 return err; 756 } 757 758 static int mlx4_en_set_mac(struct net_device *dev, void *addr) 759 { 760 struct mlx4_en_priv *priv = netdev_priv(dev); 761 struct mlx4_en_dev *mdev = priv->mdev; 762 struct sockaddr *saddr = addr; 763 unsigned char new_mac[ETH_ALEN + 2]; 764 int err; 765 766 if (!is_valid_ether_addr(saddr->sa_data)) 767 return -EADDRNOTAVAIL; 768 769 mutex_lock(&mdev->state_lock); 770 memcpy(new_mac, saddr->sa_data, ETH_ALEN); 771 err = mlx4_en_do_set_mac(priv, new_mac); 772 if (!err) 773 memcpy(dev->dev_addr, saddr->sa_data, ETH_ALEN); 774 mutex_unlock(&mdev->state_lock); 775 776 return err; 777 } 778 779 static void mlx4_en_clear_list(struct net_device *dev) 780 { 781 struct mlx4_en_priv *priv = netdev_priv(dev); 782 struct mlx4_en_mc_list *tmp, *mc_to_del; 783 784 list_for_each_entry_safe(mc_to_del, tmp, &priv->mc_list, list) { 785 list_del(&mc_to_del->list); 786 kfree(mc_to_del); 787 } 788 } 789 790 static void mlx4_en_cache_mclist(struct net_device *dev) 791 { 792 struct mlx4_en_priv *priv = netdev_priv(dev); 793 struct netdev_hw_addr *ha; 794 struct mlx4_en_mc_list *tmp; 795 796 mlx4_en_clear_list(dev); 797 netdev_for_each_mc_addr(ha, dev) { 798 tmp = kzalloc(sizeof(struct mlx4_en_mc_list), GFP_ATOMIC); 799 if (!tmp) { 800 mlx4_en_clear_list(dev); 801 return; 802 } 803 memcpy(tmp->addr, ha->addr, ETH_ALEN); 804 list_add_tail(&tmp->list, &priv->mc_list); 805 } 806 } 807 808 static void update_mclist_flags(struct mlx4_en_priv *priv, 809 struct list_head *dst, 810 struct list_head *src) 811 { 812 struct mlx4_en_mc_list *dst_tmp, *src_tmp, *new_mc; 813 bool found; 814 815 /* Find all the entries that should be removed from dst, 816 * These are the entries that are not found in src 817 */ 818 list_for_each_entry(dst_tmp, dst, list) { 819 found = false; 820 list_for_each_entry(src_tmp, src, list) { 821 if (ether_addr_equal(dst_tmp->addr, src_tmp->addr)) { 822 found = true; 823 break; 824 } 825 } 826 if (!found) 827 dst_tmp->action = MCLIST_REM; 828 } 829 830 /* Add entries that exist in src but not in dst 831 * mark them as need to add 832 */ 833 list_for_each_entry(src_tmp, src, list) { 834 found = false; 835 list_for_each_entry(dst_tmp, dst, list) { 836 if (ether_addr_equal(dst_tmp->addr, src_tmp->addr)) { 837 dst_tmp->action = MCLIST_NONE; 838 found = true; 839 break; 840 } 841 } 842 if (!found) { 843 new_mc = kmemdup(src_tmp, 844 sizeof(struct mlx4_en_mc_list), 845 GFP_KERNEL); 846 if (!new_mc) 847 return; 848 849 new_mc->action = MCLIST_ADD; 850 list_add_tail(&new_mc->list, dst); 851 } 852 } 853 } 854 855 static void mlx4_en_set_rx_mode(struct net_device *dev) 856 { 857 struct mlx4_en_priv *priv = netdev_priv(dev); 858 859 if (!priv->port_up) 860 return; 861 862 queue_work(priv->mdev->workqueue, &priv->rx_mode_task); 863 } 864 865 static void mlx4_en_set_promisc_mode(struct mlx4_en_priv *priv, 866 struct mlx4_en_dev *mdev) 867 { 868 int err = 0; 869 870 if (!(priv->flags & MLX4_EN_FLAG_PROMISC)) { 871 if (netif_msg_rx_status(priv)) 872 en_warn(priv, "Entering promiscuous mode\n"); 873 priv->flags |= MLX4_EN_FLAG_PROMISC; 874 875 /* Enable promiscouos mode */ 876 switch (mdev->dev->caps.steering_mode) { 877 case MLX4_STEERING_MODE_DEVICE_MANAGED: 878 err = mlx4_flow_steer_promisc_add(mdev->dev, 879 priv->port, 880 priv->base_qpn, 881 MLX4_FS_ALL_DEFAULT); 882 if (err) 883 en_err(priv, "Failed enabling promiscuous mode\n"); 884 priv->flags |= MLX4_EN_FLAG_MC_PROMISC; 885 break; 886 887 case MLX4_STEERING_MODE_B0: 888 err = mlx4_unicast_promisc_add(mdev->dev, 889 priv->base_qpn, 890 priv->port); 891 if (err) 892 en_err(priv, "Failed enabling unicast promiscuous mode\n"); 893 894 /* Add the default qp number as multicast 895 * promisc 896 */ 897 if (!(priv->flags & MLX4_EN_FLAG_MC_PROMISC)) { 898 err = mlx4_multicast_promisc_add(mdev->dev, 899 priv->base_qpn, 900 priv->port); 901 if (err) 902 en_err(priv, "Failed enabling multicast promiscuous mode\n"); 903 priv->flags |= MLX4_EN_FLAG_MC_PROMISC; 904 } 905 break; 906 907 case MLX4_STEERING_MODE_A0: 908 err = mlx4_SET_PORT_qpn_calc(mdev->dev, 909 priv->port, 910 priv->base_qpn, 911 1); 912 if (err) 913 en_err(priv, "Failed enabling promiscuous mode\n"); 914 break; 915 } 916 917 /* Disable port multicast filter (unconditionally) */ 918 err = mlx4_SET_MCAST_FLTR(mdev->dev, priv->port, 0, 919 0, MLX4_MCAST_DISABLE); 920 if (err) 921 en_err(priv, "Failed disabling multicast filter\n"); 922 } 923 } 924 925 static void mlx4_en_clear_promisc_mode(struct mlx4_en_priv *priv, 926 struct mlx4_en_dev *mdev) 927 { 928 int err = 0; 929 930 if (netif_msg_rx_status(priv)) 931 en_warn(priv, "Leaving promiscuous mode\n"); 932 priv->flags &= ~MLX4_EN_FLAG_PROMISC; 933 934 /* Disable promiscouos mode */ 935 switch (mdev->dev->caps.steering_mode) { 936 case MLX4_STEERING_MODE_DEVICE_MANAGED: 937 err = mlx4_flow_steer_promisc_remove(mdev->dev, 938 priv->port, 939 MLX4_FS_ALL_DEFAULT); 940 if (err) 941 en_err(priv, "Failed disabling promiscuous mode\n"); 942 priv->flags &= ~MLX4_EN_FLAG_MC_PROMISC; 943 break; 944 945 case MLX4_STEERING_MODE_B0: 946 err = mlx4_unicast_promisc_remove(mdev->dev, 947 priv->base_qpn, 948 priv->port); 949 if (err) 950 en_err(priv, "Failed disabling unicast promiscuous mode\n"); 951 /* Disable Multicast promisc */ 952 if (priv->flags & MLX4_EN_FLAG_MC_PROMISC) { 953 err = mlx4_multicast_promisc_remove(mdev->dev, 954 priv->base_qpn, 955 priv->port); 956 if (err) 957 en_err(priv, "Failed disabling multicast promiscuous mode\n"); 958 priv->flags &= ~MLX4_EN_FLAG_MC_PROMISC; 959 } 960 break; 961 962 case MLX4_STEERING_MODE_A0: 963 err = mlx4_SET_PORT_qpn_calc(mdev->dev, 964 priv->port, 965 priv->base_qpn, 0); 966 if (err) 967 en_err(priv, "Failed disabling promiscuous mode\n"); 968 break; 969 } 970 } 971 972 static void mlx4_en_do_multicast(struct mlx4_en_priv *priv, 973 struct net_device *dev, 974 struct mlx4_en_dev *mdev) 975 { 976 struct mlx4_en_mc_list *mclist, *tmp; 977 u64 mcast_addr = 0; 978 u8 mc_list[16] = {0}; 979 int err = 0; 980 981 /* Enable/disable the multicast filter according to IFF_ALLMULTI */ 982 if (dev->flags & IFF_ALLMULTI) { 983 err = mlx4_SET_MCAST_FLTR(mdev->dev, priv->port, 0, 984 0, MLX4_MCAST_DISABLE); 985 if (err) 986 en_err(priv, "Failed disabling multicast filter\n"); 987 988 /* Add the default qp number as multicast promisc */ 989 if (!(priv->flags & MLX4_EN_FLAG_MC_PROMISC)) { 990 switch (mdev->dev->caps.steering_mode) { 991 case MLX4_STEERING_MODE_DEVICE_MANAGED: 992 err = mlx4_flow_steer_promisc_add(mdev->dev, 993 priv->port, 994 priv->base_qpn, 995 MLX4_FS_MC_DEFAULT); 996 break; 997 998 case MLX4_STEERING_MODE_B0: 999 err = mlx4_multicast_promisc_add(mdev->dev, 1000 priv->base_qpn, 1001 priv->port); 1002 break; 1003 1004 case MLX4_STEERING_MODE_A0: 1005 break; 1006 } 1007 if (err) 1008 en_err(priv, "Failed entering multicast promisc mode\n"); 1009 priv->flags |= MLX4_EN_FLAG_MC_PROMISC; 1010 } 1011 } else { 1012 /* Disable Multicast promisc */ 1013 if (priv->flags & MLX4_EN_FLAG_MC_PROMISC) { 1014 switch (mdev->dev->caps.steering_mode) { 1015 case MLX4_STEERING_MODE_DEVICE_MANAGED: 1016 err = mlx4_flow_steer_promisc_remove(mdev->dev, 1017 priv->port, 1018 MLX4_FS_MC_DEFAULT); 1019 break; 1020 1021 case MLX4_STEERING_MODE_B0: 1022 err = mlx4_multicast_promisc_remove(mdev->dev, 1023 priv->base_qpn, 1024 priv->port); 1025 break; 1026 1027 case MLX4_STEERING_MODE_A0: 1028 break; 1029 } 1030 if (err) 1031 en_err(priv, "Failed disabling multicast promiscuous mode\n"); 1032 priv->flags &= ~MLX4_EN_FLAG_MC_PROMISC; 1033 } 1034 1035 err = mlx4_SET_MCAST_FLTR(mdev->dev, priv->port, 0, 1036 0, MLX4_MCAST_DISABLE); 1037 if (err) 1038 en_err(priv, "Failed disabling multicast filter\n"); 1039 1040 /* Flush mcast filter and init it with broadcast address */ 1041 mlx4_SET_MCAST_FLTR(mdev->dev, priv->port, ETH_BCAST, 1042 1, MLX4_MCAST_CONFIG); 1043 1044 /* Update multicast list - we cache all addresses so they won't 1045 * change while HW is updated holding the command semaphor */ 1046 netif_addr_lock_bh(dev); 1047 mlx4_en_cache_mclist(dev); 1048 netif_addr_unlock_bh(dev); 1049 list_for_each_entry(mclist, &priv->mc_list, list) { 1050 mcast_addr = mlx4_mac_to_u64(mclist->addr); 1051 mlx4_SET_MCAST_FLTR(mdev->dev, priv->port, 1052 mcast_addr, 0, MLX4_MCAST_CONFIG); 1053 } 1054 err = mlx4_SET_MCAST_FLTR(mdev->dev, priv->port, 0, 1055 0, MLX4_MCAST_ENABLE); 1056 if (err) 1057 en_err(priv, "Failed enabling multicast filter\n"); 1058 1059 update_mclist_flags(priv, &priv->curr_list, &priv->mc_list); 1060 list_for_each_entry_safe(mclist, tmp, &priv->curr_list, list) { 1061 if (mclist->action == MCLIST_REM) { 1062 /* detach this address and delete from list */ 1063 memcpy(&mc_list[10], mclist->addr, ETH_ALEN); 1064 mc_list[5] = priv->port; 1065 err = mlx4_multicast_detach(mdev->dev, 1066 &priv->rss_map.indir_qp, 1067 mc_list, 1068 MLX4_PROT_ETH, 1069 mclist->reg_id); 1070 if (err) 1071 en_err(priv, "Fail to detach multicast address\n"); 1072 1073 if (mclist->tunnel_reg_id) { 1074 err = mlx4_flow_detach(priv->mdev->dev, mclist->tunnel_reg_id); 1075 if (err) 1076 en_err(priv, "Failed to detach multicast address\n"); 1077 } 1078 1079 /* remove from list */ 1080 list_del(&mclist->list); 1081 kfree(mclist); 1082 } else if (mclist->action == MCLIST_ADD) { 1083 /* attach the address */ 1084 memcpy(&mc_list[10], mclist->addr, ETH_ALEN); 1085 /* needed for B0 steering support */ 1086 mc_list[5] = priv->port; 1087 err = mlx4_multicast_attach(mdev->dev, 1088 &priv->rss_map.indir_qp, 1089 mc_list, 1090 priv->port, 0, 1091 MLX4_PROT_ETH, 1092 &mclist->reg_id); 1093 if (err) 1094 en_err(priv, "Fail to attach multicast address\n"); 1095 1096 err = mlx4_en_tunnel_steer_add(priv, &mc_list[10], priv->base_qpn, 1097 &mclist->tunnel_reg_id); 1098 if (err) 1099 en_err(priv, "Failed to attach multicast address\n"); 1100 } 1101 } 1102 } 1103 } 1104 1105 static void mlx4_en_do_uc_filter(struct mlx4_en_priv *priv, 1106 struct net_device *dev, 1107 struct mlx4_en_dev *mdev) 1108 { 1109 struct netdev_hw_addr *ha; 1110 struct mlx4_mac_entry *entry; 1111 struct hlist_node *tmp; 1112 bool found; 1113 u64 mac; 1114 int err = 0; 1115 struct hlist_head *bucket; 1116 unsigned int i; 1117 int removed = 0; 1118 u32 prev_flags; 1119 1120 /* Note that we do not need to protect our mac_hash traversal with rcu, 1121 * since all modification code is protected by mdev->state_lock 1122 */ 1123 1124 /* find what to remove */ 1125 for (i = 0; i < MLX4_EN_MAC_HASH_SIZE; ++i) { 1126 bucket = &priv->mac_hash[i]; 1127 hlist_for_each_entry_safe(entry, tmp, bucket, hlist) { 1128 found = false; 1129 netdev_for_each_uc_addr(ha, dev) { 1130 if (ether_addr_equal_64bits(entry->mac, 1131 ha->addr)) { 1132 found = true; 1133 break; 1134 } 1135 } 1136 1137 /* MAC address of the port is not in uc list */ 1138 if (ether_addr_equal_64bits(entry->mac, 1139 priv->current_mac)) 1140 found = true; 1141 1142 if (!found) { 1143 mac = mlx4_mac_to_u64(entry->mac); 1144 mlx4_en_uc_steer_release(priv, entry->mac, 1145 priv->base_qpn, 1146 entry->reg_id); 1147 mlx4_unregister_mac(mdev->dev, priv->port, mac); 1148 1149 hlist_del_rcu(&entry->hlist); 1150 kfree_rcu(entry, rcu); 1151 en_dbg(DRV, priv, "Removed MAC %pM on port:%d\n", 1152 entry->mac, priv->port); 1153 ++removed; 1154 } 1155 } 1156 } 1157 1158 /* if we didn't remove anything, there is no use in trying to add 1159 * again once we are in a forced promisc mode state 1160 */ 1161 if ((priv->flags & MLX4_EN_FLAG_FORCE_PROMISC) && 0 == removed) 1162 return; 1163 1164 prev_flags = priv->flags; 1165 priv->flags &= ~MLX4_EN_FLAG_FORCE_PROMISC; 1166 1167 /* find what to add */ 1168 netdev_for_each_uc_addr(ha, dev) { 1169 found = false; 1170 bucket = &priv->mac_hash[ha->addr[MLX4_EN_MAC_HASH_IDX]]; 1171 hlist_for_each_entry(entry, bucket, hlist) { 1172 if (ether_addr_equal_64bits(entry->mac, ha->addr)) { 1173 found = true; 1174 break; 1175 } 1176 } 1177 1178 if (!found) { 1179 entry = kmalloc(sizeof(*entry), GFP_KERNEL); 1180 if (!entry) { 1181 en_err(priv, "Failed adding MAC %pM on port:%d (out of memory)\n", 1182 ha->addr, priv->port); 1183 priv->flags |= MLX4_EN_FLAG_FORCE_PROMISC; 1184 break; 1185 } 1186 mac = mlx4_mac_to_u64(ha->addr); 1187 memcpy(entry->mac, ha->addr, ETH_ALEN); 1188 err = mlx4_register_mac(mdev->dev, priv->port, mac); 1189 if (err < 0) { 1190 en_err(priv, "Failed registering MAC %pM on port %d: %d\n", 1191 ha->addr, priv->port, err); 1192 kfree(entry); 1193 priv->flags |= MLX4_EN_FLAG_FORCE_PROMISC; 1194 break; 1195 } 1196 err = mlx4_en_uc_steer_add(priv, ha->addr, 1197 &priv->base_qpn, 1198 &entry->reg_id); 1199 if (err) { 1200 en_err(priv, "Failed adding MAC %pM on port %d: %d\n", 1201 ha->addr, priv->port, err); 1202 mlx4_unregister_mac(mdev->dev, priv->port, mac); 1203 kfree(entry); 1204 priv->flags |= MLX4_EN_FLAG_FORCE_PROMISC; 1205 break; 1206 } else { 1207 unsigned int mac_hash; 1208 en_dbg(DRV, priv, "Added MAC %pM on port:%d\n", 1209 ha->addr, priv->port); 1210 mac_hash = ha->addr[MLX4_EN_MAC_HASH_IDX]; 1211 bucket = &priv->mac_hash[mac_hash]; 1212 hlist_add_head_rcu(&entry->hlist, bucket); 1213 } 1214 } 1215 } 1216 1217 if (priv->flags & MLX4_EN_FLAG_FORCE_PROMISC) { 1218 en_warn(priv, "Forcing promiscuous mode on port:%d\n", 1219 priv->port); 1220 } else if (prev_flags & MLX4_EN_FLAG_FORCE_PROMISC) { 1221 en_warn(priv, "Stop forcing promiscuous mode on port:%d\n", 1222 priv->port); 1223 } 1224 } 1225 1226 static void mlx4_en_do_set_rx_mode(struct work_struct *work) 1227 { 1228 struct mlx4_en_priv *priv = container_of(work, struct mlx4_en_priv, 1229 rx_mode_task); 1230 struct mlx4_en_dev *mdev = priv->mdev; 1231 struct net_device *dev = priv->dev; 1232 1233 mutex_lock(&mdev->state_lock); 1234 if (!mdev->device_up) { 1235 en_dbg(HW, priv, "Card is not up, ignoring rx mode change.\n"); 1236 goto out; 1237 } 1238 if (!priv->port_up) { 1239 en_dbg(HW, priv, "Port is down, ignoring rx mode change.\n"); 1240 goto out; 1241 } 1242 1243 if (!netif_carrier_ok(dev)) { 1244 if (!mlx4_en_QUERY_PORT(mdev, priv->port)) { 1245 if (priv->port_state.link_state) { 1246 priv->last_link_state = MLX4_DEV_EVENT_PORT_UP; 1247 netif_carrier_on(dev); 1248 en_dbg(LINK, priv, "Link Up\n"); 1249 } 1250 } 1251 } 1252 1253 if (dev->priv_flags & IFF_UNICAST_FLT) 1254 mlx4_en_do_uc_filter(priv, dev, mdev); 1255 1256 /* Promsicuous mode: disable all filters */ 1257 if ((dev->flags & IFF_PROMISC) || 1258 (priv->flags & MLX4_EN_FLAG_FORCE_PROMISC)) { 1259 mlx4_en_set_promisc_mode(priv, mdev); 1260 goto out; 1261 } 1262 1263 /* Not in promiscuous mode */ 1264 if (priv->flags & MLX4_EN_FLAG_PROMISC) 1265 mlx4_en_clear_promisc_mode(priv, mdev); 1266 1267 mlx4_en_do_multicast(priv, dev, mdev); 1268 out: 1269 mutex_unlock(&mdev->state_lock); 1270 } 1271 1272 #ifdef CONFIG_NET_POLL_CONTROLLER 1273 static void mlx4_en_netpoll(struct net_device *dev) 1274 { 1275 struct mlx4_en_priv *priv = netdev_priv(dev); 1276 struct mlx4_en_cq *cq; 1277 int i; 1278 1279 for (i = 0; i < priv->rx_ring_num; i++) { 1280 cq = priv->rx_cq[i]; 1281 napi_schedule(&cq->napi); 1282 } 1283 } 1284 #endif 1285 1286 static void mlx4_en_tx_timeout(struct net_device *dev) 1287 { 1288 struct mlx4_en_priv *priv = netdev_priv(dev); 1289 struct mlx4_en_dev *mdev = priv->mdev; 1290 int i; 1291 1292 if (netif_msg_timer(priv)) 1293 en_warn(priv, "Tx timeout called on port:%d\n", priv->port); 1294 1295 for (i = 0; i < priv->tx_ring_num; i++) { 1296 if (!netif_tx_queue_stopped(netdev_get_tx_queue(dev, i))) 1297 continue; 1298 en_warn(priv, "TX timeout on queue: %d, QP: 0x%x, CQ: 0x%x, Cons: 0x%x, Prod: 0x%x\n", 1299 i, priv->tx_ring[i]->qpn, priv->tx_ring[i]->cqn, 1300 priv->tx_ring[i]->cons, priv->tx_ring[i]->prod); 1301 } 1302 1303 priv->port_stats.tx_timeout++; 1304 en_dbg(DRV, priv, "Scheduling watchdog\n"); 1305 queue_work(mdev->workqueue, &priv->watchdog_task); 1306 } 1307 1308 1309 static struct net_device_stats *mlx4_en_get_stats(struct net_device *dev) 1310 { 1311 struct mlx4_en_priv *priv = netdev_priv(dev); 1312 1313 spin_lock_bh(&priv->stats_lock); 1314 memcpy(&priv->ret_stats, &priv->stats, sizeof(priv->stats)); 1315 spin_unlock_bh(&priv->stats_lock); 1316 1317 return &priv->ret_stats; 1318 } 1319 1320 static void mlx4_en_set_default_moderation(struct mlx4_en_priv *priv) 1321 { 1322 struct mlx4_en_cq *cq; 1323 int i; 1324 1325 /* If we haven't received a specific coalescing setting 1326 * (module param), we set the moderation parameters as follows: 1327 * - moder_cnt is set to the number of mtu sized packets to 1328 * satisfy our coalescing target. 1329 * - moder_time is set to a fixed value. 1330 */ 1331 priv->rx_frames = MLX4_EN_RX_COAL_TARGET; 1332 priv->rx_usecs = MLX4_EN_RX_COAL_TIME; 1333 priv->tx_frames = MLX4_EN_TX_COAL_PKTS; 1334 priv->tx_usecs = MLX4_EN_TX_COAL_TIME; 1335 en_dbg(INTR, priv, "Default coalesing params for mtu:%d - rx_frames:%d rx_usecs:%d\n", 1336 priv->dev->mtu, priv->rx_frames, priv->rx_usecs); 1337 1338 /* Setup cq moderation params */ 1339 for (i = 0; i < priv->rx_ring_num; i++) { 1340 cq = priv->rx_cq[i]; 1341 cq->moder_cnt = priv->rx_frames; 1342 cq->moder_time = priv->rx_usecs; 1343 priv->last_moder_time[i] = MLX4_EN_AUTO_CONF; 1344 priv->last_moder_packets[i] = 0; 1345 priv->last_moder_bytes[i] = 0; 1346 } 1347 1348 for (i = 0; i < priv->tx_ring_num; i++) { 1349 cq = priv->tx_cq[i]; 1350 cq->moder_cnt = priv->tx_frames; 1351 cq->moder_time = priv->tx_usecs; 1352 } 1353 1354 /* Reset auto-moderation params */ 1355 priv->pkt_rate_low = MLX4_EN_RX_RATE_LOW; 1356 priv->rx_usecs_low = MLX4_EN_RX_COAL_TIME_LOW; 1357 priv->pkt_rate_high = MLX4_EN_RX_RATE_HIGH; 1358 priv->rx_usecs_high = MLX4_EN_RX_COAL_TIME_HIGH; 1359 priv->sample_interval = MLX4_EN_SAMPLE_INTERVAL; 1360 priv->adaptive_rx_coal = 1; 1361 priv->last_moder_jiffies = 0; 1362 priv->last_moder_tx_packets = 0; 1363 } 1364 1365 static void mlx4_en_auto_moderation(struct mlx4_en_priv *priv) 1366 { 1367 unsigned long period = (unsigned long) (jiffies - priv->last_moder_jiffies); 1368 struct mlx4_en_cq *cq; 1369 unsigned long packets; 1370 unsigned long rate; 1371 unsigned long avg_pkt_size; 1372 unsigned long rx_packets; 1373 unsigned long rx_bytes; 1374 unsigned long rx_pkt_diff; 1375 int moder_time; 1376 int ring, err; 1377 1378 if (!priv->adaptive_rx_coal || period < priv->sample_interval * HZ) 1379 return; 1380 1381 for (ring = 0; ring < priv->rx_ring_num; ring++) { 1382 spin_lock_bh(&priv->stats_lock); 1383 rx_packets = priv->rx_ring[ring]->packets; 1384 rx_bytes = priv->rx_ring[ring]->bytes; 1385 spin_unlock_bh(&priv->stats_lock); 1386 1387 rx_pkt_diff = ((unsigned long) (rx_packets - 1388 priv->last_moder_packets[ring])); 1389 packets = rx_pkt_diff; 1390 rate = packets * HZ / period; 1391 avg_pkt_size = packets ? ((unsigned long) (rx_bytes - 1392 priv->last_moder_bytes[ring])) / packets : 0; 1393 1394 /* Apply auto-moderation only when packet rate 1395 * exceeds a rate that it matters */ 1396 if (rate > (MLX4_EN_RX_RATE_THRESH / priv->rx_ring_num) && 1397 avg_pkt_size > MLX4_EN_AVG_PKT_SMALL) { 1398 if (rate < priv->pkt_rate_low) 1399 moder_time = priv->rx_usecs_low; 1400 else if (rate > priv->pkt_rate_high) 1401 moder_time = priv->rx_usecs_high; 1402 else 1403 moder_time = (rate - priv->pkt_rate_low) * 1404 (priv->rx_usecs_high - priv->rx_usecs_low) / 1405 (priv->pkt_rate_high - priv->pkt_rate_low) + 1406 priv->rx_usecs_low; 1407 } else { 1408 moder_time = priv->rx_usecs_low; 1409 } 1410 1411 if (moder_time != priv->last_moder_time[ring]) { 1412 priv->last_moder_time[ring] = moder_time; 1413 cq = priv->rx_cq[ring]; 1414 cq->moder_time = moder_time; 1415 cq->moder_cnt = priv->rx_frames; 1416 err = mlx4_en_set_cq_moder(priv, cq); 1417 if (err) 1418 en_err(priv, "Failed modifying moderation for cq:%d\n", 1419 ring); 1420 } 1421 priv->last_moder_packets[ring] = rx_packets; 1422 priv->last_moder_bytes[ring] = rx_bytes; 1423 } 1424 1425 priv->last_moder_jiffies = jiffies; 1426 } 1427 1428 static void mlx4_en_do_get_stats(struct work_struct *work) 1429 { 1430 struct delayed_work *delay = to_delayed_work(work); 1431 struct mlx4_en_priv *priv = container_of(delay, struct mlx4_en_priv, 1432 stats_task); 1433 struct mlx4_en_dev *mdev = priv->mdev; 1434 int err; 1435 1436 mutex_lock(&mdev->state_lock); 1437 if (mdev->device_up) { 1438 if (priv->port_up) { 1439 err = mlx4_en_DUMP_ETH_STATS(mdev, priv->port, 0); 1440 if (err) 1441 en_dbg(HW, priv, "Could not update stats\n"); 1442 1443 mlx4_en_auto_moderation(priv); 1444 } 1445 1446 queue_delayed_work(mdev->workqueue, &priv->stats_task, STATS_DELAY); 1447 } 1448 if (mdev->mac_removed[MLX4_MAX_PORTS + 1 - priv->port]) { 1449 mlx4_en_do_set_mac(priv, priv->current_mac); 1450 mdev->mac_removed[MLX4_MAX_PORTS + 1 - priv->port] = 0; 1451 } 1452 mutex_unlock(&mdev->state_lock); 1453 } 1454 1455 /* mlx4_en_service_task - Run service task for tasks that needed to be done 1456 * periodically 1457 */ 1458 static void mlx4_en_service_task(struct work_struct *work) 1459 { 1460 struct delayed_work *delay = to_delayed_work(work); 1461 struct mlx4_en_priv *priv = container_of(delay, struct mlx4_en_priv, 1462 service_task); 1463 struct mlx4_en_dev *mdev = priv->mdev; 1464 1465 mutex_lock(&mdev->state_lock); 1466 if (mdev->device_up) { 1467 if (mdev->dev->caps.flags2 & MLX4_DEV_CAP_FLAG2_TS) 1468 mlx4_en_ptp_overflow_check(mdev); 1469 1470 queue_delayed_work(mdev->workqueue, &priv->service_task, 1471 SERVICE_TASK_DELAY); 1472 } 1473 mutex_unlock(&mdev->state_lock); 1474 } 1475 1476 static void mlx4_en_linkstate(struct work_struct *work) 1477 { 1478 struct mlx4_en_priv *priv = container_of(work, struct mlx4_en_priv, 1479 linkstate_task); 1480 struct mlx4_en_dev *mdev = priv->mdev; 1481 int linkstate = priv->link_state; 1482 1483 mutex_lock(&mdev->state_lock); 1484 /* If observable port state changed set carrier state and 1485 * report to system log */ 1486 if (priv->last_link_state != linkstate) { 1487 if (linkstate == MLX4_DEV_EVENT_PORT_DOWN) { 1488 en_info(priv, "Link Down\n"); 1489 netif_carrier_off(priv->dev); 1490 } else { 1491 en_info(priv, "Link Up\n"); 1492 netif_carrier_on(priv->dev); 1493 } 1494 } 1495 priv->last_link_state = linkstate; 1496 mutex_unlock(&mdev->state_lock); 1497 } 1498 1499 static int mlx4_en_init_affinity_hint(struct mlx4_en_priv *priv, int ring_idx) 1500 { 1501 struct mlx4_en_rx_ring *ring = priv->rx_ring[ring_idx]; 1502 int numa_node = priv->mdev->dev->numa_node; 1503 int ret = 0; 1504 1505 if (!zalloc_cpumask_var(&ring->affinity_mask, GFP_KERNEL)) 1506 return -ENOMEM; 1507 1508 ret = cpumask_set_cpu_local_first(ring_idx, numa_node, 1509 ring->affinity_mask); 1510 if (ret) 1511 free_cpumask_var(ring->affinity_mask); 1512 1513 return ret; 1514 } 1515 1516 static void mlx4_en_free_affinity_hint(struct mlx4_en_priv *priv, int ring_idx) 1517 { 1518 free_cpumask_var(priv->rx_ring[ring_idx]->affinity_mask); 1519 } 1520 1521 int mlx4_en_start_port(struct net_device *dev) 1522 { 1523 struct mlx4_en_priv *priv = netdev_priv(dev); 1524 struct mlx4_en_dev *mdev = priv->mdev; 1525 struct mlx4_en_cq *cq; 1526 struct mlx4_en_tx_ring *tx_ring; 1527 int rx_index = 0; 1528 int tx_index = 0; 1529 int err = 0; 1530 int i; 1531 int j; 1532 u8 mc_list[16] = {0}; 1533 1534 if (priv->port_up) { 1535 en_dbg(DRV, priv, "start port called while port already up\n"); 1536 return 0; 1537 } 1538 1539 INIT_LIST_HEAD(&priv->mc_list); 1540 INIT_LIST_HEAD(&priv->curr_list); 1541 INIT_LIST_HEAD(&priv->ethtool_list); 1542 memset(&priv->ethtool_rules[0], 0, 1543 sizeof(struct ethtool_flow_id) * MAX_NUM_OF_FS_RULES); 1544 1545 /* Calculate Rx buf size */ 1546 dev->mtu = min(dev->mtu, priv->max_mtu); 1547 mlx4_en_calc_rx_buf(dev); 1548 en_dbg(DRV, priv, "Rx buf size:%d\n", priv->rx_skb_size); 1549 1550 /* Configure rx cq's and rings */ 1551 err = mlx4_en_activate_rx_rings(priv); 1552 if (err) { 1553 en_err(priv, "Failed to activate RX rings\n"); 1554 return err; 1555 } 1556 for (i = 0; i < priv->rx_ring_num; i++) { 1557 cq = priv->rx_cq[i]; 1558 1559 mlx4_en_cq_init_lock(cq); 1560 1561 err = mlx4_en_init_affinity_hint(priv, i); 1562 if (err) { 1563 en_err(priv, "Failed preparing IRQ affinity hint\n"); 1564 goto cq_err; 1565 } 1566 1567 err = mlx4_en_activate_cq(priv, cq, i); 1568 if (err) { 1569 en_err(priv, "Failed activating Rx CQ\n"); 1570 mlx4_en_free_affinity_hint(priv, i); 1571 goto cq_err; 1572 } 1573 1574 for (j = 0; j < cq->size; j++) { 1575 struct mlx4_cqe *cqe = NULL; 1576 1577 cqe = mlx4_en_get_cqe(cq->buf, j, priv->cqe_size) + 1578 priv->cqe_factor; 1579 cqe->owner_sr_opcode = MLX4_CQE_OWNER_MASK; 1580 } 1581 1582 err = mlx4_en_set_cq_moder(priv, cq); 1583 if (err) { 1584 en_err(priv, "Failed setting cq moderation parameters\n"); 1585 mlx4_en_deactivate_cq(priv, cq); 1586 mlx4_en_free_affinity_hint(priv, i); 1587 goto cq_err; 1588 } 1589 mlx4_en_arm_cq(priv, cq); 1590 priv->rx_ring[i]->cqn = cq->mcq.cqn; 1591 ++rx_index; 1592 } 1593 1594 /* Set qp number */ 1595 en_dbg(DRV, priv, "Getting qp number for port %d\n", priv->port); 1596 err = mlx4_en_get_qp(priv); 1597 if (err) { 1598 en_err(priv, "Failed getting eth qp\n"); 1599 goto cq_err; 1600 } 1601 mdev->mac_removed[priv->port] = 0; 1602 1603 err = mlx4_en_config_rss_steer(priv); 1604 if (err) { 1605 en_err(priv, "Failed configuring rss steering\n"); 1606 goto mac_err; 1607 } 1608 1609 err = mlx4_en_create_drop_qp(priv); 1610 if (err) 1611 goto rss_err; 1612 1613 /* Configure tx cq's and rings */ 1614 for (i = 0; i < priv->tx_ring_num; i++) { 1615 /* Configure cq */ 1616 cq = priv->tx_cq[i]; 1617 err = mlx4_en_activate_cq(priv, cq, i); 1618 if (err) { 1619 en_err(priv, "Failed allocating Tx CQ\n"); 1620 goto tx_err; 1621 } 1622 err = mlx4_en_set_cq_moder(priv, cq); 1623 if (err) { 1624 en_err(priv, "Failed setting cq moderation parameters\n"); 1625 mlx4_en_deactivate_cq(priv, cq); 1626 goto tx_err; 1627 } 1628 en_dbg(DRV, priv, "Resetting index of collapsed CQ:%d to -1\n", i); 1629 cq->buf->wqe_index = cpu_to_be16(0xffff); 1630 1631 /* Configure ring */ 1632 tx_ring = priv->tx_ring[i]; 1633 err = mlx4_en_activate_tx_ring(priv, tx_ring, cq->mcq.cqn, 1634 i / priv->num_tx_rings_p_up); 1635 if (err) { 1636 en_err(priv, "Failed allocating Tx ring\n"); 1637 mlx4_en_deactivate_cq(priv, cq); 1638 goto tx_err; 1639 } 1640 tx_ring->tx_queue = netdev_get_tx_queue(dev, i); 1641 1642 /* Arm CQ for TX completions */ 1643 mlx4_en_arm_cq(priv, cq); 1644 1645 /* Set initial ownership of all Tx TXBBs to SW (1) */ 1646 for (j = 0; j < tx_ring->buf_size; j += STAMP_STRIDE) 1647 *((u32 *) (tx_ring->buf + j)) = 0xffffffff; 1648 ++tx_index; 1649 } 1650 1651 /* Configure port */ 1652 err = mlx4_SET_PORT_general(mdev->dev, priv->port, 1653 priv->rx_skb_size + ETH_FCS_LEN, 1654 priv->prof->tx_pause, 1655 priv->prof->tx_ppp, 1656 priv->prof->rx_pause, 1657 priv->prof->rx_ppp); 1658 if (err) { 1659 en_err(priv, "Failed setting port general configurations for port %d, with error %d\n", 1660 priv->port, err); 1661 goto tx_err; 1662 } 1663 /* Set default qp number */ 1664 err = mlx4_SET_PORT_qpn_calc(mdev->dev, priv->port, priv->base_qpn, 0); 1665 if (err) { 1666 en_err(priv, "Failed setting default qp numbers\n"); 1667 goto tx_err; 1668 } 1669 1670 if (mdev->dev->caps.tunnel_offload_mode == MLX4_TUNNEL_OFFLOAD_MODE_VXLAN) { 1671 err = mlx4_SET_PORT_VXLAN(mdev->dev, priv->port, VXLAN_STEER_BY_OUTER_MAC, 1); 1672 if (err) { 1673 en_err(priv, "Failed setting port L2 tunnel configuration, err %d\n", 1674 err); 1675 goto tx_err; 1676 } 1677 } 1678 1679 /* Init port */ 1680 en_dbg(HW, priv, "Initializing port\n"); 1681 err = mlx4_INIT_PORT(mdev->dev, priv->port); 1682 if (err) { 1683 en_err(priv, "Failed Initializing port\n"); 1684 goto tx_err; 1685 } 1686 1687 /* Attach rx QP to bradcast address */ 1688 memset(&mc_list[10], 0xff, ETH_ALEN); 1689 mc_list[5] = priv->port; /* needed for B0 steering support */ 1690 if (mlx4_multicast_attach(mdev->dev, &priv->rss_map.indir_qp, mc_list, 1691 priv->port, 0, MLX4_PROT_ETH, 1692 &priv->broadcast_id)) 1693 mlx4_warn(mdev, "Failed Attaching Broadcast\n"); 1694 1695 /* Must redo promiscuous mode setup. */ 1696 priv->flags &= ~(MLX4_EN_FLAG_PROMISC | MLX4_EN_FLAG_MC_PROMISC); 1697 1698 /* Schedule multicast task to populate multicast list */ 1699 queue_work(mdev->workqueue, &priv->rx_mode_task); 1700 1701 mlx4_set_stats_bitmap(mdev->dev, &priv->stats_bitmap); 1702 1703 #ifdef CONFIG_MLX4_EN_VXLAN 1704 if (priv->mdev->dev->caps.tunnel_offload_mode == MLX4_TUNNEL_OFFLOAD_MODE_VXLAN) 1705 vxlan_get_rx_port(dev); 1706 #endif 1707 priv->port_up = true; 1708 netif_tx_start_all_queues(dev); 1709 netif_device_attach(dev); 1710 1711 return 0; 1712 1713 tx_err: 1714 while (tx_index--) { 1715 mlx4_en_deactivate_tx_ring(priv, priv->tx_ring[tx_index]); 1716 mlx4_en_deactivate_cq(priv, priv->tx_cq[tx_index]); 1717 } 1718 mlx4_en_destroy_drop_qp(priv); 1719 rss_err: 1720 mlx4_en_release_rss_steer(priv); 1721 mac_err: 1722 mlx4_en_put_qp(priv); 1723 cq_err: 1724 while (rx_index--) { 1725 mlx4_en_deactivate_cq(priv, priv->rx_cq[rx_index]); 1726 mlx4_en_free_affinity_hint(priv, i); 1727 } 1728 for (i = 0; i < priv->rx_ring_num; i++) 1729 mlx4_en_deactivate_rx_ring(priv, priv->rx_ring[i]); 1730 1731 return err; /* need to close devices */ 1732 } 1733 1734 1735 void mlx4_en_stop_port(struct net_device *dev, int detach) 1736 { 1737 struct mlx4_en_priv *priv = netdev_priv(dev); 1738 struct mlx4_en_dev *mdev = priv->mdev; 1739 struct mlx4_en_mc_list *mclist, *tmp; 1740 struct ethtool_flow_id *flow, *tmp_flow; 1741 int i; 1742 u8 mc_list[16] = {0}; 1743 1744 if (!priv->port_up) { 1745 en_dbg(DRV, priv, "stop port called while port already down\n"); 1746 return; 1747 } 1748 1749 /* close port*/ 1750 mlx4_CLOSE_PORT(mdev->dev, priv->port); 1751 1752 /* Synchronize with tx routine */ 1753 netif_tx_lock_bh(dev); 1754 if (detach) 1755 netif_device_detach(dev); 1756 netif_tx_stop_all_queues(dev); 1757 netif_tx_unlock_bh(dev); 1758 1759 netif_tx_disable(dev); 1760 1761 /* Set port as not active */ 1762 priv->port_up = false; 1763 1764 /* Promsicuous mode */ 1765 if (mdev->dev->caps.steering_mode == 1766 MLX4_STEERING_MODE_DEVICE_MANAGED) { 1767 priv->flags &= ~(MLX4_EN_FLAG_PROMISC | 1768 MLX4_EN_FLAG_MC_PROMISC); 1769 mlx4_flow_steer_promisc_remove(mdev->dev, 1770 priv->port, 1771 MLX4_FS_ALL_DEFAULT); 1772 mlx4_flow_steer_promisc_remove(mdev->dev, 1773 priv->port, 1774 MLX4_FS_MC_DEFAULT); 1775 } else if (priv->flags & MLX4_EN_FLAG_PROMISC) { 1776 priv->flags &= ~MLX4_EN_FLAG_PROMISC; 1777 1778 /* Disable promiscouos mode */ 1779 mlx4_unicast_promisc_remove(mdev->dev, priv->base_qpn, 1780 priv->port); 1781 1782 /* Disable Multicast promisc */ 1783 if (priv->flags & MLX4_EN_FLAG_MC_PROMISC) { 1784 mlx4_multicast_promisc_remove(mdev->dev, priv->base_qpn, 1785 priv->port); 1786 priv->flags &= ~MLX4_EN_FLAG_MC_PROMISC; 1787 } 1788 } 1789 1790 /* Detach All multicasts */ 1791 memset(&mc_list[10], 0xff, ETH_ALEN); 1792 mc_list[5] = priv->port; /* needed for B0 steering support */ 1793 mlx4_multicast_detach(mdev->dev, &priv->rss_map.indir_qp, mc_list, 1794 MLX4_PROT_ETH, priv->broadcast_id); 1795 list_for_each_entry(mclist, &priv->curr_list, list) { 1796 memcpy(&mc_list[10], mclist->addr, ETH_ALEN); 1797 mc_list[5] = priv->port; 1798 mlx4_multicast_detach(mdev->dev, &priv->rss_map.indir_qp, 1799 mc_list, MLX4_PROT_ETH, mclist->reg_id); 1800 if (mclist->tunnel_reg_id) 1801 mlx4_flow_detach(mdev->dev, mclist->tunnel_reg_id); 1802 } 1803 mlx4_en_clear_list(dev); 1804 list_for_each_entry_safe(mclist, tmp, &priv->curr_list, list) { 1805 list_del(&mclist->list); 1806 kfree(mclist); 1807 } 1808 1809 /* Flush multicast filter */ 1810 mlx4_SET_MCAST_FLTR(mdev->dev, priv->port, 0, 1, MLX4_MCAST_CONFIG); 1811 1812 /* Remove flow steering rules for the port*/ 1813 if (mdev->dev->caps.steering_mode == 1814 MLX4_STEERING_MODE_DEVICE_MANAGED) { 1815 ASSERT_RTNL(); 1816 list_for_each_entry_safe(flow, tmp_flow, 1817 &priv->ethtool_list, list) { 1818 mlx4_flow_detach(mdev->dev, flow->id); 1819 list_del(&flow->list); 1820 } 1821 } 1822 1823 mlx4_en_destroy_drop_qp(priv); 1824 1825 /* Free TX Rings */ 1826 for (i = 0; i < priv->tx_ring_num; i++) { 1827 mlx4_en_deactivate_tx_ring(priv, priv->tx_ring[i]); 1828 mlx4_en_deactivate_cq(priv, priv->tx_cq[i]); 1829 } 1830 msleep(10); 1831 1832 for (i = 0; i < priv->tx_ring_num; i++) 1833 mlx4_en_free_tx_buf(dev, priv->tx_ring[i]); 1834 1835 /* Free RSS qps */ 1836 mlx4_en_release_rss_steer(priv); 1837 1838 /* Unregister Mac address for the port */ 1839 mlx4_en_put_qp(priv); 1840 if (!(mdev->dev->caps.flags2 & MLX4_DEV_CAP_FLAG2_REASSIGN_MAC_EN)) 1841 mdev->mac_removed[priv->port] = 1; 1842 1843 /* Free RX Rings */ 1844 for (i = 0; i < priv->rx_ring_num; i++) { 1845 struct mlx4_en_cq *cq = priv->rx_cq[i]; 1846 1847 local_bh_disable(); 1848 while (!mlx4_en_cq_lock_napi(cq)) { 1849 pr_info("CQ %d locked\n", i); 1850 mdelay(1); 1851 } 1852 local_bh_enable(); 1853 1854 napi_synchronize(&cq->napi); 1855 mlx4_en_deactivate_rx_ring(priv, priv->rx_ring[i]); 1856 mlx4_en_deactivate_cq(priv, cq); 1857 1858 mlx4_en_free_affinity_hint(priv, i); 1859 } 1860 } 1861 1862 static void mlx4_en_restart(struct work_struct *work) 1863 { 1864 struct mlx4_en_priv *priv = container_of(work, struct mlx4_en_priv, 1865 watchdog_task); 1866 struct mlx4_en_dev *mdev = priv->mdev; 1867 struct net_device *dev = priv->dev; 1868 1869 en_dbg(DRV, priv, "Watchdog task called for port %d\n", priv->port); 1870 1871 mutex_lock(&mdev->state_lock); 1872 if (priv->port_up) { 1873 mlx4_en_stop_port(dev, 1); 1874 if (mlx4_en_start_port(dev)) 1875 en_err(priv, "Failed restarting port %d\n", priv->port); 1876 } 1877 mutex_unlock(&mdev->state_lock); 1878 } 1879 1880 static void mlx4_en_clear_stats(struct net_device *dev) 1881 { 1882 struct mlx4_en_priv *priv = netdev_priv(dev); 1883 struct mlx4_en_dev *mdev = priv->mdev; 1884 int i; 1885 1886 if (mlx4_en_DUMP_ETH_STATS(mdev, priv->port, 1)) 1887 en_dbg(HW, priv, "Failed dumping statistics\n"); 1888 1889 memset(&priv->stats, 0, sizeof(priv->stats)); 1890 memset(&priv->pstats, 0, sizeof(priv->pstats)); 1891 memset(&priv->pkstats, 0, sizeof(priv->pkstats)); 1892 memset(&priv->port_stats, 0, sizeof(priv->port_stats)); 1893 1894 for (i = 0; i < priv->tx_ring_num; i++) { 1895 priv->tx_ring[i]->bytes = 0; 1896 priv->tx_ring[i]->packets = 0; 1897 priv->tx_ring[i]->tx_csum = 0; 1898 } 1899 for (i = 0; i < priv->rx_ring_num; i++) { 1900 priv->rx_ring[i]->bytes = 0; 1901 priv->rx_ring[i]->packets = 0; 1902 priv->rx_ring[i]->csum_ok = 0; 1903 priv->rx_ring[i]->csum_none = 0; 1904 priv->rx_ring[i]->csum_complete = 0; 1905 } 1906 } 1907 1908 static int mlx4_en_open(struct net_device *dev) 1909 { 1910 struct mlx4_en_priv *priv = netdev_priv(dev); 1911 struct mlx4_en_dev *mdev = priv->mdev; 1912 int err = 0; 1913 1914 mutex_lock(&mdev->state_lock); 1915 1916 if (!mdev->device_up) { 1917 en_err(priv, "Cannot open - device down/disabled\n"); 1918 err = -EBUSY; 1919 goto out; 1920 } 1921 1922 /* Reset HW statistics and SW counters */ 1923 mlx4_en_clear_stats(dev); 1924 1925 err = mlx4_en_start_port(dev); 1926 if (err) 1927 en_err(priv, "Failed starting port:%d\n", priv->port); 1928 1929 out: 1930 mutex_unlock(&mdev->state_lock); 1931 return err; 1932 } 1933 1934 1935 static int mlx4_en_close(struct net_device *dev) 1936 { 1937 struct mlx4_en_priv *priv = netdev_priv(dev); 1938 struct mlx4_en_dev *mdev = priv->mdev; 1939 1940 en_dbg(IFDOWN, priv, "Close port called\n"); 1941 1942 mutex_lock(&mdev->state_lock); 1943 1944 mlx4_en_stop_port(dev, 0); 1945 netif_carrier_off(dev); 1946 1947 mutex_unlock(&mdev->state_lock); 1948 return 0; 1949 } 1950 1951 void mlx4_en_free_resources(struct mlx4_en_priv *priv) 1952 { 1953 int i; 1954 1955 #ifdef CONFIG_RFS_ACCEL 1956 free_irq_cpu_rmap(priv->dev->rx_cpu_rmap); 1957 priv->dev->rx_cpu_rmap = NULL; 1958 #endif 1959 1960 for (i = 0; i < priv->tx_ring_num; i++) { 1961 if (priv->tx_ring && priv->tx_ring[i]) 1962 mlx4_en_destroy_tx_ring(priv, &priv->tx_ring[i]); 1963 if (priv->tx_cq && priv->tx_cq[i]) 1964 mlx4_en_destroy_cq(priv, &priv->tx_cq[i]); 1965 } 1966 1967 for (i = 0; i < priv->rx_ring_num; i++) { 1968 if (priv->rx_ring[i]) 1969 mlx4_en_destroy_rx_ring(priv, &priv->rx_ring[i], 1970 priv->prof->rx_ring_size, priv->stride); 1971 if (priv->rx_cq[i]) 1972 mlx4_en_destroy_cq(priv, &priv->rx_cq[i]); 1973 } 1974 1975 if (priv->base_tx_qpn) { 1976 mlx4_qp_release_range(priv->mdev->dev, priv->base_tx_qpn, priv->tx_ring_num); 1977 priv->base_tx_qpn = 0; 1978 } 1979 } 1980 1981 int mlx4_en_alloc_resources(struct mlx4_en_priv *priv) 1982 { 1983 struct mlx4_en_port_profile *prof = priv->prof; 1984 int i; 1985 int node; 1986 1987 /* Create tx Rings */ 1988 for (i = 0; i < priv->tx_ring_num; i++) { 1989 node = cpu_to_node(i % num_online_cpus()); 1990 if (mlx4_en_create_cq(priv, &priv->tx_cq[i], 1991 prof->tx_ring_size, i, TX, node)) 1992 goto err; 1993 1994 if (mlx4_en_create_tx_ring(priv, &priv->tx_ring[i], 1995 prof->tx_ring_size, TXBB_SIZE, 1996 node, i)) 1997 goto err; 1998 } 1999 2000 /* Create rx Rings */ 2001 for (i = 0; i < priv->rx_ring_num; i++) { 2002 node = cpu_to_node(i % num_online_cpus()); 2003 if (mlx4_en_create_cq(priv, &priv->rx_cq[i], 2004 prof->rx_ring_size, i, RX, node)) 2005 goto err; 2006 2007 if (mlx4_en_create_rx_ring(priv, &priv->rx_ring[i], 2008 prof->rx_ring_size, priv->stride, 2009 node)) 2010 goto err; 2011 } 2012 2013 #ifdef CONFIG_RFS_ACCEL 2014 if (priv->mdev->dev->caps.comp_pool) { 2015 priv->dev->rx_cpu_rmap = alloc_irq_cpu_rmap(priv->mdev->dev->caps.comp_pool); 2016 if (!priv->dev->rx_cpu_rmap) 2017 goto err; 2018 } 2019 #endif 2020 2021 return 0; 2022 2023 err: 2024 en_err(priv, "Failed to allocate NIC resources\n"); 2025 for (i = 0; i < priv->rx_ring_num; i++) { 2026 if (priv->rx_ring[i]) 2027 mlx4_en_destroy_rx_ring(priv, &priv->rx_ring[i], 2028 prof->rx_ring_size, 2029 priv->stride); 2030 if (priv->rx_cq[i]) 2031 mlx4_en_destroy_cq(priv, &priv->rx_cq[i]); 2032 } 2033 for (i = 0; i < priv->tx_ring_num; i++) { 2034 if (priv->tx_ring[i]) 2035 mlx4_en_destroy_tx_ring(priv, &priv->tx_ring[i]); 2036 if (priv->tx_cq[i]) 2037 mlx4_en_destroy_cq(priv, &priv->tx_cq[i]); 2038 } 2039 return -ENOMEM; 2040 } 2041 2042 2043 void mlx4_en_destroy_netdev(struct net_device *dev) 2044 { 2045 struct mlx4_en_priv *priv = netdev_priv(dev); 2046 struct mlx4_en_dev *mdev = priv->mdev; 2047 2048 en_dbg(DRV, priv, "Destroying netdev on port:%d\n", priv->port); 2049 2050 /* Unregister device - this will close the port if it was up */ 2051 if (priv->registered) 2052 unregister_netdev(dev); 2053 2054 if (priv->allocated) 2055 mlx4_free_hwq_res(mdev->dev, &priv->res, MLX4_EN_PAGE_SIZE); 2056 2057 cancel_delayed_work(&priv->stats_task); 2058 cancel_delayed_work(&priv->service_task); 2059 /* flush any pending task for this netdev */ 2060 flush_workqueue(mdev->workqueue); 2061 2062 /* Detach the netdev so tasks would not attempt to access it */ 2063 mutex_lock(&mdev->state_lock); 2064 mdev->pndev[priv->port] = NULL; 2065 mdev->upper[priv->port] = NULL; 2066 mutex_unlock(&mdev->state_lock); 2067 2068 mlx4_en_free_resources(priv); 2069 2070 kfree(priv->tx_ring); 2071 kfree(priv->tx_cq); 2072 2073 free_netdev(dev); 2074 } 2075 2076 static int mlx4_en_change_mtu(struct net_device *dev, int new_mtu) 2077 { 2078 struct mlx4_en_priv *priv = netdev_priv(dev); 2079 struct mlx4_en_dev *mdev = priv->mdev; 2080 int err = 0; 2081 2082 en_dbg(DRV, priv, "Change MTU called - current:%d new:%d\n", 2083 dev->mtu, new_mtu); 2084 2085 if ((new_mtu < MLX4_EN_MIN_MTU) || (new_mtu > priv->max_mtu)) { 2086 en_err(priv, "Bad MTU size:%d.\n", new_mtu); 2087 return -EPERM; 2088 } 2089 dev->mtu = new_mtu; 2090 2091 if (netif_running(dev)) { 2092 mutex_lock(&mdev->state_lock); 2093 if (!mdev->device_up) { 2094 /* NIC is probably restarting - let watchdog task reset 2095 * the port */ 2096 en_dbg(DRV, priv, "Change MTU called with card down!?\n"); 2097 } else { 2098 mlx4_en_stop_port(dev, 1); 2099 err = mlx4_en_start_port(dev); 2100 if (err) { 2101 en_err(priv, "Failed restarting port:%d\n", 2102 priv->port); 2103 queue_work(mdev->workqueue, &priv->watchdog_task); 2104 } 2105 } 2106 mutex_unlock(&mdev->state_lock); 2107 } 2108 return 0; 2109 } 2110 2111 static int mlx4_en_hwtstamp_set(struct net_device *dev, struct ifreq *ifr) 2112 { 2113 struct mlx4_en_priv *priv = netdev_priv(dev); 2114 struct mlx4_en_dev *mdev = priv->mdev; 2115 struct hwtstamp_config config; 2116 2117 if (copy_from_user(&config, ifr->ifr_data, sizeof(config))) 2118 return -EFAULT; 2119 2120 /* reserved for future extensions */ 2121 if (config.flags) 2122 return -EINVAL; 2123 2124 /* device doesn't support time stamping */ 2125 if (!(mdev->dev->caps.flags2 & MLX4_DEV_CAP_FLAG2_TS)) 2126 return -EINVAL; 2127 2128 /* TX HW timestamp */ 2129 switch (config.tx_type) { 2130 case HWTSTAMP_TX_OFF: 2131 case HWTSTAMP_TX_ON: 2132 break; 2133 default: 2134 return -ERANGE; 2135 } 2136 2137 /* RX HW timestamp */ 2138 switch (config.rx_filter) { 2139 case HWTSTAMP_FILTER_NONE: 2140 break; 2141 case HWTSTAMP_FILTER_ALL: 2142 case HWTSTAMP_FILTER_SOME: 2143 case HWTSTAMP_FILTER_PTP_V1_L4_EVENT: 2144 case HWTSTAMP_FILTER_PTP_V1_L4_SYNC: 2145 case HWTSTAMP_FILTER_PTP_V1_L4_DELAY_REQ: 2146 case HWTSTAMP_FILTER_PTP_V2_L4_EVENT: 2147 case HWTSTAMP_FILTER_PTP_V2_L4_SYNC: 2148 case HWTSTAMP_FILTER_PTP_V2_L4_DELAY_REQ: 2149 case HWTSTAMP_FILTER_PTP_V2_L2_EVENT: 2150 case HWTSTAMP_FILTER_PTP_V2_L2_SYNC: 2151 case HWTSTAMP_FILTER_PTP_V2_L2_DELAY_REQ: 2152 case HWTSTAMP_FILTER_PTP_V2_EVENT: 2153 case HWTSTAMP_FILTER_PTP_V2_SYNC: 2154 case HWTSTAMP_FILTER_PTP_V2_DELAY_REQ: 2155 config.rx_filter = HWTSTAMP_FILTER_ALL; 2156 break; 2157 default: 2158 return -ERANGE; 2159 } 2160 2161 if (mlx4_en_reset_config(dev, config, dev->features)) { 2162 config.tx_type = HWTSTAMP_TX_OFF; 2163 config.rx_filter = HWTSTAMP_FILTER_NONE; 2164 } 2165 2166 return copy_to_user(ifr->ifr_data, &config, 2167 sizeof(config)) ? -EFAULT : 0; 2168 } 2169 2170 static int mlx4_en_hwtstamp_get(struct net_device *dev, struct ifreq *ifr) 2171 { 2172 struct mlx4_en_priv *priv = netdev_priv(dev); 2173 2174 return copy_to_user(ifr->ifr_data, &priv->hwtstamp_config, 2175 sizeof(priv->hwtstamp_config)) ? -EFAULT : 0; 2176 } 2177 2178 static int mlx4_en_ioctl(struct net_device *dev, struct ifreq *ifr, int cmd) 2179 { 2180 switch (cmd) { 2181 case SIOCSHWTSTAMP: 2182 return mlx4_en_hwtstamp_set(dev, ifr); 2183 case SIOCGHWTSTAMP: 2184 return mlx4_en_hwtstamp_get(dev, ifr); 2185 default: 2186 return -EOPNOTSUPP; 2187 } 2188 } 2189 2190 static int mlx4_en_set_features(struct net_device *netdev, 2191 netdev_features_t features) 2192 { 2193 struct mlx4_en_priv *priv = netdev_priv(netdev); 2194 int ret = 0; 2195 2196 if (DEV_FEATURE_CHANGED(netdev, features, NETIF_F_HW_VLAN_CTAG_RX)) { 2197 en_info(priv, "Turn %s RX vlan strip offload\n", 2198 (features & NETIF_F_HW_VLAN_CTAG_RX) ? "ON" : "OFF"); 2199 ret = mlx4_en_reset_config(netdev, priv->hwtstamp_config, 2200 features); 2201 if (ret) 2202 return ret; 2203 } 2204 2205 if (DEV_FEATURE_CHANGED(netdev, features, NETIF_F_HW_VLAN_CTAG_TX)) 2206 en_info(priv, "Turn %s TX vlan strip offload\n", 2207 (features & NETIF_F_HW_VLAN_CTAG_TX) ? "ON" : "OFF"); 2208 2209 if (features & NETIF_F_LOOPBACK) 2210 priv->ctrl_flags |= cpu_to_be32(MLX4_WQE_CTRL_FORCE_LOOPBACK); 2211 else 2212 priv->ctrl_flags &= 2213 cpu_to_be32(~MLX4_WQE_CTRL_FORCE_LOOPBACK); 2214 2215 mlx4_en_update_loopback_state(netdev, features); 2216 2217 return 0; 2218 2219 } 2220 2221 static int mlx4_en_set_vf_mac(struct net_device *dev, int queue, u8 *mac) 2222 { 2223 struct mlx4_en_priv *en_priv = netdev_priv(dev); 2224 struct mlx4_en_dev *mdev = en_priv->mdev; 2225 u64 mac_u64 = mlx4_mac_to_u64(mac); 2226 2227 if (!is_valid_ether_addr(mac)) 2228 return -EINVAL; 2229 2230 return mlx4_set_vf_mac(mdev->dev, en_priv->port, queue, mac_u64); 2231 } 2232 2233 static int mlx4_en_set_vf_vlan(struct net_device *dev, int vf, u16 vlan, u8 qos) 2234 { 2235 struct mlx4_en_priv *en_priv = netdev_priv(dev); 2236 struct mlx4_en_dev *mdev = en_priv->mdev; 2237 2238 return mlx4_set_vf_vlan(mdev->dev, en_priv->port, vf, vlan, qos); 2239 } 2240 2241 static int mlx4_en_set_vf_spoofchk(struct net_device *dev, int vf, bool setting) 2242 { 2243 struct mlx4_en_priv *en_priv = netdev_priv(dev); 2244 struct mlx4_en_dev *mdev = en_priv->mdev; 2245 2246 return mlx4_set_vf_spoofchk(mdev->dev, en_priv->port, vf, setting); 2247 } 2248 2249 static int mlx4_en_get_vf_config(struct net_device *dev, int vf, struct ifla_vf_info *ivf) 2250 { 2251 struct mlx4_en_priv *en_priv = netdev_priv(dev); 2252 struct mlx4_en_dev *mdev = en_priv->mdev; 2253 2254 return mlx4_get_vf_config(mdev->dev, en_priv->port, vf, ivf); 2255 } 2256 2257 static int mlx4_en_set_vf_link_state(struct net_device *dev, int vf, int link_state) 2258 { 2259 struct mlx4_en_priv *en_priv = netdev_priv(dev); 2260 struct mlx4_en_dev *mdev = en_priv->mdev; 2261 2262 return mlx4_set_vf_link_state(mdev->dev, en_priv->port, vf, link_state); 2263 } 2264 2265 #define PORT_ID_BYTE_LEN 8 2266 static int mlx4_en_get_phys_port_id(struct net_device *dev, 2267 struct netdev_phys_item_id *ppid) 2268 { 2269 struct mlx4_en_priv *priv = netdev_priv(dev); 2270 struct mlx4_dev *mdev = priv->mdev->dev; 2271 int i; 2272 u64 phys_port_id = mdev->caps.phys_port_id[priv->port]; 2273 2274 if (!phys_port_id) 2275 return -EOPNOTSUPP; 2276 2277 ppid->id_len = sizeof(phys_port_id); 2278 for (i = PORT_ID_BYTE_LEN - 1; i >= 0; --i) { 2279 ppid->id[i] = phys_port_id & 0xff; 2280 phys_port_id >>= 8; 2281 } 2282 return 0; 2283 } 2284 2285 #ifdef CONFIG_MLX4_EN_VXLAN 2286 static void mlx4_en_add_vxlan_offloads(struct work_struct *work) 2287 { 2288 int ret; 2289 struct mlx4_en_priv *priv = container_of(work, struct mlx4_en_priv, 2290 vxlan_add_task); 2291 2292 ret = mlx4_config_vxlan_port(priv->mdev->dev, priv->vxlan_port); 2293 if (ret) 2294 goto out; 2295 2296 ret = mlx4_SET_PORT_VXLAN(priv->mdev->dev, priv->port, 2297 VXLAN_STEER_BY_OUTER_MAC, 1); 2298 out: 2299 if (ret) { 2300 en_err(priv, "failed setting L2 tunnel configuration ret %d\n", ret); 2301 return; 2302 } 2303 2304 /* set offloads */ 2305 priv->dev->hw_enc_features |= NETIF_F_IP_CSUM | NETIF_F_RXCSUM | 2306 NETIF_F_TSO | NETIF_F_GSO_UDP_TUNNEL; 2307 priv->dev->hw_features |= NETIF_F_GSO_UDP_TUNNEL; 2308 priv->dev->features |= NETIF_F_GSO_UDP_TUNNEL; 2309 } 2310 2311 static void mlx4_en_del_vxlan_offloads(struct work_struct *work) 2312 { 2313 int ret; 2314 struct mlx4_en_priv *priv = container_of(work, struct mlx4_en_priv, 2315 vxlan_del_task); 2316 /* unset offloads */ 2317 priv->dev->hw_enc_features &= ~(NETIF_F_IP_CSUM | NETIF_F_RXCSUM | 2318 NETIF_F_TSO | NETIF_F_GSO_UDP_TUNNEL); 2319 priv->dev->hw_features &= ~NETIF_F_GSO_UDP_TUNNEL; 2320 priv->dev->features &= ~NETIF_F_GSO_UDP_TUNNEL; 2321 2322 ret = mlx4_SET_PORT_VXLAN(priv->mdev->dev, priv->port, 2323 VXLAN_STEER_BY_OUTER_MAC, 0); 2324 if (ret) 2325 en_err(priv, "failed setting L2 tunnel configuration ret %d\n", ret); 2326 2327 priv->vxlan_port = 0; 2328 } 2329 2330 static void mlx4_en_add_vxlan_port(struct net_device *dev, 2331 sa_family_t sa_family, __be16 port) 2332 { 2333 struct mlx4_en_priv *priv = netdev_priv(dev); 2334 __be16 current_port; 2335 2336 if (priv->mdev->dev->caps.tunnel_offload_mode != MLX4_TUNNEL_OFFLOAD_MODE_VXLAN) 2337 return; 2338 2339 if (sa_family == AF_INET6) 2340 return; 2341 2342 current_port = priv->vxlan_port; 2343 if (current_port && current_port != port) { 2344 en_warn(priv, "vxlan port %d configured, can't add port %d\n", 2345 ntohs(current_port), ntohs(port)); 2346 return; 2347 } 2348 2349 priv->vxlan_port = port; 2350 queue_work(priv->mdev->workqueue, &priv->vxlan_add_task); 2351 } 2352 2353 static void mlx4_en_del_vxlan_port(struct net_device *dev, 2354 sa_family_t sa_family, __be16 port) 2355 { 2356 struct mlx4_en_priv *priv = netdev_priv(dev); 2357 __be16 current_port; 2358 2359 if (priv->mdev->dev->caps.tunnel_offload_mode != MLX4_TUNNEL_OFFLOAD_MODE_VXLAN) 2360 return; 2361 2362 if (sa_family == AF_INET6) 2363 return; 2364 2365 current_port = priv->vxlan_port; 2366 if (current_port != port) { 2367 en_dbg(DRV, priv, "vxlan port %d isn't configured, ignoring\n", ntohs(port)); 2368 return; 2369 } 2370 2371 queue_work(priv->mdev->workqueue, &priv->vxlan_del_task); 2372 } 2373 2374 static netdev_features_t mlx4_en_features_check(struct sk_buff *skb, 2375 struct net_device *dev, 2376 netdev_features_t features) 2377 { 2378 return vxlan_features_check(skb, features); 2379 } 2380 #endif 2381 2382 static const struct net_device_ops mlx4_netdev_ops = { 2383 .ndo_open = mlx4_en_open, 2384 .ndo_stop = mlx4_en_close, 2385 .ndo_start_xmit = mlx4_en_xmit, 2386 .ndo_select_queue = mlx4_en_select_queue, 2387 .ndo_get_stats = mlx4_en_get_stats, 2388 .ndo_set_rx_mode = mlx4_en_set_rx_mode, 2389 .ndo_set_mac_address = mlx4_en_set_mac, 2390 .ndo_validate_addr = eth_validate_addr, 2391 .ndo_change_mtu = mlx4_en_change_mtu, 2392 .ndo_do_ioctl = mlx4_en_ioctl, 2393 .ndo_tx_timeout = mlx4_en_tx_timeout, 2394 .ndo_vlan_rx_add_vid = mlx4_en_vlan_rx_add_vid, 2395 .ndo_vlan_rx_kill_vid = mlx4_en_vlan_rx_kill_vid, 2396 #ifdef CONFIG_NET_POLL_CONTROLLER 2397 .ndo_poll_controller = mlx4_en_netpoll, 2398 #endif 2399 .ndo_set_features = mlx4_en_set_features, 2400 .ndo_setup_tc = mlx4_en_setup_tc, 2401 #ifdef CONFIG_RFS_ACCEL 2402 .ndo_rx_flow_steer = mlx4_en_filter_rfs, 2403 #endif 2404 #ifdef CONFIG_NET_RX_BUSY_POLL 2405 .ndo_busy_poll = mlx4_en_low_latency_recv, 2406 #endif 2407 .ndo_get_phys_port_id = mlx4_en_get_phys_port_id, 2408 #ifdef CONFIG_MLX4_EN_VXLAN 2409 .ndo_add_vxlan_port = mlx4_en_add_vxlan_port, 2410 .ndo_del_vxlan_port = mlx4_en_del_vxlan_port, 2411 .ndo_features_check = mlx4_en_features_check, 2412 #endif 2413 }; 2414 2415 static const struct net_device_ops mlx4_netdev_ops_master = { 2416 .ndo_open = mlx4_en_open, 2417 .ndo_stop = mlx4_en_close, 2418 .ndo_start_xmit = mlx4_en_xmit, 2419 .ndo_select_queue = mlx4_en_select_queue, 2420 .ndo_get_stats = mlx4_en_get_stats, 2421 .ndo_set_rx_mode = mlx4_en_set_rx_mode, 2422 .ndo_set_mac_address = mlx4_en_set_mac, 2423 .ndo_validate_addr = eth_validate_addr, 2424 .ndo_change_mtu = mlx4_en_change_mtu, 2425 .ndo_tx_timeout = mlx4_en_tx_timeout, 2426 .ndo_vlan_rx_add_vid = mlx4_en_vlan_rx_add_vid, 2427 .ndo_vlan_rx_kill_vid = mlx4_en_vlan_rx_kill_vid, 2428 .ndo_set_vf_mac = mlx4_en_set_vf_mac, 2429 .ndo_set_vf_vlan = mlx4_en_set_vf_vlan, 2430 .ndo_set_vf_spoofchk = mlx4_en_set_vf_spoofchk, 2431 .ndo_set_vf_link_state = mlx4_en_set_vf_link_state, 2432 .ndo_get_vf_config = mlx4_en_get_vf_config, 2433 #ifdef CONFIG_NET_POLL_CONTROLLER 2434 .ndo_poll_controller = mlx4_en_netpoll, 2435 #endif 2436 .ndo_set_features = mlx4_en_set_features, 2437 .ndo_setup_tc = mlx4_en_setup_tc, 2438 #ifdef CONFIG_RFS_ACCEL 2439 .ndo_rx_flow_steer = mlx4_en_filter_rfs, 2440 #endif 2441 .ndo_get_phys_port_id = mlx4_en_get_phys_port_id, 2442 #ifdef CONFIG_MLX4_EN_VXLAN 2443 .ndo_add_vxlan_port = mlx4_en_add_vxlan_port, 2444 .ndo_del_vxlan_port = mlx4_en_del_vxlan_port, 2445 .ndo_features_check = mlx4_en_features_check, 2446 #endif 2447 }; 2448 2449 struct mlx4_en_bond { 2450 struct work_struct work; 2451 struct mlx4_en_priv *priv; 2452 int is_bonded; 2453 struct mlx4_port_map port_map; 2454 }; 2455 2456 static void mlx4_en_bond_work(struct work_struct *work) 2457 { 2458 struct mlx4_en_bond *bond = container_of(work, 2459 struct mlx4_en_bond, 2460 work); 2461 int err = 0; 2462 struct mlx4_dev *dev = bond->priv->mdev->dev; 2463 2464 if (bond->is_bonded) { 2465 if (!mlx4_is_bonded(dev)) { 2466 err = mlx4_bond(dev); 2467 if (err) 2468 en_err(bond->priv, "Fail to bond device\n"); 2469 } 2470 if (!err) { 2471 err = mlx4_port_map_set(dev, &bond->port_map); 2472 if (err) 2473 en_err(bond->priv, "Fail to set port map [%d][%d]: %d\n", 2474 bond->port_map.port1, 2475 bond->port_map.port2, 2476 err); 2477 } 2478 } else if (mlx4_is_bonded(dev)) { 2479 err = mlx4_unbond(dev); 2480 if (err) 2481 en_err(bond->priv, "Fail to unbond device\n"); 2482 } 2483 dev_put(bond->priv->dev); 2484 kfree(bond); 2485 } 2486 2487 static int mlx4_en_queue_bond_work(struct mlx4_en_priv *priv, int is_bonded, 2488 u8 v2p_p1, u8 v2p_p2) 2489 { 2490 struct mlx4_en_bond *bond = NULL; 2491 2492 bond = kzalloc(sizeof(*bond), GFP_ATOMIC); 2493 if (!bond) 2494 return -ENOMEM; 2495 2496 INIT_WORK(&bond->work, mlx4_en_bond_work); 2497 bond->priv = priv; 2498 bond->is_bonded = is_bonded; 2499 bond->port_map.port1 = v2p_p1; 2500 bond->port_map.port2 = v2p_p2; 2501 dev_hold(priv->dev); 2502 queue_work(priv->mdev->workqueue, &bond->work); 2503 return 0; 2504 } 2505 2506 int mlx4_en_netdev_event(struct notifier_block *this, 2507 unsigned long event, void *ptr) 2508 { 2509 struct net_device *ndev = netdev_notifier_info_to_dev(ptr); 2510 u8 port = 0; 2511 struct mlx4_en_dev *mdev; 2512 struct mlx4_dev *dev; 2513 int i, num_eth_ports = 0; 2514 bool do_bond = true; 2515 struct mlx4_en_priv *priv; 2516 u8 v2p_port1 = 0; 2517 u8 v2p_port2 = 0; 2518 2519 if (!net_eq(dev_net(ndev), &init_net)) 2520 return NOTIFY_DONE; 2521 2522 mdev = container_of(this, struct mlx4_en_dev, nb); 2523 dev = mdev->dev; 2524 2525 /* Go into this mode only when two network devices set on two ports 2526 * of the same mlx4 device are slaves of the same bonding master 2527 */ 2528 mlx4_foreach_port(i, dev, MLX4_PORT_TYPE_ETH) { 2529 ++num_eth_ports; 2530 if (!port && (mdev->pndev[i] == ndev)) 2531 port = i; 2532 mdev->upper[i] = mdev->pndev[i] ? 2533 netdev_master_upper_dev_get(mdev->pndev[i]) : NULL; 2534 /* condition not met: network device is a slave */ 2535 if (!mdev->upper[i]) 2536 do_bond = false; 2537 if (num_eth_ports < 2) 2538 continue; 2539 /* condition not met: same master */ 2540 if (mdev->upper[i] != mdev->upper[i-1]) 2541 do_bond = false; 2542 } 2543 /* condition not met: 2 salves */ 2544 do_bond = (num_eth_ports == 2) ? do_bond : false; 2545 2546 /* handle only events that come with enough info */ 2547 if ((do_bond && (event != NETDEV_BONDING_INFO)) || !port) 2548 return NOTIFY_DONE; 2549 2550 priv = netdev_priv(ndev); 2551 if (do_bond) { 2552 struct netdev_notifier_bonding_info *notifier_info = ptr; 2553 struct netdev_bonding_info *bonding_info = 2554 ¬ifier_info->bonding_info; 2555 2556 /* required mode 1, 2 or 4 */ 2557 if ((bonding_info->master.bond_mode != BOND_MODE_ACTIVEBACKUP) && 2558 (bonding_info->master.bond_mode != BOND_MODE_XOR) && 2559 (bonding_info->master.bond_mode != BOND_MODE_8023AD)) 2560 do_bond = false; 2561 2562 /* require exactly 2 slaves */ 2563 if (bonding_info->master.num_slaves != 2) 2564 do_bond = false; 2565 2566 /* calc v2p */ 2567 if (do_bond) { 2568 if (bonding_info->master.bond_mode == 2569 BOND_MODE_ACTIVEBACKUP) { 2570 /* in active-backup mode virtual ports are 2571 * mapped to the physical port of the active 2572 * slave */ 2573 if (bonding_info->slave.state == 2574 BOND_STATE_BACKUP) { 2575 if (port == 1) { 2576 v2p_port1 = 2; 2577 v2p_port2 = 2; 2578 } else { 2579 v2p_port1 = 1; 2580 v2p_port2 = 1; 2581 } 2582 } else { /* BOND_STATE_ACTIVE */ 2583 if (port == 1) { 2584 v2p_port1 = 1; 2585 v2p_port2 = 1; 2586 } else { 2587 v2p_port1 = 2; 2588 v2p_port2 = 2; 2589 } 2590 } 2591 } else { /* Active-Active */ 2592 /* in active-active mode a virtual port is 2593 * mapped to the native physical port if and only 2594 * if the physical port is up */ 2595 __s8 link = bonding_info->slave.link; 2596 2597 if (port == 1) 2598 v2p_port2 = 2; 2599 else 2600 v2p_port1 = 1; 2601 if ((link == BOND_LINK_UP) || 2602 (link == BOND_LINK_FAIL)) { 2603 if (port == 1) 2604 v2p_port1 = 1; 2605 else 2606 v2p_port2 = 2; 2607 } else { /* BOND_LINK_DOWN || BOND_LINK_BACK */ 2608 if (port == 1) 2609 v2p_port1 = 2; 2610 else 2611 v2p_port2 = 1; 2612 } 2613 } 2614 } 2615 } 2616 2617 mlx4_en_queue_bond_work(priv, do_bond, 2618 v2p_port1, v2p_port2); 2619 2620 return NOTIFY_DONE; 2621 } 2622 2623 int mlx4_en_init_netdev(struct mlx4_en_dev *mdev, int port, 2624 struct mlx4_en_port_profile *prof) 2625 { 2626 struct net_device *dev; 2627 struct mlx4_en_priv *priv; 2628 int i; 2629 int err; 2630 u64 mac_u64; 2631 2632 dev = alloc_etherdev_mqs(sizeof(struct mlx4_en_priv), 2633 MAX_TX_RINGS, MAX_RX_RINGS); 2634 if (dev == NULL) 2635 return -ENOMEM; 2636 2637 netif_set_real_num_tx_queues(dev, prof->tx_ring_num); 2638 netif_set_real_num_rx_queues(dev, prof->rx_ring_num); 2639 2640 SET_NETDEV_DEV(dev, &mdev->dev->persist->pdev->dev); 2641 dev->dev_port = port - 1; 2642 2643 /* 2644 * Initialize driver private data 2645 */ 2646 2647 priv = netdev_priv(dev); 2648 memset(priv, 0, sizeof(struct mlx4_en_priv)); 2649 spin_lock_init(&priv->stats_lock); 2650 INIT_WORK(&priv->rx_mode_task, mlx4_en_do_set_rx_mode); 2651 INIT_WORK(&priv->watchdog_task, mlx4_en_restart); 2652 INIT_WORK(&priv->linkstate_task, mlx4_en_linkstate); 2653 INIT_DELAYED_WORK(&priv->stats_task, mlx4_en_do_get_stats); 2654 INIT_DELAYED_WORK(&priv->service_task, mlx4_en_service_task); 2655 #ifdef CONFIG_MLX4_EN_VXLAN 2656 INIT_WORK(&priv->vxlan_add_task, mlx4_en_add_vxlan_offloads); 2657 INIT_WORK(&priv->vxlan_del_task, mlx4_en_del_vxlan_offloads); 2658 #endif 2659 #ifdef CONFIG_RFS_ACCEL 2660 INIT_LIST_HEAD(&priv->filters); 2661 spin_lock_init(&priv->filters_lock); 2662 #endif 2663 2664 priv->dev = dev; 2665 priv->mdev = mdev; 2666 priv->ddev = &mdev->pdev->dev; 2667 priv->prof = prof; 2668 priv->port = port; 2669 priv->port_up = false; 2670 priv->flags = prof->flags; 2671 priv->pflags = MLX4_EN_PRIV_FLAGS_BLUEFLAME; 2672 priv->ctrl_flags = cpu_to_be32(MLX4_WQE_CTRL_CQ_UPDATE | 2673 MLX4_WQE_CTRL_SOLICITED); 2674 priv->num_tx_rings_p_up = mdev->profile.num_tx_rings_p_up; 2675 priv->tx_ring_num = prof->tx_ring_num; 2676 priv->tx_work_limit = MLX4_EN_DEFAULT_TX_WORK; 2677 netdev_rss_key_fill(priv->rss_key, sizeof(priv->rss_key)); 2678 2679 priv->tx_ring = kzalloc(sizeof(struct mlx4_en_tx_ring *) * MAX_TX_RINGS, 2680 GFP_KERNEL); 2681 if (!priv->tx_ring) { 2682 err = -ENOMEM; 2683 goto out; 2684 } 2685 priv->tx_cq = kzalloc(sizeof(struct mlx4_en_cq *) * MAX_TX_RINGS, 2686 GFP_KERNEL); 2687 if (!priv->tx_cq) { 2688 err = -ENOMEM; 2689 goto out; 2690 } 2691 priv->rx_ring_num = prof->rx_ring_num; 2692 priv->cqe_factor = (mdev->dev->caps.cqe_size == 64) ? 1 : 0; 2693 priv->cqe_size = mdev->dev->caps.cqe_size; 2694 priv->mac_index = -1; 2695 priv->msg_enable = MLX4_EN_MSG_LEVEL; 2696 #ifdef CONFIG_MLX4_EN_DCB 2697 if (!mlx4_is_slave(priv->mdev->dev)) { 2698 if (mdev->dev->caps.flags & MLX4_DEV_CAP_FLAG_SET_ETH_SCHED) { 2699 dev->dcbnl_ops = &mlx4_en_dcbnl_ops; 2700 } else { 2701 en_info(priv, "enabling only PFC DCB ops\n"); 2702 dev->dcbnl_ops = &mlx4_en_dcbnl_pfc_ops; 2703 } 2704 } 2705 #endif 2706 2707 for (i = 0; i < MLX4_EN_MAC_HASH_SIZE; ++i) 2708 INIT_HLIST_HEAD(&priv->mac_hash[i]); 2709 2710 /* Query for default mac and max mtu */ 2711 priv->max_mtu = mdev->dev->caps.eth_mtu_cap[priv->port]; 2712 2713 if (mdev->dev->caps.rx_checksum_flags_port[priv->port] & 2714 MLX4_RX_CSUM_MODE_VAL_NON_TCP_UDP) 2715 priv->flags |= MLX4_EN_FLAG_RX_CSUM_NON_TCP_UDP; 2716 2717 /* Set default MAC */ 2718 dev->addr_len = ETH_ALEN; 2719 mlx4_en_u64_to_mac(dev->dev_addr, mdev->dev->caps.def_mac[priv->port]); 2720 if (!is_valid_ether_addr(dev->dev_addr)) { 2721 if (mlx4_is_slave(priv->mdev->dev)) { 2722 eth_hw_addr_random(dev); 2723 en_warn(priv, "Assigned random MAC address %pM\n", dev->dev_addr); 2724 mac_u64 = mlx4_mac_to_u64(dev->dev_addr); 2725 mdev->dev->caps.def_mac[priv->port] = mac_u64; 2726 } else { 2727 en_err(priv, "Port: %d, invalid mac burned: %pM, quiting\n", 2728 priv->port, dev->dev_addr); 2729 err = -EINVAL; 2730 goto out; 2731 } 2732 } 2733 2734 memcpy(priv->current_mac, dev->dev_addr, sizeof(priv->current_mac)); 2735 2736 priv->stride = roundup_pow_of_two(sizeof(struct mlx4_en_rx_desc) + 2737 DS_SIZE * MLX4_EN_MAX_RX_FRAGS); 2738 err = mlx4_en_alloc_resources(priv); 2739 if (err) 2740 goto out; 2741 2742 /* Initialize time stamping config */ 2743 priv->hwtstamp_config.flags = 0; 2744 priv->hwtstamp_config.tx_type = HWTSTAMP_TX_OFF; 2745 priv->hwtstamp_config.rx_filter = HWTSTAMP_FILTER_NONE; 2746 2747 /* Allocate page for receive rings */ 2748 err = mlx4_alloc_hwq_res(mdev->dev, &priv->res, 2749 MLX4_EN_PAGE_SIZE, MLX4_EN_PAGE_SIZE); 2750 if (err) { 2751 en_err(priv, "Failed to allocate page for rx qps\n"); 2752 goto out; 2753 } 2754 priv->allocated = 1; 2755 2756 /* 2757 * Initialize netdev entry points 2758 */ 2759 if (mlx4_is_master(priv->mdev->dev)) 2760 dev->netdev_ops = &mlx4_netdev_ops_master; 2761 else 2762 dev->netdev_ops = &mlx4_netdev_ops; 2763 dev->watchdog_timeo = MLX4_EN_WATCHDOG_TIMEOUT; 2764 netif_set_real_num_tx_queues(dev, priv->tx_ring_num); 2765 netif_set_real_num_rx_queues(dev, priv->rx_ring_num); 2766 2767 dev->ethtool_ops = &mlx4_en_ethtool_ops; 2768 2769 /* 2770 * Set driver features 2771 */ 2772 dev->hw_features = NETIF_F_SG | NETIF_F_IP_CSUM | NETIF_F_IPV6_CSUM; 2773 if (mdev->LSO_support) 2774 dev->hw_features |= NETIF_F_TSO | NETIF_F_TSO6; 2775 2776 dev->vlan_features = dev->hw_features; 2777 2778 dev->hw_features |= NETIF_F_RXCSUM | NETIF_F_RXHASH; 2779 dev->features = dev->hw_features | NETIF_F_HIGHDMA | 2780 NETIF_F_HW_VLAN_CTAG_TX | NETIF_F_HW_VLAN_CTAG_RX | 2781 NETIF_F_HW_VLAN_CTAG_FILTER; 2782 dev->hw_features |= NETIF_F_LOOPBACK | 2783 NETIF_F_HW_VLAN_CTAG_TX | NETIF_F_HW_VLAN_CTAG_RX; 2784 2785 if (mdev->dev->caps.steering_mode == 2786 MLX4_STEERING_MODE_DEVICE_MANAGED && 2787 mdev->dev->caps.dmfs_high_steer_mode != MLX4_STEERING_DMFS_A0_STATIC) 2788 dev->hw_features |= NETIF_F_NTUPLE; 2789 2790 if (mdev->dev->caps.steering_mode != MLX4_STEERING_MODE_A0) 2791 dev->priv_flags |= IFF_UNICAST_FLT; 2792 2793 /* Setting a default hash function value */ 2794 if (mdev->dev->caps.flags2 & MLX4_DEV_CAP_FLAG2_RSS_TOP) { 2795 priv->rss_hash_fn = ETH_RSS_HASH_TOP; 2796 } else if (mdev->dev->caps.flags2 & MLX4_DEV_CAP_FLAG2_RSS_XOR) { 2797 priv->rss_hash_fn = ETH_RSS_HASH_XOR; 2798 } else { 2799 en_warn(priv, 2800 "No RSS hash capabilities exposed, using Toeplitz\n"); 2801 priv->rss_hash_fn = ETH_RSS_HASH_TOP; 2802 } 2803 2804 mdev->pndev[port] = dev; 2805 mdev->upper[port] = NULL; 2806 2807 netif_carrier_off(dev); 2808 mlx4_en_set_default_moderation(priv); 2809 2810 err = register_netdev(dev); 2811 if (err) { 2812 en_err(priv, "Netdev registration failed for port %d\n", port); 2813 goto out; 2814 } 2815 priv->registered = 1; 2816 2817 en_warn(priv, "Using %d TX rings\n", prof->tx_ring_num); 2818 en_warn(priv, "Using %d RX rings\n", prof->rx_ring_num); 2819 2820 mlx4_en_update_loopback_state(priv->dev, priv->dev->features); 2821 2822 /* Configure port */ 2823 mlx4_en_calc_rx_buf(dev); 2824 err = mlx4_SET_PORT_general(mdev->dev, priv->port, 2825 priv->rx_skb_size + ETH_FCS_LEN, 2826 prof->tx_pause, prof->tx_ppp, 2827 prof->rx_pause, prof->rx_ppp); 2828 if (err) { 2829 en_err(priv, "Failed setting port general configurations for port %d, with error %d\n", 2830 priv->port, err); 2831 goto out; 2832 } 2833 2834 if (mdev->dev->caps.tunnel_offload_mode == MLX4_TUNNEL_OFFLOAD_MODE_VXLAN) { 2835 err = mlx4_SET_PORT_VXLAN(mdev->dev, priv->port, VXLAN_STEER_BY_OUTER_MAC, 1); 2836 if (err) { 2837 en_err(priv, "Failed setting port L2 tunnel configuration, err %d\n", 2838 err); 2839 goto out; 2840 } 2841 } 2842 2843 /* Init port */ 2844 en_warn(priv, "Initializing port\n"); 2845 err = mlx4_INIT_PORT(mdev->dev, priv->port); 2846 if (err) { 2847 en_err(priv, "Failed Initializing port\n"); 2848 goto out; 2849 } 2850 queue_delayed_work(mdev->workqueue, &priv->stats_task, STATS_DELAY); 2851 2852 if (mdev->dev->caps.flags2 & MLX4_DEV_CAP_FLAG2_TS) 2853 queue_delayed_work(mdev->workqueue, &priv->service_task, 2854 SERVICE_TASK_DELAY); 2855 2856 return 0; 2857 2858 out: 2859 mlx4_en_destroy_netdev(dev); 2860 return err; 2861 } 2862 2863 int mlx4_en_reset_config(struct net_device *dev, 2864 struct hwtstamp_config ts_config, 2865 netdev_features_t features) 2866 { 2867 struct mlx4_en_priv *priv = netdev_priv(dev); 2868 struct mlx4_en_dev *mdev = priv->mdev; 2869 int port_up = 0; 2870 int err = 0; 2871 2872 if (priv->hwtstamp_config.tx_type == ts_config.tx_type && 2873 priv->hwtstamp_config.rx_filter == ts_config.rx_filter && 2874 !DEV_FEATURE_CHANGED(dev, features, NETIF_F_HW_VLAN_CTAG_RX)) 2875 return 0; /* Nothing to change */ 2876 2877 if (DEV_FEATURE_CHANGED(dev, features, NETIF_F_HW_VLAN_CTAG_RX) && 2878 (features & NETIF_F_HW_VLAN_CTAG_RX) && 2879 (priv->hwtstamp_config.rx_filter != HWTSTAMP_FILTER_NONE)) { 2880 en_warn(priv, "Can't turn ON rx vlan offload while time-stamping rx filter is ON\n"); 2881 return -EINVAL; 2882 } 2883 2884 mutex_lock(&mdev->state_lock); 2885 if (priv->port_up) { 2886 port_up = 1; 2887 mlx4_en_stop_port(dev, 1); 2888 } 2889 2890 mlx4_en_free_resources(priv); 2891 2892 en_warn(priv, "Changing device configuration rx filter(%x) rx vlan(%x)\n", 2893 ts_config.rx_filter, !!(features & NETIF_F_HW_VLAN_CTAG_RX)); 2894 2895 priv->hwtstamp_config.tx_type = ts_config.tx_type; 2896 priv->hwtstamp_config.rx_filter = ts_config.rx_filter; 2897 2898 if (DEV_FEATURE_CHANGED(dev, features, NETIF_F_HW_VLAN_CTAG_RX)) { 2899 if (features & NETIF_F_HW_VLAN_CTAG_RX) 2900 dev->features |= NETIF_F_HW_VLAN_CTAG_RX; 2901 else 2902 dev->features &= ~NETIF_F_HW_VLAN_CTAG_RX; 2903 } else if (ts_config.rx_filter == HWTSTAMP_FILTER_NONE) { 2904 /* RX time-stamping is OFF, update the RX vlan offload 2905 * to the latest wanted state 2906 */ 2907 if (dev->wanted_features & NETIF_F_HW_VLAN_CTAG_RX) 2908 dev->features |= NETIF_F_HW_VLAN_CTAG_RX; 2909 else 2910 dev->features &= ~NETIF_F_HW_VLAN_CTAG_RX; 2911 } 2912 2913 /* RX vlan offload and RX time-stamping can't co-exist ! 2914 * Regardless of the caller's choice, 2915 * Turn Off RX vlan offload in case of time-stamping is ON 2916 */ 2917 if (ts_config.rx_filter != HWTSTAMP_FILTER_NONE) { 2918 if (dev->features & NETIF_F_HW_VLAN_CTAG_RX) 2919 en_warn(priv, "Turning off RX vlan offload since RX time-stamping is ON\n"); 2920 dev->features &= ~NETIF_F_HW_VLAN_CTAG_RX; 2921 } 2922 2923 err = mlx4_en_alloc_resources(priv); 2924 if (err) { 2925 en_err(priv, "Failed reallocating port resources\n"); 2926 goto out; 2927 } 2928 if (port_up) { 2929 err = mlx4_en_start_port(dev); 2930 if (err) 2931 en_err(priv, "Failed starting port\n"); 2932 } 2933 2934 out: 2935 mutex_unlock(&mdev->state_lock); 2936 netdev_features_change(dev); 2937 return err; 2938 } 2939