11da177e4SLinus Torvalds /* 21da177e4SLinus Torvalds * Copyright (c) 2004 Topspin Communications. All rights reserved. 32a1d9b7fSRoland Dreier * Copyright (c) 2005 Sun Microsystems, Inc. All rights reserved. 42a1d9b7fSRoland Dreier * Copyright (c) 2004 Voltaire, Inc. All rights reserved. 51da177e4SLinus Torvalds * 61da177e4SLinus Torvalds * This software is available to you under a choice of one of two 71da177e4SLinus Torvalds * licenses. You may choose to be licensed under the terms of the GNU 81da177e4SLinus Torvalds * General Public License (GPL) Version 2, available from the file 91da177e4SLinus Torvalds * COPYING in the main directory of this source tree, or the 101da177e4SLinus Torvalds * OpenIB.org BSD license below: 111da177e4SLinus Torvalds * 121da177e4SLinus Torvalds * Redistribution and use in source and binary forms, with or 131da177e4SLinus Torvalds * without modification, are permitted provided that the following 141da177e4SLinus Torvalds * conditions are met: 151da177e4SLinus Torvalds * 161da177e4SLinus Torvalds * - Redistributions of source code must retain the above 171da177e4SLinus Torvalds * copyright notice, this list of conditions and the following 181da177e4SLinus Torvalds * disclaimer. 191da177e4SLinus Torvalds * 201da177e4SLinus Torvalds * - Redistributions in binary form must reproduce the above 211da177e4SLinus Torvalds * copyright notice, this list of conditions and the following 221da177e4SLinus Torvalds * disclaimer in the documentation and/or other materials 231da177e4SLinus Torvalds * provided with the distribution. 241da177e4SLinus Torvalds * 251da177e4SLinus Torvalds * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, 261da177e4SLinus Torvalds * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF 271da177e4SLinus Torvalds * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND 281da177e4SLinus Torvalds * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS 291da177e4SLinus Torvalds * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN 301da177e4SLinus Torvalds * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN 311da177e4SLinus Torvalds * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE 321da177e4SLinus Torvalds * SOFTWARE. 331da177e4SLinus Torvalds */ 341da177e4SLinus Torvalds 351da177e4SLinus Torvalds #include "ipoib.h" 361da177e4SLinus Torvalds 371da177e4SLinus Torvalds #include <linux/module.h> 381da177e4SLinus Torvalds 391da177e4SLinus Torvalds #include <linux/init.h> 401da177e4SLinus Torvalds #include <linux/slab.h> 410f485251SShirley Ma #include <linux/kernel.h> 4210313cbbSRoland Dreier #include <linux/vmalloc.h> 431da177e4SLinus Torvalds 441da177e4SLinus Torvalds #include <linux/if_arp.h> /* For ARPHRD_xxx */ 451da177e4SLinus Torvalds 461da177e4SLinus Torvalds #include <linux/ip.h> 471da177e4SLinus Torvalds #include <linux/in.h> 481da177e4SLinus Torvalds 4914c85021SArnaldo Carvalho de Melo #include <net/dst.h> 5014c85021SArnaldo Carvalho de Melo 511da177e4SLinus Torvalds MODULE_AUTHOR("Roland Dreier"); 521da177e4SLinus Torvalds MODULE_DESCRIPTION("IP-over-InfiniBand net driver"); 531da177e4SLinus Torvalds MODULE_LICENSE("Dual BSD/GPL"); 541da177e4SLinus Torvalds 550f485251SShirley Ma int ipoib_sendq_size __read_mostly = IPOIB_TX_RING_SIZE; 560f485251SShirley Ma int ipoib_recvq_size __read_mostly = IPOIB_RX_RING_SIZE; 570f485251SShirley Ma 580f485251SShirley Ma module_param_named(send_queue_size, ipoib_sendq_size, int, 0444); 590f485251SShirley Ma MODULE_PARM_DESC(send_queue_size, "Number of descriptors in send queue"); 600f485251SShirley Ma module_param_named(recv_queue_size, ipoib_recvq_size, int, 0444); 610f485251SShirley Ma MODULE_PARM_DESC(recv_queue_size, "Number of descriptors in receive queue"); 620f485251SShirley Ma 631da177e4SLinus Torvalds #ifdef CONFIG_INFINIBAND_IPOIB_DEBUG 641da177e4SLinus Torvalds int ipoib_debug_level; 651da177e4SLinus Torvalds 661da177e4SLinus Torvalds module_param_named(debug_level, ipoib_debug_level, int, 0644); 671da177e4SLinus Torvalds MODULE_PARM_DESC(debug_level, "Enable debug tracing if > 0"); 681da177e4SLinus Torvalds #endif 691da177e4SLinus Torvalds 701732b0efSRoland Dreier struct ipoib_path_iter { 711732b0efSRoland Dreier struct net_device *dev; 721732b0efSRoland Dreier struct ipoib_path path; 731732b0efSRoland Dreier }; 741732b0efSRoland Dreier 751da177e4SLinus Torvalds static const u8 ipv4_bcast_addr[] = { 761da177e4SLinus Torvalds 0x00, 0xff, 0xff, 0xff, 771da177e4SLinus Torvalds 0xff, 0x12, 0x40, 0x1b, 0x00, 0x00, 0x00, 0x00, 781da177e4SLinus Torvalds 0x00, 0x00, 0x00, 0x00, 0xff, 0xff, 0xff, 0xff 791da177e4SLinus Torvalds }; 801da177e4SLinus Torvalds 811da177e4SLinus Torvalds struct workqueue_struct *ipoib_workqueue; 821da177e4SLinus Torvalds 83c1a0b23bSMichael S. Tsirkin struct ib_sa_client ipoib_sa_client; 84c1a0b23bSMichael S. Tsirkin 851da177e4SLinus Torvalds static void ipoib_add_one(struct ib_device *device); 861da177e4SLinus Torvalds static void ipoib_remove_one(struct ib_device *device); 871da177e4SLinus Torvalds 881da177e4SLinus Torvalds static struct ib_client ipoib_client = { 891da177e4SLinus Torvalds .name = "ipoib", 901da177e4SLinus Torvalds .add = ipoib_add_one, 911da177e4SLinus Torvalds .remove = ipoib_remove_one 921da177e4SLinus Torvalds }; 931da177e4SLinus Torvalds 941da177e4SLinus Torvalds int ipoib_open(struct net_device *dev) 951da177e4SLinus Torvalds { 961da177e4SLinus Torvalds struct ipoib_dev_priv *priv = netdev_priv(dev); 971da177e4SLinus Torvalds 981da177e4SLinus Torvalds ipoib_dbg(priv, "bringing up interface\n"); 991da177e4SLinus Torvalds 100e028cc55SYossi Etigin set_bit(IPOIB_FLAG_ADMIN_UP, &priv->flags); 1011da177e4SLinus Torvalds 1021da177e4SLinus Torvalds if (ipoib_pkey_dev_delay_open(dev)) 1031da177e4SLinus Torvalds return 0; 1041da177e4SLinus Torvalds 105b8a1b1ceSRoland Dreier if (ipoib_ib_dev_open(dev)) 106b8a1b1ceSRoland Dreier goto err_disable; 107fe25c561SYossi Etigin 108b8a1b1ceSRoland Dreier if (ipoib_ib_dev_up(dev)) 109b8a1b1ceSRoland Dreier goto err_stop; 1101da177e4SLinus Torvalds 1111da177e4SLinus Torvalds if (!test_bit(IPOIB_FLAG_SUBINTERFACE, &priv->flags)) { 1121da177e4SLinus Torvalds struct ipoib_dev_priv *cpriv; 1131da177e4SLinus Torvalds 1141da177e4SLinus Torvalds /* Bring up any child interfaces too */ 11595ed644fSIngo Molnar mutex_lock(&priv->vlan_mutex); 1161da177e4SLinus Torvalds list_for_each_entry(cpriv, &priv->child_intfs, list) { 1171da177e4SLinus Torvalds int flags; 1181da177e4SLinus Torvalds 1191da177e4SLinus Torvalds flags = cpriv->dev->flags; 1201da177e4SLinus Torvalds if (flags & IFF_UP) 1211da177e4SLinus Torvalds continue; 1221da177e4SLinus Torvalds 1231da177e4SLinus Torvalds dev_change_flags(cpriv->dev, flags | IFF_UP); 1241da177e4SLinus Torvalds } 12595ed644fSIngo Molnar mutex_unlock(&priv->vlan_mutex); 1261da177e4SLinus Torvalds } 1271da177e4SLinus Torvalds 1281da177e4SLinus Torvalds netif_start_queue(dev); 1291da177e4SLinus Torvalds 1301da177e4SLinus Torvalds return 0; 131b8a1b1ceSRoland Dreier 132b8a1b1ceSRoland Dreier err_stop: 133b8a1b1ceSRoland Dreier ipoib_ib_dev_stop(dev, 1); 134b8a1b1ceSRoland Dreier 135b8a1b1ceSRoland Dreier err_disable: 136b8a1b1ceSRoland Dreier clear_bit(IPOIB_FLAG_ADMIN_UP, &priv->flags); 137b8a1b1ceSRoland Dreier 138b8a1b1ceSRoland Dreier return -EINVAL; 1391da177e4SLinus Torvalds } 1401da177e4SLinus Torvalds 1411da177e4SLinus Torvalds static int ipoib_stop(struct net_device *dev) 1421da177e4SLinus Torvalds { 1431da177e4SLinus Torvalds struct ipoib_dev_priv *priv = netdev_priv(dev); 1441da177e4SLinus Torvalds 1451da177e4SLinus Torvalds ipoib_dbg(priv, "stopping interface\n"); 1461da177e4SLinus Torvalds 1471da177e4SLinus Torvalds clear_bit(IPOIB_FLAG_ADMIN_UP, &priv->flags); 1481da177e4SLinus Torvalds 1491da177e4SLinus Torvalds netif_stop_queue(dev); 1501da177e4SLinus Torvalds 151a77a57a1SRoland Dreier ipoib_ib_dev_down(dev, 0); 152a77a57a1SRoland Dreier ipoib_ib_dev_stop(dev, 0); 1531da177e4SLinus Torvalds 1541da177e4SLinus Torvalds if (!test_bit(IPOIB_FLAG_SUBINTERFACE, &priv->flags)) { 1551da177e4SLinus Torvalds struct ipoib_dev_priv *cpriv; 1561da177e4SLinus Torvalds 1571da177e4SLinus Torvalds /* Bring down any child interfaces too */ 15895ed644fSIngo Molnar mutex_lock(&priv->vlan_mutex); 1591da177e4SLinus Torvalds list_for_each_entry(cpriv, &priv->child_intfs, list) { 1601da177e4SLinus Torvalds int flags; 1611da177e4SLinus Torvalds 1621da177e4SLinus Torvalds flags = cpriv->dev->flags; 1631da177e4SLinus Torvalds if (!(flags & IFF_UP)) 1641da177e4SLinus Torvalds continue; 1651da177e4SLinus Torvalds 1661da177e4SLinus Torvalds dev_change_flags(cpriv->dev, flags & ~IFF_UP); 1671da177e4SLinus Torvalds } 16895ed644fSIngo Molnar mutex_unlock(&priv->vlan_mutex); 1691da177e4SLinus Torvalds } 1701da177e4SLinus Torvalds 1711da177e4SLinus Torvalds return 0; 1721da177e4SLinus Torvalds } 1731da177e4SLinus Torvalds 1743d96c74dSMichał Mirosław static u32 ipoib_fix_features(struct net_device *dev, u32 features) 1753d96c74dSMichał Mirosław { 1763d96c74dSMichał Mirosław struct ipoib_dev_priv *priv = netdev_priv(dev); 1773d96c74dSMichał Mirosław 1783d96c74dSMichał Mirosław if (test_bit(IPOIB_FLAG_ADMIN_CM, &priv->flags)) 1793d96c74dSMichał Mirosław features &= ~(NETIF_F_SG | NETIF_F_IP_CSUM | NETIF_F_TSO); 1803d96c74dSMichał Mirosław 1813d96c74dSMichał Mirosław return features; 1823d96c74dSMichał Mirosław } 1833d96c74dSMichał Mirosław 1841da177e4SLinus Torvalds static int ipoib_change_mtu(struct net_device *dev, int new_mtu) 1851da177e4SLinus Torvalds { 1861da177e4SLinus Torvalds struct ipoib_dev_priv *priv = netdev_priv(dev); 1871da177e4SLinus Torvalds 188839fcabaSMichael S. Tsirkin /* dev->mtu > 2K ==> connected mode */ 189586a6934SPradeep Satyanarayana if (ipoib_cm_admin_enabled(dev)) { 190586a6934SPradeep Satyanarayana if (new_mtu > ipoib_cm_max_mtu(dev)) 191586a6934SPradeep Satyanarayana return -EINVAL; 192586a6934SPradeep Satyanarayana 193839fcabaSMichael S. Tsirkin if (new_mtu > priv->mcast_mtu) 194839fcabaSMichael S. Tsirkin ipoib_warn(priv, "mtu > %d will cause multicast packet drops.\n", 195839fcabaSMichael S. Tsirkin priv->mcast_mtu); 196586a6934SPradeep Satyanarayana 197839fcabaSMichael S. Tsirkin dev->mtu = new_mtu; 198839fcabaSMichael S. Tsirkin return 0; 199839fcabaSMichael S. Tsirkin } 200839fcabaSMichael S. Tsirkin 201bc7b3a36SShirley Ma if (new_mtu > IPOIB_UD_MTU(priv->max_ib_mtu)) 2021da177e4SLinus Torvalds return -EINVAL; 2031da177e4SLinus Torvalds 2041da177e4SLinus Torvalds priv->admin_mtu = new_mtu; 2051da177e4SLinus Torvalds 2061da177e4SLinus Torvalds dev->mtu = min(priv->mcast_mtu, priv->admin_mtu); 2071da177e4SLinus Torvalds 2081da177e4SLinus Torvalds return 0; 2091da177e4SLinus Torvalds } 2101da177e4SLinus Torvalds 21137c22a77SJack Morgenstein static struct ipoib_path *__path_find(struct net_device *dev, void *gid) 2121da177e4SLinus Torvalds { 2131da177e4SLinus Torvalds struct ipoib_dev_priv *priv = netdev_priv(dev); 2141da177e4SLinus Torvalds struct rb_node *n = priv->path_tree.rb_node; 2151da177e4SLinus Torvalds struct ipoib_path *path; 2161da177e4SLinus Torvalds int ret; 2171da177e4SLinus Torvalds 2181da177e4SLinus Torvalds while (n) { 2191da177e4SLinus Torvalds path = rb_entry(n, struct ipoib_path, rb_node); 2201da177e4SLinus Torvalds 22137c22a77SJack Morgenstein ret = memcmp(gid, path->pathrec.dgid.raw, 2221da177e4SLinus Torvalds sizeof (union ib_gid)); 2231da177e4SLinus Torvalds 2241da177e4SLinus Torvalds if (ret < 0) 2251da177e4SLinus Torvalds n = n->rb_left; 2261da177e4SLinus Torvalds else if (ret > 0) 2271da177e4SLinus Torvalds n = n->rb_right; 2281da177e4SLinus Torvalds else 2291da177e4SLinus Torvalds return path; 2301da177e4SLinus Torvalds } 2311da177e4SLinus Torvalds 2321da177e4SLinus Torvalds return NULL; 2331da177e4SLinus Torvalds } 2341da177e4SLinus Torvalds 2351da177e4SLinus Torvalds static int __path_add(struct net_device *dev, struct ipoib_path *path) 2361da177e4SLinus Torvalds { 2371da177e4SLinus Torvalds struct ipoib_dev_priv *priv = netdev_priv(dev); 2381da177e4SLinus Torvalds struct rb_node **n = &priv->path_tree.rb_node; 2391da177e4SLinus Torvalds struct rb_node *pn = NULL; 2401da177e4SLinus Torvalds struct ipoib_path *tpath; 2411da177e4SLinus Torvalds int ret; 2421da177e4SLinus Torvalds 2431da177e4SLinus Torvalds while (*n) { 2441da177e4SLinus Torvalds pn = *n; 2451da177e4SLinus Torvalds tpath = rb_entry(pn, struct ipoib_path, rb_node); 2461da177e4SLinus Torvalds 2471da177e4SLinus Torvalds ret = memcmp(path->pathrec.dgid.raw, tpath->pathrec.dgid.raw, 2481da177e4SLinus Torvalds sizeof (union ib_gid)); 2491da177e4SLinus Torvalds if (ret < 0) 2501da177e4SLinus Torvalds n = &pn->rb_left; 2511da177e4SLinus Torvalds else if (ret > 0) 2521da177e4SLinus Torvalds n = &pn->rb_right; 2531da177e4SLinus Torvalds else 2541da177e4SLinus Torvalds return -EEXIST; 2551da177e4SLinus Torvalds } 2561da177e4SLinus Torvalds 2571da177e4SLinus Torvalds rb_link_node(&path->rb_node, pn, n); 2581da177e4SLinus Torvalds rb_insert_color(&path->rb_node, &priv->path_tree); 2591da177e4SLinus Torvalds 2601da177e4SLinus Torvalds list_add_tail(&path->list, &priv->path_list); 2611da177e4SLinus Torvalds 2621da177e4SLinus Torvalds return 0; 2631da177e4SLinus Torvalds } 2641da177e4SLinus Torvalds 2651da177e4SLinus Torvalds static void path_free(struct net_device *dev, struct ipoib_path *path) 2661da177e4SLinus Torvalds { 2671da177e4SLinus Torvalds struct ipoib_dev_priv *priv = netdev_priv(dev); 2681da177e4SLinus Torvalds struct ipoib_neigh *neigh, *tn; 2691da177e4SLinus Torvalds struct sk_buff *skb; 2701da177e4SLinus Torvalds unsigned long flags; 2711da177e4SLinus Torvalds 2721da177e4SLinus Torvalds while ((skb = __skb_dequeue(&path->queue))) 2731da177e4SLinus Torvalds dev_kfree_skb_irq(skb); 2741da177e4SLinus Torvalds 2751da177e4SLinus Torvalds spin_lock_irqsave(&priv->lock, flags); 2761da177e4SLinus Torvalds 2771da177e4SLinus Torvalds list_for_each_entry_safe(neigh, tn, &path->neigh_list, list) { 2781da177e4SLinus Torvalds /* 2791da177e4SLinus Torvalds * It's safe to call ipoib_put_ah() inside priv->lock 2801da177e4SLinus Torvalds * here, because we know that path->ah will always 2811da177e4SLinus Torvalds * hold one more reference, so ipoib_put_ah() will 2821da177e4SLinus Torvalds * never do more than decrement the ref count. 2831da177e4SLinus Torvalds */ 2841da177e4SLinus Torvalds if (neigh->ah) 2851da177e4SLinus Torvalds ipoib_put_ah(neigh->ah); 286d2e0655eSMichael S. Tsirkin 2872745b5b7SMichael S. Tsirkin ipoib_neigh_free(dev, neigh); 2881da177e4SLinus Torvalds } 2891da177e4SLinus Torvalds 2901da177e4SLinus Torvalds spin_unlock_irqrestore(&priv->lock, flags); 2911da177e4SLinus Torvalds 2921da177e4SLinus Torvalds if (path->ah) 2931da177e4SLinus Torvalds ipoib_put_ah(path->ah); 2941da177e4SLinus Torvalds 2951da177e4SLinus Torvalds kfree(path); 2961da177e4SLinus Torvalds } 2971da177e4SLinus Torvalds 2981732b0efSRoland Dreier #ifdef CONFIG_INFINIBAND_IPOIB_DEBUG 2991732b0efSRoland Dreier 3001732b0efSRoland Dreier struct ipoib_path_iter *ipoib_path_iter_init(struct net_device *dev) 3011732b0efSRoland Dreier { 3021732b0efSRoland Dreier struct ipoib_path_iter *iter; 3031732b0efSRoland Dreier 3041732b0efSRoland Dreier iter = kmalloc(sizeof *iter, GFP_KERNEL); 3051732b0efSRoland Dreier if (!iter) 3061732b0efSRoland Dreier return NULL; 3071732b0efSRoland Dreier 3081732b0efSRoland Dreier iter->dev = dev; 3091732b0efSRoland Dreier memset(iter->path.pathrec.dgid.raw, 0, 16); 3101732b0efSRoland Dreier 3111732b0efSRoland Dreier if (ipoib_path_iter_next(iter)) { 3121732b0efSRoland Dreier kfree(iter); 3131732b0efSRoland Dreier return NULL; 3141732b0efSRoland Dreier } 3151732b0efSRoland Dreier 3161732b0efSRoland Dreier return iter; 3171732b0efSRoland Dreier } 3181732b0efSRoland Dreier 3191732b0efSRoland Dreier int ipoib_path_iter_next(struct ipoib_path_iter *iter) 3201732b0efSRoland Dreier { 3211732b0efSRoland Dreier struct ipoib_dev_priv *priv = netdev_priv(iter->dev); 3221732b0efSRoland Dreier struct rb_node *n; 3231732b0efSRoland Dreier struct ipoib_path *path; 3241732b0efSRoland Dreier int ret = 1; 3251732b0efSRoland Dreier 3261732b0efSRoland Dreier spin_lock_irq(&priv->lock); 3271732b0efSRoland Dreier 3281732b0efSRoland Dreier n = rb_first(&priv->path_tree); 3291732b0efSRoland Dreier 3301732b0efSRoland Dreier while (n) { 3311732b0efSRoland Dreier path = rb_entry(n, struct ipoib_path, rb_node); 3321732b0efSRoland Dreier 3331732b0efSRoland Dreier if (memcmp(iter->path.pathrec.dgid.raw, path->pathrec.dgid.raw, 3341732b0efSRoland Dreier sizeof (union ib_gid)) < 0) { 3351732b0efSRoland Dreier iter->path = *path; 3361732b0efSRoland Dreier ret = 0; 3371732b0efSRoland Dreier break; 3381732b0efSRoland Dreier } 3391732b0efSRoland Dreier 3401732b0efSRoland Dreier n = rb_next(n); 3411732b0efSRoland Dreier } 3421732b0efSRoland Dreier 3431732b0efSRoland Dreier spin_unlock_irq(&priv->lock); 3441732b0efSRoland Dreier 3451732b0efSRoland Dreier return ret; 3461732b0efSRoland Dreier } 3471732b0efSRoland Dreier 3481732b0efSRoland Dreier void ipoib_path_iter_read(struct ipoib_path_iter *iter, 3491732b0efSRoland Dreier struct ipoib_path *path) 3501732b0efSRoland Dreier { 3511732b0efSRoland Dreier *path = iter->path; 3521732b0efSRoland Dreier } 3531732b0efSRoland Dreier 3541732b0efSRoland Dreier #endif /* CONFIG_INFINIBAND_IPOIB_DEBUG */ 3551732b0efSRoland Dreier 356ee1e2c82SMoni Shoua void ipoib_mark_paths_invalid(struct net_device *dev) 357ee1e2c82SMoni Shoua { 358ee1e2c82SMoni Shoua struct ipoib_dev_priv *priv = netdev_priv(dev); 359ee1e2c82SMoni Shoua struct ipoib_path *path, *tp; 360ee1e2c82SMoni Shoua 361ee1e2c82SMoni Shoua spin_lock_irq(&priv->lock); 362ee1e2c82SMoni Shoua 363ee1e2c82SMoni Shoua list_for_each_entry_safe(path, tp, &priv->path_list, list) { 3645b095d98SHarvey Harrison ipoib_dbg(priv, "mark path LID 0x%04x GID %pI6 invalid\n", 365ee1e2c82SMoni Shoua be16_to_cpu(path->pathrec.dlid), 366fcace2feSHarvey Harrison path->pathrec.dgid.raw); 367ee1e2c82SMoni Shoua path->valid = 0; 368ee1e2c82SMoni Shoua } 369ee1e2c82SMoni Shoua 370ee1e2c82SMoni Shoua spin_unlock_irq(&priv->lock); 371ee1e2c82SMoni Shoua } 372ee1e2c82SMoni Shoua 3731da177e4SLinus Torvalds void ipoib_flush_paths(struct net_device *dev) 3741da177e4SLinus Torvalds { 3751da177e4SLinus Torvalds struct ipoib_dev_priv *priv = netdev_priv(dev); 3761da177e4SLinus Torvalds struct ipoib_path *path, *tp; 3771da177e4SLinus Torvalds LIST_HEAD(remove_list); 378943c246eSRoland Dreier unsigned long flags; 3791da177e4SLinus Torvalds 380943c246eSRoland Dreier netif_tx_lock_bh(dev); 381943c246eSRoland Dreier spin_lock_irqsave(&priv->lock, flags); 3821da177e4SLinus Torvalds 383157de229SRobert P. J. Day list_splice_init(&priv->path_list, &remove_list); 3841da177e4SLinus Torvalds 3851da177e4SLinus Torvalds list_for_each_entry(path, &remove_list, list) 3861da177e4SLinus Torvalds rb_erase(&path->rb_node, &priv->path_tree); 3871da177e4SLinus Torvalds 3881da177e4SLinus Torvalds list_for_each_entry_safe(path, tp, &remove_list, list) { 3891da177e4SLinus Torvalds if (path->query) 3901da177e4SLinus Torvalds ib_sa_cancel_query(path->query_id, path->query); 391943c246eSRoland Dreier spin_unlock_irqrestore(&priv->lock, flags); 392943c246eSRoland Dreier netif_tx_unlock_bh(dev); 3931da177e4SLinus Torvalds wait_for_completion(&path->done); 3941da177e4SLinus Torvalds path_free(dev, path); 395943c246eSRoland Dreier netif_tx_lock_bh(dev); 396943c246eSRoland Dreier spin_lock_irqsave(&priv->lock, flags); 3971da177e4SLinus Torvalds } 398943c246eSRoland Dreier 399943c246eSRoland Dreier spin_unlock_irqrestore(&priv->lock, flags); 400943c246eSRoland Dreier netif_tx_unlock_bh(dev); 4011da177e4SLinus Torvalds } 4021da177e4SLinus Torvalds 4031da177e4SLinus Torvalds static void path_rec_completion(int status, 4041da177e4SLinus Torvalds struct ib_sa_path_rec *pathrec, 4051da177e4SLinus Torvalds void *path_ptr) 4061da177e4SLinus Torvalds { 4071da177e4SLinus Torvalds struct ipoib_path *path = path_ptr; 4081da177e4SLinus Torvalds struct net_device *dev = path->dev; 4091da177e4SLinus Torvalds struct ipoib_dev_priv *priv = netdev_priv(dev); 4101da177e4SLinus Torvalds struct ipoib_ah *ah = NULL; 411c9da4badSRoland Dreier struct ipoib_ah *old_ah = NULL; 412d04d01b1SMichael S. Tsirkin struct ipoib_neigh *neigh, *tn; 4131da177e4SLinus Torvalds struct sk_buff_head skqueue; 4141da177e4SLinus Torvalds struct sk_buff *skb; 4151da177e4SLinus Torvalds unsigned long flags; 4161da177e4SLinus Torvalds 417843613b0SRoland Dreier if (!status) 4185b095d98SHarvey Harrison ipoib_dbg(priv, "PathRec LID 0x%04x for GID %pI6\n", 419fcace2feSHarvey Harrison be16_to_cpu(pathrec->dlid), pathrec->dgid.raw); 4201da177e4SLinus Torvalds else 4215b095d98SHarvey Harrison ipoib_dbg(priv, "PathRec status %d for GID %pI6\n", 422fcace2feSHarvey Harrison status, path->pathrec.dgid.raw); 4231da177e4SLinus Torvalds 4241da177e4SLinus Torvalds skb_queue_head_init(&skqueue); 4251da177e4SLinus Torvalds 4261da177e4SLinus Torvalds if (!status) { 42746f1b3d7SSean Hefty struct ib_ah_attr av; 4281da177e4SLinus Torvalds 42946f1b3d7SSean Hefty if (!ib_init_ah_from_path(priv->ca, priv->port, pathrec, &av)) 4301da177e4SLinus Torvalds ah = ipoib_create_ah(dev, priv->pd, &av); 4311da177e4SLinus Torvalds } 4321da177e4SLinus Torvalds 4331da177e4SLinus Torvalds spin_lock_irqsave(&priv->lock, flags); 4341da177e4SLinus Torvalds 4353874397cSMike Marciniszyn if (!IS_ERR_OR_NULL(ah)) { 4361da177e4SLinus Torvalds path->pathrec = *pathrec; 4371da177e4SLinus Torvalds 438c9da4badSRoland Dreier old_ah = path->ah; 439c9da4badSRoland Dreier path->ah = ah; 440c9da4badSRoland Dreier 4411da177e4SLinus Torvalds ipoib_dbg(priv, "created address handle %p for LID 0x%04x, SL %d\n", 4421da177e4SLinus Torvalds ah, be16_to_cpu(pathrec->dlid), pathrec->sl); 4431da177e4SLinus Torvalds 4441da177e4SLinus Torvalds while ((skb = __skb_dequeue(&path->queue))) 4451da177e4SLinus Torvalds __skb_queue_tail(&skqueue, skb); 4461da177e4SLinus Torvalds 447d04d01b1SMichael S. Tsirkin list_for_each_entry_safe(neigh, tn, &path->neigh_list, list) { 448ee1e2c82SMoni Shoua if (neigh->ah) { 449ee1e2c82SMoni Shoua WARN_ON(neigh->ah != old_ah); 450ee1e2c82SMoni Shoua /* 451ee1e2c82SMoni Shoua * Dropping the ah reference inside 452ee1e2c82SMoni Shoua * priv->lock is safe here, because we 453ee1e2c82SMoni Shoua * will hold one more reference from 454ee1e2c82SMoni Shoua * the original value of path->ah (ie 455ee1e2c82SMoni Shoua * old_ah). 456ee1e2c82SMoni Shoua */ 457ee1e2c82SMoni Shoua ipoib_put_ah(neigh->ah); 458ee1e2c82SMoni Shoua } 4591da177e4SLinus Torvalds kref_get(&path->ah->ref); 4601da177e4SLinus Torvalds neigh->ah = path->ah; 4618a7f7521SMichael S. Tsirkin memcpy(&neigh->dgid.raw, &path->pathrec.dgid.raw, 4628a7f7521SMichael S. Tsirkin sizeof(union ib_gid)); 4631da177e4SLinus Torvalds 464839fcabaSMichael S. Tsirkin if (ipoib_cm_enabled(dev, neigh->neighbour)) { 465839fcabaSMichael S. Tsirkin if (!ipoib_cm_get(neigh)) 466839fcabaSMichael S. Tsirkin ipoib_cm_set(neigh, ipoib_cm_create_tx(dev, 467839fcabaSMichael S. Tsirkin path, 468839fcabaSMichael S. Tsirkin neigh)); 469839fcabaSMichael S. Tsirkin if (!ipoib_cm_get(neigh)) { 470839fcabaSMichael S. Tsirkin list_del(&neigh->list); 471839fcabaSMichael S. Tsirkin if (neigh->ah) 472839fcabaSMichael S. Tsirkin ipoib_put_ah(neigh->ah); 473839fcabaSMichael S. Tsirkin ipoib_neigh_free(dev, neigh); 474839fcabaSMichael S. Tsirkin continue; 475839fcabaSMichael S. Tsirkin } 476839fcabaSMichael S. Tsirkin } 477839fcabaSMichael S. Tsirkin 4781da177e4SLinus Torvalds while ((skb = __skb_dequeue(&neigh->queue))) 4791da177e4SLinus Torvalds __skb_queue_tail(&skqueue, skb); 4801da177e4SLinus Torvalds } 481ee1e2c82SMoni Shoua path->valid = 1; 4825872a9fcSRoland Dreier } 4831da177e4SLinus Torvalds 4845872a9fcSRoland Dreier path->query = NULL; 4851da177e4SLinus Torvalds complete(&path->done); 4861da177e4SLinus Torvalds 4871da177e4SLinus Torvalds spin_unlock_irqrestore(&priv->lock, flags); 4881da177e4SLinus Torvalds 489ee1e2c82SMoni Shoua if (old_ah) 490ee1e2c82SMoni Shoua ipoib_put_ah(old_ah); 491ee1e2c82SMoni Shoua 4921da177e4SLinus Torvalds while ((skb = __skb_dequeue(&skqueue))) { 4931da177e4SLinus Torvalds skb->dev = dev; 4941da177e4SLinus Torvalds if (dev_queue_xmit(skb)) 4951da177e4SLinus Torvalds ipoib_warn(priv, "dev_queue_xmit failed " 4961da177e4SLinus Torvalds "to requeue packet\n"); 4971da177e4SLinus Torvalds } 4981da177e4SLinus Torvalds } 4991da177e4SLinus Torvalds 50037c22a77SJack Morgenstein static struct ipoib_path *path_rec_create(struct net_device *dev, void *gid) 5011da177e4SLinus Torvalds { 5021da177e4SLinus Torvalds struct ipoib_dev_priv *priv = netdev_priv(dev); 5031da177e4SLinus Torvalds struct ipoib_path *path; 5041da177e4SLinus Torvalds 5051401b53aSJack Morgenstein if (!priv->broadcast) 5061401b53aSJack Morgenstein return NULL; 5071401b53aSJack Morgenstein 50821a38489SRoland Dreier path = kzalloc(sizeof *path, GFP_ATOMIC); 5091da177e4SLinus Torvalds if (!path) 5101da177e4SLinus Torvalds return NULL; 5111da177e4SLinus Torvalds 5121da177e4SLinus Torvalds path->dev = dev; 5131da177e4SLinus Torvalds 5141da177e4SLinus Torvalds skb_queue_head_init(&path->queue); 5151da177e4SLinus Torvalds 5161da177e4SLinus Torvalds INIT_LIST_HEAD(&path->neigh_list); 5171da177e4SLinus Torvalds 51837c22a77SJack Morgenstein memcpy(path->pathrec.dgid.raw, gid, sizeof (union ib_gid)); 5191da177e4SLinus Torvalds path->pathrec.sgid = priv->local_gid; 5201da177e4SLinus Torvalds path->pathrec.pkey = cpu_to_be16(priv->pkey); 5211da177e4SLinus Torvalds path->pathrec.numb_path = 1; 52281668838SSean Hefty path->pathrec.traffic_class = priv->broadcast->mcmember.traffic_class; 5231da177e4SLinus Torvalds 5241da177e4SLinus Torvalds return path; 5251da177e4SLinus Torvalds } 5261da177e4SLinus Torvalds 5271da177e4SLinus Torvalds static int path_rec_start(struct net_device *dev, 5281da177e4SLinus Torvalds struct ipoib_path *path) 5291da177e4SLinus Torvalds { 5301da177e4SLinus Torvalds struct ipoib_dev_priv *priv = netdev_priv(dev); 5311da177e4SLinus Torvalds 5325b095d98SHarvey Harrison ipoib_dbg(priv, "Start path record lookup for %pI6\n", 533fcace2feSHarvey Harrison path->pathrec.dgid.raw); 5341da177e4SLinus Torvalds 53565c7eddaSRoland Dreier init_completion(&path->done); 53665c7eddaSRoland Dreier 5371da177e4SLinus Torvalds path->query_id = 538c1a0b23bSMichael S. Tsirkin ib_sa_path_rec_get(&ipoib_sa_client, priv->ca, priv->port, 5391da177e4SLinus Torvalds &path->pathrec, 5401da177e4SLinus Torvalds IB_SA_PATH_REC_DGID | 5411da177e4SLinus Torvalds IB_SA_PATH_REC_SGID | 5421da177e4SLinus Torvalds IB_SA_PATH_REC_NUMB_PATH | 54381668838SSean Hefty IB_SA_PATH_REC_TRAFFIC_CLASS | 5441da177e4SLinus Torvalds IB_SA_PATH_REC_PKEY, 5451da177e4SLinus Torvalds 1000, GFP_ATOMIC, 5461da177e4SLinus Torvalds path_rec_completion, 5471da177e4SLinus Torvalds path, &path->query); 5481da177e4SLinus Torvalds if (path->query_id < 0) { 54901b3fc8bSOr Gerlitz ipoib_warn(priv, "ib_sa_path_rec_get failed: %d\n", path->query_id); 5501da177e4SLinus Torvalds path->query = NULL; 55193a3ab93SYossi Etigin complete(&path->done); 5521da177e4SLinus Torvalds return path->query_id; 5531da177e4SLinus Torvalds } 5541da177e4SLinus Torvalds 5551da177e4SLinus Torvalds return 0; 5561da177e4SLinus Torvalds } 5571da177e4SLinus Torvalds 5581da177e4SLinus Torvalds static void neigh_add_path(struct sk_buff *skb, struct net_device *dev) 5591da177e4SLinus Torvalds { 5601da177e4SLinus Torvalds struct ipoib_dev_priv *priv = netdev_priv(dev); 5611da177e4SLinus Torvalds struct ipoib_path *path; 5621da177e4SLinus Torvalds struct ipoib_neigh *neigh; 56369cce1d1SDavid S. Miller struct neighbour *n; 564943c246eSRoland Dreier unsigned long flags; 5651da177e4SLinus Torvalds 56669cce1d1SDavid S. Miller n = dst_get_neighbour(skb_dst(skb)); 56769cce1d1SDavid S. Miller neigh = ipoib_neigh_alloc(n, skb->dev); 5681da177e4SLinus Torvalds if (!neigh) { 569de903512SRoland Dreier ++dev->stats.tx_dropped; 5701da177e4SLinus Torvalds dev_kfree_skb_any(skb); 5711da177e4SLinus Torvalds return; 5721da177e4SLinus Torvalds } 5731da177e4SLinus Torvalds 574943c246eSRoland Dreier spin_lock_irqsave(&priv->lock, flags); 5751da177e4SLinus Torvalds 57669cce1d1SDavid S. Miller path = __path_find(dev, n->ha + 4); 5771da177e4SLinus Torvalds if (!path) { 57869cce1d1SDavid S. Miller path = path_rec_create(dev, n->ha + 4); 5791da177e4SLinus Torvalds if (!path) 580d2e0655eSMichael S. Tsirkin goto err_path; 5811da177e4SLinus Torvalds 5821da177e4SLinus Torvalds __path_add(dev, path); 5831da177e4SLinus Torvalds } 5841da177e4SLinus Torvalds 5851da177e4SLinus Torvalds list_add_tail(&neigh->list, &path->neigh_list); 5861da177e4SLinus Torvalds 58747f7a071SMichael S. Tsirkin if (path->ah) { 5881da177e4SLinus Torvalds kref_get(&path->ah->ref); 5891da177e4SLinus Torvalds neigh->ah = path->ah; 5908a7f7521SMichael S. Tsirkin memcpy(&neigh->dgid.raw, &path->pathrec.dgid.raw, 5918a7f7521SMichael S. Tsirkin sizeof(union ib_gid)); 5921da177e4SLinus Torvalds 593839fcabaSMichael S. Tsirkin if (ipoib_cm_enabled(dev, neigh->neighbour)) { 594839fcabaSMichael S. Tsirkin if (!ipoib_cm_get(neigh)) 595839fcabaSMichael S. Tsirkin ipoib_cm_set(neigh, ipoib_cm_create_tx(dev, path, neigh)); 596839fcabaSMichael S. Tsirkin if (!ipoib_cm_get(neigh)) { 597839fcabaSMichael S. Tsirkin list_del(&neigh->list); 598839fcabaSMichael S. Tsirkin if (neigh->ah) 599839fcabaSMichael S. Tsirkin ipoib_put_ah(neigh->ah); 600839fcabaSMichael S. Tsirkin ipoib_neigh_free(dev, neigh); 601839fcabaSMichael S. Tsirkin goto err_drop; 602839fcabaSMichael S. Tsirkin } 603839fcabaSMichael S. Tsirkin if (skb_queue_len(&neigh->queue) < IPOIB_MAX_PATH_REC_QUEUE) 604839fcabaSMichael S. Tsirkin __skb_queue_tail(&neigh->queue, skb); 605839fcabaSMichael S. Tsirkin else { 606839fcabaSMichael S. Tsirkin ipoib_warn(priv, "queue length limit %d. Packet drop.\n", 607839fcabaSMichael S. Tsirkin skb_queue_len(&neigh->queue)); 608839fcabaSMichael S. Tsirkin goto err_drop; 609839fcabaSMichael S. Tsirkin } 610721d67cdSRoland Dreier } else { 611721d67cdSRoland Dreier spin_unlock_irqrestore(&priv->lock, flags); 61269cce1d1SDavid S. Miller ipoib_send(dev, skb, path->ah, IPOIB_QPN(n->ha)); 613721d67cdSRoland Dreier return; 614721d67cdSRoland Dreier } 6151da177e4SLinus Torvalds } else { 6161da177e4SLinus Torvalds neigh->ah = NULL; 6171da177e4SLinus Torvalds 6181da177e4SLinus Torvalds if (!path->query && path_rec_start(dev, path)) 619d2e0655eSMichael S. Tsirkin goto err_list; 6202745b5b7SMichael S. Tsirkin 6212745b5b7SMichael S. Tsirkin __skb_queue_tail(&neigh->queue, skb); 6221da177e4SLinus Torvalds } 6231da177e4SLinus Torvalds 624943c246eSRoland Dreier spin_unlock_irqrestore(&priv->lock, flags); 6251da177e4SLinus Torvalds return; 6261da177e4SLinus Torvalds 627d2e0655eSMichael S. Tsirkin err_list: 6281da177e4SLinus Torvalds list_del(&neigh->list); 6291da177e4SLinus Torvalds 630d2e0655eSMichael S. Tsirkin err_path: 6312745b5b7SMichael S. Tsirkin ipoib_neigh_free(dev, neigh); 632839fcabaSMichael S. Tsirkin err_drop: 633de903512SRoland Dreier ++dev->stats.tx_dropped; 6341da177e4SLinus Torvalds dev_kfree_skb_any(skb); 6351da177e4SLinus Torvalds 636943c246eSRoland Dreier spin_unlock_irqrestore(&priv->lock, flags); 6371da177e4SLinus Torvalds } 6381da177e4SLinus Torvalds 639d70ed607SRoland Dreier static void ipoib_path_lookup(struct sk_buff *skb, struct net_device *dev) 6401da177e4SLinus Torvalds { 6411da177e4SLinus Torvalds struct ipoib_dev_priv *priv = netdev_priv(skb->dev); 64269cce1d1SDavid S. Miller struct dst_entry *dst = skb_dst(skb); 64369cce1d1SDavid S. Miller struct neighbour *n; 6441da177e4SLinus Torvalds 6451da177e4SLinus Torvalds /* Look up path record for unicasts */ 64669cce1d1SDavid S. Miller n = dst_get_neighbour(dst); 64769cce1d1SDavid S. Miller if (n->ha[4] != 0xff) { 6481da177e4SLinus Torvalds neigh_add_path(skb, dev); 6491da177e4SLinus Torvalds return; 6501da177e4SLinus Torvalds } 6511da177e4SLinus Torvalds 6521da177e4SLinus Torvalds /* Add in the P_Key for multicasts */ 65369cce1d1SDavid S. Miller n->ha[8] = (priv->pkey >> 8) & 0xff; 65469cce1d1SDavid S. Miller n->ha[9] = priv->pkey & 0xff; 65569cce1d1SDavid S. Miller ipoib_mcast_send(dev, n->ha + 4, skb); 6561da177e4SLinus Torvalds } 6571da177e4SLinus Torvalds 6581da177e4SLinus Torvalds static void unicast_arp_send(struct sk_buff *skb, struct net_device *dev, 6591da177e4SLinus Torvalds struct ipoib_pseudoheader *phdr) 6601da177e4SLinus Torvalds { 6611da177e4SLinus Torvalds struct ipoib_dev_priv *priv = netdev_priv(dev); 6621da177e4SLinus Torvalds struct ipoib_path *path; 663943c246eSRoland Dreier unsigned long flags; 6641da177e4SLinus Torvalds 665943c246eSRoland Dreier spin_lock_irqsave(&priv->lock, flags); 6661da177e4SLinus Torvalds 66737c22a77SJack Morgenstein path = __path_find(dev, phdr->hwaddr + 4); 668ee1e2c82SMoni Shoua if (!path || !path->valid) { 66971d98b46SJack Morgenstein int new_path = 0; 67071d98b46SJack Morgenstein 67171d98b46SJack Morgenstein if (!path) { 67237c22a77SJack Morgenstein path = path_rec_create(dev, phdr->hwaddr + 4); 67371d98b46SJack Morgenstein new_path = 1; 67471d98b46SJack Morgenstein } 6751da177e4SLinus Torvalds if (path) { 6761da177e4SLinus Torvalds /* put pseudoheader back on for next time */ 6771da177e4SLinus Torvalds skb_push(skb, sizeof *phdr); 6781da177e4SLinus Torvalds __skb_queue_tail(&path->queue, skb); 6791da177e4SLinus Torvalds 680ff79ae80SYossi Etigin if (!path->query && path_rec_start(dev, path)) { 681943c246eSRoland Dreier spin_unlock_irqrestore(&priv->lock, flags); 68271d98b46SJack Morgenstein if (new_path) 6831da177e4SLinus Torvalds path_free(dev, path); 6841da177e4SLinus Torvalds return; 6851da177e4SLinus Torvalds } else 6861da177e4SLinus Torvalds __path_add(dev, path); 6871da177e4SLinus Torvalds } else { 688de903512SRoland Dreier ++dev->stats.tx_dropped; 6891da177e4SLinus Torvalds dev_kfree_skb_any(skb); 6901da177e4SLinus Torvalds } 6911da177e4SLinus Torvalds 692943c246eSRoland Dreier spin_unlock_irqrestore(&priv->lock, flags); 6931da177e4SLinus Torvalds return; 6941da177e4SLinus Torvalds } 6951da177e4SLinus Torvalds 69647f7a071SMichael S. Tsirkin if (path->ah) { 6971da177e4SLinus Torvalds ipoib_dbg(priv, "Send unicast ARP to %04x\n", 6981da177e4SLinus Torvalds be16_to_cpu(path->pathrec.dlid)); 6991da177e4SLinus Torvalds 700721d67cdSRoland Dreier spin_unlock_irqrestore(&priv->lock, flags); 701073ae841SMichael S. Tsirkin ipoib_send(dev, skb, path->ah, IPOIB_QPN(phdr->hwaddr)); 702721d67cdSRoland Dreier return; 7031da177e4SLinus Torvalds } else if ((path->query || !path_rec_start(dev, path)) && 7041da177e4SLinus Torvalds skb_queue_len(&path->queue) < IPOIB_MAX_PATH_REC_QUEUE) { 7051da177e4SLinus Torvalds /* put pseudoheader back on for next time */ 7061da177e4SLinus Torvalds skb_push(skb, sizeof *phdr); 7071da177e4SLinus Torvalds __skb_queue_tail(&path->queue, skb); 7081da177e4SLinus Torvalds } else { 709de903512SRoland Dreier ++dev->stats.tx_dropped; 7101da177e4SLinus Torvalds dev_kfree_skb_any(skb); 7111da177e4SLinus Torvalds } 7121da177e4SLinus Torvalds 713943c246eSRoland Dreier spin_unlock_irqrestore(&priv->lock, flags); 7141da177e4SLinus Torvalds } 7151da177e4SLinus Torvalds 7161da177e4SLinus Torvalds static int ipoib_start_xmit(struct sk_buff *skb, struct net_device *dev) 7171da177e4SLinus Torvalds { 7181da177e4SLinus Torvalds struct ipoib_dev_priv *priv = netdev_priv(dev); 7191da177e4SLinus Torvalds struct ipoib_neigh *neigh; 72022cfb0bfSBernd Schubert struct neighbour *n = NULL; 7211da177e4SLinus Torvalds unsigned long flags; 7221da177e4SLinus Torvalds 72322cfb0bfSBernd Schubert if (likely(skb_dst(skb))) 72469cce1d1SDavid S. Miller n = dst_get_neighbour(skb_dst(skb)); 72522cfb0bfSBernd Schubert 72622cfb0bfSBernd Schubert if (likely(n)) { 72769cce1d1SDavid S. Miller if (unlikely(!*to_ipoib_neigh(n))) { 728d70ed607SRoland Dreier ipoib_path_lookup(skb, dev); 729943c246eSRoland Dreier return NETDEV_TX_OK; 7301da177e4SLinus Torvalds } 7311da177e4SLinus Torvalds 73269cce1d1SDavid S. Miller neigh = *to_ipoib_neigh(n); 7331da177e4SLinus Torvalds 734200d1713SMoni Shoua if (unlikely((memcmp(&neigh->dgid.raw, 73569cce1d1SDavid S. Miller n->ha + 4, 736200d1713SMoni Shoua sizeof(union ib_gid))) || 737200d1713SMoni Shoua (neigh->dev != dev))) { 738943c246eSRoland Dreier spin_lock_irqsave(&priv->lock, flags); 7398a7f7521SMichael S. Tsirkin /* 7408a7f7521SMichael S. Tsirkin * It's safe to call ipoib_put_ah() inside 7418a7f7521SMichael S. Tsirkin * priv->lock here, because we know that 7428a7f7521SMichael S. Tsirkin * path->ah will always hold one more reference, 7438a7f7521SMichael S. Tsirkin * so ipoib_put_ah() will never do more than 7448a7f7521SMichael S. Tsirkin * decrement the ref count. 7458a7f7521SMichael S. Tsirkin */ 746a50df398SYossi Etigin if (neigh->ah) 7478a7f7521SMichael S. Tsirkin ipoib_put_ah(neigh->ah); 7488a7f7521SMichael S. Tsirkin list_del(&neigh->list); 7492745b5b7SMichael S. Tsirkin ipoib_neigh_free(dev, neigh); 750943c246eSRoland Dreier spin_unlock_irqrestore(&priv->lock, flags); 7518a7f7521SMichael S. Tsirkin ipoib_path_lookup(skb, dev); 752943c246eSRoland Dreier return NETDEV_TX_OK; 7538a7f7521SMichael S. Tsirkin } 7548a7f7521SMichael S. Tsirkin 755bafff974SOr Gerlitz if (ipoib_cm_get(neigh)) { 756bafff974SOr Gerlitz if (ipoib_cm_up(neigh)) { 757bafff974SOr Gerlitz ipoib_cm_send(dev, skb, ipoib_cm_get(neigh)); 758943c246eSRoland Dreier return NETDEV_TX_OK; 759bafff974SOr Gerlitz } 760bafff974SOr Gerlitz } else if (neigh->ah) { 76169cce1d1SDavid S. Miller ipoib_send(dev, skb, neigh->ah, IPOIB_QPN(n->ha)); 762943c246eSRoland Dreier return NETDEV_TX_OK; 7631da177e4SLinus Torvalds } 7641da177e4SLinus Torvalds 7651da177e4SLinus Torvalds if (skb_queue_len(&neigh->queue) < IPOIB_MAX_PATH_REC_QUEUE) { 766943c246eSRoland Dreier spin_lock_irqsave(&priv->lock, flags); 7671da177e4SLinus Torvalds __skb_queue_tail(&neigh->queue, skb); 768943c246eSRoland Dreier spin_unlock_irqrestore(&priv->lock, flags); 7691da177e4SLinus Torvalds } else { 770de903512SRoland Dreier ++dev->stats.tx_dropped; 7711da177e4SLinus Torvalds dev_kfree_skb_any(skb); 7721da177e4SLinus Torvalds } 7731da177e4SLinus Torvalds } else { 7741da177e4SLinus Torvalds struct ipoib_pseudoheader *phdr = 7751da177e4SLinus Torvalds (struct ipoib_pseudoheader *) skb->data; 7761da177e4SLinus Torvalds skb_pull(skb, sizeof *phdr); 7771da177e4SLinus Torvalds 7781da177e4SLinus Torvalds if (phdr->hwaddr[4] == 0xff) { 7791da177e4SLinus Torvalds /* Add in the P_Key for multicast*/ 7801da177e4SLinus Torvalds phdr->hwaddr[8] = (priv->pkey >> 8) & 0xff; 7811da177e4SLinus Torvalds phdr->hwaddr[9] = priv->pkey & 0xff; 7821da177e4SLinus Torvalds 78337c22a77SJack Morgenstein ipoib_mcast_send(dev, phdr->hwaddr + 4, skb); 7841da177e4SLinus Torvalds } else { 7850dca0f7bSHal Rosenstock /* unicast GID -- should be ARP or RARP reply */ 7861da177e4SLinus Torvalds 7870dca0f7bSHal Rosenstock if ((be16_to_cpup((__be16 *) skb->data) != ETH_P_ARP) && 7880dca0f7bSHal Rosenstock (be16_to_cpup((__be16 *) skb->data) != ETH_P_RARP)) { 7895b095d98SHarvey Harrison ipoib_warn(priv, "Unicast, no %s: type %04x, QPN %06x %pI6\n", 790adf30907SEric Dumazet skb_dst(skb) ? "neigh" : "dst", 79197f52eb4SSean Hefty be16_to_cpup((__be16 *) skb->data), 792073ae841SMichael S. Tsirkin IPOIB_QPN(phdr->hwaddr), 793fcace2feSHarvey Harrison phdr->hwaddr + 4); 7941da177e4SLinus Torvalds dev_kfree_skb_any(skb); 795de903512SRoland Dreier ++dev->stats.tx_dropped; 796943c246eSRoland Dreier return NETDEV_TX_OK; 7971da177e4SLinus Torvalds } 7981da177e4SLinus Torvalds 7991da177e4SLinus Torvalds unicast_arp_send(skb, dev, phdr); 8001da177e4SLinus Torvalds } 8011da177e4SLinus Torvalds } 8021da177e4SLinus Torvalds 8031da177e4SLinus Torvalds return NETDEV_TX_OK; 8041da177e4SLinus Torvalds } 8051da177e4SLinus Torvalds 8061da177e4SLinus Torvalds static void ipoib_timeout(struct net_device *dev) 8071da177e4SLinus Torvalds { 8081da177e4SLinus Torvalds struct ipoib_dev_priv *priv = netdev_priv(dev); 8091da177e4SLinus Torvalds 8104b2d319bSRoland Dreier ipoib_warn(priv, "transmit timeout: latency %d msecs\n", 8114b2d319bSRoland Dreier jiffies_to_msecs(jiffies - dev->trans_start)); 8124b2d319bSRoland Dreier ipoib_warn(priv, "queue stopped %d, tx_head %u, tx_tail %u\n", 8134b2d319bSRoland Dreier netif_queue_stopped(dev), 8144b2d319bSRoland Dreier priv->tx_head, priv->tx_tail); 8151da177e4SLinus Torvalds /* XXX reset QP, etc. */ 8161da177e4SLinus Torvalds } 8171da177e4SLinus Torvalds 8181da177e4SLinus Torvalds static int ipoib_hard_header(struct sk_buff *skb, 8191da177e4SLinus Torvalds struct net_device *dev, 8201da177e4SLinus Torvalds unsigned short type, 8213b04dddeSStephen Hemminger const void *daddr, const void *saddr, unsigned len) 8221da177e4SLinus Torvalds { 8231da177e4SLinus Torvalds struct ipoib_header *header; 82469cce1d1SDavid S. Miller struct dst_entry *dst; 82569cce1d1SDavid S. Miller struct neighbour *n; 8261da177e4SLinus Torvalds 8271da177e4SLinus Torvalds header = (struct ipoib_header *) skb_push(skb, sizeof *header); 8281da177e4SLinus Torvalds 8291da177e4SLinus Torvalds header->proto = htons(type); 8301da177e4SLinus Torvalds header->reserved = 0; 8311da177e4SLinus Torvalds 8321da177e4SLinus Torvalds /* 8331da177e4SLinus Torvalds * If we don't have a neighbour structure, stuff the 8341da177e4SLinus Torvalds * destination address onto the front of the skb so we can 8351da177e4SLinus Torvalds * figure out where to send the packet later. 8361da177e4SLinus Torvalds */ 83769cce1d1SDavid S. Miller dst = skb_dst(skb); 83869cce1d1SDavid S. Miller n = NULL; 83969cce1d1SDavid S. Miller if (dst) 84069cce1d1SDavid S. Miller n = dst_get_neighbour(dst); 84169cce1d1SDavid S. Miller if ((!dst || !n) && daddr) { 8421da177e4SLinus Torvalds struct ipoib_pseudoheader *phdr = 8431da177e4SLinus Torvalds (struct ipoib_pseudoheader *) skb_push(skb, sizeof *phdr); 8441da177e4SLinus Torvalds memcpy(phdr->hwaddr, daddr, INFINIBAND_ALEN); 8451da177e4SLinus Torvalds } 8461da177e4SLinus Torvalds 8471da177e4SLinus Torvalds return 0; 8481da177e4SLinus Torvalds } 8491da177e4SLinus Torvalds 8501da177e4SLinus Torvalds static void ipoib_set_mcast_list(struct net_device *dev) 8511da177e4SLinus Torvalds { 8521da177e4SLinus Torvalds struct ipoib_dev_priv *priv = netdev_priv(dev); 8531da177e4SLinus Torvalds 8547a343d4cSLeonid Arsh if (!test_bit(IPOIB_FLAG_OPER_UP, &priv->flags)) { 8557a343d4cSLeonid Arsh ipoib_dbg(priv, "IPOIB_FLAG_OPER_UP not set"); 8567a343d4cSLeonid Arsh return; 8577a343d4cSLeonid Arsh } 8587a343d4cSLeonid Arsh 8591ad62a19SMichael S. Tsirkin queue_work(ipoib_workqueue, &priv->restart_task); 8601da177e4SLinus Torvalds } 8611da177e4SLinus Torvalds 862ecbb4169SAlexey Kuznetsov static void ipoib_neigh_cleanup(struct neighbour *n) 8631da177e4SLinus Torvalds { 8641da177e4SLinus Torvalds struct ipoib_neigh *neigh; 8651da177e4SLinus Torvalds struct ipoib_dev_priv *priv = netdev_priv(n->dev); 8661da177e4SLinus Torvalds unsigned long flags; 8671da177e4SLinus Torvalds struct ipoib_ah *ah = NULL; 8681da177e4SLinus Torvalds 869732a2170SMoni Shoua neigh = *to_ipoib_neigh(n); 8707bc531ddSOr Gerlitz if (neigh) 871732a2170SMoni Shoua priv = netdev_priv(neigh->dev); 8727bc531ddSOr Gerlitz else 873732a2170SMoni Shoua return; 8741da177e4SLinus Torvalds ipoib_dbg(priv, 8755b095d98SHarvey Harrison "neigh_cleanup for %06x %pI6\n", 876073ae841SMichael S. Tsirkin IPOIB_QPN(n->ha), 877fcace2feSHarvey Harrison n->ha + 4); 8781da177e4SLinus Torvalds 8791da177e4SLinus Torvalds spin_lock_irqsave(&priv->lock, flags); 8801da177e4SLinus Torvalds 8811da177e4SLinus Torvalds if (neigh->ah) 8821da177e4SLinus Torvalds ah = neigh->ah; 8831da177e4SLinus Torvalds list_del(&neigh->list); 8842745b5b7SMichael S. Tsirkin ipoib_neigh_free(n->dev, neigh); 8851da177e4SLinus Torvalds 8861da177e4SLinus Torvalds spin_unlock_irqrestore(&priv->lock, flags); 8871da177e4SLinus Torvalds 8881da177e4SLinus Torvalds if (ah) 8891da177e4SLinus Torvalds ipoib_put_ah(ah); 8901da177e4SLinus Torvalds } 8911da177e4SLinus Torvalds 892732a2170SMoni Shoua struct ipoib_neigh *ipoib_neigh_alloc(struct neighbour *neighbour, 893732a2170SMoni Shoua struct net_device *dev) 894d2e0655eSMichael S. Tsirkin { 895d2e0655eSMichael S. Tsirkin struct ipoib_neigh *neigh; 896d2e0655eSMichael S. Tsirkin 897d2e0655eSMichael S. Tsirkin neigh = kmalloc(sizeof *neigh, GFP_ATOMIC); 898d2e0655eSMichael S. Tsirkin if (!neigh) 899d2e0655eSMichael S. Tsirkin return NULL; 900d2e0655eSMichael S. Tsirkin 901d2e0655eSMichael S. Tsirkin neigh->neighbour = neighbour; 902732a2170SMoni Shoua neigh->dev = dev; 9030cd4d0fdSDavid J. Wilder memset(&neigh->dgid.raw, 0, sizeof (union ib_gid)); 904d2e0655eSMichael S. Tsirkin *to_ipoib_neigh(neighbour) = neigh; 90582b39913SRoland Dreier skb_queue_head_init(&neigh->queue); 906839fcabaSMichael S. Tsirkin ipoib_cm_set(neigh, NULL); 907d2e0655eSMichael S. Tsirkin 908d2e0655eSMichael S. Tsirkin return neigh; 909d2e0655eSMichael S. Tsirkin } 910d2e0655eSMichael S. Tsirkin 9112745b5b7SMichael S. Tsirkin void ipoib_neigh_free(struct net_device *dev, struct ipoib_neigh *neigh) 912d2e0655eSMichael S. Tsirkin { 9132745b5b7SMichael S. Tsirkin struct sk_buff *skb; 914d2e0655eSMichael S. Tsirkin *to_ipoib_neigh(neigh->neighbour) = NULL; 9152745b5b7SMichael S. Tsirkin while ((skb = __skb_dequeue(&neigh->queue))) { 916de903512SRoland Dreier ++dev->stats.tx_dropped; 9172745b5b7SMichael S. Tsirkin dev_kfree_skb_any(skb); 9182745b5b7SMichael S. Tsirkin } 919839fcabaSMichael S. Tsirkin if (ipoib_cm_get(neigh)) 920839fcabaSMichael S. Tsirkin ipoib_cm_destroy_tx(ipoib_cm_get(neigh)); 921d2e0655eSMichael S. Tsirkin kfree(neigh); 922d2e0655eSMichael S. Tsirkin } 923d2e0655eSMichael S. Tsirkin 9241da177e4SLinus Torvalds static int ipoib_neigh_setup_dev(struct net_device *dev, struct neigh_parms *parms) 9251da177e4SLinus Torvalds { 926ecbb4169SAlexey Kuznetsov parms->neigh_cleanup = ipoib_neigh_cleanup; 9271da177e4SLinus Torvalds 9281da177e4SLinus Torvalds return 0; 9291da177e4SLinus Torvalds } 9301da177e4SLinus Torvalds 9311da177e4SLinus Torvalds int ipoib_dev_init(struct net_device *dev, struct ib_device *ca, int port) 9321da177e4SLinus Torvalds { 9331da177e4SLinus Torvalds struct ipoib_dev_priv *priv = netdev_priv(dev); 9341da177e4SLinus Torvalds 9351da177e4SLinus Torvalds /* Allocate RX/TX "rings" to hold queued skbs */ 9360f485251SShirley Ma priv->rx_ring = kzalloc(ipoib_recvq_size * sizeof *priv->rx_ring, 9371da177e4SLinus Torvalds GFP_KERNEL); 9381da177e4SLinus Torvalds if (!priv->rx_ring) { 9391da177e4SLinus Torvalds printk(KERN_WARNING "%s: failed to allocate RX ring (%d entries)\n", 9400f485251SShirley Ma ca->name, ipoib_recvq_size); 9411da177e4SLinus Torvalds goto out; 9421da177e4SLinus Torvalds } 9431da177e4SLinus Torvalds 944948579cdSJoe Perches priv->tx_ring = vzalloc(ipoib_sendq_size * sizeof *priv->tx_ring); 9451da177e4SLinus Torvalds if (!priv->tx_ring) { 9461da177e4SLinus Torvalds printk(KERN_WARNING "%s: failed to allocate TX ring (%d entries)\n", 9470f485251SShirley Ma ca->name, ipoib_sendq_size); 9481da177e4SLinus Torvalds goto out_rx_ring_cleanup; 9491da177e4SLinus Torvalds } 9501da177e4SLinus Torvalds 9511b524963SMichael S. Tsirkin /* priv->tx_head, tx_tail & tx_outstanding are already 0 */ 9521da177e4SLinus Torvalds 9531da177e4SLinus Torvalds if (ipoib_ib_dev_init(dev, ca, port)) 9541da177e4SLinus Torvalds goto out_tx_ring_cleanup; 9551da177e4SLinus Torvalds 9561da177e4SLinus Torvalds return 0; 9571da177e4SLinus Torvalds 9581da177e4SLinus Torvalds out_tx_ring_cleanup: 95910313cbbSRoland Dreier vfree(priv->tx_ring); 9601da177e4SLinus Torvalds 9611da177e4SLinus Torvalds out_rx_ring_cleanup: 9621da177e4SLinus Torvalds kfree(priv->rx_ring); 9631da177e4SLinus Torvalds 9641da177e4SLinus Torvalds out: 9651da177e4SLinus Torvalds return -ENOMEM; 9661da177e4SLinus Torvalds } 9671da177e4SLinus Torvalds 9681da177e4SLinus Torvalds void ipoib_dev_cleanup(struct net_device *dev) 9691da177e4SLinus Torvalds { 9701da177e4SLinus Torvalds struct ipoib_dev_priv *priv = netdev_priv(dev), *cpriv, *tcpriv; 9711da177e4SLinus Torvalds 9721732b0efSRoland Dreier ipoib_delete_debug_files(dev); 9731da177e4SLinus Torvalds 9741da177e4SLinus Torvalds /* Delete any child interfaces first */ 9751da177e4SLinus Torvalds list_for_each_entry_safe(cpriv, tcpriv, &priv->child_intfs, list) { 9761da177e4SLinus Torvalds unregister_netdev(cpriv->dev); 9771da177e4SLinus Torvalds ipoib_dev_cleanup(cpriv->dev); 9781da177e4SLinus Torvalds free_netdev(cpriv->dev); 9791da177e4SLinus Torvalds } 9801da177e4SLinus Torvalds 9811da177e4SLinus Torvalds ipoib_ib_dev_cleanup(dev); 9821da177e4SLinus Torvalds 9831da177e4SLinus Torvalds kfree(priv->rx_ring); 98410313cbbSRoland Dreier vfree(priv->tx_ring); 98592a6b34bSHal Rosenstock 98692a6b34bSHal Rosenstock priv->rx_ring = NULL; 9871da177e4SLinus Torvalds priv->tx_ring = NULL; 9881da177e4SLinus Torvalds } 9891da177e4SLinus Torvalds 9903b04dddeSStephen Hemminger static const struct header_ops ipoib_header_ops = { 9913b04dddeSStephen Hemminger .create = ipoib_hard_header, 9923b04dddeSStephen Hemminger }; 9933b04dddeSStephen Hemminger 994fe8114e8SStephen Hemminger static const struct net_device_ops ipoib_netdev_ops = { 995fe8114e8SStephen Hemminger .ndo_open = ipoib_open, 996fe8114e8SStephen Hemminger .ndo_stop = ipoib_stop, 997fe8114e8SStephen Hemminger .ndo_change_mtu = ipoib_change_mtu, 9983d96c74dSMichał Mirosław .ndo_fix_features = ipoib_fix_features, 999fe8114e8SStephen Hemminger .ndo_start_xmit = ipoib_start_xmit, 1000fe8114e8SStephen Hemminger .ndo_tx_timeout = ipoib_timeout, 1001afc4b13dSJiri Pirko .ndo_set_rx_mode = ipoib_set_mcast_list, 1002fe8114e8SStephen Hemminger .ndo_neigh_setup = ipoib_neigh_setup_dev, 1003fe8114e8SStephen Hemminger }; 1004fe8114e8SStephen Hemminger 10051da177e4SLinus Torvalds static void ipoib_setup(struct net_device *dev) 10061da177e4SLinus Torvalds { 10071da177e4SLinus Torvalds struct ipoib_dev_priv *priv = netdev_priv(dev); 10081da177e4SLinus Torvalds 1009fe8114e8SStephen Hemminger dev->netdev_ops = &ipoib_netdev_ops; 10103b04dddeSStephen Hemminger dev->header_ops = &ipoib_header_ops; 1011bea3348eSStephen Hemminger 101282c24c18SEli Cohen ipoib_set_ethtool_ops(dev); 101382c24c18SEli Cohen 1014bea3348eSStephen Hemminger netif_napi_add(dev, &priv->napi, ipoib_poll, 100); 10151da177e4SLinus Torvalds 10161da177e4SLinus Torvalds dev->watchdog_timeo = HZ; 10171da177e4SLinus Torvalds 10181da177e4SLinus Torvalds dev->flags |= IFF_BROADCAST | IFF_MULTICAST; 10191da177e4SLinus Torvalds 10201da177e4SLinus Torvalds /* 10211da177e4SLinus Torvalds * We add in INFINIBAND_ALEN to allow for the destination 10221da177e4SLinus Torvalds * address "pseudoheader" for skbs without neighbour struct. 10231da177e4SLinus Torvalds */ 10241da177e4SLinus Torvalds dev->hard_header_len = IPOIB_ENCAP_LEN + INFINIBAND_ALEN; 10251da177e4SLinus Torvalds dev->addr_len = INFINIBAND_ALEN; 10261da177e4SLinus Torvalds dev->type = ARPHRD_INFINIBAND; 10270f485251SShirley Ma dev->tx_queue_len = ipoib_sendq_size * 2; 1028eb14032fSEli Cohen dev->features = (NETIF_F_VLAN_CHALLENGED | 1029eb14032fSEli Cohen NETIF_F_HIGHDMA); 103086d15cd8SEric Dumazet dev->priv_flags &= ~IFF_XMIT_DST_RELEASE; 10311da177e4SLinus Torvalds 10321da177e4SLinus Torvalds memcpy(dev->broadcast, ipv4_bcast_addr, INFINIBAND_ALEN); 10331da177e4SLinus Torvalds 10341da177e4SLinus Torvalds netif_carrier_off(dev); 10351da177e4SLinus Torvalds 10361da177e4SLinus Torvalds priv->dev = dev; 10371da177e4SLinus Torvalds 10381da177e4SLinus Torvalds spin_lock_init(&priv->lock); 10391da177e4SLinus Torvalds 104095ed644fSIngo Molnar mutex_init(&priv->vlan_mutex); 10411da177e4SLinus Torvalds 10421da177e4SLinus Torvalds INIT_LIST_HEAD(&priv->path_list); 10431da177e4SLinus Torvalds INIT_LIST_HEAD(&priv->child_intfs); 10441da177e4SLinus Torvalds INIT_LIST_HEAD(&priv->dead_ahs); 10451da177e4SLinus Torvalds INIT_LIST_HEAD(&priv->multicast_list); 10461da177e4SLinus Torvalds 104726bbf13cSYosef Etigin INIT_DELAYED_WORK(&priv->pkey_poll_task, ipoib_pkey_poll); 1048c4028958SDavid Howells INIT_DELAYED_WORK(&priv->mcast_task, ipoib_mcast_join_task); 1049e8224e4bSYossi Etigin INIT_WORK(&priv->carrier_on_task, ipoib_mcast_carrier_on_task); 1050ee1e2c82SMoni Shoua INIT_WORK(&priv->flush_light, ipoib_ib_dev_flush_light); 1051ee1e2c82SMoni Shoua INIT_WORK(&priv->flush_normal, ipoib_ib_dev_flush_normal); 1052ee1e2c82SMoni Shoua INIT_WORK(&priv->flush_heavy, ipoib_ib_dev_flush_heavy); 1053c4028958SDavid Howells INIT_WORK(&priv->restart_task, ipoib_mcast_restart_task); 1054c4028958SDavid Howells INIT_DELAYED_WORK(&priv->ah_reap_task, ipoib_reap_ah); 10551da177e4SLinus Torvalds } 10561da177e4SLinus Torvalds 10571da177e4SLinus Torvalds struct ipoib_dev_priv *ipoib_intf_alloc(const char *name) 10581da177e4SLinus Torvalds { 10591da177e4SLinus Torvalds struct net_device *dev; 10601da177e4SLinus Torvalds 10611da177e4SLinus Torvalds dev = alloc_netdev((int) sizeof (struct ipoib_dev_priv), name, 10621da177e4SLinus Torvalds ipoib_setup); 10631da177e4SLinus Torvalds if (!dev) 10641da177e4SLinus Torvalds return NULL; 10651da177e4SLinus Torvalds 10661da177e4SLinus Torvalds return netdev_priv(dev); 10671da177e4SLinus Torvalds } 10681da177e4SLinus Torvalds 106943cb76d9SGreg Kroah-Hartman static ssize_t show_pkey(struct device *dev, 107043cb76d9SGreg Kroah-Hartman struct device_attribute *attr, char *buf) 10711da177e4SLinus Torvalds { 107243cb76d9SGreg Kroah-Hartman struct ipoib_dev_priv *priv = netdev_priv(to_net_dev(dev)); 10731da177e4SLinus Torvalds 10741da177e4SLinus Torvalds return sprintf(buf, "0x%04x\n", priv->pkey); 10751da177e4SLinus Torvalds } 107643cb76d9SGreg Kroah-Hartman static DEVICE_ATTR(pkey, S_IRUGO, show_pkey, NULL); 10771da177e4SLinus Torvalds 1078335a64a5SOr Gerlitz static ssize_t show_umcast(struct device *dev, 1079335a64a5SOr Gerlitz struct device_attribute *attr, char *buf) 1080335a64a5SOr Gerlitz { 1081335a64a5SOr Gerlitz struct ipoib_dev_priv *priv = netdev_priv(to_net_dev(dev)); 1082335a64a5SOr Gerlitz 1083335a64a5SOr Gerlitz return sprintf(buf, "%d\n", test_bit(IPOIB_FLAG_UMCAST, &priv->flags)); 1084335a64a5SOr Gerlitz } 1085335a64a5SOr Gerlitz 1086335a64a5SOr Gerlitz static ssize_t set_umcast(struct device *dev, 1087335a64a5SOr Gerlitz struct device_attribute *attr, 1088335a64a5SOr Gerlitz const char *buf, size_t count) 1089335a64a5SOr Gerlitz { 1090335a64a5SOr Gerlitz struct ipoib_dev_priv *priv = netdev_priv(to_net_dev(dev)); 1091335a64a5SOr Gerlitz unsigned long umcast_val = simple_strtoul(buf, NULL, 0); 1092335a64a5SOr Gerlitz 1093335a64a5SOr Gerlitz if (umcast_val > 0) { 1094335a64a5SOr Gerlitz set_bit(IPOIB_FLAG_UMCAST, &priv->flags); 1095335a64a5SOr Gerlitz ipoib_warn(priv, "ignoring multicast groups joined directly " 1096335a64a5SOr Gerlitz "by userspace\n"); 1097335a64a5SOr Gerlitz } else 1098335a64a5SOr Gerlitz clear_bit(IPOIB_FLAG_UMCAST, &priv->flags); 1099335a64a5SOr Gerlitz 1100335a64a5SOr Gerlitz return count; 1101335a64a5SOr Gerlitz } 1102335a64a5SOr Gerlitz static DEVICE_ATTR(umcast, S_IWUSR | S_IRUGO, show_umcast, set_umcast); 1103335a64a5SOr Gerlitz 1104335a64a5SOr Gerlitz int ipoib_add_umcast_attr(struct net_device *dev) 1105335a64a5SOr Gerlitz { 1106335a64a5SOr Gerlitz return device_create_file(&dev->dev, &dev_attr_umcast); 1107335a64a5SOr Gerlitz } 1108335a64a5SOr Gerlitz 110943cb76d9SGreg Kroah-Hartman static ssize_t create_child(struct device *dev, 111043cb76d9SGreg Kroah-Hartman struct device_attribute *attr, 11111da177e4SLinus Torvalds const char *buf, size_t count) 11121da177e4SLinus Torvalds { 11131da177e4SLinus Torvalds int pkey; 11141da177e4SLinus Torvalds int ret; 11151da177e4SLinus Torvalds 11161da177e4SLinus Torvalds if (sscanf(buf, "%i", &pkey) != 1) 11171da177e4SLinus Torvalds return -EINVAL; 11181da177e4SLinus Torvalds 11191da177e4SLinus Torvalds if (pkey < 0 || pkey > 0xffff) 11201da177e4SLinus Torvalds return -EINVAL; 11211da177e4SLinus Torvalds 11224ce05937SRoland Dreier /* 11234ce05937SRoland Dreier * Set the full membership bit, so that we join the right 11244ce05937SRoland Dreier * broadcast group, etc. 11254ce05937SRoland Dreier */ 11264ce05937SRoland Dreier pkey |= 0x8000; 11274ce05937SRoland Dreier 112843cb76d9SGreg Kroah-Hartman ret = ipoib_vlan_add(to_net_dev(dev), pkey); 11291da177e4SLinus Torvalds 11301da177e4SLinus Torvalds return ret ? ret : count; 11311da177e4SLinus Torvalds } 11327a52b34bSOr Gerlitz static DEVICE_ATTR(create_child, S_IWUSR, NULL, create_child); 11331da177e4SLinus Torvalds 113443cb76d9SGreg Kroah-Hartman static ssize_t delete_child(struct device *dev, 113543cb76d9SGreg Kroah-Hartman struct device_attribute *attr, 11361da177e4SLinus Torvalds const char *buf, size_t count) 11371da177e4SLinus Torvalds { 11381da177e4SLinus Torvalds int pkey; 11391da177e4SLinus Torvalds int ret; 11401da177e4SLinus Torvalds 11411da177e4SLinus Torvalds if (sscanf(buf, "%i", &pkey) != 1) 11421da177e4SLinus Torvalds return -EINVAL; 11431da177e4SLinus Torvalds 11441da177e4SLinus Torvalds if (pkey < 0 || pkey > 0xffff) 11451da177e4SLinus Torvalds return -EINVAL; 11461da177e4SLinus Torvalds 114743cb76d9SGreg Kroah-Hartman ret = ipoib_vlan_delete(to_net_dev(dev), pkey); 11481da177e4SLinus Torvalds 11491da177e4SLinus Torvalds return ret ? ret : count; 11501da177e4SLinus Torvalds 11511da177e4SLinus Torvalds } 11527a52b34bSOr Gerlitz static DEVICE_ATTR(delete_child, S_IWUSR, NULL, delete_child); 11531da177e4SLinus Torvalds 11541da177e4SLinus Torvalds int ipoib_add_pkey_attr(struct net_device *dev) 11551da177e4SLinus Torvalds { 115643cb76d9SGreg Kroah-Hartman return device_create_file(&dev->dev, &dev_attr_pkey); 11571da177e4SLinus Torvalds } 11581da177e4SLinus Torvalds 115983bb63f6SOr Gerlitz int ipoib_set_dev_features(struct ipoib_dev_priv *priv, struct ib_device *hca) 116083bb63f6SOr Gerlitz { 116183bb63f6SOr Gerlitz struct ib_device_attr *device_attr; 116283bb63f6SOr Gerlitz int result = -ENOMEM; 116383bb63f6SOr Gerlitz 116483bb63f6SOr Gerlitz device_attr = kmalloc(sizeof *device_attr, GFP_KERNEL); 116583bb63f6SOr Gerlitz if (!device_attr) { 116683bb63f6SOr Gerlitz printk(KERN_WARNING "%s: allocation of %zu bytes failed\n", 116783bb63f6SOr Gerlitz hca->name, sizeof *device_attr); 116883bb63f6SOr Gerlitz return result; 116983bb63f6SOr Gerlitz } 117083bb63f6SOr Gerlitz 117183bb63f6SOr Gerlitz result = ib_query_device(hca, device_attr); 117283bb63f6SOr Gerlitz if (result) { 117383bb63f6SOr Gerlitz printk(KERN_WARNING "%s: ib_query_device failed (ret = %d)\n", 117483bb63f6SOr Gerlitz hca->name, result); 117583bb63f6SOr Gerlitz kfree(device_attr); 117683bb63f6SOr Gerlitz return result; 117783bb63f6SOr Gerlitz } 117883bb63f6SOr Gerlitz priv->hca_caps = device_attr->device_cap_flags; 117983bb63f6SOr Gerlitz 118083bb63f6SOr Gerlitz kfree(device_attr); 118183bb63f6SOr Gerlitz 118283bb63f6SOr Gerlitz if (priv->hca_caps & IB_DEVICE_UD_IP_CSUM) { 11833d96c74dSMichał Mirosław priv->dev->hw_features = NETIF_F_SG | 11843d96c74dSMichał Mirosław NETIF_F_IP_CSUM | NETIF_F_RXCSUM; 11853d96c74dSMichał Mirosław 11863d96c74dSMichał Mirosław if (priv->hca_caps & IB_DEVICE_UD_TSO) 11873d96c74dSMichał Mirosław priv->dev->hw_features |= NETIF_F_TSO; 11883d96c74dSMichał Mirosław 11893d96c74dSMichał Mirosław priv->dev->features |= priv->dev->hw_features; 119083bb63f6SOr Gerlitz } 119183bb63f6SOr Gerlitz 119283bb63f6SOr Gerlitz return 0; 119383bb63f6SOr Gerlitz } 119483bb63f6SOr Gerlitz 11951da177e4SLinus Torvalds static struct net_device *ipoib_add_port(const char *format, 11961da177e4SLinus Torvalds struct ib_device *hca, u8 port) 11971da177e4SLinus Torvalds { 11981da177e4SLinus Torvalds struct ipoib_dev_priv *priv; 1199bc7b3a36SShirley Ma struct ib_port_attr attr; 12001da177e4SLinus Torvalds int result = -ENOMEM; 12011da177e4SLinus Torvalds 12021da177e4SLinus Torvalds priv = ipoib_intf_alloc(format); 12031da177e4SLinus Torvalds if (!priv) 12041da177e4SLinus Torvalds goto alloc_mem_failed; 12051da177e4SLinus Torvalds 12061da177e4SLinus Torvalds SET_NETDEV_DEV(priv->dev, hca->dma_device); 1207c3aa9b18SEli Cohen priv->dev->dev_id = port - 1; 12081da177e4SLinus Torvalds 1209bc7b3a36SShirley Ma if (!ib_query_port(hca, port, &attr)) 1210bc7b3a36SShirley Ma priv->max_ib_mtu = ib_mtu_enum_to_int(attr.max_mtu); 1211bc7b3a36SShirley Ma else { 1212bc7b3a36SShirley Ma printk(KERN_WARNING "%s: ib_query_port %d failed\n", 1213bc7b3a36SShirley Ma hca->name, port); 1214bc7b3a36SShirley Ma goto device_init_failed; 1215bc7b3a36SShirley Ma } 1216bc7b3a36SShirley Ma 1217bc7b3a36SShirley Ma /* MTU will be reset when mcast join happens */ 1218bc7b3a36SShirley Ma priv->dev->mtu = IPOIB_UD_MTU(priv->max_ib_mtu); 1219bc7b3a36SShirley Ma priv->mcast_mtu = priv->admin_mtu = priv->dev->mtu; 1220bc7b3a36SShirley Ma 12211da177e4SLinus Torvalds result = ib_query_pkey(hca, port, 0, &priv->pkey); 12221da177e4SLinus Torvalds if (result) { 12231da177e4SLinus Torvalds printk(KERN_WARNING "%s: ib_query_pkey port %d failed (ret = %d)\n", 12241da177e4SLinus Torvalds hca->name, port, result); 1225ca6de177SEli Cohen goto device_init_failed; 12261da177e4SLinus Torvalds } 12271da177e4SLinus Torvalds 122883bb63f6SOr Gerlitz if (ipoib_set_dev_features(priv, hca)) 12296046136cSEli Cohen goto device_init_failed; 1230af40da89SVladimir Sokolovsky 12314ce05937SRoland Dreier /* 12324ce05937SRoland Dreier * Set the full membership bit, so that we join the right 12334ce05937SRoland Dreier * broadcast group, etc. 12344ce05937SRoland Dreier */ 12354ce05937SRoland Dreier priv->pkey |= 0x8000; 12364ce05937SRoland Dreier 12371da177e4SLinus Torvalds priv->dev->broadcast[8] = priv->pkey >> 8; 12381da177e4SLinus Torvalds priv->dev->broadcast[9] = priv->pkey & 0xff; 12391da177e4SLinus Torvalds 12401da177e4SLinus Torvalds result = ib_query_gid(hca, port, 0, &priv->local_gid); 12411da177e4SLinus Torvalds if (result) { 12421da177e4SLinus Torvalds printk(KERN_WARNING "%s: ib_query_gid port %d failed (ret = %d)\n", 12431da177e4SLinus Torvalds hca->name, port, result); 1244ca6de177SEli Cohen goto device_init_failed; 12451da177e4SLinus Torvalds } else 12461da177e4SLinus Torvalds memcpy(priv->dev->dev_addr + 4, priv->local_gid.raw, sizeof (union ib_gid)); 12471da177e4SLinus Torvalds 12481da177e4SLinus Torvalds result = ipoib_dev_init(priv->dev, hca, port); 12491da177e4SLinus Torvalds if (result < 0) { 12501da177e4SLinus Torvalds printk(KERN_WARNING "%s: failed to initialize port %d (ret = %d)\n", 12511da177e4SLinus Torvalds hca->name, port, result); 12521da177e4SLinus Torvalds goto device_init_failed; 12531da177e4SLinus Torvalds } 12541da177e4SLinus Torvalds 12551da177e4SLinus Torvalds INIT_IB_EVENT_HANDLER(&priv->event_handler, 12561da177e4SLinus Torvalds priv->ca, ipoib_event); 12571da177e4SLinus Torvalds result = ib_register_event_handler(&priv->event_handler); 12581da177e4SLinus Torvalds if (result < 0) { 12591da177e4SLinus Torvalds printk(KERN_WARNING "%s: ib_register_event_handler failed for " 12601da177e4SLinus Torvalds "port %d (ret = %d)\n", 12611da177e4SLinus Torvalds hca->name, port, result); 12621da177e4SLinus Torvalds goto event_failed; 12631da177e4SLinus Torvalds } 12641da177e4SLinus Torvalds 12651da177e4SLinus Torvalds result = register_netdev(priv->dev); 12661da177e4SLinus Torvalds if (result) { 12671da177e4SLinus Torvalds printk(KERN_WARNING "%s: couldn't register ipoib port %d; error %d\n", 12681da177e4SLinus Torvalds hca->name, port, result); 12691da177e4SLinus Torvalds goto register_failed; 12701da177e4SLinus Torvalds } 12711da177e4SLinus Torvalds 12721732b0efSRoland Dreier ipoib_create_debug_files(priv->dev); 12731da177e4SLinus Torvalds 1274839fcabaSMichael S. Tsirkin if (ipoib_cm_add_mode_attr(priv->dev)) 1275839fcabaSMichael S. Tsirkin goto sysfs_failed; 12761da177e4SLinus Torvalds if (ipoib_add_pkey_attr(priv->dev)) 12771da177e4SLinus Torvalds goto sysfs_failed; 1278335a64a5SOr Gerlitz if (ipoib_add_umcast_attr(priv->dev)) 1279335a64a5SOr Gerlitz goto sysfs_failed; 128043cb76d9SGreg Kroah-Hartman if (device_create_file(&priv->dev->dev, &dev_attr_create_child)) 12811da177e4SLinus Torvalds goto sysfs_failed; 128243cb76d9SGreg Kroah-Hartman if (device_create_file(&priv->dev->dev, &dev_attr_delete_child)) 12831da177e4SLinus Torvalds goto sysfs_failed; 12841da177e4SLinus Torvalds 12851da177e4SLinus Torvalds return priv->dev; 12861da177e4SLinus Torvalds 12871da177e4SLinus Torvalds sysfs_failed: 12881732b0efSRoland Dreier ipoib_delete_debug_files(priv->dev); 12891da177e4SLinus Torvalds unregister_netdev(priv->dev); 12901da177e4SLinus Torvalds 12911da177e4SLinus Torvalds register_failed: 12921da177e4SLinus Torvalds ib_unregister_event_handler(&priv->event_handler); 1293a77a57a1SRoland Dreier flush_workqueue(ipoib_workqueue); 12941da177e4SLinus Torvalds 12951da177e4SLinus Torvalds event_failed: 12961da177e4SLinus Torvalds ipoib_dev_cleanup(priv->dev); 12971da177e4SLinus Torvalds 12981da177e4SLinus Torvalds device_init_failed: 12991da177e4SLinus Torvalds free_netdev(priv->dev); 13001da177e4SLinus Torvalds 13011da177e4SLinus Torvalds alloc_mem_failed: 13021da177e4SLinus Torvalds return ERR_PTR(result); 13031da177e4SLinus Torvalds } 13041da177e4SLinus Torvalds 13051da177e4SLinus Torvalds static void ipoib_add_one(struct ib_device *device) 13061da177e4SLinus Torvalds { 13071da177e4SLinus Torvalds struct list_head *dev_list; 13081da177e4SLinus Torvalds struct net_device *dev; 13091da177e4SLinus Torvalds struct ipoib_dev_priv *priv; 13101da177e4SLinus Torvalds int s, e, p; 13111da177e4SLinus Torvalds 131207ebafbaSTom Tucker if (rdma_node_get_transport(device->node_type) != RDMA_TRANSPORT_IB) 131307ebafbaSTom Tucker return; 131407ebafbaSTom Tucker 13151da177e4SLinus Torvalds dev_list = kmalloc(sizeof *dev_list, GFP_KERNEL); 13161da177e4SLinus Torvalds if (!dev_list) 13171da177e4SLinus Torvalds return; 13181da177e4SLinus Torvalds 13191da177e4SLinus Torvalds INIT_LIST_HEAD(dev_list); 13201da177e4SLinus Torvalds 132107ebafbaSTom Tucker if (device->node_type == RDMA_NODE_IB_SWITCH) { 13221da177e4SLinus Torvalds s = 0; 13231da177e4SLinus Torvalds e = 0; 13241da177e4SLinus Torvalds } else { 13251da177e4SLinus Torvalds s = 1; 13261da177e4SLinus Torvalds e = device->phys_port_cnt; 13271da177e4SLinus Torvalds } 13281da177e4SLinus Torvalds 13291da177e4SLinus Torvalds for (p = s; p <= e; ++p) { 13307b4c8769SEli Cohen if (rdma_port_get_link_layer(device, p) != IB_LINK_LAYER_INFINIBAND) 13317b4c8769SEli Cohen continue; 13321da177e4SLinus Torvalds dev = ipoib_add_port("ib%d", device, p); 13331da177e4SLinus Torvalds if (!IS_ERR(dev)) { 13341da177e4SLinus Torvalds priv = netdev_priv(dev); 13351da177e4SLinus Torvalds list_add_tail(&priv->list, dev_list); 13361da177e4SLinus Torvalds } 13371da177e4SLinus Torvalds } 13381da177e4SLinus Torvalds 13391da177e4SLinus Torvalds ib_set_client_data(device, &ipoib_client, dev_list); 13401da177e4SLinus Torvalds } 13411da177e4SLinus Torvalds 13421da177e4SLinus Torvalds static void ipoib_remove_one(struct ib_device *device) 13431da177e4SLinus Torvalds { 13441da177e4SLinus Torvalds struct ipoib_dev_priv *priv, *tmp; 13451da177e4SLinus Torvalds struct list_head *dev_list; 13461da177e4SLinus Torvalds 134707ebafbaSTom Tucker if (rdma_node_get_transport(device->node_type) != RDMA_TRANSPORT_IB) 134807ebafbaSTom Tucker return; 134907ebafbaSTom Tucker 13501da177e4SLinus Torvalds dev_list = ib_get_client_data(device, &ipoib_client); 13511da177e4SLinus Torvalds 13521da177e4SLinus Torvalds list_for_each_entry_safe(priv, tmp, dev_list, list) { 13531da177e4SLinus Torvalds ib_unregister_event_handler(&priv->event_handler); 1354a77a57a1SRoland Dreier 1355a77a57a1SRoland Dreier rtnl_lock(); 1356a77a57a1SRoland Dreier dev_change_flags(priv->dev, priv->dev->flags & ~IFF_UP); 1357a77a57a1SRoland Dreier rtnl_unlock(); 1358a77a57a1SRoland Dreier 1359a77a57a1SRoland Dreier flush_workqueue(ipoib_workqueue); 13601da177e4SLinus Torvalds 13611da177e4SLinus Torvalds unregister_netdev(priv->dev); 13621da177e4SLinus Torvalds ipoib_dev_cleanup(priv->dev); 13631da177e4SLinus Torvalds free_netdev(priv->dev); 13641da177e4SLinus Torvalds } 136506c56e44SMichael S. Tsirkin 136606c56e44SMichael S. Tsirkin kfree(dev_list); 13671da177e4SLinus Torvalds } 13681da177e4SLinus Torvalds 13691da177e4SLinus Torvalds static int __init ipoib_init_module(void) 13701da177e4SLinus Torvalds { 13711da177e4SLinus Torvalds int ret; 13721da177e4SLinus Torvalds 13730f485251SShirley Ma ipoib_recvq_size = roundup_pow_of_two(ipoib_recvq_size); 13740f485251SShirley Ma ipoib_recvq_size = min(ipoib_recvq_size, IPOIB_MAX_QUEUE_SIZE); 13750f485251SShirley Ma ipoib_recvq_size = max(ipoib_recvq_size, IPOIB_MIN_QUEUE_SIZE); 13760f485251SShirley Ma 13770f485251SShirley Ma ipoib_sendq_size = roundup_pow_of_two(ipoib_sendq_size); 13780f485251SShirley Ma ipoib_sendq_size = min(ipoib_sendq_size, IPOIB_MAX_QUEUE_SIZE); 1379732eacc0SHagen Paul Pfeifer ipoib_sendq_size = max3(ipoib_sendq_size, 2 * MAX_SEND_CQE, IPOIB_MIN_QUEUE_SIZE); 138068e995a2SPradeep Satyanarayana #ifdef CONFIG_INFINIBAND_IPOIB_CM 138168e995a2SPradeep Satyanarayana ipoib_max_conn_qp = min(ipoib_max_conn_qp, IPOIB_CM_MAX_CONN_QP); 138268e995a2SPradeep Satyanarayana #endif 13830f485251SShirley Ma 1384f89271daSEli Cohen /* 1385f89271daSEli Cohen * When copying small received packets, we only copy from the 1386f89271daSEli Cohen * linear data part of the SKB, so we rely on this condition. 1387f89271daSEli Cohen */ 1388f89271daSEli Cohen BUILD_BUG_ON(IPOIB_CM_COPYBREAK > IPOIB_CM_HEAD_SIZE); 1389f89271daSEli Cohen 13901da177e4SLinus Torvalds ret = ipoib_register_debugfs(); 13911da177e4SLinus Torvalds if (ret) 13921da177e4SLinus Torvalds return ret; 13931da177e4SLinus Torvalds 13941da177e4SLinus Torvalds /* 13951da177e4SLinus Torvalds * We create our own workqueue mainly because we want to be 13961da177e4SLinus Torvalds * able to flush it when devices are being removed. We can't 13971da177e4SLinus Torvalds * use schedule_work()/flush_scheduled_work() because both 13981da177e4SLinus Torvalds * unregister_netdev() and linkwatch_event take the rtnl lock, 13991da177e4SLinus Torvalds * so flush_scheduled_work() can deadlock during device 14001da177e4SLinus Torvalds * removal. 14011da177e4SLinus Torvalds */ 14021da177e4SLinus Torvalds ipoib_workqueue = create_singlethread_workqueue("ipoib"); 14031da177e4SLinus Torvalds if (!ipoib_workqueue) { 14041da177e4SLinus Torvalds ret = -ENOMEM; 14051da177e4SLinus Torvalds goto err_fs; 14061da177e4SLinus Torvalds } 14071da177e4SLinus Torvalds 1408c1a0b23bSMichael S. Tsirkin ib_sa_register_client(&ipoib_sa_client); 1409c1a0b23bSMichael S. Tsirkin 14101da177e4SLinus Torvalds ret = ib_register_client(&ipoib_client); 14111da177e4SLinus Torvalds if (ret) 1412c1a0b23bSMichael S. Tsirkin goto err_sa; 14131da177e4SLinus Torvalds 14141da177e4SLinus Torvalds return 0; 14151da177e4SLinus Torvalds 1416c1a0b23bSMichael S. Tsirkin err_sa: 1417c1a0b23bSMichael S. Tsirkin ib_sa_unregister_client(&ipoib_sa_client); 14181da177e4SLinus Torvalds destroy_workqueue(ipoib_workqueue); 14191da177e4SLinus Torvalds 14209adec1a8SRoland Dreier err_fs: 14219adec1a8SRoland Dreier ipoib_unregister_debugfs(); 14229adec1a8SRoland Dreier 14231da177e4SLinus Torvalds return ret; 14241da177e4SLinus Torvalds } 14251da177e4SLinus Torvalds 14261da177e4SLinus Torvalds static void __exit ipoib_cleanup_module(void) 14271da177e4SLinus Torvalds { 14281da177e4SLinus Torvalds ib_unregister_client(&ipoib_client); 1429c1a0b23bSMichael S. Tsirkin ib_sa_unregister_client(&ipoib_sa_client); 14309adec1a8SRoland Dreier ipoib_unregister_debugfs(); 14311da177e4SLinus Torvalds destroy_workqueue(ipoib_workqueue); 14321da177e4SLinus Torvalds } 14331da177e4SLinus Torvalds 14341da177e4SLinus Torvalds module_init(ipoib_init_module); 14351da177e4SLinus Torvalds module_exit(ipoib_cleanup_module); 1436