1 /* 2 * Copyright (c) 2004, 2005 Topspin Communications. All rights reserved. 3 * Copyright (c) 2005 Mellanox Technologies. All rights reserved. 4 * 5 * This software is available to you under a choice of one of two 6 * licenses. You may choose to be licensed under the terms of the GNU 7 * General Public License (GPL) Version 2, available from the file 8 * COPYING in the main directory of this source tree, or the 9 * OpenIB.org BSD license below: 10 * 11 * Redistribution and use in source and binary forms, with or 12 * without modification, are permitted provided that the following 13 * conditions are met: 14 * 15 * - Redistributions of source code must retain the above 16 * copyright notice, this list of conditions and the following 17 * disclaimer. 18 * 19 * - Redistributions in binary form must reproduce the above 20 * copyright notice, this list of conditions and the following 21 * disclaimer in the documentation and/or other materials 22 * provided with the distribution. 23 * 24 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, 25 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF 26 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND 27 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS 28 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN 29 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN 30 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE 31 * SOFTWARE. 32 */ 33 34 #include <linux/slab.h> 35 36 #include "ipoib.h" 37 38 int ipoib_mcast_attach(struct net_device *dev, u16 mlid, union ib_gid *mgid, int set_qkey) 39 { 40 struct ipoib_dev_priv *priv = netdev_priv(dev); 41 struct ib_qp_attr *qp_attr = NULL; 42 int ret; 43 u16 pkey_index; 44 45 if (ib_find_pkey(priv->ca, priv->port, priv->pkey, &pkey_index)) { 46 clear_bit(IPOIB_PKEY_ASSIGNED, &priv->flags); 47 ret = -ENXIO; 48 goto out; 49 } 50 set_bit(IPOIB_PKEY_ASSIGNED, &priv->flags); 51 52 if (set_qkey) { 53 ret = -ENOMEM; 54 qp_attr = kmalloc(sizeof *qp_attr, GFP_KERNEL); 55 if (!qp_attr) 56 goto out; 57 58 /* set correct QKey for QP */ 59 qp_attr->qkey = priv->qkey; 60 ret = ib_modify_qp(priv->qp, qp_attr, IB_QP_QKEY); 61 if (ret) { 62 ipoib_warn(priv, "failed to modify QP, ret = %d\n", ret); 63 goto out; 64 } 65 } 66 67 /* attach QP to multicast group */ 68 ret = ib_attach_mcast(priv->qp, mgid, mlid); 69 if (ret) 70 ipoib_warn(priv, "failed to attach to multicast group, ret = %d\n", ret); 71 72 out: 73 kfree(qp_attr); 74 return ret; 75 } 76 77 int ipoib_init_qp(struct net_device *dev) 78 { 79 struct ipoib_dev_priv *priv = netdev_priv(dev); 80 int ret; 81 struct ib_qp_attr qp_attr; 82 int attr_mask; 83 84 if (!test_bit(IPOIB_PKEY_ASSIGNED, &priv->flags)) 85 return -1; 86 87 qp_attr.qp_state = IB_QPS_INIT; 88 qp_attr.qkey = 0; 89 qp_attr.port_num = priv->port; 90 qp_attr.pkey_index = priv->pkey_index; 91 attr_mask = 92 IB_QP_QKEY | 93 IB_QP_PORT | 94 IB_QP_PKEY_INDEX | 95 IB_QP_STATE; 96 ret = ib_modify_qp(priv->qp, &qp_attr, attr_mask); 97 if (ret) { 98 ipoib_warn(priv, "failed to modify QP to init, ret = %d\n", ret); 99 goto out_fail; 100 } 101 102 qp_attr.qp_state = IB_QPS_RTR; 103 /* Can't set this in a INIT->RTR transition */ 104 attr_mask &= ~IB_QP_PORT; 105 ret = ib_modify_qp(priv->qp, &qp_attr, attr_mask); 106 if (ret) { 107 ipoib_warn(priv, "failed to modify QP to RTR, ret = %d\n", ret); 108 goto out_fail; 109 } 110 111 qp_attr.qp_state = IB_QPS_RTS; 112 qp_attr.sq_psn = 0; 113 attr_mask |= IB_QP_SQ_PSN; 114 attr_mask &= ~IB_QP_PKEY_INDEX; 115 ret = ib_modify_qp(priv->qp, &qp_attr, attr_mask); 116 if (ret) { 117 ipoib_warn(priv, "failed to modify QP to RTS, ret = %d\n", ret); 118 goto out_fail; 119 } 120 121 return 0; 122 123 out_fail: 124 qp_attr.qp_state = IB_QPS_RESET; 125 if (ib_modify_qp(priv->qp, &qp_attr, IB_QP_STATE)) 126 ipoib_warn(priv, "Failed to modify QP to RESET state\n"); 127 128 return ret; 129 } 130 131 int ipoib_transport_dev_init(struct net_device *dev, struct ib_device *ca) 132 { 133 struct ipoib_dev_priv *priv = netdev_priv(dev); 134 struct ib_qp_init_attr init_attr = { 135 .cap = { 136 .max_send_wr = ipoib_sendq_size, 137 .max_recv_wr = ipoib_recvq_size, 138 .max_send_sge = min_t(u32, priv->ca->attrs.max_sge, 139 MAX_SKB_FRAGS + 1), 140 .max_recv_sge = IPOIB_UD_RX_SG 141 }, 142 .sq_sig_type = IB_SIGNAL_ALL_WR, 143 .qp_type = IB_QPT_UD 144 }; 145 struct ib_cq_init_attr cq_attr = {}; 146 147 int ret, size; 148 int i; 149 150 priv->pd = ib_alloc_pd(priv->ca, 0); 151 if (IS_ERR(priv->pd)) { 152 printk(KERN_WARNING "%s: failed to allocate PD\n", ca->name); 153 return -ENODEV; 154 } 155 156 /* 157 * the various IPoIB tasks assume they will never race against 158 * themselves, so always use a single thread workqueue 159 */ 160 priv->wq = alloc_ordered_workqueue("ipoib_wq", WQ_MEM_RECLAIM); 161 if (!priv->wq) { 162 printk(KERN_WARNING "ipoib: failed to allocate device WQ\n"); 163 goto out_free_pd; 164 } 165 166 size = ipoib_recvq_size + 1; 167 ret = ipoib_cm_dev_init(dev); 168 if (!ret) { 169 size += ipoib_sendq_size; 170 if (ipoib_cm_has_srq(dev)) 171 size += ipoib_recvq_size + 1; /* 1 extra for rx_drain_qp */ 172 else 173 size += ipoib_recvq_size * ipoib_max_conn_qp; 174 } else 175 if (ret != -ENOSYS) 176 goto out_free_wq; 177 178 cq_attr.cqe = size; 179 priv->recv_cq = ib_create_cq(priv->ca, ipoib_ib_completion, NULL, 180 dev, &cq_attr); 181 if (IS_ERR(priv->recv_cq)) { 182 printk(KERN_WARNING "%s: failed to create receive CQ\n", ca->name); 183 goto out_cm_dev_cleanup; 184 } 185 186 cq_attr.cqe = ipoib_sendq_size; 187 priv->send_cq = ib_create_cq(priv->ca, ipoib_send_comp_handler, NULL, 188 dev, &cq_attr); 189 if (IS_ERR(priv->send_cq)) { 190 printk(KERN_WARNING "%s: failed to create send CQ\n", ca->name); 191 goto out_free_recv_cq; 192 } 193 194 if (ib_req_notify_cq(priv->recv_cq, IB_CQ_NEXT_COMP)) 195 goto out_free_send_cq; 196 197 init_attr.send_cq = priv->send_cq; 198 init_attr.recv_cq = priv->recv_cq; 199 200 if (priv->hca_caps & IB_DEVICE_UD_TSO) 201 init_attr.create_flags |= IB_QP_CREATE_IPOIB_UD_LSO; 202 203 if (priv->hca_caps & IB_DEVICE_BLOCK_MULTICAST_LOOPBACK) 204 init_attr.create_flags |= IB_QP_CREATE_BLOCK_MULTICAST_LOOPBACK; 205 206 if (priv->hca_caps & IB_DEVICE_MANAGED_FLOW_STEERING) 207 init_attr.create_flags |= IB_QP_CREATE_NETIF_QP; 208 209 priv->qp = ib_create_qp(priv->pd, &init_attr); 210 if (IS_ERR(priv->qp)) { 211 printk(KERN_WARNING "%s: failed to create QP\n", ca->name); 212 goto out_free_send_cq; 213 } 214 215 priv->dev->dev_addr[1] = (priv->qp->qp_num >> 16) & 0xff; 216 priv->dev->dev_addr[2] = (priv->qp->qp_num >> 8) & 0xff; 217 priv->dev->dev_addr[3] = (priv->qp->qp_num ) & 0xff; 218 219 for (i = 0; i < MAX_SKB_FRAGS + 1; ++i) 220 priv->tx_sge[i].lkey = priv->pd->local_dma_lkey; 221 222 priv->tx_wr.wr.opcode = IB_WR_SEND; 223 priv->tx_wr.wr.sg_list = priv->tx_sge; 224 priv->tx_wr.wr.send_flags = IB_SEND_SIGNALED; 225 226 priv->rx_sge[0].lkey = priv->pd->local_dma_lkey; 227 228 priv->rx_sge[0].length = IPOIB_UD_BUF_SIZE(priv->max_ib_mtu); 229 priv->rx_wr.num_sge = 1; 230 231 priv->rx_wr.next = NULL; 232 priv->rx_wr.sg_list = priv->rx_sge; 233 234 if (init_attr.cap.max_send_sge > 1) 235 dev->features |= NETIF_F_SG; 236 237 priv->max_send_sge = init_attr.cap.max_send_sge; 238 239 return 0; 240 241 out_free_send_cq: 242 ib_destroy_cq(priv->send_cq); 243 244 out_free_recv_cq: 245 ib_destroy_cq(priv->recv_cq); 246 247 out_cm_dev_cleanup: 248 ipoib_cm_dev_cleanup(dev); 249 250 out_free_wq: 251 destroy_workqueue(priv->wq); 252 priv->wq = NULL; 253 254 out_free_pd: 255 ib_dealloc_pd(priv->pd); 256 257 return -ENODEV; 258 } 259 260 void ipoib_transport_dev_cleanup(struct net_device *dev) 261 { 262 struct ipoib_dev_priv *priv = netdev_priv(dev); 263 264 if (priv->qp) { 265 if (ib_destroy_qp(priv->qp)) 266 ipoib_warn(priv, "ib_qp_destroy failed\n"); 267 268 priv->qp = NULL; 269 clear_bit(IPOIB_PKEY_ASSIGNED, &priv->flags); 270 } 271 272 if (ib_destroy_cq(priv->send_cq)) 273 ipoib_warn(priv, "ib_cq_destroy (send) failed\n"); 274 275 if (ib_destroy_cq(priv->recv_cq)) 276 ipoib_warn(priv, "ib_cq_destroy (recv) failed\n"); 277 278 ipoib_cm_dev_cleanup(dev); 279 280 if (priv->wq) { 281 flush_workqueue(priv->wq); 282 destroy_workqueue(priv->wq); 283 priv->wq = NULL; 284 } 285 286 ib_dealloc_pd(priv->pd); 287 } 288 289 void ipoib_event(struct ib_event_handler *handler, 290 struct ib_event *record) 291 { 292 struct ipoib_dev_priv *priv = 293 container_of(handler, struct ipoib_dev_priv, event_handler); 294 295 if (record->element.port_num != priv->port) 296 return; 297 298 ipoib_dbg(priv, "Event %d on device %s port %d\n", record->event, 299 record->device->name, record->element.port_num); 300 301 if (record->event == IB_EVENT_SM_CHANGE || 302 record->event == IB_EVENT_CLIENT_REREGISTER) { 303 queue_work(ipoib_workqueue, &priv->flush_light); 304 } else if (record->event == IB_EVENT_PORT_ERR || 305 record->event == IB_EVENT_PORT_ACTIVE || 306 record->event == IB_EVENT_LID_CHANGE) { 307 queue_work(ipoib_workqueue, &priv->flush_normal); 308 } else if (record->event == IB_EVENT_PKEY_CHANGE) { 309 queue_work(ipoib_workqueue, &priv->flush_heavy); 310 } else if (record->event == IB_EVENT_GID_CHANGE && 311 !test_bit(IPOIB_FLAG_DEV_ADDR_SET, &priv->flags)) { 312 queue_work(ipoib_workqueue, &priv->flush_light); 313 } 314 } 315