1 /* QLogic qedr NIC Driver 2 * Copyright (c) 2015-2016 QLogic Corporation 3 * 4 * This software is available to you under a choice of one of two 5 * licenses. You may choose to be licensed under the terms of the GNU 6 * General Public License (GPL) Version 2, available from the file 7 * COPYING in the main directory of this source tree, or the 8 * OpenIB.org BSD license below: 9 * 10 * Redistribution and use in source and binary forms, with or 11 * without modification, are permitted provided that the following 12 * conditions are met: 13 * 14 * - Redistributions of source code must retain the above 15 * copyright notice, this list of conditions and the following 16 * disclaimer. 17 * 18 * - Redistributions in binary form must reproduce the above 19 * copyright notice, this list of conditions and the following 20 * disclaimer in the documentation and /or other materials 21 * provided with the distribution. 22 * 23 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, 24 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF 25 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND 26 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS 27 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN 28 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN 29 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE 30 * SOFTWARE. 31 */ 32 #include <linux/dma-mapping.h> 33 #include <linux/crc32.h> 34 #include <net/ip.h> 35 #include <net/ipv6.h> 36 #include <net/udp.h> 37 #include <linux/iommu.h> 38 39 #include <rdma/ib_verbs.h> 40 #include <rdma/ib_user_verbs.h> 41 #include <rdma/iw_cm.h> 42 #include <rdma/ib_umem.h> 43 #include <rdma/ib_addr.h> 44 #include <rdma/ib_cache.h> 45 46 #include <linux/qed/common_hsi.h> 47 #include "qedr_hsi_rdma.h" 48 #include <linux/qed/qed_if.h> 49 #include "qedr.h" 50 #include "verbs.h" 51 #include <rdma/qedr-abi.h> 52 #include "qedr_roce_cm.h" 53 54 #define QEDR_SRQ_WQE_ELEM_SIZE sizeof(union rdma_srq_elm) 55 #define RDMA_MAX_SGE_PER_SRQ (4) 56 #define RDMA_MAX_SRQ_WQE_SIZE (RDMA_MAX_SGE_PER_SRQ + 1) 57 58 #define DB_ADDR_SHIFT(addr) ((addr) << DB_PWM_ADDR_OFFSET_SHIFT) 59 60 static inline int qedr_ib_copy_to_udata(struct ib_udata *udata, void *src, 61 size_t len) 62 { 63 size_t min_len = min_t(size_t, len, udata->outlen); 64 65 return ib_copy_to_udata(udata, src, min_len); 66 } 67 68 int qedr_query_pkey(struct ib_device *ibdev, u8 port, u16 index, u16 *pkey) 69 { 70 if (index > QEDR_ROCE_PKEY_TABLE_LEN) 71 return -EINVAL; 72 73 *pkey = QEDR_ROCE_PKEY_DEFAULT; 74 return 0; 75 } 76 77 int qedr_iw_query_gid(struct ib_device *ibdev, u8 port, 78 int index, union ib_gid *sgid) 79 { 80 struct qedr_dev *dev = get_qedr_dev(ibdev); 81 82 memset(sgid->raw, 0, sizeof(sgid->raw)); 83 ether_addr_copy(sgid->raw, dev->ndev->dev_addr); 84 85 DP_DEBUG(dev, QEDR_MSG_INIT, "QUERY sgid[%d]=%llx:%llx\n", index, 86 sgid->global.interface_id, sgid->global.subnet_prefix); 87 88 return 0; 89 } 90 91 int qedr_query_srq(struct ib_srq *ibsrq, struct ib_srq_attr *srq_attr) 92 { 93 struct qedr_dev *dev = get_qedr_dev(ibsrq->device); 94 struct qedr_device_attr *qattr = &dev->attr; 95 struct qedr_srq *srq = get_qedr_srq(ibsrq); 96 97 srq_attr->srq_limit = srq->srq_limit; 98 srq_attr->max_wr = qattr->max_srq_wr; 99 srq_attr->max_sge = qattr->max_sge; 100 101 return 0; 102 } 103 104 int qedr_query_device(struct ib_device *ibdev, 105 struct ib_device_attr *attr, struct ib_udata *udata) 106 { 107 struct qedr_dev *dev = 
get_qedr_dev(ibdev); 108 struct qedr_device_attr *qattr = &dev->attr; 109 110 if (!dev->rdma_ctx) { 111 DP_ERR(dev, 112 "qedr_query_device called with invalid params rdma_ctx=%p\n", 113 dev->rdma_ctx); 114 return -EINVAL; 115 } 116 117 memset(attr, 0, sizeof(*attr)); 118 119 attr->fw_ver = qattr->fw_ver; 120 attr->sys_image_guid = qattr->sys_image_guid; 121 attr->max_mr_size = qattr->max_mr_size; 122 attr->page_size_cap = qattr->page_size_caps; 123 attr->vendor_id = qattr->vendor_id; 124 attr->vendor_part_id = qattr->vendor_part_id; 125 attr->hw_ver = qattr->hw_ver; 126 attr->max_qp = qattr->max_qp; 127 attr->max_qp_wr = max_t(u32, qattr->max_sqe, qattr->max_rqe); 128 attr->device_cap_flags = IB_DEVICE_CURR_QP_STATE_MOD | 129 IB_DEVICE_RC_RNR_NAK_GEN | 130 IB_DEVICE_LOCAL_DMA_LKEY | IB_DEVICE_MEM_MGT_EXTENSIONS; 131 132 attr->max_send_sge = qattr->max_sge; 133 attr->max_recv_sge = qattr->max_sge; 134 attr->max_sge_rd = qattr->max_sge; 135 attr->max_cq = qattr->max_cq; 136 attr->max_cqe = qattr->max_cqe; 137 attr->max_mr = qattr->max_mr; 138 attr->max_mw = qattr->max_mw; 139 attr->max_pd = qattr->max_pd; 140 attr->atomic_cap = dev->atomic_cap; 141 attr->max_fmr = qattr->max_fmr; 142 attr->max_map_per_fmr = 16; 143 attr->max_qp_init_rd_atom = 144 1 << (fls(qattr->max_qp_req_rd_atomic_resc) - 1); 145 attr->max_qp_rd_atom = 146 min(1 << (fls(qattr->max_qp_resp_rd_atomic_resc) - 1), 147 attr->max_qp_init_rd_atom); 148 149 attr->max_srq = qattr->max_srq; 150 attr->max_srq_sge = qattr->max_srq_sge; 151 attr->max_srq_wr = qattr->max_srq_wr; 152 153 attr->local_ca_ack_delay = qattr->dev_ack_delay; 154 attr->max_fast_reg_page_list_len = qattr->max_mr / 8; 155 attr->max_pkeys = QEDR_ROCE_PKEY_MAX; 156 attr->max_ah = qattr->max_ah; 157 158 return 0; 159 } 160 161 #define QEDR_SPEED_SDR (1) 162 #define QEDR_SPEED_DDR (2) 163 #define QEDR_SPEED_QDR (4) 164 #define QEDR_SPEED_FDR10 (8) 165 #define QEDR_SPEED_FDR (16) 166 #define QEDR_SPEED_EDR (32) 167 168 static inline void get_link_speed_and_width(int speed, u8 *ib_speed, 169 u8 *ib_width) 170 { 171 switch (speed) { 172 case 1000: 173 *ib_speed = QEDR_SPEED_SDR; 174 *ib_width = IB_WIDTH_1X; 175 break; 176 case 10000: 177 *ib_speed = QEDR_SPEED_QDR; 178 *ib_width = IB_WIDTH_1X; 179 break; 180 181 case 20000: 182 *ib_speed = QEDR_SPEED_DDR; 183 *ib_width = IB_WIDTH_4X; 184 break; 185 186 case 25000: 187 *ib_speed = QEDR_SPEED_EDR; 188 *ib_width = IB_WIDTH_1X; 189 break; 190 191 case 40000: 192 *ib_speed = QEDR_SPEED_QDR; 193 *ib_width = IB_WIDTH_4X; 194 break; 195 196 case 50000: 197 *ib_speed = QEDR_SPEED_QDR; 198 *ib_width = IB_WIDTH_4X; 199 break; 200 201 case 100000: 202 *ib_speed = QEDR_SPEED_EDR; 203 *ib_width = IB_WIDTH_4X; 204 break; 205 206 default: 207 /* Unsupported */ 208 *ib_speed = QEDR_SPEED_SDR; 209 *ib_width = IB_WIDTH_1X; 210 } 211 } 212 213 int qedr_query_port(struct ib_device *ibdev, u8 port, struct ib_port_attr *attr) 214 { 215 struct qedr_dev *dev; 216 struct qed_rdma_port *rdma_port; 217 218 dev = get_qedr_dev(ibdev); 219 if (port > 1) { 220 DP_ERR(dev, "invalid_port=0x%x\n", port); 221 return -EINVAL; 222 } 223 224 if (!dev->rdma_ctx) { 225 DP_ERR(dev, "rdma_ctx is NULL\n"); 226 return -EINVAL; 227 } 228 229 rdma_port = dev->ops->rdma_query_port(dev->rdma_ctx); 230 231 /* *attr being zeroed by the caller, avoid zeroing it here */ 232 if (rdma_port->port_state == QED_RDMA_PORT_UP) { 233 attr->state = IB_PORT_ACTIVE; 234 attr->phys_state = 5; 235 } else { 236 attr->state = IB_PORT_DOWN; 237 attr->phys_state = 3; 238 } 239 
attr->max_mtu = IB_MTU_4096; 240 attr->active_mtu = iboe_get_mtu(dev->ndev->mtu); 241 attr->lid = 0; 242 attr->lmc = 0; 243 attr->sm_lid = 0; 244 attr->sm_sl = 0; 245 attr->ip_gids = true; 246 if (rdma_protocol_iwarp(&dev->ibdev, 1)) { 247 attr->gid_tbl_len = 1; 248 attr->pkey_tbl_len = 1; 249 } else { 250 attr->gid_tbl_len = QEDR_MAX_SGID; 251 attr->pkey_tbl_len = QEDR_ROCE_PKEY_TABLE_LEN; 252 } 253 attr->bad_pkey_cntr = rdma_port->pkey_bad_counter; 254 attr->qkey_viol_cntr = 0; 255 get_link_speed_and_width(rdma_port->link_speed, 256 &attr->active_speed, &attr->active_width); 257 attr->max_msg_sz = rdma_port->max_msg_size; 258 attr->max_vl_num = 4; 259 260 return 0; 261 } 262 263 int qedr_modify_port(struct ib_device *ibdev, u8 port, int mask, 264 struct ib_port_modify *props) 265 { 266 struct qedr_dev *dev; 267 268 dev = get_qedr_dev(ibdev); 269 if (port > 1) { 270 DP_ERR(dev, "invalid_port=0x%x\n", port); 271 return -EINVAL; 272 } 273 274 return 0; 275 } 276 277 static int qedr_add_mmap(struct qedr_ucontext *uctx, u64 phy_addr, 278 unsigned long len) 279 { 280 struct qedr_mm *mm; 281 282 mm = kzalloc(sizeof(*mm), GFP_KERNEL); 283 if (!mm) 284 return -ENOMEM; 285 286 mm->key.phy_addr = phy_addr; 287 /* This function might be called with a length which is not a multiple 288 * of PAGE_SIZE, while the mapping is PAGE_SIZE grained and the kernel 289 * forces this granularity by increasing the requested size if needed. 290 * When qedr_mmap is called, it will search the list with the updated 291 * length as a key. To prevent search failures, the length is rounded up 292 * in advance to PAGE_SIZE. 293 */ 294 mm->key.len = roundup(len, PAGE_SIZE); 295 INIT_LIST_HEAD(&mm->entry); 296 297 mutex_lock(&uctx->mm_list_lock); 298 list_add(&mm->entry, &uctx->mm_head); 299 mutex_unlock(&uctx->mm_list_lock); 300 301 DP_DEBUG(uctx->dev, QEDR_MSG_MISC, 302 "added (addr=0x%llx,len=0x%lx) for ctx=%p\n", 303 (unsigned long long)mm->key.phy_addr, 304 (unsigned long)mm->key.len, uctx); 305 306 return 0; 307 } 308 309 static bool qedr_search_mmap(struct qedr_ucontext *uctx, u64 phy_addr, 310 unsigned long len) 311 { 312 bool found = false; 313 struct qedr_mm *mm; 314 315 mutex_lock(&uctx->mm_list_lock); 316 list_for_each_entry(mm, &uctx->mm_head, entry) { 317 if (len != mm->key.len || phy_addr != mm->key.phy_addr) 318 continue; 319 320 found = true; 321 break; 322 } 323 mutex_unlock(&uctx->mm_list_lock); 324 DP_DEBUG(uctx->dev, QEDR_MSG_MISC, 325 "searched for (addr=0x%llx,len=0x%lx) for ctx=%p, result=%d\n", 326 mm->key.phy_addr, mm->key.len, uctx, found); 327 328 return found; 329 } 330 331 struct ib_ucontext *qedr_alloc_ucontext(struct ib_device *ibdev, 332 struct ib_udata *udata) 333 { 334 int rc; 335 struct qedr_ucontext *ctx; 336 struct qedr_alloc_ucontext_resp uresp; 337 struct qedr_dev *dev = get_qedr_dev(ibdev); 338 struct qed_rdma_add_user_out_params oparams; 339 340 if (!udata) 341 return ERR_PTR(-EFAULT); 342 343 ctx = kzalloc(sizeof(*ctx), GFP_KERNEL); 344 if (!ctx) 345 return ERR_PTR(-ENOMEM); 346 347 rc = dev->ops->rdma_add_user(dev->rdma_ctx, &oparams); 348 if (rc) { 349 DP_ERR(dev, 350 "failed to allocate a DPI for a new RoCE application, rc=%d. To overcome this consider to increase the number of DPIs, increase the doorbell BAR size or just close unnecessary RoCE applications. 
In order to increase the number of DPIs consult the qedr readme\n", 351 rc); 352 goto err; 353 } 354 355 ctx->dpi = oparams.dpi; 356 ctx->dpi_addr = oparams.dpi_addr; 357 ctx->dpi_phys_addr = oparams.dpi_phys_addr; 358 ctx->dpi_size = oparams.dpi_size; 359 INIT_LIST_HEAD(&ctx->mm_head); 360 mutex_init(&ctx->mm_list_lock); 361 362 memset(&uresp, 0, sizeof(uresp)); 363 364 uresp.dpm_enabled = dev->user_dpm_enabled; 365 uresp.wids_enabled = 1; 366 uresp.wid_count = oparams.wid_count; 367 uresp.db_pa = ctx->dpi_phys_addr; 368 uresp.db_size = ctx->dpi_size; 369 uresp.max_send_wr = dev->attr.max_sqe; 370 uresp.max_recv_wr = dev->attr.max_rqe; 371 uresp.max_srq_wr = dev->attr.max_srq_wr; 372 uresp.sges_per_send_wr = QEDR_MAX_SQE_ELEMENTS_PER_SQE; 373 uresp.sges_per_recv_wr = QEDR_MAX_RQE_ELEMENTS_PER_RQE; 374 uresp.sges_per_srq_wr = dev->attr.max_srq_sge; 375 uresp.max_cqes = QEDR_MAX_CQES; 376 377 rc = qedr_ib_copy_to_udata(udata, &uresp, sizeof(uresp)); 378 if (rc) 379 goto err; 380 381 ctx->dev = dev; 382 383 rc = qedr_add_mmap(ctx, ctx->dpi_phys_addr, ctx->dpi_size); 384 if (rc) 385 goto err; 386 387 DP_DEBUG(dev, QEDR_MSG_INIT, "Allocating user context %p\n", 388 &ctx->ibucontext); 389 return &ctx->ibucontext; 390 391 err: 392 kfree(ctx); 393 return ERR_PTR(rc); 394 } 395 396 int qedr_dealloc_ucontext(struct ib_ucontext *ibctx) 397 { 398 struct qedr_ucontext *uctx = get_qedr_ucontext(ibctx); 399 struct qedr_mm *mm, *tmp; 400 int status = 0; 401 402 DP_DEBUG(uctx->dev, QEDR_MSG_INIT, "Deallocating user context %p\n", 403 uctx); 404 uctx->dev->ops->rdma_remove_user(uctx->dev->rdma_ctx, uctx->dpi); 405 406 list_for_each_entry_safe(mm, tmp, &uctx->mm_head, entry) { 407 DP_DEBUG(uctx->dev, QEDR_MSG_MISC, 408 "deleted (addr=0x%llx,len=0x%lx) for ctx=%p\n", 409 mm->key.phy_addr, mm->key.len, uctx); 410 list_del(&mm->entry); 411 kfree(mm); 412 } 413 414 kfree(uctx); 415 return status; 416 } 417 418 int qedr_mmap(struct ib_ucontext *context, struct vm_area_struct *vma) 419 { 420 struct qedr_ucontext *ucontext = get_qedr_ucontext(context); 421 struct qedr_dev *dev = get_qedr_dev(context->device); 422 unsigned long phys_addr = vma->vm_pgoff << PAGE_SHIFT; 423 unsigned long len = (vma->vm_end - vma->vm_start); 424 unsigned long dpi_start; 425 426 dpi_start = dev->db_phys_addr + (ucontext->dpi * ucontext->dpi_size); 427 428 DP_DEBUG(dev, QEDR_MSG_INIT, 429 "mmap invoked with vm_start=0x%pK, vm_end=0x%pK,vm_pgoff=0x%pK; dpi_start=0x%pK dpi_size=0x%x\n", 430 (void *)vma->vm_start, (void *)vma->vm_end, 431 (void *)vma->vm_pgoff, (void *)dpi_start, ucontext->dpi_size); 432 433 if ((vma->vm_start & (PAGE_SIZE - 1)) || (len & (PAGE_SIZE - 1))) { 434 DP_ERR(dev, 435 "failed mmap, addresses must be page aligned: start=0x%pK, end=0x%pK\n", 436 (void *)vma->vm_start, (void *)vma->vm_end); 437 return -EINVAL; 438 } 439 440 if (!qedr_search_mmap(ucontext, phys_addr, len)) { 441 DP_ERR(dev, "failed mmap, vm_pgoff=0x%lx is not authorized\n", 442 vma->vm_pgoff); 443 return -EINVAL; 444 } 445 446 if (phys_addr < dpi_start || 447 ((phys_addr + len) > (dpi_start + ucontext->dpi_size))) { 448 DP_ERR(dev, 449 "failed mmap, pages are outside of dpi; page address=0x%pK, dpi_start=0x%pK, dpi_size=0x%x\n", 450 (void *)phys_addr, (void *)dpi_start, 451 ucontext->dpi_size); 452 return -EINVAL; 453 } 454 455 if (vma->vm_flags & VM_READ) { 456 DP_ERR(dev, "failed mmap, cannot map doorbell bar for read\n"); 457 return -EINVAL; 458 } 459 460 vma->vm_page_prot = pgprot_writecombine(vma->vm_page_prot); 461 return 
io_remap_pfn_range(vma, vma->vm_start, vma->vm_pgoff, len, 462 vma->vm_page_prot); 463 } 464 465 struct ib_pd *qedr_alloc_pd(struct ib_device *ibdev, 466 struct ib_ucontext *context, struct ib_udata *udata) 467 { 468 struct qedr_dev *dev = get_qedr_dev(ibdev); 469 struct qedr_pd *pd; 470 u16 pd_id; 471 int rc; 472 473 DP_DEBUG(dev, QEDR_MSG_INIT, "Function called from: %s\n", 474 (udata && context) ? "User Lib" : "Kernel"); 475 476 if (!dev->rdma_ctx) { 477 DP_ERR(dev, "invalid RDMA context\n"); 478 return ERR_PTR(-EINVAL); 479 } 480 481 pd = kzalloc(sizeof(*pd), GFP_KERNEL); 482 if (!pd) 483 return ERR_PTR(-ENOMEM); 484 485 rc = dev->ops->rdma_alloc_pd(dev->rdma_ctx, &pd_id); 486 if (rc) 487 goto err; 488 489 pd->pd_id = pd_id; 490 491 if (udata && context) { 492 struct qedr_alloc_pd_uresp uresp = { 493 .pd_id = pd_id, 494 }; 495 496 rc = qedr_ib_copy_to_udata(udata, &uresp, sizeof(uresp)); 497 if (rc) { 498 DP_ERR(dev, "copy error pd_id=0x%x.\n", pd_id); 499 dev->ops->rdma_dealloc_pd(dev->rdma_ctx, pd_id); 500 goto err; 501 } 502 503 pd->uctx = get_qedr_ucontext(context); 504 pd->uctx->pd = pd; 505 } 506 507 return &pd->ibpd; 508 509 err: 510 kfree(pd); 511 return ERR_PTR(rc); 512 } 513 514 int qedr_dealloc_pd(struct ib_pd *ibpd) 515 { 516 struct qedr_dev *dev = get_qedr_dev(ibpd->device); 517 struct qedr_pd *pd = get_qedr_pd(ibpd); 518 519 if (!pd) { 520 pr_err("Invalid PD received in dealloc_pd\n"); 521 return -EINVAL; 522 } 523 524 DP_DEBUG(dev, QEDR_MSG_INIT, "Deallocating PD %d\n", pd->pd_id); 525 dev->ops->rdma_dealloc_pd(dev->rdma_ctx, pd->pd_id); 526 527 kfree(pd); 528 529 return 0; 530 } 531 532 static void qedr_free_pbl(struct qedr_dev *dev, 533 struct qedr_pbl_info *pbl_info, struct qedr_pbl *pbl) 534 { 535 struct pci_dev *pdev = dev->pdev; 536 int i; 537 538 for (i = 0; i < pbl_info->num_pbls; i++) { 539 if (!pbl[i].va) 540 continue; 541 dma_free_coherent(&pdev->dev, pbl_info->pbl_size, 542 pbl[i].va, pbl[i].pa); 543 } 544 545 kfree(pbl); 546 } 547 548 #define MIN_FW_PBL_PAGE_SIZE (4 * 1024) 549 #define MAX_FW_PBL_PAGE_SIZE (64 * 1024) 550 551 #define NUM_PBES_ON_PAGE(_page_size) (_page_size / sizeof(u64)) 552 #define MAX_PBES_ON_PAGE NUM_PBES_ON_PAGE(MAX_FW_PBL_PAGE_SIZE) 553 #define MAX_PBES_TWO_LAYER (MAX_PBES_ON_PAGE * MAX_PBES_ON_PAGE) 554 555 static struct qedr_pbl *qedr_alloc_pbl_tbl(struct qedr_dev *dev, 556 struct qedr_pbl_info *pbl_info, 557 gfp_t flags) 558 { 559 struct pci_dev *pdev = dev->pdev; 560 struct qedr_pbl *pbl_table; 561 dma_addr_t *pbl_main_tbl; 562 dma_addr_t pa; 563 void *va; 564 int i; 565 566 pbl_table = kcalloc(pbl_info->num_pbls, sizeof(*pbl_table), flags); 567 if (!pbl_table) 568 return ERR_PTR(-ENOMEM); 569 570 for (i = 0; i < pbl_info->num_pbls; i++) { 571 va = dma_zalloc_coherent(&pdev->dev, pbl_info->pbl_size, 572 &pa, flags); 573 if (!va) 574 goto err; 575 576 pbl_table[i].va = va; 577 pbl_table[i].pa = pa; 578 } 579 580 /* Two-Layer PBLs, if we have more than one pbl we need to initialize 581 * the first one with physical pointers to all of the rest 582 */ 583 pbl_main_tbl = (dma_addr_t *)pbl_table[0].va; 584 for (i = 0; i < pbl_info->num_pbls - 1; i++) 585 pbl_main_tbl[i] = pbl_table[i + 1].pa; 586 587 return pbl_table; 588 589 err: 590 for (i--; i >= 0; i--) 591 dma_free_coherent(&pdev->dev, pbl_info->pbl_size, 592 pbl_table[i].va, pbl_table[i].pa); 593 594 qedr_free_pbl(dev, pbl_info, pbl_table); 595 596 return ERR_PTR(-ENOMEM); 597 } 598 599 static int qedr_prepare_pbl_tbl(struct qedr_dev *dev, 600 struct qedr_pbl_info *pbl_info, 601 
u32 num_pbes, int two_layer_capable) 602 { 603 u32 pbl_capacity; 604 u32 pbl_size; 605 u32 num_pbls; 606 607 if ((num_pbes > MAX_PBES_ON_PAGE) && two_layer_capable) { 608 if (num_pbes > MAX_PBES_TWO_LAYER) { 609 DP_ERR(dev, "prepare pbl table: too many pages %d\n", 610 num_pbes); 611 return -EINVAL; 612 } 613 614 /* calculate required pbl page size */ 615 pbl_size = MIN_FW_PBL_PAGE_SIZE; 616 pbl_capacity = NUM_PBES_ON_PAGE(pbl_size) * 617 NUM_PBES_ON_PAGE(pbl_size); 618 619 while (pbl_capacity < num_pbes) { 620 pbl_size *= 2; 621 pbl_capacity = pbl_size / sizeof(u64); 622 pbl_capacity = pbl_capacity * pbl_capacity; 623 } 624 625 num_pbls = DIV_ROUND_UP(num_pbes, NUM_PBES_ON_PAGE(pbl_size)); 626 num_pbls++; /* One for the layer0 ( points to the pbls) */ 627 pbl_info->two_layered = true; 628 } else { 629 /* One layered PBL */ 630 num_pbls = 1; 631 pbl_size = max_t(u32, MIN_FW_PBL_PAGE_SIZE, 632 roundup_pow_of_two((num_pbes * sizeof(u64)))); 633 pbl_info->two_layered = false; 634 } 635 636 pbl_info->num_pbls = num_pbls; 637 pbl_info->pbl_size = pbl_size; 638 pbl_info->num_pbes = num_pbes; 639 640 DP_DEBUG(dev, QEDR_MSG_MR, 641 "prepare pbl table: num_pbes=%d, num_pbls=%d, pbl_size=%d\n", 642 pbl_info->num_pbes, pbl_info->num_pbls, pbl_info->pbl_size); 643 644 return 0; 645 } 646 647 static void qedr_populate_pbls(struct qedr_dev *dev, struct ib_umem *umem, 648 struct qedr_pbl *pbl, 649 struct qedr_pbl_info *pbl_info, u32 pg_shift) 650 { 651 int shift, pg_cnt, pages, pbe_cnt, total_num_pbes = 0; 652 u32 fw_pg_cnt, fw_pg_per_umem_pg; 653 struct qedr_pbl *pbl_tbl; 654 struct scatterlist *sg; 655 struct regpair *pbe; 656 u64 pg_addr; 657 int entry; 658 659 if (!pbl_info->num_pbes) 660 return; 661 662 /* If we have a two layered pbl, the first pbl points to the rest 663 * of the pbls and the first entry lays on the second pbl in the table 664 */ 665 if (pbl_info->two_layered) 666 pbl_tbl = &pbl[1]; 667 else 668 pbl_tbl = pbl; 669 670 pbe = (struct regpair *)pbl_tbl->va; 671 if (!pbe) { 672 DP_ERR(dev, "cannot populate PBL due to a NULL PBE\n"); 673 return; 674 } 675 676 pbe_cnt = 0; 677 678 shift = umem->page_shift; 679 680 fw_pg_per_umem_pg = BIT(umem->page_shift - pg_shift); 681 682 for_each_sg(umem->sg_head.sgl, sg, umem->nmap, entry) { 683 pages = sg_dma_len(sg) >> shift; 684 pg_addr = sg_dma_address(sg); 685 for (pg_cnt = 0; pg_cnt < pages; pg_cnt++) { 686 for (fw_pg_cnt = 0; fw_pg_cnt < fw_pg_per_umem_pg;) { 687 pbe->lo = cpu_to_le32(pg_addr); 688 pbe->hi = cpu_to_le32(upper_32_bits(pg_addr)); 689 690 pg_addr += BIT(pg_shift); 691 pbe_cnt++; 692 total_num_pbes++; 693 pbe++; 694 695 if (total_num_pbes == pbl_info->num_pbes) 696 return; 697 698 /* If the given pbl is full storing the pbes, 699 * move to next pbl. 
700 */ 701 if (pbe_cnt == 702 (pbl_info->pbl_size / sizeof(u64))) { 703 pbl_tbl++; 704 pbe = (struct regpair *)pbl_tbl->va; 705 pbe_cnt = 0; 706 } 707 708 fw_pg_cnt++; 709 } 710 } 711 } 712 } 713 714 static int qedr_copy_cq_uresp(struct qedr_dev *dev, 715 struct qedr_cq *cq, struct ib_udata *udata) 716 { 717 struct qedr_create_cq_uresp uresp; 718 int rc; 719 720 memset(&uresp, 0, sizeof(uresp)); 721 722 uresp.db_offset = DB_ADDR_SHIFT(DQ_PWM_OFFSET_UCM_RDMA_CQ_CONS_32BIT); 723 uresp.icid = cq->icid; 724 725 rc = qedr_ib_copy_to_udata(udata, &uresp, sizeof(uresp)); 726 if (rc) 727 DP_ERR(dev, "copy error cqid=0x%x.\n", cq->icid); 728 729 return rc; 730 } 731 732 static void consume_cqe(struct qedr_cq *cq) 733 { 734 if (cq->latest_cqe == cq->toggle_cqe) 735 cq->pbl_toggle ^= RDMA_CQE_REQUESTER_TOGGLE_BIT_MASK; 736 737 cq->latest_cqe = qed_chain_consume(&cq->pbl); 738 } 739 740 static inline int qedr_align_cq_entries(int entries) 741 { 742 u64 size, aligned_size; 743 744 /* We allocate an extra entry that we don't report to the FW. */ 745 size = (entries + 1) * QEDR_CQE_SIZE; 746 aligned_size = ALIGN(size, PAGE_SIZE); 747 748 return aligned_size / QEDR_CQE_SIZE; 749 } 750 751 static inline int qedr_init_user_queue(struct ib_ucontext *ib_ctx, 752 struct qedr_dev *dev, 753 struct qedr_userq *q, 754 u64 buf_addr, size_t buf_len, 755 int access, int dmasync, 756 int alloc_and_init) 757 { 758 u32 fw_pages; 759 int rc; 760 761 q->buf_addr = buf_addr; 762 q->buf_len = buf_len; 763 q->umem = ib_umem_get(ib_ctx, q->buf_addr, q->buf_len, access, dmasync); 764 if (IS_ERR(q->umem)) { 765 DP_ERR(dev, "create user queue: failed ib_umem_get, got %ld\n", 766 PTR_ERR(q->umem)); 767 return PTR_ERR(q->umem); 768 } 769 770 fw_pages = ib_umem_page_count(q->umem) << 771 (q->umem->page_shift - FW_PAGE_SHIFT); 772 773 rc = qedr_prepare_pbl_tbl(dev, &q->pbl_info, fw_pages, 0); 774 if (rc) 775 goto err0; 776 777 if (alloc_and_init) { 778 q->pbl_tbl = qedr_alloc_pbl_tbl(dev, &q->pbl_info, GFP_KERNEL); 779 if (IS_ERR(q->pbl_tbl)) { 780 rc = PTR_ERR(q->pbl_tbl); 781 goto err0; 782 } 783 qedr_populate_pbls(dev, q->umem, q->pbl_tbl, &q->pbl_info, 784 FW_PAGE_SHIFT); 785 } else { 786 q->pbl_tbl = kzalloc(sizeof(*q->pbl_tbl), GFP_KERNEL); 787 if (!q->pbl_tbl) { 788 rc = -ENOMEM; 789 goto err0; 790 } 791 } 792 793 return 0; 794 795 err0: 796 ib_umem_release(q->umem); 797 q->umem = NULL; 798 799 return rc; 800 } 801 802 static inline void qedr_init_cq_params(struct qedr_cq *cq, 803 struct qedr_ucontext *ctx, 804 struct qedr_dev *dev, int vector, 805 int chain_entries, int page_cnt, 806 u64 pbl_ptr, 807 struct qed_rdma_create_cq_in_params 808 *params) 809 { 810 memset(params, 0, sizeof(*params)); 811 params->cq_handle_hi = upper_32_bits((uintptr_t)cq); 812 params->cq_handle_lo = lower_32_bits((uintptr_t)cq); 813 params->cnq_id = vector; 814 params->cq_size = chain_entries - 1; 815 params->dpi = (ctx) ? 
ctx->dpi : dev->dpi; 816 params->pbl_num_pages = page_cnt; 817 params->pbl_ptr = pbl_ptr; 818 params->pbl_two_level = 0; 819 } 820 821 static void doorbell_cq(struct qedr_cq *cq, u32 cons, u8 flags) 822 { 823 cq->db.data.agg_flags = flags; 824 cq->db.data.value = cpu_to_le32(cons); 825 writeq(cq->db.raw, cq->db_addr); 826 827 /* Make sure write would stick */ 828 mmiowb(); 829 } 830 831 int qedr_arm_cq(struct ib_cq *ibcq, enum ib_cq_notify_flags flags) 832 { 833 struct qedr_cq *cq = get_qedr_cq(ibcq); 834 unsigned long sflags; 835 struct qedr_dev *dev; 836 837 dev = get_qedr_dev(ibcq->device); 838 839 if (cq->destroyed) { 840 DP_ERR(dev, 841 "warning: arm was invoked after destroy for cq %p (icid=%d)\n", 842 cq, cq->icid); 843 return -EINVAL; 844 } 845 846 847 if (cq->cq_type == QEDR_CQ_TYPE_GSI) 848 return 0; 849 850 spin_lock_irqsave(&cq->cq_lock, sflags); 851 852 cq->arm_flags = 0; 853 854 if (flags & IB_CQ_SOLICITED) 855 cq->arm_flags |= DQ_UCM_ROCE_CQ_ARM_SE_CF_CMD; 856 857 if (flags & IB_CQ_NEXT_COMP) 858 cq->arm_flags |= DQ_UCM_ROCE_CQ_ARM_CF_CMD; 859 860 doorbell_cq(cq, cq->cq_cons - 1, cq->arm_flags); 861 862 spin_unlock_irqrestore(&cq->cq_lock, sflags); 863 864 return 0; 865 } 866 867 struct ib_cq *qedr_create_cq(struct ib_device *ibdev, 868 const struct ib_cq_init_attr *attr, 869 struct ib_ucontext *ib_ctx, struct ib_udata *udata) 870 { 871 struct qedr_ucontext *ctx = get_qedr_ucontext(ib_ctx); 872 struct qed_rdma_destroy_cq_out_params destroy_oparams; 873 struct qed_rdma_destroy_cq_in_params destroy_iparams; 874 struct qedr_dev *dev = get_qedr_dev(ibdev); 875 struct qed_rdma_create_cq_in_params params; 876 struct qedr_create_cq_ureq ureq; 877 int vector = attr->comp_vector; 878 int entries = attr->cqe; 879 struct qedr_cq *cq; 880 int chain_entries; 881 int page_cnt; 882 u64 pbl_ptr; 883 u16 icid; 884 int rc; 885 886 DP_DEBUG(dev, QEDR_MSG_INIT, 887 "create_cq: called from %s. entries=%d, vector=%d\n", 888 udata ? "User Lib" : "Kernel", entries, vector); 889 890 if (entries > QEDR_MAX_CQES) { 891 DP_ERR(dev, 892 "create cq: the number of entries %d is too high. 
Must be equal or below %d.\n", 893 entries, QEDR_MAX_CQES); 894 return ERR_PTR(-EINVAL); 895 } 896 897 chain_entries = qedr_align_cq_entries(entries); 898 chain_entries = min_t(int, chain_entries, QEDR_MAX_CQES); 899 900 cq = kzalloc(sizeof(*cq), GFP_KERNEL); 901 if (!cq) 902 return ERR_PTR(-ENOMEM); 903 904 if (udata) { 905 memset(&ureq, 0, sizeof(ureq)); 906 if (ib_copy_from_udata(&ureq, udata, sizeof(ureq))) { 907 DP_ERR(dev, 908 "create cq: problem copying data from user space\n"); 909 goto err0; 910 } 911 912 if (!ureq.len) { 913 DP_ERR(dev, 914 "create cq: cannot create a cq with 0 entries\n"); 915 goto err0; 916 } 917 918 cq->cq_type = QEDR_CQ_TYPE_USER; 919 920 rc = qedr_init_user_queue(ib_ctx, dev, &cq->q, ureq.addr, 921 ureq.len, IB_ACCESS_LOCAL_WRITE, 922 1, 1); 923 if (rc) 924 goto err0; 925 926 pbl_ptr = cq->q.pbl_tbl->pa; 927 page_cnt = cq->q.pbl_info.num_pbes; 928 929 cq->ibcq.cqe = chain_entries; 930 } else { 931 cq->cq_type = QEDR_CQ_TYPE_KERNEL; 932 933 rc = dev->ops->common->chain_alloc(dev->cdev, 934 QED_CHAIN_USE_TO_CONSUME, 935 QED_CHAIN_MODE_PBL, 936 QED_CHAIN_CNT_TYPE_U32, 937 chain_entries, 938 sizeof(union rdma_cqe), 939 &cq->pbl, NULL); 940 if (rc) 941 goto err1; 942 943 page_cnt = qed_chain_get_page_cnt(&cq->pbl); 944 pbl_ptr = qed_chain_get_pbl_phys(&cq->pbl); 945 cq->ibcq.cqe = cq->pbl.capacity; 946 } 947 948 qedr_init_cq_params(cq, ctx, dev, vector, chain_entries, page_cnt, 949 pbl_ptr, ¶ms); 950 951 rc = dev->ops->rdma_create_cq(dev->rdma_ctx, ¶ms, &icid); 952 if (rc) 953 goto err2; 954 955 cq->icid = icid; 956 cq->sig = QEDR_CQ_MAGIC_NUMBER; 957 spin_lock_init(&cq->cq_lock); 958 959 if (ib_ctx) { 960 rc = qedr_copy_cq_uresp(dev, cq, udata); 961 if (rc) 962 goto err3; 963 } else { 964 /* Generate doorbell address. */ 965 cq->db_addr = dev->db_addr + 966 DB_ADDR_SHIFT(DQ_PWM_OFFSET_UCM_RDMA_CQ_CONS_32BIT); 967 cq->db.data.icid = cq->icid; 968 cq->db.data.params = DB_AGG_CMD_SET << 969 RDMA_PWM_VAL32_DATA_AGG_CMD_SHIFT; 970 971 /* point to the very last element, passing it we will toggle */ 972 cq->toggle_cqe = qed_chain_get_last_elem(&cq->pbl); 973 cq->pbl_toggle = RDMA_CQE_REQUESTER_TOGGLE_BIT_MASK; 974 cq->latest_cqe = NULL; 975 consume_cqe(cq); 976 cq->cq_cons = qed_chain_get_cons_idx_u32(&cq->pbl); 977 } 978 979 DP_DEBUG(dev, QEDR_MSG_CQ, 980 "create cq: icid=0x%0x, addr=%p, size(entries)=0x%0x\n", 981 cq->icid, cq, params.cq_size); 982 983 return &cq->ibcq; 984 985 err3: 986 destroy_iparams.icid = cq->icid; 987 dev->ops->rdma_destroy_cq(dev->rdma_ctx, &destroy_iparams, 988 &destroy_oparams); 989 err2: 990 if (udata) 991 qedr_free_pbl(dev, &cq->q.pbl_info, cq->q.pbl_tbl); 992 else 993 dev->ops->common->chain_free(dev->cdev, &cq->pbl); 994 err1: 995 if (udata) 996 ib_umem_release(cq->q.umem); 997 err0: 998 kfree(cq); 999 return ERR_PTR(-EINVAL); 1000 } 1001 1002 int qedr_resize_cq(struct ib_cq *ibcq, int new_cnt, struct ib_udata *udata) 1003 { 1004 struct qedr_dev *dev = get_qedr_dev(ibcq->device); 1005 struct qedr_cq *cq = get_qedr_cq(ibcq); 1006 1007 DP_ERR(dev, "cq %p RESIZE NOT SUPPORTED\n", cq); 1008 1009 return 0; 1010 } 1011 1012 #define QEDR_DESTROY_CQ_MAX_ITERATIONS (10) 1013 #define QEDR_DESTROY_CQ_ITER_DURATION (10) 1014 1015 int qedr_destroy_cq(struct ib_cq *ibcq) 1016 { 1017 struct qedr_dev *dev = get_qedr_dev(ibcq->device); 1018 struct qed_rdma_destroy_cq_out_params oparams; 1019 struct qed_rdma_destroy_cq_in_params iparams; 1020 struct qedr_cq *cq = get_qedr_cq(ibcq); 1021 int iter; 1022 int rc; 1023 1024 DP_DEBUG(dev, QEDR_MSG_CQ, "destroy 
cq %p (icid=%d)\n", cq, cq->icid); 1025 1026 cq->destroyed = 1; 1027 1028 /* GSIs CQs are handled by driver, so they don't exist in the FW */ 1029 if (cq->cq_type == QEDR_CQ_TYPE_GSI) 1030 goto done; 1031 1032 iparams.icid = cq->icid; 1033 rc = dev->ops->rdma_destroy_cq(dev->rdma_ctx, &iparams, &oparams); 1034 if (rc) 1035 return rc; 1036 1037 dev->ops->common->chain_free(dev->cdev, &cq->pbl); 1038 1039 if (ibcq->uobject && ibcq->uobject->context) { 1040 qedr_free_pbl(dev, &cq->q.pbl_info, cq->q.pbl_tbl); 1041 ib_umem_release(cq->q.umem); 1042 } 1043 1044 /* We don't want the IRQ handler to handle a non-existing CQ so we 1045 * wait until all CNQ interrupts, if any, are received. This will always 1046 * happen and will always happen very fast. If not, then a serious error 1047 * has occured. That is why we can use a long delay. 1048 * We spin for a short time so we don’t lose time on context switching 1049 * in case all the completions are handled in that span. Otherwise 1050 * we sleep for a while and check again. Since the CNQ may be 1051 * associated with (only) the current CPU we use msleep to allow the 1052 * current CPU to be freed. 1053 * The CNQ notification is increased in qedr_irq_handler(). 1054 */ 1055 iter = QEDR_DESTROY_CQ_MAX_ITERATIONS; 1056 while (oparams.num_cq_notif != READ_ONCE(cq->cnq_notif) && iter) { 1057 udelay(QEDR_DESTROY_CQ_ITER_DURATION); 1058 iter--; 1059 } 1060 1061 iter = QEDR_DESTROY_CQ_MAX_ITERATIONS; 1062 while (oparams.num_cq_notif != READ_ONCE(cq->cnq_notif) && iter) { 1063 msleep(QEDR_DESTROY_CQ_ITER_DURATION); 1064 iter--; 1065 } 1066 1067 if (oparams.num_cq_notif != cq->cnq_notif) 1068 goto err; 1069 1070 /* Note that we don't need to have explicit code to wait for the 1071 * completion of the event handler because it is invoked from the EQ. 1072 * Since the destroy CQ ramrod has also been received on the EQ we can 1073 * be certain that there's no event handler in process. 
1074 */ 1075 done: 1076 cq->sig = ~cq->sig; 1077 1078 kfree(cq); 1079 1080 return 0; 1081 1082 err: 1083 DP_ERR(dev, 1084 "CQ %p (icid=%d) not freed, expecting %d ints but got %d ints\n", 1085 cq, cq->icid, oparams.num_cq_notif, cq->cnq_notif); 1086 1087 return -EINVAL; 1088 } 1089 1090 static inline int get_gid_info_from_table(struct ib_qp *ibqp, 1091 struct ib_qp_attr *attr, 1092 int attr_mask, 1093 struct qed_rdma_modify_qp_in_params 1094 *qp_params) 1095 { 1096 const struct ib_gid_attr *gid_attr; 1097 enum rdma_network_type nw_type; 1098 const struct ib_global_route *grh = rdma_ah_read_grh(&attr->ah_attr); 1099 u32 ipv4_addr; 1100 int i; 1101 1102 gid_attr = grh->sgid_attr; 1103 qp_params->vlan_id = rdma_vlan_dev_vlan_id(gid_attr->ndev); 1104 1105 nw_type = rdma_gid_attr_network_type(gid_attr); 1106 switch (nw_type) { 1107 case RDMA_NETWORK_IPV6: 1108 memcpy(&qp_params->sgid.bytes[0], &gid_attr->gid.raw[0], 1109 sizeof(qp_params->sgid)); 1110 memcpy(&qp_params->dgid.bytes[0], 1111 &grh->dgid, 1112 sizeof(qp_params->dgid)); 1113 qp_params->roce_mode = ROCE_V2_IPV6; 1114 SET_FIELD(qp_params->modify_flags, 1115 QED_ROCE_MODIFY_QP_VALID_ROCE_MODE, 1); 1116 break; 1117 case RDMA_NETWORK_IB: 1118 memcpy(&qp_params->sgid.bytes[0], &gid_attr->gid.raw[0], 1119 sizeof(qp_params->sgid)); 1120 memcpy(&qp_params->dgid.bytes[0], 1121 &grh->dgid, 1122 sizeof(qp_params->dgid)); 1123 qp_params->roce_mode = ROCE_V1; 1124 break; 1125 case RDMA_NETWORK_IPV4: 1126 memset(&qp_params->sgid, 0, sizeof(qp_params->sgid)); 1127 memset(&qp_params->dgid, 0, sizeof(qp_params->dgid)); 1128 ipv4_addr = qedr_get_ipv4_from_gid(gid_attr->gid.raw); 1129 qp_params->sgid.ipv4_addr = ipv4_addr; 1130 ipv4_addr = 1131 qedr_get_ipv4_from_gid(grh->dgid.raw); 1132 qp_params->dgid.ipv4_addr = ipv4_addr; 1133 SET_FIELD(qp_params->modify_flags, 1134 QED_ROCE_MODIFY_QP_VALID_ROCE_MODE, 1); 1135 qp_params->roce_mode = ROCE_V2_IPV4; 1136 break; 1137 } 1138 1139 for (i = 0; i < 4; i++) { 1140 qp_params->sgid.dwords[i] = ntohl(qp_params->sgid.dwords[i]); 1141 qp_params->dgid.dwords[i] = ntohl(qp_params->dgid.dwords[i]); 1142 } 1143 1144 if (qp_params->vlan_id >= VLAN_CFI_MASK) 1145 qp_params->vlan_id = 0; 1146 1147 return 0; 1148 } 1149 1150 static int qedr_check_qp_attrs(struct ib_pd *ibpd, struct qedr_dev *dev, 1151 struct ib_qp_init_attr *attrs) 1152 { 1153 struct qedr_device_attr *qattr = &dev->attr; 1154 1155 /* QP0... 
attrs->qp_type == IB_QPT_GSI */ 1156 if (attrs->qp_type != IB_QPT_RC && attrs->qp_type != IB_QPT_GSI) { 1157 DP_DEBUG(dev, QEDR_MSG_QP, 1158 "create qp: unsupported qp type=0x%x requested\n", 1159 attrs->qp_type); 1160 return -EINVAL; 1161 } 1162 1163 if (attrs->cap.max_send_wr > qattr->max_sqe) { 1164 DP_ERR(dev, 1165 "create qp: cannot create a SQ with %d elements (max_send_wr=0x%x)\n", 1166 attrs->cap.max_send_wr, qattr->max_sqe); 1167 return -EINVAL; 1168 } 1169 1170 if (attrs->cap.max_inline_data > qattr->max_inline) { 1171 DP_ERR(dev, 1172 "create qp: unsupported inline data size=0x%x requested (max_inline=0x%x)\n", 1173 attrs->cap.max_inline_data, qattr->max_inline); 1174 return -EINVAL; 1175 } 1176 1177 if (attrs->cap.max_send_sge > qattr->max_sge) { 1178 DP_ERR(dev, 1179 "create qp: unsupported send_sge=0x%x requested (max_send_sge=0x%x)\n", 1180 attrs->cap.max_send_sge, qattr->max_sge); 1181 return -EINVAL; 1182 } 1183 1184 if (attrs->cap.max_recv_sge > qattr->max_sge) { 1185 DP_ERR(dev, 1186 "create qp: unsupported recv_sge=0x%x requested (max_recv_sge=0x%x)\n", 1187 attrs->cap.max_recv_sge, qattr->max_sge); 1188 return -EINVAL; 1189 } 1190 1191 /* Unprivileged user space cannot create special QP */ 1192 if (ibpd->uobject && attrs->qp_type == IB_QPT_GSI) { 1193 DP_ERR(dev, 1194 "create qp: userspace can't create special QPs of type=0x%x\n", 1195 attrs->qp_type); 1196 return -EINVAL; 1197 } 1198 1199 return 0; 1200 } 1201 1202 static int qedr_copy_srq_uresp(struct qedr_dev *dev, 1203 struct qedr_srq *srq, struct ib_udata *udata) 1204 { 1205 struct qedr_create_srq_uresp uresp = {}; 1206 int rc; 1207 1208 uresp.srq_id = srq->srq_id; 1209 1210 rc = ib_copy_to_udata(udata, &uresp, sizeof(uresp)); 1211 if (rc) 1212 DP_ERR(dev, "create srq: problem copying data to user space\n"); 1213 1214 return rc; 1215 } 1216 1217 static void qedr_copy_rq_uresp(struct qedr_dev *dev, 1218 struct qedr_create_qp_uresp *uresp, 1219 struct qedr_qp *qp) 1220 { 1221 /* iWARP requires two doorbells per RQ. 
*/ 1222 if (rdma_protocol_iwarp(&dev->ibdev, 1)) { 1223 uresp->rq_db_offset = 1224 DB_ADDR_SHIFT(DQ_PWM_OFFSET_TCM_IWARP_RQ_PROD); 1225 uresp->rq_db2_offset = DB_ADDR_SHIFT(DQ_PWM_OFFSET_TCM_FLAGS); 1226 } else { 1227 uresp->rq_db_offset = 1228 DB_ADDR_SHIFT(DQ_PWM_OFFSET_TCM_ROCE_RQ_PROD); 1229 } 1230 1231 uresp->rq_icid = qp->icid; 1232 } 1233 1234 static void qedr_copy_sq_uresp(struct qedr_dev *dev, 1235 struct qedr_create_qp_uresp *uresp, 1236 struct qedr_qp *qp) 1237 { 1238 uresp->sq_db_offset = DB_ADDR_SHIFT(DQ_PWM_OFFSET_XCM_RDMA_SQ_PROD); 1239 1240 /* iWARP uses the same cid for rq and sq */ 1241 if (rdma_protocol_iwarp(&dev->ibdev, 1)) 1242 uresp->sq_icid = qp->icid; 1243 else 1244 uresp->sq_icid = qp->icid + 1; 1245 } 1246 1247 static int qedr_copy_qp_uresp(struct qedr_dev *dev, 1248 struct qedr_qp *qp, struct ib_udata *udata) 1249 { 1250 struct qedr_create_qp_uresp uresp; 1251 int rc; 1252 1253 memset(&uresp, 0, sizeof(uresp)); 1254 qedr_copy_sq_uresp(dev, &uresp, qp); 1255 qedr_copy_rq_uresp(dev, &uresp, qp); 1256 1257 uresp.atomic_supported = dev->atomic_cap != IB_ATOMIC_NONE; 1258 uresp.qp_id = qp->qp_id; 1259 1260 rc = qedr_ib_copy_to_udata(udata, &uresp, sizeof(uresp)); 1261 if (rc) 1262 DP_ERR(dev, 1263 "create qp: failed a copy to user space with qp icid=0x%x.\n", 1264 qp->icid); 1265 1266 return rc; 1267 } 1268 1269 static void qedr_set_common_qp_params(struct qedr_dev *dev, 1270 struct qedr_qp *qp, 1271 struct qedr_pd *pd, 1272 struct ib_qp_init_attr *attrs) 1273 { 1274 spin_lock_init(&qp->q_lock); 1275 atomic_set(&qp->refcnt, 1); 1276 qp->pd = pd; 1277 qp->qp_type = attrs->qp_type; 1278 qp->max_inline_data = attrs->cap.max_inline_data; 1279 qp->sq.max_sges = attrs->cap.max_send_sge; 1280 qp->state = QED_ROCE_QP_STATE_RESET; 1281 qp->signaled = (attrs->sq_sig_type == IB_SIGNAL_ALL_WR) ? true : false; 1282 qp->sq_cq = get_qedr_cq(attrs->send_cq); 1283 qp->dev = dev; 1284 1285 if (attrs->srq) { 1286 qp->srq = get_qedr_srq(attrs->srq); 1287 } else { 1288 qp->rq_cq = get_qedr_cq(attrs->recv_cq); 1289 qp->rq.max_sges = attrs->cap.max_recv_sge; 1290 DP_DEBUG(dev, QEDR_MSG_QP, 1291 "RQ params:\trq_max_sges = %d, rq_cq_id = %d\n", 1292 qp->rq.max_sges, qp->rq_cq->icid); 1293 } 1294 1295 DP_DEBUG(dev, QEDR_MSG_QP, 1296 "QP params:\tpd = %d, qp_type = %d, max_inline_data = %d, state = %d, signaled = %d, use_srq=%d\n", 1297 pd->pd_id, qp->qp_type, qp->max_inline_data, 1298 qp->state, qp->signaled, (attrs->srq) ? 
1 : 0); 1299 DP_DEBUG(dev, QEDR_MSG_QP, 1300 "SQ params:\tsq_max_sges = %d, sq_cq_id = %d\n", 1301 qp->sq.max_sges, qp->sq_cq->icid); 1302 } 1303 1304 static void qedr_set_roce_db_info(struct qedr_dev *dev, struct qedr_qp *qp) 1305 { 1306 qp->sq.db = dev->db_addr + 1307 DB_ADDR_SHIFT(DQ_PWM_OFFSET_XCM_RDMA_SQ_PROD); 1308 qp->sq.db_data.data.icid = qp->icid + 1; 1309 if (!qp->srq) { 1310 qp->rq.db = dev->db_addr + 1311 DB_ADDR_SHIFT(DQ_PWM_OFFSET_TCM_ROCE_RQ_PROD); 1312 qp->rq.db_data.data.icid = qp->icid; 1313 } 1314 } 1315 1316 static int qedr_check_srq_params(struct ib_pd *ibpd, struct qedr_dev *dev, 1317 struct ib_srq_init_attr *attrs, 1318 struct ib_udata *udata) 1319 { 1320 struct qedr_device_attr *qattr = &dev->attr; 1321 1322 if (attrs->attr.max_wr > qattr->max_srq_wr) { 1323 DP_ERR(dev, 1324 "create srq: unsupported srq_wr=0x%x requested (max_srq_wr=0x%x)\n", 1325 attrs->attr.max_wr, qattr->max_srq_wr); 1326 return -EINVAL; 1327 } 1328 1329 if (attrs->attr.max_sge > qattr->max_sge) { 1330 DP_ERR(dev, 1331 "create srq: unsupported sge=0x%x requested (max_srq_sge=0x%x)\n", 1332 attrs->attr.max_sge, qattr->max_sge); 1333 return -EINVAL; 1334 } 1335 1336 return 0; 1337 } 1338 1339 static void qedr_free_srq_user_params(struct qedr_srq *srq) 1340 { 1341 qedr_free_pbl(srq->dev, &srq->usrq.pbl_info, srq->usrq.pbl_tbl); 1342 ib_umem_release(srq->usrq.umem); 1343 ib_umem_release(srq->prod_umem); 1344 } 1345 1346 static void qedr_free_srq_kernel_params(struct qedr_srq *srq) 1347 { 1348 struct qedr_srq_hwq_info *hw_srq = &srq->hw_srq; 1349 struct qedr_dev *dev = srq->dev; 1350 1351 dev->ops->common->chain_free(dev->cdev, &hw_srq->pbl); 1352 1353 dma_free_coherent(&dev->pdev->dev, sizeof(struct rdma_srq_producers), 1354 hw_srq->virt_prod_pair_addr, 1355 hw_srq->phy_prod_pair_addr); 1356 } 1357 1358 static int qedr_init_srq_user_params(struct ib_ucontext *ib_ctx, 1359 struct qedr_srq *srq, 1360 struct qedr_create_srq_ureq *ureq, 1361 int access, int dmasync) 1362 { 1363 struct scatterlist *sg; 1364 int rc; 1365 1366 rc = qedr_init_user_queue(ib_ctx, srq->dev, &srq->usrq, ureq->srq_addr, 1367 ureq->srq_len, access, dmasync, 1); 1368 if (rc) 1369 return rc; 1370 1371 srq->prod_umem = ib_umem_get(ib_ctx, ureq->prod_pair_addr, 1372 sizeof(struct rdma_srq_producers), 1373 access, dmasync); 1374 if (IS_ERR(srq->prod_umem)) { 1375 qedr_free_pbl(srq->dev, &srq->usrq.pbl_info, srq->usrq.pbl_tbl); 1376 ib_umem_release(srq->usrq.umem); 1377 DP_ERR(srq->dev, 1378 "create srq: failed ib_umem_get for producer, got %ld\n", 1379 PTR_ERR(srq->prod_umem)); 1380 return PTR_ERR(srq->prod_umem); 1381 } 1382 1383 sg = srq->prod_umem->sg_head.sgl; 1384 srq->hw_srq.phy_prod_pair_addr = sg_dma_address(sg); 1385 1386 return 0; 1387 } 1388 1389 static int qedr_alloc_srq_kernel_params(struct qedr_srq *srq, 1390 struct qedr_dev *dev, 1391 struct ib_srq_init_attr *init_attr) 1392 { 1393 struct qedr_srq_hwq_info *hw_srq = &srq->hw_srq; 1394 dma_addr_t phy_prod_pair_addr; 1395 u32 num_elems; 1396 void *va; 1397 int rc; 1398 1399 va = dma_alloc_coherent(&dev->pdev->dev, 1400 sizeof(struct rdma_srq_producers), 1401 &phy_prod_pair_addr, GFP_KERNEL); 1402 if (!va) { 1403 DP_ERR(dev, 1404 "create srq: failed to allocate dma memory for producer\n"); 1405 return -ENOMEM; 1406 } 1407 1408 hw_srq->phy_prod_pair_addr = phy_prod_pair_addr; 1409 hw_srq->virt_prod_pair_addr = va; 1410 1411 num_elems = init_attr->attr.max_wr * RDMA_MAX_SRQ_WQE_SIZE; 1412 rc = dev->ops->common->chain_alloc(dev->cdev, 1413 QED_CHAIN_USE_TO_CONSUME_PRODUCE, 
1414 QED_CHAIN_MODE_PBL, 1415 QED_CHAIN_CNT_TYPE_U32, 1416 num_elems, 1417 QEDR_SRQ_WQE_ELEM_SIZE, 1418 &hw_srq->pbl, NULL); 1419 if (rc) 1420 goto err0; 1421 1422 hw_srq->num_elems = num_elems; 1423 1424 return 0; 1425 1426 err0: 1427 dma_free_coherent(&dev->pdev->dev, sizeof(struct rdma_srq_producers), 1428 va, phy_prod_pair_addr); 1429 return rc; 1430 } 1431 1432 static int qedr_idr_add(struct qedr_dev *dev, struct qedr_idr *qidr, 1433 void *ptr, u32 id); 1434 static void qedr_idr_remove(struct qedr_dev *dev, 1435 struct qedr_idr *qidr, u32 id); 1436 1437 struct ib_srq *qedr_create_srq(struct ib_pd *ibpd, 1438 struct ib_srq_init_attr *init_attr, 1439 struct ib_udata *udata) 1440 { 1441 struct qed_rdma_destroy_srq_in_params destroy_in_params; 1442 struct qed_rdma_create_srq_in_params in_params = {}; 1443 struct qedr_dev *dev = get_qedr_dev(ibpd->device); 1444 struct qed_rdma_create_srq_out_params out_params; 1445 struct qedr_pd *pd = get_qedr_pd(ibpd); 1446 struct qedr_create_srq_ureq ureq = {}; 1447 u64 pbl_base_addr, phy_prod_pair_addr; 1448 struct ib_ucontext *ib_ctx = NULL; 1449 struct qedr_srq_hwq_info *hw_srq; 1450 struct qedr_ucontext *ctx = NULL; 1451 u32 page_cnt, page_size; 1452 struct qedr_srq *srq; 1453 int rc = 0; 1454 1455 DP_DEBUG(dev, QEDR_MSG_QP, 1456 "create SRQ called from %s (pd %p)\n", 1457 (udata) ? "User lib" : "kernel", pd); 1458 1459 rc = qedr_check_srq_params(ibpd, dev, init_attr, udata); 1460 if (rc) 1461 return ERR_PTR(-EINVAL); 1462 1463 srq = kzalloc(sizeof(*srq), GFP_KERNEL); 1464 if (!srq) 1465 return ERR_PTR(-ENOMEM); 1466 1467 srq->dev = dev; 1468 hw_srq = &srq->hw_srq; 1469 spin_lock_init(&srq->lock); 1470 1471 hw_srq->max_wr = init_attr->attr.max_wr; 1472 hw_srq->max_sges = init_attr->attr.max_sge; 1473 1474 if (udata && ibpd->uobject && ibpd->uobject->context) { 1475 ib_ctx = ibpd->uobject->context; 1476 ctx = get_qedr_ucontext(ib_ctx); 1477 1478 if (ib_copy_from_udata(&ureq, udata, sizeof(ureq))) { 1479 DP_ERR(dev, 1480 "create srq: problem copying data from user space\n"); 1481 goto err0; 1482 } 1483 1484 rc = qedr_init_srq_user_params(ib_ctx, srq, &ureq, 0, 0); 1485 if (rc) 1486 goto err0; 1487 1488 page_cnt = srq->usrq.pbl_info.num_pbes; 1489 pbl_base_addr = srq->usrq.pbl_tbl->pa; 1490 phy_prod_pair_addr = hw_srq->phy_prod_pair_addr; 1491 page_size = BIT(srq->usrq.umem->page_shift); 1492 } else { 1493 struct qed_chain *pbl; 1494 1495 rc = qedr_alloc_srq_kernel_params(srq, dev, init_attr); 1496 if (rc) 1497 goto err0; 1498 1499 pbl = &hw_srq->pbl; 1500 page_cnt = qed_chain_get_page_cnt(pbl); 1501 pbl_base_addr = qed_chain_get_pbl_phys(pbl); 1502 phy_prod_pair_addr = hw_srq->phy_prod_pair_addr; 1503 page_size = QED_CHAIN_PAGE_SIZE; 1504 } 1505 1506 in_params.pd_id = pd->pd_id; 1507 in_params.pbl_base_addr = pbl_base_addr; 1508 in_params.prod_pair_addr = phy_prod_pair_addr; 1509 in_params.num_pages = page_cnt; 1510 in_params.page_size = page_size; 1511 1512 rc = dev->ops->rdma_create_srq(dev->rdma_ctx, &in_params, &out_params); 1513 if (rc) 1514 goto err1; 1515 1516 srq->srq_id = out_params.srq_id; 1517 1518 if (udata) { 1519 rc = qedr_copy_srq_uresp(dev, srq, udata); 1520 if (rc) 1521 goto err2; 1522 } 1523 1524 rc = qedr_idr_add(dev, &dev->srqidr, srq, srq->srq_id); 1525 if (rc) 1526 goto err2; 1527 1528 DP_DEBUG(dev, QEDR_MSG_SRQ, 1529 "create srq: created srq with srq_id=0x%0x\n", srq->srq_id); 1530 return &srq->ibsrq; 1531 1532 err2: 1533 destroy_in_params.srq_id = srq->srq_id; 1534 1535 dev->ops->rdma_destroy_srq(dev->rdma_ctx, 
&destroy_in_params); 1536 err1: 1537 if (udata) 1538 qedr_free_srq_user_params(srq); 1539 else 1540 qedr_free_srq_kernel_params(srq); 1541 err0: 1542 kfree(srq); 1543 1544 return ERR_PTR(-EFAULT); 1545 } 1546 1547 int qedr_destroy_srq(struct ib_srq *ibsrq) 1548 { 1549 struct qed_rdma_destroy_srq_in_params in_params = {}; 1550 struct qedr_dev *dev = get_qedr_dev(ibsrq->device); 1551 struct qedr_srq *srq = get_qedr_srq(ibsrq); 1552 1553 qedr_idr_remove(dev, &dev->srqidr, srq->srq_id); 1554 in_params.srq_id = srq->srq_id; 1555 dev->ops->rdma_destroy_srq(dev->rdma_ctx, &in_params); 1556 1557 if (ibsrq->pd->uobject) 1558 qedr_free_srq_user_params(srq); 1559 else 1560 qedr_free_srq_kernel_params(srq); 1561 1562 DP_DEBUG(dev, QEDR_MSG_SRQ, 1563 "destroy srq: destroyed srq with srq_id=0x%0x\n", 1564 srq->srq_id); 1565 kfree(srq); 1566 1567 return 0; 1568 } 1569 1570 int qedr_modify_srq(struct ib_srq *ibsrq, struct ib_srq_attr *attr, 1571 enum ib_srq_attr_mask attr_mask, struct ib_udata *udata) 1572 { 1573 struct qed_rdma_modify_srq_in_params in_params = {}; 1574 struct qedr_dev *dev = get_qedr_dev(ibsrq->device); 1575 struct qedr_srq *srq = get_qedr_srq(ibsrq); 1576 int rc; 1577 1578 if (attr_mask & IB_SRQ_MAX_WR) { 1579 DP_ERR(dev, 1580 "modify srq: invalid attribute mask=0x%x specified for %p\n", 1581 attr_mask, srq); 1582 return -EINVAL; 1583 } 1584 1585 if (attr_mask & IB_SRQ_LIMIT) { 1586 if (attr->srq_limit >= srq->hw_srq.max_wr) { 1587 DP_ERR(dev, 1588 "modify srq: invalid srq_limit=0x%x (max_srq_limit=0x%x)\n", 1589 attr->srq_limit, srq->hw_srq.max_wr); 1590 return -EINVAL; 1591 } 1592 1593 in_params.srq_id = srq->srq_id; 1594 in_params.wqe_limit = attr->srq_limit; 1595 rc = dev->ops->rdma_modify_srq(dev->rdma_ctx, &in_params); 1596 if (rc) 1597 return rc; 1598 } 1599 1600 srq->srq_limit = attr->srq_limit; 1601 1602 DP_DEBUG(dev, QEDR_MSG_SRQ, 1603 "modify srq: modified srq with srq_id=0x%0x\n", srq->srq_id); 1604 1605 return 0; 1606 } 1607 1608 static inline void 1609 qedr_init_common_qp_in_params(struct qedr_dev *dev, 1610 struct qedr_pd *pd, 1611 struct qedr_qp *qp, 1612 struct ib_qp_init_attr *attrs, 1613 bool fmr_and_reserved_lkey, 1614 struct qed_rdma_create_qp_in_params *params) 1615 { 1616 /* QP handle to be written in an async event */ 1617 params->qp_handle_async_lo = lower_32_bits((uintptr_t) qp); 1618 params->qp_handle_async_hi = upper_32_bits((uintptr_t) qp); 1619 1620 params->signal_all = (attrs->sq_sig_type == IB_SIGNAL_ALL_WR); 1621 params->fmr_and_reserved_lkey = fmr_and_reserved_lkey; 1622 params->pd = pd->pd_id; 1623 params->dpi = pd->uctx ? pd->uctx->dpi : dev->dpi; 1624 params->sq_cq_id = get_qedr_cq(attrs->send_cq)->icid; 1625 params->stats_queue = 0; 1626 params->srq_id = 0; 1627 params->use_srq = false; 1628 1629 if (!qp->srq) { 1630 params->rq_cq_id = get_qedr_cq(attrs->recv_cq)->icid; 1631 1632 } else { 1633 params->rq_cq_id = get_qedr_cq(attrs->recv_cq)->icid; 1634 params->srq_id = qp->srq->srq_id; 1635 params->use_srq = true; 1636 } 1637 } 1638 1639 static inline void qedr_qp_user_print(struct qedr_dev *dev, struct qedr_qp *qp) 1640 { 1641 DP_DEBUG(dev, QEDR_MSG_QP, "create qp: successfully created user QP. " 1642 "qp=%p. 
" 1643 "sq_addr=0x%llx, " 1644 "sq_len=%zd, " 1645 "rq_addr=0x%llx, " 1646 "rq_len=%zd" 1647 "\n", 1648 qp, 1649 qp->usq.buf_addr, 1650 qp->usq.buf_len, qp->urq.buf_addr, qp->urq.buf_len); 1651 } 1652 1653 static int qedr_idr_add(struct qedr_dev *dev, struct qedr_idr *qidr, 1654 void *ptr, u32 id) 1655 { 1656 int rc; 1657 1658 idr_preload(GFP_KERNEL); 1659 spin_lock_irq(&qidr->idr_lock); 1660 1661 rc = idr_alloc(&qidr->idr, ptr, id, id + 1, GFP_ATOMIC); 1662 1663 spin_unlock_irq(&qidr->idr_lock); 1664 idr_preload_end(); 1665 1666 return rc < 0 ? rc : 0; 1667 } 1668 1669 static void qedr_idr_remove(struct qedr_dev *dev, struct qedr_idr *qidr, u32 id) 1670 { 1671 spin_lock_irq(&qidr->idr_lock); 1672 idr_remove(&qidr->idr, id); 1673 spin_unlock_irq(&qidr->idr_lock); 1674 } 1675 1676 static inline void 1677 qedr_iwarp_populate_user_qp(struct qedr_dev *dev, 1678 struct qedr_qp *qp, 1679 struct qed_rdma_create_qp_out_params *out_params) 1680 { 1681 qp->usq.pbl_tbl->va = out_params->sq_pbl_virt; 1682 qp->usq.pbl_tbl->pa = out_params->sq_pbl_phys; 1683 1684 qedr_populate_pbls(dev, qp->usq.umem, qp->usq.pbl_tbl, 1685 &qp->usq.pbl_info, FW_PAGE_SHIFT); 1686 if (!qp->srq) { 1687 qp->urq.pbl_tbl->va = out_params->rq_pbl_virt; 1688 qp->urq.pbl_tbl->pa = out_params->rq_pbl_phys; 1689 } 1690 1691 qedr_populate_pbls(dev, qp->urq.umem, qp->urq.pbl_tbl, 1692 &qp->urq.pbl_info, FW_PAGE_SHIFT); 1693 } 1694 1695 static void qedr_cleanup_user(struct qedr_dev *dev, struct qedr_qp *qp) 1696 { 1697 if (qp->usq.umem) 1698 ib_umem_release(qp->usq.umem); 1699 qp->usq.umem = NULL; 1700 1701 if (qp->urq.umem) 1702 ib_umem_release(qp->urq.umem); 1703 qp->urq.umem = NULL; 1704 } 1705 1706 static int qedr_create_user_qp(struct qedr_dev *dev, 1707 struct qedr_qp *qp, 1708 struct ib_pd *ibpd, 1709 struct ib_udata *udata, 1710 struct ib_qp_init_attr *attrs) 1711 { 1712 struct qed_rdma_create_qp_in_params in_params; 1713 struct qed_rdma_create_qp_out_params out_params; 1714 struct qedr_pd *pd = get_qedr_pd(ibpd); 1715 struct ib_ucontext *ib_ctx = NULL; 1716 struct qedr_create_qp_ureq ureq; 1717 int alloc_and_init = rdma_protocol_roce(&dev->ibdev, 1); 1718 int rc = -EINVAL; 1719 1720 ib_ctx = ibpd->uobject->context; 1721 1722 memset(&ureq, 0, sizeof(ureq)); 1723 rc = ib_copy_from_udata(&ureq, udata, sizeof(ureq)); 1724 if (rc) { 1725 DP_ERR(dev, "Problem copying data from user space\n"); 1726 return rc; 1727 } 1728 1729 /* SQ - read access only (0), dma sync not required (0) */ 1730 rc = qedr_init_user_queue(ib_ctx, dev, &qp->usq, ureq.sq_addr, 1731 ureq.sq_len, 0, 0, alloc_and_init); 1732 if (rc) 1733 return rc; 1734 1735 if (!qp->srq) { 1736 /* RQ - read access only (0), dma sync not required (0) */ 1737 rc = qedr_init_user_queue(ib_ctx, dev, &qp->urq, ureq.rq_addr, 1738 ureq.rq_len, 0, 0, alloc_and_init); 1739 if (rc) 1740 return rc; 1741 } 1742 1743 memset(&in_params, 0, sizeof(in_params)); 1744 qedr_init_common_qp_in_params(dev, pd, qp, attrs, false, &in_params); 1745 in_params.qp_handle_lo = ureq.qp_handle_lo; 1746 in_params.qp_handle_hi = ureq.qp_handle_hi; 1747 in_params.sq_num_pages = qp->usq.pbl_info.num_pbes; 1748 in_params.sq_pbl_ptr = qp->usq.pbl_tbl->pa; 1749 if (!qp->srq) { 1750 in_params.rq_num_pages = qp->urq.pbl_info.num_pbes; 1751 in_params.rq_pbl_ptr = qp->urq.pbl_tbl->pa; 1752 } 1753 1754 qp->qed_qp = dev->ops->rdma_create_qp(dev->rdma_ctx, 1755 &in_params, &out_params); 1756 1757 if (!qp->qed_qp) { 1758 rc = -ENOMEM; 1759 goto err1; 1760 } 1761 1762 if (rdma_protocol_iwarp(&dev->ibdev, 1)) 1763 
qedr_iwarp_populate_user_qp(dev, qp, &out_params); 1764 1765 qp->qp_id = out_params.qp_id; 1766 qp->icid = out_params.icid; 1767 1768 rc = qedr_copy_qp_uresp(dev, qp, udata); 1769 if (rc) 1770 goto err; 1771 1772 qedr_qp_user_print(dev, qp); 1773 1774 return 0; 1775 err: 1776 rc = dev->ops->rdma_destroy_qp(dev->rdma_ctx, qp->qed_qp); 1777 if (rc) 1778 DP_ERR(dev, "create qp: fatal fault. rc=%d", rc); 1779 1780 err1: 1781 qedr_cleanup_user(dev, qp); 1782 return rc; 1783 } 1784 1785 static void qedr_set_iwarp_db_info(struct qedr_dev *dev, struct qedr_qp *qp) 1786 { 1787 qp->sq.db = dev->db_addr + 1788 DB_ADDR_SHIFT(DQ_PWM_OFFSET_XCM_RDMA_SQ_PROD); 1789 qp->sq.db_data.data.icid = qp->icid; 1790 1791 qp->rq.db = dev->db_addr + 1792 DB_ADDR_SHIFT(DQ_PWM_OFFSET_TCM_IWARP_RQ_PROD); 1793 qp->rq.db_data.data.icid = qp->icid; 1794 qp->rq.iwarp_db2 = dev->db_addr + 1795 DB_ADDR_SHIFT(DQ_PWM_OFFSET_TCM_FLAGS); 1796 qp->rq.iwarp_db2_data.data.icid = qp->icid; 1797 qp->rq.iwarp_db2_data.data.value = DQ_TCM_IWARP_POST_RQ_CF_CMD; 1798 } 1799 1800 static int 1801 qedr_roce_create_kernel_qp(struct qedr_dev *dev, 1802 struct qedr_qp *qp, 1803 struct qed_rdma_create_qp_in_params *in_params, 1804 u32 n_sq_elems, u32 n_rq_elems) 1805 { 1806 struct qed_rdma_create_qp_out_params out_params; 1807 int rc; 1808 1809 rc = dev->ops->common->chain_alloc(dev->cdev, 1810 QED_CHAIN_USE_TO_PRODUCE, 1811 QED_CHAIN_MODE_PBL, 1812 QED_CHAIN_CNT_TYPE_U32, 1813 n_sq_elems, 1814 QEDR_SQE_ELEMENT_SIZE, 1815 &qp->sq.pbl, NULL); 1816 1817 if (rc) 1818 return rc; 1819 1820 in_params->sq_num_pages = qed_chain_get_page_cnt(&qp->sq.pbl); 1821 in_params->sq_pbl_ptr = qed_chain_get_pbl_phys(&qp->sq.pbl); 1822 1823 rc = dev->ops->common->chain_alloc(dev->cdev, 1824 QED_CHAIN_USE_TO_CONSUME_PRODUCE, 1825 QED_CHAIN_MODE_PBL, 1826 QED_CHAIN_CNT_TYPE_U32, 1827 n_rq_elems, 1828 QEDR_RQE_ELEMENT_SIZE, 1829 &qp->rq.pbl, NULL); 1830 if (rc) 1831 return rc; 1832 1833 in_params->rq_num_pages = qed_chain_get_page_cnt(&qp->rq.pbl); 1834 in_params->rq_pbl_ptr = qed_chain_get_pbl_phys(&qp->rq.pbl); 1835 1836 qp->qed_qp = dev->ops->rdma_create_qp(dev->rdma_ctx, 1837 in_params, &out_params); 1838 1839 if (!qp->qed_qp) 1840 return -EINVAL; 1841 1842 qp->qp_id = out_params.qp_id; 1843 qp->icid = out_params.icid; 1844 1845 qedr_set_roce_db_info(dev, qp); 1846 return rc; 1847 } 1848 1849 static int 1850 qedr_iwarp_create_kernel_qp(struct qedr_dev *dev, 1851 struct qedr_qp *qp, 1852 struct qed_rdma_create_qp_in_params *in_params, 1853 u32 n_sq_elems, u32 n_rq_elems) 1854 { 1855 struct qed_rdma_create_qp_out_params out_params; 1856 struct qed_chain_ext_pbl ext_pbl; 1857 int rc; 1858 1859 in_params->sq_num_pages = QED_CHAIN_PAGE_CNT(n_sq_elems, 1860 QEDR_SQE_ELEMENT_SIZE, 1861 QED_CHAIN_MODE_PBL); 1862 in_params->rq_num_pages = QED_CHAIN_PAGE_CNT(n_rq_elems, 1863 QEDR_RQE_ELEMENT_SIZE, 1864 QED_CHAIN_MODE_PBL); 1865 1866 qp->qed_qp = dev->ops->rdma_create_qp(dev->rdma_ctx, 1867 in_params, &out_params); 1868 1869 if (!qp->qed_qp) 1870 return -EINVAL; 1871 1872 /* Now we allocate the chain */ 1873 ext_pbl.p_pbl_virt = out_params.sq_pbl_virt; 1874 ext_pbl.p_pbl_phys = out_params.sq_pbl_phys; 1875 1876 rc = dev->ops->common->chain_alloc(dev->cdev, 1877 QED_CHAIN_USE_TO_PRODUCE, 1878 QED_CHAIN_MODE_PBL, 1879 QED_CHAIN_CNT_TYPE_U32, 1880 n_sq_elems, 1881 QEDR_SQE_ELEMENT_SIZE, 1882 &qp->sq.pbl, &ext_pbl); 1883 1884 if (rc) 1885 goto err; 1886 1887 ext_pbl.p_pbl_virt = out_params.rq_pbl_virt; 1888 ext_pbl.p_pbl_phys = out_params.rq_pbl_phys; 1889 1890 rc = 
dev->ops->common->chain_alloc(dev->cdev, 1891 QED_CHAIN_USE_TO_CONSUME_PRODUCE, 1892 QED_CHAIN_MODE_PBL, 1893 QED_CHAIN_CNT_TYPE_U32, 1894 n_rq_elems, 1895 QEDR_RQE_ELEMENT_SIZE, 1896 &qp->rq.pbl, &ext_pbl); 1897 1898 if (rc) 1899 goto err; 1900 1901 qp->qp_id = out_params.qp_id; 1902 qp->icid = out_params.icid; 1903 1904 qedr_set_iwarp_db_info(dev, qp); 1905 return rc; 1906 1907 err: 1908 dev->ops->rdma_destroy_qp(dev->rdma_ctx, qp->qed_qp); 1909 1910 return rc; 1911 } 1912 1913 static void qedr_cleanup_kernel(struct qedr_dev *dev, struct qedr_qp *qp) 1914 { 1915 dev->ops->common->chain_free(dev->cdev, &qp->sq.pbl); 1916 kfree(qp->wqe_wr_id); 1917 1918 dev->ops->common->chain_free(dev->cdev, &qp->rq.pbl); 1919 kfree(qp->rqe_wr_id); 1920 } 1921 1922 static int qedr_create_kernel_qp(struct qedr_dev *dev, 1923 struct qedr_qp *qp, 1924 struct ib_pd *ibpd, 1925 struct ib_qp_init_attr *attrs) 1926 { 1927 struct qed_rdma_create_qp_in_params in_params; 1928 struct qedr_pd *pd = get_qedr_pd(ibpd); 1929 int rc = -EINVAL; 1930 u32 n_rq_elems; 1931 u32 n_sq_elems; 1932 u32 n_sq_entries; 1933 1934 memset(&in_params, 0, sizeof(in_params)); 1935 1936 /* A single work request may take up to QEDR_MAX_SQ_WQE_SIZE elements in 1937 * the ring. The ring should allow at least a single WR, even if the 1938 * user requested none, due to allocation issues. 1939 * We should add an extra WR since the prod and cons indices of 1940 * wqe_wr_id are managed in such a way that the WQ is considered full 1941 * when (prod+1)%max_wr==cons. We currently don't do that because we 1942 * double the number of entries due an iSER issue that pushes far more 1943 * WRs than indicated. If we decline its ib_post_send() then we get 1944 * error prints in the dmesg we'd like to avoid. 1945 */ 1946 qp->sq.max_wr = min_t(u32, attrs->cap.max_send_wr * dev->wq_multiplier, 1947 dev->attr.max_sqe); 1948 1949 qp->wqe_wr_id = kcalloc(qp->sq.max_wr, sizeof(*qp->wqe_wr_id), 1950 GFP_KERNEL); 1951 if (!qp->wqe_wr_id) { 1952 DP_ERR(dev, "create qp: failed SQ shadow memory allocation\n"); 1953 return -ENOMEM; 1954 } 1955 1956 /* QP handle to be written in CQE */ 1957 in_params.qp_handle_lo = lower_32_bits((uintptr_t) qp); 1958 in_params.qp_handle_hi = upper_32_bits((uintptr_t) qp); 1959 1960 /* A single work request may take up to QEDR_MAX_RQ_WQE_SIZE elements in 1961 * the ring. There ring should allow at least a single WR, even if the 1962 * user requested none, due to allocation issues. 
1963 */ 1964 qp->rq.max_wr = (u16) max_t(u32, attrs->cap.max_recv_wr, 1); 1965 1966 /* Allocate driver internal RQ array */ 1967 qp->rqe_wr_id = kcalloc(qp->rq.max_wr, sizeof(*qp->rqe_wr_id), 1968 GFP_KERNEL); 1969 if (!qp->rqe_wr_id) { 1970 DP_ERR(dev, 1971 "create qp: failed RQ shadow memory allocation\n"); 1972 kfree(qp->wqe_wr_id); 1973 return -ENOMEM; 1974 } 1975 1976 qedr_init_common_qp_in_params(dev, pd, qp, attrs, true, &in_params); 1977 1978 n_sq_entries = attrs->cap.max_send_wr; 1979 n_sq_entries = min_t(u32, n_sq_entries, dev->attr.max_sqe); 1980 n_sq_entries = max_t(u32, n_sq_entries, 1); 1981 n_sq_elems = n_sq_entries * QEDR_MAX_SQE_ELEMENTS_PER_SQE; 1982 1983 n_rq_elems = qp->rq.max_wr * QEDR_MAX_RQE_ELEMENTS_PER_RQE; 1984 1985 if (rdma_protocol_iwarp(&dev->ibdev, 1)) 1986 rc = qedr_iwarp_create_kernel_qp(dev, qp, &in_params, 1987 n_sq_elems, n_rq_elems); 1988 else 1989 rc = qedr_roce_create_kernel_qp(dev, qp, &in_params, 1990 n_sq_elems, n_rq_elems); 1991 if (rc) 1992 qedr_cleanup_kernel(dev, qp); 1993 1994 return rc; 1995 } 1996 1997 struct ib_qp *qedr_create_qp(struct ib_pd *ibpd, 1998 struct ib_qp_init_attr *attrs, 1999 struct ib_udata *udata) 2000 { 2001 struct qedr_dev *dev = get_qedr_dev(ibpd->device); 2002 struct qedr_pd *pd = get_qedr_pd(ibpd); 2003 struct qedr_qp *qp; 2004 struct ib_qp *ibqp; 2005 int rc = 0; 2006 2007 DP_DEBUG(dev, QEDR_MSG_QP, "create qp: called from %s, pd=%p\n", 2008 udata ? "user library" : "kernel", pd); 2009 2010 rc = qedr_check_qp_attrs(ibpd, dev, attrs); 2011 if (rc) 2012 return ERR_PTR(rc); 2013 2014 DP_DEBUG(dev, QEDR_MSG_QP, 2015 "create qp: called from %s, event_handler=%p, eepd=%p sq_cq=%p, sq_icid=%d, rq_cq=%p, rq_icid=%d\n", 2016 udata ? "user library" : "kernel", attrs->event_handler, pd, 2017 get_qedr_cq(attrs->send_cq), 2018 get_qedr_cq(attrs->send_cq)->icid, 2019 get_qedr_cq(attrs->recv_cq), 2020 attrs->recv_cq ? 
get_qedr_cq(attrs->recv_cq)->icid : 0); 2021 2022 qp = kzalloc(sizeof(*qp), GFP_KERNEL); 2023 if (!qp) { 2024 DP_ERR(dev, "create qp: failed allocating memory\n"); 2025 return ERR_PTR(-ENOMEM); 2026 } 2027 2028 qedr_set_common_qp_params(dev, qp, pd, attrs); 2029 2030 if (attrs->qp_type == IB_QPT_GSI) { 2031 ibqp = qedr_create_gsi_qp(dev, attrs, qp); 2032 if (IS_ERR(ibqp)) 2033 kfree(qp); 2034 return ibqp; 2035 } 2036 2037 if (udata) 2038 rc = qedr_create_user_qp(dev, qp, ibpd, udata, attrs); 2039 else 2040 rc = qedr_create_kernel_qp(dev, qp, ibpd, attrs); 2041 2042 if (rc) 2043 goto err; 2044 2045 qp->ibqp.qp_num = qp->qp_id; 2046 2047 if (rdma_protocol_iwarp(&dev->ibdev, 1)) { 2048 rc = qedr_idr_add(dev, &dev->qpidr, qp, qp->qp_id); 2049 if (rc) 2050 goto err; 2051 } 2052 2053 return &qp->ibqp; 2054 2055 err: 2056 kfree(qp); 2057 2058 return ERR_PTR(-EFAULT); 2059 } 2060 2061 static enum ib_qp_state qedr_get_ibqp_state(enum qed_roce_qp_state qp_state) 2062 { 2063 switch (qp_state) { 2064 case QED_ROCE_QP_STATE_RESET: 2065 return IB_QPS_RESET; 2066 case QED_ROCE_QP_STATE_INIT: 2067 return IB_QPS_INIT; 2068 case QED_ROCE_QP_STATE_RTR: 2069 return IB_QPS_RTR; 2070 case QED_ROCE_QP_STATE_RTS: 2071 return IB_QPS_RTS; 2072 case QED_ROCE_QP_STATE_SQD: 2073 return IB_QPS_SQD; 2074 case QED_ROCE_QP_STATE_ERR: 2075 return IB_QPS_ERR; 2076 case QED_ROCE_QP_STATE_SQE: 2077 return IB_QPS_SQE; 2078 } 2079 return IB_QPS_ERR; 2080 } 2081 2082 static enum qed_roce_qp_state qedr_get_state_from_ibqp( 2083 enum ib_qp_state qp_state) 2084 { 2085 switch (qp_state) { 2086 case IB_QPS_RESET: 2087 return QED_ROCE_QP_STATE_RESET; 2088 case IB_QPS_INIT: 2089 return QED_ROCE_QP_STATE_INIT; 2090 case IB_QPS_RTR: 2091 return QED_ROCE_QP_STATE_RTR; 2092 case IB_QPS_RTS: 2093 return QED_ROCE_QP_STATE_RTS; 2094 case IB_QPS_SQD: 2095 return QED_ROCE_QP_STATE_SQD; 2096 case IB_QPS_ERR: 2097 return QED_ROCE_QP_STATE_ERR; 2098 default: 2099 return QED_ROCE_QP_STATE_ERR; 2100 } 2101 } 2102 2103 static void qedr_reset_qp_hwq_info(struct qedr_qp_hwq_info *qph) 2104 { 2105 qed_chain_reset(&qph->pbl); 2106 qph->prod = 0; 2107 qph->cons = 0; 2108 qph->wqe_cons = 0; 2109 qph->db_data.data.value = cpu_to_le16(0); 2110 } 2111 2112 static int qedr_update_qp_state(struct qedr_dev *dev, 2113 struct qedr_qp *qp, 2114 enum qed_roce_qp_state cur_state, 2115 enum qed_roce_qp_state new_state) 2116 { 2117 int status = 0; 2118 2119 if (new_state == cur_state) 2120 return 0; 2121 2122 switch (cur_state) { 2123 case QED_ROCE_QP_STATE_RESET: 2124 switch (new_state) { 2125 case QED_ROCE_QP_STATE_INIT: 2126 qp->prev_wqe_size = 0; 2127 qedr_reset_qp_hwq_info(&qp->sq); 2128 qedr_reset_qp_hwq_info(&qp->rq); 2129 break; 2130 default: 2131 status = -EINVAL; 2132 break; 2133 }; 2134 break; 2135 case QED_ROCE_QP_STATE_INIT: 2136 switch (new_state) { 2137 case QED_ROCE_QP_STATE_RTR: 2138 /* Update doorbell (in case post_recv was 2139 * done before move to RTR) 2140 */ 2141 2142 if (rdma_protocol_roce(&dev->ibdev, 1)) { 2143 writel(qp->rq.db_data.raw, qp->rq.db); 2144 /* Make sure write takes effect */ 2145 mmiowb(); 2146 } 2147 break; 2148 case QED_ROCE_QP_STATE_ERR: 2149 break; 2150 default: 2151 /* Invalid state change. */ 2152 status = -EINVAL; 2153 break; 2154 }; 2155 break; 2156 case QED_ROCE_QP_STATE_RTR: 2157 /* RTR->XXX */ 2158 switch (new_state) { 2159 case QED_ROCE_QP_STATE_RTS: 2160 break; 2161 case QED_ROCE_QP_STATE_ERR: 2162 break; 2163 default: 2164 /* Invalid state change. 
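 * Only the RTR->RTS and RTR->ERR transitions are accepted here.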
*/ 2165 status = -EINVAL; 2166 break; 2167 }; 2168 break; 2169 case QED_ROCE_QP_STATE_RTS: 2170 /* RTS->XXX */ 2171 switch (new_state) { 2172 case QED_ROCE_QP_STATE_SQD: 2173 break; 2174 case QED_ROCE_QP_STATE_ERR: 2175 break; 2176 default: 2177 /* Invalid state change. */ 2178 status = -EINVAL; 2179 break; 2180 }; 2181 break; 2182 case QED_ROCE_QP_STATE_SQD: 2183 /* SQD->XXX */ 2184 switch (new_state) { 2185 case QED_ROCE_QP_STATE_RTS: 2186 case QED_ROCE_QP_STATE_ERR: 2187 break; 2188 default: 2189 /* Invalid state change. */ 2190 status = -EINVAL; 2191 break; 2192 }; 2193 break; 2194 case QED_ROCE_QP_STATE_ERR: 2195 /* ERR->XXX */ 2196 switch (new_state) { 2197 case QED_ROCE_QP_STATE_RESET: 2198 if ((qp->rq.prod != qp->rq.cons) || 2199 (qp->sq.prod != qp->sq.cons)) { 2200 DP_NOTICE(dev, 2201 "Error->Reset with rq/sq not empty rq.prod=%x rq.cons=%x sq.prod=%x sq.cons=%x\n", 2202 qp->rq.prod, qp->rq.cons, qp->sq.prod, 2203 qp->sq.cons); 2204 status = -EINVAL; 2205 } 2206 break; 2207 default: 2208 status = -EINVAL; 2209 break; 2210 }; 2211 break; 2212 default: 2213 status = -EINVAL; 2214 break; 2215 }; 2216 2217 return status; 2218 } 2219 2220 int qedr_modify_qp(struct ib_qp *ibqp, struct ib_qp_attr *attr, 2221 int attr_mask, struct ib_udata *udata) 2222 { 2223 struct qedr_qp *qp = get_qedr_qp(ibqp); 2224 struct qed_rdma_modify_qp_in_params qp_params = { 0 }; 2225 struct qedr_dev *dev = get_qedr_dev(&qp->dev->ibdev); 2226 const struct ib_global_route *grh = rdma_ah_read_grh(&attr->ah_attr); 2227 enum ib_qp_state old_qp_state, new_qp_state; 2228 enum qed_roce_qp_state cur_state; 2229 int rc = 0; 2230 2231 DP_DEBUG(dev, QEDR_MSG_QP, 2232 "modify qp: qp %p attr_mask=0x%x, state=%d", qp, attr_mask, 2233 attr->qp_state); 2234 2235 old_qp_state = qedr_get_ibqp_state(qp->state); 2236 if (attr_mask & IB_QP_STATE) 2237 new_qp_state = attr->qp_state; 2238 else 2239 new_qp_state = old_qp_state; 2240 2241 if (rdma_protocol_roce(&dev->ibdev, 1)) { 2242 if (!ib_modify_qp_is_ok(old_qp_state, new_qp_state, 2243 ibqp->qp_type, attr_mask, 2244 IB_LINK_LAYER_ETHERNET)) { 2245 DP_ERR(dev, 2246 "modify qp: invalid attribute mask=0x%x specified for\n" 2247 "qpn=0x%x of type=0x%x old_qp_state=0x%x, new_qp_state=0x%x\n", 2248 attr_mask, qp->qp_id, ibqp->qp_type, 2249 old_qp_state, new_qp_state); 2250 rc = -EINVAL; 2251 goto err; 2252 } 2253 } 2254 2255 /* Translate the masks... 
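 * Each IB_QP_* bit set in attr_mask is translated below into the matching
 * QED_*_MODIFY_QP_VALID_* flag and field of qp_params.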
*/ 2256 if (attr_mask & IB_QP_STATE) { 2257 SET_FIELD(qp_params.modify_flags, 2258 QED_RDMA_MODIFY_QP_VALID_NEW_STATE, 1); 2259 qp_params.new_state = qedr_get_state_from_ibqp(attr->qp_state); 2260 } 2261 2262 if (attr_mask & IB_QP_EN_SQD_ASYNC_NOTIFY) 2263 qp_params.sqd_async = true; 2264 2265 if (attr_mask & IB_QP_PKEY_INDEX) { 2266 SET_FIELD(qp_params.modify_flags, 2267 QED_ROCE_MODIFY_QP_VALID_PKEY, 1); 2268 if (attr->pkey_index >= QEDR_ROCE_PKEY_TABLE_LEN) { 2269 rc = -EINVAL; 2270 goto err; 2271 } 2272 2273 qp_params.pkey = QEDR_ROCE_PKEY_DEFAULT; 2274 } 2275 2276 if (attr_mask & IB_QP_QKEY) 2277 qp->qkey = attr->qkey; 2278 2279 if (attr_mask & IB_QP_ACCESS_FLAGS) { 2280 SET_FIELD(qp_params.modify_flags, 2281 QED_RDMA_MODIFY_QP_VALID_RDMA_OPS_EN, 1); 2282 qp_params.incoming_rdma_read_en = attr->qp_access_flags & 2283 IB_ACCESS_REMOTE_READ; 2284 qp_params.incoming_rdma_write_en = attr->qp_access_flags & 2285 IB_ACCESS_REMOTE_WRITE; 2286 qp_params.incoming_atomic_en = attr->qp_access_flags & 2287 IB_ACCESS_REMOTE_ATOMIC; 2288 } 2289 2290 if (attr_mask & (IB_QP_AV | IB_QP_PATH_MTU)) { 2291 if (rdma_protocol_iwarp(&dev->ibdev, 1)) 2292 return -EINVAL; 2293 2294 if (attr_mask & IB_QP_PATH_MTU) { 2295 if (attr->path_mtu < IB_MTU_256 || 2296 attr->path_mtu > IB_MTU_4096) { 2297 pr_err("error: Only MTU sizes of 256, 512, 1024, 2048 and 4096 are supported by RoCE\n"); 2298 rc = -EINVAL; 2299 goto err; 2300 } 2301 qp->mtu = min(ib_mtu_enum_to_int(attr->path_mtu), 2302 ib_mtu_enum_to_int(iboe_get_mtu 2303 (dev->ndev->mtu))); 2304 } 2305 2306 if (!qp->mtu) { 2307 qp->mtu = 2308 ib_mtu_enum_to_int(iboe_get_mtu(dev->ndev->mtu)); 2309 pr_err("Fixing zeroed MTU to qp->mtu = %d\n", qp->mtu); 2310 } 2311 2312 SET_FIELD(qp_params.modify_flags, 2313 QED_ROCE_MODIFY_QP_VALID_ADDRESS_VECTOR, 1); 2314 2315 qp_params.traffic_class_tos = grh->traffic_class; 2316 qp_params.flow_label = grh->flow_label; 2317 qp_params.hop_limit_ttl = grh->hop_limit; 2318 2319 qp->sgid_idx = grh->sgid_index; 2320 2321 rc = get_gid_info_from_table(ibqp, attr, attr_mask, &qp_params); 2322 if (rc) { 2323 DP_ERR(dev, 2324 "modify qp: problems with GID index %d (rc=%d)\n", 2325 grh->sgid_index, rc); 2326 return rc; 2327 } 2328 2329 rc = qedr_get_dmac(dev, &attr->ah_attr, 2330 qp_params.remote_mac_addr); 2331 if (rc) 2332 return rc; 2333 2334 qp_params.use_local_mac = true; 2335 ether_addr_copy(qp_params.local_mac_addr, dev->ndev->dev_addr); 2336 2337 DP_DEBUG(dev, QEDR_MSG_QP, "dgid=%x:%x:%x:%x\n", 2338 qp_params.dgid.dwords[0], qp_params.dgid.dwords[1], 2339 qp_params.dgid.dwords[2], qp_params.dgid.dwords[3]); 2340 DP_DEBUG(dev, QEDR_MSG_QP, "sgid=%x:%x:%x:%x\n", 2341 qp_params.sgid.dwords[0], qp_params.sgid.dwords[1], 2342 qp_params.sgid.dwords[2], qp_params.sgid.dwords[3]); 2343 DP_DEBUG(dev, QEDR_MSG_QP, "remote_mac=[%pM]\n", 2344 qp_params.remote_mac_addr); 2345 2346 qp_params.mtu = qp->mtu; 2347 qp_params.lb_indication = false; 2348 } 2349 2350 if (!qp_params.mtu) { 2351 /* Stay with current MTU */ 2352 if (qp->mtu) 2353 qp_params.mtu = qp->mtu; 2354 else 2355 qp_params.mtu = 2356 ib_mtu_enum_to_int(iboe_get_mtu(dev->ndev->mtu)); 2357 } 2358 2359 if (attr_mask & IB_QP_TIMEOUT) { 2360 SET_FIELD(qp_params.modify_flags, 2361 QED_ROCE_MODIFY_QP_VALID_ACK_TIMEOUT, 1); 2362 2363 /* The received timeout value is an exponent used like this: 2364 * "12.7.34 LOCAL ACK TIMEOUT 2365 * Value representing the transport (ACK) timeout for use by 2366 * the remote, expressed as: 4.096 * 2^timeout [usec]" 2367 * The FW expects timeout in msec so 
we need to divide the usec
	 * result by 1000. We'll approximate 1000~2^10, and 4.096 ~ 2^2,
	 * so we get: 2^2 * 2^timeout / 2^10 = 2^(timeout - 8).
	 * The value of zero means infinite so we use a 'max_t' to make
	 * sure that sub 1 msec values will be configured as 1 msec.
	 */
		if (attr->timeout)
			qp_params.ack_timeout =
					1 << max_t(int, attr->timeout - 8, 0);
		else
			qp_params.ack_timeout = 0;
	}

	if (attr_mask & IB_QP_RETRY_CNT) {
		SET_FIELD(qp_params.modify_flags,
			  QED_ROCE_MODIFY_QP_VALID_RETRY_CNT, 1);
		qp_params.retry_cnt = attr->retry_cnt;
	}

	if (attr_mask & IB_QP_RNR_RETRY) {
		SET_FIELD(qp_params.modify_flags,
			  QED_ROCE_MODIFY_QP_VALID_RNR_RETRY_CNT, 1);
		qp_params.rnr_retry_cnt = attr->rnr_retry;
	}

	if (attr_mask & IB_QP_RQ_PSN) {
		SET_FIELD(qp_params.modify_flags,
			  QED_ROCE_MODIFY_QP_VALID_RQ_PSN, 1);
		qp_params.rq_psn = attr->rq_psn;
		qp->rq_psn = attr->rq_psn;
	}

	if (attr_mask & IB_QP_MAX_QP_RD_ATOMIC) {
		if (attr->max_rd_atomic > dev->attr.max_qp_req_rd_atomic_resc) {
			rc = -EINVAL;
			DP_ERR(dev,
			       "unsupported max_rd_atomic=%d, supported=%d\n",
			       attr->max_rd_atomic,
			       dev->attr.max_qp_req_rd_atomic_resc);
			goto err;
		}

		SET_FIELD(qp_params.modify_flags,
			  QED_RDMA_MODIFY_QP_VALID_MAX_RD_ATOMIC_REQ, 1);
		qp_params.max_rd_atomic_req = attr->max_rd_atomic;
	}

	if (attr_mask & IB_QP_MIN_RNR_TIMER) {
		SET_FIELD(qp_params.modify_flags,
			  QED_ROCE_MODIFY_QP_VALID_MIN_RNR_NAK_TIMER, 1);
		qp_params.min_rnr_nak_timer = attr->min_rnr_timer;
	}

	if (attr_mask & IB_QP_SQ_PSN) {
		SET_FIELD(qp_params.modify_flags,
			  QED_ROCE_MODIFY_QP_VALID_SQ_PSN, 1);
		qp_params.sq_psn = attr->sq_psn;
		qp->sq_psn = attr->sq_psn;
	}

	if (attr_mask & IB_QP_MAX_DEST_RD_ATOMIC) {
		if (attr->max_dest_rd_atomic >
		    dev->attr.max_qp_resp_rd_atomic_resc) {
			DP_ERR(dev,
			       "unsupported max_dest_rd_atomic=%d, supported=%d\n",
			       attr->max_dest_rd_atomic,
			       dev->attr.max_qp_resp_rd_atomic_resc);

			rc = -EINVAL;
			goto err;
		}

		SET_FIELD(qp_params.modify_flags,
			  QED_RDMA_MODIFY_QP_VALID_MAX_RD_ATOMIC_RESP, 1);
		qp_params.max_rd_atomic_resp = attr->max_dest_rd_atomic;
	}

	if (attr_mask & IB_QP_DEST_QPN) {
		SET_FIELD(qp_params.modify_flags,
			  QED_ROCE_MODIFY_QP_VALID_DEST_QP, 1);

		qp_params.dest_qp = attr->dest_qp_num;
		qp->dest_qp_num = attr->dest_qp_num;
	}

	cur_state = qp->state;

	/* Update the QP state before the actual ramrod to prevent a race with
	 * fast path. Modifying the QP state to error will cause the device to
	 * flush the CQEs, and polling those flushed CQEs would be considered a
	 * potential issue if the QP isn't in the error state.
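	 * The software QP state is therefore moved to ERR below (for non-GSI
	 * kernel QPs) before the modify ramrod is issued, so qedr_poll_cq()
	 * already sees the QP in the error state when the flushed CQEs arrive.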
	 */
	if ((attr_mask & IB_QP_STATE) && qp->qp_type != IB_QPT_GSI &&
	    !udata && qp_params.new_state == QED_ROCE_QP_STATE_ERR)
		qp->state = QED_ROCE_QP_STATE_ERR;

	if (qp->qp_type != IB_QPT_GSI)
		rc = dev->ops->rdma_modify_qp(dev->rdma_ctx,
					      qp->qed_qp, &qp_params);

	if (attr_mask & IB_QP_STATE) {
		if ((qp->qp_type != IB_QPT_GSI) && (!udata))
			rc = qedr_update_qp_state(dev, qp, cur_state,
						  qp_params.new_state);
		qp->state = qp_params.new_state;
	}

err:
	return rc;
}

static int qedr_to_ib_qp_acc_flags(struct qed_rdma_query_qp_out_params *params)
{
	int ib_qp_acc_flags = 0;

	if (params->incoming_rdma_write_en)
		ib_qp_acc_flags |= IB_ACCESS_REMOTE_WRITE;
	if (params->incoming_rdma_read_en)
		ib_qp_acc_flags |= IB_ACCESS_REMOTE_READ;
	if (params->incoming_atomic_en)
		ib_qp_acc_flags |= IB_ACCESS_REMOTE_ATOMIC;
	ib_qp_acc_flags |= IB_ACCESS_LOCAL_WRITE;
	return ib_qp_acc_flags;
}

int qedr_query_qp(struct ib_qp *ibqp,
		  struct ib_qp_attr *qp_attr,
		  int attr_mask, struct ib_qp_init_attr *qp_init_attr)
{
	struct qed_rdma_query_qp_out_params params;
	struct qedr_qp *qp = get_qedr_qp(ibqp);
	struct qedr_dev *dev = qp->dev;
	int rc = 0;

	memset(&params, 0, sizeof(params));

	rc = dev->ops->rdma_query_qp(dev->rdma_ctx, qp->qed_qp, &params);
	if (rc)
		goto err;

	memset(qp_attr, 0, sizeof(*qp_attr));
	memset(qp_init_attr, 0, sizeof(*qp_init_attr));

	qp_attr->qp_state = qedr_get_ibqp_state(params.state);
	qp_attr->cur_qp_state = qedr_get_ibqp_state(params.state);
	qp_attr->path_mtu = ib_mtu_int_to_enum(params.mtu);
	qp_attr->path_mig_state = IB_MIG_MIGRATED;
	qp_attr->rq_psn = params.rq_psn;
	qp_attr->sq_psn = params.sq_psn;
	qp_attr->dest_qp_num = params.dest_qp;

	qp_attr->qp_access_flags = qedr_to_ib_qp_acc_flags(&params);

	qp_attr->cap.max_send_wr = qp->sq.max_wr;
	qp_attr->cap.max_recv_wr = qp->rq.max_wr;
	qp_attr->cap.max_send_sge = qp->sq.max_sges;
	qp_attr->cap.max_recv_sge = qp->rq.max_sges;
	qp_attr->cap.max_inline_data = ROCE_REQ_MAX_INLINE_DATA_SIZE;
	qp_init_attr->cap = qp_attr->cap;

	qp_attr->ah_attr.type = RDMA_AH_ATTR_TYPE_ROCE;
	rdma_ah_set_grh(&qp_attr->ah_attr, NULL,
			params.flow_label, qp->sgid_idx,
			params.hop_limit_ttl, params.traffic_class_tos);
	rdma_ah_set_dgid_raw(&qp_attr->ah_attr, &params.dgid.bytes[0]);
	rdma_ah_set_port_num(&qp_attr->ah_attr, 1);
	rdma_ah_set_sl(&qp_attr->ah_attr, 0);
	qp_attr->timeout = params.timeout;
	qp_attr->rnr_retry = params.rnr_retry;
	qp_attr->retry_cnt = params.retry_cnt;
	qp_attr->min_rnr_timer = params.min_rnr_nak_timer;
	qp_attr->pkey_index = params.pkey_index;
	qp_attr->port_num = 1;
	rdma_ah_set_path_bits(&qp_attr->ah_attr, 0);
	rdma_ah_set_static_rate(&qp_attr->ah_attr, 0);
	qp_attr->alt_pkey_index = 0;
	qp_attr->alt_port_num = 0;
	qp_attr->alt_timeout = 0;
	memset(&qp_attr->alt_ah_attr, 0, sizeof(qp_attr->alt_ah_attr));

	qp_attr->sq_draining = (params.state == QED_ROCE_QP_STATE_SQD) ? 1 : 0;
	qp_attr->max_dest_rd_atomic = params.max_dest_rd_atomic;
	qp_attr->max_rd_atomic = params.max_rd_atomic;
	qp_attr->en_sqd_async_notify = (params.sqd_async) ?
1 : 0; 2551 2552 DP_DEBUG(dev, QEDR_MSG_QP, "QEDR_QUERY_QP: max_inline_data=%d\n", 2553 qp_attr->cap.max_inline_data); 2554 2555 err: 2556 return rc; 2557 } 2558 2559 static int qedr_free_qp_resources(struct qedr_dev *dev, struct qedr_qp *qp) 2560 { 2561 int rc = 0; 2562 2563 if (qp->qp_type != IB_QPT_GSI) { 2564 rc = dev->ops->rdma_destroy_qp(dev->rdma_ctx, qp->qed_qp); 2565 if (rc) 2566 return rc; 2567 } 2568 2569 if (qp->ibqp.uobject && qp->ibqp.uobject->context) 2570 qedr_cleanup_user(dev, qp); 2571 else 2572 qedr_cleanup_kernel(dev, qp); 2573 2574 return 0; 2575 } 2576 2577 int qedr_destroy_qp(struct ib_qp *ibqp) 2578 { 2579 struct qedr_qp *qp = get_qedr_qp(ibqp); 2580 struct qedr_dev *dev = qp->dev; 2581 struct ib_qp_attr attr; 2582 int attr_mask = 0; 2583 int rc = 0; 2584 2585 DP_DEBUG(dev, QEDR_MSG_QP, "destroy qp: destroying %p, qp type=%d\n", 2586 qp, qp->qp_type); 2587 2588 if (rdma_protocol_roce(&dev->ibdev, 1)) { 2589 if ((qp->state != QED_ROCE_QP_STATE_RESET) && 2590 (qp->state != QED_ROCE_QP_STATE_ERR) && 2591 (qp->state != QED_ROCE_QP_STATE_INIT)) { 2592 2593 attr.qp_state = IB_QPS_ERR; 2594 attr_mask |= IB_QP_STATE; 2595 2596 /* Change the QP state to ERROR */ 2597 qedr_modify_qp(ibqp, &attr, attr_mask, NULL); 2598 } 2599 } else { 2600 /* Wait for the connect/accept to complete */ 2601 if (qp->ep) { 2602 int wait_count = 1; 2603 2604 while (qp->ep->during_connect) { 2605 DP_DEBUG(dev, QEDR_MSG_QP, 2606 "Still in during connect/accept\n"); 2607 2608 msleep(100); 2609 if (wait_count++ > 200) { 2610 DP_NOTICE(dev, 2611 "during connect timeout\n"); 2612 break; 2613 } 2614 } 2615 } 2616 } 2617 2618 if (qp->qp_type == IB_QPT_GSI) 2619 qedr_destroy_gsi_qp(dev); 2620 2621 qedr_free_qp_resources(dev, qp); 2622 2623 if (atomic_dec_and_test(&qp->refcnt) && 2624 rdma_protocol_iwarp(&dev->ibdev, 1)) { 2625 qedr_idr_remove(dev, &dev->qpidr, qp->qp_id); 2626 kfree(qp); 2627 } 2628 return rc; 2629 } 2630 2631 struct ib_ah *qedr_create_ah(struct ib_pd *ibpd, struct rdma_ah_attr *attr, 2632 struct ib_udata *udata) 2633 { 2634 struct qedr_ah *ah; 2635 2636 ah = kzalloc(sizeof(*ah), GFP_ATOMIC); 2637 if (!ah) 2638 return ERR_PTR(-ENOMEM); 2639 2640 rdma_copy_ah_attr(&ah->attr, attr); 2641 2642 return &ah->ibah; 2643 } 2644 2645 int qedr_destroy_ah(struct ib_ah *ibah) 2646 { 2647 struct qedr_ah *ah = get_qedr_ah(ibah); 2648 2649 rdma_destroy_ah_attr(&ah->attr); 2650 kfree(ah); 2651 return 0; 2652 } 2653 2654 static void free_mr_info(struct qedr_dev *dev, struct mr_info *info) 2655 { 2656 struct qedr_pbl *pbl, *tmp; 2657 2658 if (info->pbl_table) 2659 list_add_tail(&info->pbl_table->list_entry, 2660 &info->free_pbl_list); 2661 2662 if (!list_empty(&info->inuse_pbl_list)) 2663 list_splice(&info->inuse_pbl_list, &info->free_pbl_list); 2664 2665 list_for_each_entry_safe(pbl, tmp, &info->free_pbl_list, list_entry) { 2666 list_del(&pbl->list_entry); 2667 qedr_free_pbl(dev, &info->pbl_info, pbl); 2668 } 2669 } 2670 2671 static int init_mr_info(struct qedr_dev *dev, struct mr_info *info, 2672 size_t page_list_len, bool two_layered) 2673 { 2674 struct qedr_pbl *tmp; 2675 int rc; 2676 2677 INIT_LIST_HEAD(&info->free_pbl_list); 2678 INIT_LIST_HEAD(&info->inuse_pbl_list); 2679 2680 rc = qedr_prepare_pbl_tbl(dev, &info->pbl_info, 2681 page_list_len, two_layered); 2682 if (rc) 2683 goto done; 2684 2685 info->pbl_table = qedr_alloc_pbl_tbl(dev, &info->pbl_info, GFP_KERNEL); 2686 if (IS_ERR(info->pbl_table)) { 2687 rc = PTR_ERR(info->pbl_table); 2688 goto done; 2689 } 2690 2691 DP_DEBUG(dev, QEDR_MSG_MR, 
"pbl_table_pa = %pa\n", 2692 &info->pbl_table->pa); 2693 2694 /* in usual case we use 2 PBLs, so we add one to free 2695 * list and allocating another one 2696 */ 2697 tmp = qedr_alloc_pbl_tbl(dev, &info->pbl_info, GFP_KERNEL); 2698 if (IS_ERR(tmp)) { 2699 DP_DEBUG(dev, QEDR_MSG_MR, "Extra PBL is not allocated\n"); 2700 goto done; 2701 } 2702 2703 list_add_tail(&tmp->list_entry, &info->free_pbl_list); 2704 2705 DP_DEBUG(dev, QEDR_MSG_MR, "extra pbl_table_pa = %pa\n", &tmp->pa); 2706 2707 done: 2708 if (rc) 2709 free_mr_info(dev, info); 2710 2711 return rc; 2712 } 2713 2714 struct ib_mr *qedr_reg_user_mr(struct ib_pd *ibpd, u64 start, u64 len, 2715 u64 usr_addr, int acc, struct ib_udata *udata) 2716 { 2717 struct qedr_dev *dev = get_qedr_dev(ibpd->device); 2718 struct qedr_mr *mr; 2719 struct qedr_pd *pd; 2720 int rc = -ENOMEM; 2721 2722 pd = get_qedr_pd(ibpd); 2723 DP_DEBUG(dev, QEDR_MSG_MR, 2724 "qedr_register user mr pd = %d start = %lld, len = %lld, usr_addr = %lld, acc = %d\n", 2725 pd->pd_id, start, len, usr_addr, acc); 2726 2727 if (acc & IB_ACCESS_REMOTE_WRITE && !(acc & IB_ACCESS_LOCAL_WRITE)) 2728 return ERR_PTR(-EINVAL); 2729 2730 mr = kzalloc(sizeof(*mr), GFP_KERNEL); 2731 if (!mr) 2732 return ERR_PTR(rc); 2733 2734 mr->type = QEDR_MR_USER; 2735 2736 mr->umem = ib_umem_get(ibpd->uobject->context, start, len, acc, 0); 2737 if (IS_ERR(mr->umem)) { 2738 rc = -EFAULT; 2739 goto err0; 2740 } 2741 2742 rc = init_mr_info(dev, &mr->info, ib_umem_page_count(mr->umem), 1); 2743 if (rc) 2744 goto err1; 2745 2746 qedr_populate_pbls(dev, mr->umem, mr->info.pbl_table, 2747 &mr->info.pbl_info, mr->umem->page_shift); 2748 2749 rc = dev->ops->rdma_alloc_tid(dev->rdma_ctx, &mr->hw_mr.itid); 2750 if (rc) { 2751 DP_ERR(dev, "roce alloc tid returned an error %d\n", rc); 2752 goto err1; 2753 } 2754 2755 /* Index only, 18 bit long, lkey = itid << 8 | key */ 2756 mr->hw_mr.tid_type = QED_RDMA_TID_REGISTERED_MR; 2757 mr->hw_mr.key = 0; 2758 mr->hw_mr.pd = pd->pd_id; 2759 mr->hw_mr.local_read = 1; 2760 mr->hw_mr.local_write = (acc & IB_ACCESS_LOCAL_WRITE) ? 1 : 0; 2761 mr->hw_mr.remote_read = (acc & IB_ACCESS_REMOTE_READ) ? 1 : 0; 2762 mr->hw_mr.remote_write = (acc & IB_ACCESS_REMOTE_WRITE) ? 1 : 0; 2763 mr->hw_mr.remote_atomic = (acc & IB_ACCESS_REMOTE_ATOMIC) ? 
1 : 0; 2764 mr->hw_mr.mw_bind = false; 2765 mr->hw_mr.pbl_ptr = mr->info.pbl_table[0].pa; 2766 mr->hw_mr.pbl_two_level = mr->info.pbl_info.two_layered; 2767 mr->hw_mr.pbl_page_size_log = ilog2(mr->info.pbl_info.pbl_size); 2768 mr->hw_mr.page_size_log = mr->umem->page_shift; 2769 mr->hw_mr.fbo = ib_umem_offset(mr->umem); 2770 mr->hw_mr.length = len; 2771 mr->hw_mr.vaddr = usr_addr; 2772 mr->hw_mr.zbva = false; 2773 mr->hw_mr.phy_mr = false; 2774 mr->hw_mr.dma_mr = false; 2775 2776 rc = dev->ops->rdma_register_tid(dev->rdma_ctx, &mr->hw_mr); 2777 if (rc) { 2778 DP_ERR(dev, "roce register tid returned an error %d\n", rc); 2779 goto err2; 2780 } 2781 2782 mr->ibmr.lkey = mr->hw_mr.itid << 8 | mr->hw_mr.key; 2783 if (mr->hw_mr.remote_write || mr->hw_mr.remote_read || 2784 mr->hw_mr.remote_atomic) 2785 mr->ibmr.rkey = mr->hw_mr.itid << 8 | mr->hw_mr.key; 2786 2787 DP_DEBUG(dev, QEDR_MSG_MR, "register user mr lkey: %x\n", 2788 mr->ibmr.lkey); 2789 return &mr->ibmr; 2790 2791 err2: 2792 dev->ops->rdma_free_tid(dev->rdma_ctx, mr->hw_mr.itid); 2793 err1: 2794 qedr_free_pbl(dev, &mr->info.pbl_info, mr->info.pbl_table); 2795 err0: 2796 kfree(mr); 2797 return ERR_PTR(rc); 2798 } 2799 2800 int qedr_dereg_mr(struct ib_mr *ib_mr) 2801 { 2802 struct qedr_mr *mr = get_qedr_mr(ib_mr); 2803 struct qedr_dev *dev = get_qedr_dev(ib_mr->device); 2804 int rc = 0; 2805 2806 rc = dev->ops->rdma_deregister_tid(dev->rdma_ctx, mr->hw_mr.itid); 2807 if (rc) 2808 return rc; 2809 2810 dev->ops->rdma_free_tid(dev->rdma_ctx, mr->hw_mr.itid); 2811 2812 if ((mr->type != QEDR_MR_DMA) && (mr->type != QEDR_MR_FRMR)) 2813 qedr_free_pbl(dev, &mr->info.pbl_info, mr->info.pbl_table); 2814 2815 /* it could be user registered memory. */ 2816 if (mr->umem) 2817 ib_umem_release(mr->umem); 2818 2819 kfree(mr); 2820 2821 return rc; 2822 } 2823 2824 static struct qedr_mr *__qedr_alloc_mr(struct ib_pd *ibpd, 2825 int max_page_list_len) 2826 { 2827 struct qedr_pd *pd = get_qedr_pd(ibpd); 2828 struct qedr_dev *dev = get_qedr_dev(ibpd->device); 2829 struct qedr_mr *mr; 2830 int rc = -ENOMEM; 2831 2832 DP_DEBUG(dev, QEDR_MSG_MR, 2833 "qedr_alloc_frmr pd = %d max_page_list_len= %d\n", pd->pd_id, 2834 max_page_list_len); 2835 2836 mr = kzalloc(sizeof(*mr), GFP_KERNEL); 2837 if (!mr) 2838 return ERR_PTR(rc); 2839 2840 mr->dev = dev; 2841 mr->type = QEDR_MR_FRMR; 2842 2843 rc = init_mr_info(dev, &mr->info, max_page_list_len, 1); 2844 if (rc) 2845 goto err0; 2846 2847 rc = dev->ops->rdma_alloc_tid(dev->rdma_ctx, &mr->hw_mr.itid); 2848 if (rc) { 2849 DP_ERR(dev, "roce alloc tid returned an error %d\n", rc); 2850 goto err0; 2851 } 2852 2853 /* Index only, 18 bit long, lkey = itid << 8 | key */ 2854 mr->hw_mr.tid_type = QED_RDMA_TID_FMR; 2855 mr->hw_mr.key = 0; 2856 mr->hw_mr.pd = pd->pd_id; 2857 mr->hw_mr.local_read = 1; 2858 mr->hw_mr.local_write = 0; 2859 mr->hw_mr.remote_read = 0; 2860 mr->hw_mr.remote_write = 0; 2861 mr->hw_mr.remote_atomic = 0; 2862 mr->hw_mr.mw_bind = false; 2863 mr->hw_mr.pbl_ptr = 0; 2864 mr->hw_mr.pbl_two_level = mr->info.pbl_info.two_layered; 2865 mr->hw_mr.pbl_page_size_log = ilog2(mr->info.pbl_info.pbl_size); 2866 mr->hw_mr.fbo = 0; 2867 mr->hw_mr.length = 0; 2868 mr->hw_mr.vaddr = 0; 2869 mr->hw_mr.zbva = false; 2870 mr->hw_mr.phy_mr = true; 2871 mr->hw_mr.dma_mr = false; 2872 2873 rc = dev->ops->rdma_register_tid(dev->rdma_ctx, &mr->hw_mr); 2874 if (rc) { 2875 DP_ERR(dev, "roce register tid returned an error %d\n", rc); 2876 goto err1; 2877 } 2878 2879 mr->ibmr.lkey = mr->hw_mr.itid << 8 | mr->hw_mr.key; 2880 
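	/* For an FRMR the rkey simply mirrors the lkey; the remote access
	 * rights for each registration are applied later by the fast-MR WQE
	 * built in qedr_prepare_reg().
	 */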
mr->ibmr.rkey = mr->ibmr.lkey; 2881 2882 DP_DEBUG(dev, QEDR_MSG_MR, "alloc frmr: %x\n", mr->ibmr.lkey); 2883 return mr; 2884 2885 err1: 2886 dev->ops->rdma_free_tid(dev->rdma_ctx, mr->hw_mr.itid); 2887 err0: 2888 kfree(mr); 2889 return ERR_PTR(rc); 2890 } 2891 2892 struct ib_mr *qedr_alloc_mr(struct ib_pd *ibpd, 2893 enum ib_mr_type mr_type, u32 max_num_sg) 2894 { 2895 struct qedr_mr *mr; 2896 2897 if (mr_type != IB_MR_TYPE_MEM_REG) 2898 return ERR_PTR(-EINVAL); 2899 2900 mr = __qedr_alloc_mr(ibpd, max_num_sg); 2901 2902 if (IS_ERR(mr)) 2903 return ERR_PTR(-EINVAL); 2904 2905 return &mr->ibmr; 2906 } 2907 2908 static int qedr_set_page(struct ib_mr *ibmr, u64 addr) 2909 { 2910 struct qedr_mr *mr = get_qedr_mr(ibmr); 2911 struct qedr_pbl *pbl_table; 2912 struct regpair *pbe; 2913 u32 pbes_in_page; 2914 2915 if (unlikely(mr->npages == mr->info.pbl_info.num_pbes)) { 2916 DP_ERR(mr->dev, "qedr_set_page fails when %d\n", mr->npages); 2917 return -ENOMEM; 2918 } 2919 2920 DP_DEBUG(mr->dev, QEDR_MSG_MR, "qedr_set_page pages[%d] = 0x%llx\n", 2921 mr->npages, addr); 2922 2923 pbes_in_page = mr->info.pbl_info.pbl_size / sizeof(u64); 2924 pbl_table = mr->info.pbl_table + (mr->npages / pbes_in_page); 2925 pbe = (struct regpair *)pbl_table->va; 2926 pbe += mr->npages % pbes_in_page; 2927 pbe->lo = cpu_to_le32((u32)addr); 2928 pbe->hi = cpu_to_le32((u32)upper_32_bits(addr)); 2929 2930 mr->npages++; 2931 2932 return 0; 2933 } 2934 2935 static void handle_completed_mrs(struct qedr_dev *dev, struct mr_info *info) 2936 { 2937 int work = info->completed - info->completed_handled - 1; 2938 2939 DP_DEBUG(dev, QEDR_MSG_MR, "Special FMR work = %d\n", work); 2940 while (work-- > 0 && !list_empty(&info->inuse_pbl_list)) { 2941 struct qedr_pbl *pbl; 2942 2943 /* Free all the page list that are possible to be freed 2944 * (all the ones that were invalidated), under the assumption 2945 * that if an FMR was completed successfully that means that 2946 * if there was an invalidate operation before it also ended 2947 */ 2948 pbl = list_first_entry(&info->inuse_pbl_list, 2949 struct qedr_pbl, list_entry); 2950 list_move_tail(&pbl->list_entry, &info->free_pbl_list); 2951 info->completed_handled++; 2952 } 2953 } 2954 2955 int qedr_map_mr_sg(struct ib_mr *ibmr, struct scatterlist *sg, 2956 int sg_nents, unsigned int *sg_offset) 2957 { 2958 struct qedr_mr *mr = get_qedr_mr(ibmr); 2959 2960 mr->npages = 0; 2961 2962 handle_completed_mrs(mr->dev, &mr->info); 2963 return ib_sg_to_pages(ibmr, sg, sg_nents, NULL, qedr_set_page); 2964 } 2965 2966 struct ib_mr *qedr_get_dma_mr(struct ib_pd *ibpd, int acc) 2967 { 2968 struct qedr_dev *dev = get_qedr_dev(ibpd->device); 2969 struct qedr_pd *pd = get_qedr_pd(ibpd); 2970 struct qedr_mr *mr; 2971 int rc; 2972 2973 mr = kzalloc(sizeof(*mr), GFP_KERNEL); 2974 if (!mr) 2975 return ERR_PTR(-ENOMEM); 2976 2977 mr->type = QEDR_MR_DMA; 2978 2979 rc = dev->ops->rdma_alloc_tid(dev->rdma_ctx, &mr->hw_mr.itid); 2980 if (rc) { 2981 DP_ERR(dev, "roce alloc tid returned an error %d\n", rc); 2982 goto err1; 2983 } 2984 2985 /* index only, 18 bit long, lkey = itid << 8 | key */ 2986 mr->hw_mr.tid_type = QED_RDMA_TID_REGISTERED_MR; 2987 mr->hw_mr.pd = pd->pd_id; 2988 mr->hw_mr.local_read = 1; 2989 mr->hw_mr.local_write = (acc & IB_ACCESS_LOCAL_WRITE) ? 1 : 0; 2990 mr->hw_mr.remote_read = (acc & IB_ACCESS_REMOTE_READ) ? 1 : 0; 2991 mr->hw_mr.remote_write = (acc & IB_ACCESS_REMOTE_WRITE) ? 1 : 0; 2992 mr->hw_mr.remote_atomic = (acc & IB_ACCESS_REMOTE_ATOMIC) ? 
1 : 0; 2993 mr->hw_mr.dma_mr = true; 2994 2995 rc = dev->ops->rdma_register_tid(dev->rdma_ctx, &mr->hw_mr); 2996 if (rc) { 2997 DP_ERR(dev, "roce register tid returned an error %d\n", rc); 2998 goto err2; 2999 } 3000 3001 mr->ibmr.lkey = mr->hw_mr.itid << 8 | mr->hw_mr.key; 3002 if (mr->hw_mr.remote_write || mr->hw_mr.remote_read || 3003 mr->hw_mr.remote_atomic) 3004 mr->ibmr.rkey = mr->hw_mr.itid << 8 | mr->hw_mr.key; 3005 3006 DP_DEBUG(dev, QEDR_MSG_MR, "get dma mr: lkey = %x\n", mr->ibmr.lkey); 3007 return &mr->ibmr; 3008 3009 err2: 3010 dev->ops->rdma_free_tid(dev->rdma_ctx, mr->hw_mr.itid); 3011 err1: 3012 kfree(mr); 3013 return ERR_PTR(rc); 3014 } 3015 3016 static inline int qedr_wq_is_full(struct qedr_qp_hwq_info *wq) 3017 { 3018 return (((wq->prod + 1) % wq->max_wr) == wq->cons); 3019 } 3020 3021 static int sge_data_len(struct ib_sge *sg_list, int num_sge) 3022 { 3023 int i, len = 0; 3024 3025 for (i = 0; i < num_sge; i++) 3026 len += sg_list[i].length; 3027 3028 return len; 3029 } 3030 3031 static void swap_wqe_data64(u64 *p) 3032 { 3033 int i; 3034 3035 for (i = 0; i < QEDR_SQE_ELEMENT_SIZE / sizeof(u64); i++, p++) 3036 *p = cpu_to_be64(cpu_to_le64(*p)); 3037 } 3038 3039 static u32 qedr_prepare_sq_inline_data(struct qedr_dev *dev, 3040 struct qedr_qp *qp, u8 *wqe_size, 3041 const struct ib_send_wr *wr, 3042 const struct ib_send_wr **bad_wr, 3043 u8 *bits, u8 bit) 3044 { 3045 u32 data_size = sge_data_len(wr->sg_list, wr->num_sge); 3046 char *seg_prt, *wqe; 3047 int i, seg_siz; 3048 3049 if (data_size > ROCE_REQ_MAX_INLINE_DATA_SIZE) { 3050 DP_ERR(dev, "Too much inline data in WR: %d\n", data_size); 3051 *bad_wr = wr; 3052 return 0; 3053 } 3054 3055 if (!data_size) 3056 return data_size; 3057 3058 *bits |= bit; 3059 3060 seg_prt = NULL; 3061 wqe = NULL; 3062 seg_siz = 0; 3063 3064 /* Copy data inline */ 3065 for (i = 0; i < wr->num_sge; i++) { 3066 u32 len = wr->sg_list[i].length; 3067 void *src = (void *)(uintptr_t)wr->sg_list[i].addr; 3068 3069 while (len > 0) { 3070 u32 cur; 3071 3072 /* New segment required */ 3073 if (!seg_siz) { 3074 wqe = (char *)qed_chain_produce(&qp->sq.pbl); 3075 seg_prt = wqe; 3076 seg_siz = sizeof(struct rdma_sq_common_wqe); 3077 (*wqe_size)++; 3078 } 3079 3080 /* Calculate currently allowed length */ 3081 cur = min_t(u32, len, seg_siz); 3082 memcpy(seg_prt, src, cur); 3083 3084 /* Update segment variables */ 3085 seg_prt += cur; 3086 seg_siz -= cur; 3087 3088 /* Update sge variables */ 3089 src += cur; 3090 len -= cur; 3091 3092 /* Swap fully-completed segments */ 3093 if (!seg_siz) 3094 swap_wqe_data64((u64 *)wqe); 3095 } 3096 } 3097 3098 /* swap last not completed segment */ 3099 if (seg_siz) 3100 swap_wqe_data64((u64 *)wqe); 3101 3102 return data_size; 3103 } 3104 3105 #define RQ_SGE_SET(sge, vaddr, vlength, vflags) \ 3106 do { \ 3107 DMA_REGPAIR_LE(sge->addr, vaddr); \ 3108 (sge)->length = cpu_to_le32(vlength); \ 3109 (sge)->flags = cpu_to_le32(vflags); \ 3110 } while (0) 3111 3112 #define SRQ_HDR_SET(hdr, vwr_id, num_sge) \ 3113 do { \ 3114 DMA_REGPAIR_LE(hdr->wr_id, vwr_id); \ 3115 (hdr)->num_sges = num_sge; \ 3116 } while (0) 3117 3118 #define SRQ_SGE_SET(sge, vaddr, vlength, vlkey) \ 3119 do { \ 3120 DMA_REGPAIR_LE(sge->addr, vaddr); \ 3121 (sge)->length = cpu_to_le32(vlength); \ 3122 (sge)->l_key = cpu_to_le32(vlkey); \ 3123 } while (0) 3124 3125 static u32 qedr_prepare_sq_sges(struct qedr_qp *qp, u8 *wqe_size, 3126 const struct ib_send_wr *wr) 3127 { 3128 u32 data_size = 0; 3129 int i; 3130 3131 for (i = 0; i < wr->num_sge; i++) { 3132 struct 
rdma_sq_sge *sge = qed_chain_produce(&qp->sq.pbl); 3133 3134 DMA_REGPAIR_LE(sge->addr, wr->sg_list[i].addr); 3135 sge->l_key = cpu_to_le32(wr->sg_list[i].lkey); 3136 sge->length = cpu_to_le32(wr->sg_list[i].length); 3137 data_size += wr->sg_list[i].length; 3138 } 3139 3140 if (wqe_size) 3141 *wqe_size += wr->num_sge; 3142 3143 return data_size; 3144 } 3145 3146 static u32 qedr_prepare_sq_rdma_data(struct qedr_dev *dev, 3147 struct qedr_qp *qp, 3148 struct rdma_sq_rdma_wqe_1st *rwqe, 3149 struct rdma_sq_rdma_wqe_2nd *rwqe2, 3150 const struct ib_send_wr *wr, 3151 const struct ib_send_wr **bad_wr) 3152 { 3153 rwqe2->r_key = cpu_to_le32(rdma_wr(wr)->rkey); 3154 DMA_REGPAIR_LE(rwqe2->remote_va, rdma_wr(wr)->remote_addr); 3155 3156 if (wr->send_flags & IB_SEND_INLINE && 3157 (wr->opcode == IB_WR_RDMA_WRITE_WITH_IMM || 3158 wr->opcode == IB_WR_RDMA_WRITE)) { 3159 u8 flags = 0; 3160 3161 SET_FIELD2(flags, RDMA_SQ_RDMA_WQE_1ST_INLINE_FLG, 1); 3162 return qedr_prepare_sq_inline_data(dev, qp, &rwqe->wqe_size, wr, 3163 bad_wr, &rwqe->flags, flags); 3164 } 3165 3166 return qedr_prepare_sq_sges(qp, &rwqe->wqe_size, wr); 3167 } 3168 3169 static u32 qedr_prepare_sq_send_data(struct qedr_dev *dev, 3170 struct qedr_qp *qp, 3171 struct rdma_sq_send_wqe_1st *swqe, 3172 struct rdma_sq_send_wqe_2st *swqe2, 3173 const struct ib_send_wr *wr, 3174 const struct ib_send_wr **bad_wr) 3175 { 3176 memset(swqe2, 0, sizeof(*swqe2)); 3177 if (wr->send_flags & IB_SEND_INLINE) { 3178 u8 flags = 0; 3179 3180 SET_FIELD2(flags, RDMA_SQ_SEND_WQE_INLINE_FLG, 1); 3181 return qedr_prepare_sq_inline_data(dev, qp, &swqe->wqe_size, wr, 3182 bad_wr, &swqe->flags, flags); 3183 } 3184 3185 return qedr_prepare_sq_sges(qp, &swqe->wqe_size, wr); 3186 } 3187 3188 static int qedr_prepare_reg(struct qedr_qp *qp, 3189 struct rdma_sq_fmr_wqe_1st *fwqe1, 3190 const struct ib_reg_wr *wr) 3191 { 3192 struct qedr_mr *mr = get_qedr_mr(wr->mr); 3193 struct rdma_sq_fmr_wqe_2nd *fwqe2; 3194 3195 fwqe2 = (struct rdma_sq_fmr_wqe_2nd *)qed_chain_produce(&qp->sq.pbl); 3196 fwqe1->addr.hi = upper_32_bits(mr->ibmr.iova); 3197 fwqe1->addr.lo = lower_32_bits(mr->ibmr.iova); 3198 fwqe1->l_key = wr->key; 3199 3200 fwqe2->access_ctrl = 0; 3201 3202 SET_FIELD2(fwqe2->access_ctrl, RDMA_SQ_FMR_WQE_2ND_REMOTE_READ, 3203 !!(wr->access & IB_ACCESS_REMOTE_READ)); 3204 SET_FIELD2(fwqe2->access_ctrl, RDMA_SQ_FMR_WQE_2ND_REMOTE_WRITE, 3205 !!(wr->access & IB_ACCESS_REMOTE_WRITE)); 3206 SET_FIELD2(fwqe2->access_ctrl, RDMA_SQ_FMR_WQE_2ND_ENABLE_ATOMIC, 3207 !!(wr->access & IB_ACCESS_REMOTE_ATOMIC)); 3208 SET_FIELD2(fwqe2->access_ctrl, RDMA_SQ_FMR_WQE_2ND_LOCAL_READ, 1); 3209 SET_FIELD2(fwqe2->access_ctrl, RDMA_SQ_FMR_WQE_2ND_LOCAL_WRITE, 3210 !!(wr->access & IB_ACCESS_LOCAL_WRITE)); 3211 fwqe2->fmr_ctrl = 0; 3212 3213 SET_FIELD2(fwqe2->fmr_ctrl, RDMA_SQ_FMR_WQE_2ND_PAGE_SIZE_LOG, 3214 ilog2(mr->ibmr.page_size) - 12); 3215 3216 fwqe2->length_hi = 0; 3217 fwqe2->length_lo = mr->ibmr.length; 3218 fwqe2->pbl_addr.hi = upper_32_bits(mr->info.pbl_table->pa); 3219 fwqe2->pbl_addr.lo = lower_32_bits(mr->info.pbl_table->pa); 3220 3221 qp->wqe_wr_id[qp->sq.prod].mr = mr; 3222 3223 return 0; 3224 } 3225 3226 static enum ib_wc_opcode qedr_ib_to_wc_opcode(enum ib_wr_opcode opcode) 3227 { 3228 switch (opcode) { 3229 case IB_WR_RDMA_WRITE: 3230 case IB_WR_RDMA_WRITE_WITH_IMM: 3231 return IB_WC_RDMA_WRITE; 3232 case IB_WR_SEND_WITH_IMM: 3233 case IB_WR_SEND: 3234 case IB_WR_SEND_WITH_INV: 3235 return IB_WC_SEND; 3236 case IB_WR_RDMA_READ: 3237 case IB_WR_RDMA_READ_WITH_INV: 3238 return 
IB_WC_RDMA_READ; 3239 case IB_WR_ATOMIC_CMP_AND_SWP: 3240 return IB_WC_COMP_SWAP; 3241 case IB_WR_ATOMIC_FETCH_AND_ADD: 3242 return IB_WC_FETCH_ADD; 3243 case IB_WR_REG_MR: 3244 return IB_WC_REG_MR; 3245 case IB_WR_LOCAL_INV: 3246 return IB_WC_LOCAL_INV; 3247 default: 3248 return IB_WC_SEND; 3249 } 3250 } 3251 3252 static inline bool qedr_can_post_send(struct qedr_qp *qp, 3253 const struct ib_send_wr *wr) 3254 { 3255 int wq_is_full, err_wr, pbl_is_full; 3256 struct qedr_dev *dev = qp->dev; 3257 3258 /* prevent SQ overflow and/or processing of a bad WR */ 3259 err_wr = wr->num_sge > qp->sq.max_sges; 3260 wq_is_full = qedr_wq_is_full(&qp->sq); 3261 pbl_is_full = qed_chain_get_elem_left_u32(&qp->sq.pbl) < 3262 QEDR_MAX_SQE_ELEMENTS_PER_SQE; 3263 if (wq_is_full || err_wr || pbl_is_full) { 3264 if (wq_is_full && !(qp->err_bitmap & QEDR_QP_ERR_SQ_FULL)) { 3265 DP_ERR(dev, 3266 "error: WQ is full. Post send on QP %p failed (this error appears only once)\n", 3267 qp); 3268 qp->err_bitmap |= QEDR_QP_ERR_SQ_FULL; 3269 } 3270 3271 if (err_wr && !(qp->err_bitmap & QEDR_QP_ERR_BAD_SR)) { 3272 DP_ERR(dev, 3273 "error: WR is bad. Post send on QP %p failed (this error appears only once)\n", 3274 qp); 3275 qp->err_bitmap |= QEDR_QP_ERR_BAD_SR; 3276 } 3277 3278 if (pbl_is_full && 3279 !(qp->err_bitmap & QEDR_QP_ERR_SQ_PBL_FULL)) { 3280 DP_ERR(dev, 3281 "error: WQ PBL is full. Post send on QP %p failed (this error appears only once)\n", 3282 qp); 3283 qp->err_bitmap |= QEDR_QP_ERR_SQ_PBL_FULL; 3284 } 3285 return false; 3286 } 3287 return true; 3288 } 3289 3290 static int __qedr_post_send(struct ib_qp *ibqp, const struct ib_send_wr *wr, 3291 const struct ib_send_wr **bad_wr) 3292 { 3293 struct qedr_dev *dev = get_qedr_dev(ibqp->device); 3294 struct qedr_qp *qp = get_qedr_qp(ibqp); 3295 struct rdma_sq_atomic_wqe_1st *awqe1; 3296 struct rdma_sq_atomic_wqe_2nd *awqe2; 3297 struct rdma_sq_atomic_wqe_3rd *awqe3; 3298 struct rdma_sq_send_wqe_2st *swqe2; 3299 struct rdma_sq_local_inv_wqe *iwqe; 3300 struct rdma_sq_rdma_wqe_2nd *rwqe2; 3301 struct rdma_sq_send_wqe_1st *swqe; 3302 struct rdma_sq_rdma_wqe_1st *rwqe; 3303 struct rdma_sq_fmr_wqe_1st *fwqe1; 3304 struct rdma_sq_common_wqe *wqe; 3305 u32 length; 3306 int rc = 0; 3307 bool comp; 3308 3309 if (!qedr_can_post_send(qp, wr)) { 3310 *bad_wr = wr; 3311 return -ENOMEM; 3312 } 3313 3314 wqe = qed_chain_produce(&qp->sq.pbl); 3315 qp->wqe_wr_id[qp->sq.prod].signaled = 3316 !!(wr->send_flags & IB_SEND_SIGNALED) || qp->signaled; 3317 3318 wqe->flags = 0; 3319 SET_FIELD2(wqe->flags, RDMA_SQ_SEND_WQE_SE_FLG, 3320 !!(wr->send_flags & IB_SEND_SOLICITED)); 3321 comp = (!!(wr->send_flags & IB_SEND_SIGNALED)) || qp->signaled; 3322 SET_FIELD2(wqe->flags, RDMA_SQ_SEND_WQE_COMP_FLG, comp); 3323 SET_FIELD2(wqe->flags, RDMA_SQ_SEND_WQE_RD_FENCE_FLG, 3324 !!(wr->send_flags & IB_SEND_FENCE)); 3325 wqe->prev_wqe_size = qp->prev_wqe_size; 3326 3327 qp->wqe_wr_id[qp->sq.prod].opcode = qedr_ib_to_wc_opcode(wr->opcode); 3328 3329 switch (wr->opcode) { 3330 case IB_WR_SEND_WITH_IMM: 3331 if (unlikely(rdma_protocol_iwarp(&dev->ibdev, 1))) { 3332 rc = -EINVAL; 3333 *bad_wr = wr; 3334 break; 3335 } 3336 wqe->req_type = RDMA_SQ_REQ_TYPE_SEND_WITH_IMM; 3337 swqe = (struct rdma_sq_send_wqe_1st *)wqe; 3338 swqe->wqe_size = 2; 3339 swqe2 = qed_chain_produce(&qp->sq.pbl); 3340 3341 swqe->inv_key_or_imm_data = cpu_to_le32(be32_to_cpu(wr->ex.imm_data)); 3342 length = qedr_prepare_sq_send_data(dev, qp, swqe, swqe2, 3343 wr, bad_wr); 3344 swqe->length = cpu_to_le32(length); 3345 
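		/* Record the WQE size in the shadow ring so that poll_cq can
		 * consume the same number of chain elements for this WR.
		 */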
qp->wqe_wr_id[qp->sq.prod].wqe_size = swqe->wqe_size; 3346 qp->prev_wqe_size = swqe->wqe_size; 3347 qp->wqe_wr_id[qp->sq.prod].bytes_len = swqe->length; 3348 break; 3349 case IB_WR_SEND: 3350 wqe->req_type = RDMA_SQ_REQ_TYPE_SEND; 3351 swqe = (struct rdma_sq_send_wqe_1st *)wqe; 3352 3353 swqe->wqe_size = 2; 3354 swqe2 = qed_chain_produce(&qp->sq.pbl); 3355 length = qedr_prepare_sq_send_data(dev, qp, swqe, swqe2, 3356 wr, bad_wr); 3357 swqe->length = cpu_to_le32(length); 3358 qp->wqe_wr_id[qp->sq.prod].wqe_size = swqe->wqe_size; 3359 qp->prev_wqe_size = swqe->wqe_size; 3360 qp->wqe_wr_id[qp->sq.prod].bytes_len = swqe->length; 3361 break; 3362 case IB_WR_SEND_WITH_INV: 3363 wqe->req_type = RDMA_SQ_REQ_TYPE_SEND_WITH_INVALIDATE; 3364 swqe = (struct rdma_sq_send_wqe_1st *)wqe; 3365 swqe2 = qed_chain_produce(&qp->sq.pbl); 3366 swqe->wqe_size = 2; 3367 swqe->inv_key_or_imm_data = cpu_to_le32(wr->ex.invalidate_rkey); 3368 length = qedr_prepare_sq_send_data(dev, qp, swqe, swqe2, 3369 wr, bad_wr); 3370 swqe->length = cpu_to_le32(length); 3371 qp->wqe_wr_id[qp->sq.prod].wqe_size = swqe->wqe_size; 3372 qp->prev_wqe_size = swqe->wqe_size; 3373 qp->wqe_wr_id[qp->sq.prod].bytes_len = swqe->length; 3374 break; 3375 3376 case IB_WR_RDMA_WRITE_WITH_IMM: 3377 if (unlikely(rdma_protocol_iwarp(&dev->ibdev, 1))) { 3378 rc = -EINVAL; 3379 *bad_wr = wr; 3380 break; 3381 } 3382 wqe->req_type = RDMA_SQ_REQ_TYPE_RDMA_WR_WITH_IMM; 3383 rwqe = (struct rdma_sq_rdma_wqe_1st *)wqe; 3384 3385 rwqe->wqe_size = 2; 3386 rwqe->imm_data = htonl(cpu_to_le32(wr->ex.imm_data)); 3387 rwqe2 = qed_chain_produce(&qp->sq.pbl); 3388 length = qedr_prepare_sq_rdma_data(dev, qp, rwqe, rwqe2, 3389 wr, bad_wr); 3390 rwqe->length = cpu_to_le32(length); 3391 qp->wqe_wr_id[qp->sq.prod].wqe_size = rwqe->wqe_size; 3392 qp->prev_wqe_size = rwqe->wqe_size; 3393 qp->wqe_wr_id[qp->sq.prod].bytes_len = rwqe->length; 3394 break; 3395 case IB_WR_RDMA_WRITE: 3396 wqe->req_type = RDMA_SQ_REQ_TYPE_RDMA_WR; 3397 rwqe = (struct rdma_sq_rdma_wqe_1st *)wqe; 3398 3399 rwqe->wqe_size = 2; 3400 rwqe2 = qed_chain_produce(&qp->sq.pbl); 3401 length = qedr_prepare_sq_rdma_data(dev, qp, rwqe, rwqe2, 3402 wr, bad_wr); 3403 rwqe->length = cpu_to_le32(length); 3404 qp->wqe_wr_id[qp->sq.prod].wqe_size = rwqe->wqe_size; 3405 qp->prev_wqe_size = rwqe->wqe_size; 3406 qp->wqe_wr_id[qp->sq.prod].bytes_len = rwqe->length; 3407 break; 3408 case IB_WR_RDMA_READ_WITH_INV: 3409 SET_FIELD2(wqe->flags, RDMA_SQ_RDMA_WQE_1ST_READ_INV_FLG, 1); 3410 /* fallthrough -- same is identical to RDMA READ */ 3411 3412 case IB_WR_RDMA_READ: 3413 wqe->req_type = RDMA_SQ_REQ_TYPE_RDMA_RD; 3414 rwqe = (struct rdma_sq_rdma_wqe_1st *)wqe; 3415 3416 rwqe->wqe_size = 2; 3417 rwqe2 = qed_chain_produce(&qp->sq.pbl); 3418 length = qedr_prepare_sq_rdma_data(dev, qp, rwqe, rwqe2, 3419 wr, bad_wr); 3420 rwqe->length = cpu_to_le32(length); 3421 qp->wqe_wr_id[qp->sq.prod].wqe_size = rwqe->wqe_size; 3422 qp->prev_wqe_size = rwqe->wqe_size; 3423 qp->wqe_wr_id[qp->sq.prod].bytes_len = rwqe->length; 3424 break; 3425 3426 case IB_WR_ATOMIC_CMP_AND_SWP: 3427 case IB_WR_ATOMIC_FETCH_AND_ADD: 3428 awqe1 = (struct rdma_sq_atomic_wqe_1st *)wqe; 3429 awqe1->wqe_size = 4; 3430 3431 awqe2 = qed_chain_produce(&qp->sq.pbl); 3432 DMA_REGPAIR_LE(awqe2->remote_va, atomic_wr(wr)->remote_addr); 3433 awqe2->r_key = cpu_to_le32(atomic_wr(wr)->rkey); 3434 3435 awqe3 = qed_chain_produce(&qp->sq.pbl); 3436 3437 if (wr->opcode == IB_WR_ATOMIC_FETCH_AND_ADD) { 3438 wqe->req_type = RDMA_SQ_REQ_TYPE_ATOMIC_ADD; 3439 
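			/* For fetch-and-add the add operand is carried in the
			 * swap_data field of the third WQE segment.
			 */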
DMA_REGPAIR_LE(awqe3->swap_data,
				       atomic_wr(wr)->compare_add);
		} else {
			wqe->req_type = RDMA_SQ_REQ_TYPE_ATOMIC_CMP_AND_SWAP;
			DMA_REGPAIR_LE(awqe3->swap_data,
				       atomic_wr(wr)->swap);
			DMA_REGPAIR_LE(awqe3->cmp_data,
				       atomic_wr(wr)->compare_add);
		}

		qedr_prepare_sq_sges(qp, NULL, wr);

		qp->wqe_wr_id[qp->sq.prod].wqe_size = awqe1->wqe_size;
		qp->prev_wqe_size = awqe1->wqe_size;
		break;

	case IB_WR_LOCAL_INV:
		iwqe = (struct rdma_sq_local_inv_wqe *)wqe;
		iwqe->wqe_size = 1;

		iwqe->req_type = RDMA_SQ_REQ_TYPE_LOCAL_INVALIDATE;
		iwqe->inv_l_key = wr->ex.invalidate_rkey;
		qp->wqe_wr_id[qp->sq.prod].wqe_size = iwqe->wqe_size;
		qp->prev_wqe_size = iwqe->wqe_size;
		break;
	case IB_WR_REG_MR:
		DP_DEBUG(dev, QEDR_MSG_CQ, "REG_MR\n");
		wqe->req_type = RDMA_SQ_REQ_TYPE_FAST_MR;
		fwqe1 = (struct rdma_sq_fmr_wqe_1st *)wqe;
		fwqe1->wqe_size = 2;

		rc = qedr_prepare_reg(qp, fwqe1, reg_wr(wr));
		if (rc) {
			DP_ERR(dev, "IB_REG_MR failed rc=%d\n", rc);
			*bad_wr = wr;
			break;
		}

		qp->wqe_wr_id[qp->sq.prod].wqe_size = fwqe1->wqe_size;
		qp->prev_wqe_size = fwqe1->wqe_size;
		break;
	default:
		DP_ERR(dev, "invalid opcode 0x%x!\n", wr->opcode);
		rc = -EINVAL;
		*bad_wr = wr;
		break;
	}

	if (*bad_wr) {
		u16 value;

		/* Restore prod to its position before
		 * this WR was processed
		 */
		value = le16_to_cpu(qp->sq.db_data.data.value);
		qed_chain_set_prod(&qp->sq.pbl, value, wqe);

		/* Restore prev_wqe_size */
		qp->prev_wqe_size = wqe->prev_wqe_size;
		rc = -EINVAL;
		DP_ERR(dev, "POST SEND FAILED\n");
	}

	return rc;
}

int qedr_post_send(struct ib_qp *ibqp, const struct ib_send_wr *wr,
		   const struct ib_send_wr **bad_wr)
{
	struct qedr_dev *dev = get_qedr_dev(ibqp->device);
	struct qedr_qp *qp = get_qedr_qp(ibqp);
	unsigned long flags;
	int rc = 0;

	*bad_wr = NULL;

	if (qp->qp_type == IB_QPT_GSI)
		return qedr_gsi_post_send(ibqp, wr, bad_wr);

	spin_lock_irqsave(&qp->q_lock, flags);

	if (rdma_protocol_roce(&dev->ibdev, 1)) {
		if ((qp->state != QED_ROCE_QP_STATE_RTS) &&
		    (qp->state != QED_ROCE_QP_STATE_ERR) &&
		    (qp->state != QED_ROCE_QP_STATE_SQD)) {
			spin_unlock_irqrestore(&qp->q_lock, flags);
			*bad_wr = wr;
			DP_DEBUG(dev, QEDR_MSG_CQ,
				 "QP in wrong state! QP icid=0x%x state %d\n",
				 qp->icid, qp->state);
			return -EINVAL;
		}
	}

	while (wr) {
		rc = __qedr_post_send(ibqp, wr, bad_wr);
		if (rc)
			break;

		qp->wqe_wr_id[qp->sq.prod].wr_id = wr->wr_id;

		qedr_inc_sw_prod(&qp->sq);

		qp->sq.db_data.data.value++;

		wr = wr->next;
	}

	/* Trigger doorbell
	 * If there was a failure in the first WR then it will be triggered in
	 * vain. However this is not harmful (as long as the producer value is
	 * unchanged). For performance reasons we avoid checking for this
	 * redundant doorbell.
	 *
	 * qp->wqe_wr_id is accessed during qedr_poll_cq, as
	 * soon as we give the doorbell, we could get a completion
	 * for this wr, therefore we need to make sure that the
	 * memory is updated before giving the doorbell.
	 * During qedr_poll_cq, rmb is called before accessing the
	 * cqe. This covers for the smp_rmb as well.
3559 */ 3560 smp_wmb(); 3561 writel(qp->sq.db_data.raw, qp->sq.db); 3562 3563 /* Make sure write sticks */ 3564 mmiowb(); 3565 3566 spin_unlock_irqrestore(&qp->q_lock, flags); 3567 3568 return rc; 3569 } 3570 3571 static u32 qedr_srq_elem_left(struct qedr_srq_hwq_info *hw_srq) 3572 { 3573 u32 used; 3574 3575 /* Calculate number of elements used based on producer 3576 * count and consumer count and subtract it from max 3577 * work request supported so that we get elements left. 3578 */ 3579 used = hw_srq->wr_prod_cnt - hw_srq->wr_cons_cnt; 3580 3581 return hw_srq->max_wr - used; 3582 } 3583 3584 int qedr_post_srq_recv(struct ib_srq *ibsrq, const struct ib_recv_wr *wr, 3585 const struct ib_recv_wr **bad_wr) 3586 { 3587 struct qedr_srq *srq = get_qedr_srq(ibsrq); 3588 struct qedr_srq_hwq_info *hw_srq; 3589 struct qedr_dev *dev = srq->dev; 3590 struct qed_chain *pbl; 3591 unsigned long flags; 3592 int status = 0; 3593 u32 num_sge; 3594 u32 offset; 3595 3596 spin_lock_irqsave(&srq->lock, flags); 3597 3598 hw_srq = &srq->hw_srq; 3599 pbl = &srq->hw_srq.pbl; 3600 while (wr) { 3601 struct rdma_srq_wqe_header *hdr; 3602 int i; 3603 3604 if (!qedr_srq_elem_left(hw_srq) || 3605 wr->num_sge > srq->hw_srq.max_sges) { 3606 DP_ERR(dev, "Can't post WR (%d,%d) || (%d > %d)\n", 3607 hw_srq->wr_prod_cnt, hw_srq->wr_cons_cnt, 3608 wr->num_sge, srq->hw_srq.max_sges); 3609 status = -ENOMEM; 3610 *bad_wr = wr; 3611 break; 3612 } 3613 3614 hdr = qed_chain_produce(pbl); 3615 num_sge = wr->num_sge; 3616 /* Set number of sge and work request id in header */ 3617 SRQ_HDR_SET(hdr, wr->wr_id, num_sge); 3618 3619 srq->hw_srq.wr_prod_cnt++; 3620 hw_srq->wqe_prod++; 3621 hw_srq->sge_prod++; 3622 3623 DP_DEBUG(dev, QEDR_MSG_SRQ, 3624 "SRQ WR: SGEs: %d with wr_id[%d] = %llx\n", 3625 wr->num_sge, hw_srq->wqe_prod, wr->wr_id); 3626 3627 for (i = 0; i < wr->num_sge; i++) { 3628 struct rdma_srq_sge *srq_sge = qed_chain_produce(pbl); 3629 3630 /* Set SGE length, lkey and address */ 3631 SRQ_SGE_SET(srq_sge, wr->sg_list[i].addr, 3632 wr->sg_list[i].length, wr->sg_list[i].lkey); 3633 3634 DP_DEBUG(dev, QEDR_MSG_SRQ, 3635 "[%d]: len %d key %x addr %x:%x\n", 3636 i, srq_sge->length, srq_sge->l_key, 3637 srq_sge->addr.hi, srq_sge->addr.lo); 3638 hw_srq->sge_prod++; 3639 } 3640 3641 /* Flush WQE and SGE information before 3642 * updating producer. 3643 */ 3644 wmb(); 3645 3646 /* SRQ producer is 8 bytes. Need to update SGE producer index 3647 * in first 4 bytes and need to update WQE producer in 3648 * next 4 bytes. 3649 */ 3650 *srq->hw_srq.virt_prod_pair_addr = hw_srq->sge_prod; 3651 offset = offsetof(struct rdma_srq_producers, wqe_prod); 3652 *((u8 *)srq->hw_srq.virt_prod_pair_addr + offset) = 3653 hw_srq->wqe_prod; 3654 3655 /* Flush producer after updating it. 
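		 * This makes both halves of the producer pair (sge_prod and
		 * wqe_prod) written above visible to the hardware.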
		 */
		wmb();
		wr = wr->next;
	}

	DP_DEBUG(dev, QEDR_MSG_SRQ, "POST: Elements in S-RQ: %d\n",
		 qed_chain_get_elem_left(pbl));
	spin_unlock_irqrestore(&srq->lock, flags);

	return status;
}

int qedr_post_recv(struct ib_qp *ibqp, const struct ib_recv_wr *wr,
		   const struct ib_recv_wr **bad_wr)
{
	struct qedr_qp *qp = get_qedr_qp(ibqp);
	struct qedr_dev *dev = qp->dev;
	unsigned long flags;
	int status = 0;

	if (qp->qp_type == IB_QPT_GSI)
		return qedr_gsi_post_recv(ibqp, wr, bad_wr);

	spin_lock_irqsave(&qp->q_lock, flags);

	if (qp->state == QED_ROCE_QP_STATE_RESET) {
		spin_unlock_irqrestore(&qp->q_lock, flags);
		*bad_wr = wr;
		return -EINVAL;
	}

	while (wr) {
		int i;

		if (qed_chain_get_elem_left_u32(&qp->rq.pbl) <
		    QEDR_MAX_RQE_ELEMENTS_PER_RQE ||
		    wr->num_sge > qp->rq.max_sges) {
			DP_ERR(dev, "Can't post WR (%d < %d) || (%d > %d)\n",
			       qed_chain_get_elem_left_u32(&qp->rq.pbl),
			       QEDR_MAX_RQE_ELEMENTS_PER_RQE, wr->num_sge,
			       qp->rq.max_sges);
			status = -ENOMEM;
			*bad_wr = wr;
			break;
		}
		for (i = 0; i < wr->num_sge; i++) {
			u32 flags = 0;
			struct rdma_rq_sge *rqe =
			    qed_chain_produce(&qp->rq.pbl);

			/* First one must include the number
			 * of SGE in the list
			 */
			if (!i)
				SET_FIELD(flags, RDMA_RQ_SGE_NUM_SGES,
					  wr->num_sge);

			SET_FIELD(flags, RDMA_RQ_SGE_L_KEY_LO,
				  wr->sg_list[i].lkey);

			RQ_SGE_SET(rqe, wr->sg_list[i].addr,
				   wr->sg_list[i].length, flags);
		}

		/* Special case of no sges. FW requires between 1-4 sges...
		 * in this case we need to post 1 sge with length zero. This is
		 * because an RDMA write with immediate consumes an RQ entry.
		 */
		if (!wr->num_sge) {
			u32 flags = 0;
			struct rdma_rq_sge *rqe =
			    qed_chain_produce(&qp->rq.pbl);

			/* First one must include the number
			 * of SGE in the list
			 */
			SET_FIELD(flags, RDMA_RQ_SGE_L_KEY_LO, 0);
			SET_FIELD(flags, RDMA_RQ_SGE_NUM_SGES, 1);

			RQ_SGE_SET(rqe, 0, 0, flags);
			i = 1;
		}

		qp->rqe_wr_id[qp->rq.prod].wr_id = wr->wr_id;
		qp->rqe_wr_id[qp->rq.prod].wqe_size = i;

		qedr_inc_sw_prod(&qp->rq);

		/* qp->rqe_wr_id is accessed during qedr_poll_cq, as
		 * soon as we give the doorbell, we could get a completion
		 * for this wr, therefore we need to make sure that the
		 * memory is updated before giving the doorbell.
		 * During qedr_poll_cq, rmb is called before accessing the
		 * cqe. This covers for the smp_rmb as well.
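		 * For iWARP a second doorbell (iwarp_db2, set up in
		 * qedr_set_iwarp_db_info()) is rung below as well.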
		 */
		smp_wmb();

		qp->rq.db_data.data.value++;

		writel(qp->rq.db_data.raw, qp->rq.db);

		/* Make sure write sticks */
		mmiowb();

		if (rdma_protocol_iwarp(&dev->ibdev, 1)) {
			writel(qp->rq.iwarp_db2_data.raw, qp->rq.iwarp_db2);
			mmiowb();	/* for second doorbell */
		}

		wr = wr->next;
	}

	spin_unlock_irqrestore(&qp->q_lock, flags);

	return status;
}

static int is_valid_cqe(struct qedr_cq *cq, union rdma_cqe *cqe)
{
	struct rdma_cqe_requester *resp_cqe = &cqe->req;

	return (resp_cqe->flags & RDMA_CQE_REQUESTER_TOGGLE_BIT_MASK) ==
		cq->pbl_toggle;
}

static struct qedr_qp *cqe_get_qp(union rdma_cqe *cqe)
{
	struct rdma_cqe_requester *resp_cqe = &cqe->req;
	struct qedr_qp *qp;

	qp = (struct qedr_qp *)(uintptr_t)HILO_GEN(resp_cqe->qp_handle.hi,
						   resp_cqe->qp_handle.lo,
						   u64);
	return qp;
}

static enum rdma_cqe_type cqe_get_type(union rdma_cqe *cqe)
{
	struct rdma_cqe_requester *resp_cqe = &cqe->req;

	return GET_FIELD(resp_cqe->flags, RDMA_CQE_REQUESTER_TYPE);
}

/* Return latest CQE (needs processing) */
static union rdma_cqe *get_cqe(struct qedr_cq *cq)
{
	return cq->latest_cqe;
}

/* For a fast-registration MR we need to increase the "completed" counter that
 * the FMR algorithm uses to decide whether a PBL can be freed or not.
 * This must be done whether or not the work request was signaled; that is why
 * this function is called from the condition that checks if a WC should be
 * skipped, so an unsignaled FMR operation is not missed.
 */
static inline void qedr_chk_if_fmr(struct qedr_qp *qp)
{
	if (qp->wqe_wr_id[qp->sq.cons].opcode == IB_WC_REG_MR)
		qp->wqe_wr_id[qp->sq.cons].mr->info.completed++;
}

static int process_req(struct qedr_dev *dev, struct qedr_qp *qp,
		       struct qedr_cq *cq, int num_entries,
		       struct ib_wc *wc, u16 hw_cons, enum ib_wc_status status,
		       int force)
{
	u16 cnt = 0;

	while (num_entries && qp->sq.wqe_cons != hw_cons) {
		if (!qp->wqe_wr_id[qp->sq.cons].signaled && !force) {
			qedr_chk_if_fmr(qp);
			/* skip WC */
			goto next_cqe;
		}

		/* fill WC */
		wc->status = status;
		wc->vendor_err = 0;
		wc->wc_flags = 0;
		wc->src_qp = qp->id;
		wc->qp = &qp->ibqp;

		wc->wr_id = qp->wqe_wr_id[qp->sq.cons].wr_id;
		wc->opcode = qp->wqe_wr_id[qp->sq.cons].opcode;

		switch (wc->opcode) {
		case IB_WC_RDMA_WRITE:
			wc->byte_len = qp->wqe_wr_id[qp->sq.cons].bytes_len;
			break;
		case IB_WC_COMP_SWAP:
		case IB_WC_FETCH_ADD:
			wc->byte_len = 8;
			break;
		case IB_WC_REG_MR:
			qp->wqe_wr_id[qp->sq.cons].mr->info.completed++;
			break;
		case IB_WC_RDMA_READ:
		case IB_WC_SEND:
			wc->byte_len = qp->wqe_wr_id[qp->sq.cons].bytes_len;
			break;
		default:
			break;
		}

		num_entries--;
		wc++;
		cnt++;
next_cqe:
		while (qp->wqe_wr_id[qp->sq.cons].wqe_size--)
			qed_chain_consume(&qp->sq.pbl);
		qedr_inc_sw_cons(&qp->sq);
	}

	return cnt;
}

static int qedr_poll_cq_req(struct qedr_dev *dev,
			    struct qedr_qp *qp, struct qedr_cq *cq,
			    int num_entries, struct ib_wc *wc,
			    struct rdma_cqe_requester *req)
{
	int cnt = 0;

	switch (req->status) {
	case
static int qedr_poll_cq_req(struct qedr_dev *dev,
			    struct qedr_qp *qp, struct qedr_cq *cq,
			    int num_entries, struct ib_wc *wc,
			    struct rdma_cqe_requester *req)
{
	int cnt = 0;

	switch (req->status) {
	case RDMA_CQE_REQ_STS_OK:
		cnt = process_req(dev, qp, cq, num_entries, wc, req->sq_cons,
				  IB_WC_SUCCESS, 0);
		break;
	case RDMA_CQE_REQ_STS_WORK_REQUEST_FLUSHED_ERR:
		if (qp->state != QED_ROCE_QP_STATE_ERR)
			DP_DEBUG(dev, QEDR_MSG_CQ,
				 "Error: POLL CQ with RDMA_CQE_REQ_STS_WORK_REQUEST_FLUSHED_ERR. CQ icid=0x%x, QP icid=0x%x\n",
				 cq->icid, qp->icid);
		cnt = process_req(dev, qp, cq, num_entries, wc, req->sq_cons,
				  IB_WC_WR_FLUSH_ERR, 1);
		break;
	default:
		/* process all WQEs before the consumer */
		qp->state = QED_ROCE_QP_STATE_ERR;
		cnt = process_req(dev, qp, cq, num_entries, wc,
				  req->sq_cons - 1, IB_WC_SUCCESS, 0);
		wc += cnt;
		/* if we have extra WC fill it with actual error info */
		if (cnt < num_entries) {
			enum ib_wc_status wc_status;

			switch (req->status) {
			case RDMA_CQE_REQ_STS_BAD_RESPONSE_ERR:
				DP_ERR(dev,
				       "Error: POLL CQ with RDMA_CQE_REQ_STS_BAD_RESPONSE_ERR. CQ icid=0x%x, QP icid=0x%x\n",
				       cq->icid, qp->icid);
				wc_status = IB_WC_BAD_RESP_ERR;
				break;
			case RDMA_CQE_REQ_STS_LOCAL_LENGTH_ERR:
				DP_ERR(dev,
				       "Error: POLL CQ with RDMA_CQE_REQ_STS_LOCAL_LENGTH_ERR. CQ icid=0x%x, QP icid=0x%x\n",
				       cq->icid, qp->icid);
				wc_status = IB_WC_LOC_LEN_ERR;
				break;
			case RDMA_CQE_REQ_STS_LOCAL_QP_OPERATION_ERR:
				DP_ERR(dev,
				       "Error: POLL CQ with RDMA_CQE_REQ_STS_LOCAL_QP_OPERATION_ERR. CQ icid=0x%x, QP icid=0x%x\n",
				       cq->icid, qp->icid);
				wc_status = IB_WC_LOC_QP_OP_ERR;
				break;
			case RDMA_CQE_REQ_STS_LOCAL_PROTECTION_ERR:
				DP_ERR(dev,
				       "Error: POLL CQ with RDMA_CQE_REQ_STS_LOCAL_PROTECTION_ERR. CQ icid=0x%x, QP icid=0x%x\n",
				       cq->icid, qp->icid);
				wc_status = IB_WC_LOC_PROT_ERR;
				break;
			case RDMA_CQE_REQ_STS_MEMORY_MGT_OPERATION_ERR:
				DP_ERR(dev,
				       "Error: POLL CQ with RDMA_CQE_REQ_STS_MEMORY_MGT_OPERATION_ERR. CQ icid=0x%x, QP icid=0x%x\n",
				       cq->icid, qp->icid);
				wc_status = IB_WC_MW_BIND_ERR;
				break;
			case RDMA_CQE_REQ_STS_REMOTE_INVALID_REQUEST_ERR:
				DP_ERR(dev,
				       "Error: POLL CQ with RDMA_CQE_REQ_STS_REMOTE_INVALID_REQUEST_ERR. CQ icid=0x%x, QP icid=0x%x\n",
				       cq->icid, qp->icid);
				wc_status = IB_WC_REM_INV_REQ_ERR;
				break;
			case RDMA_CQE_REQ_STS_REMOTE_ACCESS_ERR:
				DP_ERR(dev,
				       "Error: POLL CQ with RDMA_CQE_REQ_STS_REMOTE_ACCESS_ERR. CQ icid=0x%x, QP icid=0x%x\n",
				       cq->icid, qp->icid);
				wc_status = IB_WC_REM_ACCESS_ERR;
				break;
			case RDMA_CQE_REQ_STS_REMOTE_OPERATION_ERR:
				DP_ERR(dev,
				       "Error: POLL CQ with RDMA_CQE_REQ_STS_REMOTE_OPERATION_ERR. CQ icid=0x%x, QP icid=0x%x\n",
				       cq->icid, qp->icid);
				wc_status = IB_WC_REM_OP_ERR;
				break;
			case RDMA_CQE_REQ_STS_RNR_NAK_RETRY_CNT_ERR:
				DP_ERR(dev,
				       "Error: POLL CQ with RDMA_CQE_REQ_STS_RNR_NAK_RETRY_CNT_ERR. CQ icid=0x%x, QP icid=0x%x\n",
				       cq->icid, qp->icid);
				wc_status = IB_WC_RNR_RETRY_EXC_ERR;
				break;
			case RDMA_CQE_REQ_STS_TRANSPORT_RETRY_CNT_ERR:
				DP_ERR(dev,
				       "Error: POLL CQ with RDMA_CQE_REQ_STS_TRANSPORT_RETRY_CNT_ERR. CQ icid=0x%x, QP icid=0x%x\n",
				       cq->icid, qp->icid);
				wc_status = IB_WC_RETRY_EXC_ERR;
				break;
			default:
				DP_ERR(dev,
				       "Error: POLL CQ with IB_WC_GENERAL_ERR. CQ icid=0x%x, QP icid=0x%x\n",
				       cq->icid, qp->icid);
				wc_status = IB_WC_GENERAL_ERR;
			}
			cnt += process_req(dev, qp, cq, 1, wc, req->sq_cons,
					   wc_status, 1);
		}
	}

	return cnt;
}
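
/* Translate a responder CQE hardware status into the matching IB work
 * completion status; unrecognized values map to IB_WC_GENERAL_ERR.
 */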
static inline int qedr_cqe_resp_status_to_ib(u8 status)
{
	switch (status) {
	case RDMA_CQE_RESP_STS_LOCAL_ACCESS_ERR:
		return IB_WC_LOC_ACCESS_ERR;
	case RDMA_CQE_RESP_STS_LOCAL_LENGTH_ERR:
		return IB_WC_LOC_LEN_ERR;
	case RDMA_CQE_RESP_STS_LOCAL_QP_OPERATION_ERR:
		return IB_WC_LOC_QP_OP_ERR;
	case RDMA_CQE_RESP_STS_LOCAL_PROTECTION_ERR:
		return IB_WC_LOC_PROT_ERR;
	case RDMA_CQE_RESP_STS_MEMORY_MGT_OPERATION_ERR:
		return IB_WC_MW_BIND_ERR;
	case RDMA_CQE_RESP_STS_REMOTE_INVALID_REQUEST_ERR:
		return IB_WC_REM_INV_RD_REQ_ERR;
	case RDMA_CQE_RESP_STS_OK:
		return IB_WC_SUCCESS;
	default:
		return IB_WC_GENERAL_ERR;
	}
}

static inline int qedr_set_ok_cqe_resp_wc(struct rdma_cqe_responder *resp,
					  struct ib_wc *wc)
{
	wc->status = IB_WC_SUCCESS;
	wc->byte_len = le32_to_cpu(resp->length);

	if (resp->flags & QEDR_RESP_IMM) {
		wc->ex.imm_data =
			cpu_to_be32(le32_to_cpu(resp->imm_data_or_inv_r_Key));
		wc->wc_flags |= IB_WC_WITH_IMM;

		if (resp->flags & QEDR_RESP_RDMA)
			wc->opcode = IB_WC_RECV_RDMA_WITH_IMM;

		if (resp->flags & QEDR_RESP_INV)
			return -EINVAL;

	} else if (resp->flags & QEDR_RESP_INV) {
		wc->ex.invalidate_rkey =
			le32_to_cpu(resp->imm_data_or_inv_r_Key);
		wc->wc_flags |= IB_WC_WITH_INVALIDATE;

		if (resp->flags & QEDR_RESP_RDMA)
			return -EINVAL;

	} else if (resp->flags & QEDR_RESP_RDMA) {
		return -EINVAL;
	}

	return 0;
}

static void __process_resp_one(struct qedr_dev *dev, struct qedr_qp *qp,
			       struct qedr_cq *cq, struct ib_wc *wc,
			       struct rdma_cqe_responder *resp, u64 wr_id)
{
	/* Must fill fields before qedr_set_ok_cqe_resp_wc() */
	wc->opcode = IB_WC_RECV;
	wc->wc_flags = 0;

	if (likely(resp->status == RDMA_CQE_RESP_STS_OK)) {
		if (qedr_set_ok_cqe_resp_wc(resp, wc))
			DP_ERR(dev,
			       "CQ %p (icid=%d) has invalid CQE responder flags=0x%x\n",
			       cq, cq->icid, resp->flags);

	} else {
		wc->status = qedr_cqe_resp_status_to_ib(resp->status);
		if (wc->status == IB_WC_GENERAL_ERR)
			DP_ERR(dev,
			       "CQ %p (icid=%d) contains an invalid CQE status %d\n",
			       cq, cq->icid, resp->status);
	}

	/* Fill the rest of the WC */
	wc->vendor_err = 0;
	wc->src_qp = qp->id;
	wc->qp = &qp->ibqp;
	wc->wr_id = wr_id;
}

static int process_resp_one_srq(struct qedr_dev *dev, struct qedr_qp *qp,
				struct qedr_cq *cq, struct ib_wc *wc,
				struct rdma_cqe_responder *resp)
{
	struct qedr_srq *srq = qp->srq;
	u64 wr_id;

	wr_id = HILO_GEN(le32_to_cpu(resp->srq_wr_id.hi),
			 le32_to_cpu(resp->srq_wr_id.lo), u64);

	if (resp->status == RDMA_CQE_RESP_STS_WORK_REQUEST_FLUSHED_ERR) {
		wc->status = IB_WC_WR_FLUSH_ERR;
		wc->vendor_err = 0;
		wc->wr_id = wr_id;
		wc->byte_len = 0;
		wc->src_qp = qp->id;
		wc->qp = &qp->ibqp;
	} else {
		__process_resp_one(dev, qp, cq, wc, resp, wr_id);
	}
	srq->hw_srq.wr_cons_cnt++;

	return 1;
}
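
/* Process a responder CQE for a regular (non-SRQ) RQ: fill the work
 * completion from the RQ consumer's WR id, then consume that WQE's RQ PBL
 * elements and advance the software consumer.
 */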
static int process_resp_one(struct qedr_dev *dev, struct qedr_qp *qp,
			    struct qedr_cq *cq, struct ib_wc *wc,
			    struct rdma_cqe_responder *resp)
{
	u64 wr_id = qp->rqe_wr_id[qp->rq.cons].wr_id;

	__process_resp_one(dev, qp, cq, wc, resp, wr_id);

	while (qp->rqe_wr_id[qp->rq.cons].wqe_size--)
		qed_chain_consume(&qp->rq.pbl);
	qedr_inc_sw_cons(&qp->rq);

	return 1;
}

static int process_resp_flush(struct qedr_qp *qp, struct qedr_cq *cq,
			      int num_entries, struct ib_wc *wc, u16 hw_cons)
{
	u16 cnt = 0;

	while (num_entries && qp->rq.wqe_cons != hw_cons) {
		/* fill WC */
		wc->status = IB_WC_WR_FLUSH_ERR;
		wc->vendor_err = 0;
		wc->wc_flags = 0;
		wc->src_qp = qp->id;
		wc->byte_len = 0;
		wc->wr_id = qp->rqe_wr_id[qp->rq.cons].wr_id;
		wc->qp = &qp->ibqp;
		num_entries--;
		wc++;
		cnt++;
		while (qp->rqe_wr_id[qp->rq.cons].wqe_size--)
			qed_chain_consume(&qp->rq.pbl);
		qedr_inc_sw_cons(&qp->rq);
	}

	return cnt;
}

static void try_consume_resp_cqe(struct qedr_cq *cq, struct qedr_qp *qp,
				 struct rdma_cqe_responder *resp, int *update)
{
	if (le16_to_cpu(resp->rq_cons_or_srq_id) == qp->rq.wqe_cons) {
		consume_cqe(cq);
		*update |= 1;
	}
}

static int qedr_poll_cq_resp_srq(struct qedr_dev *dev, struct qedr_qp *qp,
				 struct qedr_cq *cq, int num_entries,
				 struct ib_wc *wc,
				 struct rdma_cqe_responder *resp)
{
	int cnt;

	cnt = process_resp_one_srq(dev, qp, cq, wc, resp);
	consume_cqe(cq);

	return cnt;
}

static int qedr_poll_cq_resp(struct qedr_dev *dev, struct qedr_qp *qp,
			     struct qedr_cq *cq, int num_entries,
			     struct ib_wc *wc, struct rdma_cqe_responder *resp,
			     int *update)
{
	int cnt;

	if (resp->status == RDMA_CQE_RESP_STS_WORK_REQUEST_FLUSHED_ERR) {
		cnt = process_resp_flush(qp, cq, num_entries, wc,
					 resp->rq_cons_or_srq_id);
		try_consume_resp_cqe(cq, qp, resp, update);
	} else {
		cnt = process_resp_one(dev, qp, cq, wc, resp);
		consume_cqe(cq);
		*update |= 1;
	}

	return cnt;
}

static void try_consume_req_cqe(struct qedr_cq *cq, struct qedr_qp *qp,
				struct rdma_cqe_requester *req, int *update)
{
	if (le16_to_cpu(req->sq_cons) == qp->sq.wqe_cons) {
		consume_cqe(cq);
		*update |= 1;
	}
}
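
/* Poll entry point for regular (non-GSI) CQs: walk valid CQEs (identified by
 * the toggle bit), dispatch each one by type to the requester, responder or
 * SRQ-responder handlers, account for the chain elements that were consumed,
 * and ring the CQ consumer doorbell when at least one CQE was consumed.
 */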
int qedr_poll_cq(struct ib_cq *ibcq, int num_entries, struct ib_wc *wc)
{
	struct qedr_dev *dev = get_qedr_dev(ibcq->device);
	struct qedr_cq *cq = get_qedr_cq(ibcq);
	union rdma_cqe *cqe;
	u32 old_cons, new_cons;
	unsigned long flags;
	int update = 0;
	int done = 0;

	if (cq->destroyed) {
		DP_ERR(dev,
		       "warning: poll was invoked after destroy for cq %p (icid=%d)\n",
		       cq, cq->icid);
		return 0;
	}

	if (cq->cq_type == QEDR_CQ_TYPE_GSI)
		return qedr_gsi_poll_cq(ibcq, num_entries, wc);

	spin_lock_irqsave(&cq->cq_lock, flags);
	cqe = cq->latest_cqe;
	old_cons = qed_chain_get_cons_idx_u32(&cq->pbl);
	while (num_entries && is_valid_cqe(cq, cqe)) {
		struct qedr_qp *qp;
		int cnt = 0;

		/* prevent speculative reads of any field of CQE */
		rmb();

		qp = cqe_get_qp(cqe);
		if (!qp) {
			WARN(1, "Error: CQE QP pointer is NULL. CQE=%p\n", cqe);
			break;
		}

		wc->qp = &qp->ibqp;

		switch (cqe_get_type(cqe)) {
		case RDMA_CQE_TYPE_REQUESTER:
			cnt = qedr_poll_cq_req(dev, qp, cq, num_entries, wc,
					       &cqe->req);
			try_consume_req_cqe(cq, qp, &cqe->req, &update);
			break;
		case RDMA_CQE_TYPE_RESPONDER_RQ:
			cnt = qedr_poll_cq_resp(dev, qp, cq, num_entries, wc,
						&cqe->resp, &update);
			break;
		case RDMA_CQE_TYPE_RESPONDER_SRQ:
			cnt = qedr_poll_cq_resp_srq(dev, qp, cq, num_entries,
						    wc, &cqe->resp);
			update = 1;
			break;
		case RDMA_CQE_TYPE_INVALID:
		default:
			DP_ERR(dev, "Error: invalid CQE type = %d\n",
			       cqe_get_type(cqe));
		}
		num_entries -= cnt;
		wc += cnt;
		done += cnt;

		cqe = get_cqe(cq);
	}
	new_cons = qed_chain_get_cons_idx_u32(&cq->pbl);

	cq->cq_cons += new_cons - old_cons;

	if (update)
		/* doorbell notifies about the latest VALID entry,
		 * but the chain already points to the next INVALID one
		 */
		doorbell_cq(cq, cq->cq_cons - 1, cq->arm_flags);

	spin_unlock_irqrestore(&cq->cq_lock, flags);
	return done;
}

int qedr_process_mad(struct ib_device *ibdev, int process_mad_flags,
		     u8 port_num,
		     const struct ib_wc *in_wc,
		     const struct ib_grh *in_grh,
		     const struct ib_mad_hdr *mad_hdr,
		     size_t in_mad_size, struct ib_mad_hdr *out_mad,
		     size_t *out_mad_size, u16 *out_mad_pkey_index)
{
	struct qedr_dev *dev = get_qedr_dev(ibdev);

	DP_DEBUG(dev, QEDR_MSG_GSI,
		 "QEDR_PROCESS_MAD in_mad %x %x %x %x %x %x %x %x\n",
		 mad_hdr->attr_id, mad_hdr->base_version, mad_hdr->attr_mod,
		 mad_hdr->class_specific, mad_hdr->class_version,
		 mad_hdr->method, mad_hdr->mgmt_class, mad_hdr->status);
	return IB_MAD_RESULT_SUCCESS;
}
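
/*
 * Usage sketch (illustrative only, not part of this driver): a kernel verbs
 * consumer drains completions served by qedr_poll_cq() through the generic
 * ib_poll_cq() wrapper; 'my_cq' and handle_wc() below are hypothetical.
 *
 *	struct ib_wc wc[8];
 *	int i, n;
 *
 *	do {
 *		n = ib_poll_cq(my_cq, ARRAY_SIZE(wc), wc);
 *		for (i = 0; i < n; i++)
 *			handle_wc(&wc[i]);
 *	} while (n > 0);
 */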