xref: /openbmc/linux/drivers/infiniband/hw/qedr/verbs.c (revision e983940270f10fe8551baf0098be76ea478294a3)
1 /* QLogic qedr NIC Driver
2  * Copyright (c) 2015-2016  QLogic Corporation
3  *
4  * This software is available to you under a choice of one of two
5  * licenses.  You may choose to be licensed under the terms of the GNU
6  * General Public License (GPL) Version 2, available from the file
7  * COPYING in the main directory of this source tree, or the
8  * OpenIB.org BSD license below:
9  *
10  *     Redistribution and use in source and binary forms, with or
11  *     without modification, are permitted provided that the following
12  *     conditions are met:
13  *
14  *      - Redistributions of source code must retain the above
15  *        copyright notice, this list of conditions and the following
16  *        disclaimer.
17  *
18  *      - Redistributions in binary form must reproduce the above
19  *        copyright notice, this list of conditions and the following
20  *        disclaimer in the documentation and/or other materials
21  *        provided with the distribution.
22  *
23  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
24  * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
25  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
26  * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
27  * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
28  * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
29  * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
30  * SOFTWARE.
31  */
32 #include <linux/dma-mapping.h>
33 #include <linux/crc32.h>
34 #include <net/ip.h>
35 #include <net/ipv6.h>
36 #include <net/udp.h>
37 #include <linux/iommu.h>
38 
39 #include <rdma/ib_verbs.h>
40 #include <rdma/ib_user_verbs.h>
41 #include <rdma/iw_cm.h>
42 #include <rdma/ib_umem.h>
43 #include <rdma/ib_addr.h>
44 #include <rdma/ib_cache.h>
45 
46 #include "qedr_hsi.h"
47 #include <linux/qed/qed_if.h>
48 #include "qedr.h"
49 #include "verbs.h"
50 #include <rdma/qedr-abi.h>
51 #include "qedr_cm.h"
52 
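/* DQ_PWM_OFFSET_* doorbell offsets from the HSI are given in PWM address
 * units; DB_ADDR_SHIFT converts them to the byte offset used when
 * addressing the doorbell BAR.
 */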
53 #define DB_ADDR_SHIFT(addr)		((addr) << DB_PWM_ADDR_OFFSET_SHIFT)
54 
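/* RoCE exposes a single default P_Key; any in-range index simply returns
 * QEDR_ROCE_PKEY_DEFAULT.
 */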
55 int qedr_query_pkey(struct ib_device *ibdev, u8 port, u16 index, u16 *pkey)
56 {
57 	if (index >= QEDR_ROCE_PKEY_TABLE_LEN)
58 		return -EINVAL;
59 
60 	*pkey = QEDR_ROCE_PKEY_DEFAULT;
61 	return 0;
62 }
63 
64 int qedr_query_gid(struct ib_device *ibdev, u8 port, int index,
65 		   union ib_gid *sgid)
66 {
67 	struct qedr_dev *dev = get_qedr_dev(ibdev);
68 	int rc = 0;
69 
70 	if (!rdma_cap_roce_gid_table(ibdev, port))
71 		return -ENODEV;
72 
73 	rc = ib_get_cached_gid(ibdev, port, index, sgid, NULL);
74 	if (rc == -EAGAIN) {
75 		memcpy(sgid, &zgid, sizeof(*sgid));
76 		return 0;
77 	}
78 
79 	DP_DEBUG(dev, QEDR_MSG_INIT, "query gid: index=%d %llx:%llx\n", index,
80 		 sgid->global.interface_id, sgid->global.subnet_prefix);
81 
82 	return rc;
83 }
84 
85 int qedr_add_gid(struct ib_device *device, u8 port_num,
86 		 unsigned int index, const union ib_gid *gid,
87 		 const struct ib_gid_attr *attr, void **context)
88 {
89 	if (!rdma_cap_roce_gid_table(device, port_num))
90 		return -EINVAL;
91 
92 	if (port_num > QEDR_MAX_PORT)
93 		return -EINVAL;
94 
95 	if (!context)
96 		return -EINVAL;
97 
98 	return 0;
99 }
100 
101 int qedr_del_gid(struct ib_device *device, u8 port_num,
102 		 unsigned int index, void **context)
103 {
104 	if (!rdma_cap_roce_gid_table(device, port_num))
105 		return -EINVAL;
106 
107 	if (port_num > QEDR_MAX_PORT)
108 		return -EINVAL;
109 
110 	if (!context)
111 		return -EINVAL;
112 
113 	return 0;
114 }
115 
116 int qedr_query_device(struct ib_device *ibdev,
117 		      struct ib_device_attr *attr, struct ib_udata *udata)
118 {
119 	struct qedr_dev *dev = get_qedr_dev(ibdev);
120 	struct qedr_device_attr *qattr = &dev->attr;
121 
122 	if (!dev->rdma_ctx) {
123 		DP_ERR(dev,
124 		       "qedr_query_device called with invalid params rdma_ctx=%p\n",
125 		       dev->rdma_ctx);
126 		return -EINVAL;
127 	}
128 
129 	memset(attr, 0, sizeof(*attr));
130 
131 	attr->fw_ver = qattr->fw_ver;
132 	attr->sys_image_guid = qattr->sys_image_guid;
133 	attr->max_mr_size = qattr->max_mr_size;
134 	attr->page_size_cap = qattr->page_size_caps;
135 	attr->vendor_id = qattr->vendor_id;
136 	attr->vendor_part_id = qattr->vendor_part_id;
137 	attr->hw_ver = qattr->hw_ver;
138 	attr->max_qp = qattr->max_qp;
139 	attr->max_qp_wr = max_t(u32, qattr->max_sqe, qattr->max_rqe);
140 	attr->device_cap_flags = IB_DEVICE_CURR_QP_STATE_MOD |
141 	    IB_DEVICE_RC_RNR_NAK_GEN |
142 	    IB_DEVICE_LOCAL_DMA_LKEY | IB_DEVICE_MEM_MGT_EXTENSIONS;
143 
144 	attr->max_sge = qattr->max_sge;
145 	attr->max_sge_rd = qattr->max_sge;
146 	attr->max_cq = qattr->max_cq;
147 	attr->max_cqe = qattr->max_cqe;
148 	attr->max_mr = qattr->max_mr;
149 	attr->max_mw = qattr->max_mw;
150 	attr->max_pd = qattr->max_pd;
151 	attr->atomic_cap = dev->atomic_cap;
152 	attr->max_fmr = qattr->max_fmr;
153 	attr->max_map_per_fmr = 16;
154 	attr->max_qp_init_rd_atom =
155 	    1 << (fls(qattr->max_qp_req_rd_atomic_resc) - 1);
156 	attr->max_qp_rd_atom =
157 	    min(1 << (fls(qattr->max_qp_resp_rd_atomic_resc) - 1),
158 		attr->max_qp_init_rd_atom);
159 
160 	attr->max_srq = qattr->max_srq;
161 	attr->max_srq_sge = qattr->max_srq_sge;
162 	attr->max_srq_wr = qattr->max_srq_wr;
163 
164 	attr->local_ca_ack_delay = qattr->dev_ack_delay;
165 	attr->max_fast_reg_page_list_len = qattr->max_mr / 8;
166 	attr->max_pkeys = QEDR_ROCE_PKEY_MAX;
167 	attr->max_ah = qattr->max_ah;
168 
169 	return 0;
170 }
171 
172 #define QEDR_SPEED_SDR		(1)
173 #define QEDR_SPEED_DDR		(2)
174 #define QEDR_SPEED_QDR		(4)
175 #define QEDR_SPEED_FDR10	(8)
176 #define QEDR_SPEED_FDR		(16)
177 #define QEDR_SPEED_EDR		(32)
178 
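/* Map the Ethernet link speed reported by qed (in Mbps) to the closest
 * InfiniBand speed/width pair, e.g. 25G maps to EDR x1 and 100G to EDR x4.
 * Unknown speeds fall back to SDR x1.
 */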
179 static inline void get_link_speed_and_width(int speed, u8 *ib_speed,
180 					    u8 *ib_width)
181 {
182 	switch (speed) {
183 	case 1000:
184 		*ib_speed = QEDR_SPEED_SDR;
185 		*ib_width = IB_WIDTH_1X;
186 		break;
187 	case 10000:
188 		*ib_speed = QEDR_SPEED_QDR;
189 		*ib_width = IB_WIDTH_1X;
190 		break;
191 
192 	case 20000:
193 		*ib_speed = QEDR_SPEED_DDR;
194 		*ib_width = IB_WIDTH_4X;
195 		break;
196 
197 	case 25000:
198 		*ib_speed = QEDR_SPEED_EDR;
199 		*ib_width = IB_WIDTH_1X;
200 		break;
201 
202 	case 40000:
203 		*ib_speed = QEDR_SPEED_QDR;
204 		*ib_width = IB_WIDTH_4X;
205 		break;
206 
207 	case 50000:
208 		*ib_speed = QEDR_SPEED_QDR;
209 		*ib_width = IB_WIDTH_4X;
210 		break;
211 
212 	case 100000:
213 		*ib_speed = QEDR_SPEED_EDR;
214 		*ib_width = IB_WIDTH_4X;
215 		break;
216 
217 	default:
218 		/* Unsupported */
219 		*ib_speed = QEDR_SPEED_SDR;
220 		*ib_width = IB_WIDTH_1X;
221 	}
222 }
223 
224 int qedr_query_port(struct ib_device *ibdev, u8 port, struct ib_port_attr *attr)
225 {
226 	struct qedr_dev *dev;
227 	struct qed_rdma_port *rdma_port;
228 
229 	dev = get_qedr_dev(ibdev);
230 	if (port > 1) {
231 		DP_ERR(dev, "invalid_port=0x%x\n", port);
232 		return -EINVAL;
233 	}
234 
235 	if (!dev->rdma_ctx) {
236 		DP_ERR(dev, "rdma_ctx is NULL\n");
237 		return -EINVAL;
238 	}
239 
240 	rdma_port = dev->ops->rdma_query_port(dev->rdma_ctx);
241 	memset(attr, 0, sizeof(*attr));
242 
243 	if (rdma_port->port_state == QED_RDMA_PORT_UP) {
244 		attr->state = IB_PORT_ACTIVE;
245 		attr->phys_state = 5;
246 	} else {
247 		attr->state = IB_PORT_DOWN;
248 		attr->phys_state = 3;
249 	}
250 	attr->max_mtu = IB_MTU_4096;
251 	attr->active_mtu = iboe_get_mtu(dev->ndev->mtu);
252 	attr->lid = 0;
253 	attr->lmc = 0;
254 	attr->sm_lid = 0;
255 	attr->sm_sl = 0;
256 	attr->port_cap_flags = IB_PORT_IP_BASED_GIDS;
257 	attr->gid_tbl_len = QEDR_MAX_SGID;
258 	attr->pkey_tbl_len = QEDR_ROCE_PKEY_TABLE_LEN;
259 	attr->bad_pkey_cntr = rdma_port->pkey_bad_counter;
260 	attr->qkey_viol_cntr = 0;
261 	get_link_speed_and_width(rdma_port->link_speed,
262 				 &attr->active_speed, &attr->active_width);
263 	attr->max_msg_sz = rdma_port->max_msg_size;
264 	attr->max_vl_num = 4;
265 
266 	return 0;
267 }
268 
269 int qedr_modify_port(struct ib_device *ibdev, u8 port, int mask,
270 		     struct ib_port_modify *props)
271 {
272 	struct qedr_dev *dev;
273 
274 	dev = get_qedr_dev(ibdev);
275 	if (port > 1) {
276 		DP_ERR(dev, "invalid_port=0x%x\n", port);
277 		return -EINVAL;
278 	}
279 
280 	return 0;
281 }
282 
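/* Record a (physical address, length) range that this user context is
 * allowed to mmap(). qedr_mmap() validates requests against this list, so
 * only ranges registered here (currently just the context's doorbell
 * window) can be mapped into user space.
 */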
283 static int qedr_add_mmap(struct qedr_ucontext *uctx, u64 phy_addr,
284 			 unsigned long len)
285 {
286 	struct qedr_mm *mm;
287 
288 	mm = kzalloc(sizeof(*mm), GFP_KERNEL);
289 	if (!mm)
290 		return -ENOMEM;
291 
292 	mm->key.phy_addr = phy_addr;
293 	/* This function might be called with a length which is not a multiple
294 	 * of PAGE_SIZE, while the mapping is PAGE_SIZE grained and the kernel
295 	 * forces this granularity by increasing the requested size if needed.
296 	 * When qedr_mmap is called, it will search the list with the updated
297 	 * length as a key. To prevent search failures, the length is rounded up
298 	 * in advance to PAGE_SIZE.
299 	 */
300 	mm->key.len = roundup(len, PAGE_SIZE);
301 	INIT_LIST_HEAD(&mm->entry);
302 
303 	mutex_lock(&uctx->mm_list_lock);
304 	list_add(&mm->entry, &uctx->mm_head);
305 	mutex_unlock(&uctx->mm_list_lock);
306 
307 	DP_DEBUG(uctx->dev, QEDR_MSG_MISC,
308 		 "added (addr=0x%llx,len=0x%lx) for ctx=%p\n",
309 		 (unsigned long long)mm->key.phy_addr,
310 		 (unsigned long)mm->key.len, uctx);
311 
312 	return 0;
313 }
314 
315 static bool qedr_search_mmap(struct qedr_ucontext *uctx, u64 phy_addr,
316 			     unsigned long len)
317 {
318 	bool found = false;
319 	struct qedr_mm *mm;
320 
321 	mutex_lock(&uctx->mm_list_lock);
322 	list_for_each_entry(mm, &uctx->mm_head, entry) {
323 		if (len != mm->key.len || phy_addr != mm->key.phy_addr)
324 			continue;
325 
326 		found = true;
327 		break;
328 	}
329 	mutex_unlock(&uctx->mm_list_lock);
330 	DP_DEBUG(uctx->dev, QEDR_MSG_MISC,
331 		 "searched for (addr=0x%llx,len=0x%lx) for ctx=%p, result=%d\n",
332 		 (unsigned long long)phy_addr, (unsigned long)len, uctx, found);
333 
334 	return found;
335 }
336 
337 struct ib_ucontext *qedr_alloc_ucontext(struct ib_device *ibdev,
338 					struct ib_udata *udata)
339 {
340 	int rc;
341 	struct qedr_ucontext *ctx;
342 	struct qedr_alloc_ucontext_resp uresp;
343 	struct qedr_dev *dev = get_qedr_dev(ibdev);
344 	struct qed_rdma_add_user_out_params oparams;
345 
346 	if (!udata)
347 		return ERR_PTR(-EFAULT);
348 
349 	ctx = kzalloc(sizeof(*ctx), GFP_KERNEL);
350 	if (!ctx)
351 		return ERR_PTR(-ENOMEM);
352 
353 	rc = dev->ops->rdma_add_user(dev->rdma_ctx, &oparams);
354 	if (rc) {
355 		DP_ERR(dev,
356 		       "failed to allocate a DPI for a new RoCE application, rc=%d. To overcome this, consider increasing the number of DPIs, increasing the doorbell BAR size, or closing unnecessary RoCE applications. To increase the number of DPIs, consult the qedr readme\n",
357 		       rc);
358 		goto err;
359 	}
360 
361 	ctx->dpi = oparams.dpi;
362 	ctx->dpi_addr = oparams.dpi_addr;
363 	ctx->dpi_phys_addr = oparams.dpi_phys_addr;
364 	ctx->dpi_size = oparams.dpi_size;
365 	INIT_LIST_HEAD(&ctx->mm_head);
366 	mutex_init(&ctx->mm_list_lock);
367 
368 	memset(&uresp, 0, sizeof(uresp));
369 
370 	uresp.db_pa = ctx->dpi_phys_addr;
371 	uresp.db_size = ctx->dpi_size;
372 	uresp.max_send_wr = dev->attr.max_sqe;
373 	uresp.max_recv_wr = dev->attr.max_rqe;
374 	uresp.max_srq_wr = dev->attr.max_srq_wr;
375 	uresp.sges_per_send_wr = QEDR_MAX_SQE_ELEMENTS_PER_SQE;
376 	uresp.sges_per_recv_wr = QEDR_MAX_RQE_ELEMENTS_PER_RQE;
377 	uresp.sges_per_srq_wr = dev->attr.max_srq_sge;
378 	uresp.max_cqes = QEDR_MAX_CQES;
379 
380 	rc = ib_copy_to_udata(udata, &uresp, sizeof(uresp));
381 	if (rc)
382 		goto err;
383 
384 	ctx->dev = dev;
385 
386 	rc = qedr_add_mmap(ctx, ctx->dpi_phys_addr, ctx->dpi_size);
387 	if (rc)
388 		goto err;
389 
390 	DP_DEBUG(dev, QEDR_MSG_INIT, "Allocating user context %p\n",
391 		 &ctx->ibucontext);
392 	return &ctx->ibucontext;
393 
394 err:
395 	kfree(ctx);
396 	return ERR_PTR(rc);
397 }
398 
399 int qedr_dealloc_ucontext(struct ib_ucontext *ibctx)
400 {
401 	struct qedr_ucontext *uctx = get_qedr_ucontext(ibctx);
402 	struct qedr_mm *mm, *tmp;
403 	int status = 0;
404 
405 	DP_DEBUG(uctx->dev, QEDR_MSG_INIT, "Deallocating user context %p\n",
406 		 uctx);
407 	uctx->dev->ops->rdma_remove_user(uctx->dev->rdma_ctx, uctx->dpi);
408 
409 	list_for_each_entry_safe(mm, tmp, &uctx->mm_head, entry) {
410 		DP_DEBUG(uctx->dev, QEDR_MSG_MISC,
411 			 "deleted (addr=0x%llx,len=0x%lx) for ctx=%p\n",
412 			 mm->key.phy_addr, mm->key.len, uctx);
413 		list_del(&mm->entry);
414 		kfree(mm);
415 	}
416 
417 	kfree(uctx);
418 	return status;
419 }
420 
421 int qedr_mmap(struct ib_ucontext *context, struct vm_area_struct *vma)
422 {
423 	struct qedr_ucontext *ucontext = get_qedr_ucontext(context);
424 	struct qedr_dev *dev = get_qedr_dev(context->device);
425 	unsigned long vm_page = vma->vm_pgoff << PAGE_SHIFT;
426 	u64 unmapped_db = dev->db_phys_addr;
427 	unsigned long len = (vma->vm_end - vma->vm_start);
428 	int rc = 0;
429 	bool found;
430 
431 	DP_DEBUG(dev, QEDR_MSG_INIT,
432 		 "qedr_mmap called vm_page=0x%lx vm_pgoff=0x%lx unmapped_db=0x%llx db_size=%x, len=%lx\n",
433 		 vm_page, vma->vm_pgoff, unmapped_db, dev->db_size, len);
434 	if (vma->vm_start & (PAGE_SIZE - 1)) {
435 		DP_ERR(dev, "Vma_start not page aligned = %ld\n",
436 		       vma->vm_start);
437 		return -EINVAL;
438 	}
439 
440 	found = qedr_search_mmap(ucontext, vm_page, len);
441 	if (!found) {
442 		DP_ERR(dev, "Vma_pgoff not found in mapped array = %ld\n",
443 		       vma->vm_pgoff);
444 		return -EINVAL;
445 	}
446 
448 
449 	if ((vm_page >= unmapped_db) && (vm_page <= (unmapped_db +
450 						     dev->db_size))) {
451 		DP_DEBUG(dev, QEDR_MSG_INIT, "Mapping doorbell bar\n");
452 		if (vma->vm_flags & VM_READ) {
453 			DP_ERR(dev, "Trying to map doorbell bar for read\n");
454 			return -EPERM;
455 		}
456 
457 		vma->vm_page_prot = pgprot_writecombine(vma->vm_page_prot);
458 
459 		rc = io_remap_pfn_range(vma, vma->vm_start, vma->vm_pgoff,
460 					PAGE_SIZE, vma->vm_page_prot);
461 	} else {
462 		DP_DEBUG(dev, QEDR_MSG_INIT, "Mapping chains\n");
463 		rc = remap_pfn_range(vma, vma->vm_start,
464 				     vma->vm_pgoff, len, vma->vm_page_prot);
465 	}
466 	DP_DEBUG(dev, QEDR_MSG_INIT, "qedr_mmap return code: %d\n", rc);
467 	return rc;
468 }
469 
470 struct ib_pd *qedr_alloc_pd(struct ib_device *ibdev,
471 			    struct ib_ucontext *context, struct ib_udata *udata)
472 {
473 	struct qedr_dev *dev = get_qedr_dev(ibdev);
474 	struct qedr_ucontext *uctx = NULL;
475 	struct qedr_alloc_pd_uresp uresp;
476 	struct qedr_pd *pd;
477 	u16 pd_id;
478 	int rc;
479 
480 	DP_DEBUG(dev, QEDR_MSG_INIT, "Function called from: %s\n",
481 		 (udata && context) ? "User Lib" : "Kernel");
482 
483 	if (!dev->rdma_ctx) {
484 		DP_ERR(dev, "invalid RDMA context\n");
485 		return ERR_PTR(-EINVAL);
486 	}
487 
488 	pd = kzalloc(sizeof(*pd), GFP_KERNEL);
489 	if (!pd)
490 		return ERR_PTR(-ENOMEM);
491 
492 	dev->ops->rdma_alloc_pd(dev->rdma_ctx, &pd_id);
493 
494 	uresp.pd_id = pd_id;
495 	pd->pd_id = pd_id;
496 
497 	if (udata && context) {
498 		rc = ib_copy_to_udata(udata, &uresp, sizeof(uresp));
499 		if (rc)
500 			DP_ERR(dev, "copy error pd_id=0x%x.\n", pd_id);
501 		uctx = get_qedr_ucontext(context);
502 		uctx->pd = pd;
503 		pd->uctx = uctx;
504 	}
505 
506 	return &pd->ibpd;
507 }
508 
509 int qedr_dealloc_pd(struct ib_pd *ibpd)
510 {
511 	struct qedr_dev *dev = get_qedr_dev(ibpd->device);
512 	struct qedr_pd *pd = get_qedr_pd(ibpd);
513 
514 	if (!pd)
515 		pr_err("Invalid PD received in dealloc_pd\n");
516 
517 	DP_DEBUG(dev, QEDR_MSG_INIT, "Deallocating PD %d\n", pd->pd_id);
518 	dev->ops->rdma_dealloc_pd(dev->rdma_ctx, pd->pd_id);
519 
520 	kfree(pd);
521 
522 	return 0;
523 }
524 
525 static void qedr_free_pbl(struct qedr_dev *dev,
526 			  struct qedr_pbl_info *pbl_info, struct qedr_pbl *pbl)
527 {
528 	struct pci_dev *pdev = dev->pdev;
529 	int i;
530 
531 	for (i = 0; i < pbl_info->num_pbls; i++) {
532 		if (!pbl[i].va)
533 			continue;
534 		dma_free_coherent(&pdev->dev, pbl_info->pbl_size,
535 				  pbl[i].va, pbl[i].pa);
536 	}
537 
538 	kfree(pbl);
539 }
540 
541 #define MIN_FW_PBL_PAGE_SIZE (4 * 1024)
542 #define MAX_FW_PBL_PAGE_SIZE (64 * 1024)
543 
544 #define NUM_PBES_ON_PAGE(_page_size) (_page_size / sizeof(u64))
545 #define MAX_PBES_ON_PAGE NUM_PBES_ON_PAGE(MAX_FW_PBL_PAGE_SIZE)
546 #define MAX_PBES_TWO_LAYER (MAX_PBES_ON_PAGE * MAX_PBES_ON_PAGE)
547 
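/* Allocate a PBL (page buffer list) table: an array of DMA-coherent pages
 * holding the physical addresses of a memory region. For a two-layer PBL,
 * the first page is filled with the physical addresses of the remaining
 * pages, which hold the actual PBEs.
 */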
548 static struct qedr_pbl *qedr_alloc_pbl_tbl(struct qedr_dev *dev,
549 					   struct qedr_pbl_info *pbl_info,
550 					   gfp_t flags)
551 {
552 	struct pci_dev *pdev = dev->pdev;
553 	struct qedr_pbl *pbl_table;
554 	dma_addr_t *pbl_main_tbl;
555 	dma_addr_t pa;
556 	void *va;
557 	int i;
558 
559 	pbl_table = kcalloc(pbl_info->num_pbls, sizeof(*pbl_table), flags);
560 	if (!pbl_table)
561 		return ERR_PTR(-ENOMEM);
562 
563 	for (i = 0; i < pbl_info->num_pbls; i++) {
564 		va = dma_alloc_coherent(&pdev->dev, pbl_info->pbl_size,
565 					&pa, flags);
566 		if (!va)
567 			goto err;
568 
569 		memset(va, 0, pbl_info->pbl_size);
570 		pbl_table[i].va = va;
571 		pbl_table[i].pa = pa;
572 	}
573 
574 	/* Two-layer PBLs: if we have more than one PBL, initialize the first
575 	 * one with physical pointers to all of the rest.
576 	 */
577 	pbl_main_tbl = (dma_addr_t *)pbl_table[0].va;
578 	for (i = 0; i < pbl_info->num_pbls - 1; i++)
579 		pbl_main_tbl[i] = pbl_table[i + 1].pa;
580 
581 	return pbl_table;
582 
583 err:
584 	for (i--; i >= 0; i--)
585 		dma_free_coherent(&pdev->dev, pbl_info->pbl_size,
586 				  pbl_table[i].va, pbl_table[i].pa);
587 
588 	qedr_free_pbl(dev, pbl_info, pbl_table);
589 
590 	return ERR_PTR(-ENOMEM);
591 }
592 
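/* Choose a PBL geometry for num_pbes page entries: a single page when
 * everything fits, otherwise a two-layer layout whose page size doubles
 * until two layers can address all of the PBEs (bounded by the
 * MAX_PBES_TWO_LAYER check).
 */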
593 static int qedr_prepare_pbl_tbl(struct qedr_dev *dev,
594 				struct qedr_pbl_info *pbl_info,
595 				u32 num_pbes, int two_layer_capable)
596 {
597 	u32 pbl_capacity;
598 	u32 pbl_size;
599 	u32 num_pbls;
600 
601 	if ((num_pbes > MAX_PBES_ON_PAGE) && two_layer_capable) {
602 		if (num_pbes > MAX_PBES_TWO_LAYER) {
603 			DP_ERR(dev, "prepare pbl table: too many pages %d\n",
604 			       num_pbes);
605 			return -EINVAL;
606 		}
607 
608 		/* calculate required pbl page size */
609 		pbl_size = MIN_FW_PBL_PAGE_SIZE;
610 		pbl_capacity = NUM_PBES_ON_PAGE(pbl_size) *
611 			       NUM_PBES_ON_PAGE(pbl_size);
612 
613 		while (pbl_capacity < num_pbes) {
614 			pbl_size *= 2;
615 			pbl_capacity = pbl_size / sizeof(u64);
616 			pbl_capacity = pbl_capacity * pbl_capacity;
617 		}
618 
619 		num_pbls = DIV_ROUND_UP(num_pbes, NUM_PBES_ON_PAGE(pbl_size));
620 		num_pbls++;	/* One for layer 0 (points to the PBLs) */
621 		pbl_info->two_layered = true;
622 	} else {
623 		/* One layered PBL */
624 		num_pbls = 1;
625 		pbl_size = max_t(u32, MIN_FW_PBL_PAGE_SIZE,
626 				 roundup_pow_of_two((num_pbes * sizeof(u64))));
627 		pbl_info->two_layered = false;
628 	}
629 
630 	pbl_info->num_pbls = num_pbls;
631 	pbl_info->pbl_size = pbl_size;
632 	pbl_info->num_pbes = num_pbes;
633 
634 	DP_DEBUG(dev, QEDR_MSG_MR,
635 		 "prepare pbl table: num_pbes=%d, num_pbls=%d, pbl_size=%d\n",
636 		 pbl_info->num_pbes, pbl_info->num_pbls, pbl_info->pbl_size);
637 
638 	return 0;
639 }
640 
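/* Walk the umem scatter-gather list and write one little-endian PBE
 * (a lo/hi physical-address pair) per page into the PBL pages, advancing
 * to the next PBL page whenever the current one fills up.
 */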
641 static void qedr_populate_pbls(struct qedr_dev *dev, struct ib_umem *umem,
642 			       struct qedr_pbl *pbl,
643 			       struct qedr_pbl_info *pbl_info)
644 {
645 	int shift, pg_cnt, pages, pbe_cnt, total_num_pbes = 0;
646 	struct qedr_pbl *pbl_tbl;
647 	struct scatterlist *sg;
648 	struct regpair *pbe;
649 	int entry;
650 	u32 addr;
651 
652 	if (!pbl_info->num_pbes)
653 		return;
654 
655 	/* If we have a two-layered PBL, the first PBL points to the rest of
656 	 * the PBLs, and the first data entry lies in the second PBL of the table.
657 	 */
658 	if (pbl_info->two_layered)
659 		pbl_tbl = &pbl[1];
660 	else
661 		pbl_tbl = pbl;
662 
663 	pbe = (struct regpair *)pbl_tbl->va;
664 	if (!pbe) {
665 		DP_ERR(dev, "cannot populate PBL due to a NULL PBE\n");
666 		return;
667 	}
668 
669 	pbe_cnt = 0;
670 
671 	shift = ilog2(umem->page_size);
672 
673 	for_each_sg(umem->sg_head.sgl, sg, umem->nmap, entry) {
674 		pages = sg_dma_len(sg) >> shift;
675 		for (pg_cnt = 0; pg_cnt < pages; pg_cnt++) {
676 			/* store the page address in pbe */
677 			pbe->lo = cpu_to_le32(sg_dma_address(sg) +
678 					      umem->page_size * pg_cnt);
679 			addr = upper_32_bits(sg_dma_address(sg) +
680 					     umem->page_size * pg_cnt);
681 			pbe->hi = cpu_to_le32(addr);
682 			pbe_cnt++;
683 			total_num_pbes++;
684 			pbe++;
685 
686 			if (total_num_pbes == pbl_info->num_pbes)
687 				return;
688 
689 			/* If the current PBL is full of PBEs, move to the
690 			 * next PBL.
691 			 */
692 			if (pbe_cnt == (pbl_info->pbl_size / sizeof(u64))) {
693 				pbl_tbl++;
694 				pbe = (struct regpair *)pbl_tbl->va;
695 				pbe_cnt = 0;
696 			}
697 		}
698 	}
699 }
700 
701 static int qedr_copy_cq_uresp(struct qedr_dev *dev,
702 			      struct qedr_cq *cq, struct ib_udata *udata)
703 {
704 	struct qedr_create_cq_uresp uresp;
705 	int rc;
706 
707 	memset(&uresp, 0, sizeof(uresp));
708 
709 	uresp.db_offset = DB_ADDR_SHIFT(DQ_PWM_OFFSET_UCM_RDMA_CQ_CONS_32BIT);
710 	uresp.icid = cq->icid;
711 
712 	rc = ib_copy_to_udata(udata, &uresp, sizeof(uresp));
713 	if (rc)
714 		DP_ERR(dev, "copy error cqid=0x%x.\n", cq->icid);
715 
716 	return rc;
717 }
718 
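/* Advance the CQ consumer. The toggle bit distinguishes HW-owned CQEs from
 * SW-owned ones; it is flipped each time the consumer passes the last
 * element of the chain.
 */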
719 static void consume_cqe(struct qedr_cq *cq)
720 {
721 	if (cq->latest_cqe == cq->toggle_cqe)
722 		cq->pbl_toggle ^= RDMA_CQE_REQUESTER_TOGGLE_BIT_MASK;
723 
724 	cq->latest_cqe = qed_chain_consume(&cq->pbl);
725 }
726 
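/* Round the requested CQE count up so that the CQ buffer, including one
 * extra driver-reserved entry that is hidden from the FW, ends up page
 * aligned.
 */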
727 static inline int qedr_align_cq_entries(int entries)
728 {
729 	u64 size, aligned_size;
730 
731 	/* We allocate an extra entry that we don't report to the FW. */
732 	size = (entries + 1) * QEDR_CQE_SIZE;
733 	aligned_size = ALIGN(size, PAGE_SIZE);
734 
735 	return aligned_size / QEDR_CQE_SIZE;
736 }
737 
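/* Pin a user-space queue buffer with ib_umem_get() and build the
 * single-layer PBL (two_layer_capable is 0) that describes it to the
 * firmware.
 */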
738 static inline int qedr_init_user_queue(struct ib_ucontext *ib_ctx,
739 				       struct qedr_dev *dev,
740 				       struct qedr_userq *q,
741 				       u64 buf_addr, size_t buf_len,
742 				       int access, int dmasync)
743 {
744 	int page_cnt;
745 	int rc;
746 
747 	q->buf_addr = buf_addr;
748 	q->buf_len = buf_len;
749 	q->umem = ib_umem_get(ib_ctx, q->buf_addr, q->buf_len, access, dmasync);
750 	if (IS_ERR(q->umem)) {
751 		DP_ERR(dev, "create user queue: failed ib_umem_get, got %ld\n",
752 		       PTR_ERR(q->umem));
753 		return PTR_ERR(q->umem);
754 	}
755 
756 	page_cnt = ib_umem_page_count(q->umem);
757 	rc = qedr_prepare_pbl_tbl(dev, &q->pbl_info, page_cnt, 0);
758 	if (rc)
759 		goto err0;
760 
761 	q->pbl_tbl = qedr_alloc_pbl_tbl(dev, &q->pbl_info, GFP_KERNEL);
762 	if (IS_ERR(q->pbl_tbl)) {
763 		rc = PTR_ERR(q->pbl_tbl);
764 		goto err0;
765 	}
764 
765 	qedr_populate_pbls(dev, q->umem, q->pbl_tbl, &q->pbl_info);
766 
767 	return 0;
768 
769 err0:
770 	ib_umem_release(q->umem);
771 
772 	return rc;
773 }
774 
775 static inline void qedr_init_cq_params(struct qedr_cq *cq,
776 				       struct qedr_ucontext *ctx,
777 				       struct qedr_dev *dev, int vector,
778 				       int chain_entries, int page_cnt,
779 				       u64 pbl_ptr,
780 				       struct qed_rdma_create_cq_in_params
781 				       *params)
782 {
783 	memset(params, 0, sizeof(*params));
784 	params->cq_handle_hi = upper_32_bits((uintptr_t)cq);
785 	params->cq_handle_lo = lower_32_bits((uintptr_t)cq);
786 	params->cnq_id = vector;
787 	params->cq_size = chain_entries - 1;
788 	params->dpi = (ctx) ? ctx->dpi : dev->dpi;
789 	params->pbl_num_pages = page_cnt;
790 	params->pbl_ptr = pbl_ptr;
791 	params->pbl_two_level = 0;
792 }
793 
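/* Ring the CQ doorbell: a single 64-bit write carries both the new
 * consumer index and the aggregation flags.
 */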
794 static void doorbell_cq(struct qedr_cq *cq, u32 cons, u8 flags)
795 {
796 	/* Flush data before signalling doorbell */
797 	wmb();
798 	cq->db.data.agg_flags = flags;
799 	cq->db.data.value = cpu_to_le32(cons);
800 	writeq(cq->db.raw, cq->db_addr);
801 
802 	/* Make sure write would stick */
803 	mmiowb();
804 }
805 
806 int qedr_arm_cq(struct ib_cq *ibcq, enum ib_cq_notify_flags flags)
807 {
808 	struct qedr_cq *cq = get_qedr_cq(ibcq);
809 	unsigned long sflags;
810 
811 	if (cq->cq_type == QEDR_CQ_TYPE_GSI)
812 		return 0;
813 
814 	spin_lock_irqsave(&cq->cq_lock, sflags);
815 
816 	cq->arm_flags = 0;
817 
818 	if (flags & IB_CQ_SOLICITED)
819 		cq->arm_flags |= DQ_UCM_ROCE_CQ_ARM_SE_CF_CMD;
820 
821 	if (flags & IB_CQ_NEXT_COMP)
822 		cq->arm_flags |= DQ_UCM_ROCE_CQ_ARM_CF_CMD;
823 
824 	doorbell_cq(cq, cq->cq_cons - 1, cq->arm_flags);
825 
826 	spin_unlock_irqrestore(&cq->cq_lock, sflags);
827 
828 	return 0;
829 }
830 
831 struct ib_cq *qedr_create_cq(struct ib_device *ibdev,
832 			     const struct ib_cq_init_attr *attr,
833 			     struct ib_ucontext *ib_ctx, struct ib_udata *udata)
834 {
835 	struct qedr_ucontext *ctx = get_qedr_ucontext(ib_ctx);
836 	struct qed_rdma_destroy_cq_out_params destroy_oparams;
837 	struct qed_rdma_destroy_cq_in_params destroy_iparams;
838 	struct qedr_dev *dev = get_qedr_dev(ibdev);
839 	struct qed_rdma_create_cq_in_params params;
840 	struct qedr_create_cq_ureq ureq;
841 	int vector = attr->comp_vector;
842 	int entries = attr->cqe;
843 	struct qedr_cq *cq;
844 	int chain_entries;
845 	int page_cnt;
846 	u64 pbl_ptr;
847 	u16 icid;
848 	int rc;
849 
850 	DP_DEBUG(dev, QEDR_MSG_INIT,
851 		 "create_cq: called from %s. entries=%d, vector=%d\n",
852 		 udata ? "User Lib" : "Kernel", entries, vector);
853 
854 	if (entries > QEDR_MAX_CQES) {
855 		DP_ERR(dev,
856 		       "create cq: the number of entries %d is too high. Must be equal to or below %d.\n",
857 		       entries, QEDR_MAX_CQES);
858 		return ERR_PTR(-EINVAL);
859 	}
860 
861 	chain_entries = qedr_align_cq_entries(entries);
862 	chain_entries = min_t(int, chain_entries, QEDR_MAX_CQES);
863 
864 	cq = kzalloc(sizeof(*cq), GFP_KERNEL);
865 	if (!cq)
866 		return ERR_PTR(-ENOMEM);
867 
868 	if (udata) {
869 		memset(&ureq, 0, sizeof(ureq));
870 		if (ib_copy_from_udata(&ureq, udata, sizeof(ureq))) {
871 			DP_ERR(dev,
872 			       "create cq: problem copying data from user space\n");
873 			goto err0;
874 		}
875 
876 		if (!ureq.len) {
877 			DP_ERR(dev,
878 			       "create cq: cannot create a cq with 0 entries\n");
879 			goto err0;
880 		}
881 
882 		cq->cq_type = QEDR_CQ_TYPE_USER;
883 
884 		rc = qedr_init_user_queue(ib_ctx, dev, &cq->q, ureq.addr,
885 					  ureq.len, IB_ACCESS_LOCAL_WRITE, 1);
886 		if (rc)
887 			goto err0;
888 
889 		pbl_ptr = cq->q.pbl_tbl->pa;
890 		page_cnt = cq->q.pbl_info.num_pbes;
891 	} else {
892 		cq->cq_type = QEDR_CQ_TYPE_KERNEL;
893 
894 		rc = dev->ops->common->chain_alloc(dev->cdev,
895 						   QED_CHAIN_USE_TO_CONSUME,
896 						   QED_CHAIN_MODE_PBL,
897 						   QED_CHAIN_CNT_TYPE_U32,
898 						   chain_entries,
899 						   sizeof(union rdma_cqe),
900 						   &cq->pbl);
901 		if (rc)
902 			goto err1;
903 
904 		page_cnt = qed_chain_get_page_cnt(&cq->pbl);
905 		pbl_ptr = qed_chain_get_pbl_phys(&cq->pbl);
906 	}
907 
908 	qedr_init_cq_params(cq, ctx, dev, vector, chain_entries, page_cnt,
909 			    pbl_ptr, &params);
910 
911 	rc = dev->ops->rdma_create_cq(dev->rdma_ctx, &params, &icid);
912 	if (rc)
913 		goto err2;
914 
915 	cq->icid = icid;
916 	cq->sig = QEDR_CQ_MAGIC_NUMBER;
917 	spin_lock_init(&cq->cq_lock);
918 
919 	if (ib_ctx) {
920 		rc = qedr_copy_cq_uresp(dev, cq, udata);
921 		if (rc)
922 			goto err3;
923 	} else {
924 		/* Generate doorbell address. */
925 		cq->db_addr = dev->db_addr +
926 		    DB_ADDR_SHIFT(DQ_PWM_OFFSET_UCM_RDMA_CQ_CONS_32BIT);
927 		cq->db.data.icid = cq->icid;
928 		cq->db.data.params = DB_AGG_CMD_SET <<
929 		    RDMA_PWM_VAL32_DATA_AGG_CMD_SHIFT;
930 
931 		/* Point to the very last element; when we pass it, the toggle flips */
932 		cq->toggle_cqe = qed_chain_get_last_elem(&cq->pbl);
933 		cq->pbl_toggle = RDMA_CQE_REQUESTER_TOGGLE_BIT_MASK;
934 		cq->latest_cqe = NULL;
935 		consume_cqe(cq);
936 		cq->cq_cons = qed_chain_get_cons_idx_u32(&cq->pbl);
937 	}
938 
939 	DP_DEBUG(dev, QEDR_MSG_CQ,
940 		 "create cq: icid=0x%0x, addr=%p, size(entries)=0x%0x\n",
941 		 cq->icid, cq, params.cq_size);
942 
943 	return &cq->ibcq;
944 
945 err3:
946 	destroy_iparams.icid = cq->icid;
947 	dev->ops->rdma_destroy_cq(dev->rdma_ctx, &destroy_iparams,
948 				  &destroy_oparams);
949 err2:
950 	if (udata)
951 		qedr_free_pbl(dev, &cq->q.pbl_info, cq->q.pbl_tbl);
952 	else
953 		dev->ops->common->chain_free(dev->cdev, &cq->pbl);
954 err1:
955 	if (udata)
956 		ib_umem_release(cq->q.umem);
957 err0:
958 	kfree(cq);
959 	return ERR_PTR(-EINVAL);
960 }
961 
962 int qedr_resize_cq(struct ib_cq *ibcq, int new_cnt, struct ib_udata *udata)
963 {
964 	struct qedr_dev *dev = get_qedr_dev(ibcq->device);
965 	struct qedr_cq *cq = get_qedr_cq(ibcq);
966 
967 	DP_ERR(dev, "cq %p RESIZE NOT SUPPORTED\n", cq);
968 
969 	return 0;
970 }
971 
972 int qedr_destroy_cq(struct ib_cq *ibcq)
973 {
974 	struct qedr_dev *dev = get_qedr_dev(ibcq->device);
975 	struct qed_rdma_destroy_cq_out_params oparams;
976 	struct qed_rdma_destroy_cq_in_params iparams;
977 	struct qedr_cq *cq = get_qedr_cq(ibcq);
978 
979 	DP_DEBUG(dev, QEDR_MSG_CQ, "destroy cq: cq_id %d\n", cq->icid);
980 
981 	/* GSI CQs are handled by the driver, so they don't exist in the FW */
982 	if (cq->cq_type != QEDR_CQ_TYPE_GSI) {
983 		iparams.icid = cq->icid;
984 		dev->ops->rdma_destroy_cq(dev->rdma_ctx, &iparams, &oparams);
985 		dev->ops->common->chain_free(dev->cdev, &cq->pbl);
986 	}
987 
988 	if (ibcq->uobject && ibcq->uobject->context) {
989 		qedr_free_pbl(dev, &cq->q.pbl_info, cq->q.pbl_tbl);
990 		ib_umem_release(cq->q.umem);
991 	}
992 
993 	kfree(cq);
994 
995 	return 0;
996 }
997 
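/* Resolve the SGID entry referenced by the AH attributes into the qed
 * modify-QP parameters: the VLAN, the RoCE mode (v1, v2/IPv4 or v2/IPv6)
 * and the source/destination GIDs, converted to host byte order.
 */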
998 static inline int get_gid_info_from_table(struct ib_qp *ibqp,
999 					  struct ib_qp_attr *attr,
1000 					  int attr_mask,
1001 					  struct qed_rdma_modify_qp_in_params
1002 					  *qp_params)
1003 {
1004 	enum rdma_network_type nw_type;
1005 	struct ib_gid_attr gid_attr;
1006 	union ib_gid gid;
1007 	u32 ipv4_addr;
1008 	int rc = 0;
1009 	int i;
1010 
1011 	rc = ib_get_cached_gid(ibqp->device, attr->ah_attr.port_num,
1012 			       attr->ah_attr.grh.sgid_index, &gid, &gid_attr);
1013 	if (rc)
1014 		return rc;
1015 
1016 	if (!memcmp(&gid, &zgid, sizeof(gid)))
1017 		return -ENOENT;
1018 
1019 	if (gid_attr.ndev) {
1020 		qp_params->vlan_id = rdma_vlan_dev_vlan_id(gid_attr.ndev);
1021 
1022 		dev_put(gid_attr.ndev);
1023 		nw_type = ib_gid_to_network_type(gid_attr.gid_type, &gid);
1024 		switch (nw_type) {
1025 		case RDMA_NETWORK_IPV6:
1026 			memcpy(&qp_params->sgid.bytes[0], &gid.raw[0],
1027 			       sizeof(qp_params->sgid));
1028 			memcpy(&qp_params->dgid.bytes[0],
1029 			       &attr->ah_attr.grh.dgid,
1030 			       sizeof(qp_params->dgid));
1031 			qp_params->roce_mode = ROCE_V2_IPV6;
1032 			SET_FIELD(qp_params->modify_flags,
1033 				  QED_ROCE_MODIFY_QP_VALID_ROCE_MODE, 1);
1034 			break;
1035 		case RDMA_NETWORK_IB:
1036 			memcpy(&qp_params->sgid.bytes[0], &gid.raw[0],
1037 			       sizeof(qp_params->sgid));
1038 			memcpy(&qp_params->dgid.bytes[0],
1039 			       &attr->ah_attr.grh.dgid,
1040 			       sizeof(qp_params->dgid));
1041 			qp_params->roce_mode = ROCE_V1;
1042 			break;
1043 		case RDMA_NETWORK_IPV4:
1044 			memset(&qp_params->sgid, 0, sizeof(qp_params->sgid));
1045 			memset(&qp_params->dgid, 0, sizeof(qp_params->dgid));
1046 			ipv4_addr = qedr_get_ipv4_from_gid(gid.raw);
1047 			qp_params->sgid.ipv4_addr = ipv4_addr;
1048 			ipv4_addr =
1049 			    qedr_get_ipv4_from_gid(attr->ah_attr.grh.dgid.raw);
1050 			qp_params->dgid.ipv4_addr = ipv4_addr;
1051 			SET_FIELD(qp_params->modify_flags,
1052 				  QED_ROCE_MODIFY_QP_VALID_ROCE_MODE, 1);
1053 			qp_params->roce_mode = ROCE_V2_IPV4;
1054 			break;
1055 		}
1056 	}
1057 
1058 	for (i = 0; i < 4; i++) {
1059 		qp_params->sgid.dwords[i] = ntohl(qp_params->sgid.dwords[i]);
1060 		qp_params->dgid.dwords[i] = ntohl(qp_params->dgid.dwords[i]);
1061 	}
1062 
1063 	if (qp_params->vlan_id >= VLAN_CFI_MASK)
1064 		qp_params->vlan_id = 0;
1065 
1066 	return 0;
1067 }
1068 
1069 static void qedr_cleanup_user_sq(struct qedr_dev *dev, struct qedr_qp *qp)
1070 {
1071 	qedr_free_pbl(dev, &qp->usq.pbl_info, qp->usq.pbl_tbl);
1072 	ib_umem_release(qp->usq.umem);
1073 }
1074 
1075 static void qedr_cleanup_user_rq(struct qedr_dev *dev, struct qedr_qp *qp)
1076 {
1077 	qedr_free_pbl(dev, &qp->urq.pbl_info, qp->urq.pbl_tbl);
1078 	ib_umem_release(qp->urq.umem);
1079 }
1080 
1081 static void qedr_cleanup_kernel_sq(struct qedr_dev *dev, struct qedr_qp *qp)
1082 {
1083 	dev->ops->common->chain_free(dev->cdev, &qp->sq.pbl);
1084 	kfree(qp->wqe_wr_id);
1085 }
1086 
1087 static void qedr_cleanup_kernel_rq(struct qedr_dev *dev, struct qedr_qp *qp)
1088 {
1089 	dev->ops->common->chain_free(dev->cdev, &qp->rq.pbl);
1090 	kfree(qp->rqe_wr_id);
1091 }
1092 
1093 static int qedr_check_qp_attrs(struct ib_pd *ibpd, struct qedr_dev *dev,
1094 			       struct ib_qp_init_attr *attrs)
1095 {
1096 	struct qedr_device_attr *qattr = &dev->attr;
1097 
1098 	/* QP0... attrs->qp_type == IB_QPT_GSI */
1099 	if (attrs->qp_type != IB_QPT_RC && attrs->qp_type != IB_QPT_GSI) {
1100 		DP_DEBUG(dev, QEDR_MSG_QP,
1101 			 "create qp: unsupported qp type=0x%x requested\n",
1102 			 attrs->qp_type);
1103 		return -EINVAL;
1104 	}
1105 
1106 	if (attrs->cap.max_send_wr > qattr->max_sqe) {
1107 		DP_ERR(dev,
1108 		       "create qp: cannot create a SQ with %d elements (max_send_wr=0x%x)\n",
1109 		       attrs->cap.max_send_wr, qattr->max_sqe);
1110 		return -EINVAL;
1111 	}
1112 
1113 	if (attrs->cap.max_inline_data > qattr->max_inline) {
1114 		DP_ERR(dev,
1115 		       "create qp: unsupported inline data size=0x%x requested (max_inline=0x%x)\n",
1116 		       attrs->cap.max_inline_data, qattr->max_inline);
1117 		return -EINVAL;
1118 	}
1119 
1120 	if (attrs->cap.max_send_sge > qattr->max_sge) {
1121 		DP_ERR(dev,
1122 		       "create qp: unsupported send_sge=0x%x requested (max_send_sge=0x%x)\n",
1123 		       attrs->cap.max_send_sge, qattr->max_sge);
1124 		return -EINVAL;
1125 	}
1126 
1127 	if (attrs->cap.max_recv_sge > qattr->max_sge) {
1128 		DP_ERR(dev,
1129 		       "create qp: unsupported recv_sge=0x%x requested (max_recv_sge=0x%x)\n",
1130 		       attrs->cap.max_recv_sge, qattr->max_sge);
1131 		return -EINVAL;
1132 	}
1133 
1134 	/* Unprivileged user space cannot create special QP */
1135 	if (ibpd->uobject && attrs->qp_type == IB_QPT_GSI) {
1136 		DP_ERR(dev,
1137 		       "create qp: userspace can't create special QPs of type=0x%x\n",
1138 		       attrs->qp_type);
1139 		return -EINVAL;
1140 	}
1141 
1142 	return 0;
1143 }
1144 
1145 static void qedr_copy_rq_uresp(struct qedr_create_qp_uresp *uresp,
1146 			       struct qedr_qp *qp)
1147 {
1148 	uresp->rq_db_offset = DB_ADDR_SHIFT(DQ_PWM_OFFSET_TCM_ROCE_RQ_PROD);
1149 	uresp->rq_icid = qp->icid;
1150 }
1151 
1152 static void qedr_copy_sq_uresp(struct qedr_create_qp_uresp *uresp,
1153 			       struct qedr_qp *qp)
1154 {
1155 	uresp->sq_db_offset = DB_ADDR_SHIFT(DQ_PWM_OFFSET_XCM_RDMA_SQ_PROD);
1156 	uresp->sq_icid = qp->icid + 1;
1157 }
1158 
1159 static int qedr_copy_qp_uresp(struct qedr_dev *dev,
1160 			      struct qedr_qp *qp, struct ib_udata *udata)
1161 {
1162 	struct qedr_create_qp_uresp uresp;
1163 	int rc;
1164 
1165 	memset(&uresp, 0, sizeof(uresp));
1166 	qedr_copy_sq_uresp(&uresp, qp);
1167 	qedr_copy_rq_uresp(&uresp, qp);
1168 
1169 	uresp.atomic_supported = dev->atomic_cap != IB_ATOMIC_NONE;
1170 	uresp.qp_id = qp->qp_id;
1171 
1172 	rc = ib_copy_to_udata(udata, &uresp, sizeof(uresp));
1173 	if (rc)
1174 		DP_ERR(dev,
1175 		       "create qp: failed a copy to user space with qp icid=0x%x.\n",
1176 		       qp->icid);
1177 
1178 	return rc;
1179 }
1180 
1181 static void qedr_set_qp_init_params(struct qedr_dev *dev,
1182 				    struct qedr_qp *qp,
1183 				    struct qedr_pd *pd,
1184 				    struct ib_qp_init_attr *attrs)
1185 {
1186 	qp->pd = pd;
1187 
1188 	spin_lock_init(&qp->q_lock);
1189 
1190 	qp->qp_type = attrs->qp_type;
1191 	qp->max_inline_data = attrs->cap.max_inline_data;
1192 	qp->sq.max_sges = attrs->cap.max_send_sge;
1193 	qp->state = QED_ROCE_QP_STATE_RESET;
1194 	qp->signaled = (attrs->sq_sig_type == IB_SIGNAL_ALL_WR) ? true : false;
1195 	qp->sq_cq = get_qedr_cq(attrs->send_cq);
1196 	qp->rq_cq = get_qedr_cq(attrs->recv_cq);
1197 	qp->dev = dev;
1198 
1199 	DP_DEBUG(dev, QEDR_MSG_QP,
1200 		 "QP params:\tpd = %d, qp_type = %d, max_inline_data = %d, state = %d, signaled = %d, use_srq=%d\n",
1201 		 pd->pd_id, qp->qp_type, qp->max_inline_data,
1202 		 qp->state, qp->signaled, (attrs->srq) ? 1 : 0);
1203 	DP_DEBUG(dev, QEDR_MSG_QP,
1204 		 "SQ params:\tsq_max_sges = %d, sq_cq_id = %d\n",
1205 		 qp->sq.max_sges, qp->sq_cq->icid);
1206 	qp->rq.max_sges = attrs->cap.max_recv_sge;
1207 	DP_DEBUG(dev, QEDR_MSG_QP,
1208 		 "RQ params:\trq_max_sges = %d, rq_cq_id = %d\n",
1209 		 qp->rq.max_sges, qp->rq_cq->icid);
1210 }
1211 
1212 static inline void
1213 qedr_init_qp_user_params(struct qed_rdma_create_qp_in_params *params,
1214 			 struct qedr_create_qp_ureq *ureq)
1215 {
1216 	/* QP handle to be written in CQE */
1217 	params->qp_handle_lo = ureq->qp_handle_lo;
1218 	params->qp_handle_hi = ureq->qp_handle_hi;
1219 }
1220 
1221 static inline void
1222 qedr_init_qp_kernel_doorbell_sq(struct qedr_dev *dev, struct qedr_qp *qp)
1223 {
1224 	qp->sq.db = dev->db_addr +
1225 		    DB_ADDR_SHIFT(DQ_PWM_OFFSET_XCM_RDMA_SQ_PROD);
1226 	qp->sq.db_data.data.icid = qp->icid + 1;
1227 }
1228 
1229 static inline void
1230 qedr_init_qp_kernel_doorbell_rq(struct qedr_dev *dev, struct qedr_qp *qp)
1231 {
1232 	qp->rq.db = dev->db_addr +
1233 		    DB_ADDR_SHIFT(DQ_PWM_OFFSET_TCM_ROCE_RQ_PROD);
1234 	qp->rq.db_data.data.icid = qp->icid;
1235 }
1236 
1237 static inline int
1238 qedr_init_qp_kernel_params_rq(struct qedr_dev *dev,
1239 			      struct qedr_qp *qp, struct ib_qp_init_attr *attrs)
1240 {
1241 	/* Allocate driver internal RQ array */
1242 	qp->rqe_wr_id = kcalloc(qp->rq.max_wr, sizeof(*qp->rqe_wr_id),
1243 				GFP_KERNEL);
1244 	if (!qp->rqe_wr_id)
1245 		return -ENOMEM;
1246 
1247 	DP_DEBUG(dev, QEDR_MSG_QP, "RQ max_wr set to %d.\n", qp->rq.max_wr);
1248 
1249 	return 0;
1250 }
1251 
1252 static inline int
1253 qedr_init_qp_kernel_params_sq(struct qedr_dev *dev,
1254 			      struct qedr_qp *qp,
1255 			      struct ib_qp_init_attr *attrs,
1256 			      struct qed_rdma_create_qp_in_params *params)
1257 {
1258 	u32 temp_max_wr;
1259 
1260 	/* Allocate driver internal SQ array */
1261 	temp_max_wr = attrs->cap.max_send_wr * dev->wq_multiplier;
1262 	temp_max_wr = min_t(u32, temp_max_wr, dev->attr.max_sqe);
1263 
1264 	/* temp_max_wr <= attr->max_sqe < 2^16, so the cast is safe */
1265 	qp->sq.max_wr = (u16)temp_max_wr;
1266 	qp->wqe_wr_id = kcalloc(qp->sq.max_wr, sizeof(*qp->wqe_wr_id),
1267 				GFP_KERNEL);
1268 	if (!qp->wqe_wr_id)
1269 		return -ENOMEM;
1270 
1271 	DP_DEBUG(dev, QEDR_MSG_QP, "SQ max_wr set to %d.\n", qp->sq.max_wr);
1272 
1273 	/* QP handle to be written in CQE */
1274 	params->qp_handle_lo = lower_32_bits((uintptr_t)qp);
1275 	params->qp_handle_hi = upper_32_bits((uintptr_t)qp);
1276 
1277 	return 0;
1278 }
1279 
1280 static inline int qedr_init_qp_kernel_sq(struct qedr_dev *dev,
1281 					 struct qedr_qp *qp,
1282 					 struct ib_qp_init_attr *attrs)
1283 {
1284 	u32 n_sq_elems, n_sq_entries;
1285 	int rc;
1286 
1287 	/* A single work request may take up to QEDR_MAX_SQ_WQE_SIZE elements in
1288 	 * the ring. The ring should allow at least a single WR, even if the
1289 	 * user requested none, due to allocation issues.
1290 	 */
1291 	n_sq_entries = attrs->cap.max_send_wr;
1292 	n_sq_entries = min_t(u32, n_sq_entries, dev->attr.max_sqe);
1293 	n_sq_entries = max_t(u32, n_sq_entries, 1);
1294 	n_sq_elems = n_sq_entries * QEDR_MAX_SQE_ELEMENTS_PER_SQE;
1295 	rc = dev->ops->common->chain_alloc(dev->cdev,
1296 					   QED_CHAIN_USE_TO_PRODUCE,
1297 					   QED_CHAIN_MODE_PBL,
1298 					   QED_CHAIN_CNT_TYPE_U32,
1299 					   n_sq_elems,
1300 					   QEDR_SQE_ELEMENT_SIZE,
1301 					   &qp->sq.pbl);
1302 	if (rc) {
1303 		DP_ERR(dev, "failed to allocate QP %p SQ\n", qp);
1304 		return rc;
1305 	}
1306 
1307 	DP_DEBUG(dev, QEDR_MSG_SQ,
1308 		 "SQ Pbl base addr = %llx max_send_wr=%d max_wr=%d capacity=%d, rc=%d\n",
1309 		 qed_chain_get_pbl_phys(&qp->sq.pbl), attrs->cap.max_send_wr,
1310 		 n_sq_entries, qed_chain_get_capacity(&qp->sq.pbl), rc);
1311 	return 0;
1312 }
1313 
1314 static inline int qedr_init_qp_kernel_rq(struct qedr_dev *dev,
1315 					 struct qedr_qp *qp,
1316 					 struct ib_qp_init_attr *attrs)
1317 {
1318 	u32 n_rq_elems, n_rq_entries;
1319 	int rc;
1320 
1321 	/* A single work request may take up to QEDR_MAX_RQ_WQE_SIZE elements in
1322 	 * the ring. The ring should allow at least a single WR, even if the
1323 	 * user requested none, due to allocation issues.
1324 	 */
1325 	n_rq_entries = max_t(u32, attrs->cap.max_recv_wr, 1);
1326 	n_rq_elems = n_rq_entries * QEDR_MAX_RQE_ELEMENTS_PER_RQE;
1327 	rc = dev->ops->common->chain_alloc(dev->cdev,
1328 					   QED_CHAIN_USE_TO_CONSUME_PRODUCE,
1329 					   QED_CHAIN_MODE_PBL,
1330 					   QED_CHAIN_CNT_TYPE_U32,
1331 					   n_rq_elems,
1332 					   QEDR_RQE_ELEMENT_SIZE,
1333 					   &qp->rq.pbl);
1334 
1335 	if (rc) {
1336 		DP_ERR(dev, "failed to allocate memory for QP %p RQ\n", qp);
1337 		return -ENOMEM;
1338 	}
1339 
1340 	DP_DEBUG(dev, QEDR_MSG_RQ,
1341 		 "RQ Pbl base addr = %llx max_recv_wr=%d max_wr=%d capacity=%d, rc=%d\n",
1342 		 qed_chain_get_pbl_phys(&qp->rq.pbl), attrs->cap.max_recv_wr,
1343 		 n_rq_entries, qed_chain_get_capacity(&qp->rq.pbl), rc);
1344 
1345 	/* n_rq_entries < 2^16, so the cast is safe */
1346 	qp->rq.max_wr = (u16)n_rq_entries;
1347 
1348 	return 0;
1349 }
1350 
1351 static inline void
1352 qedr_init_qp_in_params_sq(struct qedr_dev *dev,
1353 			  struct qedr_pd *pd,
1354 			  struct qedr_qp *qp,
1355 			  struct ib_qp_init_attr *attrs,
1356 			  struct ib_udata *udata,
1357 			  struct qed_rdma_create_qp_in_params *params)
1358 {
1359 	/* QP handle to be written in an async event */
1360 	params->qp_handle_async_lo = lower_32_bits((uintptr_t)qp);
1361 	params->qp_handle_async_hi = upper_32_bits((uintptr_t)qp);
1362 
1363 	params->signal_all = (attrs->sq_sig_type == IB_SIGNAL_ALL_WR);
1364 	params->fmr_and_reserved_lkey = !udata;
1365 	params->pd = pd->pd_id;
1366 	params->dpi = pd->uctx ? pd->uctx->dpi : dev->dpi;
1367 	params->sq_cq_id = get_qedr_cq(attrs->send_cq)->icid;
1368 	params->max_sq_sges = 0;
1369 	params->stats_queue = 0;
1370 
1371 	if (udata) {
1372 		params->sq_num_pages = qp->usq.pbl_info.num_pbes;
1373 		params->sq_pbl_ptr = qp->usq.pbl_tbl->pa;
1374 	} else {
1375 		params->sq_num_pages = qed_chain_get_page_cnt(&qp->sq.pbl);
1376 		params->sq_pbl_ptr = qed_chain_get_pbl_phys(&qp->sq.pbl);
1377 	}
1378 }
1379 
1380 static inline void
1381 qedr_init_qp_in_params_rq(struct qedr_qp *qp,
1382 			  struct ib_qp_init_attr *attrs,
1383 			  struct ib_udata *udata,
1384 			  struct qed_rdma_create_qp_in_params *params)
1385 {
1386 	params->rq_cq_id = get_qedr_cq(attrs->recv_cq)->icid;
1387 	params->srq_id = 0;
1388 	params->use_srq = false;
1389 
1390 	if (udata) {
1391 		params->rq_num_pages = qp->urq.pbl_info.num_pbes;
1392 		params->rq_pbl_ptr = qp->urq.pbl_tbl->pa;
1393 	} else {
1394 		params->rq_num_pages = qed_chain_get_page_cnt(&qp->rq.pbl);
1395 		params->rq_pbl_ptr = qed_chain_get_pbl_phys(&qp->rq.pbl);
1396 	}
1397 }
1398 
1399 static inline void qedr_qp_user_print(struct qedr_dev *dev, struct qedr_qp *qp)
1400 {
1401 	DP_DEBUG(dev, QEDR_MSG_QP,
1402 		 "create qp: successfully created user QP. qp=%p, sq_addr=0x%llx, sq_len=%zd, rq_addr=0x%llx, rq_len=%zd\n",
1403 		 qp, qp->usq.buf_addr, qp->usq.buf_len, qp->urq.buf_addr,
1404 		 qp->urq.buf_len);
1405 }
1406 
1407 static inline int qedr_init_user_qp(struct ib_ucontext *ib_ctx,
1408 				    struct qedr_dev *dev,
1409 				    struct qedr_qp *qp,
1410 				    struct qedr_create_qp_ureq *ureq)
1411 {
1412 	int rc;
1413 
1414 	/* SQ - read access only (0), dma sync not required (0) */
1415 	rc = qedr_init_user_queue(ib_ctx, dev, &qp->usq, ureq->sq_addr,
1416 				  ureq->sq_len, 0, 0);
1417 	if (rc)
1418 		return rc;
1419 
1420 	/* RQ - read access only (0), dma sync not required (0) */
1421 	rc = qedr_init_user_queue(ib_ctx, dev, &qp->urq, ureq->rq_addr,
1422 				  ureq->rq_len, 0, 0);
1423 
1424 	if (rc)
1425 		qedr_cleanup_user_sq(dev, qp);
1426 	return rc;
1427 }
1428 
1429 static inline int
1430 qedr_init_kernel_qp(struct qedr_dev *dev,
1431 		    struct qedr_qp *qp,
1432 		    struct ib_qp_init_attr *attrs,
1433 		    struct qed_rdma_create_qp_in_params *params)
1434 {
1435 	int rc;
1436 
1437 	rc = qedr_init_qp_kernel_sq(dev, qp, attrs);
1438 	if (rc) {
1439 		DP_ERR(dev, "failed to init kernel QP %p SQ\n", qp);
1440 		return rc;
1441 	}
1442 
1443 	rc = qedr_init_qp_kernel_params_sq(dev, qp, attrs, params);
1444 	if (rc) {
1445 		dev->ops->common->chain_free(dev->cdev, &qp->sq.pbl);
1446 		DP_ERR(dev, "failed to init kernel QP %p SQ params\n", qp);
1447 		return rc;
1448 	}
1449 
1450 	rc = qedr_init_qp_kernel_rq(dev, qp, attrs);
1451 	if (rc) {
1452 		qedr_cleanup_kernel_sq(dev, qp);
1453 		DP_ERR(dev, "failed to init kernel QP %p RQ\n", qp);
1454 		return rc;
1455 	}
1456 
1457 	rc = qedr_init_qp_kernel_params_rq(dev, qp, attrs);
1458 	if (rc) {
1459 		DP_ERR(dev, "failed to init kernel QP %p RQ params\n", qp);
1460 		qedr_cleanup_kernel_sq(dev, qp);
1461 		dev->ops->common->chain_free(dev->cdev, &qp->rq.pbl);
1462 		return rc;
1463 	}
1464 
1465 	return rc;
1466 }
1467 
1468 struct ib_qp *qedr_create_qp(struct ib_pd *ibpd,
1469 			     struct ib_qp_init_attr *attrs,
1470 			     struct ib_udata *udata)
1471 {
1472 	struct qedr_dev *dev = get_qedr_dev(ibpd->device);
1473 	struct qed_rdma_create_qp_out_params out_params;
1474 	struct qed_rdma_create_qp_in_params in_params;
1475 	struct qedr_pd *pd = get_qedr_pd(ibpd);
1476 	struct ib_ucontext *ib_ctx = NULL;
1477 	struct qedr_ucontext *ctx = NULL;
1478 	struct qedr_create_qp_ureq ureq;
1479 	struct qedr_qp *qp;
1480 	int rc = 0;
1481 
1482 	DP_DEBUG(dev, QEDR_MSG_QP, "create qp: called from %s, pd=%p\n",
1483 		 udata ? "user library" : "kernel", pd);
1484 
1485 	rc = qedr_check_qp_attrs(ibpd, dev, attrs);
1486 	if (rc)
1487 		return ERR_PTR(rc);
1488 
1489 	if (attrs->srq)
1490 		return ERR_PTR(-EINVAL);
1491 
1492 	qp = kzalloc(sizeof(*qp), GFP_KERNEL);
1493 	if (!qp)
1494 		return ERR_PTR(-ENOMEM);
1495 
1496 	DP_DEBUG(dev, QEDR_MSG_QP,
1497 		 "create qp: sq_cq=%p, sq_icid=%d, rq_cq=%p, rq_icid=%d\n",
1498 		 get_qedr_cq(attrs->send_cq),
1499 		 get_qedr_cq(attrs->send_cq)->icid,
1500 		 get_qedr_cq(attrs->recv_cq),
1501 		 get_qedr_cq(attrs->recv_cq)->icid);
1502 
1503 	qedr_set_qp_init_params(dev, qp, pd, attrs);
1504 
1505 	if (attrs->qp_type == IB_QPT_GSI) {
1506 		if (udata) {
1507 			DP_ERR(dev,
1508 			       "create qp: unexpected udata when creating GSI QP\n");
1509 			goto err0;
1510 		}
1511 		return qedr_create_gsi_qp(dev, attrs, qp);
1512 	}
1513 
1514 	memset(&in_params, 0, sizeof(in_params));
1515 
1516 	if (udata) {
1517 		if (!(udata && ibpd->uobject && ibpd->uobject->context))
1518 			goto err0;
1519 
1520 		ib_ctx = ibpd->uobject->context;
1521 		ctx = get_qedr_ucontext(ib_ctx);
1522 
1523 		memset(&ureq, 0, sizeof(ureq));
1524 		if (ib_copy_from_udata(&ureq, udata, sizeof(ureq))) {
1525 			DP_ERR(dev,
1526 			       "create qp: problem copying data from user space\n");
1527 			goto err0;
1528 		}
1529 
1530 		rc = qedr_init_user_qp(ib_ctx, dev, qp, &ureq);
1531 		if (rc)
1532 			goto err0;
1533 
1534 		qedr_init_qp_user_params(&in_params, &ureq);
1535 	} else {
1536 		rc = qedr_init_kernel_qp(dev, qp, attrs, &in_params);
1537 		if (rc)
1538 			goto err0;
1539 	}
1540 
1541 	qedr_init_qp_in_params_sq(dev, pd, qp, attrs, udata, &in_params);
1542 	qedr_init_qp_in_params_rq(qp, attrs, udata, &in_params);
1543 
1544 	qp->qed_qp = dev->ops->rdma_create_qp(dev->rdma_ctx,
1545 					      &in_params, &out_params);
1546 
1547 	if (!qp->qed_qp)
1548 		goto err1;
1549 
1550 	qp->qp_id = out_params.qp_id;
1551 	qp->icid = out_params.icid;
1552 	qp->ibqp.qp_num = qp->qp_id;
1553 
1554 	if (udata) {
1555 		rc = qedr_copy_qp_uresp(dev, qp, udata);
1556 		if (rc)
1557 			goto err2;
1558 
1559 		qedr_qp_user_print(dev, qp);
1560 	} else {
1561 		qedr_init_qp_kernel_doorbell_sq(dev, qp);
1562 		qedr_init_qp_kernel_doorbell_rq(dev, qp);
1563 	}
1564 
1565 	DP_DEBUG(dev, QEDR_MSG_QP, "created %s space QP %p\n",
1566 		 udata ? "user" : "kernel", qp);
1567 
1568 	return &qp->ibqp;
1569 
1570 err2:
1571 	rc = dev->ops->rdma_destroy_qp(dev->rdma_ctx, qp->qed_qp);
1572 	if (rc)
1573 		DP_ERR(dev, "create qp: fatal fault. rc=%d\n", rc);
1574 err1:
1575 	if (udata) {
1576 		qedr_cleanup_user_sq(dev, qp);
1577 		qedr_cleanup_user_rq(dev, qp);
1578 	} else {
1579 		qedr_cleanup_kernel_sq(dev, qp);
1580 		qedr_cleanup_kernel_rq(dev, qp);
1581 	}
1582 
1583 err0:
1584 	kfree(qp);
1585 
1586 	return ERR_PTR(-EFAULT);
1587 }
1588 
1589 enum ib_qp_state qedr_get_ibqp_state(enum qed_roce_qp_state qp_state)
1590 {
1591 	switch (qp_state) {
1592 	case QED_ROCE_QP_STATE_RESET:
1593 		return IB_QPS_RESET;
1594 	case QED_ROCE_QP_STATE_INIT:
1595 		return IB_QPS_INIT;
1596 	case QED_ROCE_QP_STATE_RTR:
1597 		return IB_QPS_RTR;
1598 	case QED_ROCE_QP_STATE_RTS:
1599 		return IB_QPS_RTS;
1600 	case QED_ROCE_QP_STATE_SQD:
1601 		return IB_QPS_SQD;
1602 	case QED_ROCE_QP_STATE_ERR:
1603 		return IB_QPS_ERR;
1604 	case QED_ROCE_QP_STATE_SQE:
1605 		return IB_QPS_SQE;
1606 	}
1607 	return IB_QPS_ERR;
1608 }
1609 
1610 enum qed_roce_qp_state qedr_get_state_from_ibqp(enum ib_qp_state qp_state)
1611 {
1612 	switch (qp_state) {
1613 	case IB_QPS_RESET:
1614 		return QED_ROCE_QP_STATE_RESET;
1615 	case IB_QPS_INIT:
1616 		return QED_ROCE_QP_STATE_INIT;
1617 	case IB_QPS_RTR:
1618 		return QED_ROCE_QP_STATE_RTR;
1619 	case IB_QPS_RTS:
1620 		return QED_ROCE_QP_STATE_RTS;
1621 	case IB_QPS_SQD:
1622 		return QED_ROCE_QP_STATE_SQD;
1623 	case IB_QPS_ERR:
1624 		return QED_ROCE_QP_STATE_ERR;
1625 	default:
1626 		return QED_ROCE_QP_STATE_ERR;
1627 	}
1628 }
1629 
1630 static void qedr_reset_qp_hwq_info(struct qedr_qp_hwq_info *qph)
1631 {
1632 	qed_chain_reset(&qph->pbl);
1633 	qph->prod = 0;
1634 	qph->cons = 0;
1635 	qph->wqe_cons = 0;
1636 	qph->db_data.data.value = cpu_to_le16(0);
1637 }
1638 
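/* Validate a RoCE QP state transition. Note the asymmetric return values:
 * 0 for a valid change, -EINVAL for an invalid one, and 1 when the state
 * does not change at all.
 */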
1639 static int qedr_update_qp_state(struct qedr_dev *dev,
1640 				struct qedr_qp *qp,
1641 				enum qed_roce_qp_state new_state)
1642 {
1643 	int status = 0;
1644 
1645 	if (new_state == qp->state)
1646 		return 1;
1647 
1648 	switch (qp->state) {
1649 	case QED_ROCE_QP_STATE_RESET:
1650 		switch (new_state) {
1651 		case QED_ROCE_QP_STATE_INIT:
1652 			qp->prev_wqe_size = 0;
1653 			qedr_reset_qp_hwq_info(&qp->sq);
1654 			qedr_reset_qp_hwq_info(&qp->rq);
1655 			break;
1656 		default:
1657 			status = -EINVAL;
1658 			break;
1659 		}
1660 		break;
1661 	case QED_ROCE_QP_STATE_INIT:
1662 		switch (new_state) {
1663 		case QED_ROCE_QP_STATE_RTR:
1664 			/* Update doorbell (in case post_recv was
1665 			 * done before move to RTR)
1666 			 */
1667 			wmb();
1668 			writel(qp->rq.db_data.raw, qp->rq.db);
1669 			/* Make sure write takes effect */
1670 			mmiowb();
1671 			break;
1672 		case QED_ROCE_QP_STATE_ERR:
1673 			break;
1674 		default:
1675 			/* Invalid state change. */
1676 			status = -EINVAL;
1677 			break;
1678 		}
1679 		break;
1680 	case QED_ROCE_QP_STATE_RTR:
1681 		/* RTR->XXX */
1682 		switch (new_state) {
1683 		case QED_ROCE_QP_STATE_RTS:
1684 			break;
1685 		case QED_ROCE_QP_STATE_ERR:
1686 			break;
1687 		default:
1688 			/* Invalid state change. */
1689 			status = -EINVAL;
1690 			break;
1691 		}
1692 		break;
1693 	case QED_ROCE_QP_STATE_RTS:
1694 		/* RTS->XXX */
1695 		switch (new_state) {
1696 		case QED_ROCE_QP_STATE_SQD:
1697 			break;
1698 		case QED_ROCE_QP_STATE_ERR:
1699 			break;
1700 		default:
1701 			/* Invalid state change. */
1702 			status = -EINVAL;
1703 			break;
1704 		}
1705 		break;
1706 	case QED_ROCE_QP_STATE_SQD:
1707 		/* SQD->XXX */
1708 		switch (new_state) {
1709 		case QED_ROCE_QP_STATE_RTS:
1710 		case QED_ROCE_QP_STATE_ERR:
1711 			break;
1712 		default:
1713 			/* Invalid state change. */
1714 			status = -EINVAL;
1715 			break;
1716 		}
1717 		break;
1718 	case QED_ROCE_QP_STATE_ERR:
1719 		/* ERR->XXX */
1720 		switch (new_state) {
1721 		case QED_ROCE_QP_STATE_RESET:
1722 			break;
1723 		default:
1724 			status = -EINVAL;
1725 			break;
1726 		}
1727 		break;
1728 	default:
1729 		status = -EINVAL;
1730 		break;
1731 	}
1732 
1733 	return status;
1734 }
1735 
1736 int qedr_modify_qp(struct ib_qp *ibqp, struct ib_qp_attr *attr,
1737 		   int attr_mask, struct ib_udata *udata)
1738 {
1739 	struct qedr_qp *qp = get_qedr_qp(ibqp);
1740 	struct qed_rdma_modify_qp_in_params qp_params = { 0 };
1741 	struct qedr_dev *dev = get_qedr_dev(&qp->dev->ibdev);
1742 	enum ib_qp_state old_qp_state, new_qp_state;
1743 	int rc = 0;
1744 
1745 	DP_DEBUG(dev, QEDR_MSG_QP,
1746 		 "modify qp: qp %p attr_mask=0x%x, state=%d\n", qp, attr_mask,
1747 		 attr->qp_state);
1748 
1749 	old_qp_state = qedr_get_ibqp_state(qp->state);
1750 	if (attr_mask & IB_QP_STATE)
1751 		new_qp_state = attr->qp_state;
1752 	else
1753 		new_qp_state = old_qp_state;
1754 
1755 	if (!ib_modify_qp_is_ok
1756 	    (old_qp_state, new_qp_state, ibqp->qp_type, attr_mask,
1757 	     IB_LINK_LAYER_ETHERNET)) {
1758 		DP_ERR(dev,
1759 		       "modify qp: invalid attribute mask=0x%x specified for\n"
1760 		       "qpn=0x%x of type=0x%x old_qp_state=0x%x, new_qp_state=0x%x\n",
1761 		       attr_mask, qp->qp_id, ibqp->qp_type, old_qp_state,
1762 		       new_qp_state);
1763 		rc = -EINVAL;
1764 		goto err;
1765 	}
1766 
1767 	/* Translate the masks... */
1768 	if (attr_mask & IB_QP_STATE) {
1769 		SET_FIELD(qp_params.modify_flags,
1770 			  QED_RDMA_MODIFY_QP_VALID_NEW_STATE, 1);
1771 		qp_params.new_state = qedr_get_state_from_ibqp(attr->qp_state);
1772 	}
1773 
1774 	if (attr_mask & IB_QP_EN_SQD_ASYNC_NOTIFY)
1775 		qp_params.sqd_async = true;
1776 
1777 	if (attr_mask & IB_QP_PKEY_INDEX) {
1778 		SET_FIELD(qp_params.modify_flags,
1779 			  QED_ROCE_MODIFY_QP_VALID_PKEY, 1);
1780 		if (attr->pkey_index >= QEDR_ROCE_PKEY_TABLE_LEN) {
1781 			rc = -EINVAL;
1782 			goto err;
1783 		}
1784 
1785 		qp_params.pkey = QEDR_ROCE_PKEY_DEFAULT;
1786 	}
1787 
1788 	if (attr_mask & IB_QP_QKEY)
1789 		qp->qkey = attr->qkey;
1790 
1791 	if (attr_mask & IB_QP_ACCESS_FLAGS) {
1792 		SET_FIELD(qp_params.modify_flags,
1793 			  QED_RDMA_MODIFY_QP_VALID_RDMA_OPS_EN, 1);
1794 		qp_params.incoming_rdma_read_en = attr->qp_access_flags &
1795 						  IB_ACCESS_REMOTE_READ;
1796 		qp_params.incoming_rdma_write_en = attr->qp_access_flags &
1797 						   IB_ACCESS_REMOTE_WRITE;
1798 		qp_params.incoming_atomic_en = attr->qp_access_flags &
1799 					       IB_ACCESS_REMOTE_ATOMIC;
1800 	}
1801 
1802 	if (attr_mask & (IB_QP_AV | IB_QP_PATH_MTU)) {
1803 		if (attr_mask & IB_QP_PATH_MTU) {
1804 			if (attr->path_mtu < IB_MTU_256 ||
1805 			    attr->path_mtu > IB_MTU_4096) {
1806 				pr_err("error: Only MTU sizes of 256, 512, 1024, 2048 and 4096 are supported by RoCE\n");
1807 				rc = -EINVAL;
1808 				goto err;
1809 			}
1810 			qp->mtu = min(ib_mtu_enum_to_int(attr->path_mtu),
1811 				      ib_mtu_enum_to_int(iboe_get_mtu
1812 							 (dev->ndev->mtu)));
1813 		}
1814 
1815 		if (!qp->mtu) {
1816 			qp->mtu =
1817 			ib_mtu_enum_to_int(iboe_get_mtu(dev->ndev->mtu));
1818 			pr_err("Fixing zeroed MTU to qp->mtu = %d\n", qp->mtu);
1819 		}
1820 
1821 		SET_FIELD(qp_params.modify_flags,
1822 			  QED_ROCE_MODIFY_QP_VALID_ADDRESS_VECTOR, 1);
1823 
1824 		qp_params.traffic_class_tos = attr->ah_attr.grh.traffic_class;
1825 		qp_params.flow_label = attr->ah_attr.grh.flow_label;
1826 		qp_params.hop_limit_ttl = attr->ah_attr.grh.hop_limit;
1827 
1828 		qp->sgid_idx = attr->ah_attr.grh.sgid_index;
1829 
1830 		rc = get_gid_info_from_table(ibqp, attr, attr_mask, &qp_params);
1831 		if (rc) {
1832 			DP_ERR(dev,
1833 			       "modify qp: problems with GID index %d (rc=%d)\n",
1834 			       attr->ah_attr.grh.sgid_index, rc);
1835 			return rc;
1836 		}
1837 
1838 		rc = qedr_get_dmac(dev, &attr->ah_attr,
1839 				   qp_params.remote_mac_addr);
1840 		if (rc)
1841 			return rc;
1842 
1843 		qp_params.use_local_mac = true;
1844 		ether_addr_copy(qp_params.local_mac_addr, dev->ndev->dev_addr);
1845 
1846 		DP_DEBUG(dev, QEDR_MSG_QP, "dgid=%x:%x:%x:%x\n",
1847 			 qp_params.dgid.dwords[0], qp_params.dgid.dwords[1],
1848 			 qp_params.dgid.dwords[2], qp_params.dgid.dwords[3]);
1849 		DP_DEBUG(dev, QEDR_MSG_QP, "sgid=%x:%x:%x:%x\n",
1850 			 qp_params.sgid.dwords[0], qp_params.sgid.dwords[1],
1851 			 qp_params.sgid.dwords[2], qp_params.sgid.dwords[3]);
1852 		DP_DEBUG(dev, QEDR_MSG_QP, "remote_mac=[%pM]\n",
1853 			 qp_params.remote_mac_addr);
1855 
1856 		qp_params.mtu = qp->mtu;
1857 		qp_params.lb_indication = false;
1858 	}
1859 
1860 	if (!qp_params.mtu) {
1861 		/* Stay with current MTU */
1862 		if (qp->mtu)
1863 			qp_params.mtu = qp->mtu;
1864 		else
1865 			qp_params.mtu =
1866 			    ib_mtu_enum_to_int(iboe_get_mtu(dev->ndev->mtu));
1867 	}
1868 
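	/* The IB ack timeout encodes 4.096us * 2^timeout, e.g. a value of 14
	 * is roughly 67msec; the block below converts that exponent to the
	 * millisecond units the FW expects.
	 */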
1869 	if (attr_mask & IB_QP_TIMEOUT) {
1870 		SET_FIELD(qp_params.modify_flags,
1871 			  QED_ROCE_MODIFY_QP_VALID_ACK_TIMEOUT, 1);
1872 
1874 		if (attr->timeout) {
1875 			u32 temp;
1876 
1877 			temp = 4096 * (1UL << attr->timeout) / 1000 / 1000;
1878 			/* FW requires [msec] */
1879 			qp_params.ack_timeout = temp;
1880 		} else {
1881 			/* Infinite */
1882 			qp_params.ack_timeout = 0;
1883 		}
1884 	}
1885 	if (attr_mask & IB_QP_RETRY_CNT) {
1886 		SET_FIELD(qp_params.modify_flags,
1887 			  QED_ROCE_MODIFY_QP_VALID_RETRY_CNT, 1);
1888 		qp_params.retry_cnt = attr->retry_cnt;
1889 	}
1890 
1891 	if (attr_mask & IB_QP_RNR_RETRY) {
1892 		SET_FIELD(qp_params.modify_flags,
1893 			  QED_ROCE_MODIFY_QP_VALID_RNR_RETRY_CNT, 1);
1894 		qp_params.rnr_retry_cnt = attr->rnr_retry;
1895 	}
1896 
1897 	if (attr_mask & IB_QP_RQ_PSN) {
1898 		SET_FIELD(qp_params.modify_flags,
1899 			  QED_ROCE_MODIFY_QP_VALID_RQ_PSN, 1);
1900 		qp_params.rq_psn = attr->rq_psn;
1901 		qp->rq_psn = attr->rq_psn;
1902 	}
1903 
1904 	if (attr_mask & IB_QP_MAX_QP_RD_ATOMIC) {
1905 		if (attr->max_rd_atomic > dev->attr.max_qp_req_rd_atomic_resc) {
1906 			rc = -EINVAL;
1907 			DP_ERR(dev,
1908 			       "unsupported max_rd_atomic=%d, supported=%d\n",
1909 			       attr->max_rd_atomic,
1910 			       dev->attr.max_qp_req_rd_atomic_resc);
1911 			goto err;
1912 		}
1913 
1914 		SET_FIELD(qp_params.modify_flags,
1915 			  QED_RDMA_MODIFY_QP_VALID_MAX_RD_ATOMIC_REQ, 1);
1916 		qp_params.max_rd_atomic_req = attr->max_rd_atomic;
1917 	}
1918 
1919 	if (attr_mask & IB_QP_MIN_RNR_TIMER) {
1920 		SET_FIELD(qp_params.modify_flags,
1921 			  QED_ROCE_MODIFY_QP_VALID_MIN_RNR_NAK_TIMER, 1);
1922 		qp_params.min_rnr_nak_timer = attr->min_rnr_timer;
1923 	}
1924 
1925 	if (attr_mask & IB_QP_SQ_PSN) {
1926 		SET_FIELD(qp_params.modify_flags,
1927 			  QED_ROCE_MODIFY_QP_VALID_SQ_PSN, 1);
1928 		qp_params.sq_psn = attr->sq_psn;
1929 		qp->sq_psn = attr->sq_psn;
1930 	}
1931 
1932 	if (attr_mask & IB_QP_MAX_DEST_RD_ATOMIC) {
1933 		if (attr->max_dest_rd_atomic >
1934 		    dev->attr.max_qp_resp_rd_atomic_resc) {
1935 			DP_ERR(dev,
1936 			       "unsupported max_dest_rd_atomic=%d, supported=%d\n",
1937 			       attr->max_dest_rd_atomic,
1938 			       dev->attr.max_qp_resp_rd_atomic_resc);
1939 
1940 			rc = -EINVAL;
1941 			goto err;
1942 		}
1943 
1944 		SET_FIELD(qp_params.modify_flags,
1945 			  QED_RDMA_MODIFY_QP_VALID_MAX_RD_ATOMIC_RESP, 1);
1946 		qp_params.max_rd_atomic_resp = attr->max_dest_rd_atomic;
1947 	}
1948 
1949 	if (attr_mask & IB_QP_DEST_QPN) {
1950 		SET_FIELD(qp_params.modify_flags,
1951 			  QED_ROCE_MODIFY_QP_VALID_DEST_QP, 1);
1952 
1953 		qp_params.dest_qp = attr->dest_qp_num;
1954 		qp->dest_qp_num = attr->dest_qp_num;
1955 	}
1956 
1957 	if (qp->qp_type != IB_QPT_GSI)
1958 		rc = dev->ops->rdma_modify_qp(dev->rdma_ctx,
1959 					      qp->qed_qp, &qp_params);
1960 
1961 	if (attr_mask & IB_QP_STATE) {
1962 		if ((qp->qp_type != IB_QPT_GSI) && (!udata))
1963 			qedr_update_qp_state(dev, qp, qp_params.new_state);
1964 		qp->state = qp_params.new_state;
1965 	}
1966 
1967 err:
1968 	return rc;
1969 }
1970 
1971 static int qedr_to_ib_qp_acc_flags(struct qed_rdma_query_qp_out_params *params)
1972 {
1973 	int ib_qp_acc_flags = 0;
1974 
1975 	if (params->incoming_rdma_write_en)
1976 		ib_qp_acc_flags |= IB_ACCESS_REMOTE_WRITE;
1977 	if (params->incoming_rdma_read_en)
1978 		ib_qp_acc_flags |= IB_ACCESS_REMOTE_READ;
1979 	if (params->incoming_atomic_en)
1980 		ib_qp_acc_flags |= IB_ACCESS_REMOTE_ATOMIC;
1981 	ib_qp_acc_flags |= IB_ACCESS_LOCAL_WRITE;
1982 	return ib_qp_acc_flags;
1983 }
1984 
1985 int qedr_query_qp(struct ib_qp *ibqp,
1986 		  struct ib_qp_attr *qp_attr,
1987 		  int attr_mask, struct ib_qp_init_attr *qp_init_attr)
1988 {
1989 	struct qed_rdma_query_qp_out_params params;
1990 	struct qedr_qp *qp = get_qedr_qp(ibqp);
1991 	struct qedr_dev *dev = qp->dev;
1992 	int rc = 0;
1993 
1994 	memset(&params, 0, sizeof(params));
1995 
1996 	rc = dev->ops->rdma_query_qp(dev->rdma_ctx, qp->qed_qp, &params);
1997 	if (rc)
1998 		goto err;
1999 
2000 	memset(qp_attr, 0, sizeof(*qp_attr));
2001 	memset(qp_init_attr, 0, sizeof(*qp_init_attr));
2002 
2003 	qp_attr->qp_state = qedr_get_ibqp_state(params.state);
2004 	qp_attr->cur_qp_state = qedr_get_ibqp_state(params.state);
2005 	qp_attr->path_mtu = iboe_get_mtu(params.mtu);
2006 	qp_attr->path_mig_state = IB_MIG_MIGRATED;
2007 	qp_attr->rq_psn = params.rq_psn;
2008 	qp_attr->sq_psn = params.sq_psn;
2009 	qp_attr->dest_qp_num = params.dest_qp;
2010 
2011 	qp_attr->qp_access_flags = qedr_to_ib_qp_acc_flags(&params);
2012 
2013 	qp_attr->cap.max_send_wr = qp->sq.max_wr;
2014 	qp_attr->cap.max_recv_wr = qp->rq.max_wr;
2015 	qp_attr->cap.max_send_sge = qp->sq.max_sges;
2016 	qp_attr->cap.max_recv_sge = qp->rq.max_sges;
2017 	qp_attr->cap.max_inline_data = qp->max_inline_data;
2018 	qp_init_attr->cap = qp_attr->cap;
2019 
2020 	memcpy(&qp_attr->ah_attr.grh.dgid.raw[0], &params.dgid.bytes[0],
2021 	       sizeof(qp_attr->ah_attr.grh.dgid.raw));
2022 
2023 	qp_attr->ah_attr.grh.flow_label = params.flow_label;
2024 	qp_attr->ah_attr.grh.sgid_index = qp->sgid_idx;
2025 	qp_attr->ah_attr.grh.hop_limit = params.hop_limit_ttl;
2026 	qp_attr->ah_attr.grh.traffic_class = params.traffic_class_tos;
2027 
2028 	qp_attr->ah_attr.ah_flags = IB_AH_GRH;
2029 	qp_attr->ah_attr.port_num = 1;
2030 	qp_attr->ah_attr.sl = 0;
2031 	qp_attr->timeout = params.timeout;
2032 	qp_attr->rnr_retry = params.rnr_retry;
2033 	qp_attr->retry_cnt = params.retry_cnt;
2034 	qp_attr->min_rnr_timer = params.min_rnr_nak_timer;
2035 	qp_attr->pkey_index = params.pkey_index;
2036 	qp_attr->port_num = 1;
2037 	qp_attr->ah_attr.src_path_bits = 0;
2038 	qp_attr->ah_attr.static_rate = 0;
2039 	qp_attr->alt_pkey_index = 0;
2040 	qp_attr->alt_port_num = 0;
2041 	qp_attr->alt_timeout = 0;
2042 	memset(&qp_attr->alt_ah_attr, 0, sizeof(qp_attr->alt_ah_attr));
2043 
2044 	qp_attr->sq_draining = (params.state == QED_ROCE_QP_STATE_SQD) ? 1 : 0;
2045 	qp_attr->max_dest_rd_atomic = params.max_dest_rd_atomic;
2046 	qp_attr->max_rd_atomic = params.max_rd_atomic;
2047 	qp_attr->en_sqd_async_notify = (params.sqd_async) ? 1 : 0;
2048 
2049 	DP_DEBUG(dev, QEDR_MSG_QP, "QEDR_QUERY_QP: max_inline_data=%d\n",
2050 		 qp_attr->cap.max_inline_data);
2051 
2052 err:
2053 	return rc;
2054 }
2055 
2056 int qedr_destroy_qp(struct ib_qp *ibqp)
2057 {
2058 	struct qedr_qp *qp = get_qedr_qp(ibqp);
2059 	struct qedr_dev *dev = qp->dev;
2060 	struct ib_qp_attr attr;
2061 	int attr_mask = 0;
2062 	int rc = 0;
2063 
2064 	DP_DEBUG(dev, QEDR_MSG_QP, "destroy qp: destroying %p, qp type=%d\n",
2065 		 qp, qp->qp_type);
2066 
2067 	if (qp->state != QED_ROCE_QP_STATE_RESET &&
2068 	    qp->state != QED_ROCE_QP_STATE_ERR &&
	    qp->state != QED_ROCE_QP_STATE_INIT) {
2069 		attr.qp_state = IB_QPS_ERR;
2070 		attr_mask |= IB_QP_STATE;
2071 
2072 		/* Change the QP state to ERROR */
2073 		qedr_modify_qp(ibqp, &attr, attr_mask, NULL);
2074 	}
2075 
2076 	if (qp->qp_type != IB_QPT_GSI) {
2077 		rc = dev->ops->rdma_destroy_qp(dev->rdma_ctx, qp->qed_qp);
2078 		if (rc)
2079 			return rc;
2080 	} else {
2081 		qedr_destroy_gsi_qp(dev);
2082 	}
2083 
2084 	if (ibqp->uobject && ibqp->uobject->context) {
2085 		qedr_cleanup_user_sq(dev, qp);
2086 		qedr_cleanup_user_rq(dev, qp);
2087 	} else {
2088 		qedr_cleanup_kernel_sq(dev, qp);
2089 		qedr_cleanup_kernel_rq(dev, qp);
2090 	}
2091 
2092 	kfree(qp);
2093 
2094 	return rc;
2095 }
2096 
2097 struct ib_ah *qedr_create_ah(struct ib_pd *ibpd, struct ib_ah_attr *attr)
2098 {
2099 	struct qedr_ah *ah;
2100 
2101 	ah = kzalloc(sizeof(*ah), GFP_ATOMIC);
2102 	if (!ah)
2103 		return ERR_PTR(-ENOMEM);
2104 
2105 	ah->attr = *attr;
2106 
2107 	return &ah->ibah;
2108 }
2109 
2110 int qedr_destroy_ah(struct ib_ah *ibah)
2111 {
2112 	struct qedr_ah *ah = get_qedr_ah(ibah);
2113 
2114 	kfree(ah);
2115 	return 0;
2116 }
2117 
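/* Return every PBL owned by this MR to the free list (the table currently
 * in use plus anything still on the in-use list) and release them all.
 */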
2118 static void free_mr_info(struct qedr_dev *dev, struct mr_info *info)
2119 {
2120 	struct qedr_pbl *pbl, *tmp;
2121 
2122 	if (info->pbl_table)
2123 		list_add_tail(&info->pbl_table->list_entry,
2124 			      &info->free_pbl_list);
2125 
2126 	if (!list_empty(&info->inuse_pbl_list))
2127 		list_splice(&info->inuse_pbl_list, &info->free_pbl_list);
2128 
2129 	list_for_each_entry_safe(pbl, tmp, &info->free_pbl_list, list_entry) {
2130 		list_del(&pbl->list_entry);
2131 		qedr_free_pbl(dev, &info->pbl_info, pbl);
2132 	}
2133 }
2134 
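/* Set up the PBL bookkeeping for an MR: compute the table geometry for
 * page_list_len pages, allocate the first table and pre-allocate a spare
 * one on the free list, since two PBLs are the common case.
 */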
2135 static int init_mr_info(struct qedr_dev *dev, struct mr_info *info,
2136 			size_t page_list_len, bool two_layered)
2137 {
2138 	struct qedr_pbl *tmp;
2139 	int rc;
2140 
2141 	INIT_LIST_HEAD(&info->free_pbl_list);
2142 	INIT_LIST_HEAD(&info->inuse_pbl_list);
2143 
2144 	rc = qedr_prepare_pbl_tbl(dev, &info->pbl_info,
2145 				  page_list_len, two_layered);
2146 	if (rc)
2147 		goto done;
2148 
2149 	info->pbl_table = qedr_alloc_pbl_tbl(dev, &info->pbl_info, GFP_KERNEL);
2150 	if (!info->pbl_table) {
2151 		rc = -ENOMEM;
2152 		goto done;
2153 	}
2154 
2155 	DP_DEBUG(dev, QEDR_MSG_MR, "pbl_table_pa = %pa\n",
2156 		 &info->pbl_table->pa);
2157 
2158 	/* In the usual case we use 2 PBLs, so we add one to the free
2159 	 * list and allocate another one.
2160 	 */
2161 	tmp = qedr_alloc_pbl_tbl(dev, &info->pbl_info, GFP_KERNEL);
2162 	if (!tmp) {
2163 		DP_DEBUG(dev, QEDR_MSG_MR, "Extra PBL is not allocated\n");
2164 		goto done;
2165 	}
2166 
2167 	list_add_tail(&tmp->list_entry, &info->free_pbl_list);
2168 
2169 	DP_DEBUG(dev, QEDR_MSG_MR, "extra pbl_table_pa = %pa\n", &tmp->pa);
2170 
2171 done:
2172 	if (rc)
2173 		free_mr_info(dev, info);
2174 
2175 	return rc;
2176 }
2177 
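/* Register a user MR: pin the user pages with ib_umem_get(), build the
 * physical buffer lists (PBLs) the HW walks, then allocate a TID and
 * register it with the FW; lkey/rkey are derived from that TID.
 */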
2178 struct ib_mr *qedr_reg_user_mr(struct ib_pd *ibpd, u64 start, u64 len,
2179 			       u64 usr_addr, int acc, struct ib_udata *udata)
2180 {
2181 	struct qedr_dev *dev = get_qedr_dev(ibpd->device);
2182 	struct qedr_mr *mr;
2183 	struct qedr_pd *pd;
2184 	int rc = -ENOMEM;
2185 
2186 	pd = get_qedr_pd(ibpd);
2187 	DP_DEBUG(dev, QEDR_MSG_MR,
2188 		 "qedr_register user mr pd = %d start = %lld, len = %lld, usr_addr = %lld, acc = %d\n",
2189 		 pd->pd_id, start, len, usr_addr, acc);
2190 
2191 	if (acc & IB_ACCESS_REMOTE_WRITE && !(acc & IB_ACCESS_LOCAL_WRITE))
2192 		return ERR_PTR(-EINVAL);
2193 
2194 	mr = kzalloc(sizeof(*mr), GFP_KERNEL);
2195 	if (!mr)
2196 		return ERR_PTR(rc);
2197 
2198 	mr->type = QEDR_MR_USER;
2199 
2200 	mr->umem = ib_umem_get(ibpd->uobject->context, start, len, acc, 0);
2201 	if (IS_ERR(mr->umem)) {
2202 		rc = -EFAULT;
2203 		goto err0;
2204 	}
2205 
2206 	rc = init_mr_info(dev, &mr->info, ib_umem_page_count(mr->umem), 1);
2207 	if (rc)
2208 		goto err1;
2209 
2210 	qedr_populate_pbls(dev, mr->umem, mr->info.pbl_table,
2211 			   &mr->info.pbl_info);
2212 
2213 	rc = dev->ops->rdma_alloc_tid(dev->rdma_ctx, &mr->hw_mr.itid);
2214 	if (rc) {
2215 		DP_ERR(dev, "roce alloc tid returned an error %d\n", rc);
2216 		goto err1;
2217 	}
2218 
2219 	/* Index only, 18 bit long, lkey = itid << 8 | key */
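	/* e.g. an itid of 0x3 with key 0 yields lkey 0x300 */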
2220 	mr->hw_mr.tid_type = QED_RDMA_TID_REGISTERED_MR;
2221 	mr->hw_mr.key = 0;
2222 	mr->hw_mr.pd = pd->pd_id;
2223 	mr->hw_mr.local_read = 1;
2224 	mr->hw_mr.local_write = (acc & IB_ACCESS_LOCAL_WRITE) ? 1 : 0;
2225 	mr->hw_mr.remote_read = (acc & IB_ACCESS_REMOTE_READ) ? 1 : 0;
2226 	mr->hw_mr.remote_write = (acc & IB_ACCESS_REMOTE_WRITE) ? 1 : 0;
2227 	mr->hw_mr.remote_atomic = (acc & IB_ACCESS_REMOTE_ATOMIC) ? 1 : 0;
2228 	mr->hw_mr.mw_bind = false;
2229 	mr->hw_mr.pbl_ptr = mr->info.pbl_table[0].pa;
2230 	mr->hw_mr.pbl_two_level = mr->info.pbl_info.two_layered;
2231 	mr->hw_mr.pbl_page_size_log = ilog2(mr->info.pbl_info.pbl_size);
2232 	mr->hw_mr.page_size_log = ilog2(mr->umem->page_size);
2233 	mr->hw_mr.fbo = ib_umem_offset(mr->umem);
2234 	mr->hw_mr.length = len;
2235 	mr->hw_mr.vaddr = usr_addr;
2236 	mr->hw_mr.zbva = false;
2237 	mr->hw_mr.phy_mr = false;
2238 	mr->hw_mr.dma_mr = false;
2239 
2240 	rc = dev->ops->rdma_register_tid(dev->rdma_ctx, &mr->hw_mr);
2241 	if (rc) {
2242 		DP_ERR(dev, "roce register tid returned an error %d\n", rc);
2243 		goto err2;
2244 	}
2245 
2246 	mr->ibmr.lkey = mr->hw_mr.itid << 8 | mr->hw_mr.key;
2247 	if (mr->hw_mr.remote_write || mr->hw_mr.remote_read ||
2248 	    mr->hw_mr.remote_atomic)
2249 		mr->ibmr.rkey = mr->hw_mr.itid << 8 | mr->hw_mr.key;
2250 
2251 	DP_DEBUG(dev, QEDR_MSG_MR, "register user mr lkey: %x\n",
2252 		 mr->ibmr.lkey);
2253 	return &mr->ibmr;
2254 
2255 err2:
2256 	dev->ops->rdma_free_tid(dev->rdma_ctx, mr->hw_mr.itid);
2257 err1:
2258 	qedr_free_pbl(dev, &mr->info.pbl_info, mr->info.pbl_table);
2259 err0:
2260 	kfree(mr);
2261 	return ERR_PTR(rc);
2262 }
2263 
2264 int qedr_dereg_mr(struct ib_mr *ib_mr)
2265 {
2266 	struct qedr_mr *mr = get_qedr_mr(ib_mr);
2267 	struct qedr_dev *dev = get_qedr_dev(ib_mr->device);
2268 	int rc = 0;
2269 
2270 	rc = dev->ops->rdma_deregister_tid(dev->rdma_ctx, mr->hw_mr.itid);
2271 	if (rc)
2272 		return rc;
2273 
2274 	dev->ops->rdma_free_tid(dev->rdma_ctx, mr->hw_mr.itid);
2275 
2276 	if ((mr->type != QEDR_MR_DMA) && (mr->type != QEDR_MR_FRMR))
2277 		qedr_free_pbl(dev, &mr->info.pbl_info, mr->info.pbl_table);
2278 
2279 	/* It could be user-registered memory. */
2280 	if (mr->umem)
2281 		ib_umem_release(mr->umem);
2282 
2283 	kfree(mr);
2284 
2285 	return rc;
2286 }
2287 
2288 struct qedr_mr *__qedr_alloc_mr(struct ib_pd *ibpd, int max_page_list_len)
2289 {
2290 	struct qedr_pd *pd = get_qedr_pd(ibpd);
2291 	struct qedr_dev *dev = get_qedr_dev(ibpd->device);
2292 	struct qedr_mr *mr;
2293 	int rc = -ENOMEM;
2294 
2295 	DP_DEBUG(dev, QEDR_MSG_MR,
2296 		 "qedr_alloc_frmr pd = %d max_page_list_len = %d\n", pd->pd_id,
2297 		 max_page_list_len);
2298 
2299 	mr = kzalloc(sizeof(*mr), GFP_KERNEL);
2300 	if (!mr)
2301 		return ERR_PTR(rc);
2302 
2303 	mr->dev = dev;
2304 	mr->type = QEDR_MR_FRMR;
2305 
2306 	rc = init_mr_info(dev, &mr->info, max_page_list_len, 1);
2307 	if (rc)
2308 		goto err0;
2309 
2310 	rc = dev->ops->rdma_alloc_tid(dev->rdma_ctx, &mr->hw_mr.itid);
2311 	if (rc) {
2312 		DP_ERR(dev, "roce alloc tid returned an error %d\n", rc);
2313 		goto err0;
2314 	}
2315 
2316 	/* Index only, 18 bit long, lkey = itid << 8 | key */
2317 	mr->hw_mr.tid_type = QED_RDMA_TID_FMR;
2318 	mr->hw_mr.key = 0;
2319 	mr->hw_mr.pd = pd->pd_id;
2320 	mr->hw_mr.local_read = 1;
2321 	mr->hw_mr.local_write = 0;
2322 	mr->hw_mr.remote_read = 0;
2323 	mr->hw_mr.remote_write = 0;
2324 	mr->hw_mr.remote_atomic = 0;
2325 	mr->hw_mr.mw_bind = false;
2326 	mr->hw_mr.pbl_ptr = 0;
2327 	mr->hw_mr.pbl_two_level = mr->info.pbl_info.two_layered;
2328 	mr->hw_mr.pbl_page_size_log = ilog2(mr->info.pbl_info.pbl_size);
2329 	mr->hw_mr.fbo = 0;
2330 	mr->hw_mr.length = 0;
2331 	mr->hw_mr.vaddr = 0;
2332 	mr->hw_mr.zbva = false;
2333 	mr->hw_mr.phy_mr = true;
2334 	mr->hw_mr.dma_mr = false;
2335 
2336 	rc = dev->ops->rdma_register_tid(dev->rdma_ctx, &mr->hw_mr);
2337 	if (rc) {
2338 		DP_ERR(dev, "roce register tid returned an error %d\n", rc);
2339 		goto err1;
2340 	}
2341 
2342 	mr->ibmr.lkey = mr->hw_mr.itid << 8 | mr->hw_mr.key;
2343 	mr->ibmr.rkey = mr->ibmr.lkey;
2344 
2345 	DP_DEBUG(dev, QEDR_MSG_MR, "alloc frmr: %x\n", mr->ibmr.lkey);
2346 	return mr;
2347 
2348 err1:
2349 	dev->ops->rdma_free_tid(dev->rdma_ctx, mr->hw_mr.itid);
2350 err0:
2351 	kfree(mr);
2352 	return ERR_PTR(rc);
2353 }
2354 
2355 struct ib_mr *qedr_alloc_mr(struct ib_pd *ibpd,
2356 			    enum ib_mr_type mr_type, u32 max_num_sg)
2357 {
2359 	struct qedr_mr *mr;
2360 
2361 	if (mr_type != IB_MR_TYPE_MEM_REG)
2362 		return ERR_PTR(-EINVAL);
2363 
2364 	mr = __qedr_alloc_mr(ibpd, max_num_sg);
2365 
2366 	if (IS_ERR(mr))
2367 		return ERR_CAST(mr);
2368 
2371 	return &mr->ibmr;
2372 }
2373 
2374 static int qedr_set_page(struct ib_mr *ibmr, u64 addr)
2375 {
2376 	struct qedr_mr *mr = get_qedr_mr(ibmr);
2377 	struct qedr_pbl *pbl_table;
2378 	struct regpair *pbe;
2379 	u32 pbes_in_page;
2380 
2381 	if (unlikely(mr->npages == mr->info.pbl_info.num_pbes)) {
2382 		DP_ERR(mr->dev, "qedr_set_page fails, PBL is full (npages=%d)\n", mr->npages);
2383 		return -ENOMEM;
2384 	}
2385 
2386 	DP_DEBUG(mr->dev, QEDR_MSG_MR, "qedr_set_page pages[%d] = 0x%llx\n",
2387 		 mr->npages, addr);
2388 
2389 	pbes_in_page = mr->info.pbl_info.pbl_size / sizeof(u64);
2390 	pbl_table = mr->info.pbl_table + (mr->npages / pbes_in_page);
2391 	pbe = (struct regpair *)pbl_table->va;
2392 	pbe += mr->npages % pbes_in_page;
2393 	pbe->lo = cpu_to_le32((u32)addr);
2394 	pbe->hi = cpu_to_le32((u32)upper_32_bits(addr));
2395 
2396 	mr->npages++;
2397 
2398 	return 0;
2399 }
2400 
2401 static void handle_completed_mrs(struct qedr_dev *dev, struct mr_info *info)
2402 {
2403 	int work = info->completed - info->completed_handled - 1;
2404 
2405 	DP_DEBUG(dev, QEDR_MSG_MR, "Special FMR work = %d\n", work);
2406 	while (work-- > 0 && !list_empty(&info->inuse_pbl_list)) {
2407 		struct qedr_pbl *pbl;
2408 
2409 		/* Free all the page lists that can be freed (all the ones
2410 		 * that were invalidated), on the assumption that if an FMR
2411 		 * completed successfully, any invalidate operation posted
2412 		 * before it has completed as well.
2413 		 */
2414 		pbl = list_first_entry(&info->inuse_pbl_list,
2415 				       struct qedr_pbl, list_entry);
2416 		list_del(&pbl->list_entry);
2417 		list_add_tail(&pbl->list_entry, &info->free_pbl_list);
2418 		info->completed_handled++;
2419 	}
2420 }
2421 
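/* Map an SG list onto the MR's PBL: first recycle page lists whose FMR
 * work has completed, then let ib_sg_to_pages() feed each page address
 * to qedr_set_page().
 */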
2422 int qedr_map_mr_sg(struct ib_mr *ibmr, struct scatterlist *sg,
2423 		   int sg_nents, unsigned int *sg_offset)
2424 {
2425 	struct qedr_mr *mr = get_qedr_mr(ibmr);
2426 
2427 	mr->npages = 0;
2428 
2429 	handle_completed_mrs(mr->dev, &mr->info);
2430 	return ib_sg_to_pages(ibmr, sg, sg_nents, NULL, qedr_set_page);
2431 }
2432 
2433 struct ib_mr *qedr_get_dma_mr(struct ib_pd *ibpd, int acc)
2434 {
2435 	struct qedr_dev *dev = get_qedr_dev(ibpd->device);
2436 	struct qedr_pd *pd = get_qedr_pd(ibpd);
2437 	struct qedr_mr *mr;
2438 	int rc;
2439 
2440 	mr = kzalloc(sizeof(*mr), GFP_KERNEL);
2441 	if (!mr)
2442 		return ERR_PTR(-ENOMEM);
2443 
2444 	mr->type = QEDR_MR_DMA;
2445 
2446 	rc = dev->ops->rdma_alloc_tid(dev->rdma_ctx, &mr->hw_mr.itid);
2447 	if (rc) {
2448 		DP_ERR(dev, "roce alloc tid returned an error %d\n", rc);
2449 		goto err1;
2450 	}
2451 
2452 	/* index only, 18 bit long, lkey = itid << 8 | key */
2453 	mr->hw_mr.tid_type = QED_RDMA_TID_REGISTERED_MR;
2454 	mr->hw_mr.pd = pd->pd_id;
2455 	mr->hw_mr.local_read = 1;
2456 	mr->hw_mr.local_write = (acc & IB_ACCESS_LOCAL_WRITE) ? 1 : 0;
2457 	mr->hw_mr.remote_read = (acc & IB_ACCESS_REMOTE_READ) ? 1 : 0;
2458 	mr->hw_mr.remote_write = (acc & IB_ACCESS_REMOTE_WRITE) ? 1 : 0;
2459 	mr->hw_mr.remote_atomic = (acc & IB_ACCESS_REMOTE_ATOMIC) ? 1 : 0;
2460 	mr->hw_mr.dma_mr = true;
2461 
2462 	rc = dev->ops->rdma_register_tid(dev->rdma_ctx, &mr->hw_mr);
2463 	if (rc) {
2464 		DP_ERR(dev, "roce register tid returned an error %d\n", rc);
2465 		goto err2;
2466 	}
2467 
2468 	mr->ibmr.lkey = mr->hw_mr.itid << 8 | mr->hw_mr.key;
2469 	if (mr->hw_mr.remote_write || mr->hw_mr.remote_read ||
2470 	    mr->hw_mr.remote_atomic)
2471 		mr->ibmr.rkey = mr->hw_mr.itid << 8 | mr->hw_mr.key;
2472 
2473 	DP_DEBUG(dev, QEDR_MSG_MR, "get dma mr: lkey = %x\n", mr->ibmr.lkey);
2474 	return &mr->ibmr;
2475 
2476 err2:
2477 	dev->ops->rdma_free_tid(dev->rdma_ctx, mr->hw_mr.itid);
2478 err1:
2479 	kfree(mr);
2480 	return ERR_PTR(rc);
2481 }
2482 
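/* Classic ring-buffer full test: one slot is always left unused so that
 * a full queue can be distinguished from an empty one.
 */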
2483 static inline int qedr_wq_is_full(struct qedr_qp_hwq_info *wq)
2484 {
2485 	return (((wq->prod + 1) % wq->max_wr) == wq->cons);
2486 }
2487 
2488 static int sge_data_len(struct ib_sge *sg_list, int num_sge)
2489 {
2490 	int i, len = 0;
2491 
2492 	for (i = 0; i < num_sge; i++)
2493 		len += sg_list[i].length;
2494 
2495 	return len;
2496 }
2497 
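/* Normalize the byte order of inline WQE payload for the FW; the double
 * conversion below amounts to an unconditional byte swap of each 64-bit
 * word on either host endianness.
 */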
2498 static void swap_wqe_data64(u64 *p)
2499 {
2500 	int i;
2501 
2502 	for (i = 0; i < QEDR_SQE_ELEMENT_SIZE / sizeof(u64); i++, p++)
2503 		*p = cpu_to_be64(cpu_to_le64(*p));
2504 }
2505 
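/* Copy a WR's SG list directly into SQ WQE segments, producing a new
 * chain element whenever the current segment fills up; returns the number
 * of inline bytes copied and bumps *wqe_size per element consumed.
 */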
2506 static u32 qedr_prepare_sq_inline_data(struct qedr_dev *dev,
2507 				       struct qedr_qp *qp, u8 *wqe_size,
2508 				       struct ib_send_wr *wr,
2509 				       struct ib_send_wr **bad_wr, u8 *bits,
2510 				       u8 bit)
2511 {
2512 	u32 data_size = sge_data_len(wr->sg_list, wr->num_sge);
2513 	char *seg_prt, *wqe;
2514 	int i, seg_siz;
2515 
2516 	if (data_size > ROCE_REQ_MAX_INLINE_DATA_SIZE) {
2517 		DP_ERR(dev, "Too much inline data in WR: %d\n", data_size);
2518 		*bad_wr = wr;
2519 		return 0;
2520 	}
2521 
2522 	if (!data_size)
2523 		return data_size;
2524 
2525 	*bits |= bit;
2526 
2527 	seg_prt = NULL;
2528 	wqe = NULL;
2529 	seg_siz = 0;
2530 
2531 	/* Copy data inline */
2532 	for (i = 0; i < wr->num_sge; i++) {
2533 		u32 len = wr->sg_list[i].length;
2534 		void *src = (void *)(uintptr_t)wr->sg_list[i].addr;
2535 
2536 		while (len > 0) {
2537 			u32 cur;
2538 
2539 			/* New segment required */
2540 			if (!seg_siz) {
2541 				wqe = (char *)qed_chain_produce(&qp->sq.pbl);
2542 				seg_prt = wqe;
2543 				seg_siz = sizeof(struct rdma_sq_common_wqe);
2544 				(*wqe_size)++;
2545 			}
2546 
2547 			/* Calculate currently allowed length */
2548 			cur = min_t(u32, len, seg_siz);
2549 			memcpy(seg_prt, src, cur);
2550 
2551 			/* Update segment variables */
2552 			seg_prt += cur;
2553 			seg_siz -= cur;
2554 
2555 			/* Update sge variables */
2556 			src += cur;
2557 			len -= cur;
2558 
2559 			/* Swap fully-completed segments */
2560 			if (!seg_siz)
2561 				swap_wqe_data64((u64 *)wqe);
2562 		}
2563 	}
2564 
2565 	/* swap the last, possibly incomplete, segment */
2566 	if (seg_siz)
2567 		swap_wqe_data64((u64 *)wqe);
2568 
2569 	return data_size;
2570 }
2571 
2572 #define RQ_SGE_SET(sge, vaddr, vlength, vflags)			\
2573 	do {							\
2574 		DMA_REGPAIR_LE(sge->addr, vaddr);		\
2575 		(sge)->length = cpu_to_le32(vlength);		\
2576 		(sge)->flags = cpu_to_le32(vflags);		\
2577 	} while (0)
2578 
2579 #define SRQ_HDR_SET(hdr, vwr_id, num_sge)			\
2580 	do {							\
2581 		DMA_REGPAIR_LE(hdr->wr_id, vwr_id);		\
2582 		(hdr)->num_sges = num_sge;			\
2583 	} while (0)
2584 
2585 #define SRQ_SGE_SET(sge, vaddr, vlength, vlkey)			\
2586 	do {							\
2587 		DMA_REGPAIR_LE(sge->addr, vaddr);		\
2588 		(sge)->length = cpu_to_le32(vlength);		\
2589 		(sge)->l_key = cpu_to_le32(vlkey);		\
2590 	} while (0)
2591 
2592 static u32 qedr_prepare_sq_sges(struct qedr_qp *qp, u8 *wqe_size,
2593 				struct ib_send_wr *wr)
2594 {
2595 	u32 data_size = 0;
2596 	int i;
2597 
2598 	for (i = 0; i < wr->num_sge; i++) {
2599 		struct rdma_sq_sge *sge = qed_chain_produce(&qp->sq.pbl);
2600 
2601 		DMA_REGPAIR_LE(sge->addr, wr->sg_list[i].addr);
2602 		sge->l_key = cpu_to_le32(wr->sg_list[i].lkey);
2603 		sge->length = cpu_to_le32(wr->sg_list[i].length);
2604 		data_size += wr->sg_list[i].length;
2605 	}
2606 
2607 	if (wqe_size)
2608 		*wqe_size += wr->num_sge;
2609 
2610 	return data_size;
2611 }
2612 
2613 static u32 qedr_prepare_sq_rdma_data(struct qedr_dev *dev,
2614 				     struct qedr_qp *qp,
2615 				     struct rdma_sq_rdma_wqe_1st *rwqe,
2616 				     struct rdma_sq_rdma_wqe_2nd *rwqe2,
2617 				     struct ib_send_wr *wr,
2618 				     struct ib_send_wr **bad_wr)
2619 {
2620 	rwqe2->r_key = cpu_to_le32(rdma_wr(wr)->rkey);
2621 	DMA_REGPAIR_LE(rwqe2->remote_va, rdma_wr(wr)->remote_addr);
2622 
2623 	if (wr->send_flags & IB_SEND_INLINE) {
2624 		u8 flags = 0;
2625 
2626 		SET_FIELD2(flags, RDMA_SQ_RDMA_WQE_1ST_INLINE_FLG, 1);
2627 		return qedr_prepare_sq_inline_data(dev, qp, &rwqe->wqe_size, wr,
2628 						   bad_wr, &rwqe->flags, flags);
2629 	}
2630 
2631 	return qedr_prepare_sq_sges(qp, &rwqe->wqe_size, wr);
2632 }
2633 
2634 static u32 qedr_prepare_sq_send_data(struct qedr_dev *dev,
2635 				     struct qedr_qp *qp,
2636 				     struct rdma_sq_send_wqe_1st *swqe,
2637 				     struct rdma_sq_send_wqe_2st *swqe2,
2638 				     struct ib_send_wr *wr,
2639 				     struct ib_send_wr **bad_wr)
2640 {
2641 	memset(swqe2, 0, sizeof(*swqe2));
2642 	if (wr->send_flags & IB_SEND_INLINE) {
2643 		u8 flags = 0;
2644 
2645 		SET_FIELD2(flags, RDMA_SQ_SEND_WQE_INLINE_FLG, 1);
2646 		return qedr_prepare_sq_inline_data(dev, qp, &swqe->wqe_size, wr,
2647 						   bad_wr, &swqe->flags, flags);
2648 	}
2649 
2650 	return qedr_prepare_sq_sges(qp, &swqe->wqe_size, wr);
2651 }
2652 
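/* Build the two-part fast-MR WQE for IB_WR_REG_MR: the first part carries
 * the I/O virtual address and key, the second the access flags, the page
 * size and the address of the PBL the HW should walk.
 */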
2653 static int qedr_prepare_reg(struct qedr_qp *qp,
2654 			    struct rdma_sq_fmr_wqe_1st *fwqe1,
2655 			    struct ib_reg_wr *wr)
2656 {
2657 	struct qedr_mr *mr = get_qedr_mr(wr->mr);
2658 	struct rdma_sq_fmr_wqe_2nd *fwqe2;
2659 
2660 	fwqe2 = (struct rdma_sq_fmr_wqe_2nd *)qed_chain_produce(&qp->sq.pbl);
2661 	fwqe1->addr.hi = upper_32_bits(mr->ibmr.iova);
2662 	fwqe1->addr.lo = lower_32_bits(mr->ibmr.iova);
2663 	fwqe1->l_key = wr->key;
2664 
2665 	SET_FIELD2(fwqe2->access_ctrl, RDMA_SQ_FMR_WQE_2ND_REMOTE_READ,
2666 		   !!(wr->access & IB_ACCESS_REMOTE_READ));
2667 	SET_FIELD2(fwqe2->access_ctrl, RDMA_SQ_FMR_WQE_2ND_REMOTE_WRITE,
2668 		   !!(wr->access & IB_ACCESS_REMOTE_WRITE));
2669 	SET_FIELD2(fwqe2->access_ctrl, RDMA_SQ_FMR_WQE_2ND_ENABLE_ATOMIC,
2670 		   !!(wr->access & IB_ACCESS_REMOTE_ATOMIC));
2671 	SET_FIELD2(fwqe2->access_ctrl, RDMA_SQ_FMR_WQE_2ND_LOCAL_READ, 1);
2672 	SET_FIELD2(fwqe2->access_ctrl, RDMA_SQ_FMR_WQE_2ND_LOCAL_WRITE,
2673 		   !!(wr->access & IB_ACCESS_LOCAL_WRITE));
2674 	fwqe2->fmr_ctrl = 0;
2675 
2676 	SET_FIELD2(fwqe2->fmr_ctrl, RDMA_SQ_FMR_WQE_2ND_PAGE_SIZE_LOG,
2677 		   ilog2(mr->ibmr.page_size) - 12);
2678 
2679 	fwqe2->length_hi = 0;
2680 	fwqe2->length_lo = mr->ibmr.length;
2681 	fwqe2->pbl_addr.hi = upper_32_bits(mr->info.pbl_table->pa);
2682 	fwqe2->pbl_addr.lo = lower_32_bits(mr->info.pbl_table->pa);
2683 
2684 	qp->wqe_wr_id[qp->sq.prod].mr = mr;
2685 
2686 	return 0;
2687 }
2688 
2689 enum ib_wc_opcode qedr_ib_to_wc_opcode(enum ib_wr_opcode opcode)
2690 {
2691 	switch (opcode) {
2692 	case IB_WR_RDMA_WRITE:
2693 	case IB_WR_RDMA_WRITE_WITH_IMM:
2694 		return IB_WC_RDMA_WRITE;
2695 	case IB_WR_SEND_WITH_IMM:
2696 	case IB_WR_SEND:
2697 	case IB_WR_SEND_WITH_INV:
2698 		return IB_WC_SEND;
2699 	case IB_WR_RDMA_READ:
2700 		return IB_WC_RDMA_READ;
2701 	case IB_WR_ATOMIC_CMP_AND_SWP:
2702 		return IB_WC_COMP_SWAP;
2703 	case IB_WR_ATOMIC_FETCH_AND_ADD:
2704 		return IB_WC_FETCH_ADD;
2705 	case IB_WR_REG_MR:
2706 		return IB_WC_REG_MR;
2707 	case IB_WR_LOCAL_INV:
2708 		return IB_WC_LOCAL_INV;
2709 	default:
2710 		return IB_WC_SEND;
2711 	}
2712 }
2713 
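/* Validate a send WR before posting: reject it if the SQ ring is full,
 * the WR carries more SGEs than the SQ supports, or the PBL lacks room
 * for a maximal WQE. Each condition is logged only once per QP, tracked
 * via err_bitmap.
 */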
2714 inline bool qedr_can_post_send(struct qedr_qp *qp, struct ib_send_wr *wr)
2715 {
2716 	int wq_is_full, err_wr, pbl_is_full;
2717 	struct qedr_dev *dev = qp->dev;
2718 
2719 	/* prevent SQ overflow and/or processing of a bad WR */
2720 	err_wr = wr->num_sge > qp->sq.max_sges;
2721 	wq_is_full = qedr_wq_is_full(&qp->sq);
2722 	pbl_is_full = qed_chain_get_elem_left_u32(&qp->sq.pbl) <
2723 		      QEDR_MAX_SQE_ELEMENTS_PER_SQE;
2724 	if (wq_is_full || err_wr || pbl_is_full) {
2725 		if (wq_is_full && !(qp->err_bitmap & QEDR_QP_ERR_SQ_FULL)) {
2726 			DP_ERR(dev,
2727 			       "error: WQ is full. Post send on QP %p failed (this error appears only once)\n",
2728 			       qp);
2729 			qp->err_bitmap |= QEDR_QP_ERR_SQ_FULL;
2730 		}
2731 
2732 		if (err_wr && !(qp->err_bitmap & QEDR_QP_ERR_BAD_SR)) {
2733 			DP_ERR(dev,
2734 			       "error: WR is bad. Post send on QP %p failed (this error appears only once)\n",
2735 			       qp);
2736 			qp->err_bitmap |= QEDR_QP_ERR_BAD_SR;
2737 		}
2738 
2739 		if (pbl_is_full &&
2740 		    !(qp->err_bitmap & QEDR_QP_ERR_SQ_PBL_FULL)) {
2741 			DP_ERR(dev,
2742 			       "error: WQ PBL is full. Post send on QP %p failed (this error appears only once)\n",
2743 			       qp);
2744 			qp->err_bitmap |= QEDR_QP_ERR_SQ_PBL_FULL;
2745 		}
2746 		return false;
2747 	}
2748 	return true;
2749 }
2750 
2751 int __qedr_post_send(struct ib_qp *ibqp, struct ib_send_wr *wr,
2752 		     struct ib_send_wr **bad_wr)
2753 {
2754 	struct qedr_dev *dev = get_qedr_dev(ibqp->device);
2755 	struct qedr_qp *qp = get_qedr_qp(ibqp);
2756 	struct rdma_sq_atomic_wqe_1st *awqe1;
2757 	struct rdma_sq_atomic_wqe_2nd *awqe2;
2758 	struct rdma_sq_atomic_wqe_3rd *awqe3;
2759 	struct rdma_sq_send_wqe_2st *swqe2;
2760 	struct rdma_sq_local_inv_wqe *iwqe;
2761 	struct rdma_sq_rdma_wqe_2nd *rwqe2;
2762 	struct rdma_sq_send_wqe_1st *swqe;
2763 	struct rdma_sq_rdma_wqe_1st *rwqe;
2764 	struct rdma_sq_fmr_wqe_1st *fwqe1;
2765 	struct rdma_sq_common_wqe *wqe;
2766 	u32 length;
2767 	int rc = 0;
2768 	bool comp;
2769 
2770 	if (!qedr_can_post_send(qp, wr)) {
2771 		*bad_wr = wr;
2772 		return -ENOMEM;
2773 	}
2774 
2775 	wqe = qed_chain_produce(&qp->sq.pbl);
2776 	qp->wqe_wr_id[qp->sq.prod].signaled =
2777 		!!(wr->send_flags & IB_SEND_SIGNALED) || qp->signaled;
2778 
2779 	wqe->flags = 0;
2780 	SET_FIELD2(wqe->flags, RDMA_SQ_SEND_WQE_SE_FLG,
2781 		   !!(wr->send_flags & IB_SEND_SOLICITED));
2782 	comp = (!!(wr->send_flags & IB_SEND_SIGNALED)) || qp->signaled;
2783 	SET_FIELD2(wqe->flags, RDMA_SQ_SEND_WQE_COMP_FLG, comp);
2784 	SET_FIELD2(wqe->flags, RDMA_SQ_SEND_WQE_RD_FENCE_FLG,
2785 		   !!(wr->send_flags & IB_SEND_FENCE));
2786 	wqe->prev_wqe_size = qp->prev_wqe_size;
2787 
2788 	qp->wqe_wr_id[qp->sq.prod].opcode = qedr_ib_to_wc_opcode(wr->opcode);
2789 
2790 	switch (wr->opcode) {
2791 	case IB_WR_SEND_WITH_IMM:
2792 		wqe->req_type = RDMA_SQ_REQ_TYPE_SEND_WITH_IMM;
2793 		swqe = (struct rdma_sq_send_wqe_1st *)wqe;
2794 		swqe->wqe_size = 2;
2795 		swqe2 = qed_chain_produce(&qp->sq.pbl);
2796 
2797 		swqe->inv_key_or_imm_data = cpu_to_le32(wr->ex.imm_data);
2798 		length = qedr_prepare_sq_send_data(dev, qp, swqe, swqe2,
2799 						   wr, bad_wr);
2800 		swqe->length = cpu_to_le32(length);
2801 		qp->wqe_wr_id[qp->sq.prod].wqe_size = swqe->wqe_size;
2802 		qp->prev_wqe_size = swqe->wqe_size;
2803 		qp->wqe_wr_id[qp->sq.prod].bytes_len = swqe->length;
2804 		break;
2805 	case IB_WR_SEND:
2806 		wqe->req_type = RDMA_SQ_REQ_TYPE_SEND;
2807 		swqe = (struct rdma_sq_send_wqe_1st *)wqe;
2808 
2809 		swqe->wqe_size = 2;
2810 		swqe2 = qed_chain_produce(&qp->sq.pbl);
2811 		length = qedr_prepare_sq_send_data(dev, qp, swqe, swqe2,
2812 						   wr, bad_wr);
2813 		swqe->length = cpu_to_le32(length);
2814 		qp->wqe_wr_id[qp->sq.prod].wqe_size = swqe->wqe_size;
2815 		qp->prev_wqe_size = swqe->wqe_size;
2816 		qp->wqe_wr_id[qp->sq.prod].bytes_len = swqe->length;
2817 		break;
2818 	case IB_WR_SEND_WITH_INV:
2819 		wqe->req_type = RDMA_SQ_REQ_TYPE_SEND_WITH_INVALIDATE;
2820 		swqe = (struct rdma_sq_send_wqe_1st *)wqe;
2821 		swqe2 = qed_chain_produce(&qp->sq.pbl);
2822 		swqe->wqe_size = 2;
2823 		swqe->inv_key_or_imm_data = cpu_to_le32(wr->ex.invalidate_rkey);
2824 		length = qedr_prepare_sq_send_data(dev, qp, swqe, swqe2,
2825 						   wr, bad_wr);
2826 		swqe->length = cpu_to_le32(length);
2827 		qp->wqe_wr_id[qp->sq.prod].wqe_size = swqe->wqe_size;
2828 		qp->prev_wqe_size = swqe->wqe_size;
2829 		qp->wqe_wr_id[qp->sq.prod].bytes_len = swqe->length;
2830 		break;
2831 
2832 	case IB_WR_RDMA_WRITE_WITH_IMM:
2833 		wqe->req_type = RDMA_SQ_REQ_TYPE_RDMA_WR_WITH_IMM;
2834 		rwqe = (struct rdma_sq_rdma_wqe_1st *)wqe;
2835 
2836 		rwqe->wqe_size = 2;
2837 		rwqe->imm_data = htonl(cpu_to_le32(wr->ex.imm_data));
2838 		rwqe2 = qed_chain_produce(&qp->sq.pbl);
2839 		length = qedr_prepare_sq_rdma_data(dev, qp, rwqe, rwqe2,
2840 						   wr, bad_wr);
2841 		rwqe->length = cpu_to_le32(length);
2842 		qp->wqe_wr_id[qp->sq.prod].wqe_size = rwqe->wqe_size;
2843 		qp->prev_wqe_size = rwqe->wqe_size;
2844 		qp->wqe_wr_id[qp->sq.prod].bytes_len = rwqe->length;
2845 		break;
2846 	case IB_WR_RDMA_WRITE:
2847 		wqe->req_type = RDMA_SQ_REQ_TYPE_RDMA_WR;
2848 		rwqe = (struct rdma_sq_rdma_wqe_1st *)wqe;
2849 
2850 		rwqe->wqe_size = 2;
2851 		rwqe2 = qed_chain_produce(&qp->sq.pbl);
2852 		length = qedr_prepare_sq_rdma_data(dev, qp, rwqe, rwqe2,
2853 						   wr, bad_wr);
2854 		rwqe->length = cpu_to_le32(length);
2855 		qp->wqe_wr_id[qp->sq.prod].wqe_size = rwqe->wqe_size;
2856 		qp->prev_wqe_size = rwqe->wqe_size;
2857 		qp->wqe_wr_id[qp->sq.prod].bytes_len = rwqe->length;
2858 		break;
2859 	case IB_WR_RDMA_READ_WITH_INV:
2860 		DP_ERR(dev,
2861 		       "RDMA READ WITH INVALIDATE not supported\n");
2862 		*bad_wr = wr;
2863 		rc = -EINVAL;
2864 		break;
2865 
2866 	case IB_WR_RDMA_READ:
2867 		wqe->req_type = RDMA_SQ_REQ_TYPE_RDMA_RD;
2868 		rwqe = (struct rdma_sq_rdma_wqe_1st *)wqe;
2869 
2870 		rwqe->wqe_size = 2;
2871 		rwqe2 = qed_chain_produce(&qp->sq.pbl);
2872 		length = qedr_prepare_sq_rdma_data(dev, qp, rwqe, rwqe2,
2873 						   wr, bad_wr);
2874 		rwqe->length = cpu_to_le32(length);
2875 		qp->wqe_wr_id[qp->sq.prod].wqe_size = rwqe->wqe_size;
2876 		qp->prev_wqe_size = rwqe->wqe_size;
2877 		qp->wqe_wr_id[qp->sq.prod].bytes_len = rwqe->length;
2878 		break;
2879 
2880 	case IB_WR_ATOMIC_CMP_AND_SWP:
2881 	case IB_WR_ATOMIC_FETCH_AND_ADD:
2882 		awqe1 = (struct rdma_sq_atomic_wqe_1st *)wqe;
2883 		awqe1->wqe_size = 4;
2884 
2885 		awqe2 = qed_chain_produce(&qp->sq.pbl);
2886 		DMA_REGPAIR_LE(awqe2->remote_va, atomic_wr(wr)->remote_addr);
2887 		awqe2->r_key = cpu_to_le32(atomic_wr(wr)->rkey);
2888 
2889 		awqe3 = qed_chain_produce(&qp->sq.pbl);
2890 
2891 		if (wr->opcode == IB_WR_ATOMIC_FETCH_AND_ADD) {
2892 			wqe->req_type = RDMA_SQ_REQ_TYPE_ATOMIC_ADD;
2893 			DMA_REGPAIR_LE(awqe3->swap_data,
2894 				       atomic_wr(wr)->compare_add);
2895 		} else {
2896 			wqe->req_type = RDMA_SQ_REQ_TYPE_ATOMIC_CMP_AND_SWAP;
2897 			DMA_REGPAIR_LE(awqe3->swap_data,
2898 				       atomic_wr(wr)->swap);
2899 			DMA_REGPAIR_LE(awqe3->cmp_data,
2900 				       atomic_wr(wr)->compare_add);
2901 		}
2902 
2903 		qedr_prepare_sq_sges(qp, NULL, wr);
2904 
2905 		qp->wqe_wr_id[qp->sq.prod].wqe_size = awqe1->wqe_size;
2906 		qp->prev_wqe_size = awqe1->wqe_size;
2907 		break;
2908 
2909 	case IB_WR_LOCAL_INV:
2910 		iwqe = (struct rdma_sq_local_inv_wqe *)wqe;
2911 		iwqe->wqe_size = 1;
2912 
2913 		iwqe->req_type = RDMA_SQ_REQ_TYPE_LOCAL_INVALIDATE;
2914 		iwqe->inv_l_key = wr->ex.invalidate_rkey;
2915 		qp->wqe_wr_id[qp->sq.prod].wqe_size = iwqe->wqe_size;
2916 		qp->prev_wqe_size = iwqe->wqe_size;
2917 		break;
2918 	case IB_WR_REG_MR:
2919 		DP_DEBUG(dev, QEDR_MSG_CQ, "REG_MR\n");
2920 		wqe->req_type = RDMA_SQ_REQ_TYPE_FAST_MR;
2921 		fwqe1 = (struct rdma_sq_fmr_wqe_1st *)wqe;
2922 		fwqe1->wqe_size = 2;
2923 
2924 		rc = qedr_prepare_reg(qp, fwqe1, reg_wr(wr));
2925 		if (rc) {
2926 			DP_ERR(dev, "IB_REG_MR failed rc=%d\n", rc);
2927 			*bad_wr = wr;
2928 			break;
2929 		}
2930 
2931 		qp->wqe_wr_id[qp->sq.prod].wqe_size = fwqe1->wqe_size;
2932 		qp->prev_wqe_size = fwqe1->wqe_size;
2933 		break;
2934 	default:
2935 		DP_ERR(dev, "invalid opcode 0x%x!\n", wr->opcode);
2936 		rc = -EINVAL;
2937 		*bad_wr = wr;
2938 		break;
2939 	}
2940 
2941 	if (*bad_wr) {
2942 		u16 value;
2943 
2944 		/* Restore prod to its position before
2945 		 * this WR was processed
2946 		 */
2947 		value = le16_to_cpu(qp->sq.db_data.data.value);
2948 		qed_chain_set_prod(&qp->sq.pbl, value, wqe);
2949 
2950 		/* Restore prev_wqe_size */
2951 		qp->prev_wqe_size = wqe->prev_wqe_size;
2952 		rc = -EINVAL;
2953 		DP_ERR(dev, "POST SEND FAILED\n");
2954 	}
2955 
2956 	return rc;
2957 }
2958 
2959 int qedr_post_send(struct ib_qp *ibqp, struct ib_send_wr *wr,
2960 		   struct ib_send_wr **bad_wr)
2961 {
2962 	struct qedr_dev *dev = get_qedr_dev(ibqp->device);
2963 	struct qedr_qp *qp = get_qedr_qp(ibqp);
2964 	unsigned long flags;
2965 	int rc = 0;
2966 
2967 	*bad_wr = NULL;
2968 
2969 	if (qp->qp_type == IB_QPT_GSI)
2970 		return qedr_gsi_post_send(ibqp, wr, bad_wr);
2971 
2972 	spin_lock_irqsave(&qp->q_lock, flags);
2973 
2974 	if ((qp->state == QED_ROCE_QP_STATE_RESET) ||
2975 	    (qp->state == QED_ROCE_QP_STATE_ERR)) {
2976 		spin_unlock_irqrestore(&qp->q_lock, flags);
2977 		*bad_wr = wr;
2978 		DP_DEBUG(dev, QEDR_MSG_CQ,
2979 			 "QP in wrong state! QP icid=0x%x state %d\n",
2980 			 qp->icid, qp->state);
2981 		return -EINVAL;
2982 	}
2983 
2984 	if (!wr) {
2985 		DP_ERR(dev, "Got an empty post send.\n");
		spin_unlock_irqrestore(&qp->q_lock, flags);
2986 		return -EINVAL;
2987 	}
2988 
2989 	while (wr) {
2990 		rc = __qedr_post_send(ibqp, wr, bad_wr);
2991 		if (rc)
2992 			break;
2993 
2994 		qp->wqe_wr_id[qp->sq.prod].wr_id = wr->wr_id;
2995 
2996 		qedr_inc_sw_prod(&qp->sq);
2997 
2998 		qp->sq.db_data.data.value++;
2999 
3000 		wr = wr->next;
3001 	}
3002 
3003 	/* Trigger doorbell.
3004 	 * If the first WR failed, the doorbell rings in vain; this is
3005 	 * harmless as long as the producer value is unchanged. For
3006 	 * performance reasons we avoid checking for this redundant
3007 	 * doorbell.
3008 	 */
3009 	wmb();
3010 	writel(qp->sq.db_data.raw, qp->sq.db);
3011 
3012 	/* Make sure write sticks */
3013 	mmiowb();
3014 
3015 	spin_unlock_irqrestore(&qp->q_lock, flags);
3016 
3017 	return rc;
3018 }
3019 
3020 int qedr_post_recv(struct ib_qp *ibqp, struct ib_recv_wr *wr,
3021 		   struct ib_recv_wr **bad_wr)
3022 {
3023 	struct qedr_qp *qp = get_qedr_qp(ibqp);
3024 	struct qedr_dev *dev = qp->dev;
3025 	unsigned long flags;
3026 	int status = 0;
3027 
3028 	if (qp->qp_type == IB_QPT_GSI)
3029 		return qedr_gsi_post_recv(ibqp, wr, bad_wr);
3030 
3031 	spin_lock_irqsave(&qp->q_lock, flags);
3032 
3033 	if ((qp->state == QED_ROCE_QP_STATE_RESET) ||
3034 	    (qp->state == QED_ROCE_QP_STATE_ERR)) {
3035 		spin_unlock_irqrestore(&qp->q_lock, flags);
3036 		*bad_wr = wr;
3037 		return -EINVAL;
3038 	}
3039 
3040 	while (wr) {
3041 		int i;
3042 
3043 		if (qed_chain_get_elem_left_u32(&qp->rq.pbl) <
3044 		    QEDR_MAX_RQE_ELEMENTS_PER_RQE ||
3045 		    wr->num_sge > qp->rq.max_sges) {
3046 			DP_ERR(dev, "Can't post WR (%d < %d) || (%d > %d)\n",
3047 			       qed_chain_get_elem_left_u32(&qp->rq.pbl),
3048 			       QEDR_MAX_RQE_ELEMENTS_PER_RQE, wr->num_sge,
3049 			       qp->rq.max_sges);
3050 			status = -ENOMEM;
3051 			*bad_wr = wr;
3052 			break;
3053 		}
3054 		for (i = 0; i < wr->num_sge; i++) {
3055 			u32 flags = 0;
3056 			struct rdma_rq_sge *rqe =
3057 			    qed_chain_produce(&qp->rq.pbl);
3058 
3059 			/* First one must include the number
3060 			 * of SGEs in the list
3061 			 */
3062 			if (!i)
3063 				SET_FIELD(flags, RDMA_RQ_SGE_NUM_SGES,
3064 					  wr->num_sge);
3065 
3066 			SET_FIELD(flags, RDMA_RQ_SGE_L_KEY,
3067 				  wr->sg_list[i].lkey);
3068 
3069 			RQ_SGE_SET(rqe, wr->sg_list[i].addr,
3070 				   wr->sg_list[i].length, flags);
3071 		}
3072 
3073 		/* Special case of no SGEs. The FW requires between 1 and 4
3074 		 * SGEs; in this case we post a single SGE with length zero,
3075 		 * since an RDMA write with immediate still consumes an RQ entry.
3076 		 */
3077 		if (!wr->num_sge) {
3078 			u32 flags = 0;
3079 			struct rdma_rq_sge *rqe =
3080 			    qed_chain_produce(&qp->rq.pbl);
3081 
3082 			/* First one must include the number
3083 			 * of SGEs in the list
3084 			 */
3085 			SET_FIELD(flags, RDMA_RQ_SGE_L_KEY, 0);
3086 			SET_FIELD(flags, RDMA_RQ_SGE_NUM_SGES, 1);
3087 
3088 			RQ_SGE_SET(rqe, 0, 0, flags);
3089 			i = 1;
3090 		}
3091 
3092 		qp->rqe_wr_id[qp->rq.prod].wr_id = wr->wr_id;
3093 		qp->rqe_wr_id[qp->rq.prod].wqe_size = i;
3094 
3095 		qedr_inc_sw_prod(&qp->rq);
3096 
3097 		/* Flush all the writes before signalling doorbell */
3098 		wmb();
3099 
3100 		qp->rq.db_data.data.value++;
3101 
3102 		writel(qp->rq.db_data.raw, qp->rq.db);
3103 
3104 		/* Make sure write sticks */
3105 		mmiowb();
3106 
3107 		wr = wr->next;
3108 	}
3109 
3110 	spin_unlock_irqrestore(&qp->q_lock, flags);
3111 
3112 	return status;
3113 }
3114 
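/* A CQE is new (i.e. still needs processing) when its toggle bit matches
 * cq->pbl_toggle; the SW toggle flips each time the CQ chain wraps.
 */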
3115 static int is_valid_cqe(struct qedr_cq *cq, union rdma_cqe *cqe)
3116 {
3117 	struct rdma_cqe_requester *resp_cqe = &cqe->req;
3118 
3119 	return (resp_cqe->flags & RDMA_CQE_REQUESTER_TOGGLE_BIT_MASK) ==
3120 		cq->pbl_toggle;
3121 }
3122 
3123 static struct qedr_qp *cqe_get_qp(union rdma_cqe *cqe)
3124 {
3125 	struct rdma_cqe_requester *resp_cqe = &cqe->req;
3126 	struct qedr_qp *qp;
3127 
3128 	qp = (struct qedr_qp *)(uintptr_t)HILO_GEN(resp_cqe->qp_handle.hi,
3129 						   resp_cqe->qp_handle.lo,
3130 						   u64);
3131 	return qp;
3132 }
3133 
3134 static enum rdma_cqe_type cqe_get_type(union rdma_cqe *cqe)
3135 {
3136 	struct rdma_cqe_requester *resp_cqe = &cqe->req;
3137 
3138 	return GET_FIELD(resp_cqe->flags, RDMA_CQE_REQUESTER_TYPE);
3139 }
3140 
3141 /* Return latest CQE (needs processing) */
3142 static union rdma_cqe *get_cqe(struct qedr_cq *cq)
3143 {
3144 	return cq->latest_cqe;
3145 }
3146 
3147 /* For FMRs we need to increment the completed counter used by the FMR
3148  * algorithm that decides whether a PBL can be freed. This must be done
3149  * whether or not the work request was signaled, so this function is also
3150  * called from the condition that skips a WR, to make sure an unsignaled
3151  * FMR operation is not missed.
3152  */
3154 static inline void qedr_chk_if_fmr(struct qedr_qp *qp)
3155 {
3156 	if (qp->wqe_wr_id[qp->sq.cons].opcode == IB_WC_REG_MR)
3157 		qp->wqe_wr_id[qp->sq.cons].mr->info.completed++;
3158 }
3159 
3160 static int process_req(struct qedr_dev *dev, struct qedr_qp *qp,
3161 		       struct qedr_cq *cq, int num_entries,
3162 		       struct ib_wc *wc, u16 hw_cons, enum ib_wc_status status,
3163 		       int force)
3164 {
3165 	u16 cnt = 0;
3166 
3167 	while (num_entries && qp->sq.wqe_cons != hw_cons) {
3168 		if (!qp->wqe_wr_id[qp->sq.cons].signaled && !force) {
3169 			qedr_chk_if_fmr(qp);
3170 			/* skip WC */
3171 			goto next_cqe;
3172 		}
3173 
3174 		/* fill WC */
3175 		wc->status = status;
3176 		wc->wc_flags = 0;
3177 		wc->src_qp = qp->id;
3178 		wc->qp = &qp->ibqp;
3179 
3180 		wc->wr_id = qp->wqe_wr_id[qp->sq.cons].wr_id;
3181 		wc->opcode = qp->wqe_wr_id[qp->sq.cons].opcode;
3182 
3183 		switch (wc->opcode) {
3184 		case IB_WC_RDMA_WRITE:
3185 			wc->byte_len = qp->wqe_wr_id[qp->sq.cons].bytes_len;
3186 			break;
3187 		case IB_WC_COMP_SWAP:
3188 		case IB_WC_FETCH_ADD:
3189 			wc->byte_len = 8;
3190 			break;
3191 		case IB_WC_REG_MR:
3192 			qp->wqe_wr_id[qp->sq.cons].mr->info.completed++;
3193 			break;
3194 		default:
3195 			break;
3196 		}
3197 
3198 		num_entries--;
3199 		wc++;
3200 		cnt++;
3201 next_cqe:
3202 		while (qp->wqe_wr_id[qp->sq.cons].wqe_size--)
3203 			qed_chain_consume(&qp->sq.pbl);
3204 		qedr_inc_sw_cons(&qp->sq);
3205 	}
3206 
3207 	return cnt;
3208 }
3209 
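/* Handle a requester CQE: on success or flush, complete SQ WRs up to the
 * HW consumer; on any other error, complete the preceding WRs with
 * success and then emit a single WC carrying the translated error status.
 */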
3210 static int qedr_poll_cq_req(struct qedr_dev *dev,
3211 			    struct qedr_qp *qp, struct qedr_cq *cq,
3212 			    int num_entries, struct ib_wc *wc,
3213 			    struct rdma_cqe_requester *req)
3214 {
3215 	int cnt = 0;
3216 
3217 	switch (req->status) {
3218 	case RDMA_CQE_REQ_STS_OK:
3219 		cnt = process_req(dev, qp, cq, num_entries, wc, req->sq_cons,
3220 				  IB_WC_SUCCESS, 0);
3221 		break;
3222 	case RDMA_CQE_REQ_STS_WORK_REQUEST_FLUSHED_ERR:
3223 		DP_ERR(dev,
3224 		       "Error: POLL CQ with RDMA_CQE_REQ_STS_WORK_REQUEST_FLUSHED_ERR. CQ icid=0x%x, QP icid=0x%x\n",
3225 		       cq->icid, qp->icid);
3226 		cnt = process_req(dev, qp, cq, num_entries, wc, req->sq_cons,
3227 				  IB_WC_WR_FLUSH_ERR, 0);
3228 		break;
3229 	default:
3230 		/* process all WQEs before the consumer */
3231 		qp->state = QED_ROCE_QP_STATE_ERR;
3232 		cnt = process_req(dev, qp, cq, num_entries, wc,
3233 				  req->sq_cons - 1, IB_WC_SUCCESS, 0);
3234 		wc += cnt;
3235 		/* if we have extra WC fill it with actual error info */
3236 		if (cnt < num_entries) {
3237 			enum ib_wc_status wc_status;
3238 
3239 			switch (req->status) {
3240 			case RDMA_CQE_REQ_STS_BAD_RESPONSE_ERR:
3241 				DP_ERR(dev,
3242 				       "Error: POLL CQ with RDMA_CQE_REQ_STS_BAD_RESPONSE_ERR. CQ icid=0x%x, QP icid=0x%x\n",
3243 				       cq->icid, qp->icid);
3244 				wc_status = IB_WC_BAD_RESP_ERR;
3245 				break;
3246 			case RDMA_CQE_REQ_STS_LOCAL_LENGTH_ERR:
3247 				DP_ERR(dev,
3248 				       "Error: POLL CQ with RDMA_CQE_REQ_STS_LOCAL_LENGTH_ERR. CQ icid=0x%x, QP icid=0x%x\n",
3249 				       cq->icid, qp->icid);
3250 				wc_status = IB_WC_LOC_LEN_ERR;
3251 				break;
3252 			case RDMA_CQE_REQ_STS_LOCAL_QP_OPERATION_ERR:
3253 				DP_ERR(dev,
3254 				       "Error: POLL CQ with RDMA_CQE_REQ_STS_LOCAL_QP_OPERATION_ERR. CQ icid=0x%x, QP icid=0x%x\n",
3255 				       cq->icid, qp->icid);
3256 				wc_status = IB_WC_LOC_QP_OP_ERR;
3257 				break;
3258 			case RDMA_CQE_REQ_STS_LOCAL_PROTECTION_ERR:
3259 				DP_ERR(dev,
3260 				       "Error: POLL CQ with RDMA_CQE_REQ_STS_LOCAL_PROTECTION_ERR. CQ icid=0x%x, QP icid=0x%x\n",
3261 				       cq->icid, qp->icid);
3262 				wc_status = IB_WC_LOC_PROT_ERR;
3263 				break;
3264 			case RDMA_CQE_REQ_STS_MEMORY_MGT_OPERATION_ERR:
3265 				DP_ERR(dev,
3266 				       "Error: POLL CQ with RDMA_CQE_REQ_STS_MEMORY_MGT_OPERATION_ERR. CQ icid=0x%x, QP icid=0x%x\n",
3267 				       cq->icid, qp->icid);
3268 				wc_status = IB_WC_MW_BIND_ERR;
3269 				break;
3270 			case RDMA_CQE_REQ_STS_REMOTE_INVALID_REQUEST_ERR:
3271 				DP_ERR(dev,
3272 				       "Error: POLL CQ with RDMA_CQE_REQ_STS_REMOTE_INVALID_REQUEST_ERR. CQ icid=0x%x, QP icid=0x%x\n",
3273 				       cq->icid, qp->icid);
3274 				wc_status = IB_WC_REM_INV_REQ_ERR;
3275 				break;
3276 			case RDMA_CQE_REQ_STS_REMOTE_ACCESS_ERR:
3277 				DP_ERR(dev,
3278 				       "Error: POLL CQ with RDMA_CQE_REQ_STS_REMOTE_ACCESS_ERR. CQ icid=0x%x, QP icid=0x%x\n",
3279 				       cq->icid, qp->icid);
3280 				wc_status = IB_WC_REM_ACCESS_ERR;
3281 				break;
3282 			case RDMA_CQE_REQ_STS_REMOTE_OPERATION_ERR:
3283 				DP_ERR(dev,
3284 				       "Error: POLL CQ with RDMA_CQE_REQ_STS_REMOTE_OPERATION_ERR. CQ icid=0x%x, QP icid=0x%x\n",
3285 				       cq->icid, qp->icid);
3286 				wc_status = IB_WC_REM_OP_ERR;
3287 				break;
3288 			case RDMA_CQE_REQ_STS_RNR_NAK_RETRY_CNT_ERR:
3289 				DP_ERR(dev,
3290 				       "Error: POLL CQ with RDMA_CQE_REQ_STS_RNR_NAK_RETRY_CNT_ERR. CQ icid=0x%x, QP icid=0x%x\n",
3291 				       cq->icid, qp->icid);
3292 				wc_status = IB_WC_RNR_RETRY_EXC_ERR;
3293 				break;
3294 			case RDMA_CQE_REQ_STS_TRANSPORT_RETRY_CNT_ERR:
3295 				DP_ERR(dev,
3296 				       "Error: POLL CQ with RDMA_CQE_REQ_STS_TRANSPORT_RETRY_CNT_ERR. CQ icid=0x%x, QP icid=0x%x\n",
3297 				       cq->icid, qp->icid);
3298 				wc_status = IB_WC_RETRY_EXC_ERR;
3299 				break;
3300 			default:
3301 				DP_ERR(dev,
3302 				       "Error: POLL CQ with IB_WC_GENERAL_ERR. CQ icid=0x%x, QP icid=0x%x\n",
3303 				       cq->icid, qp->icid);
3304 				wc_status = IB_WC_GENERAL_ERR;
3305 			}
3306 			cnt += process_req(dev, qp, cq, 1, wc, req->sq_cons,
3307 					   wc_status, 1);
3308 		}
3309 	}
3310 
3311 	return cnt;
3312 }
3313 
3314 static void __process_resp_one(struct qedr_dev *dev, struct qedr_qp *qp,
3315 			       struct qedr_cq *cq, struct ib_wc *wc,
3316 			       struct rdma_cqe_responder *resp, u64 wr_id)
3317 {
3318 	enum ib_wc_status wc_status = IB_WC_SUCCESS;
3319 	u8 flags;
3320 
3321 	wc->opcode = IB_WC_RECV;
3322 	wc->wc_flags = 0;
3323 
3324 	switch (resp->status) {
3325 	case RDMA_CQE_RESP_STS_LOCAL_ACCESS_ERR:
3326 		wc_status = IB_WC_LOC_ACCESS_ERR;
3327 		break;
3328 	case RDMA_CQE_RESP_STS_LOCAL_LENGTH_ERR:
3329 		wc_status = IB_WC_LOC_LEN_ERR;
3330 		break;
3331 	case RDMA_CQE_RESP_STS_LOCAL_QP_OPERATION_ERR:
3332 		wc_status = IB_WC_LOC_QP_OP_ERR;
3333 		break;
3334 	case RDMA_CQE_RESP_STS_LOCAL_PROTECTION_ERR:
3335 		wc_status = IB_WC_LOC_PROT_ERR;
3336 		break;
3337 	case RDMA_CQE_RESP_STS_MEMORY_MGT_OPERATION_ERR:
3338 		wc_status = IB_WC_MW_BIND_ERR;
3339 		break;
3340 	case RDMA_CQE_RESP_STS_REMOTE_INVALID_REQUEST_ERR:
3341 		wc_status = IB_WC_REM_INV_RD_REQ_ERR;
3342 		break;
3343 	case RDMA_CQE_RESP_STS_OK:
3344 		wc_status = IB_WC_SUCCESS;
3345 		wc->byte_len = le32_to_cpu(resp->length);
3346 
3347 		flags = resp->flags & QEDR_RESP_RDMA_IMM;
3348 
3349 		if (flags == QEDR_RESP_RDMA_IMM)
3350 			wc->opcode = IB_WC_RECV_RDMA_WITH_IMM;
3351 
3352 		if (flags == QEDR_RESP_RDMA_IMM || flags == QEDR_RESP_IMM) {
3353 			wc->ex.imm_data =
3354 				le32_to_cpu(resp->imm_data_or_inv_r_Key);
3355 			wc->wc_flags |= IB_WC_WITH_IMM;
3356 		}
3357 		break;
3358 	default:
3359 		wc_status = IB_WC_GENERAL_ERR;
3360 		DP_ERR(dev, "Invalid CQE status detected\n");
3361 	}
3362 
3363 	/* fill WC */
3364 	wc->status = wc_status;
3365 	wc->src_qp = qp->id;
3366 	wc->qp = &qp->ibqp;
3367 	wc->wr_id = wr_id;
3368 }
3369 
3370 static int process_resp_one(struct qedr_dev *dev, struct qedr_qp *qp,
3371 			    struct qedr_cq *cq, struct ib_wc *wc,
3372 			    struct rdma_cqe_responder *resp)
3373 {
3374 	u64 wr_id = qp->rqe_wr_id[qp->rq.cons].wr_id;
3375 
3376 	__process_resp_one(dev, qp, cq, wc, resp, wr_id);
3377 
3378 	while (qp->rqe_wr_id[qp->rq.cons].wqe_size--)
3379 		qed_chain_consume(&qp->rq.pbl);
3380 	qedr_inc_sw_cons(&qp->rq);
3381 
3382 	return 1;
3383 }
3384 
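/* Flush the RQ: generate IB_WC_WR_FLUSH_ERR completions for every posted
 * receive up to the HW consumer, consuming the matching chain elements.
 */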
3385 static int process_resp_flush(struct qedr_qp *qp, struct qedr_cq *cq,
3386 			      int num_entries, struct ib_wc *wc, u16 hw_cons)
3387 {
3388 	u16 cnt = 0;
3389 
3390 	while (num_entries && qp->rq.wqe_cons != hw_cons) {
3391 		/* fill WC */
3392 		wc->status = IB_WC_WR_FLUSH_ERR;
3393 		wc->wc_flags = 0;
3394 		wc->src_qp = qp->id;
3395 		wc->byte_len = 0;
3396 		wc->wr_id = qp->rqe_wr_id[qp->rq.cons].wr_id;
3397 		wc->qp = &qp->ibqp;
3398 		num_entries--;
3399 		wc++;
3400 		cnt++;
3401 		while (qp->rqe_wr_id[qp->rq.cons].wqe_size--)
3402 			qed_chain_consume(&qp->rq.pbl);
3403 		qedr_inc_sw_cons(&qp->rq);
3404 	}
3405 
3406 	return cnt;
3407 }
3408 
3409 static void try_consume_resp_cqe(struct qedr_cq *cq, struct qedr_qp *qp,
3410 				 struct rdma_cqe_responder *resp, int *update)
3411 {
3412 	if (le16_to_cpu(resp->rq_cons) == qp->rq.wqe_cons) {
3413 		consume_cqe(cq);
3414 		*update |= 1;
3415 	}
3416 }
3417 
3418 static int qedr_poll_cq_resp(struct qedr_dev *dev, struct qedr_qp *qp,
3419 			     struct qedr_cq *cq, int num_entries,
3420 			     struct ib_wc *wc, struct rdma_cqe_responder *resp,
3421 			     int *update)
3422 {
3423 	int cnt;
3424 
3425 	if (resp->status == RDMA_CQE_RESP_STS_WORK_REQUEST_FLUSHED_ERR) {
3426 		cnt = process_resp_flush(qp, cq, num_entries, wc,
3427 					 le16_to_cpu(resp->rq_cons));
3428 		try_consume_resp_cqe(cq, qp, resp, update);
3429 	} else {
3430 		cnt = process_resp_one(dev, qp, cq, wc, resp);
3431 		consume_cqe(cq);
3432 		*update |= 1;
3433 	}
3434 
3435 	return cnt;
3436 }
3437 
3438 static void try_consume_req_cqe(struct qedr_cq *cq, struct qedr_qp *qp,
3439 				struct rdma_cqe_requester *req, int *update)
3440 {
3441 	if (le16_to_cpu(req->sq_cons) == qp->sq.wqe_cons) {
3442 		consume_cqe(cq);
3443 		*update |= 1;
3444 	}
3445 }
3446 
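/* Poll the CQ: walk the valid CQEs, dispatch requester vs. responder
 * handling, and finally ring the doorbell with the last consumed index
 * so the HW knows how far SW has read.
 */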
3447 int qedr_poll_cq(struct ib_cq *ibcq, int num_entries, struct ib_wc *wc)
3448 {
3449 	struct qedr_dev *dev = get_qedr_dev(ibcq->device);
3450 	struct qedr_cq *cq = get_qedr_cq(ibcq);
3451 	union rdma_cqe *cqe = cq->latest_cqe;
3452 	u32 old_cons, new_cons;
3453 	unsigned long flags;
3454 	int update = 0;
3455 	int done = 0;
3456 
3457 	if (cq->cq_type == QEDR_CQ_TYPE_GSI)
3458 		return qedr_gsi_poll_cq(ibcq, num_entries, wc);
3459 
3460 	spin_lock_irqsave(&cq->cq_lock, flags);
3461 	old_cons = qed_chain_get_cons_idx_u32(&cq->pbl);
3462 	while (num_entries && is_valid_cqe(cq, cqe)) {
3463 		struct qedr_qp *qp;
3464 		int cnt = 0;
3465 
3466 		/* prevent speculative reads of any field of CQE */
3467 		rmb();
3468 
3469 		qp = cqe_get_qp(cqe);
3470 		if (!qp) {
3471 			WARN(1, "Error: CQE QP pointer is NULL. CQE=%p\n", cqe);
3472 			break;
3473 		}
3474 
3475 		wc->qp = &qp->ibqp;
3476 
3477 		switch (cqe_get_type(cqe)) {
3478 		case RDMA_CQE_TYPE_REQUESTER:
3479 			cnt = qedr_poll_cq_req(dev, qp, cq, num_entries, wc,
3480 					       &cqe->req);
3481 			try_consume_req_cqe(cq, qp, &cqe->req, &update);
3482 			break;
3483 		case RDMA_CQE_TYPE_RESPONDER_RQ:
3484 			cnt = qedr_poll_cq_resp(dev, qp, cq, num_entries, wc,
3485 						&cqe->resp, &update);
3486 			break;
3487 		case RDMA_CQE_TYPE_INVALID:
3488 		default:
3489 			DP_ERR(dev, "Error: invalid CQE type = %d\n",
3490 			       cqe_get_type(cqe));
3491 		}
3492 		num_entries -= cnt;
3493 		wc += cnt;
3494 		done += cnt;
3495 
3496 		cqe = get_cqe(cq);
3497 	}
3498 	new_cons = qed_chain_get_cons_idx_u32(&cq->pbl);
3499 
3500 	cq->cq_cons += new_cons - old_cons;
3501 
3502 	if (update)
3503 		/* doorbell notifies about the latest VALID entry,
3504 		 * but the chain already points to the next INVALID one
3505 		 */
3506 		doorbell_cq(cq, cq->cq_cons - 1, cq->arm_flags);
3507 
3508 	spin_unlock_irqrestore(&cq->cq_lock, flags);
3509 	return done;
3510 }
3511 
3512 int qedr_process_mad(struct ib_device *ibdev, int process_mad_flags,
3513 		     u8 port_num,
3514 		     const struct ib_wc *in_wc,
3515 		     const struct ib_grh *in_grh,
3516 		     const struct ib_mad_hdr *mad_hdr,
3517 		     size_t in_mad_size, struct ib_mad_hdr *out_mad,
3518 		     size_t *out_mad_size, u16 *out_mad_pkey_index)
3519 {
3520 	struct qedr_dev *dev = get_qedr_dev(ibdev);
3521 
3522 	DP_DEBUG(dev, QEDR_MSG_GSI,
3523 		 "QEDR_PROCESS_MAD in_mad %x %x %x %x %x %x %x %x\n",
3524 		 mad_hdr->attr_id, mad_hdr->base_version, mad_hdr->attr_mod,
3525 		 mad_hdr->class_specific, mad_hdr->class_version,
3526 		 mad_hdr->method, mad_hdr->mgmt_class, mad_hdr->status);
3527 	return IB_MAD_RESULT_SUCCESS;
3528 }
3529 
3530 int qedr_port_immutable(struct ib_device *ibdev, u8 port_num,
3531 			struct ib_port_immutable *immutable)
3532 {
3533 	struct ib_port_attr attr;
3534 	int err;
3535 
3536 	err = qedr_query_port(ibdev, port_num, &attr);
3537 	if (err)
3538 		return err;
3539 
3540 	immutable->pkey_tbl_len = attr.pkey_tbl_len;
3541 	immutable->gid_tbl_len = attr.gid_tbl_len;
3542 	immutable->core_cap_flags = RDMA_CORE_PORT_IBA_ROCE |
3543 				    RDMA_CORE_PORT_IBA_ROCE_UDP_ENCAP;
3544 	immutable->max_mad_size = IB_MGMT_MAD_SIZE;
3545 
3546 	return 0;
3547 }
3548