xref: /openbmc/linux/drivers/infiniband/hw/efa/efa_verbs.c (revision 40ddb3f020834f9afb7aab31385994811f4db259)
// SPDX-License-Identifier: GPL-2.0 OR Linux-OpenIB
/*
 * Copyright 2018-2019 Amazon.com, Inc. or its affiliates. All rights reserved.
 */
540909f66SGal Pressman 
640909f66SGal Pressman #include <linux/vmalloc.h>
740909f66SGal Pressman 
840909f66SGal Pressman #include <rdma/ib_addr.h>
940909f66SGal Pressman #include <rdma/ib_umem.h>
1040909f66SGal Pressman #include <rdma/ib_user_verbs.h>
1140909f66SGal Pressman #include <rdma/ib_verbs.h>
1240909f66SGal Pressman #include <rdma/uverbs_ioctl.h>
1340909f66SGal Pressman 
1440909f66SGal Pressman #include "efa.h"
1540909f66SGal Pressman 
/*
 * Layout of an mmap key (see get_mmap_key()): the entry type is stored at
 * bit EFA_MMAP_FLAG_SHIFT and above, the page offset in the bits below it.
 */
#define EFA_MMAP_FLAG_SHIFT	56
#define EFA_MMAP_PAGE_MASK	GENMASK(EFA_MMAP_FLAG_SHIFT - 1, 0)
/* Key returned by mmap_entry_insert() when no entry could be created */
#define EFA_MMAP_INVALID	U64_MAX
1940909f66SGal Pressman 
/*
 * Values stored in efa_mmap_entry.mmap_flag.
 * NOTE(review): WC/NC presumably stand for write-combined / non-cached I/O
 * mappings -- confirm against the mmap handler.
 */
enum {
	EFA_MMAP_DMA_PAGE	= 0,
	EFA_MMAP_IO_WC		= 1,
	EFA_MMAP_IO_NC		= 2,
};
2540909f66SGal Pressman 
/* Bitmask built from the four EFA_ADMIN_* AENQ group numbers listed below */
#define EFA_AENQ_ENABLED_GROUPS		\
	(BIT(EFA_ADMIN_FATAL_ERROR) |	\
	 BIT(EFA_ADMIN_WARNING) |	\
	 BIT(EFA_ADMIN_NOTIFICATION) |	\
	 BIT(EFA_ADMIN_KEEP_ALIVE))
2940909f66SGal Pressman 
3040909f66SGal Pressman struct efa_mmap_entry {
3140909f66SGal Pressman 	void  *obj;
3240909f66SGal Pressman 	u64 address;
3340909f66SGal Pressman 	u64 length;
3440909f66SGal Pressman 	u32 mmap_page;
3540909f66SGal Pressman 	u8 mmap_flag;
3640909f66SGal Pressman };
3740909f66SGal Pressman 
3840909f66SGal Pressman static inline u64 get_mmap_key(const struct efa_mmap_entry *efa)
3940909f66SGal Pressman {
4040909f66SGal Pressman 	return ((u64)efa->mmap_flag << EFA_MMAP_FLAG_SHIFT) |
4140909f66SGal Pressman 	       ((u64)efa->mmap_page << PAGE_SHIFT);
4240909f66SGal Pressman }
4340909f66SGal Pressman 
/* Payload described by one chunk entry: BIT(12) bytes, 8-byte pointers */
#define EFA_CHUNK_PAYLOAD_SHIFT		12
#define EFA_CHUNK_PAYLOAD_SIZE		BIT(EFA_CHUNK_PAYLOAD_SHIFT)
#define EFA_CHUNK_PAYLOAD_PTR_SIZE	8

/* A chunk itself is BIT(12) bytes */
#define EFA_CHUNK_SHIFT			12
#define EFA_CHUNK_SIZE			BIT(EFA_CHUNK_SHIFT)
/*
 * Room reserved in every chunk for one struct efa_com_ctrl_buff_info.
 * NOTE(review): presumably the link to the next chunk -- confirm.
 */
#define EFA_CHUNK_PTR_SIZE		sizeof(struct efa_com_ctrl_buff_info)

/* Payload pointers that fit in a chunk next to the reserved control info */
#define EFA_PTRS_PER_CHUNK \
	((EFA_CHUNK_SIZE - EFA_CHUNK_PTR_SIZE) / EFA_CHUNK_PAYLOAD_PTR_SIZE)

/* Bytes of a chunk actually occupied by the pointers plus the control info */
#define EFA_CHUNK_USED_SIZE \
	((EFA_PTRS_PER_CHUNK * EFA_CHUNK_PAYLOAD_PTR_SIZE) + EFA_CHUNK_PTR_SIZE)

/* The only access flag this file declares as supported */
#define EFA_SUPPORTED_ACCESS_FLAGS	IB_ACCESS_LOCAL_WRITE
5940909f66SGal Pressman 
6040909f66SGal Pressman struct pbl_chunk {
6140909f66SGal Pressman 	dma_addr_t dma_addr;
6240909f66SGal Pressman 	u64 *buf;
6340909f66SGal Pressman 	u32 length;
6440909f66SGal Pressman };
6540909f66SGal Pressman 
/* Array of PBL chunks together with its element count */
struct pbl_chunk_list {
	struct pbl_chunk *chunks;
	unsigned int size;
};
7040909f66SGal Pressman 
7140909f66SGal Pressman struct pbl_context {
7240909f66SGal Pressman 	union {
7340909f66SGal Pressman 		struct {
7440909f66SGal Pressman 			dma_addr_t dma_addr;
7540909f66SGal Pressman 		} continuous;
7640909f66SGal Pressman 		struct {
7740909f66SGal Pressman 			u32 pbl_buf_size_in_pages;
7840909f66SGal Pressman 			struct scatterlist *sgl;
7940909f66SGal Pressman 			int sg_dma_cnt;
8040909f66SGal Pressman 			struct pbl_chunk_list chunk_list;
8140909f66SGal Pressman 		} indirect;
8240909f66SGal Pressman 	} phys;
8340909f66SGal Pressman 	u64 *pbl_buf;
8440909f66SGal Pressman 	u32 pbl_buf_size_in_bytes;
8540909f66SGal Pressman 	u8 physically_continuous;
8640909f66SGal Pressman };
8740909f66SGal Pressman 
8840909f66SGal Pressman static inline struct efa_dev *to_edev(struct ib_device *ibdev)
8940909f66SGal Pressman {
9040909f66SGal Pressman 	return container_of(ibdev, struct efa_dev, ibdev);
9140909f66SGal Pressman }
9240909f66SGal Pressman 
9340909f66SGal Pressman static inline struct efa_ucontext *to_eucontext(struct ib_ucontext *ibucontext)
9440909f66SGal Pressman {
9540909f66SGal Pressman 	return container_of(ibucontext, struct efa_ucontext, ibucontext);
9640909f66SGal Pressman }
9740909f66SGal Pressman 
9840909f66SGal Pressman static inline struct efa_pd *to_epd(struct ib_pd *ibpd)
9940909f66SGal Pressman {
10040909f66SGal Pressman 	return container_of(ibpd, struct efa_pd, ibpd);
10140909f66SGal Pressman }
10240909f66SGal Pressman 
10340909f66SGal Pressman static inline struct efa_mr *to_emr(struct ib_mr *ibmr)
10440909f66SGal Pressman {
10540909f66SGal Pressman 	return container_of(ibmr, struct efa_mr, ibmr);
10640909f66SGal Pressman }
10740909f66SGal Pressman 
10840909f66SGal Pressman static inline struct efa_qp *to_eqp(struct ib_qp *ibqp)
10940909f66SGal Pressman {
11040909f66SGal Pressman 	return container_of(ibqp, struct efa_qp, ibqp);
11140909f66SGal Pressman }
11240909f66SGal Pressman 
11340909f66SGal Pressman static inline struct efa_cq *to_ecq(struct ib_cq *ibcq)
11440909f66SGal Pressman {
11540909f66SGal Pressman 	return container_of(ibcq, struct efa_cq, ibcq);
11640909f66SGal Pressman }
11740909f66SGal Pressman 
11840909f66SGal Pressman static inline struct efa_ah *to_eah(struct ib_ah *ibah)
11940909f66SGal Pressman {
12040909f66SGal Pressman 	return container_of(ibah, struct efa_ah, ibah);
12140909f66SGal Pressman }
12240909f66SGal Pressman 
/* True when member @fld of @x lies entirely within the first @sz bytes */
#define field_avail(x, fld, sz) \
	(offsetof(typeof(x), fld) + sizeof(((typeof(x) *)0)->fld) <= (sz))

/* True when every byte of the array @reserved is zero */
#define is_reserved_cleared(reserved) \
	(!memchr_inv(reserved, 0, sizeof(reserved)))
12840909f66SGal Pressman 
12940909f66SGal Pressman static void *efa_zalloc_mapped(struct efa_dev *dev, dma_addr_t *dma_addr,
13040909f66SGal Pressman 			       size_t size, enum dma_data_direction dir)
13140909f66SGal Pressman {
13240909f66SGal Pressman 	void *addr;
13340909f66SGal Pressman 
13440909f66SGal Pressman 	addr = alloc_pages_exact(size, GFP_KERNEL | __GFP_ZERO);
13540909f66SGal Pressman 	if (!addr)
13640909f66SGal Pressman 		return NULL;
13740909f66SGal Pressman 
13840909f66SGal Pressman 	*dma_addr = dma_map_single(&dev->pdev->dev, addr, size, dir);
13940909f66SGal Pressman 	if (dma_mapping_error(&dev->pdev->dev, *dma_addr)) {
14040909f66SGal Pressman 		ibdev_err(&dev->ibdev, "Failed to map DMA address\n");
14140909f66SGal Pressman 		free_pages_exact(addr, size);
14240909f66SGal Pressman 		return NULL;
14340909f66SGal Pressman 	}
14440909f66SGal Pressman 
14540909f66SGal Pressman 	return addr;
14640909f66SGal Pressman }
14740909f66SGal Pressman 
14840909f66SGal Pressman /*
14940909f66SGal Pressman  * This is only called when the ucontext is destroyed and there can be no
15040909f66SGal Pressman  * concurrent query via mmap or allocate on the xarray, thus we can be sure no
15140909f66SGal Pressman  * other thread is using the entry pointer. We also know that all the BAR
15240909f66SGal Pressman  * pages have either been zap'd or munmaped at this point.  Normal pages are
15340909f66SGal Pressman  * refcounted and will be freed at the proper time.
15440909f66SGal Pressman  */
15540909f66SGal Pressman static void mmap_entries_remove_free(struct efa_dev *dev,
15640909f66SGal Pressman 				     struct efa_ucontext *ucontext)
15740909f66SGal Pressman {
15840909f66SGal Pressman 	struct efa_mmap_entry *entry;
15940909f66SGal Pressman 	unsigned long mmap_page;
16040909f66SGal Pressman 
16140909f66SGal Pressman 	xa_for_each(&ucontext->mmap_xa, mmap_page, entry) {
16240909f66SGal Pressman 		xa_erase(&ucontext->mmap_xa, mmap_page);
16340909f66SGal Pressman 
16440909f66SGal Pressman 		ibdev_dbg(
16540909f66SGal Pressman 			&dev->ibdev,
16640909f66SGal Pressman 			"mmap: obj[0x%p] key[%#llx] addr[%#llx] len[%#llx] removed\n",
16740909f66SGal Pressman 			entry->obj, get_mmap_key(entry), entry->address,
16840909f66SGal Pressman 			entry->length);
16940909f66SGal Pressman 		if (entry->mmap_flag == EFA_MMAP_DMA_PAGE)
17040909f66SGal Pressman 			/* DMA mapping is already gone, now free the pages */
17140909f66SGal Pressman 			free_pages_exact(phys_to_virt(entry->address),
17240909f66SGal Pressman 					 entry->length);
17340909f66SGal Pressman 		kfree(entry);
17440909f66SGal Pressman 	}
17540909f66SGal Pressman }
17640909f66SGal Pressman 
17740909f66SGal Pressman static struct efa_mmap_entry *mmap_entry_get(struct efa_dev *dev,
17840909f66SGal Pressman 					     struct efa_ucontext *ucontext,
17940909f66SGal Pressman 					     u64 key, u64 len)
18040909f66SGal Pressman {
18140909f66SGal Pressman 	struct efa_mmap_entry *entry;
18240909f66SGal Pressman 	u64 mmap_page;
18340909f66SGal Pressman 
18440909f66SGal Pressman 	mmap_page = (key & EFA_MMAP_PAGE_MASK) >> PAGE_SHIFT;
18540909f66SGal Pressman 	if (mmap_page > U32_MAX)
18640909f66SGal Pressman 		return NULL;
18740909f66SGal Pressman 
18840909f66SGal Pressman 	entry = xa_load(&ucontext->mmap_xa, mmap_page);
18940909f66SGal Pressman 	if (!entry || get_mmap_key(entry) != key || entry->length != len)
19040909f66SGal Pressman 		return NULL;
19140909f66SGal Pressman 
19240909f66SGal Pressman 	ibdev_dbg(&dev->ibdev,
19340909f66SGal Pressman 		  "mmap: obj[0x%p] key[%#llx] addr[%#llx] len[%#llx] removed\n",
19440909f66SGal Pressman 		  entry->obj, key, entry->address, entry->length);
19540909f66SGal Pressman 
19640909f66SGal Pressman 	return entry;
19740909f66SGal Pressman }
19840909f66SGal Pressman 
19940909f66SGal Pressman /*
20040909f66SGal Pressman  * Note this locking scheme cannot support removal of entries, except during
20140909f66SGal Pressman  * ucontext destruction when the core code guarentees no concurrency.
20240909f66SGal Pressman  */
20340909f66SGal Pressman static u64 mmap_entry_insert(struct efa_dev *dev, struct efa_ucontext *ucontext,
20440909f66SGal Pressman 			     void *obj, u64 address, u64 length, u8 mmap_flag)
20540909f66SGal Pressman {
20640909f66SGal Pressman 	struct efa_mmap_entry *entry;
20740909f66SGal Pressman 	int err;
20840909f66SGal Pressman 
20940909f66SGal Pressman 	entry = kmalloc(sizeof(*entry), GFP_KERNEL);
21040909f66SGal Pressman 	if (!entry)
21140909f66SGal Pressman 		return EFA_MMAP_INVALID;
21240909f66SGal Pressman 
21340909f66SGal Pressman 	entry->obj = obj;
21440909f66SGal Pressman 	entry->address = address;
21540909f66SGal Pressman 	entry->length = length;
21640909f66SGal Pressman 	entry->mmap_flag = mmap_flag;
21740909f66SGal Pressman 
21840909f66SGal Pressman 	xa_lock(&ucontext->mmap_xa);
21940909f66SGal Pressman 	entry->mmap_page = ucontext->mmap_xa_page;
22040909f66SGal Pressman 	ucontext->mmap_xa_page += DIV_ROUND_UP(length, PAGE_SIZE);
22140909f66SGal Pressman 	err = __xa_insert(&ucontext->mmap_xa, entry->mmap_page, entry,
22240909f66SGal Pressman 			  GFP_KERNEL);
22340909f66SGal Pressman 	xa_unlock(&ucontext->mmap_xa);
22440909f66SGal Pressman 	if (err){
22540909f66SGal Pressman 		kfree(entry);
22640909f66SGal Pressman 		return EFA_MMAP_INVALID;
22740909f66SGal Pressman 	}
22840909f66SGal Pressman 
22940909f66SGal Pressman 	ibdev_dbg(
23040909f66SGal Pressman 		&dev->ibdev,
23140909f66SGal Pressman 		"mmap: obj[0x%p] addr[%#llx], len[%#llx], key[%#llx] inserted\n",
23240909f66SGal Pressman 		entry->obj, entry->address, entry->length, get_mmap_key(entry));
23340909f66SGal Pressman 
23440909f66SGal Pressman 	return get_mmap_key(entry);
23540909f66SGal Pressman }
23640909f66SGal Pressman 
23740909f66SGal Pressman int efa_query_device(struct ib_device *ibdev,
23840909f66SGal Pressman 		     struct ib_device_attr *props,
23940909f66SGal Pressman 		     struct ib_udata *udata)
24040909f66SGal Pressman {
24140909f66SGal Pressman 	struct efa_com_get_device_attr_result *dev_attr;
24240909f66SGal Pressman 	struct efa_ibv_ex_query_device_resp resp = {};
24340909f66SGal Pressman 	struct efa_dev *dev = to_edev(ibdev);
24440909f66SGal Pressman 	int err;
24540909f66SGal Pressman 
24640909f66SGal Pressman 	if (udata && udata->inlen &&
24740909f66SGal Pressman 	    !ib_is_udata_cleared(udata, 0, udata->inlen)) {
24840909f66SGal Pressman 		ibdev_dbg(ibdev,
24940909f66SGal Pressman 			  "Incompatible ABI params, udata not cleared\n");
25040909f66SGal Pressman 		return -EINVAL;
25140909f66SGal Pressman 	}
25240909f66SGal Pressman 
25340909f66SGal Pressman 	dev_attr = &dev->dev_attr;
25440909f66SGal Pressman 
25540909f66SGal Pressman 	memset(props, 0, sizeof(*props));
25640909f66SGal Pressman 	props->max_mr_size = dev_attr->max_mr_pages * PAGE_SIZE;
25740909f66SGal Pressman 	props->page_size_cap = dev_attr->page_size_cap;
25840909f66SGal Pressman 	props->vendor_id = dev->pdev->vendor;
25940909f66SGal Pressman 	props->vendor_part_id = dev->pdev->device;
26040909f66SGal Pressman 	props->hw_ver = dev->pdev->subsystem_device;
26140909f66SGal Pressman 	props->max_qp = dev_attr->max_qp;
26240909f66SGal Pressman 	props->max_cq = dev_attr->max_cq;
26340909f66SGal Pressman 	props->max_pd = dev_attr->max_pd;
26440909f66SGal Pressman 	props->max_mr = dev_attr->max_mr;
26540909f66SGal Pressman 	props->max_ah = dev_attr->max_ah;
26640909f66SGal Pressman 	props->max_cqe = dev_attr->max_cq_depth;
26740909f66SGal Pressman 	props->max_qp_wr = min_t(u32, dev_attr->max_sq_depth,
26840909f66SGal Pressman 				 dev_attr->max_rq_depth);
26940909f66SGal Pressman 	props->max_send_sge = dev_attr->max_sq_sge;
27040909f66SGal Pressman 	props->max_recv_sge = dev_attr->max_rq_sge;
27140909f66SGal Pressman 
27240909f66SGal Pressman 	if (udata && udata->outlen) {
27340909f66SGal Pressman 		resp.max_sq_sge = dev_attr->max_sq_sge;
27440909f66SGal Pressman 		resp.max_rq_sge = dev_attr->max_rq_sge;
27540909f66SGal Pressman 		resp.max_sq_wr = dev_attr->max_sq_depth;
27640909f66SGal Pressman 		resp.max_rq_wr = dev_attr->max_rq_depth;
27740909f66SGal Pressman 
27840909f66SGal Pressman 		err = ib_copy_to_udata(udata, &resp,
27940909f66SGal Pressman 				       min(sizeof(resp), udata->outlen));
28040909f66SGal Pressman 		if (err) {
28140909f66SGal Pressman 			ibdev_dbg(ibdev,
28240909f66SGal Pressman 				  "Failed to copy udata for query_device\n");
28340909f66SGal Pressman 			return err;
28440909f66SGal Pressman 		}
28540909f66SGal Pressman 	}
28640909f66SGal Pressman 
28740909f66SGal Pressman 	return 0;
28840909f66SGal Pressman }
28940909f66SGal Pressman 
29040909f66SGal Pressman int efa_query_port(struct ib_device *ibdev, u8 port,
29140909f66SGal Pressman 		   struct ib_port_attr *props)
29240909f66SGal Pressman {
29340909f66SGal Pressman 	struct efa_dev *dev = to_edev(ibdev);
29440909f66SGal Pressman 
29540909f66SGal Pressman 	props->lmc = 1;
29640909f66SGal Pressman 
29740909f66SGal Pressman 	props->state = IB_PORT_ACTIVE;
29840909f66SGal Pressman 	props->phys_state = 5;
29940909f66SGal Pressman 	props->gid_tbl_len = 1;
30040909f66SGal Pressman 	props->pkey_tbl_len = 1;
30140909f66SGal Pressman 	props->active_speed = IB_SPEED_EDR;
30240909f66SGal Pressman 	props->active_width = IB_WIDTH_4X;
30340909f66SGal Pressman 	props->max_mtu = ib_mtu_int_to_enum(dev->mtu);
30440909f66SGal Pressman 	props->active_mtu = ib_mtu_int_to_enum(dev->mtu);
30540909f66SGal Pressman 	props->max_msg_sz = dev->mtu;
30640909f66SGal Pressman 	props->max_vl_num = 1;
30740909f66SGal Pressman 
30840909f66SGal Pressman 	return 0;
30940909f66SGal Pressman }
31040909f66SGal Pressman 
31140909f66SGal Pressman int efa_query_qp(struct ib_qp *ibqp, struct ib_qp_attr *qp_attr,
31240909f66SGal Pressman 		 int qp_attr_mask,
31340909f66SGal Pressman 		 struct ib_qp_init_attr *qp_init_attr)
31440909f66SGal Pressman {
31540909f66SGal Pressman 	struct efa_dev *dev = to_edev(ibqp->device);
31640909f66SGal Pressman 	struct efa_com_query_qp_params params = {};
31740909f66SGal Pressman 	struct efa_com_query_qp_result result;
31840909f66SGal Pressman 	struct efa_qp *qp = to_eqp(ibqp);
31940909f66SGal Pressman 	int err;
32040909f66SGal Pressman 
32140909f66SGal Pressman #define EFA_QUERY_QP_SUPP_MASK \
32240909f66SGal Pressman 	(IB_QP_STATE | IB_QP_PKEY_INDEX | IB_QP_PORT | \
32340909f66SGal Pressman 	 IB_QP_QKEY | IB_QP_SQ_PSN | IB_QP_CAP)
32440909f66SGal Pressman 
32540909f66SGal Pressman 	if (qp_attr_mask & ~EFA_QUERY_QP_SUPP_MASK) {
32640909f66SGal Pressman 		ibdev_dbg(&dev->ibdev,
32740909f66SGal Pressman 			  "Unsupported qp_attr_mask[%#x] supported[%#x]\n",
32840909f66SGal Pressman 			  qp_attr_mask, EFA_QUERY_QP_SUPP_MASK);
32940909f66SGal Pressman 		return -EOPNOTSUPP;
33040909f66SGal Pressman 	}
33140909f66SGal Pressman 
33240909f66SGal Pressman 	memset(qp_attr, 0, sizeof(*qp_attr));
33340909f66SGal Pressman 	memset(qp_init_attr, 0, sizeof(*qp_init_attr));
33440909f66SGal Pressman 
33540909f66SGal Pressman 	params.qp_handle = qp->qp_handle;
33640909f66SGal Pressman 	err = efa_com_query_qp(&dev->edev, &params, &result);
33740909f66SGal Pressman 	if (err)
33840909f66SGal Pressman 		return err;
33940909f66SGal Pressman 
34040909f66SGal Pressman 	qp_attr->qp_state = result.qp_state;
34140909f66SGal Pressman 	qp_attr->qkey = result.qkey;
34240909f66SGal Pressman 	qp_attr->sq_psn = result.sq_psn;
34340909f66SGal Pressman 	qp_attr->sq_draining = result.sq_draining;
34440909f66SGal Pressman 	qp_attr->port_num = 1;
34540909f66SGal Pressman 
34640909f66SGal Pressman 	qp_attr->cap.max_send_wr = qp->max_send_wr;
34740909f66SGal Pressman 	qp_attr->cap.max_recv_wr = qp->max_recv_wr;
34840909f66SGal Pressman 	qp_attr->cap.max_send_sge = qp->max_send_sge;
34940909f66SGal Pressman 	qp_attr->cap.max_recv_sge = qp->max_recv_sge;
35040909f66SGal Pressman 	qp_attr->cap.max_inline_data = qp->max_inline_data;
35140909f66SGal Pressman 
35240909f66SGal Pressman 	qp_init_attr->qp_type = ibqp->qp_type;
35340909f66SGal Pressman 	qp_init_attr->recv_cq = ibqp->recv_cq;
35440909f66SGal Pressman 	qp_init_attr->send_cq = ibqp->send_cq;
35540909f66SGal Pressman 	qp_init_attr->qp_context = ibqp->qp_context;
35640909f66SGal Pressman 	qp_init_attr->cap = qp_attr->cap;
35740909f66SGal Pressman 
35840909f66SGal Pressman 	return 0;
35940909f66SGal Pressman }
36040909f66SGal Pressman 
36140909f66SGal Pressman int efa_query_gid(struct ib_device *ibdev, u8 port, int index,
36240909f66SGal Pressman 		  union ib_gid *gid)
36340909f66SGal Pressman {
36440909f66SGal Pressman 	struct efa_dev *dev = to_edev(ibdev);
36540909f66SGal Pressman 
36640909f66SGal Pressman 	memcpy(gid->raw, dev->addr, sizeof(dev->addr));
36740909f66SGal Pressman 
36840909f66SGal Pressman 	return 0;
36940909f66SGal Pressman }
37040909f66SGal Pressman 
37140909f66SGal Pressman int efa_query_pkey(struct ib_device *ibdev, u8 port, u16 index,
37240909f66SGal Pressman 		   u16 *pkey)
37340909f66SGal Pressman {
37440909f66SGal Pressman 	if (index > 0)
37540909f66SGal Pressman 		return -EINVAL;
37640909f66SGal Pressman 
37740909f66SGal Pressman 	*pkey = 0xffff;
37840909f66SGal Pressman 	return 0;
37940909f66SGal Pressman }
38040909f66SGal Pressman 
38140909f66SGal Pressman static int efa_pd_dealloc(struct efa_dev *dev, u16 pdn)
38240909f66SGal Pressman {
38340909f66SGal Pressman 	struct efa_com_dealloc_pd_params params = {
38440909f66SGal Pressman 		.pdn = pdn,
38540909f66SGal Pressman 	};
38640909f66SGal Pressman 
38740909f66SGal Pressman 	return efa_com_dealloc_pd(&dev->edev, &params);
38840909f66SGal Pressman }
38940909f66SGal Pressman 
39040909f66SGal Pressman int efa_alloc_pd(struct ib_pd *ibpd, struct ib_udata *udata)
39140909f66SGal Pressman {
39240909f66SGal Pressman 	struct efa_dev *dev = to_edev(ibpd->device);
39340909f66SGal Pressman 	struct efa_ibv_alloc_pd_resp resp = {};
39440909f66SGal Pressman 	struct efa_com_alloc_pd_result result;
39540909f66SGal Pressman 	struct efa_pd *pd = to_epd(ibpd);
39640909f66SGal Pressman 	int err;
39740909f66SGal Pressman 
39840909f66SGal Pressman 	if (udata->inlen &&
39940909f66SGal Pressman 	    !ib_is_udata_cleared(udata, 0, udata->inlen)) {
40040909f66SGal Pressman 		ibdev_dbg(&dev->ibdev,
40140909f66SGal Pressman 			  "Incompatible ABI params, udata not cleared\n");
40240909f66SGal Pressman 		err = -EINVAL;
40340909f66SGal Pressman 		goto err_out;
40440909f66SGal Pressman 	}
40540909f66SGal Pressman 
40640909f66SGal Pressman 	err = efa_com_alloc_pd(&dev->edev, &result);
40740909f66SGal Pressman 	if (err)
40840909f66SGal Pressman 		goto err_out;
40940909f66SGal Pressman 
41040909f66SGal Pressman 	pd->pdn = result.pdn;
41140909f66SGal Pressman 	resp.pdn = result.pdn;
41240909f66SGal Pressman 
41340909f66SGal Pressman 	if (udata->outlen) {
41440909f66SGal Pressman 		err = ib_copy_to_udata(udata, &resp,
41540909f66SGal Pressman 				       min(sizeof(resp), udata->outlen));
41640909f66SGal Pressman 		if (err) {
41740909f66SGal Pressman 			ibdev_dbg(&dev->ibdev,
41840909f66SGal Pressman 				  "Failed to copy udata for alloc_pd\n");
41940909f66SGal Pressman 			goto err_dealloc_pd;
42040909f66SGal Pressman 		}
42140909f66SGal Pressman 	}
42240909f66SGal Pressman 
42340909f66SGal Pressman 	ibdev_dbg(&dev->ibdev, "Allocated pd[%d]\n", pd->pdn);
42440909f66SGal Pressman 
42540909f66SGal Pressman 	return 0;
42640909f66SGal Pressman 
42740909f66SGal Pressman err_dealloc_pd:
42840909f66SGal Pressman 	efa_pd_dealloc(dev, result.pdn);
42940909f66SGal Pressman err_out:
43040909f66SGal Pressman 	atomic64_inc(&dev->stats.sw_stats.alloc_pd_err);
43140909f66SGal Pressman 	return err;
43240909f66SGal Pressman }
43340909f66SGal Pressman 
43440909f66SGal Pressman void efa_dealloc_pd(struct ib_pd *ibpd, struct ib_udata *udata)
43540909f66SGal Pressman {
43640909f66SGal Pressman 	struct efa_dev *dev = to_edev(ibpd->device);
43740909f66SGal Pressman 	struct efa_pd *pd = to_epd(ibpd);
43840909f66SGal Pressman 
43940909f66SGal Pressman 	ibdev_dbg(&dev->ibdev, "Dealloc pd[%d]\n", pd->pdn);
44040909f66SGal Pressman 	efa_pd_dealloc(dev, pd->pdn);
44140909f66SGal Pressman }
44240909f66SGal Pressman 
44340909f66SGal Pressman static int efa_destroy_qp_handle(struct efa_dev *dev, u32 qp_handle)
44440909f66SGal Pressman {
44540909f66SGal Pressman 	struct efa_com_destroy_qp_params params = { .qp_handle = qp_handle };
44640909f66SGal Pressman 
44740909f66SGal Pressman 	return efa_com_destroy_qp(&dev->edev, &params);
44840909f66SGal Pressman }
44940909f66SGal Pressman 
45040909f66SGal Pressman int efa_destroy_qp(struct ib_qp *ibqp, struct ib_udata *udata)
45140909f66SGal Pressman {
45240909f66SGal Pressman 	struct efa_dev *dev = to_edev(ibqp->pd->device);
45340909f66SGal Pressman 	struct efa_qp *qp = to_eqp(ibqp);
45440909f66SGal Pressman 	int err;
45540909f66SGal Pressman 
45640909f66SGal Pressman 	ibdev_dbg(&dev->ibdev, "Destroy qp[%u]\n", ibqp->qp_num);
45740909f66SGal Pressman 	err = efa_destroy_qp_handle(dev, qp->qp_handle);
45840909f66SGal Pressman 	if (err)
45940909f66SGal Pressman 		return err;
46040909f66SGal Pressman 
46140909f66SGal Pressman 	if (qp->rq_cpu_addr) {
46240909f66SGal Pressman 		ibdev_dbg(&dev->ibdev,
46340909f66SGal Pressman 			  "qp->cpu_addr[0x%p] freed: size[%lu], dma[%pad]\n",
46440909f66SGal Pressman 			  qp->rq_cpu_addr, qp->rq_size,
46540909f66SGal Pressman 			  &qp->rq_dma_addr);
46640909f66SGal Pressman 		dma_unmap_single(&dev->pdev->dev, qp->rq_dma_addr, qp->rq_size,
46740909f66SGal Pressman 				 DMA_TO_DEVICE);
46840909f66SGal Pressman 	}
46940909f66SGal Pressman 
47040909f66SGal Pressman 	kfree(qp);
47140909f66SGal Pressman 	return 0;
47240909f66SGal Pressman }
47340909f66SGal Pressman 
47440909f66SGal Pressman static int qp_mmap_entries_setup(struct efa_qp *qp,
47540909f66SGal Pressman 				 struct efa_dev *dev,
47640909f66SGal Pressman 				 struct efa_ucontext *ucontext,
47740909f66SGal Pressman 				 struct efa_com_create_qp_params *params,
47840909f66SGal Pressman 				 struct efa_ibv_create_qp_resp *resp)
47940909f66SGal Pressman {
48040909f66SGal Pressman 	/*
48140909f66SGal Pressman 	 * Once an entry is inserted it might be mmapped, hence cannot be
48240909f66SGal Pressman 	 * cleaned up until dealloc_ucontext.
48340909f66SGal Pressman 	 */
48440909f66SGal Pressman 	resp->sq_db_mmap_key =
48540909f66SGal Pressman 		mmap_entry_insert(dev, ucontext, qp,
48640909f66SGal Pressman 				  dev->db_bar_addr + resp->sq_db_offset,
48740909f66SGal Pressman 				  PAGE_SIZE, EFA_MMAP_IO_NC);
48840909f66SGal Pressman 	if (resp->sq_db_mmap_key == EFA_MMAP_INVALID)
48940909f66SGal Pressman 		return -ENOMEM;
49040909f66SGal Pressman 
49140909f66SGal Pressman 	resp->sq_db_offset &= ~PAGE_MASK;
49240909f66SGal Pressman 
49340909f66SGal Pressman 	resp->llq_desc_mmap_key =
49440909f66SGal Pressman 		mmap_entry_insert(dev, ucontext, qp,
49540909f66SGal Pressman 				  dev->mem_bar_addr + resp->llq_desc_offset,
49640909f66SGal Pressman 				  PAGE_ALIGN(params->sq_ring_size_in_bytes +
49740909f66SGal Pressman 					     (resp->llq_desc_offset & ~PAGE_MASK)),
49840909f66SGal Pressman 				  EFA_MMAP_IO_WC);
49940909f66SGal Pressman 	if (resp->llq_desc_mmap_key == EFA_MMAP_INVALID)
50040909f66SGal Pressman 		return -ENOMEM;
50140909f66SGal Pressman 
50240909f66SGal Pressman 	resp->llq_desc_offset &= ~PAGE_MASK;
50340909f66SGal Pressman 
50440909f66SGal Pressman 	if (qp->rq_size) {
50540909f66SGal Pressman 		resp->rq_db_mmap_key =
50640909f66SGal Pressman 			mmap_entry_insert(dev, ucontext, qp,
50740909f66SGal Pressman 					  dev->db_bar_addr + resp->rq_db_offset,
50840909f66SGal Pressman 					  PAGE_SIZE, EFA_MMAP_IO_NC);
50940909f66SGal Pressman 		if (resp->rq_db_mmap_key == EFA_MMAP_INVALID)
51040909f66SGal Pressman 			return -ENOMEM;
51140909f66SGal Pressman 
51240909f66SGal Pressman 		resp->rq_db_offset &= ~PAGE_MASK;
51340909f66SGal Pressman 
51440909f66SGal Pressman 		resp->rq_mmap_key =
51540909f66SGal Pressman 			mmap_entry_insert(dev, ucontext, qp,
51640909f66SGal Pressman 					  virt_to_phys(qp->rq_cpu_addr),
51740909f66SGal Pressman 					  qp->rq_size, EFA_MMAP_DMA_PAGE);
51840909f66SGal Pressman 		if (resp->rq_mmap_key == EFA_MMAP_INVALID)
51940909f66SGal Pressman 			return -ENOMEM;
52040909f66SGal Pressman 
52140909f66SGal Pressman 		resp->rq_mmap_size = qp->rq_size;
52240909f66SGal Pressman 	}
52340909f66SGal Pressman 
52440909f66SGal Pressman 	return 0;
52540909f66SGal Pressman }
52640909f66SGal Pressman 
52740909f66SGal Pressman static int efa_qp_validate_cap(struct efa_dev *dev,
52840909f66SGal Pressman 			       struct ib_qp_init_attr *init_attr)
52940909f66SGal Pressman {
53040909f66SGal Pressman 	if (init_attr->cap.max_send_wr > dev->dev_attr.max_sq_depth) {
53140909f66SGal Pressman 		ibdev_dbg(&dev->ibdev,
53240909f66SGal Pressman 			  "qp: requested send wr[%u] exceeds the max[%u]\n",
53340909f66SGal Pressman 			  init_attr->cap.max_send_wr,
53440909f66SGal Pressman 			  dev->dev_attr.max_sq_depth);
53540909f66SGal Pressman 		return -EINVAL;
53640909f66SGal Pressman 	}
53740909f66SGal Pressman 	if (init_attr->cap.max_recv_wr > dev->dev_attr.max_rq_depth) {
53840909f66SGal Pressman 		ibdev_dbg(&dev->ibdev,
53940909f66SGal Pressman 			  "qp: requested receive wr[%u] exceeds the max[%u]\n",
54040909f66SGal Pressman 			  init_attr->cap.max_recv_wr,
54140909f66SGal Pressman 			  dev->dev_attr.max_rq_depth);
54240909f66SGal Pressman 		return -EINVAL;
54340909f66SGal Pressman 	}
54440909f66SGal Pressman 	if (init_attr->cap.max_send_sge > dev->dev_attr.max_sq_sge) {
54540909f66SGal Pressman 		ibdev_dbg(&dev->ibdev,
54640909f66SGal Pressman 			  "qp: requested sge send[%u] exceeds the max[%u]\n",
54740909f66SGal Pressman 			  init_attr->cap.max_send_sge, dev->dev_attr.max_sq_sge);
54840909f66SGal Pressman 		return -EINVAL;
54940909f66SGal Pressman 	}
55040909f66SGal Pressman 	if (init_attr->cap.max_recv_sge > dev->dev_attr.max_rq_sge) {
55140909f66SGal Pressman 		ibdev_dbg(&dev->ibdev,
55240909f66SGal Pressman 			  "qp: requested sge recv[%u] exceeds the max[%u]\n",
55340909f66SGal Pressman 			  init_attr->cap.max_recv_sge, dev->dev_attr.max_rq_sge);
55440909f66SGal Pressman 		return -EINVAL;
55540909f66SGal Pressman 	}
55640909f66SGal Pressman 	if (init_attr->cap.max_inline_data > dev->dev_attr.inline_buf_size) {
55740909f66SGal Pressman 		ibdev_dbg(&dev->ibdev,
55840909f66SGal Pressman 			  "qp: requested inline data[%u] exceeds the max[%u]\n",
55940909f66SGal Pressman 			  init_attr->cap.max_inline_data,
56040909f66SGal Pressman 			  dev->dev_attr.inline_buf_size);
56140909f66SGal Pressman 		return -EINVAL;
56240909f66SGal Pressman 	}
56340909f66SGal Pressman 
56440909f66SGal Pressman 	return 0;
56540909f66SGal Pressman }
56640909f66SGal Pressman 
56740909f66SGal Pressman static int efa_qp_validate_attr(struct efa_dev *dev,
56840909f66SGal Pressman 				struct ib_qp_init_attr *init_attr)
56940909f66SGal Pressman {
57040909f66SGal Pressman 	if (init_attr->qp_type != IB_QPT_DRIVER &&
57140909f66SGal Pressman 	    init_attr->qp_type != IB_QPT_UD) {
57240909f66SGal Pressman 		ibdev_dbg(&dev->ibdev,
57340909f66SGal Pressman 			  "Unsupported qp type %d\n", init_attr->qp_type);
57440909f66SGal Pressman 		return -EOPNOTSUPP;
57540909f66SGal Pressman 	}
57640909f66SGal Pressman 
57740909f66SGal Pressman 	if (init_attr->srq) {
57840909f66SGal Pressman 		ibdev_dbg(&dev->ibdev, "SRQ is not supported\n");
57940909f66SGal Pressman 		return -EOPNOTSUPP;
58040909f66SGal Pressman 	}
58140909f66SGal Pressman 
58240909f66SGal Pressman 	if (init_attr->create_flags) {
58340909f66SGal Pressman 		ibdev_dbg(&dev->ibdev, "Unsupported create flags\n");
58440909f66SGal Pressman 		return -EOPNOTSUPP;
58540909f66SGal Pressman 	}
58640909f66SGal Pressman 
58740909f66SGal Pressman 	return 0;
58840909f66SGal Pressman }
58940909f66SGal Pressman 
59040909f66SGal Pressman struct ib_qp *efa_create_qp(struct ib_pd *ibpd,
59140909f66SGal Pressman 			    struct ib_qp_init_attr *init_attr,
59240909f66SGal Pressman 			    struct ib_udata *udata)
59340909f66SGal Pressman {
59440909f66SGal Pressman 	struct efa_com_create_qp_params create_qp_params = {};
59540909f66SGal Pressman 	struct efa_com_create_qp_result create_qp_resp;
59640909f66SGal Pressman 	struct efa_dev *dev = to_edev(ibpd->device);
59740909f66SGal Pressman 	struct efa_ibv_create_qp_resp resp = {};
59840909f66SGal Pressman 	struct efa_ibv_create_qp cmd = {};
59940909f66SGal Pressman 	bool rq_entry_inserted = false;
60040909f66SGal Pressman 	struct efa_ucontext *ucontext;
60140909f66SGal Pressman 	struct efa_qp *qp;
60240909f66SGal Pressman 	int err;
60340909f66SGal Pressman 
60440909f66SGal Pressman 	ucontext = rdma_udata_to_drv_context(udata, struct efa_ucontext,
60540909f66SGal Pressman 					     ibucontext);
60640909f66SGal Pressman 
60740909f66SGal Pressman 	err = efa_qp_validate_cap(dev, init_attr);
60840909f66SGal Pressman 	if (err)
60940909f66SGal Pressman 		goto err_out;
61040909f66SGal Pressman 
61140909f66SGal Pressman 	err = efa_qp_validate_attr(dev, init_attr);
61240909f66SGal Pressman 	if (err)
61340909f66SGal Pressman 		goto err_out;
61440909f66SGal Pressman 
61540909f66SGal Pressman 	if (!field_avail(cmd, driver_qp_type, udata->inlen)) {
61640909f66SGal Pressman 		ibdev_dbg(&dev->ibdev,
61740909f66SGal Pressman 			  "Incompatible ABI params, no input udata\n");
61840909f66SGal Pressman 		err = -EINVAL;
61940909f66SGal Pressman 		goto err_out;
62040909f66SGal Pressman 	}
62140909f66SGal Pressman 
62240909f66SGal Pressman 	if (udata->inlen > sizeof(cmd) &&
62340909f66SGal Pressman 	    !ib_is_udata_cleared(udata, sizeof(cmd),
62440909f66SGal Pressman 				 udata->inlen - sizeof(cmd))) {
62540909f66SGal Pressman 		ibdev_dbg(&dev->ibdev,
62640909f66SGal Pressman 			  "Incompatible ABI params, unknown fields in udata\n");
62740909f66SGal Pressman 		err = -EINVAL;
62840909f66SGal Pressman 		goto err_out;
62940909f66SGal Pressman 	}
63040909f66SGal Pressman 
63140909f66SGal Pressman 	err = ib_copy_from_udata(&cmd, udata,
63240909f66SGal Pressman 				 min(sizeof(cmd), udata->inlen));
63340909f66SGal Pressman 	if (err) {
63440909f66SGal Pressman 		ibdev_dbg(&dev->ibdev,
63540909f66SGal Pressman 			  "Cannot copy udata for create_qp\n");
63640909f66SGal Pressman 		goto err_out;
63740909f66SGal Pressman 	}
63840909f66SGal Pressman 
63940909f66SGal Pressman 	if (cmd.comp_mask) {
64040909f66SGal Pressman 		ibdev_dbg(&dev->ibdev,
64140909f66SGal Pressman 			  "Incompatible ABI params, unknown fields in udata\n");
64240909f66SGal Pressman 		err = -EINVAL;
64340909f66SGal Pressman 		goto err_out;
64440909f66SGal Pressman 	}
64540909f66SGal Pressman 
64640909f66SGal Pressman 	qp = kzalloc(sizeof(*qp), GFP_KERNEL);
64740909f66SGal Pressman 	if (!qp) {
64840909f66SGal Pressman 		err = -ENOMEM;
64940909f66SGal Pressman 		goto err_out;
65040909f66SGal Pressman 	}
65140909f66SGal Pressman 
65240909f66SGal Pressman 	create_qp_params.uarn = ucontext->uarn;
65340909f66SGal Pressman 	create_qp_params.pd = to_epd(ibpd)->pdn;
65440909f66SGal Pressman 
65540909f66SGal Pressman 	if (init_attr->qp_type == IB_QPT_UD) {
65640909f66SGal Pressman 		create_qp_params.qp_type = EFA_ADMIN_QP_TYPE_UD;
65740909f66SGal Pressman 	} else if (cmd.driver_qp_type == EFA_QP_DRIVER_TYPE_SRD) {
65840909f66SGal Pressman 		create_qp_params.qp_type = EFA_ADMIN_QP_TYPE_SRD;
65940909f66SGal Pressman 	} else {
66040909f66SGal Pressman 		ibdev_dbg(&dev->ibdev,
66140909f66SGal Pressman 			  "Unsupported qp type %d driver qp type %d\n",
66240909f66SGal Pressman 			  init_attr->qp_type, cmd.driver_qp_type);
66340909f66SGal Pressman 		err = -EOPNOTSUPP;
66440909f66SGal Pressman 		goto err_free_qp;
66540909f66SGal Pressman 	}
66640909f66SGal Pressman 
66740909f66SGal Pressman 	ibdev_dbg(&dev->ibdev, "Create QP: qp type %d driver qp type %#x\n",
66840909f66SGal Pressman 		  init_attr->qp_type, cmd.driver_qp_type);
66940909f66SGal Pressman 	create_qp_params.send_cq_idx = to_ecq(init_attr->send_cq)->cq_idx;
67040909f66SGal Pressman 	create_qp_params.recv_cq_idx = to_ecq(init_attr->recv_cq)->cq_idx;
67140909f66SGal Pressman 	create_qp_params.sq_depth = init_attr->cap.max_send_wr;
67240909f66SGal Pressman 	create_qp_params.sq_ring_size_in_bytes = cmd.sq_ring_size;
67340909f66SGal Pressman 
67440909f66SGal Pressman 	create_qp_params.rq_depth = init_attr->cap.max_recv_wr;
67540909f66SGal Pressman 	create_qp_params.rq_ring_size_in_bytes = cmd.rq_ring_size;
67640909f66SGal Pressman 	qp->rq_size = PAGE_ALIGN(create_qp_params.rq_ring_size_in_bytes);
67740909f66SGal Pressman 	if (qp->rq_size) {
67840909f66SGal Pressman 		qp->rq_cpu_addr = efa_zalloc_mapped(dev, &qp->rq_dma_addr,
67940909f66SGal Pressman 						    qp->rq_size, DMA_TO_DEVICE);
68040909f66SGal Pressman 		if (!qp->rq_cpu_addr) {
68140909f66SGal Pressman 			err = -ENOMEM;
68240909f66SGal Pressman 			goto err_free_qp;
68340909f66SGal Pressman 		}
68440909f66SGal Pressman 
68540909f66SGal Pressman 		ibdev_dbg(&dev->ibdev,
68640909f66SGal Pressman 			  "qp->cpu_addr[0x%p] allocated: size[%lu], dma[%pad]\n",
68740909f66SGal Pressman 			  qp->rq_cpu_addr, qp->rq_size, &qp->rq_dma_addr);
68840909f66SGal Pressman 		create_qp_params.rq_base_addr = qp->rq_dma_addr;
68940909f66SGal Pressman 	}
69040909f66SGal Pressman 
69140909f66SGal Pressman 	err = efa_com_create_qp(&dev->edev, &create_qp_params,
69240909f66SGal Pressman 				&create_qp_resp);
69340909f66SGal Pressman 	if (err)
69440909f66SGal Pressman 		goto err_free_mapped;
69540909f66SGal Pressman 
69640909f66SGal Pressman 	resp.sq_db_offset = create_qp_resp.sq_db_offset;
69740909f66SGal Pressman 	resp.rq_db_offset = create_qp_resp.rq_db_offset;
69840909f66SGal Pressman 	resp.llq_desc_offset = create_qp_resp.llq_descriptors_offset;
69940909f66SGal Pressman 	resp.send_sub_cq_idx = create_qp_resp.send_sub_cq_idx;
70040909f66SGal Pressman 	resp.recv_sub_cq_idx = create_qp_resp.recv_sub_cq_idx;
70140909f66SGal Pressman 
70240909f66SGal Pressman 	err = qp_mmap_entries_setup(qp, dev, ucontext, &create_qp_params,
70340909f66SGal Pressman 				    &resp);
70440909f66SGal Pressman 	if (err)
70540909f66SGal Pressman 		goto err_destroy_qp;
70640909f66SGal Pressman 
70740909f66SGal Pressman 	rq_entry_inserted = true;
70840909f66SGal Pressman 	qp->qp_handle = create_qp_resp.qp_handle;
70940909f66SGal Pressman 	qp->ibqp.qp_num = create_qp_resp.qp_num;
71040909f66SGal Pressman 	qp->ibqp.qp_type = init_attr->qp_type;
71140909f66SGal Pressman 	qp->max_send_wr = init_attr->cap.max_send_wr;
71240909f66SGal Pressman 	qp->max_recv_wr = init_attr->cap.max_recv_wr;
71340909f66SGal Pressman 	qp->max_send_sge = init_attr->cap.max_send_sge;
71440909f66SGal Pressman 	qp->max_recv_sge = init_attr->cap.max_recv_sge;
71540909f66SGal Pressman 	qp->max_inline_data = init_attr->cap.max_inline_data;
71640909f66SGal Pressman 
71740909f66SGal Pressman 	if (udata->outlen) {
71840909f66SGal Pressman 		err = ib_copy_to_udata(udata, &resp,
71940909f66SGal Pressman 				       min(sizeof(resp), udata->outlen));
72040909f66SGal Pressman 		if (err) {
72140909f66SGal Pressman 			ibdev_dbg(&dev->ibdev,
72240909f66SGal Pressman 				  "Failed to copy udata for qp[%u]\n",
72340909f66SGal Pressman 				  create_qp_resp.qp_num);
72440909f66SGal Pressman 			goto err_destroy_qp;
72540909f66SGal Pressman 		}
72640909f66SGal Pressman 	}
72740909f66SGal Pressman 
72840909f66SGal Pressman 	ibdev_dbg(&dev->ibdev, "Created qp[%d]\n", qp->ibqp.qp_num);
72940909f66SGal Pressman 
73040909f66SGal Pressman 	return &qp->ibqp;
73140909f66SGal Pressman 
73240909f66SGal Pressman err_destroy_qp:
73340909f66SGal Pressman 	efa_destroy_qp_handle(dev, create_qp_resp.qp_handle);
73440909f66SGal Pressman err_free_mapped:
73540909f66SGal Pressman 	if (qp->rq_size) {
73640909f66SGal Pressman 		dma_unmap_single(&dev->pdev->dev, qp->rq_dma_addr, qp->rq_size,
73740909f66SGal Pressman 				 DMA_TO_DEVICE);
73840909f66SGal Pressman 		if (!rq_entry_inserted)
73940909f66SGal Pressman 			free_pages_exact(qp->rq_cpu_addr, qp->rq_size);
74040909f66SGal Pressman 	}
74140909f66SGal Pressman err_free_qp:
74240909f66SGal Pressman 	kfree(qp);
74340909f66SGal Pressman err_out:
74440909f66SGal Pressman 	atomic64_inc(&dev->stats.sw_stats.create_qp_err);
74540909f66SGal Pressman 	return ERR_PTR(err);
74640909f66SGal Pressman }
74740909f66SGal Pressman 
74840909f66SGal Pressman static int efa_modify_qp_validate(struct efa_dev *dev, struct efa_qp *qp,
74940909f66SGal Pressman 				  struct ib_qp_attr *qp_attr, int qp_attr_mask,
75040909f66SGal Pressman 				  enum ib_qp_state cur_state,
75140909f66SGal Pressman 				  enum ib_qp_state new_state)
75240909f66SGal Pressman {
75340909f66SGal Pressman #define EFA_MODIFY_QP_SUPP_MASK \
75440909f66SGal Pressman 	(IB_QP_STATE | IB_QP_CUR_STATE | IB_QP_EN_SQD_ASYNC_NOTIFY | \
75540909f66SGal Pressman 	 IB_QP_PKEY_INDEX | IB_QP_PORT | IB_QP_QKEY | IB_QP_SQ_PSN)
75640909f66SGal Pressman 
75740909f66SGal Pressman 	if (qp_attr_mask & ~EFA_MODIFY_QP_SUPP_MASK) {
75840909f66SGal Pressman 		ibdev_dbg(&dev->ibdev,
75940909f66SGal Pressman 			  "Unsupported qp_attr_mask[%#x] supported[%#x]\n",
76040909f66SGal Pressman 			  qp_attr_mask, EFA_MODIFY_QP_SUPP_MASK);
76140909f66SGal Pressman 		return -EOPNOTSUPP;
76240909f66SGal Pressman 	}
76340909f66SGal Pressman 
76440909f66SGal Pressman 	if (!ib_modify_qp_is_ok(cur_state, new_state, IB_QPT_UD,
76540909f66SGal Pressman 				qp_attr_mask)) {
76640909f66SGal Pressman 		ibdev_dbg(&dev->ibdev, "Invalid modify QP parameters\n");
76740909f66SGal Pressman 		return -EINVAL;
76840909f66SGal Pressman 	}
76940909f66SGal Pressman 
77040909f66SGal Pressman 	if ((qp_attr_mask & IB_QP_PORT) && qp_attr->port_num != 1) {
77140909f66SGal Pressman 		ibdev_dbg(&dev->ibdev, "Can't change port num\n");
77240909f66SGal Pressman 		return -EOPNOTSUPP;
77340909f66SGal Pressman 	}
77440909f66SGal Pressman 
77540909f66SGal Pressman 	if ((qp_attr_mask & IB_QP_PKEY_INDEX) && qp_attr->pkey_index) {
77640909f66SGal Pressman 		ibdev_dbg(&dev->ibdev, "Can't change pkey index\n");
77740909f66SGal Pressman 		return -EOPNOTSUPP;
77840909f66SGal Pressman 	}
77940909f66SGal Pressman 
78040909f66SGal Pressman 	return 0;
78140909f66SGal Pressman }
78240909f66SGal Pressman 
78340909f66SGal Pressman int efa_modify_qp(struct ib_qp *ibqp, struct ib_qp_attr *qp_attr,
78440909f66SGal Pressman 		  int qp_attr_mask, struct ib_udata *udata)
78540909f66SGal Pressman {
78640909f66SGal Pressman 	struct efa_dev *dev = to_edev(ibqp->device);
78740909f66SGal Pressman 	struct efa_com_modify_qp_params params = {};
78840909f66SGal Pressman 	struct efa_qp *qp = to_eqp(ibqp);
78940909f66SGal Pressman 	enum ib_qp_state cur_state;
79040909f66SGal Pressman 	enum ib_qp_state new_state;
79140909f66SGal Pressman 	int err;
79240909f66SGal Pressman 
79340909f66SGal Pressman 	if (udata->inlen &&
79440909f66SGal Pressman 	    !ib_is_udata_cleared(udata, 0, udata->inlen)) {
79540909f66SGal Pressman 		ibdev_dbg(&dev->ibdev,
79640909f66SGal Pressman 			  "Incompatible ABI params, udata not cleared\n");
79740909f66SGal Pressman 		return -EINVAL;
79840909f66SGal Pressman 	}
79940909f66SGal Pressman 
80040909f66SGal Pressman 	cur_state = qp_attr_mask & IB_QP_CUR_STATE ? qp_attr->cur_qp_state :
80140909f66SGal Pressman 						     qp->state;
80240909f66SGal Pressman 	new_state = qp_attr_mask & IB_QP_STATE ? qp_attr->qp_state : cur_state;
80340909f66SGal Pressman 
80440909f66SGal Pressman 	err = efa_modify_qp_validate(dev, qp, qp_attr, qp_attr_mask, cur_state,
80540909f66SGal Pressman 				     new_state);
80640909f66SGal Pressman 	if (err)
80740909f66SGal Pressman 		return err;
80840909f66SGal Pressman 
80940909f66SGal Pressman 	params.qp_handle = qp->qp_handle;
81040909f66SGal Pressman 
81140909f66SGal Pressman 	if (qp_attr_mask & IB_QP_STATE) {
81240909f66SGal Pressman 		params.modify_mask |= BIT(EFA_ADMIN_QP_STATE_BIT) |
81340909f66SGal Pressman 				      BIT(EFA_ADMIN_CUR_QP_STATE_BIT);
81440909f66SGal Pressman 		params.cur_qp_state = qp_attr->cur_qp_state;
81540909f66SGal Pressman 		params.qp_state = qp_attr->qp_state;
81640909f66SGal Pressman 	}
81740909f66SGal Pressman 
81840909f66SGal Pressman 	if (qp_attr_mask & IB_QP_EN_SQD_ASYNC_NOTIFY) {
81940909f66SGal Pressman 		params.modify_mask |=
82040909f66SGal Pressman 			BIT(EFA_ADMIN_SQ_DRAINED_ASYNC_NOTIFY_BIT);
82140909f66SGal Pressman 		params.sq_drained_async_notify = qp_attr->en_sqd_async_notify;
82240909f66SGal Pressman 	}
82340909f66SGal Pressman 
82440909f66SGal Pressman 	if (qp_attr_mask & IB_QP_QKEY) {
82540909f66SGal Pressman 		params.modify_mask |= BIT(EFA_ADMIN_QKEY_BIT);
82640909f66SGal Pressman 		params.qkey = qp_attr->qkey;
82740909f66SGal Pressman 	}
82840909f66SGal Pressman 
82940909f66SGal Pressman 	if (qp_attr_mask & IB_QP_SQ_PSN) {
83040909f66SGal Pressman 		params.modify_mask |= BIT(EFA_ADMIN_SQ_PSN_BIT);
83140909f66SGal Pressman 		params.sq_psn = qp_attr->sq_psn;
83240909f66SGal Pressman 	}
83340909f66SGal Pressman 
83440909f66SGal Pressman 	err = efa_com_modify_qp(&dev->edev, &params);
83540909f66SGal Pressman 	if (err)
83640909f66SGal Pressman 		return err;
83740909f66SGal Pressman 
83840909f66SGal Pressman 	qp->state = new_state;
83940909f66SGal Pressman 
84040909f66SGal Pressman 	return 0;
84140909f66SGal Pressman }
84240909f66SGal Pressman 
84340909f66SGal Pressman static int efa_destroy_cq_idx(struct efa_dev *dev, int cq_idx)
84440909f66SGal Pressman {
84540909f66SGal Pressman 	struct efa_com_destroy_cq_params params = { .cq_idx = cq_idx };
84640909f66SGal Pressman 
84740909f66SGal Pressman 	return efa_com_destroy_cq(&dev->edev, &params);
84840909f66SGal Pressman }
84940909f66SGal Pressman 
850a52c8e24SLeon Romanovsky void efa_destroy_cq(struct ib_cq *ibcq, struct ib_udata *udata)
85140909f66SGal Pressman {
85240909f66SGal Pressman 	struct efa_dev *dev = to_edev(ibcq->device);
85340909f66SGal Pressman 	struct efa_cq *cq = to_ecq(ibcq);
85440909f66SGal Pressman 
85540909f66SGal Pressman 	ibdev_dbg(&dev->ibdev,
85640909f66SGal Pressman 		  "Destroy cq[%d] virt[0x%p] freed: size[%lu], dma[%pad]\n",
85740909f66SGal Pressman 		  cq->cq_idx, cq->cpu_addr, cq->size, &cq->dma_addr);
85840909f66SGal Pressman 
859a52c8e24SLeon Romanovsky 	efa_destroy_cq_idx(dev, cq->cq_idx);
86040909f66SGal Pressman 	dma_unmap_single(&dev->pdev->dev, cq->dma_addr, cq->size,
86140909f66SGal Pressman 			 DMA_FROM_DEVICE);
86240909f66SGal Pressman }
86340909f66SGal Pressman 
86440909f66SGal Pressman static int cq_mmap_entries_setup(struct efa_dev *dev, struct efa_cq *cq,
86540909f66SGal Pressman 				 struct efa_ibv_create_cq_resp *resp)
86640909f66SGal Pressman {
86740909f66SGal Pressman 	resp->q_mmap_size = cq->size;
86840909f66SGal Pressman 	resp->q_mmap_key = mmap_entry_insert(dev, cq->ucontext, cq,
86940909f66SGal Pressman 					     virt_to_phys(cq->cpu_addr),
87040909f66SGal Pressman 					     cq->size, EFA_MMAP_DMA_PAGE);
87140909f66SGal Pressman 	if (resp->q_mmap_key == EFA_MMAP_INVALID)
87240909f66SGal Pressman 		return -ENOMEM;
87340909f66SGal Pressman 
87440909f66SGal Pressman 	return 0;
87540909f66SGal Pressman }
87640909f66SGal Pressman 
877e39afe3dSLeon Romanovsky int efa_create_cq(struct ib_cq *ibcq, const struct ib_cq_init_attr *attr,
87840909f66SGal Pressman 		  struct ib_udata *udata)
87940909f66SGal Pressman {
880e39afe3dSLeon Romanovsky 	struct efa_ucontext *ucontext = rdma_udata_to_drv_context(
881e39afe3dSLeon Romanovsky 		udata, struct efa_ucontext, ibucontext);
88240909f66SGal Pressman 	struct efa_ibv_create_cq_resp resp = {};
88340909f66SGal Pressman 	struct efa_com_create_cq_params params;
88440909f66SGal Pressman 	struct efa_com_create_cq_result result;
885e39afe3dSLeon Romanovsky 	struct ib_device *ibdev = ibcq->device;
88640909f66SGal Pressman 	struct efa_dev *dev = to_edev(ibdev);
88740909f66SGal Pressman 	struct efa_ibv_create_cq cmd = {};
888e39afe3dSLeon Romanovsky 	struct efa_cq *cq = to_ecq(ibcq);
88940909f66SGal Pressman 	bool cq_entry_inserted = false;
890e39afe3dSLeon Romanovsky 	int entries = attr->cqe;
89140909f66SGal Pressman 	int err;
89240909f66SGal Pressman 
89340909f66SGal Pressman 	ibdev_dbg(ibdev, "create_cq entries %d\n", entries);
89440909f66SGal Pressman 
89540909f66SGal Pressman 	if (entries < 1 || entries > dev->dev_attr.max_cq_depth) {
89640909f66SGal Pressman 		ibdev_dbg(ibdev,
89740909f66SGal Pressman 			  "cq: requested entries[%u] non-positive or greater than max[%u]\n",
89840909f66SGal Pressman 			  entries, dev->dev_attr.max_cq_depth);
89940909f66SGal Pressman 		err = -EINVAL;
90040909f66SGal Pressman 		goto err_out;
90140909f66SGal Pressman 	}
90240909f66SGal Pressman 
90340909f66SGal Pressman 	if (!field_avail(cmd, num_sub_cqs, udata->inlen)) {
90440909f66SGal Pressman 		ibdev_dbg(ibdev,
90540909f66SGal Pressman 			  "Incompatible ABI params, no input udata\n");
90640909f66SGal Pressman 		err = -EINVAL;
90740909f66SGal Pressman 		goto err_out;
90840909f66SGal Pressman 	}
90940909f66SGal Pressman 
91040909f66SGal Pressman 	if (udata->inlen > sizeof(cmd) &&
91140909f66SGal Pressman 	    !ib_is_udata_cleared(udata, sizeof(cmd),
91240909f66SGal Pressman 				 udata->inlen - sizeof(cmd))) {
91340909f66SGal Pressman 		ibdev_dbg(ibdev,
91440909f66SGal Pressman 			  "Incompatible ABI params, unknown fields in udata\n");
91540909f66SGal Pressman 		err = -EINVAL;
91640909f66SGal Pressman 		goto err_out;
91740909f66SGal Pressman 	}
91840909f66SGal Pressman 
91940909f66SGal Pressman 	err = ib_copy_from_udata(&cmd, udata,
92040909f66SGal Pressman 				 min(sizeof(cmd), udata->inlen));
92140909f66SGal Pressman 	if (err) {
92240909f66SGal Pressman 		ibdev_dbg(ibdev, "Cannot copy udata for create_cq\n");
92340909f66SGal Pressman 		goto err_out;
92440909f66SGal Pressman 	}
92540909f66SGal Pressman 
92640909f66SGal Pressman 	if (cmd.comp_mask || !is_reserved_cleared(cmd.reserved_50)) {
92740909f66SGal Pressman 		ibdev_dbg(ibdev,
92840909f66SGal Pressman 			  "Incompatible ABI params, unknown fields in udata\n");
92940909f66SGal Pressman 		err = -EINVAL;
93040909f66SGal Pressman 		goto err_out;
93140909f66SGal Pressman 	}
93240909f66SGal Pressman 
93340909f66SGal Pressman 	if (!cmd.cq_entry_size) {
93440909f66SGal Pressman 		ibdev_dbg(ibdev,
93540909f66SGal Pressman 			  "Invalid entry size [%u]\n", cmd.cq_entry_size);
93640909f66SGal Pressman 		err = -EINVAL;
93740909f66SGal Pressman 		goto err_out;
93840909f66SGal Pressman 	}
93940909f66SGal Pressman 
94040909f66SGal Pressman 	if (cmd.num_sub_cqs != dev->dev_attr.sub_cqs_per_cq) {
94140909f66SGal Pressman 		ibdev_dbg(ibdev,
94240909f66SGal Pressman 			  "Invalid number of sub cqs[%u] expected[%u]\n",
94340909f66SGal Pressman 			  cmd.num_sub_cqs, dev->dev_attr.sub_cqs_per_cq);
94440909f66SGal Pressman 		err = -EINVAL;
94540909f66SGal Pressman 		goto err_out;
94640909f66SGal Pressman 	}
94740909f66SGal Pressman 
948e39afe3dSLeon Romanovsky 	cq->ucontext = ucontext;
94940909f66SGal Pressman 	cq->size = PAGE_ALIGN(cmd.cq_entry_size * entries * cmd.num_sub_cqs);
95040909f66SGal Pressman 	cq->cpu_addr = efa_zalloc_mapped(dev, &cq->dma_addr, cq->size,
95140909f66SGal Pressman 					 DMA_FROM_DEVICE);
95240909f66SGal Pressman 	if (!cq->cpu_addr) {
95340909f66SGal Pressman 		err = -ENOMEM;
954e39afe3dSLeon Romanovsky 		goto err_out;
95540909f66SGal Pressman 	}
95640909f66SGal Pressman 
95740909f66SGal Pressman 	params.uarn = cq->ucontext->uarn;
95840909f66SGal Pressman 	params.cq_depth = entries;
95940909f66SGal Pressman 	params.dma_addr = cq->dma_addr;
96040909f66SGal Pressman 	params.entry_size_in_bytes = cmd.cq_entry_size;
96140909f66SGal Pressman 	params.num_sub_cqs = cmd.num_sub_cqs;
96240909f66SGal Pressman 	err = efa_com_create_cq(&dev->edev, &params, &result);
96340909f66SGal Pressman 	if (err)
96440909f66SGal Pressman 		goto err_free_mapped;
96540909f66SGal Pressman 
96640909f66SGal Pressman 	resp.cq_idx = result.cq_idx;
96740909f66SGal Pressman 	cq->cq_idx = result.cq_idx;
96840909f66SGal Pressman 	cq->ibcq.cqe = result.actual_depth;
96940909f66SGal Pressman 	WARN_ON_ONCE(entries != result.actual_depth);
97040909f66SGal Pressman 
97140909f66SGal Pressman 	err = cq_mmap_entries_setup(dev, cq, &resp);
97240909f66SGal Pressman 	if (err) {
973e39afe3dSLeon Romanovsky 		ibdev_dbg(ibdev, "Could not setup cq[%u] mmap entries\n",
974e39afe3dSLeon Romanovsky 			  cq->cq_idx);
97540909f66SGal Pressman 		goto err_destroy_cq;
97640909f66SGal Pressman 	}
97740909f66SGal Pressman 
97840909f66SGal Pressman 	cq_entry_inserted = true;
97940909f66SGal Pressman 
98040909f66SGal Pressman 	if (udata->outlen) {
98140909f66SGal Pressman 		err = ib_copy_to_udata(udata, &resp,
98240909f66SGal Pressman 				       min(sizeof(resp), udata->outlen));
98340909f66SGal Pressman 		if (err) {
98440909f66SGal Pressman 			ibdev_dbg(ibdev,
98540909f66SGal Pressman 				  "Failed to copy udata for create_cq\n");
98640909f66SGal Pressman 			goto err_destroy_cq;
98740909f66SGal Pressman 		}
98840909f66SGal Pressman 	}
98940909f66SGal Pressman 
990e39afe3dSLeon Romanovsky 	ibdev_dbg(ibdev, "Created cq[%d], cq depth[%u]. dma[%pad] virt[0x%p]\n",
99140909f66SGal Pressman 		  cq->cq_idx, result.actual_depth, &cq->dma_addr, cq->cpu_addr);
99240909f66SGal Pressman 
993e39afe3dSLeon Romanovsky 	return 0;
99440909f66SGal Pressman 
99540909f66SGal Pressman err_destroy_cq:
99640909f66SGal Pressman 	efa_destroy_cq_idx(dev, cq->cq_idx);
99740909f66SGal Pressman err_free_mapped:
99840909f66SGal Pressman 	dma_unmap_single(&dev->pdev->dev, cq->dma_addr, cq->size,
99940909f66SGal Pressman 			 DMA_FROM_DEVICE);
100040909f66SGal Pressman 	if (!cq_entry_inserted)
100140909f66SGal Pressman 		free_pages_exact(cq->cpu_addr, cq->size);
100240909f66SGal Pressman err_out:
100340909f66SGal Pressman 	atomic64_inc(&dev->stats.sw_stats.create_cq_err);
1004e39afe3dSLeon Romanovsky 	return err;
100540909f66SGal Pressman }
100640909f66SGal Pressman 
100740909f66SGal Pressman static int umem_to_page_list(struct efa_dev *dev,
100840909f66SGal Pressman 			     struct ib_umem *umem,
100940909f66SGal Pressman 			     u64 *page_list,
101040909f66SGal Pressman 			     u32 hp_cnt,
101140909f66SGal Pressman 			     u8 hp_shift)
101240909f66SGal Pressman {
101340909f66SGal Pressman 	u32 pages_in_hp = BIT(hp_shift - PAGE_SHIFT);
1014*40ddb3f0SGal Pressman 	struct ib_block_iter biter;
101540909f66SGal Pressman 	unsigned int hp_idx = 0;
101640909f66SGal Pressman 
101740909f66SGal Pressman 	ibdev_dbg(&dev->ibdev, "hp_cnt[%u], pages_in_hp[%u]\n",
101840909f66SGal Pressman 		  hp_cnt, pages_in_hp);
101940909f66SGal Pressman 
1020*40ddb3f0SGal Pressman 	rdma_for_each_block(umem->sg_head.sgl, &biter, umem->nmap,
1021*40ddb3f0SGal Pressman 			    BIT(hp_shift))
1022*40ddb3f0SGal Pressman 		page_list[hp_idx++] = rdma_block_iter_dma_address(&biter);
102340909f66SGal Pressman 
102440909f66SGal Pressman 	return 0;
102540909f66SGal Pressman }
102640909f66SGal Pressman 
102740909f66SGal Pressman static struct scatterlist *efa_vmalloc_buf_to_sg(u64 *buf, int page_cnt)
102840909f66SGal Pressman {
102940909f66SGal Pressman 	struct scatterlist *sglist;
103040909f66SGal Pressman 	struct page *pg;
103140909f66SGal Pressman 	int i;
103240909f66SGal Pressman 
103340909f66SGal Pressman 	sglist = kcalloc(page_cnt, sizeof(*sglist), GFP_KERNEL);
103440909f66SGal Pressman 	if (!sglist)
103540909f66SGal Pressman 		return NULL;
103640909f66SGal Pressman 	sg_init_table(sglist, page_cnt);
103740909f66SGal Pressman 	for (i = 0; i < page_cnt; i++) {
103840909f66SGal Pressman 		pg = vmalloc_to_page(buf);
103940909f66SGal Pressman 		if (!pg)
104040909f66SGal Pressman 			goto err;
104140909f66SGal Pressman 		sg_set_page(&sglist[i], pg, PAGE_SIZE, 0);
104240909f66SGal Pressman 		buf += PAGE_SIZE / sizeof(*buf);
104340909f66SGal Pressman 	}
104440909f66SGal Pressman 	return sglist;
104540909f66SGal Pressman 
104640909f66SGal Pressman err:
104740909f66SGal Pressman 	kfree(sglist);
104840909f66SGal Pressman 	return NULL;
104940909f66SGal Pressman }
105040909f66SGal Pressman 
105140909f66SGal Pressman /*
105240909f66SGal Pressman  * create a chunk list of physical pages dma addresses from the supplied
105340909f66SGal Pressman  * scatter gather list
105440909f66SGal Pressman  */
105540909f66SGal Pressman static int pbl_chunk_list_create(struct efa_dev *dev, struct pbl_context *pbl)
105640909f66SGal Pressman {
105740909f66SGal Pressman 	struct pbl_chunk_list *chunk_list = &pbl->phys.indirect.chunk_list;
105840909f66SGal Pressman 	int page_cnt = pbl->phys.indirect.pbl_buf_size_in_pages;
105940909f66SGal Pressman 	struct scatterlist *pages_sgl = pbl->phys.indirect.sgl;
10604d50e084SGal Pressman 	unsigned int chunk_list_size, chunk_idx, payload_idx;
106140909f66SGal Pressman 	int sg_dma_cnt = pbl->phys.indirect.sg_dma_cnt;
106240909f66SGal Pressman 	struct efa_com_ctrl_buff_info *ctrl_buf;
106340909f66SGal Pressman 	u64 *cur_chunk_buf, *prev_chunk_buf;
10644d50e084SGal Pressman 	struct ib_block_iter biter;
106540909f66SGal Pressman 	dma_addr_t dma_addr;
106640909f66SGal Pressman 	int i;
106740909f66SGal Pressman 
106840909f66SGal Pressman 	/* allocate a chunk list that consists of 4KB chunks */
106940909f66SGal Pressman 	chunk_list_size = DIV_ROUND_UP(page_cnt, EFA_PTRS_PER_CHUNK);
107040909f66SGal Pressman 
107140909f66SGal Pressman 	chunk_list->size = chunk_list_size;
107240909f66SGal Pressman 	chunk_list->chunks = kcalloc(chunk_list_size,
107340909f66SGal Pressman 				     sizeof(*chunk_list->chunks),
107440909f66SGal Pressman 				     GFP_KERNEL);
107540909f66SGal Pressman 	if (!chunk_list->chunks)
107640909f66SGal Pressman 		return -ENOMEM;
107740909f66SGal Pressman 
107840909f66SGal Pressman 	ibdev_dbg(&dev->ibdev,
107940909f66SGal Pressman 		  "chunk_list_size[%u] - pages[%u]\n", chunk_list_size,
108040909f66SGal Pressman 		  page_cnt);
108140909f66SGal Pressman 
108240909f66SGal Pressman 	/* allocate chunk buffers: */
108340909f66SGal Pressman 	for (i = 0; i < chunk_list_size; i++) {
108440909f66SGal Pressman 		chunk_list->chunks[i].buf = kzalloc(EFA_CHUNK_SIZE, GFP_KERNEL);
108540909f66SGal Pressman 		if (!chunk_list->chunks[i].buf)
108640909f66SGal Pressman 			goto chunk_list_dealloc;
108740909f66SGal Pressman 
108840909f66SGal Pressman 		chunk_list->chunks[i].length = EFA_CHUNK_USED_SIZE;
108940909f66SGal Pressman 	}
109040909f66SGal Pressman 	chunk_list->chunks[chunk_list_size - 1].length =
109140909f66SGal Pressman 		((page_cnt % EFA_PTRS_PER_CHUNK) * EFA_CHUNK_PAYLOAD_PTR_SIZE) +
109240909f66SGal Pressman 			EFA_CHUNK_PTR_SIZE;
109340909f66SGal Pressman 
109440909f66SGal Pressman 	/* fill the dma addresses of sg list pages to chunks: */
109540909f66SGal Pressman 	chunk_idx = 0;
109640909f66SGal Pressman 	payload_idx = 0;
109740909f66SGal Pressman 	cur_chunk_buf = chunk_list->chunks[0].buf;
10984d50e084SGal Pressman 	rdma_for_each_block(pages_sgl, &biter, sg_dma_cnt,
10994d50e084SGal Pressman 			    EFA_CHUNK_PAYLOAD_SIZE) {
110040909f66SGal Pressman 		cur_chunk_buf[payload_idx++] =
11014d50e084SGal Pressman 			rdma_block_iter_dma_address(&biter);
110240909f66SGal Pressman 
110340909f66SGal Pressman 		if (payload_idx == EFA_PTRS_PER_CHUNK) {
110440909f66SGal Pressman 			chunk_idx++;
110540909f66SGal Pressman 			cur_chunk_buf = chunk_list->chunks[chunk_idx].buf;
110640909f66SGal Pressman 			payload_idx = 0;
110740909f66SGal Pressman 		}
110840909f66SGal Pressman 	}
110940909f66SGal Pressman 
111040909f66SGal Pressman 	/* map chunks to dma and fill chunks next ptrs */
111140909f66SGal Pressman 	for (i = chunk_list_size - 1; i >= 0; i--) {
111240909f66SGal Pressman 		dma_addr = dma_map_single(&dev->pdev->dev,
111340909f66SGal Pressman 					  chunk_list->chunks[i].buf,
111440909f66SGal Pressman 					  chunk_list->chunks[i].length,
111540909f66SGal Pressman 					  DMA_TO_DEVICE);
111640909f66SGal Pressman 		if (dma_mapping_error(&dev->pdev->dev, dma_addr)) {
111740909f66SGal Pressman 			ibdev_err(&dev->ibdev,
111840909f66SGal Pressman 				  "chunk[%u] dma_map_failed\n", i);
111940909f66SGal Pressman 			goto chunk_list_unmap;
112040909f66SGal Pressman 		}
112140909f66SGal Pressman 
112240909f66SGal Pressman 		chunk_list->chunks[i].dma_addr = dma_addr;
112340909f66SGal Pressman 		ibdev_dbg(&dev->ibdev,
112440909f66SGal Pressman 			  "chunk[%u] mapped at [%pad]\n", i, &dma_addr);
112540909f66SGal Pressman 
112640909f66SGal Pressman 		if (!i)
112740909f66SGal Pressman 			break;
112840909f66SGal Pressman 
112940909f66SGal Pressman 		prev_chunk_buf = chunk_list->chunks[i - 1].buf;
113040909f66SGal Pressman 
113140909f66SGal Pressman 		ctrl_buf = (struct efa_com_ctrl_buff_info *)
113240909f66SGal Pressman 				&prev_chunk_buf[EFA_PTRS_PER_CHUNK];
113340909f66SGal Pressman 		ctrl_buf->length = chunk_list->chunks[i].length;
113440909f66SGal Pressman 
113540909f66SGal Pressman 		efa_com_set_dma_addr(dma_addr,
113640909f66SGal Pressman 				     &ctrl_buf->address.mem_addr_high,
113740909f66SGal Pressman 				     &ctrl_buf->address.mem_addr_low);
113840909f66SGal Pressman 	}
113940909f66SGal Pressman 
114040909f66SGal Pressman 	return 0;
114140909f66SGal Pressman 
114240909f66SGal Pressman chunk_list_unmap:
114340909f66SGal Pressman 	for (; i < chunk_list_size; i++) {
114440909f66SGal Pressman 		dma_unmap_single(&dev->pdev->dev, chunk_list->chunks[i].dma_addr,
114540909f66SGal Pressman 				 chunk_list->chunks[i].length, DMA_TO_DEVICE);
114640909f66SGal Pressman 	}
114740909f66SGal Pressman chunk_list_dealloc:
114840909f66SGal Pressman 	for (i = 0; i < chunk_list_size; i++)
114940909f66SGal Pressman 		kfree(chunk_list->chunks[i].buf);
115040909f66SGal Pressman 
115140909f66SGal Pressman 	kfree(chunk_list->chunks);
115240909f66SGal Pressman 	return -ENOMEM;
115340909f66SGal Pressman }
115440909f66SGal Pressman 
115540909f66SGal Pressman static void pbl_chunk_list_destroy(struct efa_dev *dev, struct pbl_context *pbl)
115640909f66SGal Pressman {
115740909f66SGal Pressman 	struct pbl_chunk_list *chunk_list = &pbl->phys.indirect.chunk_list;
115840909f66SGal Pressman 	int i;
115940909f66SGal Pressman 
116040909f66SGal Pressman 	for (i = 0; i < chunk_list->size; i++) {
116140909f66SGal Pressman 		dma_unmap_single(&dev->pdev->dev, chunk_list->chunks[i].dma_addr,
116240909f66SGal Pressman 				 chunk_list->chunks[i].length, DMA_TO_DEVICE);
116340909f66SGal Pressman 		kfree(chunk_list->chunks[i].buf);
116440909f66SGal Pressman 	}
116540909f66SGal Pressman 
116640909f66SGal Pressman 	kfree(chunk_list->chunks);
116740909f66SGal Pressman }
116840909f66SGal Pressman 
116940909f66SGal Pressman /* initialize pbl continuous mode: map pbl buffer to a dma address. */
117040909f66SGal Pressman static int pbl_continuous_initialize(struct efa_dev *dev,
117140909f66SGal Pressman 				     struct pbl_context *pbl)
117240909f66SGal Pressman {
117340909f66SGal Pressman 	dma_addr_t dma_addr;
117440909f66SGal Pressman 
117540909f66SGal Pressman 	dma_addr = dma_map_single(&dev->pdev->dev, pbl->pbl_buf,
117640909f66SGal Pressman 				  pbl->pbl_buf_size_in_bytes, DMA_TO_DEVICE);
117740909f66SGal Pressman 	if (dma_mapping_error(&dev->pdev->dev, dma_addr)) {
117840909f66SGal Pressman 		ibdev_err(&dev->ibdev, "Unable to map pbl to DMA address\n");
117940909f66SGal Pressman 		return -ENOMEM;
118040909f66SGal Pressman 	}
118140909f66SGal Pressman 
118240909f66SGal Pressman 	pbl->phys.continuous.dma_addr = dma_addr;
118340909f66SGal Pressman 	ibdev_dbg(&dev->ibdev,
118440909f66SGal Pressman 		  "pbl continuous - dma_addr = %pad, size[%u]\n",
118540909f66SGal Pressman 		  &dma_addr, pbl->pbl_buf_size_in_bytes);
118640909f66SGal Pressman 
118740909f66SGal Pressman 	return 0;
118840909f66SGal Pressman }
118940909f66SGal Pressman 
119040909f66SGal Pressman /*
119140909f66SGal Pressman  * initialize pbl indirect mode:
119240909f66SGal Pressman  * create a chunk list out of the dma addresses of the physical pages of
119340909f66SGal Pressman  * pbl buffer.
119440909f66SGal Pressman  */
119540909f66SGal Pressman static int pbl_indirect_initialize(struct efa_dev *dev, struct pbl_context *pbl)
119640909f66SGal Pressman {
119740909f66SGal Pressman 	u32 size_in_pages = DIV_ROUND_UP(pbl->pbl_buf_size_in_bytes, PAGE_SIZE);
119840909f66SGal Pressman 	struct scatterlist *sgl;
119940909f66SGal Pressman 	int sg_dma_cnt, err;
120040909f66SGal Pressman 
120140909f66SGal Pressman 	BUILD_BUG_ON(EFA_CHUNK_PAYLOAD_SIZE > PAGE_SIZE);
120240909f66SGal Pressman 	sgl = efa_vmalloc_buf_to_sg(pbl->pbl_buf, size_in_pages);
120340909f66SGal Pressman 	if (!sgl)
120440909f66SGal Pressman 		return -ENOMEM;
120540909f66SGal Pressman 
120640909f66SGal Pressman 	sg_dma_cnt = dma_map_sg(&dev->pdev->dev, sgl, size_in_pages, DMA_TO_DEVICE);
120740909f66SGal Pressman 	if (!sg_dma_cnt) {
120840909f66SGal Pressman 		err = -EINVAL;
120940909f66SGal Pressman 		goto err_map;
121040909f66SGal Pressman 	}
121140909f66SGal Pressman 
121240909f66SGal Pressman 	pbl->phys.indirect.pbl_buf_size_in_pages = size_in_pages;
121340909f66SGal Pressman 	pbl->phys.indirect.sgl = sgl;
121440909f66SGal Pressman 	pbl->phys.indirect.sg_dma_cnt = sg_dma_cnt;
121540909f66SGal Pressman 	err = pbl_chunk_list_create(dev, pbl);
121640909f66SGal Pressman 	if (err) {
121740909f66SGal Pressman 		ibdev_dbg(&dev->ibdev,
121840909f66SGal Pressman 			  "chunk_list creation failed[%d]\n", err);
121940909f66SGal Pressman 		goto err_chunk;
122040909f66SGal Pressman 	}
122140909f66SGal Pressman 
122240909f66SGal Pressman 	ibdev_dbg(&dev->ibdev,
122340909f66SGal Pressman 		  "pbl indirect - size[%u], chunks[%u]\n",
122440909f66SGal Pressman 		  pbl->pbl_buf_size_in_bytes,
122540909f66SGal Pressman 		  pbl->phys.indirect.chunk_list.size);
122640909f66SGal Pressman 
122740909f66SGal Pressman 	return 0;
122840909f66SGal Pressman 
122940909f66SGal Pressman err_chunk:
123040909f66SGal Pressman 	dma_unmap_sg(&dev->pdev->dev, sgl, size_in_pages, DMA_TO_DEVICE);
123140909f66SGal Pressman err_map:
123240909f66SGal Pressman 	kfree(sgl);
123340909f66SGal Pressman 	return err;
123440909f66SGal Pressman }
123540909f66SGal Pressman 
123640909f66SGal Pressman static void pbl_indirect_terminate(struct efa_dev *dev, struct pbl_context *pbl)
123740909f66SGal Pressman {
123840909f66SGal Pressman 	pbl_chunk_list_destroy(dev, pbl);
123940909f66SGal Pressman 	dma_unmap_sg(&dev->pdev->dev, pbl->phys.indirect.sgl,
124040909f66SGal Pressman 		     pbl->phys.indirect.pbl_buf_size_in_pages, DMA_TO_DEVICE);
124140909f66SGal Pressman 	kfree(pbl->phys.indirect.sgl);
124240909f66SGal Pressman }
124340909f66SGal Pressman 
124440909f66SGal Pressman /* create a page buffer list from a mapped user memory region */
124540909f66SGal Pressman static int pbl_create(struct efa_dev *dev,
124640909f66SGal Pressman 		      struct pbl_context *pbl,
124740909f66SGal Pressman 		      struct ib_umem *umem,
124840909f66SGal Pressman 		      int hp_cnt,
124940909f66SGal Pressman 		      u8 hp_shift)
125040909f66SGal Pressman {
125140909f66SGal Pressman 	int err;
125240909f66SGal Pressman 
125340909f66SGal Pressman 	pbl->pbl_buf_size_in_bytes = hp_cnt * EFA_CHUNK_PAYLOAD_PTR_SIZE;
1254255efcaeSGal Pressman 	pbl->pbl_buf = kvzalloc(pbl->pbl_buf_size_in_bytes, GFP_KERNEL);
1255255efcaeSGal Pressman 	if (!pbl->pbl_buf)
1256255efcaeSGal Pressman 		return -ENOMEM;
1257255efcaeSGal Pressman 
1258255efcaeSGal Pressman 	if (is_vmalloc_addr(pbl->pbl_buf)) {
1259255efcaeSGal Pressman 		pbl->physically_continuous = 0;
1260255efcaeSGal Pressman 		err = umem_to_page_list(dev, umem, pbl->pbl_buf, hp_cnt,
1261255efcaeSGal Pressman 					hp_shift);
1262255efcaeSGal Pressman 		if (err)
1263255efcaeSGal Pressman 			goto err_free;
1264255efcaeSGal Pressman 
1265255efcaeSGal Pressman 		err = pbl_indirect_initialize(dev, pbl);
1266255efcaeSGal Pressman 		if (err)
1267255efcaeSGal Pressman 			goto err_free;
1268255efcaeSGal Pressman 	} else {
126940909f66SGal Pressman 		pbl->physically_continuous = 1;
127040909f66SGal Pressman 		err = umem_to_page_list(dev, umem, pbl->pbl_buf, hp_cnt,
127140909f66SGal Pressman 					hp_shift);
127240909f66SGal Pressman 		if (err)
1273255efcaeSGal Pressman 			goto err_free;
1274255efcaeSGal Pressman 
127540909f66SGal Pressman 		err = pbl_continuous_initialize(dev, pbl);
127640909f66SGal Pressman 		if (err)
1277255efcaeSGal Pressman 			goto err_free;
127840909f66SGal Pressman 	}
127940909f66SGal Pressman 
128040909f66SGal Pressman 	ibdev_dbg(&dev->ibdev,
128140909f66SGal Pressman 		  "user_pbl_created: user_pages[%u], continuous[%u]\n",
128240909f66SGal Pressman 		  hp_cnt, pbl->physically_continuous);
128340909f66SGal Pressman 
128440909f66SGal Pressman 	return 0;
128540909f66SGal Pressman 
1286255efcaeSGal Pressman err_free:
1287255efcaeSGal Pressman 	kvfree(pbl->pbl_buf);
128840909f66SGal Pressman 	return err;
128940909f66SGal Pressman }
129040909f66SGal Pressman 
129140909f66SGal Pressman static void pbl_destroy(struct efa_dev *dev, struct pbl_context *pbl)
129240909f66SGal Pressman {
1293255efcaeSGal Pressman 	if (pbl->physically_continuous)
129440909f66SGal Pressman 		dma_unmap_single(&dev->pdev->dev, pbl->phys.continuous.dma_addr,
129540909f66SGal Pressman 				 pbl->pbl_buf_size_in_bytes, DMA_TO_DEVICE);
1296255efcaeSGal Pressman 	else
129740909f66SGal Pressman 		pbl_indirect_terminate(dev, pbl);
1298255efcaeSGal Pressman 
1299255efcaeSGal Pressman 	kvfree(pbl->pbl_buf);
130040909f66SGal Pressman }
130140909f66SGal Pressman 
130240909f66SGal Pressman static int efa_create_inline_pbl(struct efa_dev *dev, struct efa_mr *mr,
130340909f66SGal Pressman 				 struct efa_com_reg_mr_params *params)
130440909f66SGal Pressman {
130540909f66SGal Pressman 	int err;
130640909f66SGal Pressman 
130740909f66SGal Pressman 	params->inline_pbl = 1;
130840909f66SGal Pressman 	err = umem_to_page_list(dev, mr->umem, params->pbl.inline_pbl_array,
130940909f66SGal Pressman 				params->page_num, params->page_shift);
131040909f66SGal Pressman 	if (err)
131140909f66SGal Pressman 		return err;
131240909f66SGal Pressman 
131340909f66SGal Pressman 	ibdev_dbg(&dev->ibdev,
131440909f66SGal Pressman 		  "inline_pbl_array - pages[%u]\n", params->page_num);
131540909f66SGal Pressman 
131640909f66SGal Pressman 	return 0;
131740909f66SGal Pressman }
131840909f66SGal Pressman 
131940909f66SGal Pressman static int efa_create_pbl(struct efa_dev *dev,
132040909f66SGal Pressman 			  struct pbl_context *pbl,
132140909f66SGal Pressman 			  struct efa_mr *mr,
132240909f66SGal Pressman 			  struct efa_com_reg_mr_params *params)
132340909f66SGal Pressman {
132440909f66SGal Pressman 	int err;
132540909f66SGal Pressman 
132640909f66SGal Pressman 	err = pbl_create(dev, pbl, mr->umem, params->page_num,
132740909f66SGal Pressman 			 params->page_shift);
132840909f66SGal Pressman 	if (err) {
132940909f66SGal Pressman 		ibdev_dbg(&dev->ibdev, "Failed to create pbl[%d]\n", err);
133040909f66SGal Pressman 		return err;
133140909f66SGal Pressman 	}
133240909f66SGal Pressman 
133340909f66SGal Pressman 	params->inline_pbl = 0;
133440909f66SGal Pressman 	params->indirect = !pbl->physically_continuous;
133540909f66SGal Pressman 	if (pbl->physically_continuous) {
133640909f66SGal Pressman 		params->pbl.pbl.length = pbl->pbl_buf_size_in_bytes;
133740909f66SGal Pressman 
133840909f66SGal Pressman 		efa_com_set_dma_addr(pbl->phys.continuous.dma_addr,
133940909f66SGal Pressman 				     &params->pbl.pbl.address.mem_addr_high,
134040909f66SGal Pressman 				     &params->pbl.pbl.address.mem_addr_low);
134140909f66SGal Pressman 	} else {
134240909f66SGal Pressman 		params->pbl.pbl.length =
134340909f66SGal Pressman 			pbl->phys.indirect.chunk_list.chunks[0].length;
134440909f66SGal Pressman 
134540909f66SGal Pressman 		efa_com_set_dma_addr(pbl->phys.indirect.chunk_list.chunks[0].dma_addr,
134640909f66SGal Pressman 				     &params->pbl.pbl.address.mem_addr_high,
134740909f66SGal Pressman 				     &params->pbl.pbl.address.mem_addr_low);
134840909f66SGal Pressman 	}
134940909f66SGal Pressman 
135040909f66SGal Pressman 	return 0;
135140909f66SGal Pressman }
135240909f66SGal Pressman 
135340909f66SGal Pressman struct ib_mr *efa_reg_mr(struct ib_pd *ibpd, u64 start, u64 length,
135440909f66SGal Pressman 			 u64 virt_addr, int access_flags,
135540909f66SGal Pressman 			 struct ib_udata *udata)
135640909f66SGal Pressman {
135740909f66SGal Pressman 	struct efa_dev *dev = to_edev(ibpd->device);
135840909f66SGal Pressman 	struct efa_com_reg_mr_params params = {};
135940909f66SGal Pressman 	struct efa_com_reg_mr_result result = {};
136040909f66SGal Pressman 	struct pbl_context pbl;
1361*40ddb3f0SGal Pressman 	unsigned int pg_sz;
136240909f66SGal Pressman 	struct efa_mr *mr;
136340909f66SGal Pressman 	int inline_size;
136440909f66SGal Pressman 	int err;
136540909f66SGal Pressman 
136640909f66SGal Pressman 	if (udata->inlen &&
136740909f66SGal Pressman 	    !ib_is_udata_cleared(udata, 0, sizeof(udata->inlen))) {
136840909f66SGal Pressman 		ibdev_dbg(&dev->ibdev,
136940909f66SGal Pressman 			  "Incompatible ABI params, udata not cleared\n");
137040909f66SGal Pressman 		err = -EINVAL;
137140909f66SGal Pressman 		goto err_out;
137240909f66SGal Pressman 	}
137340909f66SGal Pressman 
137440909f66SGal Pressman 	if (access_flags & ~EFA_SUPPORTED_ACCESS_FLAGS) {
137540909f66SGal Pressman 		ibdev_dbg(&dev->ibdev,
137640909f66SGal Pressman 			  "Unsupported access flags[%#x], supported[%#x]\n",
137740909f66SGal Pressman 			  access_flags, EFA_SUPPORTED_ACCESS_FLAGS);
137840909f66SGal Pressman 		err = -EOPNOTSUPP;
137940909f66SGal Pressman 		goto err_out;
138040909f66SGal Pressman 	}
138140909f66SGal Pressman 
138240909f66SGal Pressman 	mr = kzalloc(sizeof(*mr), GFP_KERNEL);
138340909f66SGal Pressman 	if (!mr) {
138440909f66SGal Pressman 		err = -ENOMEM;
138540909f66SGal Pressman 		goto err_out;
138640909f66SGal Pressman 	}
138740909f66SGal Pressman 
138840909f66SGal Pressman 	mr->umem = ib_umem_get(udata, start, length, access_flags, 0);
138940909f66SGal Pressman 	if (IS_ERR(mr->umem)) {
139040909f66SGal Pressman 		err = PTR_ERR(mr->umem);
139140909f66SGal Pressman 		ibdev_dbg(&dev->ibdev,
139240909f66SGal Pressman 			  "Failed to pin and map user space memory[%d]\n", err);
139340909f66SGal Pressman 		goto err_free;
139440909f66SGal Pressman 	}
139540909f66SGal Pressman 
139640909f66SGal Pressman 	params.pd = to_epd(ibpd)->pdn;
139740909f66SGal Pressman 	params.iova = virt_addr;
139840909f66SGal Pressman 	params.mr_length_in_bytes = length;
139940909f66SGal Pressman 	params.permissions = access_flags & 0x1;
140040909f66SGal Pressman 
1401*40ddb3f0SGal Pressman 	pg_sz = ib_umem_find_best_pgsz(mr->umem,
1402*40ddb3f0SGal Pressman 				       dev->dev_attr.page_size_cap,
1403*40ddb3f0SGal Pressman 				       virt_addr);
1404*40ddb3f0SGal Pressman 	if (!pg_sz) {
1405*40ddb3f0SGal Pressman 		err = -EOPNOTSUPP;
1406*40ddb3f0SGal Pressman 		ibdev_dbg(&dev->ibdev, "Failed to find a suitable page size in page_size_cap %#llx\n",
1407*40ddb3f0SGal Pressman 			  dev->dev_attr.page_size_cap);
1408*40ddb3f0SGal Pressman 		goto err_unmap;
1409*40ddb3f0SGal Pressman 	}
1410*40ddb3f0SGal Pressman 
1411*40ddb3f0SGal Pressman 	params.page_shift = __ffs(pg_sz);
1412*40ddb3f0SGal Pressman 	params.page_num = DIV_ROUND_UP(length + (start & (pg_sz - 1)),
1413*40ddb3f0SGal Pressman 				       pg_sz);
1414*40ddb3f0SGal Pressman 
141540909f66SGal Pressman 	ibdev_dbg(&dev->ibdev,
1416*40ddb3f0SGal Pressman 		  "start %#llx length %#llx params.page_shift %u params.page_num %u\n",
1417*40ddb3f0SGal Pressman 		  start, length, params.page_shift, params.page_num);
141840909f66SGal Pressman 
141940909f66SGal Pressman 	inline_size = ARRAY_SIZE(params.pbl.inline_pbl_array);
142040909f66SGal Pressman 	if (params.page_num <= inline_size) {
142140909f66SGal Pressman 		err = efa_create_inline_pbl(dev, mr, &params);
142240909f66SGal Pressman 		if (err)
142340909f66SGal Pressman 			goto err_unmap;
142440909f66SGal Pressman 
142540909f66SGal Pressman 		err = efa_com_register_mr(&dev->edev, &params, &result);
142640909f66SGal Pressman 		if (err)
142740909f66SGal Pressman 			goto err_unmap;
142840909f66SGal Pressman 	} else {
142940909f66SGal Pressman 		err = efa_create_pbl(dev, &pbl, mr, &params);
143040909f66SGal Pressman 		if (err)
143140909f66SGal Pressman 			goto err_unmap;
143240909f66SGal Pressman 
143340909f66SGal Pressman 		err = efa_com_register_mr(&dev->edev, &params, &result);
143440909f66SGal Pressman 		pbl_destroy(dev, &pbl);
143540909f66SGal Pressman 
143640909f66SGal Pressman 		if (err)
143740909f66SGal Pressman 			goto err_unmap;
143840909f66SGal Pressman 	}
143940909f66SGal Pressman 
144040909f66SGal Pressman 	mr->ibmr.lkey = result.l_key;
144140909f66SGal Pressman 	mr->ibmr.rkey = result.r_key;
144240909f66SGal Pressman 	mr->ibmr.length = length;
144340909f66SGal Pressman 	ibdev_dbg(&dev->ibdev, "Registered mr[%d]\n", mr->ibmr.lkey);
144440909f66SGal Pressman 
144540909f66SGal Pressman 	return &mr->ibmr;
144640909f66SGal Pressman 
144740909f66SGal Pressman err_unmap:
144840909f66SGal Pressman 	ib_umem_release(mr->umem);
144940909f66SGal Pressman err_free:
145040909f66SGal Pressman 	kfree(mr);
145140909f66SGal Pressman err_out:
145240909f66SGal Pressman 	atomic64_inc(&dev->stats.sw_stats.reg_mr_err);
145340909f66SGal Pressman 	return ERR_PTR(err);
145440909f66SGal Pressman }
145540909f66SGal Pressman 
145640909f66SGal Pressman int efa_dereg_mr(struct ib_mr *ibmr, struct ib_udata *udata)
145740909f66SGal Pressman {
145840909f66SGal Pressman 	struct efa_dev *dev = to_edev(ibmr->device);
145940909f66SGal Pressman 	struct efa_com_dereg_mr_params params;
146040909f66SGal Pressman 	struct efa_mr *mr = to_emr(ibmr);
146140909f66SGal Pressman 	int err;
146240909f66SGal Pressman 
146340909f66SGal Pressman 	ibdev_dbg(&dev->ibdev, "Deregister mr[%d]\n", ibmr->lkey);
146440909f66SGal Pressman 
146540909f66SGal Pressman 	if (mr->umem) {
146640909f66SGal Pressman 		params.l_key = mr->ibmr.lkey;
146740909f66SGal Pressman 		err = efa_com_dereg_mr(&dev->edev, &params);
146840909f66SGal Pressman 		if (err)
146940909f66SGal Pressman 			return err;
147040909f66SGal Pressman 	}
1471836a0fbbSLeon Romanovsky 	ib_umem_release(mr->umem);
147240909f66SGal Pressman 
147340909f66SGal Pressman 	kfree(mr);
147440909f66SGal Pressman 
147540909f66SGal Pressman 	return 0;
147640909f66SGal Pressman }
147740909f66SGal Pressman 
147840909f66SGal Pressman int efa_get_port_immutable(struct ib_device *ibdev, u8 port_num,
147940909f66SGal Pressman 			   struct ib_port_immutable *immutable)
148040909f66SGal Pressman {
148140909f66SGal Pressman 	struct ib_port_attr attr;
148240909f66SGal Pressman 	int err;
148340909f66SGal Pressman 
148440909f66SGal Pressman 	err = ib_query_port(ibdev, port_num, &attr);
148540909f66SGal Pressman 	if (err) {
148640909f66SGal Pressman 		ibdev_dbg(ibdev, "Couldn't query port err[%d]\n", err);
148740909f66SGal Pressman 		return err;
148840909f66SGal Pressman 	}
148940909f66SGal Pressman 
149040909f66SGal Pressman 	immutable->pkey_tbl_len = attr.pkey_tbl_len;
149140909f66SGal Pressman 	immutable->gid_tbl_len = attr.gid_tbl_len;
149240909f66SGal Pressman 
149340909f66SGal Pressman 	return 0;
149440909f66SGal Pressman }
149540909f66SGal Pressman 
149640909f66SGal Pressman static int efa_dealloc_uar(struct efa_dev *dev, u16 uarn)
149740909f66SGal Pressman {
149840909f66SGal Pressman 	struct efa_com_dealloc_uar_params params = {
149940909f66SGal Pressman 		.uarn = uarn,
150040909f66SGal Pressman 	};
150140909f66SGal Pressman 
150240909f66SGal Pressman 	return efa_com_dealloc_uar(&dev->edev, &params);
150340909f66SGal Pressman }
150440909f66SGal Pressman 
150540909f66SGal Pressman int efa_alloc_ucontext(struct ib_ucontext *ibucontext, struct ib_udata *udata)
150640909f66SGal Pressman {
150740909f66SGal Pressman 	struct efa_ucontext *ucontext = to_eucontext(ibucontext);
150840909f66SGal Pressman 	struct efa_dev *dev = to_edev(ibucontext->device);
150940909f66SGal Pressman 	struct efa_ibv_alloc_ucontext_resp resp = {};
151040909f66SGal Pressman 	struct efa_com_alloc_uar_result result;
151140909f66SGal Pressman 	int err;
151240909f66SGal Pressman 
151340909f66SGal Pressman 	/*
151440909f66SGal Pressman 	 * it's fine if the driver does not know all request fields,
151540909f66SGal Pressman 	 * we will ack input fields in our response.
151640909f66SGal Pressman 	 */
151740909f66SGal Pressman 
151840909f66SGal Pressman 	err = efa_com_alloc_uar(&dev->edev, &result);
151940909f66SGal Pressman 	if (err)
152040909f66SGal Pressman 		goto err_out;
152140909f66SGal Pressman 
152240909f66SGal Pressman 	ucontext->uarn = result.uarn;
152340909f66SGal Pressman 	xa_init(&ucontext->mmap_xa);
152440909f66SGal Pressman 
152540909f66SGal Pressman 	resp.cmds_supp_udata_mask |= EFA_USER_CMDS_SUPP_UDATA_QUERY_DEVICE;
152640909f66SGal Pressman 	resp.cmds_supp_udata_mask |= EFA_USER_CMDS_SUPP_UDATA_CREATE_AH;
152740909f66SGal Pressman 	resp.sub_cqs_per_cq = dev->dev_attr.sub_cqs_per_cq;
152840909f66SGal Pressman 	resp.inline_buf_size = dev->dev_attr.inline_buf_size;
152940909f66SGal Pressman 	resp.max_llq_size = dev->dev_attr.max_llq_size;
153040909f66SGal Pressman 
153140909f66SGal Pressman 	if (udata && udata->outlen) {
153240909f66SGal Pressman 		err = ib_copy_to_udata(udata, &resp,
153340909f66SGal Pressman 				       min(sizeof(resp), udata->outlen));
153440909f66SGal Pressman 		if (err)
153540909f66SGal Pressman 			goto err_dealloc_uar;
153640909f66SGal Pressman 	}
153740909f66SGal Pressman 
153840909f66SGal Pressman 	return 0;
153940909f66SGal Pressman 
154040909f66SGal Pressman err_dealloc_uar:
154140909f66SGal Pressman 	efa_dealloc_uar(dev, result.uarn);
154240909f66SGal Pressman err_out:
154340909f66SGal Pressman 	atomic64_inc(&dev->stats.sw_stats.alloc_ucontext_err);
154440909f66SGal Pressman 	return err;
154540909f66SGal Pressman }
154640909f66SGal Pressman 
154740909f66SGal Pressman void efa_dealloc_ucontext(struct ib_ucontext *ibucontext)
154840909f66SGal Pressman {
154940909f66SGal Pressman 	struct efa_ucontext *ucontext = to_eucontext(ibucontext);
155040909f66SGal Pressman 	struct efa_dev *dev = to_edev(ibucontext->device);
155140909f66SGal Pressman 
155240909f66SGal Pressman 	mmap_entries_remove_free(dev, ucontext);
155340909f66SGal Pressman 	efa_dealloc_uar(dev, ucontext->uarn);
155440909f66SGal Pressman }
155540909f66SGal Pressman 
155640909f66SGal Pressman static int __efa_mmap(struct efa_dev *dev, struct efa_ucontext *ucontext,
155740909f66SGal Pressman 		      struct vm_area_struct *vma, u64 key, u64 length)
155840909f66SGal Pressman {
155940909f66SGal Pressman 	struct efa_mmap_entry *entry;
156040909f66SGal Pressman 	unsigned long va;
156140909f66SGal Pressman 	u64 pfn;
156240909f66SGal Pressman 	int err;
156340909f66SGal Pressman 
156440909f66SGal Pressman 	entry = mmap_entry_get(dev, ucontext, key, length);
156540909f66SGal Pressman 	if (!entry) {
156640909f66SGal Pressman 		ibdev_dbg(&dev->ibdev, "key[%#llx] does not have valid entry\n",
156740909f66SGal Pressman 			  key);
156840909f66SGal Pressman 		return -EINVAL;
156940909f66SGal Pressman 	}
157040909f66SGal Pressman 
157140909f66SGal Pressman 	ibdev_dbg(&dev->ibdev,
157240909f66SGal Pressman 		  "Mapping address[%#llx], length[%#llx], mmap_flag[%d]\n",
157340909f66SGal Pressman 		  entry->address, length, entry->mmap_flag);
157440909f66SGal Pressman 
157540909f66SGal Pressman 	pfn = entry->address >> PAGE_SHIFT;
157640909f66SGal Pressman 	switch (entry->mmap_flag) {
157740909f66SGal Pressman 	case EFA_MMAP_IO_NC:
157840909f66SGal Pressman 		err = rdma_user_mmap_io(&ucontext->ibucontext, vma, pfn, length,
157940909f66SGal Pressman 					pgprot_noncached(vma->vm_page_prot));
158040909f66SGal Pressman 		break;
158140909f66SGal Pressman 	case EFA_MMAP_IO_WC:
158240909f66SGal Pressman 		err = rdma_user_mmap_io(&ucontext->ibucontext, vma, pfn, length,
158340909f66SGal Pressman 					pgprot_writecombine(vma->vm_page_prot));
158440909f66SGal Pressman 		break;
158540909f66SGal Pressman 	case EFA_MMAP_DMA_PAGE:
158640909f66SGal Pressman 		for (va = vma->vm_start; va < vma->vm_end;
158740909f66SGal Pressman 		     va += PAGE_SIZE, pfn++) {
158840909f66SGal Pressman 			err = vm_insert_page(vma, va, pfn_to_page(pfn));
158940909f66SGal Pressman 			if (err)
159040909f66SGal Pressman 				break;
159140909f66SGal Pressman 		}
159240909f66SGal Pressman 		break;
159340909f66SGal Pressman 	default:
159440909f66SGal Pressman 		err = -EINVAL;
159540909f66SGal Pressman 	}
159640909f66SGal Pressman 
159740909f66SGal Pressman 	if (err)
159840909f66SGal Pressman 		ibdev_dbg(
159940909f66SGal Pressman 			&dev->ibdev,
160040909f66SGal Pressman 			"Couldn't mmap address[%#llx] length[%#llx] mmap_flag[%d] err[%d]\n",
160140909f66SGal Pressman 			entry->address, length, entry->mmap_flag, err);
160240909f66SGal Pressman 
160340909f66SGal Pressman 	return err;
160440909f66SGal Pressman }
160540909f66SGal Pressman 
160640909f66SGal Pressman int efa_mmap(struct ib_ucontext *ibucontext,
160740909f66SGal Pressman 	     struct vm_area_struct *vma)
160840909f66SGal Pressman {
160940909f66SGal Pressman 	struct efa_ucontext *ucontext = to_eucontext(ibucontext);
161040909f66SGal Pressman 	struct efa_dev *dev = to_edev(ibucontext->device);
161140909f66SGal Pressman 	u64 length = vma->vm_end - vma->vm_start;
161240909f66SGal Pressman 	u64 key = vma->vm_pgoff << PAGE_SHIFT;
161340909f66SGal Pressman 
161440909f66SGal Pressman 	ibdev_dbg(&dev->ibdev,
161540909f66SGal Pressman 		  "start %#lx, end %#lx, length = %#llx, key = %#llx\n",
161640909f66SGal Pressman 		  vma->vm_start, vma->vm_end, length, key);
161740909f66SGal Pressman 
161840909f66SGal Pressman 	if (length % PAGE_SIZE != 0 || !(vma->vm_flags & VM_SHARED)) {
161940909f66SGal Pressman 		ibdev_dbg(&dev->ibdev,
162040909f66SGal Pressman 			  "length[%#llx] is not page size aligned[%#lx] or VM_SHARED is not set [%#lx]\n",
162140909f66SGal Pressman 			  length, PAGE_SIZE, vma->vm_flags);
162240909f66SGal Pressman 		return -EINVAL;
162340909f66SGal Pressman 	}
162440909f66SGal Pressman 
162540909f66SGal Pressman 	if (vma->vm_flags & VM_EXEC) {
162640909f66SGal Pressman 		ibdev_dbg(&dev->ibdev, "Mapping executable pages is not permitted\n");
162740909f66SGal Pressman 		return -EPERM;
162840909f66SGal Pressman 	}
162940909f66SGal Pressman 	vma->vm_flags &= ~VM_MAYEXEC;
163040909f66SGal Pressman 
163140909f66SGal Pressman 	return __efa_mmap(dev, ucontext, vma, key, length);
163240909f66SGal Pressman }
163340909f66SGal Pressman 
163440909f66SGal Pressman static int efa_ah_destroy(struct efa_dev *dev, struct efa_ah *ah)
163540909f66SGal Pressman {
163640909f66SGal Pressman 	struct efa_com_destroy_ah_params params = {
163740909f66SGal Pressman 		.ah = ah->ah,
163840909f66SGal Pressman 		.pdn = to_epd(ah->ibah.pd)->pdn,
163940909f66SGal Pressman 	};
164040909f66SGal Pressman 
164140909f66SGal Pressman 	return efa_com_destroy_ah(&dev->edev, &params);
164240909f66SGal Pressman }
164340909f66SGal Pressman 
164440909f66SGal Pressman int efa_create_ah(struct ib_ah *ibah,
164540909f66SGal Pressman 		  struct rdma_ah_attr *ah_attr,
164640909f66SGal Pressman 		  u32 flags,
164740909f66SGal Pressman 		  struct ib_udata *udata)
164840909f66SGal Pressman {
164940909f66SGal Pressman 	struct efa_dev *dev = to_edev(ibah->device);
165040909f66SGal Pressman 	struct efa_com_create_ah_params params = {};
165140909f66SGal Pressman 	struct efa_ibv_create_ah_resp resp = {};
165240909f66SGal Pressman 	struct efa_com_create_ah_result result;
165340909f66SGal Pressman 	struct efa_ah *ah = to_eah(ibah);
165440909f66SGal Pressman 	int err;
165540909f66SGal Pressman 
165640909f66SGal Pressman 	if (!(flags & RDMA_CREATE_AH_SLEEPABLE)) {
165740909f66SGal Pressman 		ibdev_dbg(&dev->ibdev,
165840909f66SGal Pressman 			  "Create address handle is not supported in atomic context\n");
165940909f66SGal Pressman 		err = -EOPNOTSUPP;
166040909f66SGal Pressman 		goto err_out;
166140909f66SGal Pressman 	}
166240909f66SGal Pressman 
166340909f66SGal Pressman 	if (udata->inlen &&
166440909f66SGal Pressman 	    !ib_is_udata_cleared(udata, 0, udata->inlen)) {
166540909f66SGal Pressman 		ibdev_dbg(&dev->ibdev, "Incompatible ABI params\n");
166640909f66SGal Pressman 		err = -EINVAL;
166740909f66SGal Pressman 		goto err_out;
166840909f66SGal Pressman 	}
166940909f66SGal Pressman 
167040909f66SGal Pressman 	memcpy(params.dest_addr, ah_attr->grh.dgid.raw,
167140909f66SGal Pressman 	       sizeof(params.dest_addr));
167240909f66SGal Pressman 	params.pdn = to_epd(ibah->pd)->pdn;
167340909f66SGal Pressman 	err = efa_com_create_ah(&dev->edev, &params, &result);
167440909f66SGal Pressman 	if (err)
167540909f66SGal Pressman 		goto err_out;
167640909f66SGal Pressman 
167740909f66SGal Pressman 	memcpy(ah->id, ah_attr->grh.dgid.raw, sizeof(ah->id));
167840909f66SGal Pressman 	ah->ah = result.ah;
167940909f66SGal Pressman 
168040909f66SGal Pressman 	resp.efa_address_handle = result.ah;
168140909f66SGal Pressman 
168240909f66SGal Pressman 	if (udata->outlen) {
168340909f66SGal Pressman 		err = ib_copy_to_udata(udata, &resp,
168440909f66SGal Pressman 				       min(sizeof(resp), udata->outlen));
168540909f66SGal Pressman 		if (err) {
168640909f66SGal Pressman 			ibdev_dbg(&dev->ibdev,
168740909f66SGal Pressman 				  "Failed to copy udata for create_ah response\n");
168840909f66SGal Pressman 			goto err_destroy_ah;
168940909f66SGal Pressman 		}
169040909f66SGal Pressman 	}
169140909f66SGal Pressman 	ibdev_dbg(&dev->ibdev, "Created ah[%d]\n", ah->ah);
169240909f66SGal Pressman 
169340909f66SGal Pressman 	return 0;
169440909f66SGal Pressman 
169540909f66SGal Pressman err_destroy_ah:
169640909f66SGal Pressman 	efa_ah_destroy(dev, ah);
169740909f66SGal Pressman err_out:
169840909f66SGal Pressman 	atomic64_inc(&dev->stats.sw_stats.create_ah_err);
169940909f66SGal Pressman 	return err;
170040909f66SGal Pressman }
170140909f66SGal Pressman 
170240909f66SGal Pressman void efa_destroy_ah(struct ib_ah *ibah, u32 flags)
170340909f66SGal Pressman {
170440909f66SGal Pressman 	struct efa_dev *dev = to_edev(ibah->pd->device);
170540909f66SGal Pressman 	struct efa_ah *ah = to_eah(ibah);
170640909f66SGal Pressman 
170740909f66SGal Pressman 	ibdev_dbg(&dev->ibdev, "Destroy ah[%d]\n", ah->ah);
170840909f66SGal Pressman 
170940909f66SGal Pressman 	if (!(flags & RDMA_DESTROY_AH_SLEEPABLE)) {
171040909f66SGal Pressman 		ibdev_dbg(&dev->ibdev,
171140909f66SGal Pressman 			  "Destroy address handle is not supported in atomic context\n");
171240909f66SGal Pressman 		return;
171340909f66SGal Pressman 	}
171440909f66SGal Pressman 
171540909f66SGal Pressman 	efa_ah_destroy(dev, ah);
171640909f66SGal Pressman }
171740909f66SGal Pressman 
171840909f66SGal Pressman enum rdma_link_layer efa_port_link_layer(struct ib_device *ibdev,
171940909f66SGal Pressman 					 u8 port_num)
172040909f66SGal Pressman {
172140909f66SGal Pressman 	return IB_LINK_LAYER_UNSPECIFIED;
172240909f66SGal Pressman }
172340909f66SGal Pressman 
1724