xref: /openbmc/linux/drivers/infiniband/hw/mlx5/main.c (revision 4061ff7aa379fa770a82da0ed7ec4f9163034518)
1e126ba97SEli Cohen /*
26cf0a15fSSaeed Mahameed  * Copyright (c) 2013-2015, Mellanox Technologies. All rights reserved.
3e126ba97SEli Cohen  *
4e126ba97SEli Cohen  * This software is available to you under a choice of one of two
5e126ba97SEli Cohen  * licenses.  You may choose to be licensed under the terms of the GNU
6e126ba97SEli Cohen  * General Public License (GPL) Version 2, available from the file
7e126ba97SEli Cohen  * COPYING in the main directory of this source tree, or the
8e126ba97SEli Cohen  * OpenIB.org BSD license below:
9e126ba97SEli Cohen  *
10e126ba97SEli Cohen  *     Redistribution and use in source and binary forms, with or
11e126ba97SEli Cohen  *     without modification, are permitted provided that the following
12e126ba97SEli Cohen  *     conditions are met:
13e126ba97SEli Cohen  *
14e126ba97SEli Cohen  *      - Redistributions of source code must retain the above
15e126ba97SEli Cohen  *        copyright notice, this list of conditions and the following
16e126ba97SEli Cohen  *        disclaimer.
17e126ba97SEli Cohen  *
18e126ba97SEli Cohen  *      - Redistributions in binary form must reproduce the above
19e126ba97SEli Cohen  *        copyright notice, this list of conditions and the following
20e126ba97SEli Cohen  *        disclaimer in the documentation and/or other materials
21e126ba97SEli Cohen  *        provided with the distribution.
22e126ba97SEli Cohen  *
23e126ba97SEli Cohen  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
24e126ba97SEli Cohen  * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
25e126ba97SEli Cohen  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
26e126ba97SEli Cohen  * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
27e126ba97SEli Cohen  * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
28e126ba97SEli Cohen  * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
29e126ba97SEli Cohen  * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
30e126ba97SEli Cohen  * SOFTWARE.
31e126ba97SEli Cohen  */
32e126ba97SEli Cohen 
33fe248c3aSMaor Gottlieb #include <linux/debugfs.h>
34adec640eSChristoph Hellwig #include <linux/highmem.h>
35e126ba97SEli Cohen #include <linux/module.h>
36e126ba97SEli Cohen #include <linux/init.h>
37e126ba97SEli Cohen #include <linux/errno.h>
38e126ba97SEli Cohen #include <linux/pci.h>
39e126ba97SEli Cohen #include <linux/dma-mapping.h>
40e126ba97SEli Cohen #include <linux/slab.h>
4124da0016SAriel Levkovich #include <linux/bitmap.h>
4237aa5c36SGuy Levi #if defined(CONFIG_X86)
4337aa5c36SGuy Levi #include <asm/pat.h>
4437aa5c36SGuy Levi #endif
45e126ba97SEli Cohen #include <linux/sched.h>
466e84f315SIngo Molnar #include <linux/sched/mm.h>
470881e7bdSIngo Molnar #include <linux/sched/task.h>
487c2344c3SMaor Gottlieb #include <linux/delay.h>
49e126ba97SEli Cohen #include <rdma/ib_user_verbs.h>
503f89a643SAchiad Shochat #include <rdma/ib_addr.h>
512811ba51SAchiad Shochat #include <rdma/ib_cache.h>
52ada68c31SAchiad Shochat #include <linux/mlx5/port.h>
531b5daf11SMajd Dibbiny #include <linux/mlx5/vport.h>
5472c7fe90SPravin Shedge #include <linux/mlx5/fs.h>
55cecae747SMaor Gottlieb #include <linux/mlx5/eswitch.h>
567c2344c3SMaor Gottlieb #include <linux/list.h>
57e126ba97SEli Cohen #include <rdma/ib_smi.h>
58e126ba97SEli Cohen #include <rdma/ib_umem.h>
59038d2ef8SMaor Gottlieb #include <linux/in.h>
60038d2ef8SMaor Gottlieb #include <linux/etherdevice.h>
61e126ba97SEli Cohen #include "mlx5_ib.h"
62fc385b7aSMark Bloch #include "ib_rep.h"
63e1f24a79SParav Pandit #include "cmd.h"
64f3da6577SLeon Romanovsky #include "srq.h"
653346c487SBoris Pismenny #include <linux/mlx5/fs_helpers.h>
66c6475a0bSAviad Yehezkel #include <linux/mlx5/accel.h>
678c84660bSMatan Barak #include <rdma/uverbs_std_types.h>
68c6475a0bSAviad Yehezkel #include <rdma/mlx5_user_ioctl_verbs.h>
69c6475a0bSAviad Yehezkel #include <rdma/mlx5_user_ioctl_cmds.h>
70*4061ff7aSErez Alfasi #include <rdma/ib_umem_odp.h>
718c84660bSMatan Barak 
728c84660bSMatan Barak #define UVERBS_MODULE_NAME mlx5_ib
738c84660bSMatan Barak #include <rdma/uverbs_named_ioctl.h>
74e126ba97SEli Cohen 
75e126ba97SEli Cohen #define DRIVER_NAME "mlx5_ib"
76b359911dSTariq Toukan #define DRIVER_VERSION "5.0-0"
77e126ba97SEli Cohen 
78e126ba97SEli Cohen MODULE_AUTHOR("Eli Cohen <eli@mellanox.com>");
79e126ba97SEli Cohen MODULE_DESCRIPTION("Mellanox Connect-IB HCA IB driver");
80e126ba97SEli Cohen MODULE_LICENSE("Dual BSD/GPL");
81e126ba97SEli Cohen 
82e126ba97SEli Cohen static char mlx5_version[] =
83e126ba97SEli Cohen 	DRIVER_NAME ": Mellanox Connect-IB Infiniband driver v"
84b359911dSTariq Toukan 	DRIVER_VERSION "\n";
85e126ba97SEli Cohen 
86d69a24e0SDaniel Jurgens struct mlx5_ib_event_work {
87d69a24e0SDaniel Jurgens 	struct work_struct	work;
88df097a27SSaeed Mahameed 	union {
89df097a27SSaeed Mahameed 		struct mlx5_ib_dev	      *dev;
90df097a27SSaeed Mahameed 		struct mlx5_ib_multiport_info *mpi;
91df097a27SSaeed Mahameed 	};
92df097a27SSaeed Mahameed 	bool			is_slave;
93134e9349SSaeed Mahameed 	unsigned int		event;
94df097a27SSaeed Mahameed 	void			*param;
95d69a24e0SDaniel Jurgens };
96d69a24e0SDaniel Jurgens 
enum {
	/* Bit 3 set, i.e. the value 8. */
	MLX5_ATOMIC_SIZE_QP_8BYTES = 0x8,
};
1001b5daf11SMajd Dibbiny 
/* Workqueue handle for mlx5_ib events; it is assigned outside this excerpt. */
static struct workqueue_struct *mlx5_ib_event_wq;

/*
 * The two lists below are protected by mlx5_ib_multiport_mutex: hold the
 * mutex whenever either list is accessed.
 */
static LIST_HEAD(mlx5_ib_unaffiliated_port_list);
static LIST_HEAD(mlx5_ib_dev_list);
static DEFINE_MUTEX(mlx5_ib_multiport_mutex);
10832f69e4bSDaniel Jurgens 
109c44ef998SIlya Lesokhin /* We can't use an array for xlt_emergency_page because dma_map_single
110c44ef998SIlya Lesokhin  * doesn't work on kernel modules memory
111c44ef998SIlya Lesokhin  */
112c44ef998SIlya Lesokhin static unsigned long xlt_emergency_page;
113c44ef998SIlya Lesokhin static struct mutex xlt_emergency_page_mutex;
114c44ef998SIlya Lesokhin 
11532f69e4bSDaniel Jurgens struct mlx5_ib_dev *mlx5_ib_get_ibdev_from_mpi(struct mlx5_ib_multiport_info *mpi)
11632f69e4bSDaniel Jurgens {
11732f69e4bSDaniel Jurgens 	struct mlx5_ib_dev *dev;
11832f69e4bSDaniel Jurgens 
11932f69e4bSDaniel Jurgens 	mutex_lock(&mlx5_ib_multiport_mutex);
12032f69e4bSDaniel Jurgens 	dev = mpi->ibdev;
12132f69e4bSDaniel Jurgens 	mutex_unlock(&mlx5_ib_multiport_mutex);
12232f69e4bSDaniel Jurgens 	return dev;
12332f69e4bSDaniel Jurgens }
12432f69e4bSDaniel Jurgens 
1251b5daf11SMajd Dibbiny static enum rdma_link_layer
126ebd61f68SAchiad Shochat mlx5_port_type_cap_to_rdma_ll(int port_type_cap)
1271b5daf11SMajd Dibbiny {
128ebd61f68SAchiad Shochat 	switch (port_type_cap) {
1291b5daf11SMajd Dibbiny 	case MLX5_CAP_PORT_TYPE_IB:
1301b5daf11SMajd Dibbiny 		return IB_LINK_LAYER_INFINIBAND;
1311b5daf11SMajd Dibbiny 	case MLX5_CAP_PORT_TYPE_ETH:
1321b5daf11SMajd Dibbiny 		return IB_LINK_LAYER_ETHERNET;
1331b5daf11SMajd Dibbiny 	default:
1341b5daf11SMajd Dibbiny 		return IB_LINK_LAYER_UNSPECIFIED;
1351b5daf11SMajd Dibbiny 	}
1361b5daf11SMajd Dibbiny }
1371b5daf11SMajd Dibbiny 
138ebd61f68SAchiad Shochat static enum rdma_link_layer
139ebd61f68SAchiad Shochat mlx5_ib_port_link_layer(struct ib_device *device, u8 port_num)
140ebd61f68SAchiad Shochat {
141ebd61f68SAchiad Shochat 	struct mlx5_ib_dev *dev = to_mdev(device);
142ebd61f68SAchiad Shochat 	int port_type_cap = MLX5_CAP_GEN(dev->mdev, port_type);
143ebd61f68SAchiad Shochat 
144ebd61f68SAchiad Shochat 	return mlx5_port_type_cap_to_rdma_ll(port_type_cap);
145ebd61f68SAchiad Shochat }
146ebd61f68SAchiad Shochat 
147fd65f1b8SMoni Shoua static int get_port_state(struct ib_device *ibdev,
148fd65f1b8SMoni Shoua 			  u8 port_num,
149fd65f1b8SMoni Shoua 			  enum ib_port_state *state)
150fd65f1b8SMoni Shoua {
151fd65f1b8SMoni Shoua 	struct ib_port_attr attr;
152fd65f1b8SMoni Shoua 	int ret;
153fd65f1b8SMoni Shoua 
154fd65f1b8SMoni Shoua 	memset(&attr, 0, sizeof(attr));
1553023a1e9SKamal Heib 	ret = ibdev->ops.query_port(ibdev, port_num, &attr);
156fd65f1b8SMoni Shoua 	if (!ret)
157fd65f1b8SMoni Shoua 		*state = attr.state;
158fd65f1b8SMoni Shoua 	return ret;
159fd65f1b8SMoni Shoua }
160fd65f1b8SMoni Shoua 
16135b0aa67SMark Bloch static struct mlx5_roce *mlx5_get_rep_roce(struct mlx5_ib_dev *dev,
16235b0aa67SMark Bloch 					   struct net_device *ndev,
16335b0aa67SMark Bloch 					   u8 *port_num)
16435b0aa67SMark Bloch {
16535b0aa67SMark Bloch 	struct mlx5_eswitch *esw = dev->mdev->priv.eswitch;
16635b0aa67SMark Bloch 	struct net_device *rep_ndev;
16735b0aa67SMark Bloch 	struct mlx5_ib_port *port;
16835b0aa67SMark Bloch 	int i;
16935b0aa67SMark Bloch 
17035b0aa67SMark Bloch 	for (i = 0; i < dev->num_ports; i++) {
17135b0aa67SMark Bloch 		port  = &dev->port[i];
17235b0aa67SMark Bloch 		if (!port->rep)
17335b0aa67SMark Bloch 			continue;
17435b0aa67SMark Bloch 
17535b0aa67SMark Bloch 		read_lock(&port->roce.netdev_lock);
17635b0aa67SMark Bloch 		rep_ndev = mlx5_ib_get_rep_netdev(esw,
17735b0aa67SMark Bloch 						  port->rep->vport);
17835b0aa67SMark Bloch 		if (rep_ndev == ndev) {
17935b0aa67SMark Bloch 			read_unlock(&port->roce.netdev_lock);
18035b0aa67SMark Bloch 			*port_num = i + 1;
18135b0aa67SMark Bloch 			return &port->roce;
18235b0aa67SMark Bloch 		}
18335b0aa67SMark Bloch 		read_unlock(&port->roce.netdev_lock);
18435b0aa67SMark Bloch 	}
18535b0aa67SMark Bloch 
18635b0aa67SMark Bloch 	return NULL;
18735b0aa67SMark Bloch }
18835b0aa67SMark Bloch 
189fc24fc5eSAchiad Shochat static int mlx5_netdev_event(struct notifier_block *this,
190fc24fc5eSAchiad Shochat 			     unsigned long event, void *ptr)
191fc24fc5eSAchiad Shochat {
1927fd8aefbSDaniel Jurgens 	struct mlx5_roce *roce = container_of(this, struct mlx5_roce, nb);
193fc24fc5eSAchiad Shochat 	struct net_device *ndev = netdev_notifier_info_to_dev(ptr);
1947fd8aefbSDaniel Jurgens 	u8 port_num = roce->native_port_num;
1957fd8aefbSDaniel Jurgens 	struct mlx5_core_dev *mdev;
1967fd8aefbSDaniel Jurgens 	struct mlx5_ib_dev *ibdev;
1977fd8aefbSDaniel Jurgens 
1987fd8aefbSDaniel Jurgens 	ibdev = roce->dev;
19932f69e4bSDaniel Jurgens 	mdev = mlx5_ib_get_native_port_mdev(ibdev, port_num, NULL);
20032f69e4bSDaniel Jurgens 	if (!mdev)
20132f69e4bSDaniel Jurgens 		return NOTIFY_DONE;
202fc24fc5eSAchiad Shochat 
2035ec8c83eSAviv Heller 	switch (event) {
2045ec8c83eSAviv Heller 	case NETDEV_REGISTER:
20535b0aa67SMark Bloch 		/* Should already be registered during the load */
20635b0aa67SMark Bloch 		if (ibdev->is_rep)
20735b0aa67SMark Bloch 			break;
2087fd8aefbSDaniel Jurgens 		write_lock(&roce->netdev_lock);
209dce45af5SLinus Torvalds 		if (ndev->dev.parent == mdev->device)
210842a9c83SOr Gerlitz 			roce->netdev = ndev;
2117fd8aefbSDaniel Jurgens 		write_unlock(&roce->netdev_lock);
2125ec8c83eSAviv Heller 		break;
2135ec8c83eSAviv Heller 
214842a9c83SOr Gerlitz 	case NETDEV_UNREGISTER:
21535b0aa67SMark Bloch 		/* In case of reps, ib device goes away before the netdevs */
216842a9c83SOr Gerlitz 		write_lock(&roce->netdev_lock);
217842a9c83SOr Gerlitz 		if (roce->netdev == ndev)
218842a9c83SOr Gerlitz 			roce->netdev = NULL;
219842a9c83SOr Gerlitz 		write_unlock(&roce->netdev_lock);
220842a9c83SOr Gerlitz 		break;
221842a9c83SOr Gerlitz 
222fd65f1b8SMoni Shoua 	case NETDEV_CHANGE:
2235ec8c83eSAviv Heller 	case NETDEV_UP:
22488621dfeSAviv Heller 	case NETDEV_DOWN: {
2257fd8aefbSDaniel Jurgens 		struct net_device *lag_ndev = mlx5_lag_get_roce_netdev(mdev);
22688621dfeSAviv Heller 		struct net_device *upper = NULL;
22788621dfeSAviv Heller 
22888621dfeSAviv Heller 		if (lag_ndev) {
22988621dfeSAviv Heller 			upper = netdev_master_upper_dev_get(lag_ndev);
23088621dfeSAviv Heller 			dev_put(lag_ndev);
23188621dfeSAviv Heller 		}
23288621dfeSAviv Heller 
23335b0aa67SMark Bloch 		if (ibdev->is_rep)
23435b0aa67SMark Bloch 			roce = mlx5_get_rep_roce(ibdev, ndev, &port_num);
23535b0aa67SMark Bloch 		if (!roce)
23635b0aa67SMark Bloch 			return NOTIFY_DONE;
2377fd8aefbSDaniel Jurgens 		if ((upper == ndev || (!upper && ndev == roce->netdev))
23888621dfeSAviv Heller 		    && ibdev->ib_active) {
239626bc02dSBart Van Assche 			struct ib_event ibev = { };
240fd65f1b8SMoni Shoua 			enum ib_port_state port_state;
2415ec8c83eSAviv Heller 
2427fd8aefbSDaniel Jurgens 			if (get_port_state(&ibdev->ib_dev, port_num,
2437fd8aefbSDaniel Jurgens 					   &port_state))
2447fd8aefbSDaniel Jurgens 				goto done;
245fd65f1b8SMoni Shoua 
2467fd8aefbSDaniel Jurgens 			if (roce->last_port_state == port_state)
2477fd8aefbSDaniel Jurgens 				goto done;
248fd65f1b8SMoni Shoua 
2497fd8aefbSDaniel Jurgens 			roce->last_port_state = port_state;
2505ec8c83eSAviv Heller 			ibev.device = &ibdev->ib_dev;
251fd65f1b8SMoni Shoua 			if (port_state == IB_PORT_DOWN)
252fd65f1b8SMoni Shoua 				ibev.event = IB_EVENT_PORT_ERR;
253fd65f1b8SMoni Shoua 			else if (port_state == IB_PORT_ACTIVE)
254fd65f1b8SMoni Shoua 				ibev.event = IB_EVENT_PORT_ACTIVE;
255fd65f1b8SMoni Shoua 			else
2567fd8aefbSDaniel Jurgens 				goto done;
257fd65f1b8SMoni Shoua 
2587fd8aefbSDaniel Jurgens 			ibev.element.port_num = port_num;
2595ec8c83eSAviv Heller 			ib_dispatch_event(&ibev);
2605ec8c83eSAviv Heller 		}
2615ec8c83eSAviv Heller 		break;
26288621dfeSAviv Heller 	}
2635ec8c83eSAviv Heller 
2645ec8c83eSAviv Heller 	default:
2655ec8c83eSAviv Heller 		break;
2665ec8c83eSAviv Heller 	}
2677fd8aefbSDaniel Jurgens done:
26832f69e4bSDaniel Jurgens 	mlx5_ib_put_native_port_mdev(ibdev, port_num);
269fc24fc5eSAchiad Shochat 	return NOTIFY_DONE;
270fc24fc5eSAchiad Shochat }
271fc24fc5eSAchiad Shochat 
272fc24fc5eSAchiad Shochat static struct net_device *mlx5_ib_get_netdev(struct ib_device *device,
273fc24fc5eSAchiad Shochat 					     u8 port_num)
274fc24fc5eSAchiad Shochat {
275fc24fc5eSAchiad Shochat 	struct mlx5_ib_dev *ibdev = to_mdev(device);
276fc24fc5eSAchiad Shochat 	struct net_device *ndev;
27732f69e4bSDaniel Jurgens 	struct mlx5_core_dev *mdev;
278fc24fc5eSAchiad Shochat 
27932f69e4bSDaniel Jurgens 	mdev = mlx5_ib_get_native_port_mdev(ibdev, port_num, NULL);
28032f69e4bSDaniel Jurgens 	if (!mdev)
28132f69e4bSDaniel Jurgens 		return NULL;
28232f69e4bSDaniel Jurgens 
28332f69e4bSDaniel Jurgens 	ndev = mlx5_lag_get_roce_netdev(mdev);
28488621dfeSAviv Heller 	if (ndev)
28532f69e4bSDaniel Jurgens 		goto out;
28688621dfeSAviv Heller 
287fc24fc5eSAchiad Shochat 	/* Ensure ndev does not disappear before we invoke dev_hold()
288fc24fc5eSAchiad Shochat 	 */
28995579e78SMark Bloch 	read_lock(&ibdev->port[port_num - 1].roce.netdev_lock);
29095579e78SMark Bloch 	ndev = ibdev->port[port_num - 1].roce.netdev;
291fc24fc5eSAchiad Shochat 	if (ndev)
292fc24fc5eSAchiad Shochat 		dev_hold(ndev);
29395579e78SMark Bloch 	read_unlock(&ibdev->port[port_num - 1].roce.netdev_lock);
294fc24fc5eSAchiad Shochat 
29532f69e4bSDaniel Jurgens out:
29632f69e4bSDaniel Jurgens 	mlx5_ib_put_native_port_mdev(ibdev, port_num);
297fc24fc5eSAchiad Shochat 	return ndev;
298fc24fc5eSAchiad Shochat }
299fc24fc5eSAchiad Shochat 
30032f69e4bSDaniel Jurgens struct mlx5_core_dev *mlx5_ib_get_native_port_mdev(struct mlx5_ib_dev *ibdev,
30132f69e4bSDaniel Jurgens 						   u8 ib_port_num,
30232f69e4bSDaniel Jurgens 						   u8 *native_port_num)
30332f69e4bSDaniel Jurgens {
30432f69e4bSDaniel Jurgens 	enum rdma_link_layer ll = mlx5_ib_port_link_layer(&ibdev->ib_dev,
30532f69e4bSDaniel Jurgens 							  ib_port_num);
30632f69e4bSDaniel Jurgens 	struct mlx5_core_dev *mdev = NULL;
30732f69e4bSDaniel Jurgens 	struct mlx5_ib_multiport_info *mpi;
30832f69e4bSDaniel Jurgens 	struct mlx5_ib_port *port;
30932f69e4bSDaniel Jurgens 
310210b1f78SMark Bloch 	if (!mlx5_core_mp_enabled(ibdev->mdev) ||
311210b1f78SMark Bloch 	    ll != IB_LINK_LAYER_ETHERNET) {
312210b1f78SMark Bloch 		if (native_port_num)
313210b1f78SMark Bloch 			*native_port_num = ib_port_num;
314210b1f78SMark Bloch 		return ibdev->mdev;
315210b1f78SMark Bloch 	}
316210b1f78SMark Bloch 
31732f69e4bSDaniel Jurgens 	if (native_port_num)
31832f69e4bSDaniel Jurgens 		*native_port_num = 1;
31932f69e4bSDaniel Jurgens 
32032f69e4bSDaniel Jurgens 	port = &ibdev->port[ib_port_num - 1];
32132f69e4bSDaniel Jurgens 	if (!port)
32232f69e4bSDaniel Jurgens 		return NULL;
32332f69e4bSDaniel Jurgens 
32432f69e4bSDaniel Jurgens 	spin_lock(&port->mp.mpi_lock);
32532f69e4bSDaniel Jurgens 	mpi = ibdev->port[ib_port_num - 1].mp.mpi;
32632f69e4bSDaniel Jurgens 	if (mpi && !mpi->unaffiliate) {
32732f69e4bSDaniel Jurgens 		mdev = mpi->mdev;
32832f69e4bSDaniel Jurgens 		/* If it's the master no need to refcount, it'll exist
32932f69e4bSDaniel Jurgens 		 * as long as the ib_dev exists.
33032f69e4bSDaniel Jurgens 		 */
33132f69e4bSDaniel Jurgens 		if (!mpi->is_master)
33232f69e4bSDaniel Jurgens 			mpi->mdev_refcnt++;
33332f69e4bSDaniel Jurgens 	}
33432f69e4bSDaniel Jurgens 	spin_unlock(&port->mp.mpi_lock);
33532f69e4bSDaniel Jurgens 
33632f69e4bSDaniel Jurgens 	return mdev;
33732f69e4bSDaniel Jurgens }
33832f69e4bSDaniel Jurgens 
33932f69e4bSDaniel Jurgens void mlx5_ib_put_native_port_mdev(struct mlx5_ib_dev *ibdev, u8 port_num)
34032f69e4bSDaniel Jurgens {
34132f69e4bSDaniel Jurgens 	enum rdma_link_layer ll = mlx5_ib_port_link_layer(&ibdev->ib_dev,
34232f69e4bSDaniel Jurgens 							  port_num);
34332f69e4bSDaniel Jurgens 	struct mlx5_ib_multiport_info *mpi;
34432f69e4bSDaniel Jurgens 	struct mlx5_ib_port *port;
34532f69e4bSDaniel Jurgens 
34632f69e4bSDaniel Jurgens 	if (!mlx5_core_mp_enabled(ibdev->mdev) || ll != IB_LINK_LAYER_ETHERNET)
34732f69e4bSDaniel Jurgens 		return;
34832f69e4bSDaniel Jurgens 
34932f69e4bSDaniel Jurgens 	port = &ibdev->port[port_num - 1];
35032f69e4bSDaniel Jurgens 
35132f69e4bSDaniel Jurgens 	spin_lock(&port->mp.mpi_lock);
35232f69e4bSDaniel Jurgens 	mpi = ibdev->port[port_num - 1].mp.mpi;
35332f69e4bSDaniel Jurgens 	if (mpi->is_master)
35432f69e4bSDaniel Jurgens 		goto out;
35532f69e4bSDaniel Jurgens 
35632f69e4bSDaniel Jurgens 	mpi->mdev_refcnt--;
35732f69e4bSDaniel Jurgens 	if (mpi->unaffiliate)
35832f69e4bSDaniel Jurgens 		complete(&mpi->unref_comp);
35932f69e4bSDaniel Jurgens out:
36032f69e4bSDaniel Jurgens 	spin_unlock(&port->mp.mpi_lock);
36132f69e4bSDaniel Jurgens }
36232f69e4bSDaniel Jurgens 
36308e8676fSAya Levin static int translate_eth_legacy_proto_oper(u32 eth_proto_oper, u8 *active_speed,
364f1b65df5SNoa Osherovich 					   u8 *active_width)
365f1b65df5SNoa Osherovich {
366f1b65df5SNoa Osherovich 	switch (eth_proto_oper) {
367f1b65df5SNoa Osherovich 	case MLX5E_PROT_MASK(MLX5E_1000BASE_CX_SGMII):
368f1b65df5SNoa Osherovich 	case MLX5E_PROT_MASK(MLX5E_1000BASE_KX):
369f1b65df5SNoa Osherovich 	case MLX5E_PROT_MASK(MLX5E_100BASE_TX):
370f1b65df5SNoa Osherovich 	case MLX5E_PROT_MASK(MLX5E_1000BASE_T):
371f1b65df5SNoa Osherovich 		*active_width = IB_WIDTH_1X;
372f1b65df5SNoa Osherovich 		*active_speed = IB_SPEED_SDR;
373f1b65df5SNoa Osherovich 		break;
374f1b65df5SNoa Osherovich 	case MLX5E_PROT_MASK(MLX5E_10GBASE_T):
375f1b65df5SNoa Osherovich 	case MLX5E_PROT_MASK(MLX5E_10GBASE_CX4):
376f1b65df5SNoa Osherovich 	case MLX5E_PROT_MASK(MLX5E_10GBASE_KX4):
377f1b65df5SNoa Osherovich 	case MLX5E_PROT_MASK(MLX5E_10GBASE_KR):
378f1b65df5SNoa Osherovich 	case MLX5E_PROT_MASK(MLX5E_10GBASE_CR):
379f1b65df5SNoa Osherovich 	case MLX5E_PROT_MASK(MLX5E_10GBASE_SR):
380f1b65df5SNoa Osherovich 	case MLX5E_PROT_MASK(MLX5E_10GBASE_ER):
381f1b65df5SNoa Osherovich 		*active_width = IB_WIDTH_1X;
382f1b65df5SNoa Osherovich 		*active_speed = IB_SPEED_QDR;
383f1b65df5SNoa Osherovich 		break;
384f1b65df5SNoa Osherovich 	case MLX5E_PROT_MASK(MLX5E_25GBASE_CR):
385f1b65df5SNoa Osherovich 	case MLX5E_PROT_MASK(MLX5E_25GBASE_KR):
386f1b65df5SNoa Osherovich 	case MLX5E_PROT_MASK(MLX5E_25GBASE_SR):
387f1b65df5SNoa Osherovich 		*active_width = IB_WIDTH_1X;
388f1b65df5SNoa Osherovich 		*active_speed = IB_SPEED_EDR;
389f1b65df5SNoa Osherovich 		break;
390f1b65df5SNoa Osherovich 	case MLX5E_PROT_MASK(MLX5E_40GBASE_CR4):
391f1b65df5SNoa Osherovich 	case MLX5E_PROT_MASK(MLX5E_40GBASE_KR4):
392f1b65df5SNoa Osherovich 	case MLX5E_PROT_MASK(MLX5E_40GBASE_SR4):
393f1b65df5SNoa Osherovich 	case MLX5E_PROT_MASK(MLX5E_40GBASE_LR4):
394f1b65df5SNoa Osherovich 		*active_width = IB_WIDTH_4X;
395f1b65df5SNoa Osherovich 		*active_speed = IB_SPEED_QDR;
396f1b65df5SNoa Osherovich 		break;
397f1b65df5SNoa Osherovich 	case MLX5E_PROT_MASK(MLX5E_50GBASE_CR2):
398f1b65df5SNoa Osherovich 	case MLX5E_PROT_MASK(MLX5E_50GBASE_KR2):
399f1b65df5SNoa Osherovich 	case MLX5E_PROT_MASK(MLX5E_50GBASE_SR2):
400f1b65df5SNoa Osherovich 		*active_width = IB_WIDTH_1X;
401f1b65df5SNoa Osherovich 		*active_speed = IB_SPEED_HDR;
402f1b65df5SNoa Osherovich 		break;
403f1b65df5SNoa Osherovich 	case MLX5E_PROT_MASK(MLX5E_56GBASE_R4):
404f1b65df5SNoa Osherovich 		*active_width = IB_WIDTH_4X;
405f1b65df5SNoa Osherovich 		*active_speed = IB_SPEED_FDR;
406f1b65df5SNoa Osherovich 		break;
407f1b65df5SNoa Osherovich 	case MLX5E_PROT_MASK(MLX5E_100GBASE_CR4):
408f1b65df5SNoa Osherovich 	case MLX5E_PROT_MASK(MLX5E_100GBASE_SR4):
409f1b65df5SNoa Osherovich 	case MLX5E_PROT_MASK(MLX5E_100GBASE_KR4):
410f1b65df5SNoa Osherovich 	case MLX5E_PROT_MASK(MLX5E_100GBASE_LR4):
411f1b65df5SNoa Osherovich 		*active_width = IB_WIDTH_4X;
412f1b65df5SNoa Osherovich 		*active_speed = IB_SPEED_EDR;
413f1b65df5SNoa Osherovich 		break;
414f1b65df5SNoa Osherovich 	default:
415f1b65df5SNoa Osherovich 		return -EINVAL;
416f1b65df5SNoa Osherovich 	}
417f1b65df5SNoa Osherovich 
418f1b65df5SNoa Osherovich 	return 0;
419f1b65df5SNoa Osherovich }
420f1b65df5SNoa Osherovich 
42108e8676fSAya Levin static int translate_eth_ext_proto_oper(u32 eth_proto_oper, u8 *active_speed,
42208e8676fSAya Levin 					u8 *active_width)
42308e8676fSAya Levin {
42408e8676fSAya Levin 	switch (eth_proto_oper) {
42508e8676fSAya Levin 	case MLX5E_PROT_MASK(MLX5E_SGMII_100M):
42608e8676fSAya Levin 	case MLX5E_PROT_MASK(MLX5E_1000BASE_X_SGMII):
42708e8676fSAya Levin 		*active_width = IB_WIDTH_1X;
42808e8676fSAya Levin 		*active_speed = IB_SPEED_SDR;
42908e8676fSAya Levin 		break;
43008e8676fSAya Levin 	case MLX5E_PROT_MASK(MLX5E_5GBASE_R):
43108e8676fSAya Levin 		*active_width = IB_WIDTH_1X;
43208e8676fSAya Levin 		*active_speed = IB_SPEED_DDR;
43308e8676fSAya Levin 		break;
43408e8676fSAya Levin 	case MLX5E_PROT_MASK(MLX5E_10GBASE_XFI_XAUI_1):
43508e8676fSAya Levin 		*active_width = IB_WIDTH_1X;
43608e8676fSAya Levin 		*active_speed = IB_SPEED_QDR;
43708e8676fSAya Levin 		break;
43808e8676fSAya Levin 	case MLX5E_PROT_MASK(MLX5E_40GBASE_XLAUI_4_XLPPI_4):
43908e8676fSAya Levin 		*active_width = IB_WIDTH_4X;
44008e8676fSAya Levin 		*active_speed = IB_SPEED_QDR;
44108e8676fSAya Levin 		break;
44208e8676fSAya Levin 	case MLX5E_PROT_MASK(MLX5E_25GAUI_1_25GBASE_CR_KR):
44308e8676fSAya Levin 		*active_width = IB_WIDTH_1X;
44408e8676fSAya Levin 		*active_speed = IB_SPEED_EDR;
44508e8676fSAya Levin 		break;
44608e8676fSAya Levin 	case MLX5E_PROT_MASK(MLX5E_50GAUI_2_LAUI_2_50GBASE_CR2_KR2):
447cd272875SAya Levin 		*active_width = IB_WIDTH_2X;
448cd272875SAya Levin 		*active_speed = IB_SPEED_EDR;
449cd272875SAya Levin 		break;
45008e8676fSAya Levin 	case MLX5E_PROT_MASK(MLX5E_50GAUI_1_LAUI_1_50GBASE_CR_KR):
45108e8676fSAya Levin 		*active_width = IB_WIDTH_1X;
45208e8676fSAya Levin 		*active_speed = IB_SPEED_HDR;
45308e8676fSAya Levin 		break;
454cd272875SAya Levin 	case MLX5E_PROT_MASK(MLX5E_CAUI_4_100GBASE_CR4_KR4):
455cd272875SAya Levin 		*active_width = IB_WIDTH_4X;
456cd272875SAya Levin 		*active_speed = IB_SPEED_EDR;
457cd272875SAya Levin 		break;
45808e8676fSAya Levin 	case MLX5E_PROT_MASK(MLX5E_100GAUI_2_100GBASE_CR2_KR2):
45908e8676fSAya Levin 		*active_width = IB_WIDTH_2X;
46008e8676fSAya Levin 		*active_speed = IB_SPEED_HDR;
46108e8676fSAya Levin 		break;
46208e8676fSAya Levin 	case MLX5E_PROT_MASK(MLX5E_200GAUI_4_200GBASE_CR4_KR4):
46308e8676fSAya Levin 		*active_width = IB_WIDTH_4X;
46408e8676fSAya Levin 		*active_speed = IB_SPEED_HDR;
46508e8676fSAya Levin 		break;
46608e8676fSAya Levin 	default:
46708e8676fSAya Levin 		return -EINVAL;
46808e8676fSAya Levin 	}
46908e8676fSAya Levin 
47008e8676fSAya Levin 	return 0;
47108e8676fSAya Levin }
47208e8676fSAya Levin 
47308e8676fSAya Levin static int translate_eth_proto_oper(u32 eth_proto_oper, u8 *active_speed,
47408e8676fSAya Levin 				    u8 *active_width, bool ext)
47508e8676fSAya Levin {
47608e8676fSAya Levin 	return ext ?
47708e8676fSAya Levin 		translate_eth_ext_proto_oper(eth_proto_oper, active_speed,
47808e8676fSAya Levin 					     active_width) :
47908e8676fSAya Levin 		translate_eth_legacy_proto_oper(eth_proto_oper, active_speed,
48008e8676fSAya Levin 						active_width);
48108e8676fSAya Levin }
48208e8676fSAya Levin 
483095b0927SIlan Tayari static int mlx5_query_port_roce(struct ib_device *device, u8 port_num,
4843f89a643SAchiad Shochat 				struct ib_port_attr *props)
4853f89a643SAchiad Shochat {
4863f89a643SAchiad Shochat 	struct mlx5_ib_dev *dev = to_mdev(device);
487bc4e12ffSAya Levin 	u32 out[MLX5_ST_SZ_DW(ptys_reg)] = {0};
488da005f9fSColin Ian King 	struct mlx5_core_dev *mdev;
48988621dfeSAviv Heller 	struct net_device *ndev, *upper;
4903f89a643SAchiad Shochat 	enum ib_mtu ndev_ib_mtu;
491b3cbd6f0SDaniel Jurgens 	bool put_mdev = true;
492c876a1b7SLeon Romanovsky 	u16 qkey_viol_cntr;
493f1b65df5SNoa Osherovich 	u32 eth_prot_oper;
494b3cbd6f0SDaniel Jurgens 	u8 mdev_port_num;
49508e8676fSAya Levin 	bool ext;
496095b0927SIlan Tayari 	int err;
4973f89a643SAchiad Shochat 
498b3cbd6f0SDaniel Jurgens 	mdev = mlx5_ib_get_native_port_mdev(dev, port_num, &mdev_port_num);
499b3cbd6f0SDaniel Jurgens 	if (!mdev) {
500b3cbd6f0SDaniel Jurgens 		/* This means the port isn't affiliated yet. Get the
501b3cbd6f0SDaniel Jurgens 		 * info for the master port instead.
502b3cbd6f0SDaniel Jurgens 		 */
503b3cbd6f0SDaniel Jurgens 		put_mdev = false;
504b3cbd6f0SDaniel Jurgens 		mdev = dev->mdev;
505b3cbd6f0SDaniel Jurgens 		mdev_port_num = 1;
506b3cbd6f0SDaniel Jurgens 		port_num = 1;
507b3cbd6f0SDaniel Jurgens 	}
508b3cbd6f0SDaniel Jurgens 
509f1b65df5SNoa Osherovich 	/* Possible bad flows are checked before filling out props so in case
510f1b65df5SNoa Osherovich 	 * of an error it will still be zeroed out.
51126628e2dSMark Bloch 	 * Use native port in case of reps
51250f22fd8SNoa Osherovich 	 */
51326628e2dSMark Bloch 	if (dev->is_rep)
51426628e2dSMark Bloch 		err = mlx5_query_port_ptys(mdev, out, sizeof(out), MLX5_PTYS_EN,
51526628e2dSMark Bloch 					   1);
51626628e2dSMark Bloch 	else
517bc4e12ffSAya Levin 		err = mlx5_query_port_ptys(mdev, out, sizeof(out), MLX5_PTYS_EN,
518b3cbd6f0SDaniel Jurgens 					   mdev_port_num);
519095b0927SIlan Tayari 	if (err)
520b3cbd6f0SDaniel Jurgens 		goto out;
52108e8676fSAya Levin 	ext = MLX5_CAP_PCAM_FEATURE(dev->mdev, ptys_extended_ethernet);
52208e8676fSAya Levin 	eth_prot_oper = MLX5_GET_ETH_PROTO(ptys_reg, out, ext, eth_proto_oper);
523f1b65df5SNoa Osherovich 
5247672ed33SHonggang Li 	props->active_width     = IB_WIDTH_4X;
5257672ed33SHonggang Li 	props->active_speed     = IB_SPEED_QDR;
5267672ed33SHonggang Li 
527f1b65df5SNoa Osherovich 	translate_eth_proto_oper(eth_prot_oper, &props->active_speed,
52808e8676fSAya Levin 				 &props->active_width, ext);
5293f89a643SAchiad Shochat 
5303f89a643SAchiad Shochat 	props->port_cap_flags |= IB_PORT_CM_SUP;
5312f944c0fSJason Gunthorpe 	props->ip_gids = true;
5323f89a643SAchiad Shochat 
5333f89a643SAchiad Shochat 	props->gid_tbl_len      = MLX5_CAP_ROCE(dev->mdev,
5343f89a643SAchiad Shochat 						roce_address_table_size);
5353f89a643SAchiad Shochat 	props->max_mtu          = IB_MTU_4096;
5363f89a643SAchiad Shochat 	props->max_msg_sz       = 1 << MLX5_CAP_GEN(dev->mdev, log_max_msg);
5373f89a643SAchiad Shochat 	props->pkey_tbl_len     = 1;
5383f89a643SAchiad Shochat 	props->state            = IB_PORT_DOWN;
53972a7720fSKamal Heib 	props->phys_state       = IB_PORT_PHYS_STATE_DISABLED;
5403f89a643SAchiad Shochat 
541b3cbd6f0SDaniel Jurgens 	mlx5_query_nic_vport_qkey_viol_cntr(mdev, &qkey_viol_cntr);
542c876a1b7SLeon Romanovsky 	props->qkey_viol_cntr = qkey_viol_cntr;
5433f89a643SAchiad Shochat 
544b3cbd6f0SDaniel Jurgens 	/* If this is a stub query for an unaffiliated port stop here */
545b3cbd6f0SDaniel Jurgens 	if (!put_mdev)
546b3cbd6f0SDaniel Jurgens 		goto out;
547b3cbd6f0SDaniel Jurgens 
5483f89a643SAchiad Shochat 	ndev = mlx5_ib_get_netdev(device, port_num);
5493f89a643SAchiad Shochat 	if (!ndev)
550b3cbd6f0SDaniel Jurgens 		goto out;
5513f89a643SAchiad Shochat 
5527c34ec19SAviv Heller 	if (dev->lag_active) {
55388621dfeSAviv Heller 		rcu_read_lock();
55488621dfeSAviv Heller 		upper = netdev_master_upper_dev_get_rcu(ndev);
55588621dfeSAviv Heller 		if (upper) {
55688621dfeSAviv Heller 			dev_put(ndev);
55788621dfeSAviv Heller 			ndev = upper;
55888621dfeSAviv Heller 			dev_hold(ndev);
55988621dfeSAviv Heller 		}
56088621dfeSAviv Heller 		rcu_read_unlock();
56188621dfeSAviv Heller 	}
56288621dfeSAviv Heller 
5633f89a643SAchiad Shochat 	if (netif_running(ndev) && netif_carrier_ok(ndev)) {
5643f89a643SAchiad Shochat 		props->state      = IB_PORT_ACTIVE;
56572a7720fSKamal Heib 		props->phys_state = IB_PORT_PHYS_STATE_LINK_UP;
5663f89a643SAchiad Shochat 	}
5673f89a643SAchiad Shochat 
5683f89a643SAchiad Shochat 	ndev_ib_mtu = iboe_get_mtu(ndev->mtu);
5693f89a643SAchiad Shochat 
5703f89a643SAchiad Shochat 	dev_put(ndev);
5713f89a643SAchiad Shochat 
5723f89a643SAchiad Shochat 	props->active_mtu	= min(props->max_mtu, ndev_ib_mtu);
573b3cbd6f0SDaniel Jurgens out:
574b3cbd6f0SDaniel Jurgens 	if (put_mdev)
575b3cbd6f0SDaniel Jurgens 		mlx5_ib_put_native_port_mdev(dev, port_num);
576b3cbd6f0SDaniel Jurgens 	return err;
5773f89a643SAchiad Shochat }
5783f89a643SAchiad Shochat 
579095b0927SIlan Tayari static int set_roce_addr(struct mlx5_ib_dev *dev, u8 port_num,
580095b0927SIlan Tayari 			 unsigned int index, const union ib_gid *gid,
581095b0927SIlan Tayari 			 const struct ib_gid_attr *attr)
5823cca2606SAchiad Shochat {
583095b0927SIlan Tayari 	enum ib_gid_type gid_type = IB_GID_TYPE_IB;
584a70c0739SParav Pandit 	u16 vlan_id = 0xffff;
585095b0927SIlan Tayari 	u8 roce_version = 0;
586095b0927SIlan Tayari 	u8 roce_l3_type = 0;
587095b0927SIlan Tayari 	u8 mac[ETH_ALEN];
588a70c0739SParav Pandit 	int ret;
5893cca2606SAchiad Shochat 
590095b0927SIlan Tayari 	if (gid) {
591095b0927SIlan Tayari 		gid_type = attr->gid_type;
592a70c0739SParav Pandit 		ret = rdma_read_gid_l2_fields(attr, &vlan_id, &mac[0]);
593a70c0739SParav Pandit 		if (ret)
594a70c0739SParav Pandit 			return ret;
5953cca2606SAchiad Shochat 	}
5963cca2606SAchiad Shochat 
597095b0927SIlan Tayari 	switch (gid_type) {
5983cca2606SAchiad Shochat 	case IB_GID_TYPE_IB:
599095b0927SIlan Tayari 		roce_version = MLX5_ROCE_VERSION_1;
6003cca2606SAchiad Shochat 		break;
6013cca2606SAchiad Shochat 	case IB_GID_TYPE_ROCE_UDP_ENCAP:
602095b0927SIlan Tayari 		roce_version = MLX5_ROCE_VERSION_2;
603095b0927SIlan Tayari 		if (ipv6_addr_v4mapped((void *)gid))
604095b0927SIlan Tayari 			roce_l3_type = MLX5_ROCE_L3_TYPE_IPV4;
605095b0927SIlan Tayari 		else
606095b0927SIlan Tayari 			roce_l3_type = MLX5_ROCE_L3_TYPE_IPV6;
6073cca2606SAchiad Shochat 		break;
6083cca2606SAchiad Shochat 
6093cca2606SAchiad Shochat 	default:
610095b0927SIlan Tayari 		mlx5_ib_warn(dev, "Unexpected GID type %u\n", gid_type);
6113cca2606SAchiad Shochat 	}
6123cca2606SAchiad Shochat 
613095b0927SIlan Tayari 	return mlx5_core_roce_gid_set(dev->mdev, index, roce_version,
614cf34e1feSParav Pandit 				      roce_l3_type, gid->raw, mac,
615a70c0739SParav Pandit 				      vlan_id < VLAN_CFI_MASK, vlan_id,
616cf34e1feSParav Pandit 				      port_num);
6173cca2606SAchiad Shochat }
6183cca2606SAchiad Shochat 
619f4df9a7cSParav Pandit static int mlx5_ib_add_gid(const struct ib_gid_attr *attr,
6203cca2606SAchiad Shochat 			   __always_unused void **context)
6213cca2606SAchiad Shochat {
622414448d2SParav Pandit 	return set_roce_addr(to_mdev(attr->device), attr->port_num,
623f4df9a7cSParav Pandit 			     attr->index, &attr->gid, attr);
6243cca2606SAchiad Shochat }
6253cca2606SAchiad Shochat 
626414448d2SParav Pandit static int mlx5_ib_del_gid(const struct ib_gid_attr *attr,
627414448d2SParav Pandit 			   __always_unused void **context)
6283cca2606SAchiad Shochat {
629414448d2SParav Pandit 	return set_roce_addr(to_mdev(attr->device), attr->port_num,
630414448d2SParav Pandit 			     attr->index, NULL, NULL);
6313cca2606SAchiad Shochat }
6323cca2606SAchiad Shochat 
63347ec3866SParav Pandit __be16 mlx5_get_roce_udp_sport(struct mlx5_ib_dev *dev,
63447ec3866SParav Pandit 			       const struct ib_gid_attr *attr)
6352811ba51SAchiad Shochat {
63647ec3866SParav Pandit 	if (attr->gid_type != IB_GID_TYPE_ROCE_UDP_ENCAP)
6372811ba51SAchiad Shochat 		return 0;
6382811ba51SAchiad Shochat 
6392811ba51SAchiad Shochat 	return cpu_to_be16(MLX5_CAP_ROCE(dev->mdev, r_roce_min_src_udp_port));
6402811ba51SAchiad Shochat }
6412811ba51SAchiad Shochat 
6421b5daf11SMajd Dibbiny static int mlx5_use_mad_ifc(struct mlx5_ib_dev *dev)
6431b5daf11SMajd Dibbiny {
6447fae6655SNoa Osherovich 	if (MLX5_CAP_GEN(dev->mdev, port_type) == MLX5_CAP_PORT_TYPE_IB)
645d603c809SEli Cohen 		return !MLX5_CAP_GEN(dev->mdev, ib_virt);
6467fae6655SNoa Osherovich 	return 0;
6471b5daf11SMajd Dibbiny }
6481b5daf11SMajd Dibbiny 
/*
 * Ways of querying vport attributes; the value is chosen by
 * mlx5_get_vport_access_method().
 */
enum {
	/* Chosen when mlx5_use_mad_ifc() reports that MADs should be used. */
	MLX5_VPORT_ACCESS_METHOD_MAD,
	/* Fallback when neither of the other two methods applies. */
	MLX5_VPORT_ACCESS_METHOD_HCA,
	/* Chosen when port 1 has an Ethernet link layer. */
	MLX5_VPORT_ACCESS_METHOD_NIC,
};
6541b5daf11SMajd Dibbiny 
6551b5daf11SMajd Dibbiny static int mlx5_get_vport_access_method(struct ib_device *ibdev)
6561b5daf11SMajd Dibbiny {
6571b5daf11SMajd Dibbiny 	if (mlx5_use_mad_ifc(to_mdev(ibdev)))
6581b5daf11SMajd Dibbiny 		return MLX5_VPORT_ACCESS_METHOD_MAD;
6591b5daf11SMajd Dibbiny 
660ebd61f68SAchiad Shochat 	if (mlx5_ib_port_link_layer(ibdev, 1) ==
6611b5daf11SMajd Dibbiny 	    IB_LINK_LAYER_ETHERNET)
6621b5daf11SMajd Dibbiny 		return MLX5_VPORT_ACCESS_METHOD_NIC;
6631b5daf11SMajd Dibbiny 
6641b5daf11SMajd Dibbiny 	return MLX5_VPORT_ACCESS_METHOD_HCA;
6651b5daf11SMajd Dibbiny }
6661b5daf11SMajd Dibbiny 
667da7525d2SEran Ben Elisha static void get_atomic_caps(struct mlx5_ib_dev *dev,
668776a3906SMoni Shoua 			    u8 atomic_size_qp,
669da7525d2SEran Ben Elisha 			    struct ib_device_attr *props)
670da7525d2SEran Ben Elisha {
671da7525d2SEran Ben Elisha 	u8 tmp;
672da7525d2SEran Ben Elisha 	u8 atomic_operations = MLX5_CAP_ATOMIC(dev->mdev, atomic_operations);
673da7525d2SEran Ben Elisha 	u8 atomic_req_8B_endianness_mode =
674bd10838aSOr Gerlitz 		MLX5_CAP_ATOMIC(dev->mdev, atomic_req_8B_endianness_mode);
675da7525d2SEran Ben Elisha 
676da7525d2SEran Ben Elisha 	/* Check if HW supports 8 bytes standard atomic operations and capable
677da7525d2SEran Ben Elisha 	 * of host endianness respond
678da7525d2SEran Ben Elisha 	 */
679da7525d2SEran Ben Elisha 	tmp = MLX5_ATOMIC_OPS_CMP_SWAP | MLX5_ATOMIC_OPS_FETCH_ADD;
680da7525d2SEran Ben Elisha 	if (((atomic_operations & tmp) == tmp) &&
681da7525d2SEran Ben Elisha 	    (atomic_size_qp & MLX5_ATOMIC_SIZE_QP_8BYTES) &&
682da7525d2SEran Ben Elisha 	    (atomic_req_8B_endianness_mode)) {
683da7525d2SEran Ben Elisha 		props->atomic_cap = IB_ATOMIC_HCA;
684da7525d2SEran Ben Elisha 	} else {
685da7525d2SEran Ben Elisha 		props->atomic_cap = IB_ATOMIC_NONE;
686da7525d2SEran Ben Elisha 	}
687da7525d2SEran Ben Elisha }
688da7525d2SEran Ben Elisha 
689776a3906SMoni Shoua static void get_atomic_caps_qp(struct mlx5_ib_dev *dev,
690776a3906SMoni Shoua 			       struct ib_device_attr *props)
691776a3906SMoni Shoua {
692776a3906SMoni Shoua 	u8 atomic_size_qp = MLX5_CAP_ATOMIC(dev->mdev, atomic_size_qp);
693776a3906SMoni Shoua 
694776a3906SMoni Shoua 	get_atomic_caps(dev, atomic_size_qp, props);
695776a3906SMoni Shoua }
696776a3906SMoni Shoua 
697776a3906SMoni Shoua static void get_atomic_caps_dc(struct mlx5_ib_dev *dev,
698776a3906SMoni Shoua 			       struct ib_device_attr *props)
699776a3906SMoni Shoua {
700776a3906SMoni Shoua 	u8 atomic_size_qp = MLX5_CAP_ATOMIC(dev->mdev, atomic_size_dc);
701776a3906SMoni Shoua 
702776a3906SMoni Shoua 	get_atomic_caps(dev, atomic_size_qp, props);
703776a3906SMoni Shoua }
704776a3906SMoni Shoua 
705776a3906SMoni Shoua bool mlx5_ib_dc_atomic_is_supported(struct mlx5_ib_dev *dev)
706776a3906SMoni Shoua {
707776a3906SMoni Shoua 	struct ib_device_attr props = {};
708776a3906SMoni Shoua 
709776a3906SMoni Shoua 	get_atomic_caps_dc(dev, &props);
710776a3906SMoni Shoua 	return (props.atomic_cap == IB_ATOMIC_HCA) ? true : false;
711776a3906SMoni Shoua }
7121b5daf11SMajd Dibbiny static int mlx5_query_system_image_guid(struct ib_device *ibdev,
7131b5daf11SMajd Dibbiny 					__be64 *sys_image_guid)
7141b5daf11SMajd Dibbiny {
7151b5daf11SMajd Dibbiny 	struct mlx5_ib_dev *dev = to_mdev(ibdev);
7161b5daf11SMajd Dibbiny 	struct mlx5_core_dev *mdev = dev->mdev;
7171b5daf11SMajd Dibbiny 	u64 tmp;
7181b5daf11SMajd Dibbiny 	int err;
7191b5daf11SMajd Dibbiny 
7201b5daf11SMajd Dibbiny 	switch (mlx5_get_vport_access_method(ibdev)) {
7211b5daf11SMajd Dibbiny 	case MLX5_VPORT_ACCESS_METHOD_MAD:
7221b5daf11SMajd Dibbiny 		return mlx5_query_mad_ifc_system_image_guid(ibdev,
7231b5daf11SMajd Dibbiny 							    sys_image_guid);
7241b5daf11SMajd Dibbiny 
7251b5daf11SMajd Dibbiny 	case MLX5_VPORT_ACCESS_METHOD_HCA:
7261b5daf11SMajd Dibbiny 		err = mlx5_query_hca_vport_system_image_guid(mdev, &tmp);
7273f89a643SAchiad Shochat 		break;
7283f89a643SAchiad Shochat 
7293f89a643SAchiad Shochat 	case MLX5_VPORT_ACCESS_METHOD_NIC:
7303f89a643SAchiad Shochat 		err = mlx5_query_nic_vport_system_image_guid(mdev, &tmp);
7313f89a643SAchiad Shochat 		break;
7321b5daf11SMajd Dibbiny 
7331b5daf11SMajd Dibbiny 	default:
7341b5daf11SMajd Dibbiny 		return -EINVAL;
7351b5daf11SMajd Dibbiny 	}
7363f89a643SAchiad Shochat 
7373f89a643SAchiad Shochat 	if (!err)
7383f89a643SAchiad Shochat 		*sys_image_guid = cpu_to_be64(tmp);
7393f89a643SAchiad Shochat 
7403f89a643SAchiad Shochat 	return err;
7413f89a643SAchiad Shochat 
7421b5daf11SMajd Dibbiny }
7431b5daf11SMajd Dibbiny 
7441b5daf11SMajd Dibbiny static int mlx5_query_max_pkeys(struct ib_device *ibdev,
7451b5daf11SMajd Dibbiny 				u16 *max_pkeys)
7461b5daf11SMajd Dibbiny {
7471b5daf11SMajd Dibbiny 	struct mlx5_ib_dev *dev = to_mdev(ibdev);
7481b5daf11SMajd Dibbiny 	struct mlx5_core_dev *mdev = dev->mdev;
7491b5daf11SMajd Dibbiny 
7501b5daf11SMajd Dibbiny 	switch (mlx5_get_vport_access_method(ibdev)) {
7511b5daf11SMajd Dibbiny 	case MLX5_VPORT_ACCESS_METHOD_MAD:
7521b5daf11SMajd Dibbiny 		return mlx5_query_mad_ifc_max_pkeys(ibdev, max_pkeys);
7531b5daf11SMajd Dibbiny 
7541b5daf11SMajd Dibbiny 	case MLX5_VPORT_ACCESS_METHOD_HCA:
7551b5daf11SMajd Dibbiny 	case MLX5_VPORT_ACCESS_METHOD_NIC:
7561b5daf11SMajd Dibbiny 		*max_pkeys = mlx5_to_sw_pkey_sz(MLX5_CAP_GEN(mdev,
7571b5daf11SMajd Dibbiny 						pkey_table_size));
7581b5daf11SMajd Dibbiny 		return 0;
7591b5daf11SMajd Dibbiny 
7601b5daf11SMajd Dibbiny 	default:
7611b5daf11SMajd Dibbiny 		return -EINVAL;
7621b5daf11SMajd Dibbiny 	}
7631b5daf11SMajd Dibbiny }
7641b5daf11SMajd Dibbiny 
7651b5daf11SMajd Dibbiny static int mlx5_query_vendor_id(struct ib_device *ibdev,
7661b5daf11SMajd Dibbiny 				u32 *vendor_id)
7671b5daf11SMajd Dibbiny {
7681b5daf11SMajd Dibbiny 	struct mlx5_ib_dev *dev = to_mdev(ibdev);
7691b5daf11SMajd Dibbiny 
7701b5daf11SMajd Dibbiny 	switch (mlx5_get_vport_access_method(ibdev)) {
7711b5daf11SMajd Dibbiny 	case MLX5_VPORT_ACCESS_METHOD_MAD:
7721b5daf11SMajd Dibbiny 		return mlx5_query_mad_ifc_vendor_id(ibdev, vendor_id);
7731b5daf11SMajd Dibbiny 
7741b5daf11SMajd Dibbiny 	case MLX5_VPORT_ACCESS_METHOD_HCA:
7751b5daf11SMajd Dibbiny 	case MLX5_VPORT_ACCESS_METHOD_NIC:
7761b5daf11SMajd Dibbiny 		return mlx5_core_query_vendor_id(dev->mdev, vendor_id);
7771b5daf11SMajd Dibbiny 
7781b5daf11SMajd Dibbiny 	default:
7791b5daf11SMajd Dibbiny 		return -EINVAL;
7801b5daf11SMajd Dibbiny 	}
7811b5daf11SMajd Dibbiny }
7821b5daf11SMajd Dibbiny 
7831b5daf11SMajd Dibbiny static int mlx5_query_node_guid(struct mlx5_ib_dev *dev,
7841b5daf11SMajd Dibbiny 				__be64 *node_guid)
7851b5daf11SMajd Dibbiny {
7861b5daf11SMajd Dibbiny 	u64 tmp;
7871b5daf11SMajd Dibbiny 	int err;
7881b5daf11SMajd Dibbiny 
7891b5daf11SMajd Dibbiny 	switch (mlx5_get_vport_access_method(&dev->ib_dev)) {
7901b5daf11SMajd Dibbiny 	case MLX5_VPORT_ACCESS_METHOD_MAD:
7911b5daf11SMajd Dibbiny 		return mlx5_query_mad_ifc_node_guid(dev, node_guid);
7921b5daf11SMajd Dibbiny 
7931b5daf11SMajd Dibbiny 	case MLX5_VPORT_ACCESS_METHOD_HCA:
7941b5daf11SMajd Dibbiny 		err = mlx5_query_hca_vport_node_guid(dev->mdev, &tmp);
7953f89a643SAchiad Shochat 		break;
7963f89a643SAchiad Shochat 
7973f89a643SAchiad Shochat 	case MLX5_VPORT_ACCESS_METHOD_NIC:
7983f89a643SAchiad Shochat 		err = mlx5_query_nic_vport_node_guid(dev->mdev, &tmp);
7993f89a643SAchiad Shochat 		break;
8001b5daf11SMajd Dibbiny 
8011b5daf11SMajd Dibbiny 	default:
8021b5daf11SMajd Dibbiny 		return -EINVAL;
8031b5daf11SMajd Dibbiny 	}
8043f89a643SAchiad Shochat 
8053f89a643SAchiad Shochat 	if (!err)
8063f89a643SAchiad Shochat 		*node_guid = cpu_to_be64(tmp);
8073f89a643SAchiad Shochat 
8083f89a643SAchiad Shochat 	return err;
8091b5daf11SMajd Dibbiny }
8101b5daf11SMajd Dibbiny 
/*
 * Buffer layout for the MLX5_REG_NODE_DESC register access issued by
 * mlx5_query_node_desc().
 */
struct mlx5_reg_node_desc {
	u8	desc[IB_DEVICE_NODE_DESC_MAX];	/* node description bytes */
};
8141b5daf11SMajd Dibbiny 
8151b5daf11SMajd Dibbiny static int mlx5_query_node_desc(struct mlx5_ib_dev *dev, char *node_desc)
8161b5daf11SMajd Dibbiny {
8171b5daf11SMajd Dibbiny 	struct mlx5_reg_node_desc in;
8181b5daf11SMajd Dibbiny 
8191b5daf11SMajd Dibbiny 	if (mlx5_use_mad_ifc(dev))
8201b5daf11SMajd Dibbiny 		return mlx5_query_mad_ifc_node_desc(dev, node_desc);
8211b5daf11SMajd Dibbiny 
8221b5daf11SMajd Dibbiny 	memset(&in, 0, sizeof(in));
8231b5daf11SMajd Dibbiny 
8241b5daf11SMajd Dibbiny 	return mlx5_core_access_reg(dev->mdev, &in, sizeof(in), node_desc,
8251b5daf11SMajd Dibbiny 				    sizeof(struct mlx5_reg_node_desc),
8261b5daf11SMajd Dibbiny 				    MLX5_REG_NODE_DESC, 0, 0);
8271b5daf11SMajd Dibbiny }
8281b5daf11SMajd Dibbiny 
829e126ba97SEli Cohen static int mlx5_ib_query_device(struct ib_device *ibdev,
8302528e33eSMatan Barak 				struct ib_device_attr *props,
8312528e33eSMatan Barak 				struct ib_udata *uhw)
832e126ba97SEli Cohen {
833e126ba97SEli Cohen 	struct mlx5_ib_dev *dev = to_mdev(ibdev);
834938fe83cSSaeed Mahameed 	struct mlx5_core_dev *mdev = dev->mdev;
835e126ba97SEli Cohen 	int err = -ENOMEM;
836288c01b7SEli Cohen 	int max_sq_desc;
837e126ba97SEli Cohen 	int max_rq_sg;
838e126ba97SEli Cohen 	int max_sq_sg;
839e0238a6aSSagi Grimberg 	u64 min_page_size = 1ull << MLX5_CAP_GEN(mdev, log_pg_sz);
84085c7c014SDaniel Jurgens 	bool raw_support = !mlx5_core_mp_enabled(mdev);
841402ca536SBodong Wang 	struct mlx5_ib_query_device_resp resp = {};
842402ca536SBodong Wang 	size_t resp_len;
843402ca536SBodong Wang 	u64 max_tso;
844e126ba97SEli Cohen 
845402ca536SBodong Wang 	resp_len = sizeof(resp.comp_mask) + sizeof(resp.response_length);
846402ca536SBodong Wang 	if (uhw->outlen && uhw->outlen < resp_len)
847402ca536SBodong Wang 		return -EINVAL;
8486f26b2acSErez Alfasi 
849402ca536SBodong Wang 	resp.response_length = resp_len;
850402ca536SBodong Wang 
851402ca536SBodong Wang 	if (uhw->inlen && !ib_is_udata_cleared(uhw, 0, uhw->inlen))
8522528e33eSMatan Barak 		return -EINVAL;
8532528e33eSMatan Barak 
854e126ba97SEli Cohen 	memset(props, 0, sizeof(*props));
8551b5daf11SMajd Dibbiny 	err = mlx5_query_system_image_guid(ibdev,
8561b5daf11SMajd Dibbiny 					   &props->sys_image_guid);
8571b5daf11SMajd Dibbiny 	if (err)
8581b5daf11SMajd Dibbiny 		return err;
8591b5daf11SMajd Dibbiny 
8601b5daf11SMajd Dibbiny 	err = mlx5_query_max_pkeys(ibdev, &props->max_pkeys);
8611b5daf11SMajd Dibbiny 	if (err)
8621b5daf11SMajd Dibbiny 		return err;
8631b5daf11SMajd Dibbiny 
8641b5daf11SMajd Dibbiny 	err = mlx5_query_vendor_id(ibdev, &props->vendor_id);
8651b5daf11SMajd Dibbiny 	if (err)
8661b5daf11SMajd Dibbiny 		return err;
867e126ba97SEli Cohen 
8689603b61dSJack Morgenstein 	props->fw_ver = ((u64)fw_rev_maj(dev->mdev) << 32) |
8699603b61dSJack Morgenstein 		(fw_rev_min(dev->mdev) << 16) |
8709603b61dSJack Morgenstein 		fw_rev_sub(dev->mdev);
871e126ba97SEli Cohen 	props->device_cap_flags    = IB_DEVICE_CHANGE_PHY_PORT |
872e126ba97SEli Cohen 		IB_DEVICE_PORT_ACTIVE_EVENT		|
873e126ba97SEli Cohen 		IB_DEVICE_SYS_IMAGE_GUID		|
8741a4c3a3dSEli Cohen 		IB_DEVICE_RC_RNR_NAK_GEN;
875938fe83cSSaeed Mahameed 
876938fe83cSSaeed Mahameed 	if (MLX5_CAP_GEN(mdev, pkv))
877e126ba97SEli Cohen 		props->device_cap_flags |= IB_DEVICE_BAD_PKEY_CNTR;
878938fe83cSSaeed Mahameed 	if (MLX5_CAP_GEN(mdev, qkv))
879e126ba97SEli Cohen 		props->device_cap_flags |= IB_DEVICE_BAD_QKEY_CNTR;
880938fe83cSSaeed Mahameed 	if (MLX5_CAP_GEN(mdev, apm))
881e126ba97SEli Cohen 		props->device_cap_flags |= IB_DEVICE_AUTO_PATH_MIG;
882938fe83cSSaeed Mahameed 	if (MLX5_CAP_GEN(mdev, xrc))
883e126ba97SEli Cohen 		props->device_cap_flags |= IB_DEVICE_XRC;
884d2370e0aSMatan Barak 	if (MLX5_CAP_GEN(mdev, imaicl)) {
885d2370e0aSMatan Barak 		props->device_cap_flags |= IB_DEVICE_MEM_WINDOW |
886d2370e0aSMatan Barak 					   IB_DEVICE_MEM_WINDOW_TYPE_2B;
887d2370e0aSMatan Barak 		props->max_mw = 1 << MLX5_CAP_GEN(mdev, log_max_mkey);
888b005d316SSagi Grimberg 		/* We support 'Gappy' memory registration too */
889b005d316SSagi Grimberg 		props->device_cap_flags |= IB_DEVICE_SG_GAPS_REG;
890d2370e0aSMatan Barak 	}
891e126ba97SEli Cohen 	props->device_cap_flags |= IB_DEVICE_MEM_MGT_EXTENSIONS;
892938fe83cSSaeed Mahameed 	if (MLX5_CAP_GEN(mdev, sho)) {
893c0a6cbb9SIsrael Rukshin 		props->device_cap_flags |= IB_DEVICE_INTEGRITY_HANDOVER;
8942dea9094SSagi Grimberg 		/* At this stage no support for signature handover */
8952dea9094SSagi Grimberg 		props->sig_prot_cap = IB_PROT_T10DIF_TYPE_1 |
8962dea9094SSagi Grimberg 				      IB_PROT_T10DIF_TYPE_2 |
8972dea9094SSagi Grimberg 				      IB_PROT_T10DIF_TYPE_3;
8982dea9094SSagi Grimberg 		props->sig_guard_cap = IB_GUARD_T10DIF_CRC |
8992dea9094SSagi Grimberg 				       IB_GUARD_T10DIF_CSUM;
9002dea9094SSagi Grimberg 	}
901938fe83cSSaeed Mahameed 	if (MLX5_CAP_GEN(mdev, block_lb_mc))
902f360d88aSEli Cohen 		props->device_cap_flags |= IB_DEVICE_BLOCK_MULTICAST_LOOPBACK;
903e126ba97SEli Cohen 
90485c7c014SDaniel Jurgens 	if (MLX5_CAP_GEN(dev->mdev, eth_net_offloads) && raw_support) {
905e8161334SNoa Osherovich 		if (MLX5_CAP_ETH(mdev, csum_cap)) {
906e8161334SNoa Osherovich 			/* Legacy bit to support old userspace libraries */
90788115fe7SBodong Wang 			props->device_cap_flags |= IB_DEVICE_RAW_IP_CSUM;
908e8161334SNoa Osherovich 			props->raw_packet_caps |= IB_RAW_PACKET_CAP_IP_CSUM;
909e8161334SNoa Osherovich 		}
910e8161334SNoa Osherovich 
911e8161334SNoa Osherovich 		if (MLX5_CAP_ETH(dev->mdev, vlan_cap))
912e8161334SNoa Osherovich 			props->raw_packet_caps |=
913e8161334SNoa Osherovich 				IB_RAW_PACKET_CAP_CVLAN_STRIPPING;
91488115fe7SBodong Wang 
915402ca536SBodong Wang 		if (field_avail(typeof(resp), tso_caps, uhw->outlen)) {
916402ca536SBodong Wang 			max_tso = MLX5_CAP_ETH(mdev, max_lso_cap);
917402ca536SBodong Wang 			if (max_tso) {
918402ca536SBodong Wang 				resp.tso_caps.max_tso = 1 << max_tso;
919402ca536SBodong Wang 				resp.tso_caps.supported_qpts |=
920402ca536SBodong Wang 					1 << IB_QPT_RAW_PACKET;
921402ca536SBodong Wang 				resp.response_length += sizeof(resp.tso_caps);
922402ca536SBodong Wang 			}
923402ca536SBodong Wang 		}
92431f69a82SYishai Hadas 
92531f69a82SYishai Hadas 		if (field_avail(typeof(resp), rss_caps, uhw->outlen)) {
92631f69a82SYishai Hadas 			resp.rss_caps.rx_hash_function =
92731f69a82SYishai Hadas 						MLX5_RX_HASH_FUNC_TOEPLITZ;
92831f69a82SYishai Hadas 			resp.rss_caps.rx_hash_fields_mask =
92931f69a82SYishai Hadas 						MLX5_RX_HASH_SRC_IPV4 |
93031f69a82SYishai Hadas 						MLX5_RX_HASH_DST_IPV4 |
93131f69a82SYishai Hadas 						MLX5_RX_HASH_SRC_IPV6 |
93231f69a82SYishai Hadas 						MLX5_RX_HASH_DST_IPV6 |
93331f69a82SYishai Hadas 						MLX5_RX_HASH_SRC_PORT_TCP |
93431f69a82SYishai Hadas 						MLX5_RX_HASH_DST_PORT_TCP |
93531f69a82SYishai Hadas 						MLX5_RX_HASH_SRC_PORT_UDP |
9364e2b53a5SMaor Gottlieb 						MLX5_RX_HASH_DST_PORT_UDP |
9374e2b53a5SMaor Gottlieb 						MLX5_RX_HASH_INNER;
9382d93fc85SMatan Barak 			if (mlx5_accel_ipsec_device_caps(dev->mdev) &
9392d93fc85SMatan Barak 			    MLX5_ACCEL_IPSEC_CAP_DEVICE)
9402d93fc85SMatan Barak 				resp.rss_caps.rx_hash_fields_mask |=
9412d93fc85SMatan Barak 					MLX5_RX_HASH_IPSEC_SPI;
94231f69a82SYishai Hadas 			resp.response_length += sizeof(resp.rss_caps);
94331f69a82SYishai Hadas 		}
94431f69a82SYishai Hadas 	} else {
94531f69a82SYishai Hadas 		if (field_avail(typeof(resp), tso_caps, uhw->outlen))
94631f69a82SYishai Hadas 			resp.response_length += sizeof(resp.tso_caps);
94731f69a82SYishai Hadas 		if (field_avail(typeof(resp), rss_caps, uhw->outlen))
94831f69a82SYishai Hadas 			resp.response_length += sizeof(resp.rss_caps);
949402ca536SBodong Wang 	}
950402ca536SBodong Wang 
951f0313965SErez Shitrit 	if (MLX5_CAP_GEN(mdev, ipoib_basic_offloads)) {
952f0313965SErez Shitrit 		props->device_cap_flags |= IB_DEVICE_UD_IP_CSUM;
953f0313965SErez Shitrit 		props->device_cap_flags |= IB_DEVICE_UD_TSO;
954f0313965SErez Shitrit 	}
955f0313965SErez Shitrit 
95603404e8aSMaor Gottlieb 	if (MLX5_CAP_GEN(dev->mdev, rq_delay_drop) &&
95785c7c014SDaniel Jurgens 	    MLX5_CAP_GEN(dev->mdev, general_notification_event) &&
95885c7c014SDaniel Jurgens 	    raw_support)
95903404e8aSMaor Gottlieb 		props->raw_packet_caps |= IB_RAW_PACKET_CAP_DELAY_DROP;
96003404e8aSMaor Gottlieb 
9611d54f890SYishai Hadas 	if (MLX5_CAP_GEN(mdev, ipoib_enhanced_offloads) &&
9621d54f890SYishai Hadas 	    MLX5_CAP_IPOIB_ENHANCED(mdev, csum_cap))
9631d54f890SYishai Hadas 		props->device_cap_flags |= IB_DEVICE_UD_IP_CSUM;
9641d54f890SYishai Hadas 
965cff5a0f3SMajd Dibbiny 	if (MLX5_CAP_GEN(dev->mdev, eth_net_offloads) &&
96685c7c014SDaniel Jurgens 	    MLX5_CAP_ETH(dev->mdev, scatter_fcs) &&
96785c7c014SDaniel Jurgens 	    raw_support) {
968e8161334SNoa Osherovich 		/* Legacy bit to support old userspace libraries */
969cff5a0f3SMajd Dibbiny 		props->device_cap_flags |= IB_DEVICE_RAW_SCATTER_FCS;
970e8161334SNoa Osherovich 		props->raw_packet_caps |= IB_RAW_PACKET_CAP_SCATTER_FCS;
971e8161334SNoa Osherovich 	}
972cff5a0f3SMajd Dibbiny 
97324da0016SAriel Levkovich 	if (MLX5_CAP_DEV_MEM(mdev, memic)) {
97424da0016SAriel Levkovich 		props->max_dm_size =
97524da0016SAriel Levkovich 			MLX5_CAP_DEV_MEM(mdev, max_memic_size);
97624da0016SAriel Levkovich 	}
97724da0016SAriel Levkovich 
978da6d6ba3SMaor Gottlieb 	if (mlx5_get_flow_namespace(dev->mdev, MLX5_FLOW_NAMESPACE_BYPASS))
979da6d6ba3SMaor Gottlieb 		props->device_cap_flags |= IB_DEVICE_MANAGED_FLOW_STEERING;
980da6d6ba3SMaor Gottlieb 
981b1383aa6SNoa Osherovich 	if (MLX5_CAP_GEN(mdev, end_pad))
982b1383aa6SNoa Osherovich 		props->device_cap_flags |= IB_DEVICE_PCI_WRITE_END_PADDING;
983b1383aa6SNoa Osherovich 
9841b5daf11SMajd Dibbiny 	props->vendor_part_id	   = mdev->pdev->device;
9851b5daf11SMajd Dibbiny 	props->hw_ver		   = mdev->pdev->revision;
986e126ba97SEli Cohen 
987e126ba97SEli Cohen 	props->max_mr_size	   = ~0ull;
988e0238a6aSSagi Grimberg 	props->page_size_cap	   = ~(min_page_size - 1);
989938fe83cSSaeed Mahameed 	props->max_qp		   = 1 << MLX5_CAP_GEN(mdev, log_max_qp);
990938fe83cSSaeed Mahameed 	props->max_qp_wr	   = 1 << MLX5_CAP_GEN(mdev, log_max_qp_sz);
991938fe83cSSaeed Mahameed 	max_rq_sg =  MLX5_CAP_GEN(mdev, max_wqe_sz_rq) /
992938fe83cSSaeed Mahameed 		     sizeof(struct mlx5_wqe_data_seg);
993288c01b7SEli Cohen 	max_sq_desc = min_t(int, MLX5_CAP_GEN(mdev, max_wqe_sz_sq), 512);
994288c01b7SEli Cohen 	max_sq_sg = (max_sq_desc - sizeof(struct mlx5_wqe_ctrl_seg) -
995288c01b7SEli Cohen 		     sizeof(struct mlx5_wqe_raddr_seg)) /
996e126ba97SEli Cohen 		sizeof(struct mlx5_wqe_data_seg);
99733023fb8SSteve Wise 	props->max_send_sge = max_sq_sg;
99833023fb8SSteve Wise 	props->max_recv_sge = max_rq_sg;
999986ef95eSSagi Grimberg 	props->max_sge_rd	   = MLX5_MAX_SGE_RD;
1000938fe83cSSaeed Mahameed 	props->max_cq		   = 1 << MLX5_CAP_GEN(mdev, log_max_cq);
10019f177686SLeon Romanovsky 	props->max_cqe = (1 << MLX5_CAP_GEN(mdev, log_max_cq_sz)) - 1;
1002938fe83cSSaeed Mahameed 	props->max_mr		   = 1 << MLX5_CAP_GEN(mdev, log_max_mkey);
1003938fe83cSSaeed Mahameed 	props->max_pd		   = 1 << MLX5_CAP_GEN(mdev, log_max_pd);
1004938fe83cSSaeed Mahameed 	props->max_qp_rd_atom	   = 1 << MLX5_CAP_GEN(mdev, log_max_ra_req_qp);
1005938fe83cSSaeed Mahameed 	props->max_qp_init_rd_atom = 1 << MLX5_CAP_GEN(mdev, log_max_ra_res_qp);
1006938fe83cSSaeed Mahameed 	props->max_srq		   = 1 << MLX5_CAP_GEN(mdev, log_max_srq);
1007938fe83cSSaeed Mahameed 	props->max_srq_wr = (1 << MLX5_CAP_GEN(mdev, log_max_srq_sz)) - 1;
1008938fe83cSSaeed Mahameed 	props->local_ca_ack_delay  = MLX5_CAP_GEN(mdev, local_ca_ack_delay);
1009e126ba97SEli Cohen 	props->max_res_rd_atom	   = props->max_qp_rd_atom * props->max_qp;
1010e126ba97SEli Cohen 	props->max_srq_sge	   = max_rq_sg - 1;
1011911f4331SSagi Grimberg 	props->max_fast_reg_page_list_len =
1012911f4331SSagi Grimberg 		1 << MLX5_CAP_GEN(mdev, log_max_klm_list_size);
101362e3c379SMax Gurtovoy 	props->max_pi_fast_reg_page_list_len =
101462e3c379SMax Gurtovoy 		props->max_fast_reg_page_list_len / 2;
101536609056SYamin Friedman 	props->max_sgl_rd =
101636609056SYamin Friedman 		MLX5_CAP_GEN(mdev, max_sgl_for_optimized_performance);
1017776a3906SMoni Shoua 	get_atomic_caps_qp(dev, props);
101881bea28fSEli Cohen 	props->masked_atomic_cap   = IB_ATOMIC_NONE;
1019938fe83cSSaeed Mahameed 	props->max_mcast_grp	   = 1 << MLX5_CAP_GEN(mdev, log_max_mcg);
1020938fe83cSSaeed Mahameed 	props->max_mcast_qp_attach = MLX5_CAP_GEN(mdev, max_qp_mcg);
1021e126ba97SEli Cohen 	props->max_total_mcast_qp_attach = props->max_mcast_qp_attach *
1022e126ba97SEli Cohen 					   props->max_mcast_grp;
1023e126ba97SEli Cohen 	props->max_map_per_fmr = INT_MAX; /* no limit in ConnectIB */
102486695a65SMaor Gottlieb 	props->max_ah = INT_MAX;
10257c60bcbbSMatan Barak 	props->hca_core_clock = MLX5_CAP_GEN(mdev, device_frequency_khz);
10267c60bcbbSMatan Barak 	props->timestamp_mask = 0x7FFFFFFFFFFFFFFFULL;
1027e126ba97SEli Cohen 
1028e502b8b0SLeon Romanovsky 	if (IS_ENABLED(CONFIG_INFINIBAND_ON_DEMAND_PAGING)) {
102900815752SMoni Shoua 		if (dev->odp_caps.general_caps & IB_ODP_SUPPORT)
10308cdd312cSHaggai Eran 			props->device_cap_flags |= IB_DEVICE_ON_DEMAND_PAGING;
10318cdd312cSHaggai Eran 		props->odp_caps = dev->odp_caps;
1032e502b8b0SLeon Romanovsky 	}
10338cdd312cSHaggai Eran 
1034051f2630SLeon Romanovsky 	if (MLX5_CAP_GEN(mdev, cd))
1035051f2630SLeon Romanovsky 		props->device_cap_flags |= IB_DEVICE_CROSS_CHANNEL;
1036051f2630SLeon Romanovsky 
1037eff901d3SEli Cohen 	if (!mlx5_core_is_pf(mdev))
1038eff901d3SEli Cohen 		props->device_cap_flags |= IB_DEVICE_VIRTUAL_FUNCTION;
1039eff901d3SEli Cohen 
104031f69a82SYishai Hadas 	if (mlx5_ib_port_link_layer(ibdev, 1) ==
104185c7c014SDaniel Jurgens 	    IB_LINK_LAYER_ETHERNET && raw_support) {
104231f69a82SYishai Hadas 		props->rss_caps.max_rwq_indirection_tables =
104331f69a82SYishai Hadas 			1 << MLX5_CAP_GEN(dev->mdev, log_max_rqt);
104431f69a82SYishai Hadas 		props->rss_caps.max_rwq_indirection_table_size =
104531f69a82SYishai Hadas 			1 << MLX5_CAP_GEN(dev->mdev, log_max_rqt_size);
104631f69a82SYishai Hadas 		props->rss_caps.supported_qpts = 1 << IB_QPT_RAW_PACKET;
104731f69a82SYishai Hadas 		props->max_wq_type_rq =
104831f69a82SYishai Hadas 			1 << MLX5_CAP_GEN(dev->mdev, log_max_rq);
104931f69a82SYishai Hadas 	}
105031f69a82SYishai Hadas 
1051eb761894SArtemy Kovalyov 	if (MLX5_CAP_GEN(mdev, tag_matching)) {
105278b1beb0SLeon Romanovsky 		props->tm_caps.max_num_tags =
1053eb761894SArtemy Kovalyov 			(1 << MLX5_CAP_GEN(mdev, log_tag_matching_list_sz)) - 1;
105478b1beb0SLeon Romanovsky 		props->tm_caps.max_ops =
1055eb761894SArtemy Kovalyov 			1 << MLX5_CAP_GEN(mdev, log_max_qp_sz);
105678b1beb0SLeon Romanovsky 		props->tm_caps.max_sge = MLX5_TM_MAX_SGE;
1057eb761894SArtemy Kovalyov 	}
1058eb761894SArtemy Kovalyov 
105989705e92SDanit Goldberg 	if (MLX5_CAP_GEN(mdev, tag_matching) &&
106089705e92SDanit Goldberg 	    MLX5_CAP_GEN(mdev, rndv_offload_rc)) {
106189705e92SDanit Goldberg 		props->tm_caps.flags = IB_TM_CAP_RNDV_RC;
106289705e92SDanit Goldberg 		props->tm_caps.max_rndv_hdr_size = MLX5_TM_MAX_RNDV_MSG_SIZE;
106389705e92SDanit Goldberg 	}
106489705e92SDanit Goldberg 
106587ab3f52SYonatan Cohen 	if (MLX5_CAP_GEN(dev->mdev, cq_moderation)) {
106687ab3f52SYonatan Cohen 		props->cq_caps.max_cq_moderation_count =
106787ab3f52SYonatan Cohen 						MLX5_MAX_CQ_COUNT;
106887ab3f52SYonatan Cohen 		props->cq_caps.max_cq_moderation_period =
106987ab3f52SYonatan Cohen 						MLX5_MAX_CQ_PERIOD;
107087ab3f52SYonatan Cohen 	}
107187ab3f52SYonatan Cohen 
10727e43a2a5SBodong Wang 	if (field_avail(typeof(resp), cqe_comp_caps, uhw->outlen)) {
1073572f46bfSYonatan Cohen 		resp.response_length += sizeof(resp.cqe_comp_caps);
1074572f46bfSYonatan Cohen 
1075572f46bfSYonatan Cohen 		if (MLX5_CAP_GEN(dev->mdev, cqe_compression)) {
10767e43a2a5SBodong Wang 			resp.cqe_comp_caps.max_num =
1077572f46bfSYonatan Cohen 				MLX5_CAP_GEN(dev->mdev,
1078572f46bfSYonatan Cohen 					     cqe_compression_max_num);
1079572f46bfSYonatan Cohen 
10807e43a2a5SBodong Wang 			resp.cqe_comp_caps.supported_format =
10817e43a2a5SBodong Wang 				MLX5_IB_CQE_RES_FORMAT_HASH |
10827e43a2a5SBodong Wang 				MLX5_IB_CQE_RES_FORMAT_CSUM;
10836f1006a4SYonatan Cohen 
10846f1006a4SYonatan Cohen 			if (MLX5_CAP_GEN(dev->mdev, mini_cqe_resp_stride_index))
10856f1006a4SYonatan Cohen 				resp.cqe_comp_caps.supported_format |=
10866f1006a4SYonatan Cohen 					MLX5_IB_CQE_RES_FORMAT_CSUM_STRIDX;
1087572f46bfSYonatan Cohen 		}
10887e43a2a5SBodong Wang 	}
10897e43a2a5SBodong Wang 
109085c7c014SDaniel Jurgens 	if (field_avail(typeof(resp), packet_pacing_caps, uhw->outlen) &&
109185c7c014SDaniel Jurgens 	    raw_support) {
1092d949167dSBodong Wang 		if (MLX5_CAP_QOS(mdev, packet_pacing) &&
1093d949167dSBodong Wang 		    MLX5_CAP_GEN(mdev, qos)) {
1094d949167dSBodong Wang 			resp.packet_pacing_caps.qp_rate_limit_max =
1095d949167dSBodong Wang 				MLX5_CAP_QOS(mdev, packet_pacing_max_rate);
1096d949167dSBodong Wang 			resp.packet_pacing_caps.qp_rate_limit_min =
1097d949167dSBodong Wang 				MLX5_CAP_QOS(mdev, packet_pacing_min_rate);
1098d949167dSBodong Wang 			resp.packet_pacing_caps.supported_qpts |=
1099d949167dSBodong Wang 				1 << IB_QPT_RAW_PACKET;
110061147f39SBodong Wang 			if (MLX5_CAP_QOS(mdev, packet_pacing_burst_bound) &&
110161147f39SBodong Wang 			    MLX5_CAP_QOS(mdev, packet_pacing_typical_size))
110261147f39SBodong Wang 				resp.packet_pacing_caps.cap_flags |=
110361147f39SBodong Wang 					MLX5_IB_PP_SUPPORT_BURST;
1104d949167dSBodong Wang 		}
1105d949167dSBodong Wang 		resp.response_length += sizeof(resp.packet_pacing_caps);
1106d949167dSBodong Wang 	}
1107d949167dSBodong Wang 
11089f885201SLeon Romanovsky 	if (field_avail(typeof(resp), mlx5_ib_support_multi_pkt_send_wqes,
11099f885201SLeon Romanovsky 			uhw->outlen)) {
1110795b609cSBodong Wang 		if (MLX5_CAP_ETH(mdev, multi_pkt_send_wqe))
11119f885201SLeon Romanovsky 			resp.mlx5_ib_support_multi_pkt_send_wqes =
1112795b609cSBodong Wang 				MLX5_IB_ALLOW_MPW;
1113050da902SBodong Wang 
1114050da902SBodong Wang 		if (MLX5_CAP_ETH(mdev, enhanced_multi_pkt_send_wqe))
1115050da902SBodong Wang 			resp.mlx5_ib_support_multi_pkt_send_wqes |=
1116050da902SBodong Wang 				MLX5_IB_SUPPORT_EMPW;
1117050da902SBodong Wang 
11189f885201SLeon Romanovsky 		resp.response_length +=
11199f885201SLeon Romanovsky 			sizeof(resp.mlx5_ib_support_multi_pkt_send_wqes);
11209f885201SLeon Romanovsky 	}
11219f885201SLeon Romanovsky 
1122de57f2adSGuy Levi 	if (field_avail(typeof(resp), flags, uhw->outlen)) {
1123de57f2adSGuy Levi 		resp.response_length += sizeof(resp.flags);
11247a0c8f42SGuy Levi 
1125de57f2adSGuy Levi 		if (MLX5_CAP_GEN(mdev, cqe_compression_128))
1126de57f2adSGuy Levi 			resp.flags |=
1127de57f2adSGuy Levi 				MLX5_IB_QUERY_DEV_RESP_FLAGS_CQE_128B_COMP;
11287a0c8f42SGuy Levi 
11297a0c8f42SGuy Levi 		if (MLX5_CAP_GEN(mdev, cqe_128_always))
11307a0c8f42SGuy Levi 			resp.flags |= MLX5_IB_QUERY_DEV_RESP_FLAGS_CQE_128B_PAD;
11317e11b911SDanit Goldberg 		if (MLX5_CAP_GEN(mdev, qp_packet_based))
11327e11b911SDanit Goldberg 			resp.flags |=
11337e11b911SDanit Goldberg 				MLX5_IB_QUERY_DEV_RESP_PACKET_BASED_CREDIT_MODE;
11347249c8eaSGuy Levi 
11357249c8eaSGuy Levi 		resp.flags |= MLX5_IB_QUERY_DEV_RESP_FLAGS_SCAT2CQE_DCT;
1136de57f2adSGuy Levi 	}
11379f885201SLeon Romanovsky 
113896dc3fc5SNoa Osherovich 	if (field_avail(typeof(resp), sw_parsing_caps,
113996dc3fc5SNoa Osherovich 			uhw->outlen)) {
114096dc3fc5SNoa Osherovich 		resp.response_length += sizeof(resp.sw_parsing_caps);
114196dc3fc5SNoa Osherovich 		if (MLX5_CAP_ETH(mdev, swp)) {
114296dc3fc5SNoa Osherovich 			resp.sw_parsing_caps.sw_parsing_offloads |=
114396dc3fc5SNoa Osherovich 				MLX5_IB_SW_PARSING;
114496dc3fc5SNoa Osherovich 
114596dc3fc5SNoa Osherovich 			if (MLX5_CAP_ETH(mdev, swp_csum))
114696dc3fc5SNoa Osherovich 				resp.sw_parsing_caps.sw_parsing_offloads |=
114796dc3fc5SNoa Osherovich 					MLX5_IB_SW_PARSING_CSUM;
114896dc3fc5SNoa Osherovich 
114996dc3fc5SNoa Osherovich 			if (MLX5_CAP_ETH(mdev, swp_lso))
115096dc3fc5SNoa Osherovich 				resp.sw_parsing_caps.sw_parsing_offloads |=
115196dc3fc5SNoa Osherovich 					MLX5_IB_SW_PARSING_LSO;
115296dc3fc5SNoa Osherovich 
115396dc3fc5SNoa Osherovich 			if (resp.sw_parsing_caps.sw_parsing_offloads)
115496dc3fc5SNoa Osherovich 				resp.sw_parsing_caps.supported_qpts =
115596dc3fc5SNoa Osherovich 					BIT(IB_QPT_RAW_PACKET);
115696dc3fc5SNoa Osherovich 		}
115796dc3fc5SNoa Osherovich 	}
115896dc3fc5SNoa Osherovich 
115985c7c014SDaniel Jurgens 	if (field_avail(typeof(resp), striding_rq_caps, uhw->outlen) &&
116085c7c014SDaniel Jurgens 	    raw_support) {
1161b4f34597SNoa Osherovich 		resp.response_length += sizeof(resp.striding_rq_caps);
1162b4f34597SNoa Osherovich 		if (MLX5_CAP_GEN(mdev, striding_rq)) {
1163b4f34597SNoa Osherovich 			resp.striding_rq_caps.min_single_stride_log_num_of_bytes =
1164b4f34597SNoa Osherovich 				MLX5_MIN_SINGLE_STRIDE_LOG_NUM_BYTES;
1165b4f34597SNoa Osherovich 			resp.striding_rq_caps.max_single_stride_log_num_of_bytes =
1166b4f34597SNoa Osherovich 				MLX5_MAX_SINGLE_STRIDE_LOG_NUM_BYTES;
1167b4f34597SNoa Osherovich 			resp.striding_rq_caps.min_single_wqe_log_num_of_strides =
1168b4f34597SNoa Osherovich 				MLX5_MIN_SINGLE_WQE_LOG_NUM_STRIDES;
1169b4f34597SNoa Osherovich 			resp.striding_rq_caps.max_single_wqe_log_num_of_strides =
1170b4f34597SNoa Osherovich 				MLX5_MAX_SINGLE_WQE_LOG_NUM_STRIDES;
1171b4f34597SNoa Osherovich 			resp.striding_rq_caps.supported_qpts =
1172b4f34597SNoa Osherovich 				BIT(IB_QPT_RAW_PACKET);
1173b4f34597SNoa Osherovich 		}
1174b4f34597SNoa Osherovich 	}
1175b4f34597SNoa Osherovich 
1176f95ef6cbSMaor Gottlieb 	if (field_avail(typeof(resp), tunnel_offloads_caps,
1177f95ef6cbSMaor Gottlieb 			uhw->outlen)) {
1178f95ef6cbSMaor Gottlieb 		resp.response_length += sizeof(resp.tunnel_offloads_caps);
1179f95ef6cbSMaor Gottlieb 		if (MLX5_CAP_ETH(mdev, tunnel_stateless_vxlan))
1180f95ef6cbSMaor Gottlieb 			resp.tunnel_offloads_caps |=
1181f95ef6cbSMaor Gottlieb 				MLX5_IB_TUNNELED_OFFLOADS_VXLAN;
1182f95ef6cbSMaor Gottlieb 		if (MLX5_CAP_ETH(mdev, tunnel_stateless_geneve_rx))
1183f95ef6cbSMaor Gottlieb 			resp.tunnel_offloads_caps |=
1184f95ef6cbSMaor Gottlieb 				MLX5_IB_TUNNELED_OFFLOADS_GENEVE;
1185f95ef6cbSMaor Gottlieb 		if (MLX5_CAP_ETH(mdev, tunnel_stateless_gre))
1186f95ef6cbSMaor Gottlieb 			resp.tunnel_offloads_caps |=
1187f95ef6cbSMaor Gottlieb 				MLX5_IB_TUNNELED_OFFLOADS_GRE;
1188e818e255SAriel Levkovich 		if (MLX5_CAP_GEN(mdev, flex_parser_protocols) &
1189e818e255SAriel Levkovich 		    MLX5_FLEX_PROTO_CW_MPLS_GRE)
1190e818e255SAriel Levkovich 			resp.tunnel_offloads_caps |=
1191e818e255SAriel Levkovich 				MLX5_IB_TUNNELED_OFFLOADS_MPLS_GRE;
1192e818e255SAriel Levkovich 		if (MLX5_CAP_GEN(mdev, flex_parser_protocols) &
1193e818e255SAriel Levkovich 		    MLX5_FLEX_PROTO_CW_MPLS_UDP)
1194e818e255SAriel Levkovich 			resp.tunnel_offloads_caps |=
1195e818e255SAriel Levkovich 				MLX5_IB_TUNNELED_OFFLOADS_MPLS_UDP;
1196f95ef6cbSMaor Gottlieb 	}
1197f95ef6cbSMaor Gottlieb 
1198402ca536SBodong Wang 	if (uhw->outlen) {
1199402ca536SBodong Wang 		err = ib_copy_to_udata(uhw, &resp, resp.response_length);
1200402ca536SBodong Wang 
1201402ca536SBodong Wang 		if (err)
1202402ca536SBodong Wang 			return err;
1203402ca536SBodong Wang 	}
1204402ca536SBodong Wang 
12051b5daf11SMajd Dibbiny 	return 0;
12061b5daf11SMajd Dibbiny }
1207e126ba97SEli Cohen 
/*
 * Link-width bit flags; translate_active_width() tests the operational
 * width against these, lowest bit first.
 */
enum mlx5_ib_width {
	MLX5_IB_WIDTH_1X	= 0x01,
	MLX5_IB_WIDTH_2X	= 0x02,
	MLX5_IB_WIDTH_4X	= 0x04,
	MLX5_IB_WIDTH_8X	= 0x08,
	MLX5_IB_WIDTH_12X	= 0x10,
};
12151b5daf11SMajd Dibbiny 
1216db7a691aSMichael Guralnik static void translate_active_width(struct ib_device *ibdev, u8 active_width,
12171b5daf11SMajd Dibbiny 				  u8 *ib_width)
12181b5daf11SMajd Dibbiny {
12191b5daf11SMajd Dibbiny 	struct mlx5_ib_dev *dev = to_mdev(ibdev);
12201b5daf11SMajd Dibbiny 
1221db7a691aSMichael Guralnik 	if (active_width & MLX5_IB_WIDTH_1X)
12221b5daf11SMajd Dibbiny 		*ib_width = IB_WIDTH_1X;
1223d764970bSMichael Guralnik 	else if (active_width & MLX5_IB_WIDTH_2X)
1224d764970bSMichael Guralnik 		*ib_width = IB_WIDTH_2X;
1225db7a691aSMichael Guralnik 	else if (active_width & MLX5_IB_WIDTH_4X)
12261b5daf11SMajd Dibbiny 		*ib_width = IB_WIDTH_4X;
1227db7a691aSMichael Guralnik 	else if (active_width & MLX5_IB_WIDTH_8X)
12281b5daf11SMajd Dibbiny 		*ib_width = IB_WIDTH_8X;
1229db7a691aSMichael Guralnik 	else if (active_width & MLX5_IB_WIDTH_12X)
12301b5daf11SMajd Dibbiny 		*ib_width = IB_WIDTH_12X;
1231db7a691aSMichael Guralnik 	else {
1232db7a691aSMichael Guralnik 		mlx5_ib_dbg(dev, "Invalid active_width %d, setting width to default value: 4x\n",
12331b5daf11SMajd Dibbiny 			    (int)active_width);
1234db7a691aSMichael Guralnik 		*ib_width = IB_WIDTH_4X;
12351b5daf11SMajd Dibbiny 	}
12361b5daf11SMajd Dibbiny 
1237db7a691aSMichael Guralnik 	return;
12381b5daf11SMajd Dibbiny }
12391b5daf11SMajd Dibbiny 
/*
 * Map an MTU given in bytes (256..4096, powers of two) to the small
 * integer code 1..5.  Any other value logs a warning and yields -1.
 */
static int mlx5_mtu_to_ib_mtu(int mtu)
{
	if (mtu == 256)
		return 1;
	if (mtu == 512)
		return 2;
	if (mtu == 1024)
		return 3;
	if (mtu == 2048)
		return 4;
	if (mtu == 4096)
		return 5;

	pr_warn("invalid mtu\n");
	return -1;
}
12531b5daf11SMajd Dibbiny 
/*
 * Codes that translate_max_vl_num() stores into
 * ib_port_attr.max_vl_num.
 */
enum ib_max_vl_num {
	__IB_MAX_VL_0    = 1,
	__IB_MAX_VL_0_1  = 2,
	__IB_MAX_VL_0_3  = 3,
	__IB_MAX_VL_0_7  = 4,
	__IB_MAX_VL_0_14 = 5,
};
12611b5daf11SMajd Dibbiny 
/*
 * VL capability values as passed to translate_max_vl_num().  Only the
 * 0, 0_1, 0_3, 0_7 and 0_14 entries have a translation there; the
 * remaining ones are rejected with -EINVAL.
 */
enum mlx5_vl_hw_cap {
	MLX5_VL_HW_0    = 1,
	MLX5_VL_HW_0_1  = 2,
	MLX5_VL_HW_0_2  = 3,
	MLX5_VL_HW_0_3  = 4,
	MLX5_VL_HW_0_4  = 5,
	MLX5_VL_HW_0_5  = 6,
	MLX5_VL_HW_0_6  = 7,
	MLX5_VL_HW_0_7  = 8,
	MLX5_VL_HW_0_14 = 15,
};
12731b5daf11SMajd Dibbiny 
12741b5daf11SMajd Dibbiny static int translate_max_vl_num(struct ib_device *ibdev, u8 vl_hw_cap,
12751b5daf11SMajd Dibbiny 				u8 *max_vl_num)
12761b5daf11SMajd Dibbiny {
12771b5daf11SMajd Dibbiny 	switch (vl_hw_cap) {
12781b5daf11SMajd Dibbiny 	case MLX5_VL_HW_0:
12791b5daf11SMajd Dibbiny 		*max_vl_num = __IB_MAX_VL_0;
12801b5daf11SMajd Dibbiny 		break;
12811b5daf11SMajd Dibbiny 	case MLX5_VL_HW_0_1:
12821b5daf11SMajd Dibbiny 		*max_vl_num = __IB_MAX_VL_0_1;
12831b5daf11SMajd Dibbiny 		break;
12841b5daf11SMajd Dibbiny 	case MLX5_VL_HW_0_3:
12851b5daf11SMajd Dibbiny 		*max_vl_num = __IB_MAX_VL_0_3;
12861b5daf11SMajd Dibbiny 		break;
12871b5daf11SMajd Dibbiny 	case MLX5_VL_HW_0_7:
12881b5daf11SMajd Dibbiny 		*max_vl_num = __IB_MAX_VL_0_7;
12891b5daf11SMajd Dibbiny 		break;
12901b5daf11SMajd Dibbiny 	case MLX5_VL_HW_0_14:
12911b5daf11SMajd Dibbiny 		*max_vl_num = __IB_MAX_VL_0_14;
12921b5daf11SMajd Dibbiny 		break;
12931b5daf11SMajd Dibbiny 
12941b5daf11SMajd Dibbiny 	default:
12951b5daf11SMajd Dibbiny 		return -EINVAL;
12961b5daf11SMajd Dibbiny 	}
12971b5daf11SMajd Dibbiny 
12981b5daf11SMajd Dibbiny 	return 0;
12991b5daf11SMajd Dibbiny }
13001b5daf11SMajd Dibbiny 
13011b5daf11SMajd Dibbiny static int mlx5_query_hca_port(struct ib_device *ibdev, u8 port,
13021b5daf11SMajd Dibbiny 			       struct ib_port_attr *props)
13031b5daf11SMajd Dibbiny {
13041b5daf11SMajd Dibbiny 	struct mlx5_ib_dev *dev = to_mdev(ibdev);
13051b5daf11SMajd Dibbiny 	struct mlx5_core_dev *mdev = dev->mdev;
13061b5daf11SMajd Dibbiny 	struct mlx5_hca_vport_context *rep;
1307046339eaSSaeed Mahameed 	u16 max_mtu;
1308046339eaSSaeed Mahameed 	u16 oper_mtu;
13091b5daf11SMajd Dibbiny 	int err;
13101b5daf11SMajd Dibbiny 	u8 ib_link_width_oper;
13111b5daf11SMajd Dibbiny 	u8 vl_hw_cap;
13121b5daf11SMajd Dibbiny 
13131b5daf11SMajd Dibbiny 	rep = kzalloc(sizeof(*rep), GFP_KERNEL);
13141b5daf11SMajd Dibbiny 	if (!rep) {
13151b5daf11SMajd Dibbiny 		err = -ENOMEM;
13161b5daf11SMajd Dibbiny 		goto out;
13171b5daf11SMajd Dibbiny 	}
13181b5daf11SMajd Dibbiny 
1319c4550c63SOr Gerlitz 	/* props being zeroed by the caller, avoid zeroing it here */
13201b5daf11SMajd Dibbiny 
13211b5daf11SMajd Dibbiny 	err = mlx5_query_hca_vport_context(mdev, 0, port, 0, rep);
13221b5daf11SMajd Dibbiny 	if (err)
13231b5daf11SMajd Dibbiny 		goto out;
13241b5daf11SMajd Dibbiny 
13251b5daf11SMajd Dibbiny 	props->lid		= rep->lid;
13261b5daf11SMajd Dibbiny 	props->lmc		= rep->lmc;
13271b5daf11SMajd Dibbiny 	props->sm_lid		= rep->sm_lid;
13281b5daf11SMajd Dibbiny 	props->sm_sl		= rep->sm_sl;
13291b5daf11SMajd Dibbiny 	props->state		= rep->vport_state;
13301b5daf11SMajd Dibbiny 	props->phys_state	= rep->port_physical_state;
13311b5daf11SMajd Dibbiny 	props->port_cap_flags	= rep->cap_mask1;
13321b5daf11SMajd Dibbiny 	props->gid_tbl_len	= mlx5_get_gid_table_len(MLX5_CAP_GEN(mdev, gid_table_size));
13331b5daf11SMajd Dibbiny 	props->max_msg_sz	= 1 << MLX5_CAP_GEN(mdev, log_max_msg);
13341b5daf11SMajd Dibbiny 	props->pkey_tbl_len	= mlx5_to_sw_pkey_sz(MLX5_CAP_GEN(mdev, pkey_table_size));
13351b5daf11SMajd Dibbiny 	props->bad_pkey_cntr	= rep->pkey_violation_counter;
13361b5daf11SMajd Dibbiny 	props->qkey_viol_cntr	= rep->qkey_violation_counter;
13371b5daf11SMajd Dibbiny 	props->subnet_timeout	= rep->subnet_timeout;
13381b5daf11SMajd Dibbiny 	props->init_type_reply	= rep->init_type_reply;
13391b5daf11SMajd Dibbiny 
13404106a758SMichael Guralnik 	if (props->port_cap_flags & IB_PORT_CAP_MASK2_SUP)
13414106a758SMichael Guralnik 		props->port_cap_flags2 = rep->cap_mask2;
13424106a758SMichael Guralnik 
13431b5daf11SMajd Dibbiny 	err = mlx5_query_port_link_width_oper(mdev, &ib_link_width_oper, port);
13441b5daf11SMajd Dibbiny 	if (err)
13451b5daf11SMajd Dibbiny 		goto out;
13461b5daf11SMajd Dibbiny 
1347db7a691aSMichael Guralnik 	translate_active_width(ibdev, ib_link_width_oper, &props->active_width);
1348db7a691aSMichael Guralnik 
1349d5beb7f2SNoa Osherovich 	err = mlx5_query_port_ib_proto_oper(mdev, &props->active_speed, port);
13501b5daf11SMajd Dibbiny 	if (err)
13511b5daf11SMajd Dibbiny 		goto out;
13521b5daf11SMajd Dibbiny 
1353facc9699SSaeed Mahameed 	mlx5_query_port_max_mtu(mdev, &max_mtu, port);
13541b5daf11SMajd Dibbiny 
13551b5daf11SMajd Dibbiny 	props->max_mtu = mlx5_mtu_to_ib_mtu(max_mtu);
13561b5daf11SMajd Dibbiny 
1357facc9699SSaeed Mahameed 	mlx5_query_port_oper_mtu(mdev, &oper_mtu, port);
13581b5daf11SMajd Dibbiny 
13591b5daf11SMajd Dibbiny 	props->active_mtu = mlx5_mtu_to_ib_mtu(oper_mtu);
13601b5daf11SMajd Dibbiny 
13611b5daf11SMajd Dibbiny 	err = mlx5_query_port_vl_hw_cap(mdev, &vl_hw_cap, port);
13621b5daf11SMajd Dibbiny 	if (err)
13631b5daf11SMajd Dibbiny 		goto out;
13641b5daf11SMajd Dibbiny 
13651b5daf11SMajd Dibbiny 	err = translate_max_vl_num(ibdev, vl_hw_cap,
13661b5daf11SMajd Dibbiny 				   &props->max_vl_num);
13671b5daf11SMajd Dibbiny out:
13681b5daf11SMajd Dibbiny 	kfree(rep);
1369e126ba97SEli Cohen 	return err;
1370e126ba97SEli Cohen }
1371e126ba97SEli Cohen 
1372e126ba97SEli Cohen int mlx5_ib_query_port(struct ib_device *ibdev, u8 port,
1373e126ba97SEli Cohen 		       struct ib_port_attr *props)
1374e126ba97SEli Cohen {
1375095b0927SIlan Tayari 	unsigned int count;
1376095b0927SIlan Tayari 	int ret;
1377095b0927SIlan Tayari 
13781b5daf11SMajd Dibbiny 	switch (mlx5_get_vport_access_method(ibdev)) {
13791b5daf11SMajd Dibbiny 	case MLX5_VPORT_ACCESS_METHOD_MAD:
1380095b0927SIlan Tayari 		ret = mlx5_query_mad_ifc_port(ibdev, port, props);
1381095b0927SIlan Tayari 		break;
1382e126ba97SEli Cohen 
13831b5daf11SMajd Dibbiny 	case MLX5_VPORT_ACCESS_METHOD_HCA:
1384095b0927SIlan Tayari 		ret = mlx5_query_hca_port(ibdev, port, props);
1385095b0927SIlan Tayari 		break;
13861b5daf11SMajd Dibbiny 
13873f89a643SAchiad Shochat 	case MLX5_VPORT_ACCESS_METHOD_NIC:
1388095b0927SIlan Tayari 		ret = mlx5_query_port_roce(ibdev, port, props);
1389095b0927SIlan Tayari 		break;
13903f89a643SAchiad Shochat 
13911b5daf11SMajd Dibbiny 	default:
1392095b0927SIlan Tayari 		ret = -EINVAL;
1393e126ba97SEli Cohen 	}
1394095b0927SIlan Tayari 
1395095b0927SIlan Tayari 	if (!ret && props) {
1396b3cbd6f0SDaniel Jurgens 		struct mlx5_ib_dev *dev = to_mdev(ibdev);
1397b3cbd6f0SDaniel Jurgens 		struct mlx5_core_dev *mdev;
1398b3cbd6f0SDaniel Jurgens 		bool put_mdev = true;
1399b3cbd6f0SDaniel Jurgens 
1400b3cbd6f0SDaniel Jurgens 		mdev = mlx5_ib_get_native_port_mdev(dev, port, NULL);
1401b3cbd6f0SDaniel Jurgens 		if (!mdev) {
1402b3cbd6f0SDaniel Jurgens 			/* If the port isn't affiliated yet query the master.
1403b3cbd6f0SDaniel Jurgens 			 * The master and slave will have the same values.
1404b3cbd6f0SDaniel Jurgens 			 */
1405b3cbd6f0SDaniel Jurgens 			mdev = dev->mdev;
1406b3cbd6f0SDaniel Jurgens 			port = 1;
1407b3cbd6f0SDaniel Jurgens 			put_mdev = false;
1408b3cbd6f0SDaniel Jurgens 		}
1409b3cbd6f0SDaniel Jurgens 		count = mlx5_core_reserved_gids_count(mdev);
1410b3cbd6f0SDaniel Jurgens 		if (put_mdev)
1411b3cbd6f0SDaniel Jurgens 			mlx5_ib_put_native_port_mdev(dev, port);
1412095b0927SIlan Tayari 		props->gid_tbl_len -= count;
1413095b0927SIlan Tayari 	}
1414095b0927SIlan Tayari 	return ret;
1415e126ba97SEli Cohen }
1416e126ba97SEli Cohen 
14178e6efa3aSMark Bloch static int mlx5_ib_rep_query_port(struct ib_device *ibdev, u8 port,
14188e6efa3aSMark Bloch 				  struct ib_port_attr *props)
14198e6efa3aSMark Bloch {
14208e6efa3aSMark Bloch 	int ret;
14218e6efa3aSMark Bloch 
142226628e2dSMark Bloch 	/* Only link layer == ethernet is valid for representors
142326628e2dSMark Bloch 	 * and we always use port 1
142426628e2dSMark Bloch 	 */
14258e6efa3aSMark Bloch 	ret = mlx5_query_port_roce(ibdev, port, props);
14268e6efa3aSMark Bloch 	if (ret || !props)
14278e6efa3aSMark Bloch 		return ret;
14288e6efa3aSMark Bloch 
14298e6efa3aSMark Bloch 	/* We don't support GIDS */
14308e6efa3aSMark Bloch 	props->gid_tbl_len = 0;
14318e6efa3aSMark Bloch 
14328e6efa3aSMark Bloch 	return ret;
14338e6efa3aSMark Bloch }
14348e6efa3aSMark Bloch 
1435e126ba97SEli Cohen static int mlx5_ib_query_gid(struct ib_device *ibdev, u8 port, int index,
1436e126ba97SEli Cohen 			     union ib_gid *gid)
1437e126ba97SEli Cohen {
14381b5daf11SMajd Dibbiny 	struct mlx5_ib_dev *dev = to_mdev(ibdev);
14391b5daf11SMajd Dibbiny 	struct mlx5_core_dev *mdev = dev->mdev;
1440e126ba97SEli Cohen 
14411b5daf11SMajd Dibbiny 	switch (mlx5_get_vport_access_method(ibdev)) {
14421b5daf11SMajd Dibbiny 	case MLX5_VPORT_ACCESS_METHOD_MAD:
14431b5daf11SMajd Dibbiny 		return mlx5_query_mad_ifc_gids(ibdev, port, index, gid);
1444e126ba97SEli Cohen 
14451b5daf11SMajd Dibbiny 	case MLX5_VPORT_ACCESS_METHOD_HCA:
14461b5daf11SMajd Dibbiny 		return mlx5_query_hca_vport_gid(mdev, 0, port, 0, index, gid);
1447e126ba97SEli Cohen 
14481b5daf11SMajd Dibbiny 	default:
14491b5daf11SMajd Dibbiny 		return -EINVAL;
14501b5daf11SMajd Dibbiny 	}
1451e126ba97SEli Cohen 
1452e126ba97SEli Cohen }
1453e126ba97SEli Cohen 
1454b3cbd6f0SDaniel Jurgens static int mlx5_query_hca_nic_pkey(struct ib_device *ibdev, u8 port,
1455b3cbd6f0SDaniel Jurgens 				   u16 index, u16 *pkey)
1456b3cbd6f0SDaniel Jurgens {
1457b3cbd6f0SDaniel Jurgens 	struct mlx5_ib_dev *dev = to_mdev(ibdev);
1458b3cbd6f0SDaniel Jurgens 	struct mlx5_core_dev *mdev;
1459b3cbd6f0SDaniel Jurgens 	bool put_mdev = true;
1460b3cbd6f0SDaniel Jurgens 	u8 mdev_port_num;
1461b3cbd6f0SDaniel Jurgens 	int err;
1462b3cbd6f0SDaniel Jurgens 
1463b3cbd6f0SDaniel Jurgens 	mdev = mlx5_ib_get_native_port_mdev(dev, port, &mdev_port_num);
1464b3cbd6f0SDaniel Jurgens 	if (!mdev) {
1465b3cbd6f0SDaniel Jurgens 		/* The port isn't affiliated yet, get the PKey from the master
1466b3cbd6f0SDaniel Jurgens 		 * port. For RoCE the PKey tables will be the same.
1467b3cbd6f0SDaniel Jurgens 		 */
1468b3cbd6f0SDaniel Jurgens 		put_mdev = false;
1469b3cbd6f0SDaniel Jurgens 		mdev = dev->mdev;
1470b3cbd6f0SDaniel Jurgens 		mdev_port_num = 1;
1471b3cbd6f0SDaniel Jurgens 	}
1472b3cbd6f0SDaniel Jurgens 
1473b3cbd6f0SDaniel Jurgens 	err = mlx5_query_hca_vport_pkey(mdev, 0, mdev_port_num, 0,
1474b3cbd6f0SDaniel Jurgens 					index, pkey);
1475b3cbd6f0SDaniel Jurgens 	if (put_mdev)
1476b3cbd6f0SDaniel Jurgens 		mlx5_ib_put_native_port_mdev(dev, port);
1477b3cbd6f0SDaniel Jurgens 
1478b3cbd6f0SDaniel Jurgens 	return err;
1479b3cbd6f0SDaniel Jurgens }
1480b3cbd6f0SDaniel Jurgens 
1481e126ba97SEli Cohen static int mlx5_ib_query_pkey(struct ib_device *ibdev, u8 port, u16 index,
1482e126ba97SEli Cohen 			      u16 *pkey)
1483e126ba97SEli Cohen {
14841b5daf11SMajd Dibbiny 	switch (mlx5_get_vport_access_method(ibdev)) {
14851b5daf11SMajd Dibbiny 	case MLX5_VPORT_ACCESS_METHOD_MAD:
14861b5daf11SMajd Dibbiny 		return mlx5_query_mad_ifc_pkey(ibdev, port, index, pkey);
1487e126ba97SEli Cohen 
14881b5daf11SMajd Dibbiny 	case MLX5_VPORT_ACCESS_METHOD_HCA:
14891b5daf11SMajd Dibbiny 	case MLX5_VPORT_ACCESS_METHOD_NIC:
1490b3cbd6f0SDaniel Jurgens 		return mlx5_query_hca_nic_pkey(ibdev, port, index, pkey);
14911b5daf11SMajd Dibbiny 	default:
14921b5daf11SMajd Dibbiny 		return -EINVAL;
1493e126ba97SEli Cohen 	}
14941b5daf11SMajd Dibbiny }
1495e126ba97SEli Cohen 
1496e126ba97SEli Cohen static int mlx5_ib_modify_device(struct ib_device *ibdev, int mask,
1497e126ba97SEli Cohen 				 struct ib_device_modify *props)
1498e126ba97SEli Cohen {
1499e126ba97SEli Cohen 	struct mlx5_ib_dev *dev = to_mdev(ibdev);
1500e126ba97SEli Cohen 	struct mlx5_reg_node_desc in;
1501e126ba97SEli Cohen 	struct mlx5_reg_node_desc out;
1502e126ba97SEli Cohen 	int err;
1503e126ba97SEli Cohen 
1504e126ba97SEli Cohen 	if (mask & ~IB_DEVICE_MODIFY_NODE_DESC)
1505e126ba97SEli Cohen 		return -EOPNOTSUPP;
1506e126ba97SEli Cohen 
1507e126ba97SEli Cohen 	if (!(mask & IB_DEVICE_MODIFY_NODE_DESC))
1508e126ba97SEli Cohen 		return 0;
1509e126ba97SEli Cohen 
1510e126ba97SEli Cohen 	/*
1511e126ba97SEli Cohen 	 * If possible, pass node desc to FW, so it can generate
1512e126ba97SEli Cohen 	 * a 144 trap.  If cmd fails, just ignore.
1513e126ba97SEli Cohen 	 */
1514bd99fdeaSYuval Shaia 	memcpy(&in, props->node_desc, IB_DEVICE_NODE_DESC_MAX);
15159603b61dSJack Morgenstein 	err = mlx5_core_access_reg(dev->mdev, &in, sizeof(in), &out,
1516e126ba97SEli Cohen 				   sizeof(out), MLX5_REG_NODE_DESC, 0, 1);
1517e126ba97SEli Cohen 	if (err)
1518e126ba97SEli Cohen 		return err;
1519e126ba97SEli Cohen 
1520bd99fdeaSYuval Shaia 	memcpy(ibdev->node_desc, props->node_desc, IB_DEVICE_NODE_DESC_MAX);
1521e126ba97SEli Cohen 
1522e126ba97SEli Cohen 	return err;
1523e126ba97SEli Cohen }
1524e126ba97SEli Cohen 
1525cdbe33d0SEli Cohen static int set_port_caps_atomic(struct mlx5_ib_dev *dev, u8 port_num, u32 mask,
1526cdbe33d0SEli Cohen 				u32 value)
1527cdbe33d0SEli Cohen {
1528cdbe33d0SEli Cohen 	struct mlx5_hca_vport_context ctx = {};
1529b3cbd6f0SDaniel Jurgens 	struct mlx5_core_dev *mdev;
1530b3cbd6f0SDaniel Jurgens 	u8 mdev_port_num;
1531cdbe33d0SEli Cohen 	int err;
1532cdbe33d0SEli Cohen 
1533b3cbd6f0SDaniel Jurgens 	mdev = mlx5_ib_get_native_port_mdev(dev, port_num, &mdev_port_num);
1534b3cbd6f0SDaniel Jurgens 	if (!mdev)
1535b3cbd6f0SDaniel Jurgens 		return -ENODEV;
1536b3cbd6f0SDaniel Jurgens 
1537b3cbd6f0SDaniel Jurgens 	err = mlx5_query_hca_vport_context(mdev, 0, mdev_port_num, 0, &ctx);
1538cdbe33d0SEli Cohen 	if (err)
1539b3cbd6f0SDaniel Jurgens 		goto out;
1540cdbe33d0SEli Cohen 
1541cdbe33d0SEli Cohen 	if (~ctx.cap_mask1_perm & mask) {
1542cdbe33d0SEli Cohen 		mlx5_ib_warn(dev, "trying to change bitmask 0x%X but change supported 0x%X\n",
1543cdbe33d0SEli Cohen 			     mask, ctx.cap_mask1_perm);
1544b3cbd6f0SDaniel Jurgens 		err = -EINVAL;
1545b3cbd6f0SDaniel Jurgens 		goto out;
1546cdbe33d0SEli Cohen 	}
1547cdbe33d0SEli Cohen 
1548cdbe33d0SEli Cohen 	ctx.cap_mask1 = value;
1549cdbe33d0SEli Cohen 	ctx.cap_mask1_perm = mask;
1550b3cbd6f0SDaniel Jurgens 	err = mlx5_core_modify_hca_vport_context(mdev, 0, mdev_port_num,
1551b3cbd6f0SDaniel Jurgens 						 0, &ctx);
1552b3cbd6f0SDaniel Jurgens 
1553b3cbd6f0SDaniel Jurgens out:
1554b3cbd6f0SDaniel Jurgens 	mlx5_ib_put_native_port_mdev(dev, port_num);
1555cdbe33d0SEli Cohen 
1556cdbe33d0SEli Cohen 	return err;
1557cdbe33d0SEli Cohen }
1558cdbe33d0SEli Cohen 
1559e126ba97SEli Cohen static int mlx5_ib_modify_port(struct ib_device *ibdev, u8 port, int mask,
1560e126ba97SEli Cohen 			       struct ib_port_modify *props)
1561e126ba97SEli Cohen {
1562e126ba97SEli Cohen 	struct mlx5_ib_dev *dev = to_mdev(ibdev);
1563e126ba97SEli Cohen 	struct ib_port_attr attr;
1564e126ba97SEli Cohen 	u32 tmp;
1565e126ba97SEli Cohen 	int err;
1566cdbe33d0SEli Cohen 	u32 change_mask;
1567cdbe33d0SEli Cohen 	u32 value;
1568cdbe33d0SEli Cohen 	bool is_ib = (mlx5_ib_port_link_layer(ibdev, port) ==
1569cdbe33d0SEli Cohen 		      IB_LINK_LAYER_INFINIBAND);
1570cdbe33d0SEli Cohen 
1571ec255879SMajd Dibbiny 	/* CM layer calls ib_modify_port() regardless of the link layer. For
1572ec255879SMajd Dibbiny 	 * Ethernet ports, qkey violation and Port capabilities are meaningless.
1573ec255879SMajd Dibbiny 	 */
1574ec255879SMajd Dibbiny 	if (!is_ib)
1575ec255879SMajd Dibbiny 		return 0;
1576ec255879SMajd Dibbiny 
1577cdbe33d0SEli Cohen 	if (MLX5_CAP_GEN(dev->mdev, ib_virt) && is_ib) {
1578cdbe33d0SEli Cohen 		change_mask = props->clr_port_cap_mask | props->set_port_cap_mask;
1579cdbe33d0SEli Cohen 		value = ~props->clr_port_cap_mask | props->set_port_cap_mask;
1580cdbe33d0SEli Cohen 		return set_port_caps_atomic(dev, port, change_mask, value);
1581cdbe33d0SEli Cohen 	}
1582e126ba97SEli Cohen 
1583e126ba97SEli Cohen 	mutex_lock(&dev->cap_mask_mutex);
1584e126ba97SEli Cohen 
1585c4550c63SOr Gerlitz 	err = ib_query_port(ibdev, port, &attr);
1586e126ba97SEli Cohen 	if (err)
1587e126ba97SEli Cohen 		goto out;
1588e126ba97SEli Cohen 
1589e126ba97SEli Cohen 	tmp = (attr.port_cap_flags | props->set_port_cap_mask) &
1590e126ba97SEli Cohen 		~props->clr_port_cap_mask;
1591e126ba97SEli Cohen 
15929603b61dSJack Morgenstein 	err = mlx5_set_port_caps(dev->mdev, port, tmp);
1593e126ba97SEli Cohen 
1594e126ba97SEli Cohen out:
1595e126ba97SEli Cohen 	mutex_unlock(&dev->cap_mask_mutex);
1596e126ba97SEli Cohen 	return err;
1597e126ba97SEli Cohen }
1598e126ba97SEli Cohen 
159930aa60b3SEli Cohen static void print_lib_caps(struct mlx5_ib_dev *dev, u64 caps)
160030aa60b3SEli Cohen {
160130aa60b3SEli Cohen 	mlx5_ib_dbg(dev, "MLX5_LIB_CAP_4K_UAR = %s\n",
160230aa60b3SEli Cohen 		    caps & MLX5_LIB_CAP_4K_UAR ? "y" : "n");
160330aa60b3SEli Cohen }
160430aa60b3SEli Cohen 
160531a78a5aSYishai Hadas static u16 calc_dynamic_bfregs(int uars_per_sys_page)
160631a78a5aSYishai Hadas {
160731a78a5aSYishai Hadas 	/* Large page with non 4k uar support might limit the dynamic size */
160831a78a5aSYishai Hadas 	if (uars_per_sys_page == 1  && PAGE_SIZE > 4096)
160931a78a5aSYishai Hadas 		return MLX5_MIN_DYN_BFREGS;
161031a78a5aSYishai Hadas 
161131a78a5aSYishai Hadas 	return MLX5_MAX_DYN_BFREGS;
161231a78a5aSYishai Hadas }
161331a78a5aSYishai Hadas 
1614b037c29aSEli Cohen static int calc_total_bfregs(struct mlx5_ib_dev *dev, bool lib_uar_4k,
1615b037c29aSEli Cohen 			     struct mlx5_ib_alloc_ucontext_req_v2 *req,
161631a78a5aSYishai Hadas 			     struct mlx5_bfreg_info *bfregi)
1617b037c29aSEli Cohen {
1618b037c29aSEli Cohen 	int uars_per_sys_page;
1619b037c29aSEli Cohen 	int bfregs_per_sys_page;
1620b037c29aSEli Cohen 	int ref_bfregs = req->total_num_bfregs;
1621b037c29aSEli Cohen 
1622b037c29aSEli Cohen 	if (req->total_num_bfregs == 0)
1623b037c29aSEli Cohen 		return -EINVAL;
1624b037c29aSEli Cohen 
1625b037c29aSEli Cohen 	BUILD_BUG_ON(MLX5_MAX_BFREGS % MLX5_NON_FP_BFREGS_IN_PAGE);
1626b037c29aSEli Cohen 	BUILD_BUG_ON(MLX5_MAX_BFREGS < MLX5_NON_FP_BFREGS_IN_PAGE);
1627b037c29aSEli Cohen 
1628b037c29aSEli Cohen 	if (req->total_num_bfregs > MLX5_MAX_BFREGS)
1629b037c29aSEli Cohen 		return -ENOMEM;
1630b037c29aSEli Cohen 
1631b037c29aSEli Cohen 	uars_per_sys_page = get_uars_per_sys_page(dev, lib_uar_4k);
1632b037c29aSEli Cohen 	bfregs_per_sys_page = uars_per_sys_page * MLX5_NON_FP_BFREGS_PER_UAR;
163331a78a5aSYishai Hadas 	/* This holds the required static allocation asked by the user */
1634b037c29aSEli Cohen 	req->total_num_bfregs = ALIGN(req->total_num_bfregs, bfregs_per_sys_page);
1635b037c29aSEli Cohen 	if (req->num_low_latency_bfregs > req->total_num_bfregs - 1)
1636b037c29aSEli Cohen 		return -EINVAL;
1637b037c29aSEli Cohen 
163831a78a5aSYishai Hadas 	bfregi->num_static_sys_pages = req->total_num_bfregs / bfregs_per_sys_page;
163931a78a5aSYishai Hadas 	bfregi->num_dyn_bfregs = ALIGN(calc_dynamic_bfregs(uars_per_sys_page), bfregs_per_sys_page);
164031a78a5aSYishai Hadas 	bfregi->total_num_bfregs = req->total_num_bfregs + bfregi->num_dyn_bfregs;
164131a78a5aSYishai Hadas 	bfregi->num_sys_pages = bfregi->total_num_bfregs / bfregs_per_sys_page;
164231a78a5aSYishai Hadas 
164331a78a5aSYishai Hadas 	mlx5_ib_dbg(dev, "uar_4k: fw support %s, lib support %s, user requested %d bfregs, allocated %d, total bfregs %d, using %d sys pages\n",
1644b037c29aSEli Cohen 		    MLX5_CAP_GEN(dev->mdev, uar_4k) ? "yes" : "no",
1645b037c29aSEli Cohen 		    lib_uar_4k ? "yes" : "no", ref_bfregs,
164631a78a5aSYishai Hadas 		    req->total_num_bfregs, bfregi->total_num_bfregs,
164731a78a5aSYishai Hadas 		    bfregi->num_sys_pages);
1648b037c29aSEli Cohen 
1649b037c29aSEli Cohen 	return 0;
1650b037c29aSEli Cohen }
1651b037c29aSEli Cohen 
1652b037c29aSEli Cohen static int allocate_uars(struct mlx5_ib_dev *dev, struct mlx5_ib_ucontext *context)
1653b037c29aSEli Cohen {
1654b037c29aSEli Cohen 	struct mlx5_bfreg_info *bfregi;
1655b037c29aSEli Cohen 	int err;
1656b037c29aSEli Cohen 	int i;
1657b037c29aSEli Cohen 
1658b037c29aSEli Cohen 	bfregi = &context->bfregi;
165931a78a5aSYishai Hadas 	for (i = 0; i < bfregi->num_static_sys_pages; i++) {
1660b037c29aSEli Cohen 		err = mlx5_cmd_alloc_uar(dev->mdev, &bfregi->sys_pages[i]);
1661b037c29aSEli Cohen 		if (err)
1662b037c29aSEli Cohen 			goto error;
1663b037c29aSEli Cohen 
1664b037c29aSEli Cohen 		mlx5_ib_dbg(dev, "allocated uar %d\n", bfregi->sys_pages[i]);
1665b037c29aSEli Cohen 	}
16664ed131d0SYishai Hadas 
16674ed131d0SYishai Hadas 	for (i = bfregi->num_static_sys_pages; i < bfregi->num_sys_pages; i++)
16684ed131d0SYishai Hadas 		bfregi->sys_pages[i] = MLX5_IB_INVALID_UAR_INDEX;
16694ed131d0SYishai Hadas 
1670b037c29aSEli Cohen 	return 0;
1671b037c29aSEli Cohen 
1672b037c29aSEli Cohen error:
1673b037c29aSEli Cohen 	for (--i; i >= 0; i--)
1674b037c29aSEli Cohen 		if (mlx5_cmd_free_uar(dev->mdev, bfregi->sys_pages[i]))
1675b037c29aSEli Cohen 			mlx5_ib_warn(dev, "failed to free uar %d\n", i);
1676b037c29aSEli Cohen 
1677b037c29aSEli Cohen 	return err;
1678b037c29aSEli Cohen }
1679b037c29aSEli Cohen 
168015177999SLeon Romanovsky static void deallocate_uars(struct mlx5_ib_dev *dev,
168115177999SLeon Romanovsky 			    struct mlx5_ib_ucontext *context)
1682b037c29aSEli Cohen {
1683b037c29aSEli Cohen 	struct mlx5_bfreg_info *bfregi;
1684b037c29aSEli Cohen 	int i;
1685b037c29aSEli Cohen 
1686b037c29aSEli Cohen 	bfregi = &context->bfregi;
168715177999SLeon Romanovsky 	for (i = 0; i < bfregi->num_sys_pages; i++)
16884ed131d0SYishai Hadas 		if (i < bfregi->num_static_sys_pages ||
168915177999SLeon Romanovsky 		    bfregi->sys_pages[i] != MLX5_IB_INVALID_UAR_INDEX)
169015177999SLeon Romanovsky 			mlx5_cmd_free_uar(dev->mdev, bfregi->sys_pages[i]);
1691b037c29aSEli Cohen }
1692b037c29aSEli Cohen 
16930042f9e4SMark Bloch int mlx5_ib_enable_lb(struct mlx5_ib_dev *dev, bool td, bool qp)
1694a560f1d9SMark Bloch {
1695a560f1d9SMark Bloch 	int err = 0;
1696a560f1d9SMark Bloch 
1697a560f1d9SMark Bloch 	mutex_lock(&dev->lb.mutex);
16980042f9e4SMark Bloch 	if (td)
1699a560f1d9SMark Bloch 		dev->lb.user_td++;
17000042f9e4SMark Bloch 	if (qp)
17010042f9e4SMark Bloch 		dev->lb.qps++;
1702a560f1d9SMark Bloch 
17030042f9e4SMark Bloch 	if (dev->lb.user_td == 2 ||
17040042f9e4SMark Bloch 	    dev->lb.qps == 1) {
17050042f9e4SMark Bloch 		if (!dev->lb.enabled) {
1706a560f1d9SMark Bloch 			err = mlx5_nic_vport_update_local_lb(dev->mdev, true);
17070042f9e4SMark Bloch 			dev->lb.enabled = true;
17080042f9e4SMark Bloch 		}
17090042f9e4SMark Bloch 	}
1710a560f1d9SMark Bloch 
1711a560f1d9SMark Bloch 	mutex_unlock(&dev->lb.mutex);
1712a560f1d9SMark Bloch 
1713a560f1d9SMark Bloch 	return err;
1714a560f1d9SMark Bloch }
1715a560f1d9SMark Bloch 
17160042f9e4SMark Bloch void mlx5_ib_disable_lb(struct mlx5_ib_dev *dev, bool td, bool qp)
1717a560f1d9SMark Bloch {
1718a560f1d9SMark Bloch 	mutex_lock(&dev->lb.mutex);
17190042f9e4SMark Bloch 	if (td)
1720a560f1d9SMark Bloch 		dev->lb.user_td--;
17210042f9e4SMark Bloch 	if (qp)
17220042f9e4SMark Bloch 		dev->lb.qps--;
1723a560f1d9SMark Bloch 
17240042f9e4SMark Bloch 	if (dev->lb.user_td == 1 &&
17250042f9e4SMark Bloch 	    dev->lb.qps == 0) {
17260042f9e4SMark Bloch 		if (dev->lb.enabled) {
1727a560f1d9SMark Bloch 			mlx5_nic_vport_update_local_lb(dev->mdev, false);
17280042f9e4SMark Bloch 			dev->lb.enabled = false;
17290042f9e4SMark Bloch 		}
17300042f9e4SMark Bloch 	}
1731a560f1d9SMark Bloch 
1732a560f1d9SMark Bloch 	mutex_unlock(&dev->lb.mutex);
1733a560f1d9SMark Bloch }
1734a560f1d9SMark Bloch 
1735d2d19121SYishai Hadas static int mlx5_ib_alloc_transport_domain(struct mlx5_ib_dev *dev, u32 *tdn,
1736d2d19121SYishai Hadas 					  u16 uid)
1737c85023e1SHuy Nguyen {
1738c85023e1SHuy Nguyen 	int err;
1739c85023e1SHuy Nguyen 
1740cfdeb893SLeon Romanovsky 	if (!MLX5_CAP_GEN(dev->mdev, log_max_transport_domain))
1741cfdeb893SLeon Romanovsky 		return 0;
1742cfdeb893SLeon Romanovsky 
1743d2d19121SYishai Hadas 	err = mlx5_cmd_alloc_transport_domain(dev->mdev, tdn, uid);
1744c85023e1SHuy Nguyen 	if (err)
1745c85023e1SHuy Nguyen 		return err;
1746c85023e1SHuy Nguyen 
1747c85023e1SHuy Nguyen 	if ((MLX5_CAP_GEN(dev->mdev, port_type) != MLX5_CAP_PORT_TYPE_ETH) ||
17488978cc92SEran Ben Elisha 	    (!MLX5_CAP_GEN(dev->mdev, disable_local_lb_uc) &&
17498978cc92SEran Ben Elisha 	     !MLX5_CAP_GEN(dev->mdev, disable_local_lb_mc)))
1750c85023e1SHuy Nguyen 		return err;
1751c85023e1SHuy Nguyen 
17520042f9e4SMark Bloch 	return mlx5_ib_enable_lb(dev, true, false);
1753c85023e1SHuy Nguyen }
1754c85023e1SHuy Nguyen 
1755d2d19121SYishai Hadas static void mlx5_ib_dealloc_transport_domain(struct mlx5_ib_dev *dev, u32 tdn,
1756d2d19121SYishai Hadas 					     u16 uid)
1757c85023e1SHuy Nguyen {
1758cfdeb893SLeon Romanovsky 	if (!MLX5_CAP_GEN(dev->mdev, log_max_transport_domain))
1759cfdeb893SLeon Romanovsky 		return;
1760cfdeb893SLeon Romanovsky 
1761d2d19121SYishai Hadas 	mlx5_cmd_dealloc_transport_domain(dev->mdev, tdn, uid);
1762c85023e1SHuy Nguyen 
1763c85023e1SHuy Nguyen 	if ((MLX5_CAP_GEN(dev->mdev, port_type) != MLX5_CAP_PORT_TYPE_ETH) ||
17648978cc92SEran Ben Elisha 	    (!MLX5_CAP_GEN(dev->mdev, disable_local_lb_uc) &&
17658978cc92SEran Ben Elisha 	     !MLX5_CAP_GEN(dev->mdev, disable_local_lb_mc)))
1766c85023e1SHuy Nguyen 		return;
1767c85023e1SHuy Nguyen 
17680042f9e4SMark Bloch 	mlx5_ib_disable_lb(dev, true, false);
1769c85023e1SHuy Nguyen }
1770c85023e1SHuy Nguyen 
1771a2a074efSLeon Romanovsky static int mlx5_ib_alloc_ucontext(struct ib_ucontext *uctx,
1772e126ba97SEli Cohen 				  struct ib_udata *udata)
1773e126ba97SEli Cohen {
1774a2a074efSLeon Romanovsky 	struct ib_device *ibdev = uctx->device;
1775e126ba97SEli Cohen 	struct mlx5_ib_dev *dev = to_mdev(ibdev);
1776b368d7cbSMatan Barak 	struct mlx5_ib_alloc_ucontext_req_v2 req = {};
1777b368d7cbSMatan Barak 	struct mlx5_ib_alloc_ucontext_resp resp = {};
17785c99eaecSFeras Daoud 	struct mlx5_core_dev *mdev = dev->mdev;
1779a2a074efSLeon Romanovsky 	struct mlx5_ib_ucontext *context = to_mucontext(uctx);
17802f5ff264SEli Cohen 	struct mlx5_bfreg_info *bfregi;
178178c0f98cSEli Cohen 	int ver;
1782e126ba97SEli Cohen 	int err;
1783a168a41cSMajd Dibbiny 	size_t min_req_v2 = offsetof(struct mlx5_ib_alloc_ucontext_req_v2,
1784a168a41cSMajd Dibbiny 				     max_cqe_version);
178525bb36e7SYonatan Cohen 	u32 dump_fill_mkey;
1786b037c29aSEli Cohen 	bool lib_uar_4k;
1787e126ba97SEli Cohen 
1788e126ba97SEli Cohen 	if (!dev->ib_active)
1789a2a074efSLeon Romanovsky 		return -EAGAIN;
1790e126ba97SEli Cohen 
1791e093111dSAmrani, Ram 	if (udata->inlen == sizeof(struct mlx5_ib_alloc_ucontext_req))
179278c0f98cSEli Cohen 		ver = 0;
1793e093111dSAmrani, Ram 	else if (udata->inlen >= min_req_v2)
179478c0f98cSEli Cohen 		ver = 2;
179578c0f98cSEli Cohen 	else
1796a2a074efSLeon Romanovsky 		return -EINVAL;
179778c0f98cSEli Cohen 
1798e093111dSAmrani, Ram 	err = ib_copy_from_udata(&req, udata, min(udata->inlen, sizeof(req)));
1799e126ba97SEli Cohen 	if (err)
1800a2a074efSLeon Romanovsky 		return err;
1801e126ba97SEli Cohen 
1802a8b92ca1SYishai Hadas 	if (req.flags & ~MLX5_IB_ALLOC_UCTX_DEVX)
1803a2a074efSLeon Romanovsky 		return -EOPNOTSUPP;
180478c0f98cSEli Cohen 
1805f72300c5SHaggai Abramovsky 	if (req.comp_mask || req.reserved0 || req.reserved1 || req.reserved2)
1806a2a074efSLeon Romanovsky 		return -EOPNOTSUPP;
1807b368d7cbSMatan Barak 
18082f5ff264SEli Cohen 	req.total_num_bfregs = ALIGN(req.total_num_bfregs,
18092f5ff264SEli Cohen 				    MLX5_NON_FP_BFREGS_PER_UAR);
18102f5ff264SEli Cohen 	if (req.num_low_latency_bfregs > req.total_num_bfregs - 1)
1811a2a074efSLeon Romanovsky 		return -EINVAL;
1812e126ba97SEli Cohen 
1813938fe83cSSaeed Mahameed 	resp.qp_tab_size = 1 << MLX5_CAP_GEN(dev->mdev, log_max_qp);
18142cc6ad5fSNoa Osherovich 	if (mlx5_core_is_pf(dev->mdev) && MLX5_CAP_GEN(dev->mdev, bf))
1815938fe83cSSaeed Mahameed 		resp.bf_reg_size = 1 << MLX5_CAP_GEN(dev->mdev, log_bf_reg_size);
1816b47bd6eaSDaniel Jurgens 	resp.cache_line_size = cache_line_size();
1817938fe83cSSaeed Mahameed 	resp.max_sq_desc_sz = MLX5_CAP_GEN(dev->mdev, max_wqe_sz_sq);
1818938fe83cSSaeed Mahameed 	resp.max_rq_desc_sz = MLX5_CAP_GEN(dev->mdev, max_wqe_sz_rq);
1819938fe83cSSaeed Mahameed 	resp.max_send_wqebb = 1 << MLX5_CAP_GEN(dev->mdev, log_max_qp_sz);
1820938fe83cSSaeed Mahameed 	resp.max_recv_wr = 1 << MLX5_CAP_GEN(dev->mdev, log_max_qp_sz);
1821938fe83cSSaeed Mahameed 	resp.max_srq_recv_wr = 1 << MLX5_CAP_GEN(dev->mdev, log_max_srq_sz);
1822f72300c5SHaggai Abramovsky 	resp.cqe_version = min_t(__u8,
1823f72300c5SHaggai Abramovsky 				 (__u8)MLX5_CAP_GEN(dev->mdev, cqe_version),
1824f72300c5SHaggai Abramovsky 				 req.max_cqe_version);
182530aa60b3SEli Cohen 	resp.log_uar_size = MLX5_CAP_GEN(dev->mdev, uar_4k) ?
182630aa60b3SEli Cohen 				MLX5_ADAPTER_PAGE_SHIFT : PAGE_SHIFT;
182730aa60b3SEli Cohen 	resp.num_uars_per_page = MLX5_CAP_GEN(dev->mdev, uar_4k) ?
182830aa60b3SEli Cohen 					MLX5_CAP_GEN(dev->mdev, num_of_uars_per_page) : 1;
1829b368d7cbSMatan Barak 	resp.response_length = min(offsetof(typeof(resp), response_length) +
1830b368d7cbSMatan Barak 				   sizeof(resp.response_length), udata->outlen);
1831e126ba97SEli Cohen 
1832c03faa56SMatan Barak 	if (mlx5_accel_ipsec_device_caps(dev->mdev) & MLX5_ACCEL_IPSEC_CAP_DEVICE) {
1833c03faa56SMatan Barak 		if (mlx5_get_flow_namespace(dev->mdev, MLX5_FLOW_NAMESPACE_EGRESS))
1834c03faa56SMatan Barak 			resp.flow_action_flags |= MLX5_USER_ALLOC_UCONTEXT_FLOW_ACTION_FLAGS_ESP_AES_GCM;
1835c03faa56SMatan Barak 		if (mlx5_accel_ipsec_device_caps(dev->mdev) & MLX5_ACCEL_IPSEC_CAP_REQUIRED_METADATA)
1836c03faa56SMatan Barak 			resp.flow_action_flags |= MLX5_USER_ALLOC_UCONTEXT_FLOW_ACTION_FLAGS_ESP_AES_GCM_REQ_METADATA;
1837c03faa56SMatan Barak 		if (MLX5_CAP_FLOWTABLE(dev->mdev, flow_table_properties_nic_receive.ft_field_support.outer_esp_spi))
1838c03faa56SMatan Barak 			resp.flow_action_flags |= MLX5_USER_ALLOC_UCONTEXT_FLOW_ACTION_FLAGS_ESP_AES_GCM_SPI_STEERING;
1839c03faa56SMatan Barak 		if (mlx5_accel_ipsec_device_caps(dev->mdev) & MLX5_ACCEL_IPSEC_CAP_TX_IV_IS_ESN)
1840c03faa56SMatan Barak 			resp.flow_action_flags |= MLX5_USER_ALLOC_UCONTEXT_FLOW_ACTION_FLAGS_ESP_AES_GCM_TX_IV_IS_ESN;
1841c03faa56SMatan Barak 		/* MLX5_USER_ALLOC_UCONTEXT_FLOW_ACTION_FLAGS_ESP_AES_GCM_FULL_OFFLOAD is currently always 0 */
1842c03faa56SMatan Barak 	}
1843c03faa56SMatan Barak 
184430aa60b3SEli Cohen 	lib_uar_4k = req.lib_caps & MLX5_LIB_CAP_4K_UAR;
18452f5ff264SEli Cohen 	bfregi = &context->bfregi;
1846b037c29aSEli Cohen 
1847b037c29aSEli Cohen 	/* updates req->total_num_bfregs */
184831a78a5aSYishai Hadas 	err = calc_total_bfregs(dev, lib_uar_4k, &req, bfregi);
1849b037c29aSEli Cohen 	if (err)
1850b037c29aSEli Cohen 		goto out_ctx;
1851b037c29aSEli Cohen 
18522f5ff264SEli Cohen 	mutex_init(&bfregi->lock);
1853b037c29aSEli Cohen 	bfregi->lib_uar_4k = lib_uar_4k;
185431a78a5aSYishai Hadas 	bfregi->count = kcalloc(bfregi->total_num_bfregs, sizeof(*bfregi->count),
1855b037c29aSEli Cohen 				GFP_KERNEL);
1856b037c29aSEli Cohen 	if (!bfregi->count) {
1857e126ba97SEli Cohen 		err = -ENOMEM;
1858e126ba97SEli Cohen 		goto out_ctx;
1859e126ba97SEli Cohen 	}
1860e126ba97SEli Cohen 
1861b037c29aSEli Cohen 	bfregi->sys_pages = kcalloc(bfregi->num_sys_pages,
1862b037c29aSEli Cohen 				    sizeof(*bfregi->sys_pages),
1863e126ba97SEli Cohen 				    GFP_KERNEL);
1864b037c29aSEli Cohen 	if (!bfregi->sys_pages) {
1865e126ba97SEli Cohen 		err = -ENOMEM;
1866e126ba97SEli Cohen 		goto out_count;
1867e126ba97SEli Cohen 	}
1868e126ba97SEli Cohen 
1869b037c29aSEli Cohen 	err = allocate_uars(dev, context);
1870b037c29aSEli Cohen 	if (err)
1871b037c29aSEli Cohen 		goto out_sys_pages;
1872b037c29aSEli Cohen 
1873a8b92ca1SYishai Hadas 	if (req.flags & MLX5_IB_ALLOC_UCTX_DEVX) {
1874fb98153bSYishai Hadas 		err = mlx5_ib_devx_create(dev, true);
187576dc5a84SYishai Hadas 		if (err < 0)
1876d2d19121SYishai Hadas 			goto out_uars;
187776dc5a84SYishai Hadas 		context->devx_uid = err;
1878a8b92ca1SYishai Hadas 	}
1879a8b92ca1SYishai Hadas 
1880d2d19121SYishai Hadas 	err = mlx5_ib_alloc_transport_domain(dev, &context->tdn,
1881d2d19121SYishai Hadas 					     context->devx_uid);
1882a8b92ca1SYishai Hadas 	if (err)
1883d2d19121SYishai Hadas 		goto out_devx;
1884a8b92ca1SYishai Hadas 
188525bb36e7SYonatan Cohen 	if (MLX5_CAP_GEN(dev->mdev, dump_fill_mkey)) {
188625bb36e7SYonatan Cohen 		err = mlx5_cmd_dump_fill_mkey(dev->mdev, &dump_fill_mkey);
188725bb36e7SYonatan Cohen 		if (err)
18888193abb6SJason Gunthorpe 			goto out_mdev;
188925bb36e7SYonatan Cohen 	}
189025bb36e7SYonatan Cohen 
1891e126ba97SEli Cohen 	INIT_LIST_HEAD(&context->db_page_list);
1892e126ba97SEli Cohen 	mutex_init(&context->db_page_mutex);
1893e126ba97SEli Cohen 
18942f5ff264SEli Cohen 	resp.tot_bfregs = req.total_num_bfregs;
1895508562d6SDaniel Jurgens 	resp.num_ports = dev->num_ports;
1896b368d7cbSMatan Barak 
1897f72300c5SHaggai Abramovsky 	if (field_avail(typeof(resp), cqe_version, udata->outlen))
1898f72300c5SHaggai Abramovsky 		resp.response_length += sizeof(resp.cqe_version);
1899b368d7cbSMatan Barak 
1900402ca536SBodong Wang 	if (field_avail(typeof(resp), cmds_supp_uhw, udata->outlen)) {
19016ad279c5SMoni Shoua 		resp.cmds_supp_uhw |= MLX5_USER_CMDS_SUPP_UHW_QUERY_DEVICE |
19026ad279c5SMoni Shoua 				      MLX5_USER_CMDS_SUPP_UHW_CREATE_AH;
1903402ca536SBodong Wang 		resp.response_length += sizeof(resp.cmds_supp_uhw);
1904402ca536SBodong Wang 	}
1905402ca536SBodong Wang 
190678984898SOr Gerlitz 	if (field_avail(typeof(resp), eth_min_inline, udata->outlen)) {
190778984898SOr Gerlitz 		if (mlx5_ib_port_link_layer(ibdev, 1) == IB_LINK_LAYER_ETHERNET) {
190878984898SOr Gerlitz 			mlx5_query_min_inline(dev->mdev, &resp.eth_min_inline);
190978984898SOr Gerlitz 			resp.eth_min_inline++;
191078984898SOr Gerlitz 		}
191178984898SOr Gerlitz 		resp.response_length += sizeof(resp.eth_min_inline);
191278984898SOr Gerlitz 	}
191378984898SOr Gerlitz 
19145c99eaecSFeras Daoud 	if (field_avail(typeof(resp), clock_info_versions, udata->outlen)) {
19155c99eaecSFeras Daoud 		if (mdev->clock_info)
19165c99eaecSFeras Daoud 			resp.clock_info_versions = BIT(MLX5_IB_CLOCK_INFO_V1);
19175c99eaecSFeras Daoud 		resp.response_length += sizeof(resp.clock_info_versions);
19185c99eaecSFeras Daoud 	}
19195c99eaecSFeras Daoud 
1920bc5c6eedSNoa Osherovich 	/*
1921bc5c6eedSNoa Osherovich 	 * We don't want to expose information from the PCI bar that is located
1922bc5c6eedSNoa Osherovich 	 * after 4096 bytes, so if the arch only supports larger pages, let's
1923bc5c6eedSNoa Osherovich 	 * pretend we don't support reading the HCA's core clock. This is also
1924bc5c6eedSNoa Osherovich 	 * forced by mmap function.
1925bc5c6eedSNoa Osherovich 	 */
1926de8d6e02SEli Cohen 	if (field_avail(typeof(resp), hca_core_clock_offset, udata->outlen)) {
1927de8d6e02SEli Cohen 		if (PAGE_SIZE <= 4096) {
1928b368d7cbSMatan Barak 			resp.comp_mask |=
1929b368d7cbSMatan Barak 				MLX5_IB_ALLOC_UCONTEXT_RESP_MASK_CORE_CLOCK_OFFSET;
1930b368d7cbSMatan Barak 			resp.hca_core_clock_offset =
1931de8d6e02SEli Cohen 				offsetof(struct mlx5_init_seg, internal_timer_h) % PAGE_SIZE;
1932de8d6e02SEli Cohen 		}
19335c99eaecSFeras Daoud 		resp.response_length += sizeof(resp.hca_core_clock_offset);
1934b368d7cbSMatan Barak 	}
1935b368d7cbSMatan Barak 
193630aa60b3SEli Cohen 	if (field_avail(typeof(resp), log_uar_size, udata->outlen))
193730aa60b3SEli Cohen 		resp.response_length += sizeof(resp.log_uar_size);
193830aa60b3SEli Cohen 
193930aa60b3SEli Cohen 	if (field_avail(typeof(resp), num_uars_per_page, udata->outlen))
194030aa60b3SEli Cohen 		resp.response_length += sizeof(resp.num_uars_per_page);
194130aa60b3SEli Cohen 
194231a78a5aSYishai Hadas 	if (field_avail(typeof(resp), num_dyn_bfregs, udata->outlen)) {
194331a78a5aSYishai Hadas 		resp.num_dyn_bfregs = bfregi->num_dyn_bfregs;
194431a78a5aSYishai Hadas 		resp.response_length += sizeof(resp.num_dyn_bfregs);
194531a78a5aSYishai Hadas 	}
194631a78a5aSYishai Hadas 
194725bb36e7SYonatan Cohen 	if (field_avail(typeof(resp), dump_fill_mkey, udata->outlen)) {
194825bb36e7SYonatan Cohen 		if (MLX5_CAP_GEN(dev->mdev, dump_fill_mkey)) {
194925bb36e7SYonatan Cohen 			resp.dump_fill_mkey = dump_fill_mkey;
195025bb36e7SYonatan Cohen 			resp.comp_mask |=
195125bb36e7SYonatan Cohen 				MLX5_IB_ALLOC_UCONTEXT_RESP_MASK_DUMP_FILL_MKEY;
195225bb36e7SYonatan Cohen 		}
195325bb36e7SYonatan Cohen 		resp.response_length += sizeof(resp.dump_fill_mkey);
195425bb36e7SYonatan Cohen 	}
195525bb36e7SYonatan Cohen 
1956b368d7cbSMatan Barak 	err = ib_copy_to_udata(udata, &resp, resp.response_length);
1957e126ba97SEli Cohen 	if (err)
1958a8b92ca1SYishai Hadas 		goto out_mdev;
1959e126ba97SEli Cohen 
19602f5ff264SEli Cohen 	bfregi->ver = ver;
19612f5ff264SEli Cohen 	bfregi->num_low_latency_bfregs = req.num_low_latency_bfregs;
1962f72300c5SHaggai Abramovsky 	context->cqe_version = resp.cqe_version;
196330aa60b3SEli Cohen 	context->lib_caps = req.lib_caps;
196430aa60b3SEli Cohen 	print_lib_caps(dev, context->lib_caps);
1965f72300c5SHaggai Abramovsky 
19667c34ec19SAviv Heller 	if (dev->lag_active) {
196795579e78SMark Bloch 		u8 port = mlx5_core_native_port_num(dev->mdev) - 1;
1968c6a21c38SMajd Dibbiny 
1969c6a21c38SMajd Dibbiny 		atomic_set(&context->tx_port_affinity,
1970c6a21c38SMajd Dibbiny 			   atomic_add_return(
197195579e78SMark Bloch 				   1, &dev->port[port].roce.tx_port_affinity));
1972c6a21c38SMajd Dibbiny 	}
1973c6a21c38SMajd Dibbiny 
1974a2a074efSLeon Romanovsky 	return 0;
1975e126ba97SEli Cohen 
1976a8b92ca1SYishai Hadas out_mdev:
1977d2d19121SYishai Hadas 	mlx5_ib_dealloc_transport_domain(dev, context->tdn, context->devx_uid);
1978d2d19121SYishai Hadas out_devx:
1979a8b92ca1SYishai Hadas 	if (req.flags & MLX5_IB_ALLOC_UCTX_DEVX)
198076dc5a84SYishai Hadas 		mlx5_ib_devx_destroy(dev, context->devx_uid);
1981146d2f1aSmajd@mellanox.com 
1982e126ba97SEli Cohen out_uars:
1983b037c29aSEli Cohen 	deallocate_uars(dev, context);
1984b037c29aSEli Cohen 
1985b037c29aSEli Cohen out_sys_pages:
1986b037c29aSEli Cohen 	kfree(bfregi->sys_pages);
1987b037c29aSEli Cohen 
1988e126ba97SEli Cohen out_count:
19892f5ff264SEli Cohen 	kfree(bfregi->count);
1990e126ba97SEli Cohen 
1991e126ba97SEli Cohen out_ctx:
1992a2a074efSLeon Romanovsky 	return err;
1993e126ba97SEli Cohen }
1994e126ba97SEli Cohen 
1995a2a074efSLeon Romanovsky static void mlx5_ib_dealloc_ucontext(struct ib_ucontext *ibcontext)
1996e126ba97SEli Cohen {
1997e126ba97SEli Cohen 	struct mlx5_ib_ucontext *context = to_mucontext(ibcontext);
1998e126ba97SEli Cohen 	struct mlx5_ib_dev *dev = to_mdev(ibcontext->device);
1999b037c29aSEli Cohen 	struct mlx5_bfreg_info *bfregi;
2000e126ba97SEli Cohen 
2001b037c29aSEli Cohen 	bfregi = &context->bfregi;
2002d2d19121SYishai Hadas 	mlx5_ib_dealloc_transport_domain(dev, context->tdn, context->devx_uid);
2003d2d19121SYishai Hadas 
2004b037c29aSEli Cohen 	if (context->devx_uid)
200576dc5a84SYishai Hadas 		mlx5_ib_devx_destroy(dev, context->devx_uid);
2006e126ba97SEli Cohen 
2007e126ba97SEli Cohen 	deallocate_uars(dev, context);
20082f5ff264SEli Cohen 	kfree(bfregi->sys_pages);
20092f5ff264SEli Cohen 	kfree(bfregi->count);
2010e126ba97SEli Cohen }
2011e126ba97SEli Cohen 
2012e126ba97SEli Cohen static phys_addr_t uar_index2pfn(struct mlx5_ib_dev *dev,
2013e126ba97SEli Cohen 				 int uar_idx)
2014e126ba97SEli Cohen {
2015b037c29aSEli Cohen 	int fw_uars_per_page;
2016b037c29aSEli Cohen 
2017b037c29aSEli Cohen 	fw_uars_per_page = MLX5_CAP_GEN(dev->mdev, uar_4k) ? MLX5_UARS_IN_PAGE : 1;
2018b037c29aSEli Cohen 
2019aa8106f1SHuy Nguyen 	return (dev->mdev->bar_addr >> PAGE_SHIFT) + uar_idx / fw_uars_per_page;
2020e126ba97SEli Cohen }
2021e126ba97SEli Cohen 
2022e126ba97SEli Cohen static int get_command(unsigned long offset)
2023e126ba97SEli Cohen {
2024e126ba97SEli Cohen 	return (offset >> MLX5_IB_MMAP_CMD_SHIFT) & MLX5_IB_MMAP_CMD_MASK;
2025e126ba97SEli Cohen }
2026e126ba97SEli Cohen 
2027e126ba97SEli Cohen static int get_arg(unsigned long offset)
2028e126ba97SEli Cohen {
2029e126ba97SEli Cohen 	return offset & ((1 << MLX5_IB_MMAP_CMD_SHIFT) - 1);
2030e126ba97SEli Cohen }
2031e126ba97SEli Cohen 
/* The index of an mmap offset is simply its argument field */
static int get_index(unsigned long offset)
{
	int index = get_arg(offset);

	return index;
}
2036e126ba97SEli Cohen 
/*
 * Index resides in an extra byte to enable larger values than 255: bits
 * 16..23 of the offset are placed above the regular argument field.
 */
static int get_extended_index(unsigned long offset)
{
	unsigned long extra_byte = (offset >> 16) & 0xff;
	unsigned long high_part = extra_byte << 8;

	return get_arg(offset) | high_part;
}
20424ed131d0SYishai Hadas 
20437c2344c3SMaor Gottlieb 
/* Disassociate callback; this implementation performs no work. */
static void mlx5_ib_disassociate_ucontext(struct ib_ucontext *ibcontext)
{
	/* intentionally empty */
}
20477c2344c3SMaor Gottlieb 
204837aa5c36SGuy Levi static inline char *mmap_cmd2str(enum mlx5_ib_mmap_cmd cmd)
2049e126ba97SEli Cohen {
205037aa5c36SGuy Levi 	switch (cmd) {
205137aa5c36SGuy Levi 	case MLX5_IB_MMAP_WC_PAGE:
205237aa5c36SGuy Levi 		return "WC";
2053e126ba97SEli Cohen 	case MLX5_IB_MMAP_REGULAR_PAGE:
205437aa5c36SGuy Levi 		return "best effort WC";
205537aa5c36SGuy Levi 	case MLX5_IB_MMAP_NC_PAGE:
205637aa5c36SGuy Levi 		return "NC";
205724da0016SAriel Levkovich 	case MLX5_IB_MMAP_DEVICE_MEM:
205824da0016SAriel Levkovich 		return "Device Memory";
205937aa5c36SGuy Levi 	default:
206037aa5c36SGuy Levi 		return NULL;
206137aa5c36SGuy Levi 	}
206237aa5c36SGuy Levi }
206337aa5c36SGuy Levi 
20645c99eaecSFeras Daoud static int mlx5_ib_mmap_clock_info_page(struct mlx5_ib_dev *dev,
20655c99eaecSFeras Daoud 					struct vm_area_struct *vma,
20665c99eaecSFeras Daoud 					struct mlx5_ib_ucontext *context)
20675c99eaecSFeras Daoud {
20684eb6ab13SJason Gunthorpe 	if ((vma->vm_end - vma->vm_start != PAGE_SIZE) ||
20694eb6ab13SJason Gunthorpe 	    !(vma->vm_flags & VM_SHARED))
20705c99eaecSFeras Daoud 		return -EINVAL;
20715c99eaecSFeras Daoud 
20725c99eaecSFeras Daoud 	if (get_index(vma->vm_pgoff) != MLX5_IB_CLOCK_INFO_V1)
20735c99eaecSFeras Daoud 		return -EOPNOTSUPP;
20745c99eaecSFeras Daoud 
20754eb6ab13SJason Gunthorpe 	if (vma->vm_flags & (VM_WRITE | VM_EXEC))
20765c99eaecSFeras Daoud 		return -EPERM;
2077c660133cSJason Gunthorpe 	vma->vm_flags &= ~VM_MAYWRITE;
20785c99eaecSFeras Daoud 
2079ddcdc368SJason Gunthorpe 	if (!dev->mdev->clock_info)
20805c99eaecSFeras Daoud 		return -EOPNOTSUPP;
20815c99eaecSFeras Daoud 
20824eb6ab13SJason Gunthorpe 	return vm_insert_page(vma, vma->vm_start,
20834eb6ab13SJason Gunthorpe 			      virt_to_page(dev->mdev->clock_info));
20845c99eaecSFeras Daoud }
20855c99eaecSFeras Daoud 
208637aa5c36SGuy Levi static int uar_mmap(struct mlx5_ib_dev *dev, enum mlx5_ib_mmap_cmd cmd,
20877c2344c3SMaor Gottlieb 		    struct vm_area_struct *vma,
20887c2344c3SMaor Gottlieb 		    struct mlx5_ib_ucontext *context)
208937aa5c36SGuy Levi {
20902f5ff264SEli Cohen 	struct mlx5_bfreg_info *bfregi = &context->bfregi;
209137aa5c36SGuy Levi 	int err;
209237aa5c36SGuy Levi 	unsigned long idx;
2093aa09ea6eSKamal Heib 	phys_addr_t pfn;
209437aa5c36SGuy Levi 	pgprot_t prot;
20954ed131d0SYishai Hadas 	u32 bfreg_dyn_idx = 0;
20964ed131d0SYishai Hadas 	u32 uar_index;
20974ed131d0SYishai Hadas 	int dyn_uar = (cmd == MLX5_IB_MMAP_ALLOC_WC);
20984ed131d0SYishai Hadas 	int max_valid_idx = dyn_uar ? bfregi->num_sys_pages :
20994ed131d0SYishai Hadas 				bfregi->num_static_sys_pages;
2100b037c29aSEli Cohen 
2101b037c29aSEli Cohen 	if (vma->vm_end - vma->vm_start != PAGE_SIZE)
2102b037c29aSEli Cohen 		return -EINVAL;
2103b037c29aSEli Cohen 
21044ed131d0SYishai Hadas 	if (dyn_uar)
21054ed131d0SYishai Hadas 		idx = get_extended_index(vma->vm_pgoff) + bfregi->num_static_sys_pages;
21064ed131d0SYishai Hadas 	else
2107b037c29aSEli Cohen 		idx = get_index(vma->vm_pgoff);
21084ed131d0SYishai Hadas 
21094ed131d0SYishai Hadas 	if (idx >= max_valid_idx) {
21104ed131d0SYishai Hadas 		mlx5_ib_warn(dev, "invalid uar index %lu, max=%d\n",
21114ed131d0SYishai Hadas 			     idx, max_valid_idx);
2112b037c29aSEli Cohen 		return -EINVAL;
2113b037c29aSEli Cohen 	}
211437aa5c36SGuy Levi 
211537aa5c36SGuy Levi 	switch (cmd) {
211637aa5c36SGuy Levi 	case MLX5_IB_MMAP_WC_PAGE:
21174ed131d0SYishai Hadas 	case MLX5_IB_MMAP_ALLOC_WC:
211837aa5c36SGuy Levi /* Some architectures don't support WC memory */
211937aa5c36SGuy Levi #if defined(CONFIG_X86)
212037aa5c36SGuy Levi 		if (!pat_enabled())
212137aa5c36SGuy Levi 			return -EPERM;
212237aa5c36SGuy Levi #elif !(defined(CONFIG_PPC) || (defined(CONFIG_ARM) && defined(CONFIG_MMU)))
212337aa5c36SGuy Levi 			return -EPERM;
212437aa5c36SGuy Levi #endif
212537aa5c36SGuy Levi 	/* fall through */
212637aa5c36SGuy Levi 	case MLX5_IB_MMAP_REGULAR_PAGE:
212737aa5c36SGuy Levi 		/* For MLX5_IB_MMAP_REGULAR_PAGE do the best effort to get WC */
212837aa5c36SGuy Levi 		prot = pgprot_writecombine(vma->vm_page_prot);
212937aa5c36SGuy Levi 		break;
213037aa5c36SGuy Levi 	case MLX5_IB_MMAP_NC_PAGE:
213137aa5c36SGuy Levi 		prot = pgprot_noncached(vma->vm_page_prot);
213237aa5c36SGuy Levi 		break;
213337aa5c36SGuy Levi 	default:
213437aa5c36SGuy Levi 		return -EINVAL;
213537aa5c36SGuy Levi 	}
213637aa5c36SGuy Levi 
21374ed131d0SYishai Hadas 	if (dyn_uar) {
21384ed131d0SYishai Hadas 		int uars_per_page;
21394ed131d0SYishai Hadas 
21404ed131d0SYishai Hadas 		uars_per_page = get_uars_per_sys_page(dev, bfregi->lib_uar_4k);
21414ed131d0SYishai Hadas 		bfreg_dyn_idx = idx * (uars_per_page * MLX5_NON_FP_BFREGS_PER_UAR);
21424ed131d0SYishai Hadas 		if (bfreg_dyn_idx >= bfregi->total_num_bfregs) {
21434ed131d0SYishai Hadas 			mlx5_ib_warn(dev, "invalid bfreg_dyn_idx %u, max=%u\n",
21444ed131d0SYishai Hadas 				     bfreg_dyn_idx, bfregi->total_num_bfregs);
21454ed131d0SYishai Hadas 			return -EINVAL;
21464ed131d0SYishai Hadas 		}
21474ed131d0SYishai Hadas 
21484ed131d0SYishai Hadas 		mutex_lock(&bfregi->lock);
21494ed131d0SYishai Hadas 		/* Fail if uar already allocated, first bfreg index of each
21504ed131d0SYishai Hadas 		 * page holds its count.
21514ed131d0SYishai Hadas 		 */
21524ed131d0SYishai Hadas 		if (bfregi->count[bfreg_dyn_idx]) {
21534ed131d0SYishai Hadas 			mlx5_ib_warn(dev, "wrong offset, idx %lu is busy, bfregn=%u\n", idx, bfreg_dyn_idx);
21544ed131d0SYishai Hadas 			mutex_unlock(&bfregi->lock);
21554ed131d0SYishai Hadas 			return -EINVAL;
21564ed131d0SYishai Hadas 		}
21574ed131d0SYishai Hadas 
21584ed131d0SYishai Hadas 		bfregi->count[bfreg_dyn_idx]++;
21594ed131d0SYishai Hadas 		mutex_unlock(&bfregi->lock);
21604ed131d0SYishai Hadas 
21614ed131d0SYishai Hadas 		err = mlx5_cmd_alloc_uar(dev->mdev, &uar_index);
21624ed131d0SYishai Hadas 		if (err) {
21634ed131d0SYishai Hadas 			mlx5_ib_warn(dev, "UAR alloc failed\n");
21644ed131d0SYishai Hadas 			goto free_bfreg;
21654ed131d0SYishai Hadas 		}
21664ed131d0SYishai Hadas 	} else {
21674ed131d0SYishai Hadas 		uar_index = bfregi->sys_pages[idx];
21684ed131d0SYishai Hadas 	}
21694ed131d0SYishai Hadas 
21704ed131d0SYishai Hadas 	pfn = uar_index2pfn(dev, uar_index);
217137aa5c36SGuy Levi 	mlx5_ib_dbg(dev, "uar idx 0x%lx, pfn %pa\n", idx, &pfn);
2172e126ba97SEli Cohen 
2173e2cd1d1aSJason Gunthorpe 	err = rdma_user_mmap_io(&context->ibucontext, vma, pfn, PAGE_SIZE,
2174e2cd1d1aSJason Gunthorpe 				prot);
217537aa5c36SGuy Levi 	if (err) {
21768f062287SLeon Romanovsky 		mlx5_ib_err(dev,
2177e2cd1d1aSJason Gunthorpe 			    "rdma_user_mmap_io failed with error=%d, mmap_cmd=%s\n",
21788f062287SLeon Romanovsky 			    err, mmap_cmd2str(cmd));
21794ed131d0SYishai Hadas 		goto err;
218037aa5c36SGuy Levi 	}
2181e126ba97SEli Cohen 
21824ed131d0SYishai Hadas 	if (dyn_uar)
21834ed131d0SYishai Hadas 		bfregi->sys_pages[idx] = uar_index;
21844ed131d0SYishai Hadas 	return 0;
21854ed131d0SYishai Hadas 
21864ed131d0SYishai Hadas err:
21874ed131d0SYishai Hadas 	if (!dyn_uar)
21884ed131d0SYishai Hadas 		return err;
21894ed131d0SYishai Hadas 
21904ed131d0SYishai Hadas 	mlx5_cmd_free_uar(dev->mdev, idx);
21914ed131d0SYishai Hadas 
21924ed131d0SYishai Hadas free_bfreg:
21934ed131d0SYishai Hadas 	mlx5_ib_free_bfreg(dev, bfregi, bfreg_dyn_idx);
21944ed131d0SYishai Hadas 
21954ed131d0SYishai Hadas 	return err;
219637aa5c36SGuy Levi }
219737aa5c36SGuy Levi 
219824da0016SAriel Levkovich static int dm_mmap(struct ib_ucontext *context, struct vm_area_struct *vma)
219924da0016SAriel Levkovich {
220024da0016SAriel Levkovich 	struct mlx5_ib_ucontext *mctx = to_mucontext(context);
220124da0016SAriel Levkovich 	struct mlx5_ib_dev *dev = to_mdev(context->device);
220224da0016SAriel Levkovich 	u16 page_idx = get_extended_index(vma->vm_pgoff);
220324da0016SAriel Levkovich 	size_t map_size = vma->vm_end - vma->vm_start;
220424da0016SAriel Levkovich 	u32 npages = map_size >> PAGE_SHIFT;
220524da0016SAriel Levkovich 	phys_addr_t pfn;
220624da0016SAriel Levkovich 
220724da0016SAriel Levkovich 	if (find_next_zero_bit(mctx->dm_pages, page_idx + npages, page_idx) !=
220824da0016SAriel Levkovich 	    page_idx + npages)
220924da0016SAriel Levkovich 		return -EINVAL;
221024da0016SAriel Levkovich 
2211aa8106f1SHuy Nguyen 	pfn = ((dev->mdev->bar_addr +
221224da0016SAriel Levkovich 	      MLX5_CAP64_DEV_MEM(dev->mdev, memic_bar_start_addr)) >>
221324da0016SAriel Levkovich 	      PAGE_SHIFT) +
221424da0016SAriel Levkovich 	      page_idx;
2215e2cd1d1aSJason Gunthorpe 	return rdma_user_mmap_io(context, vma, pfn, map_size,
2216e2cd1d1aSJason Gunthorpe 				 pgprot_writecombine(vma->vm_page_prot));
221724da0016SAriel Levkovich }
221824da0016SAriel Levkovich 
221937aa5c36SGuy Levi static int mlx5_ib_mmap(struct ib_ucontext *ibcontext, struct vm_area_struct *vma)
222037aa5c36SGuy Levi {
222137aa5c36SGuy Levi 	struct mlx5_ib_ucontext *context = to_mucontext(ibcontext);
222237aa5c36SGuy Levi 	struct mlx5_ib_dev *dev = to_mdev(ibcontext->device);
222337aa5c36SGuy Levi 	unsigned long command;
222437aa5c36SGuy Levi 	phys_addr_t pfn;
222537aa5c36SGuy Levi 
222637aa5c36SGuy Levi 	command = get_command(vma->vm_pgoff);
222737aa5c36SGuy Levi 	switch (command) {
222837aa5c36SGuy Levi 	case MLX5_IB_MMAP_WC_PAGE:
222937aa5c36SGuy Levi 	case MLX5_IB_MMAP_NC_PAGE:
223037aa5c36SGuy Levi 	case MLX5_IB_MMAP_REGULAR_PAGE:
22314ed131d0SYishai Hadas 	case MLX5_IB_MMAP_ALLOC_WC:
22327c2344c3SMaor Gottlieb 		return uar_mmap(dev, command, vma, context);
2233e126ba97SEli Cohen 
2234e126ba97SEli Cohen 	case MLX5_IB_MMAP_GET_CONTIGUOUS_PAGES:
2235e126ba97SEli Cohen 		return -ENOSYS;
2236e126ba97SEli Cohen 
2237d69e3bcfSMatan Barak 	case MLX5_IB_MMAP_CORE_CLOCK:
2238d69e3bcfSMatan Barak 		if (vma->vm_end - vma->vm_start != PAGE_SIZE)
2239d69e3bcfSMatan Barak 			return -EINVAL;
2240d69e3bcfSMatan Barak 
22416cbac1e4SMatan Barak 		if (vma->vm_flags & VM_WRITE)
2242d69e3bcfSMatan Barak 			return -EPERM;
2243c660133cSJason Gunthorpe 		vma->vm_flags &= ~VM_MAYWRITE;
2244d69e3bcfSMatan Barak 
2245d69e3bcfSMatan Barak 		/* Don't expose to user-space information it shouldn't have */
2246d69e3bcfSMatan Barak 		if (PAGE_SIZE > 4096)
2247d69e3bcfSMatan Barak 			return -EOPNOTSUPP;
2248d69e3bcfSMatan Barak 
2249d69e3bcfSMatan Barak 		pfn = (dev->mdev->iseg_base +
2250d69e3bcfSMatan Barak 		       offsetof(struct mlx5_init_seg, internal_timer_h)) >>
2251d69e3bcfSMatan Barak 			PAGE_SHIFT;
2252d5e560d3SJason Gunthorpe 		return rdma_user_mmap_io(&context->ibucontext, vma, pfn,
2253d5e560d3SJason Gunthorpe 					 PAGE_SIZE,
2254d5e560d3SJason Gunthorpe 					 pgprot_noncached(vma->vm_page_prot));
22555c99eaecSFeras Daoud 	case MLX5_IB_MMAP_CLOCK_INFO:
22565c99eaecSFeras Daoud 		return mlx5_ib_mmap_clock_info_page(dev, vma, context);
2257d69e3bcfSMatan Barak 
225824da0016SAriel Levkovich 	case MLX5_IB_MMAP_DEVICE_MEM:
225924da0016SAriel Levkovich 		return dm_mmap(ibcontext, vma);
226024da0016SAriel Levkovich 
2261e126ba97SEli Cohen 	default:
2262e126ba97SEli Cohen 		return -EINVAL;
2263e126ba97SEli Cohen 	}
2264e126ba97SEli Cohen 
2265e126ba97SEli Cohen 	return 0;
2266e126ba97SEli Cohen }
2267e126ba97SEli Cohen 
226825c13324SAriel Levkovich static inline int check_dm_type_support(struct mlx5_ib_dev *dev,
226925c13324SAriel Levkovich 					u32 type)
227025c13324SAriel Levkovich {
227125c13324SAriel Levkovich 	switch (type) {
227225c13324SAriel Levkovich 	case MLX5_IB_UAPI_DM_TYPE_MEMIC:
227325c13324SAriel Levkovich 		if (!MLX5_CAP_DEV_MEM(dev->mdev, memic))
227425c13324SAriel Levkovich 			return -EOPNOTSUPP;
227525c13324SAriel Levkovich 		break;
227625c13324SAriel Levkovich 	case MLX5_IB_UAPI_DM_TYPE_STEERING_SW_ICM:
2277c9b9dcb4SAriel Levkovich 	case MLX5_IB_UAPI_DM_TYPE_HEADER_MODIFY_SW_ICM:
227825c13324SAriel Levkovich 		if (!capable(CAP_SYS_RAWIO) ||
227925c13324SAriel Levkovich 		    !capable(CAP_NET_RAW))
228025c13324SAriel Levkovich 			return -EPERM;
228125c13324SAriel Levkovich 
228225c13324SAriel Levkovich 		if (!(MLX5_CAP_FLOWTABLE_NIC_RX(dev->mdev, sw_owner) ||
228325c13324SAriel Levkovich 		      MLX5_CAP_FLOWTABLE_NIC_TX(dev->mdev, sw_owner)))
228425c13324SAriel Levkovich 			return -EOPNOTSUPP;
228525c13324SAriel Levkovich 		break;
228625c13324SAriel Levkovich 	}
228725c13324SAriel Levkovich 
228825c13324SAriel Levkovich 	return 0;
228925c13324SAriel Levkovich }
229025c13324SAriel Levkovich 
22913b113a1eSAriel Levkovich static int handle_alloc_dm_memic(struct ib_ucontext *ctx,
22923b113a1eSAriel Levkovich 				 struct mlx5_ib_dm *dm,
229324da0016SAriel Levkovich 				 struct ib_dm_alloc_attr *attr,
229424da0016SAriel Levkovich 				 struct uverbs_attr_bundle *attrs)
229524da0016SAriel Levkovich {
22963b113a1eSAriel Levkovich 	struct mlx5_dm *dm_db = &to_mdev(ctx->device)->dm;
229724da0016SAriel Levkovich 	u64 start_offset;
229824da0016SAriel Levkovich 	u32 page_idx;
229924da0016SAriel Levkovich 	int err;
230024da0016SAriel Levkovich 
23013b113a1eSAriel Levkovich 	dm->size = roundup(attr->length, MLX5_MEMIC_BASE_SIZE);
230224da0016SAriel Levkovich 
23033b113a1eSAriel Levkovich 	err = mlx5_cmd_alloc_memic(dm_db, &dm->dev_addr,
23043b113a1eSAriel Levkovich 				   dm->size, attr->alignment);
230524da0016SAriel Levkovich 	if (err)
23063b113a1eSAriel Levkovich 		return err;
230724da0016SAriel Levkovich 
23083b113a1eSAriel Levkovich 	page_idx = (dm->dev_addr - pci_resource_start(dm_db->dev->pdev, 0) -
23093b113a1eSAriel Levkovich 		    MLX5_CAP64_DEV_MEM(dm_db->dev, memic_bar_start_addr)) >>
231024da0016SAriel Levkovich 		    PAGE_SHIFT;
231124da0016SAriel Levkovich 
231224da0016SAriel Levkovich 	err = uverbs_copy_to(attrs,
231324da0016SAriel Levkovich 			     MLX5_IB_ATTR_ALLOC_DM_RESP_PAGE_INDEX,
231424da0016SAriel Levkovich 			     &page_idx, sizeof(page_idx));
231524da0016SAriel Levkovich 	if (err)
231624da0016SAriel Levkovich 		goto err_dealloc;
231724da0016SAriel Levkovich 
23183b113a1eSAriel Levkovich 	start_offset = dm->dev_addr & ~PAGE_MASK;
23193b113a1eSAriel Levkovich 	err = uverbs_copy_to(attrs,
23203b113a1eSAriel Levkovich 			     MLX5_IB_ATTR_ALLOC_DM_RESP_START_OFFSET,
23213b113a1eSAriel Levkovich 			     &start_offset, sizeof(start_offset));
23223b113a1eSAriel Levkovich 	if (err)
23233b113a1eSAriel Levkovich 		goto err_dealloc;
232424da0016SAriel Levkovich 
23253b113a1eSAriel Levkovich 	bitmap_set(to_mucontext(ctx)->dm_pages, page_idx,
23263b113a1eSAriel Levkovich 		   DIV_ROUND_UP(dm->size, PAGE_SIZE));
23273b113a1eSAriel Levkovich 
23283b113a1eSAriel Levkovich 	return 0;
23293b113a1eSAriel Levkovich 
23303b113a1eSAriel Levkovich err_dealloc:
23313b113a1eSAriel Levkovich 	mlx5_cmd_dealloc_memic(dm_db, dm->dev_addr, dm->size);
23323b113a1eSAriel Levkovich 
23333b113a1eSAriel Levkovich 	return err;
23343b113a1eSAriel Levkovich }
23353b113a1eSAriel Levkovich 
233625c13324SAriel Levkovich static int handle_alloc_dm_sw_icm(struct ib_ucontext *ctx,
233725c13324SAriel Levkovich 				  struct mlx5_ib_dm *dm,
233825c13324SAriel Levkovich 				  struct ib_dm_alloc_attr *attr,
233925c13324SAriel Levkovich 				  struct uverbs_attr_bundle *attrs,
234025c13324SAriel Levkovich 				  int type)
234125c13324SAriel Levkovich {
2342c9b9dcb4SAriel Levkovich 	struct mlx5_core_dev *dev = to_mdev(ctx->device)->mdev;
234325c13324SAriel Levkovich 	u64 act_size;
234425c13324SAriel Levkovich 	int err;
234525c13324SAriel Levkovich 
234625c13324SAriel Levkovich 	/* Allocation size must a multiple of the basic block size
234725c13324SAriel Levkovich 	 * and a power of 2.
234825c13324SAriel Levkovich 	 */
2349c9b9dcb4SAriel Levkovich 	act_size = round_up(attr->length, MLX5_SW_ICM_BLOCK_SIZE(dev));
235025c13324SAriel Levkovich 	act_size = roundup_pow_of_two(act_size);
235125c13324SAriel Levkovich 
235225c13324SAriel Levkovich 	dm->size = act_size;
2353c9b9dcb4SAriel Levkovich 	err = mlx5_dm_sw_icm_alloc(dev, type, act_size,
235425c13324SAriel Levkovich 				   to_mucontext(ctx)->devx_uid, &dm->dev_addr,
235525c13324SAriel Levkovich 				   &dm->icm_dm.obj_id);
235625c13324SAriel Levkovich 	if (err)
235725c13324SAriel Levkovich 		return err;
235825c13324SAriel Levkovich 
235925c13324SAriel Levkovich 	err = uverbs_copy_to(attrs,
236025c13324SAriel Levkovich 			     MLX5_IB_ATTR_ALLOC_DM_RESP_START_OFFSET,
236125c13324SAriel Levkovich 			     &dm->dev_addr, sizeof(dm->dev_addr));
236225c13324SAriel Levkovich 	if (err)
2363c9b9dcb4SAriel Levkovich 		mlx5_dm_sw_icm_dealloc(dev, type, dm->size,
2364c9b9dcb4SAriel Levkovich 				       to_mucontext(ctx)->devx_uid, dm->dev_addr,
2365c9b9dcb4SAriel Levkovich 				       dm->icm_dm.obj_id);
236625c13324SAriel Levkovich 
236725c13324SAriel Levkovich 	return err;
236825c13324SAriel Levkovich }
236925c13324SAriel Levkovich 
23703b113a1eSAriel Levkovich struct ib_dm *mlx5_ib_alloc_dm(struct ib_device *ibdev,
23713b113a1eSAriel Levkovich 			       struct ib_ucontext *context,
23723b113a1eSAriel Levkovich 			       struct ib_dm_alloc_attr *attr,
23733b113a1eSAriel Levkovich 			       struct uverbs_attr_bundle *attrs)
23743b113a1eSAriel Levkovich {
23753b113a1eSAriel Levkovich 	struct mlx5_ib_dm *dm;
23763b113a1eSAriel Levkovich 	enum mlx5_ib_uapi_dm_type type;
23773b113a1eSAriel Levkovich 	int err;
23783b113a1eSAriel Levkovich 
23793b113a1eSAriel Levkovich 	err = uverbs_get_const_default(&type, attrs,
23803b113a1eSAriel Levkovich 				       MLX5_IB_ATTR_ALLOC_DM_REQ_TYPE,
23813b113a1eSAriel Levkovich 				       MLX5_IB_UAPI_DM_TYPE_MEMIC);
23823b113a1eSAriel Levkovich 	if (err)
23833b113a1eSAriel Levkovich 		return ERR_PTR(err);
23843b113a1eSAriel Levkovich 
23853b113a1eSAriel Levkovich 	mlx5_ib_dbg(to_mdev(ibdev), "alloc_dm req: dm_type=%d user_length=0x%llx log_alignment=%d\n",
23863b113a1eSAriel Levkovich 		    type, attr->length, attr->alignment);
23873b113a1eSAriel Levkovich 
238825c13324SAriel Levkovich 	err = check_dm_type_support(to_mdev(ibdev), type);
238925c13324SAriel Levkovich 	if (err)
239025c13324SAriel Levkovich 		return ERR_PTR(err);
239125c13324SAriel Levkovich 
23923b113a1eSAriel Levkovich 	dm = kzalloc(sizeof(*dm), GFP_KERNEL);
23933b113a1eSAriel Levkovich 	if (!dm)
23943b113a1eSAriel Levkovich 		return ERR_PTR(-ENOMEM);
23953b113a1eSAriel Levkovich 
23963b113a1eSAriel Levkovich 	dm->type = type;
23973b113a1eSAriel Levkovich 
23983b113a1eSAriel Levkovich 	switch (type) {
23993b113a1eSAriel Levkovich 	case MLX5_IB_UAPI_DM_TYPE_MEMIC:
24003b113a1eSAriel Levkovich 		err = handle_alloc_dm_memic(context, dm,
24013b113a1eSAriel Levkovich 					    attr,
24023b113a1eSAriel Levkovich 					    attrs);
24033b113a1eSAriel Levkovich 		break;
240425c13324SAriel Levkovich 	case MLX5_IB_UAPI_DM_TYPE_STEERING_SW_ICM:
2405c9b9dcb4SAriel Levkovich 		err = handle_alloc_dm_sw_icm(context, dm,
2406c9b9dcb4SAriel Levkovich 					     attr, attrs,
2407c9b9dcb4SAriel Levkovich 					     MLX5_SW_ICM_TYPE_STEERING);
2408c9b9dcb4SAriel Levkovich 		break;
240925c13324SAriel Levkovich 	case MLX5_IB_UAPI_DM_TYPE_HEADER_MODIFY_SW_ICM:
2410c9b9dcb4SAriel Levkovich 		err = handle_alloc_dm_sw_icm(context, dm,
2411c9b9dcb4SAriel Levkovich 					     attr, attrs,
2412c9b9dcb4SAriel Levkovich 					     MLX5_SW_ICM_TYPE_HEADER_MODIFY);
241325c13324SAriel Levkovich 		break;
24143b113a1eSAriel Levkovich 	default:
24153b113a1eSAriel Levkovich 		err = -EOPNOTSUPP;
24163b113a1eSAriel Levkovich 	}
24173b113a1eSAriel Levkovich 
24183b113a1eSAriel Levkovich 	if (err)
24193b113a1eSAriel Levkovich 		goto err_free;
242024da0016SAriel Levkovich 
242124da0016SAriel Levkovich 	return &dm->ibdm;
242224da0016SAriel Levkovich 
242324da0016SAriel Levkovich err_free:
242424da0016SAriel Levkovich 	kfree(dm);
242524da0016SAriel Levkovich 	return ERR_PTR(err);
242624da0016SAriel Levkovich }
242724da0016SAriel Levkovich 
2428c4367a26SShamir Rabinovitch int mlx5_ib_dealloc_dm(struct ib_dm *ibdm, struct uverbs_attr_bundle *attrs)
242924da0016SAriel Levkovich {
243025c13324SAriel Levkovich 	struct mlx5_ib_ucontext *ctx = rdma_udata_to_drv_context(
243125c13324SAriel Levkovich 		&attrs->driver_udata, struct mlx5_ib_ucontext, ibucontext);
2432c9b9dcb4SAriel Levkovich 	struct mlx5_core_dev *dev = to_mdev(ibdm->device)->mdev;
24333b113a1eSAriel Levkovich 	struct mlx5_dm *dm_db = &to_mdev(ibdm->device)->dm;
243424da0016SAriel Levkovich 	struct mlx5_ib_dm *dm = to_mdm(ibdm);
243524da0016SAriel Levkovich 	u32 page_idx;
243624da0016SAriel Levkovich 	int ret;
243724da0016SAriel Levkovich 
24383b113a1eSAriel Levkovich 	switch (dm->type) {
24393b113a1eSAriel Levkovich 	case MLX5_IB_UAPI_DM_TYPE_MEMIC:
24403b113a1eSAriel Levkovich 		ret = mlx5_cmd_dealloc_memic(dm_db, dm->dev_addr, dm->size);
244124da0016SAriel Levkovich 		if (ret)
244224da0016SAriel Levkovich 			return ret;
244324da0016SAriel Levkovich 
2444c9b9dcb4SAriel Levkovich 		page_idx = (dm->dev_addr - pci_resource_start(dev->pdev, 0) -
2445c9b9dcb4SAriel Levkovich 			    MLX5_CAP64_DEV_MEM(dev, memic_bar_start_addr)) >>
244624da0016SAriel Levkovich 			    PAGE_SHIFT;
244725c13324SAriel Levkovich 		bitmap_clear(ctx->dm_pages, page_idx,
244825c13324SAriel Levkovich 			     DIV_ROUND_UP(dm->size, PAGE_SIZE));
244925c13324SAriel Levkovich 		break;
245025c13324SAriel Levkovich 	case MLX5_IB_UAPI_DM_TYPE_STEERING_SW_ICM:
2451c9b9dcb4SAriel Levkovich 		ret = mlx5_dm_sw_icm_dealloc(dev, MLX5_SW_ICM_TYPE_STEERING,
2452c9b9dcb4SAriel Levkovich 					     dm->size, ctx->devx_uid, dm->dev_addr,
2453c9b9dcb4SAriel Levkovich 					     dm->icm_dm.obj_id);
2454c9b9dcb4SAriel Levkovich 		if (ret)
2455c9b9dcb4SAriel Levkovich 			return ret;
2456c9b9dcb4SAriel Levkovich 		break;
245725c13324SAriel Levkovich 	case MLX5_IB_UAPI_DM_TYPE_HEADER_MODIFY_SW_ICM:
2458c9b9dcb4SAriel Levkovich 		ret = mlx5_dm_sw_icm_dealloc(dev, MLX5_SW_ICM_TYPE_HEADER_MODIFY,
2459c9b9dcb4SAriel Levkovich 					     dm->size, ctx->devx_uid, dm->dev_addr,
246025c13324SAriel Levkovich 					     dm->icm_dm.obj_id);
246125c13324SAriel Levkovich 		if (ret)
246225c13324SAriel Levkovich 			return ret;
24633b113a1eSAriel Levkovich 		break;
24643b113a1eSAriel Levkovich 	default:
24653b113a1eSAriel Levkovich 		return -EOPNOTSUPP;
24663b113a1eSAriel Levkovich 	}
246724da0016SAriel Levkovich 
246824da0016SAriel Levkovich 	kfree(dm);
246924da0016SAriel Levkovich 
247024da0016SAriel Levkovich 	return 0;
247124da0016SAriel Levkovich }
247224da0016SAriel Levkovich 
2473ff23dfa1SShamir Rabinovitch static int mlx5_ib_alloc_pd(struct ib_pd *ibpd, struct ib_udata *udata)
2474e126ba97SEli Cohen {
247521a428a0SLeon Romanovsky 	struct mlx5_ib_pd *pd = to_mpd(ibpd);
247621a428a0SLeon Romanovsky 	struct ib_device *ibdev = ibpd->device;
2477e126ba97SEli Cohen 	struct mlx5_ib_alloc_pd_resp resp;
2478e126ba97SEli Cohen 	int err;
2479a1069c1cSYishai Hadas 	u32 out[MLX5_ST_SZ_DW(alloc_pd_out)] = {};
2480a1069c1cSYishai Hadas 	u32 in[MLX5_ST_SZ_DW(alloc_pd_in)]   = {};
2481a1069c1cSYishai Hadas 	u16 uid = 0;
2482ff23dfa1SShamir Rabinovitch 	struct mlx5_ib_ucontext *context = rdma_udata_to_drv_context(
2483ff23dfa1SShamir Rabinovitch 		udata, struct mlx5_ib_ucontext, ibucontext);
2484e126ba97SEli Cohen 
2485ff23dfa1SShamir Rabinovitch 	uid = context ? context->devx_uid : 0;
2486a1069c1cSYishai Hadas 	MLX5_SET(alloc_pd_in, in, opcode, MLX5_CMD_OP_ALLOC_PD);
2487a1069c1cSYishai Hadas 	MLX5_SET(alloc_pd_in, in, uid, uid);
2488a1069c1cSYishai Hadas 	err = mlx5_cmd_exec(to_mdev(ibdev)->mdev, in, sizeof(in),
2489a1069c1cSYishai Hadas 			    out, sizeof(out));
249021a428a0SLeon Romanovsky 	if (err)
249121a428a0SLeon Romanovsky 		return err;
2492e126ba97SEli Cohen 
2493a1069c1cSYishai Hadas 	pd->pdn = MLX5_GET(alloc_pd_out, out, pd);
2494a1069c1cSYishai Hadas 	pd->uid = uid;
2495ff23dfa1SShamir Rabinovitch 	if (udata) {
2496e126ba97SEli Cohen 		resp.pdn = pd->pdn;
2497e126ba97SEli Cohen 		if (ib_copy_to_udata(udata, &resp, sizeof(resp))) {
2498a1069c1cSYishai Hadas 			mlx5_cmd_dealloc_pd(to_mdev(ibdev)->mdev, pd->pdn, uid);
249921a428a0SLeon Romanovsky 			return -EFAULT;
2500e126ba97SEli Cohen 		}
2501e126ba97SEli Cohen 	}
2502e126ba97SEli Cohen 
250321a428a0SLeon Romanovsky 	return 0;
2504e126ba97SEli Cohen }
2505e126ba97SEli Cohen 
2506c4367a26SShamir Rabinovitch static void mlx5_ib_dealloc_pd(struct ib_pd *pd, struct ib_udata *udata)
2507e126ba97SEli Cohen {
2508e126ba97SEli Cohen 	struct mlx5_ib_dev *mdev = to_mdev(pd->device);
2509e126ba97SEli Cohen 	struct mlx5_ib_pd *mpd = to_mpd(pd);
2510e126ba97SEli Cohen 
2511a1069c1cSYishai Hadas 	mlx5_cmd_dealloc_pd(mdev->mdev, mpd->pdn, mpd->uid);
2512e126ba97SEli Cohen }
2513e126ba97SEli Cohen 
/* Bit positions used when assembling a match_criteria_enable mask */
enum {
	MATCH_CRITERIA_ENABLE_OUTER_BIT = 0,
	MATCH_CRITERIA_ENABLE_MISC_BIT  = 1,
	MATCH_CRITERIA_ENABLE_INNER_BIT = 2,
	MATCH_CRITERIA_ENABLE_MISC2_BIT = 3,
};
2520038d2ef8SMaor Gottlieb 
/*
 * True when the @headers section of the fte_match_param buffer
 * @match_criteria contains only zero bytes (memchr_inv() finds no byte
 * different from 0 in it).  The expansion is fully parenthesized so it can be
 * combined with other operators safely.
 */
#define HEADER_IS_ZERO(match_criteria, headers)				     \
	(!memchr_inv(MLX5_ADDR_OF(fte_match_param, match_criteria, headers), \
		     0, MLX5_FLD_SZ_BYTES(fte_match_param, headers)))
2524466fa6d2SMaor Gottlieb 
2525466fa6d2SMaor Gottlieb static u8 get_match_criteria_enable(u32 *match_criteria)
2526466fa6d2SMaor Gottlieb {
2527466fa6d2SMaor Gottlieb 	u8 match_criteria_enable;
2528466fa6d2SMaor Gottlieb 
2529466fa6d2SMaor Gottlieb 	match_criteria_enable =
2530466fa6d2SMaor Gottlieb 		(!HEADER_IS_ZERO(match_criteria, outer_headers)) <<
2531466fa6d2SMaor Gottlieb 		MATCH_CRITERIA_ENABLE_OUTER_BIT;
2532466fa6d2SMaor Gottlieb 	match_criteria_enable |=
2533466fa6d2SMaor Gottlieb 		(!HEADER_IS_ZERO(match_criteria, misc_parameters)) <<
2534466fa6d2SMaor Gottlieb 		MATCH_CRITERIA_ENABLE_MISC_BIT;
2535466fa6d2SMaor Gottlieb 	match_criteria_enable |=
2536466fa6d2SMaor Gottlieb 		(!HEADER_IS_ZERO(match_criteria, inner_headers)) <<
2537466fa6d2SMaor Gottlieb 		MATCH_CRITERIA_ENABLE_INNER_BIT;
253871c6e863SAriel Levkovich 	match_criteria_enable |=
253971c6e863SAriel Levkovich 		(!HEADER_IS_ZERO(match_criteria, misc_parameters_2)) <<
254071c6e863SAriel Levkovich 		MATCH_CRITERIA_ENABLE_MISC2_BIT;
2541466fa6d2SMaor Gottlieb 
2542466fa6d2SMaor Gottlieb 	return match_criteria_enable;
2543038d2ef8SMaor Gottlieb }
2544038d2ef8SMaor Gottlieb 
25456113cc44SMaor Gottlieb static int set_proto(void *outer_c, void *outer_v, u8 mask, u8 val)
2546ca0d4753SMaor Gottlieb {
25476113cc44SMaor Gottlieb 	u8 entry_mask;
25486113cc44SMaor Gottlieb 	u8 entry_val;
25496113cc44SMaor Gottlieb 	int err = 0;
25506113cc44SMaor Gottlieb 
25516113cc44SMaor Gottlieb 	if (!mask)
25526113cc44SMaor Gottlieb 		goto out;
25536113cc44SMaor Gottlieb 
25546113cc44SMaor Gottlieb 	entry_mask = MLX5_GET(fte_match_set_lyr_2_4, outer_c,
25556113cc44SMaor Gottlieb 			      ip_protocol);
25566113cc44SMaor Gottlieb 	entry_val = MLX5_GET(fte_match_set_lyr_2_4, outer_v,
25576113cc44SMaor Gottlieb 			     ip_protocol);
25586113cc44SMaor Gottlieb 	if (!entry_mask) {
2559ca0d4753SMaor Gottlieb 		MLX5_SET(fte_match_set_lyr_2_4, outer_c, ip_protocol, mask);
2560ca0d4753SMaor Gottlieb 		MLX5_SET(fte_match_set_lyr_2_4, outer_v, ip_protocol, val);
25616113cc44SMaor Gottlieb 		goto out;
25626113cc44SMaor Gottlieb 	}
25636113cc44SMaor Gottlieb 	/* Don't override existing ip protocol */
25646113cc44SMaor Gottlieb 	if (mask != entry_mask || val != entry_val)
25656113cc44SMaor Gottlieb 		err = -EINVAL;
25666113cc44SMaor Gottlieb out:
25676113cc44SMaor Gottlieb 	return err;
2568ca0d4753SMaor Gottlieb }
2569ca0d4753SMaor Gottlieb 
257037da2a03SDaria Velikovsky static void set_flow_label(void *misc_c, void *misc_v, u32 mask, u32 val,
25712d1e697eSMoses Reuben 			   bool inner)
25722d1e697eSMoses Reuben {
25732d1e697eSMoses Reuben 	if (inner) {
25742d1e697eSMoses Reuben 		MLX5_SET(fte_match_set_misc,
25752d1e697eSMoses Reuben 			 misc_c, inner_ipv6_flow_label, mask);
25762d1e697eSMoses Reuben 		MLX5_SET(fte_match_set_misc,
25772d1e697eSMoses Reuben 			 misc_v, inner_ipv6_flow_label, val);
25782d1e697eSMoses Reuben 	} else {
25792d1e697eSMoses Reuben 		MLX5_SET(fte_match_set_misc,
25802d1e697eSMoses Reuben 			 misc_c, outer_ipv6_flow_label, mask);
25812d1e697eSMoses Reuben 		MLX5_SET(fte_match_set_misc,
25822d1e697eSMoses Reuben 			 misc_v, outer_ipv6_flow_label, val);
25832d1e697eSMoses Reuben 	}
25842d1e697eSMoses Reuben }
25852d1e697eSMoses Reuben 
2586ca0d4753SMaor Gottlieb static void set_tos(void *outer_c, void *outer_v, u8 mask, u8 val)
2587ca0d4753SMaor Gottlieb {
2588ca0d4753SMaor Gottlieb 	MLX5_SET(fte_match_set_lyr_2_4, outer_c, ip_ecn, mask);
2589ca0d4753SMaor Gottlieb 	MLX5_SET(fte_match_set_lyr_2_4, outer_v, ip_ecn, val);
2590ca0d4753SMaor Gottlieb 	MLX5_SET(fte_match_set_lyr_2_4, outer_c, ip_dscp, mask >> 2);
2591ca0d4753SMaor Gottlieb 	MLX5_SET(fte_match_set_lyr_2_4, outer_v, ip_dscp, val >> 2);
2592ca0d4753SMaor Gottlieb }
2593ca0d4753SMaor Gottlieb 
259471c6e863SAriel Levkovich static int check_mpls_supp_fields(u32 field_support, const __be32 *set_mask)
259571c6e863SAriel Levkovich {
259671c6e863SAriel Levkovich 	if (MLX5_GET(fte_match_mpls, set_mask, mpls_label) &&
259771c6e863SAriel Levkovich 	    !(field_support & MLX5_FIELD_SUPPORT_MPLS_LABEL))
259871c6e863SAriel Levkovich 		return -EOPNOTSUPP;
259971c6e863SAriel Levkovich 
260071c6e863SAriel Levkovich 	if (MLX5_GET(fte_match_mpls, set_mask, mpls_exp) &&
260171c6e863SAriel Levkovich 	    !(field_support & MLX5_FIELD_SUPPORT_MPLS_EXP))
260271c6e863SAriel Levkovich 		return -EOPNOTSUPP;
260371c6e863SAriel Levkovich 
260471c6e863SAriel Levkovich 	if (MLX5_GET(fte_match_mpls, set_mask, mpls_s_bos) &&
260571c6e863SAriel Levkovich 	    !(field_support & MLX5_FIELD_SUPPORT_MPLS_S_BOS))
260671c6e863SAriel Levkovich 		return -EOPNOTSUPP;
260771c6e863SAriel Levkovich 
260871c6e863SAriel Levkovich 	if (MLX5_GET(fte_match_mpls, set_mask, mpls_ttl) &&
260971c6e863SAriel Levkovich 	    !(field_support & MLX5_FIELD_SUPPORT_MPLS_TTL))
261071c6e863SAriel Levkovich 		return -EOPNOTSUPP;
261171c6e863SAriel Levkovich 
261271c6e863SAriel Levkovich 	return 0;
261371c6e863SAriel Levkovich }
261471c6e863SAriel Levkovich 
/*
 * Name of the last member of each flow spec filter that is handled here.
 * These are meant to be passed as the @field argument of
 * FIELDS_NOT_SUPPORTED().
 */
#define LAST_ETH_FIELD vlan_tag
#define LAST_IB_FIELD sl
#define LAST_IPV4_FIELD tos
#define LAST_IPV6_FIELD traffic_class
#define LAST_TCP_UDP_FIELD src_port
#define LAST_TUNNEL_FIELD tunnel_id
#define LAST_FLOW_TAG_FIELD tag_id
#define LAST_DROP_FIELD size
#define LAST_COUNTERS_FIELD counters

/*
 * Field is the last supported field.
 *
 * Scans the bytes of @filter that follow member @field and evaluates to
 * non-NULL when any of them is non-zero, i.e. when the caller set something
 * beyond the last supported member.  @filter is parenthesized before member
 * access so that any lvalue expression can be passed.
 */
#define FIELDS_NOT_SUPPORTED(filter, field)\
	memchr_inv((void *)&(filter).field  +\
		   sizeof((filter).field), 0,\
		   sizeof(filter) -\
		   offsetof(typeof(filter), field) -\
		   sizeof((filter).field))
2632c47ac6aeSMaor Gottlieb 
26332ea26203SMark Bloch int parse_flow_flow_action(struct mlx5_ib_flow_action *maction,
26342ea26203SMark Bloch 			   bool is_egress,
2635802c2125SAviad Yehezkel 			   struct mlx5_flow_act *action)
2636802c2125SAviad Yehezkel {
2637802c2125SAviad Yehezkel 
2638802c2125SAviad Yehezkel 	switch (maction->ib_action.type) {
2639802c2125SAviad Yehezkel 	case IB_FLOW_ACTION_ESP:
2640501f14e3SMark Bloch 		if (action->action & (MLX5_FLOW_CONTEXT_ACTION_ENCRYPT |
2641501f14e3SMark Bloch 				      MLX5_FLOW_CONTEXT_ACTION_DECRYPT))
2642501f14e3SMark Bloch 			return -EINVAL;
2643802c2125SAviad Yehezkel 		/* Currently only AES_GCM keymat is supported by the driver */
2644802c2125SAviad Yehezkel 		action->esp_id = (uintptr_t)maction->esp_aes_gcm.ctx;
26452ea26203SMark Bloch 		action->action |= is_egress ?
2646802c2125SAviad Yehezkel 			MLX5_FLOW_CONTEXT_ACTION_ENCRYPT :
2647802c2125SAviad Yehezkel 			MLX5_FLOW_CONTEXT_ACTION_DECRYPT;
2648802c2125SAviad Yehezkel 		return 0;
2649b1085be3SMark Bloch 	case IB_FLOW_ACTION_UNSPECIFIED:
2650b1085be3SMark Bloch 		if (maction->flow_action_raw.sub_type ==
2651b1085be3SMark Bloch 		    MLX5_IB_FLOW_ACTION_MODIFY_HEADER) {
2652501f14e3SMark Bloch 			if (action->action & MLX5_FLOW_CONTEXT_ACTION_MOD_HDR)
2653501f14e3SMark Bloch 				return -EINVAL;
2654b1085be3SMark Bloch 			action->action |= MLX5_FLOW_CONTEXT_ACTION_MOD_HDR;
26552b688ea5SMaor Gottlieb 			action->modify_hdr =
26562b688ea5SMaor Gottlieb 				maction->flow_action_raw.modify_hdr;
2657b1085be3SMark Bloch 			return 0;
2658b1085be3SMark Bloch 		}
265910a30896SMark Bloch 		if (maction->flow_action_raw.sub_type ==
266010a30896SMark Bloch 		    MLX5_IB_FLOW_ACTION_DECAP) {
2661501f14e3SMark Bloch 			if (action->action & MLX5_FLOW_CONTEXT_ACTION_DECAP)
2662501f14e3SMark Bloch 				return -EINVAL;
266310a30896SMark Bloch 			action->action |= MLX5_FLOW_CONTEXT_ACTION_DECAP;
266410a30896SMark Bloch 			return 0;
266510a30896SMark Bloch 		}
2666e806f932SMark Bloch 		if (maction->flow_action_raw.sub_type ==
2667e806f932SMark Bloch 		    MLX5_IB_FLOW_ACTION_PACKET_REFORMAT) {
2668501f14e3SMark Bloch 			if (action->action &
2669501f14e3SMark Bloch 			    MLX5_FLOW_CONTEXT_ACTION_PACKET_REFORMAT)
2670501f14e3SMark Bloch 				return -EINVAL;
2671e806f932SMark Bloch 			action->action |=
2672e806f932SMark Bloch 				MLX5_FLOW_CONTEXT_ACTION_PACKET_REFORMAT;
26732b688ea5SMaor Gottlieb 			action->pkt_reformat =
26742b688ea5SMaor Gottlieb 				maction->flow_action_raw.pkt_reformat;
2675e806f932SMark Bloch 			return 0;
2676e806f932SMark Bloch 		}
2677b1085be3SMark Bloch 		/* fall through */
2678802c2125SAviad Yehezkel 	default:
2679802c2125SAviad Yehezkel 		return -EOPNOTSUPP;
2680802c2125SAviad Yehezkel 	}
2681802c2125SAviad Yehezkel }
2682802c2125SAviad Yehezkel 
2683bb0ee7dcSJianbo Liu static int parse_flow_attr(struct mlx5_core_dev *mdev,
2684bb0ee7dcSJianbo Liu 			   struct mlx5_flow_spec *spec,
2685bb0ee7dcSJianbo Liu 			   const union ib_flow_spec *ib_spec,
2686802c2125SAviad Yehezkel 			   const struct ib_flow_attr *flow_attr,
268771c6e863SAriel Levkovich 			   struct mlx5_flow_act *action, u32 prev_type)
2688038d2ef8SMaor Gottlieb {
2689bb0ee7dcSJianbo Liu 	struct mlx5_flow_context *flow_context = &spec->flow_context;
2690bb0ee7dcSJianbo Liu 	u32 *match_c = spec->match_criteria;
2691bb0ee7dcSJianbo Liu 	u32 *match_v = spec->match_value;
2692466fa6d2SMaor Gottlieb 	void *misc_params_c = MLX5_ADDR_OF(fte_match_param, match_c,
2693466fa6d2SMaor Gottlieb 					   misc_parameters);
2694466fa6d2SMaor Gottlieb 	void *misc_params_v = MLX5_ADDR_OF(fte_match_param, match_v,
2695466fa6d2SMaor Gottlieb 					   misc_parameters);
269671c6e863SAriel Levkovich 	void *misc_params2_c = MLX5_ADDR_OF(fte_match_param, match_c,
269771c6e863SAriel Levkovich 					    misc_parameters_2);
269871c6e863SAriel Levkovich 	void *misc_params2_v = MLX5_ADDR_OF(fte_match_param, match_v,
269971c6e863SAriel Levkovich 					    misc_parameters_2);
27002d1e697eSMoses Reuben 	void *headers_c;
27012d1e697eSMoses Reuben 	void *headers_v;
270219cc7524SAriel Levkovich 	int match_ipv;
2703802c2125SAviad Yehezkel 	int ret;
2704466fa6d2SMaor Gottlieb 
27052d1e697eSMoses Reuben 	if (ib_spec->type & IB_FLOW_SPEC_INNER) {
27062d1e697eSMoses Reuben 		headers_c = MLX5_ADDR_OF(fte_match_param, match_c,
27072d1e697eSMoses Reuben 					 inner_headers);
27082d1e697eSMoses Reuben 		headers_v = MLX5_ADDR_OF(fte_match_param, match_v,
27092d1e697eSMoses Reuben 					 inner_headers);
271019cc7524SAriel Levkovich 		match_ipv = MLX5_CAP_FLOWTABLE_NIC_RX(mdev,
271119cc7524SAriel Levkovich 					ft_field_support.inner_ip_version);
27122d1e697eSMoses Reuben 	} else {
27132d1e697eSMoses Reuben 		headers_c = MLX5_ADDR_OF(fte_match_param, match_c,
27142d1e697eSMoses Reuben 					 outer_headers);
27152d1e697eSMoses Reuben 		headers_v = MLX5_ADDR_OF(fte_match_param, match_v,
27162d1e697eSMoses Reuben 					 outer_headers);
271719cc7524SAriel Levkovich 		match_ipv = MLX5_CAP_FLOWTABLE_NIC_RX(mdev,
271819cc7524SAriel Levkovich 					ft_field_support.outer_ip_version);
27192d1e697eSMoses Reuben 	}
27202d1e697eSMoses Reuben 
27212d1e697eSMoses Reuben 	switch (ib_spec->type & ~IB_FLOW_SPEC_INNER) {
2722038d2ef8SMaor Gottlieb 	case IB_FLOW_SPEC_ETH:
2723c47ac6aeSMaor Gottlieb 		if (FIELDS_NOT_SUPPORTED(ib_spec->eth.mask, LAST_ETH_FIELD))
27241ffd3a26SLeon Romanovsky 			return -EOPNOTSUPP;
2725038d2ef8SMaor Gottlieb 
27262d1e697eSMoses Reuben 		ether_addr_copy(MLX5_ADDR_OF(fte_match_set_lyr_2_4, headers_c,
2727038d2ef8SMaor Gottlieb 					     dmac_47_16),
2728038d2ef8SMaor Gottlieb 				ib_spec->eth.mask.dst_mac);
27292d1e697eSMoses Reuben 		ether_addr_copy(MLX5_ADDR_OF(fte_match_set_lyr_2_4, headers_v,
2730038d2ef8SMaor Gottlieb 					     dmac_47_16),
2731038d2ef8SMaor Gottlieb 				ib_spec->eth.val.dst_mac);
2732038d2ef8SMaor Gottlieb 
27332d1e697eSMoses Reuben 		ether_addr_copy(MLX5_ADDR_OF(fte_match_set_lyr_2_4, headers_c,
2734ee3da804SMaor Gottlieb 					     smac_47_16),
2735ee3da804SMaor Gottlieb 				ib_spec->eth.mask.src_mac);
27362d1e697eSMoses Reuben 		ether_addr_copy(MLX5_ADDR_OF(fte_match_set_lyr_2_4, headers_v,
2737ee3da804SMaor Gottlieb 					     smac_47_16),
2738ee3da804SMaor Gottlieb 				ib_spec->eth.val.src_mac);
2739ee3da804SMaor Gottlieb 
2740038d2ef8SMaor Gottlieb 		if (ib_spec->eth.mask.vlan_tag) {
27412d1e697eSMoses Reuben 			MLX5_SET(fte_match_set_lyr_2_4, headers_c,
274210543365SMohamad Haj Yahia 				 cvlan_tag, 1);
27432d1e697eSMoses Reuben 			MLX5_SET(fte_match_set_lyr_2_4, headers_v,
274410543365SMohamad Haj Yahia 				 cvlan_tag, 1);
2745038d2ef8SMaor Gottlieb 
27462d1e697eSMoses Reuben 			MLX5_SET(fte_match_set_lyr_2_4, headers_c,
2747038d2ef8SMaor Gottlieb 				 first_vid, ntohs(ib_spec->eth.mask.vlan_tag));
27482d1e697eSMoses Reuben 			MLX5_SET(fte_match_set_lyr_2_4, headers_v,
2749038d2ef8SMaor Gottlieb 				 first_vid, ntohs(ib_spec->eth.val.vlan_tag));
2750038d2ef8SMaor Gottlieb 
27512d1e697eSMoses Reuben 			MLX5_SET(fte_match_set_lyr_2_4, headers_c,
2752038d2ef8SMaor Gottlieb 				 first_cfi,
2753038d2ef8SMaor Gottlieb 				 ntohs(ib_spec->eth.mask.vlan_tag) >> 12);
27542d1e697eSMoses Reuben 			MLX5_SET(fte_match_set_lyr_2_4, headers_v,
2755038d2ef8SMaor Gottlieb 				 first_cfi,
2756038d2ef8SMaor Gottlieb 				 ntohs(ib_spec->eth.val.vlan_tag) >> 12);
2757038d2ef8SMaor Gottlieb 
27582d1e697eSMoses Reuben 			MLX5_SET(fte_match_set_lyr_2_4, headers_c,
2759038d2ef8SMaor Gottlieb 				 first_prio,
2760038d2ef8SMaor Gottlieb 				 ntohs(ib_spec->eth.mask.vlan_tag) >> 13);
27612d1e697eSMoses Reuben 			MLX5_SET(fte_match_set_lyr_2_4, headers_v,
2762038d2ef8SMaor Gottlieb 				 first_prio,
2763038d2ef8SMaor Gottlieb 				 ntohs(ib_spec->eth.val.vlan_tag) >> 13);
2764038d2ef8SMaor Gottlieb 		}
27652d1e697eSMoses Reuben 		MLX5_SET(fte_match_set_lyr_2_4, headers_c,
2766038d2ef8SMaor Gottlieb 			 ethertype, ntohs(ib_spec->eth.mask.ether_type));
27672d1e697eSMoses Reuben 		MLX5_SET(fte_match_set_lyr_2_4, headers_v,
2768038d2ef8SMaor Gottlieb 			 ethertype, ntohs(ib_spec->eth.val.ether_type));
2769038d2ef8SMaor Gottlieb 		break;
2770038d2ef8SMaor Gottlieb 	case IB_FLOW_SPEC_IPV4:
2771c47ac6aeSMaor Gottlieb 		if (FIELDS_NOT_SUPPORTED(ib_spec->ipv4.mask, LAST_IPV4_FIELD))
27721ffd3a26SLeon Romanovsky 			return -EOPNOTSUPP;
2773038d2ef8SMaor Gottlieb 
277419cc7524SAriel Levkovich 		if (match_ipv) {
277519cc7524SAriel Levkovich 			MLX5_SET(fte_match_set_lyr_2_4, headers_c,
277619cc7524SAriel Levkovich 				 ip_version, 0xf);
277719cc7524SAriel Levkovich 			MLX5_SET(fte_match_set_lyr_2_4, headers_v,
27783346c487SBoris Pismenny 				 ip_version, MLX5_FS_IPV4_VERSION);
277919cc7524SAriel Levkovich 		} else {
27802d1e697eSMoses Reuben 			MLX5_SET(fte_match_set_lyr_2_4, headers_c,
2781038d2ef8SMaor Gottlieb 				 ethertype, 0xffff);
27822d1e697eSMoses Reuben 			MLX5_SET(fte_match_set_lyr_2_4, headers_v,
2783038d2ef8SMaor Gottlieb 				 ethertype, ETH_P_IP);
278419cc7524SAriel Levkovich 		}
2785038d2ef8SMaor Gottlieb 
27862d1e697eSMoses Reuben 		memcpy(MLX5_ADDR_OF(fte_match_set_lyr_2_4, headers_c,
2787038d2ef8SMaor Gottlieb 				    src_ipv4_src_ipv6.ipv4_layout.ipv4),
2788038d2ef8SMaor Gottlieb 		       &ib_spec->ipv4.mask.src_ip,
2789038d2ef8SMaor Gottlieb 		       sizeof(ib_spec->ipv4.mask.src_ip));
27902d1e697eSMoses Reuben 		memcpy(MLX5_ADDR_OF(fte_match_set_lyr_2_4, headers_v,
2791038d2ef8SMaor Gottlieb 				    src_ipv4_src_ipv6.ipv4_layout.ipv4),
2792038d2ef8SMaor Gottlieb 		       &ib_spec->ipv4.val.src_ip,
2793038d2ef8SMaor Gottlieb 		       sizeof(ib_spec->ipv4.val.src_ip));
27942d1e697eSMoses Reuben 		memcpy(MLX5_ADDR_OF(fte_match_set_lyr_2_4, headers_c,
2795038d2ef8SMaor Gottlieb 				    dst_ipv4_dst_ipv6.ipv4_layout.ipv4),
2796038d2ef8SMaor Gottlieb 		       &ib_spec->ipv4.mask.dst_ip,
2797038d2ef8SMaor Gottlieb 		       sizeof(ib_spec->ipv4.mask.dst_ip));
27982d1e697eSMoses Reuben 		memcpy(MLX5_ADDR_OF(fte_match_set_lyr_2_4, headers_v,
2799038d2ef8SMaor Gottlieb 				    dst_ipv4_dst_ipv6.ipv4_layout.ipv4),
2800038d2ef8SMaor Gottlieb 		       &ib_spec->ipv4.val.dst_ip,
2801038d2ef8SMaor Gottlieb 		       sizeof(ib_spec->ipv4.val.dst_ip));
2802ca0d4753SMaor Gottlieb 
28032d1e697eSMoses Reuben 		set_tos(headers_c, headers_v,
2804ca0d4753SMaor Gottlieb 			ib_spec->ipv4.mask.tos, ib_spec->ipv4.val.tos);
2805ca0d4753SMaor Gottlieb 
28066113cc44SMaor Gottlieb 		if (set_proto(headers_c, headers_v,
28076113cc44SMaor Gottlieb 			      ib_spec->ipv4.mask.proto,
28086113cc44SMaor Gottlieb 			      ib_spec->ipv4.val.proto))
28096113cc44SMaor Gottlieb 			return -EINVAL;
2810038d2ef8SMaor Gottlieb 		break;
2811026bae0cSMaor Gottlieb 	case IB_FLOW_SPEC_IPV6:
2812c47ac6aeSMaor Gottlieb 		if (FIELDS_NOT_SUPPORTED(ib_spec->ipv6.mask, LAST_IPV6_FIELD))
28131ffd3a26SLeon Romanovsky 			return -EOPNOTSUPP;
2814026bae0cSMaor Gottlieb 
281519cc7524SAriel Levkovich 		if (match_ipv) {
281619cc7524SAriel Levkovich 			MLX5_SET(fte_match_set_lyr_2_4, headers_c,
281719cc7524SAriel Levkovich 				 ip_version, 0xf);
281819cc7524SAriel Levkovich 			MLX5_SET(fte_match_set_lyr_2_4, headers_v,
28193346c487SBoris Pismenny 				 ip_version, MLX5_FS_IPV6_VERSION);
282019cc7524SAriel Levkovich 		} else {
28212d1e697eSMoses Reuben 			MLX5_SET(fte_match_set_lyr_2_4, headers_c,
2822026bae0cSMaor Gottlieb 				 ethertype, 0xffff);
28232d1e697eSMoses Reuben 			MLX5_SET(fte_match_set_lyr_2_4, headers_v,
2824026bae0cSMaor Gottlieb 				 ethertype, ETH_P_IPV6);
282519cc7524SAriel Levkovich 		}
2826026bae0cSMaor Gottlieb 
28272d1e697eSMoses Reuben 		memcpy(MLX5_ADDR_OF(fte_match_set_lyr_2_4, headers_c,
2828026bae0cSMaor Gottlieb 				    src_ipv4_src_ipv6.ipv6_layout.ipv6),
2829026bae0cSMaor Gottlieb 		       &ib_spec->ipv6.mask.src_ip,
2830026bae0cSMaor Gottlieb 		       sizeof(ib_spec->ipv6.mask.src_ip));
28312d1e697eSMoses Reuben 		memcpy(MLX5_ADDR_OF(fte_match_set_lyr_2_4, headers_v,
2832026bae0cSMaor Gottlieb 				    src_ipv4_src_ipv6.ipv6_layout.ipv6),
2833026bae0cSMaor Gottlieb 		       &ib_spec->ipv6.val.src_ip,
2834026bae0cSMaor Gottlieb 		       sizeof(ib_spec->ipv6.val.src_ip));
28352d1e697eSMoses Reuben 		memcpy(MLX5_ADDR_OF(fte_match_set_lyr_2_4, headers_c,
2836026bae0cSMaor Gottlieb 				    dst_ipv4_dst_ipv6.ipv6_layout.ipv6),
2837026bae0cSMaor Gottlieb 		       &ib_spec->ipv6.mask.dst_ip,
2838026bae0cSMaor Gottlieb 		       sizeof(ib_spec->ipv6.mask.dst_ip));
28392d1e697eSMoses Reuben 		memcpy(MLX5_ADDR_OF(fte_match_set_lyr_2_4, headers_v,
2840026bae0cSMaor Gottlieb 				    dst_ipv4_dst_ipv6.ipv6_layout.ipv6),
2841026bae0cSMaor Gottlieb 		       &ib_spec->ipv6.val.dst_ip,
2842026bae0cSMaor Gottlieb 		       sizeof(ib_spec->ipv6.val.dst_ip));
2843466fa6d2SMaor Gottlieb 
28442d1e697eSMoses Reuben 		set_tos(headers_c, headers_v,
2845466fa6d2SMaor Gottlieb 			ib_spec->ipv6.mask.traffic_class,
2846466fa6d2SMaor Gottlieb 			ib_spec->ipv6.val.traffic_class);
2847466fa6d2SMaor Gottlieb 
28486113cc44SMaor Gottlieb 		if (set_proto(headers_c, headers_v,
2849466fa6d2SMaor Gottlieb 			      ib_spec->ipv6.mask.next_hdr,
28506113cc44SMaor Gottlieb 			      ib_spec->ipv6.val.next_hdr))
28516113cc44SMaor Gottlieb 			return -EINVAL;
2852466fa6d2SMaor Gottlieb 
28532d1e697eSMoses Reuben 		set_flow_label(misc_params_c, misc_params_v,
28542d1e697eSMoses Reuben 			       ntohl(ib_spec->ipv6.mask.flow_label),
28552d1e697eSMoses Reuben 			       ntohl(ib_spec->ipv6.val.flow_label),
28562d1e697eSMoses Reuben 			       ib_spec->type & IB_FLOW_SPEC_INNER);
2857802c2125SAviad Yehezkel 		break;
2858802c2125SAviad Yehezkel 	case IB_FLOW_SPEC_ESP:
2859802c2125SAviad Yehezkel 		if (ib_spec->esp.mask.seq)
2860802c2125SAviad Yehezkel 			return -EOPNOTSUPP;
28612d1e697eSMoses Reuben 
2862802c2125SAviad Yehezkel 		MLX5_SET(fte_match_set_misc, misc_params_c, outer_esp_spi,
2863802c2125SAviad Yehezkel 			 ntohl(ib_spec->esp.mask.spi));
2864802c2125SAviad Yehezkel 		MLX5_SET(fte_match_set_misc, misc_params_v, outer_esp_spi,
2865802c2125SAviad Yehezkel 			 ntohl(ib_spec->esp.val.spi));
2866026bae0cSMaor Gottlieb 		break;
2867038d2ef8SMaor Gottlieb 	case IB_FLOW_SPEC_TCP:
2868c47ac6aeSMaor Gottlieb 		if (FIELDS_NOT_SUPPORTED(ib_spec->tcp_udp.mask,
2869c47ac6aeSMaor Gottlieb 					 LAST_TCP_UDP_FIELD))
28701ffd3a26SLeon Romanovsky 			return -EOPNOTSUPP;
2871038d2ef8SMaor Gottlieb 
28726113cc44SMaor Gottlieb 		if (set_proto(headers_c, headers_v, 0xff, IPPROTO_TCP))
28736113cc44SMaor Gottlieb 			return -EINVAL;
2874038d2ef8SMaor Gottlieb 
28752d1e697eSMoses Reuben 		MLX5_SET(fte_match_set_lyr_2_4, headers_c, tcp_sport,
2876038d2ef8SMaor Gottlieb 			 ntohs(ib_spec->tcp_udp.mask.src_port));
28772d1e697eSMoses Reuben 		MLX5_SET(fte_match_set_lyr_2_4, headers_v, tcp_sport,
2878038d2ef8SMaor Gottlieb 			 ntohs(ib_spec->tcp_udp.val.src_port));
2879038d2ef8SMaor Gottlieb 
28802d1e697eSMoses Reuben 		MLX5_SET(fte_match_set_lyr_2_4, headers_c, tcp_dport,
2881038d2ef8SMaor Gottlieb 			 ntohs(ib_spec->tcp_udp.mask.dst_port));
28822d1e697eSMoses Reuben 		MLX5_SET(fte_match_set_lyr_2_4, headers_v, tcp_dport,
2883038d2ef8SMaor Gottlieb 			 ntohs(ib_spec->tcp_udp.val.dst_port));
2884038d2ef8SMaor Gottlieb 		break;
2885038d2ef8SMaor Gottlieb 	case IB_FLOW_SPEC_UDP:
2886c47ac6aeSMaor Gottlieb 		if (FIELDS_NOT_SUPPORTED(ib_spec->tcp_udp.mask,
2887c47ac6aeSMaor Gottlieb 					 LAST_TCP_UDP_FIELD))
28881ffd3a26SLeon Romanovsky 			return -EOPNOTSUPP;
2889038d2ef8SMaor Gottlieb 
28906113cc44SMaor Gottlieb 		if (set_proto(headers_c, headers_v, 0xff, IPPROTO_UDP))
28916113cc44SMaor Gottlieb 			return -EINVAL;
2892038d2ef8SMaor Gottlieb 
28932d1e697eSMoses Reuben 		MLX5_SET(fte_match_set_lyr_2_4, headers_c, udp_sport,
2894038d2ef8SMaor Gottlieb 			 ntohs(ib_spec->tcp_udp.mask.src_port));
28952d1e697eSMoses Reuben 		MLX5_SET(fte_match_set_lyr_2_4, headers_v, udp_sport,
2896038d2ef8SMaor Gottlieb 			 ntohs(ib_spec->tcp_udp.val.src_port));
2897038d2ef8SMaor Gottlieb 
28982d1e697eSMoses Reuben 		MLX5_SET(fte_match_set_lyr_2_4, headers_c, udp_dport,
2899038d2ef8SMaor Gottlieb 			 ntohs(ib_spec->tcp_udp.mask.dst_port));
29002d1e697eSMoses Reuben 		MLX5_SET(fte_match_set_lyr_2_4, headers_v, udp_dport,
2901038d2ef8SMaor Gottlieb 			 ntohs(ib_spec->tcp_udp.val.dst_port));
2902038d2ef8SMaor Gottlieb 		break;
2903da2f22aeSAriel Levkovich 	case IB_FLOW_SPEC_GRE:
2904da2f22aeSAriel Levkovich 		if (ib_spec->gre.mask.c_ks_res0_ver)
2905da2f22aeSAriel Levkovich 			return -EOPNOTSUPP;
2906da2f22aeSAriel Levkovich 
29076113cc44SMaor Gottlieb 		if (set_proto(headers_c, headers_v, 0xff, IPPROTO_GRE))
29086113cc44SMaor Gottlieb 			return -EINVAL;
29096113cc44SMaor Gottlieb 
2910da2f22aeSAriel Levkovich 		MLX5_SET(fte_match_set_lyr_2_4, headers_c, ip_protocol,
2911da2f22aeSAriel Levkovich 			 0xff);
2912da2f22aeSAriel Levkovich 		MLX5_SET(fte_match_set_lyr_2_4, headers_v, ip_protocol,
2913da2f22aeSAriel Levkovich 			 IPPROTO_GRE);
2914da2f22aeSAriel Levkovich 
2915da2f22aeSAriel Levkovich 		MLX5_SET(fte_match_set_misc, misc_params_c, gre_protocol,
2916a93b632cSMaor Gottlieb 			 ntohs(ib_spec->gre.mask.protocol));
2917da2f22aeSAriel Levkovich 		MLX5_SET(fte_match_set_misc, misc_params_v, gre_protocol,
2918da2f22aeSAriel Levkovich 			 ntohs(ib_spec->gre.val.protocol));
2919da2f22aeSAriel Levkovich 
2920da2f22aeSAriel Levkovich 		memcpy(MLX5_ADDR_OF(fte_match_set_misc, misc_params_c,
29215886a96aSOz Shlomo 				    gre_key.nvgre.hi),
2922da2f22aeSAriel Levkovich 		       &ib_spec->gre.mask.key,
2923da2f22aeSAriel Levkovich 		       sizeof(ib_spec->gre.mask.key));
2924da2f22aeSAriel Levkovich 		memcpy(MLX5_ADDR_OF(fte_match_set_misc, misc_params_v,
29255886a96aSOz Shlomo 				    gre_key.nvgre.hi),
2926da2f22aeSAriel Levkovich 		       &ib_spec->gre.val.key,
2927da2f22aeSAriel Levkovich 		       sizeof(ib_spec->gre.val.key));
2928da2f22aeSAriel Levkovich 		break;
292971c6e863SAriel Levkovich 	case IB_FLOW_SPEC_MPLS:
293071c6e863SAriel Levkovich 		switch (prev_type) {
293171c6e863SAriel Levkovich 		case IB_FLOW_SPEC_UDP:
293271c6e863SAriel Levkovich 			if (check_mpls_supp_fields(MLX5_CAP_FLOWTABLE_NIC_RX(mdev,
293371c6e863SAriel Levkovich 						   ft_field_support.outer_first_mpls_over_udp),
293471c6e863SAriel Levkovich 						   &ib_spec->mpls.mask.tag))
293571c6e863SAriel Levkovich 				return -EOPNOTSUPP;
293671c6e863SAriel Levkovich 
293771c6e863SAriel Levkovich 			memcpy(MLX5_ADDR_OF(fte_match_set_misc2, misc_params2_v,
293871c6e863SAriel Levkovich 					    outer_first_mpls_over_udp),
293971c6e863SAriel Levkovich 			       &ib_spec->mpls.val.tag,
294071c6e863SAriel Levkovich 			       sizeof(ib_spec->mpls.val.tag));
294171c6e863SAriel Levkovich 			memcpy(MLX5_ADDR_OF(fte_match_set_misc2, misc_params2_c,
294271c6e863SAriel Levkovich 					    outer_first_mpls_over_udp),
294371c6e863SAriel Levkovich 			       &ib_spec->mpls.mask.tag,
294471c6e863SAriel Levkovich 			       sizeof(ib_spec->mpls.mask.tag));
294571c6e863SAriel Levkovich 			break;
294671c6e863SAriel Levkovich 		case IB_FLOW_SPEC_GRE:
294771c6e863SAriel Levkovich 			if (check_mpls_supp_fields(MLX5_CAP_FLOWTABLE_NIC_RX(mdev,
294871c6e863SAriel Levkovich 						   ft_field_support.outer_first_mpls_over_gre),
294971c6e863SAriel Levkovich 						   &ib_spec->mpls.mask.tag))
295071c6e863SAriel Levkovich 				return -EOPNOTSUPP;
295171c6e863SAriel Levkovich 
295271c6e863SAriel Levkovich 			memcpy(MLX5_ADDR_OF(fte_match_set_misc2, misc_params2_v,
295371c6e863SAriel Levkovich 					    outer_first_mpls_over_gre),
295471c6e863SAriel Levkovich 			       &ib_spec->mpls.val.tag,
295571c6e863SAriel Levkovich 			       sizeof(ib_spec->mpls.val.tag));
295671c6e863SAriel Levkovich 			memcpy(MLX5_ADDR_OF(fte_match_set_misc2, misc_params2_c,
295771c6e863SAriel Levkovich 					    outer_first_mpls_over_gre),
295871c6e863SAriel Levkovich 			       &ib_spec->mpls.mask.tag,
295971c6e863SAriel Levkovich 			       sizeof(ib_spec->mpls.mask.tag));
296071c6e863SAriel Levkovich 			break;
296171c6e863SAriel Levkovich 		default:
296271c6e863SAriel Levkovich 			if (ib_spec->type & IB_FLOW_SPEC_INNER) {
296371c6e863SAriel Levkovich 				if (check_mpls_supp_fields(MLX5_CAP_FLOWTABLE_NIC_RX(mdev,
296471c6e863SAriel Levkovich 							   ft_field_support.inner_first_mpls),
296571c6e863SAriel Levkovich 							   &ib_spec->mpls.mask.tag))
296671c6e863SAriel Levkovich 					return -EOPNOTSUPP;
296771c6e863SAriel Levkovich 
296871c6e863SAriel Levkovich 				memcpy(MLX5_ADDR_OF(fte_match_set_misc2, misc_params2_v,
296971c6e863SAriel Levkovich 						    inner_first_mpls),
297071c6e863SAriel Levkovich 				       &ib_spec->mpls.val.tag,
297171c6e863SAriel Levkovich 				       sizeof(ib_spec->mpls.val.tag));
297271c6e863SAriel Levkovich 				memcpy(MLX5_ADDR_OF(fte_match_set_misc2, misc_params2_c,
297371c6e863SAriel Levkovich 						    inner_first_mpls),
297471c6e863SAriel Levkovich 				       &ib_spec->mpls.mask.tag,
297571c6e863SAriel Levkovich 				       sizeof(ib_spec->mpls.mask.tag));
297671c6e863SAriel Levkovich 			} else {
297771c6e863SAriel Levkovich 				if (check_mpls_supp_fields(MLX5_CAP_FLOWTABLE_NIC_RX(mdev,
297871c6e863SAriel Levkovich 							   ft_field_support.outer_first_mpls),
297971c6e863SAriel Levkovich 							   &ib_spec->mpls.mask.tag))
298071c6e863SAriel Levkovich 					return -EOPNOTSUPP;
298171c6e863SAriel Levkovich 
298271c6e863SAriel Levkovich 				memcpy(MLX5_ADDR_OF(fte_match_set_misc2, misc_params2_v,
298371c6e863SAriel Levkovich 						    outer_first_mpls),
298471c6e863SAriel Levkovich 				       &ib_spec->mpls.val.tag,
298571c6e863SAriel Levkovich 				       sizeof(ib_spec->mpls.val.tag));
298671c6e863SAriel Levkovich 				memcpy(MLX5_ADDR_OF(fte_match_set_misc2, misc_params2_c,
298771c6e863SAriel Levkovich 						    outer_first_mpls),
298871c6e863SAriel Levkovich 				       &ib_spec->mpls.mask.tag,
298971c6e863SAriel Levkovich 				       sizeof(ib_spec->mpls.mask.tag));
299071c6e863SAriel Levkovich 			}
299171c6e863SAriel Levkovich 		}
299271c6e863SAriel Levkovich 		break;
2993ffb30d8fSMoses Reuben 	case IB_FLOW_SPEC_VXLAN_TUNNEL:
2994ffb30d8fSMoses Reuben 		if (FIELDS_NOT_SUPPORTED(ib_spec->tunnel.mask,
2995ffb30d8fSMoses Reuben 					 LAST_TUNNEL_FIELD))
29961ffd3a26SLeon Romanovsky 			return -EOPNOTSUPP;
2997ffb30d8fSMoses Reuben 
2998ffb30d8fSMoses Reuben 		MLX5_SET(fte_match_set_misc, misc_params_c, vxlan_vni,
2999ffb30d8fSMoses Reuben 			 ntohl(ib_spec->tunnel.mask.tunnel_id));
3000ffb30d8fSMoses Reuben 		MLX5_SET(fte_match_set_misc, misc_params_v, vxlan_vni,
3001ffb30d8fSMoses Reuben 			 ntohl(ib_spec->tunnel.val.tunnel_id));
3002ffb30d8fSMoses Reuben 		break;
30032ac693f9SMoses Reuben 	case IB_FLOW_SPEC_ACTION_TAG:
30042ac693f9SMoses Reuben 		if (FIELDS_NOT_SUPPORTED(ib_spec->flow_tag,
30052ac693f9SMoses Reuben 					 LAST_FLOW_TAG_FIELD))
30062ac693f9SMoses Reuben 			return -EOPNOTSUPP;
30072ac693f9SMoses Reuben 		if (ib_spec->flow_tag.tag_id >= BIT(24))
30082ac693f9SMoses Reuben 			return -EINVAL;
30092ac693f9SMoses Reuben 
3010bb0ee7dcSJianbo Liu 		flow_context->flow_tag = ib_spec->flow_tag.tag_id;
3011bb0ee7dcSJianbo Liu 		flow_context->flags |= FLOW_CONTEXT_HAS_TAG;
30122ac693f9SMoses Reuben 		break;
3013a22ed86cSSlava Shwartsman 	case IB_FLOW_SPEC_ACTION_DROP:
3014a22ed86cSSlava Shwartsman 		if (FIELDS_NOT_SUPPORTED(ib_spec->drop,
3015a22ed86cSSlava Shwartsman 					 LAST_DROP_FIELD))
3016a22ed86cSSlava Shwartsman 			return -EOPNOTSUPP;
3017075572d4SBoris Pismenny 		action->action |= MLX5_FLOW_CONTEXT_ACTION_DROP;
3018a22ed86cSSlava Shwartsman 		break;
3019802c2125SAviad Yehezkel 	case IB_FLOW_SPEC_ACTION_HANDLE:
30202ea26203SMark Bloch 		ret = parse_flow_flow_action(to_mflow_act(ib_spec->action.act),
30212ea26203SMark Bloch 			flow_attr->flags & IB_FLOW_ATTR_FLAGS_EGRESS, action);
3022802c2125SAviad Yehezkel 		if (ret)
3023802c2125SAviad Yehezkel 			return ret;
3024802c2125SAviad Yehezkel 		break;
30253b3233fbSRaed Salem 	case IB_FLOW_SPEC_ACTION_COUNT:
30263b3233fbSRaed Salem 		if (FIELDS_NOT_SUPPORTED(ib_spec->flow_count,
30273b3233fbSRaed Salem 					 LAST_COUNTERS_FIELD))
30283b3233fbSRaed Salem 			return -EOPNOTSUPP;
30293b3233fbSRaed Salem 
30303b3233fbSRaed Salem 		/* for now support only one counters spec per flow */
30313b3233fbSRaed Salem 		if (action->action & MLX5_FLOW_CONTEXT_ACTION_COUNT)
30323b3233fbSRaed Salem 			return -EINVAL;
30333b3233fbSRaed Salem 
30343b3233fbSRaed Salem 		action->counters = ib_spec->flow_count.counters;
30353b3233fbSRaed Salem 		action->action |= MLX5_FLOW_CONTEXT_ACTION_COUNT;
30363b3233fbSRaed Salem 		break;
3037038d2ef8SMaor Gottlieb 	default:
3038038d2ef8SMaor Gottlieb 		return -EINVAL;
3039038d2ef8SMaor Gottlieb 	}
3040038d2ef8SMaor Gottlieb 
3041038d2ef8SMaor Gottlieb 	return 0;
3042038d2ef8SMaor Gottlieb }
3043038d2ef8SMaor Gottlieb 
3044038d2ef8SMaor Gottlieb /* If a flow could catch both multicast and unicast packets,
3045038d2ef8SMaor Gottlieb  * it won't fall into the multicast flow steering table and this rule
3046038d2ef8SMaor Gottlieb  * could steal other multicast packets.
3047038d2ef8SMaor Gottlieb  */
3048a550ddfcSYishai Hadas static bool flow_is_multicast_only(const struct ib_flow_attr *ib_attr)
3049038d2ef8SMaor Gottlieb {
305081e30880SYishai Hadas 	union ib_flow_spec *flow_spec;
3051038d2ef8SMaor Gottlieb 
3052038d2ef8SMaor Gottlieb 	if (ib_attr->type != IB_FLOW_ATTR_NORMAL ||
3053038d2ef8SMaor Gottlieb 	    ib_attr->num_of_specs < 1)
3054038d2ef8SMaor Gottlieb 		return false;
3055038d2ef8SMaor Gottlieb 
305681e30880SYishai Hadas 	flow_spec = (union ib_flow_spec *)(ib_attr + 1);
305781e30880SYishai Hadas 	if (flow_spec->type == IB_FLOW_SPEC_IPV4) {
305881e30880SYishai Hadas 		struct ib_flow_spec_ipv4 *ipv4_spec;
3059038d2ef8SMaor Gottlieb 
306081e30880SYishai Hadas 		ipv4_spec = (struct ib_flow_spec_ipv4 *)flow_spec;
306181e30880SYishai Hadas 		if (ipv4_is_multicast(ipv4_spec->val.dst_ip))
306281e30880SYishai Hadas 			return true;
306381e30880SYishai Hadas 
306481e30880SYishai Hadas 		return false;
306581e30880SYishai Hadas 	}
306681e30880SYishai Hadas 
306781e30880SYishai Hadas 	if (flow_spec->type == IB_FLOW_SPEC_ETH) {
306881e30880SYishai Hadas 		struct ib_flow_spec_eth *eth_spec;
306981e30880SYishai Hadas 
307081e30880SYishai Hadas 		eth_spec = (struct ib_flow_spec_eth *)flow_spec;
3071038d2ef8SMaor Gottlieb 		return is_multicast_ether_addr(eth_spec->mask.dst_mac) &&
3072038d2ef8SMaor Gottlieb 		       is_multicast_ether_addr(eth_spec->val.dst_mac);
3073038d2ef8SMaor Gottlieb 	}
3074038d2ef8SMaor Gottlieb 
307581e30880SYishai Hadas 	return false;
307681e30880SYishai Hadas }
307781e30880SYishai Hadas 
/* Three-way verdict produced by is_valid_esp_aes_gcm(). */
enum valid_spec {
	/* The spec/action combination is rejected. */
	VALID_SPEC_INVALID = 0,
	/* The spec/action combination is accepted. */
	VALID_SPEC_VALID = 1,
	/* The check does not apply to this flow. */
	VALID_SPEC_NA = 2,
};
3083802c2125SAviad Yehezkel 
3084802c2125SAviad Yehezkel static enum valid_spec
3085802c2125SAviad Yehezkel is_valid_esp_aes_gcm(struct mlx5_core_dev *mdev,
3086802c2125SAviad Yehezkel 		     const struct mlx5_flow_spec *spec,
3087802c2125SAviad Yehezkel 		     const struct mlx5_flow_act *flow_act,
3088802c2125SAviad Yehezkel 		     bool egress)
3089802c2125SAviad Yehezkel {
3090802c2125SAviad Yehezkel 	const u32 *match_c = spec->match_criteria;
3091802c2125SAviad Yehezkel 	bool is_crypto =
3092802c2125SAviad Yehezkel 		(flow_act->action & (MLX5_FLOW_CONTEXT_ACTION_ENCRYPT |
3093802c2125SAviad Yehezkel 				     MLX5_FLOW_CONTEXT_ACTION_DECRYPT));
3094802c2125SAviad Yehezkel 	bool is_ipsec = mlx5_fs_is_ipsec_flow(match_c);
3095802c2125SAviad Yehezkel 	bool is_drop = flow_act->action & MLX5_FLOW_CONTEXT_ACTION_DROP;
3096802c2125SAviad Yehezkel 
3097802c2125SAviad Yehezkel 	/*
3098802c2125SAviad Yehezkel 	 * Currently only crypto is supported in egress, when regular egress
3099802c2125SAviad Yehezkel 	 * rules would be supported, always return VALID_SPEC_NA.
3100802c2125SAviad Yehezkel 	 */
3101802c2125SAviad Yehezkel 	if (!is_crypto)
310278dd0c43SMark Bloch 		return VALID_SPEC_NA;
3103802c2125SAviad Yehezkel 
3104802c2125SAviad Yehezkel 	return is_crypto && is_ipsec &&
3105bb0ee7dcSJianbo Liu 		(!egress || (!is_drop &&
3106bb0ee7dcSJianbo Liu 			     !(spec->flow_context.flags & FLOW_CONTEXT_HAS_TAG))) ?
3107802c2125SAviad Yehezkel 		VALID_SPEC_VALID : VALID_SPEC_INVALID;
3108802c2125SAviad Yehezkel }
3109802c2125SAviad Yehezkel 
3110802c2125SAviad Yehezkel static bool is_valid_spec(struct mlx5_core_dev *mdev,
3111802c2125SAviad Yehezkel 			  const struct mlx5_flow_spec *spec,
3112802c2125SAviad Yehezkel 			  const struct mlx5_flow_act *flow_act,
3113802c2125SAviad Yehezkel 			  bool egress)
3114802c2125SAviad Yehezkel {
3115802c2125SAviad Yehezkel 	/* We curretly only support ipsec egress flow */
3116802c2125SAviad Yehezkel 	return is_valid_esp_aes_gcm(mdev, spec, flow_act, egress) != VALID_SPEC_INVALID;
3117802c2125SAviad Yehezkel }
3118802c2125SAviad Yehezkel 
311919cc7524SAriel Levkovich static bool is_valid_ethertype(struct mlx5_core_dev *mdev,
312019cc7524SAriel Levkovich 			       const struct ib_flow_attr *flow_attr,
31210f750966SAriel Levkovich 			       bool check_inner)
3122038d2ef8SMaor Gottlieb {
3123038d2ef8SMaor Gottlieb 	union ib_flow_spec *ib_spec = (union ib_flow_spec *)(flow_attr + 1);
312419cc7524SAriel Levkovich 	int match_ipv = check_inner ?
312519cc7524SAriel Levkovich 			MLX5_CAP_FLOWTABLE_NIC_RX(mdev,
312619cc7524SAriel Levkovich 					ft_field_support.inner_ip_version) :
312719cc7524SAriel Levkovich 			MLX5_CAP_FLOWTABLE_NIC_RX(mdev,
312819cc7524SAriel Levkovich 					ft_field_support.outer_ip_version);
31290f750966SAriel Levkovich 	int inner_bit = check_inner ? IB_FLOW_SPEC_INNER : 0;
31300f750966SAriel Levkovich 	bool ipv4_spec_valid, ipv6_spec_valid;
31310f750966SAriel Levkovich 	unsigned int ip_spec_type = 0;
31320f750966SAriel Levkovich 	bool has_ethertype = false;
3133038d2ef8SMaor Gottlieb 	unsigned int spec_index;
31340f750966SAriel Levkovich 	bool mask_valid = true;
31350f750966SAriel Levkovich 	u16 eth_type = 0;
31360f750966SAriel Levkovich 	bool type_valid;
3137038d2ef8SMaor Gottlieb 
3138038d2ef8SMaor Gottlieb 	/* Validate that ethertype is correct */
3139038d2ef8SMaor Gottlieb 	for (spec_index = 0; spec_index < flow_attr->num_of_specs; spec_index++) {
31400f750966SAriel Levkovich 		if ((ib_spec->type == (IB_FLOW_SPEC_ETH | inner_bit)) &&
3141038d2ef8SMaor Gottlieb 		    ib_spec->eth.mask.ether_type) {
31420f750966SAriel Levkovich 			mask_valid = (ib_spec->eth.mask.ether_type ==
31430f750966SAriel Levkovich 				      htons(0xffff));
31440f750966SAriel Levkovich 			has_ethertype = true;
31450f750966SAriel Levkovich 			eth_type = ntohs(ib_spec->eth.val.ether_type);
31460f750966SAriel Levkovich 		} else if ((ib_spec->type == (IB_FLOW_SPEC_IPV4 | inner_bit)) ||
31470f750966SAriel Levkovich 			   (ib_spec->type == (IB_FLOW_SPEC_IPV6 | inner_bit))) {
31480f750966SAriel Levkovich 			ip_spec_type = ib_spec->type;
3149038d2ef8SMaor Gottlieb 		}
3150038d2ef8SMaor Gottlieb 		ib_spec = (void *)ib_spec + ib_spec->size;
3151038d2ef8SMaor Gottlieb 	}
31520f750966SAriel Levkovich 
31530f750966SAriel Levkovich 	type_valid = (!has_ethertype) || (!ip_spec_type);
31540f750966SAriel Levkovich 	if (!type_valid && mask_valid) {
31550f750966SAriel Levkovich 		ipv4_spec_valid = (eth_type == ETH_P_IP) &&
31560f750966SAriel Levkovich 			(ip_spec_type == (IB_FLOW_SPEC_IPV4 | inner_bit));
31570f750966SAriel Levkovich 		ipv6_spec_valid = (eth_type == ETH_P_IPV6) &&
31580f750966SAriel Levkovich 			(ip_spec_type == (IB_FLOW_SPEC_IPV6 | inner_bit));
315919cc7524SAriel Levkovich 
316019cc7524SAriel Levkovich 		type_valid = (ipv4_spec_valid) || (ipv6_spec_valid) ||
316119cc7524SAriel Levkovich 			     (((eth_type == ETH_P_MPLS_UC) ||
316219cc7524SAriel Levkovich 			       (eth_type == ETH_P_MPLS_MC)) && match_ipv);
31630f750966SAriel Levkovich 	}
31640f750966SAriel Levkovich 
31650f750966SAriel Levkovich 	return type_valid;
31660f750966SAriel Levkovich }
31670f750966SAriel Levkovich 
/*
 * Validate a flow attribute: the ethertype/L3 consistency check must pass
 * for the outer headers and for the inner headers.  The inner check is not
 * run when the outer check already failed.
 */
static bool is_valid_attr(struct mlx5_core_dev *mdev,
			  const struct ib_flow_attr *flow_attr)
{
	if (!is_valid_ethertype(mdev, flow_attr, false))
		return false;

	return is_valid_ethertype(mdev, flow_attr, true);
}
3174038d2ef8SMaor Gottlieb 
3175038d2ef8SMaor Gottlieb static void put_flow_table(struct mlx5_ib_dev *dev,
3176038d2ef8SMaor Gottlieb 			   struct mlx5_ib_flow_prio *prio, bool ft_added)
3177038d2ef8SMaor Gottlieb {
3178038d2ef8SMaor Gottlieb 	prio->refcount -= !!ft_added;
3179038d2ef8SMaor Gottlieb 	if (!prio->refcount) {
3180038d2ef8SMaor Gottlieb 		mlx5_destroy_flow_table(prio->flow_table);
3181038d2ef8SMaor Gottlieb 		prio->flow_table = NULL;
3182038d2ef8SMaor Gottlieb 	}
3183038d2ef8SMaor Gottlieb }
3184038d2ef8SMaor Gottlieb 
31853b3233fbSRaed Salem static void counters_clear_description(struct ib_counters *counters)
31863b3233fbSRaed Salem {
31873b3233fbSRaed Salem 	struct mlx5_ib_mcounters *mcounters = to_mcounters(counters);
31883b3233fbSRaed Salem 
31893b3233fbSRaed Salem 	mutex_lock(&mcounters->mcntrs_mutex);
31903b3233fbSRaed Salem 	kfree(mcounters->counters_data);
31913b3233fbSRaed Salem 	mcounters->counters_data = NULL;
31923b3233fbSRaed Salem 	mcounters->cntrs_max_index = 0;
31933b3233fbSRaed Salem 	mutex_unlock(&mcounters->mcntrs_mutex);
31943b3233fbSRaed Salem }
31953b3233fbSRaed Salem 
3196038d2ef8SMaor Gottlieb static int mlx5_ib_destroy_flow(struct ib_flow *flow_id)
3197038d2ef8SMaor Gottlieb {
3198038d2ef8SMaor Gottlieb 	struct mlx5_ib_flow_handler *handler = container_of(flow_id,
3199038d2ef8SMaor Gottlieb 							  struct mlx5_ib_flow_handler,
3200038d2ef8SMaor Gottlieb 							  ibflow);
3201038d2ef8SMaor Gottlieb 	struct mlx5_ib_flow_handler *iter, *tmp;
3202d4be3f44SYishai Hadas 	struct mlx5_ib_dev *dev = handler->dev;
3203038d2ef8SMaor Gottlieb 
32049a4ca38dSMark Bloch 	mutex_lock(&dev->flow_db->lock);
3205038d2ef8SMaor Gottlieb 
3206038d2ef8SMaor Gottlieb 	list_for_each_entry_safe(iter, tmp, &handler->list, list) {
320774491de9SMark Bloch 		mlx5_del_flow_rules(iter->rule);
3208cc0e5d42SMaor Gottlieb 		put_flow_table(dev, iter->prio, true);
3209038d2ef8SMaor Gottlieb 		list_del(&iter->list);
3210038d2ef8SMaor Gottlieb 		kfree(iter);
3211038d2ef8SMaor Gottlieb 	}
3212038d2ef8SMaor Gottlieb 
321374491de9SMark Bloch 	mlx5_del_flow_rules(handler->rule);
32145497adc6SMaor Gottlieb 	put_flow_table(dev, handler->prio, true);
32153b3233fbSRaed Salem 	if (handler->ibcounters &&
32163b3233fbSRaed Salem 	    atomic_read(&handler->ibcounters->usecnt) == 1)
32173b3233fbSRaed Salem 		counters_clear_description(handler->ibcounters);
3218038d2ef8SMaor Gottlieb 
32193b3233fbSRaed Salem 	mutex_unlock(&dev->flow_db->lock);
3220d4be3f44SYishai Hadas 	if (handler->flow_matcher)
3221d4be3f44SYishai Hadas 		atomic_dec(&handler->flow_matcher->usecnt);
3222038d2ef8SMaor Gottlieb 	kfree(handler);
3223038d2ef8SMaor Gottlieb 
3224038d2ef8SMaor Gottlieb 	return 0;
3225038d2ef8SMaor Gottlieb }
3226038d2ef8SMaor Gottlieb 
/*
 * Map an IB flow priority onto the core priority numbering.
 *
 * Each IB priority owns two consecutive core priorities: the even slot
 * (2 * priority) is used for "don't trap" flows and the odd slot
 * (2 * priority + 1) for all other flows.
 */
static int ib_prio_to_core_prio(unsigned int priority, bool dont_trap)
{
	return 2 * priority + (dont_trap ? 0 : 1);
}
323435d19011SMaor Gottlieb 
/*
 * Direction of a flow table.  The value is also used as an index into the
 * sniffer priority array, so the numbering must stay as is.
 */
enum flow_table_type {
	MLX5_IB_FT_RX = 0,
	MLX5_IB_FT_TX = 1
};

/* Number of auto-created flow groups requested for a normal flow table. */
#define MLX5_FS_MAX_TYPES	 6
/* Number of entries requested for a normal flow table (device cap permitting). */
#define MLX5_FS_MAX_ENTRIES	 BIT(16)
3242d4be3f44SYishai Hadas 
3243d4be3f44SYishai Hadas static struct mlx5_ib_flow_prio *_get_prio(struct mlx5_flow_namespace *ns,
3244d4be3f44SYishai Hadas 					   struct mlx5_ib_flow_prio *prio,
3245d4be3f44SYishai Hadas 					   int priority,
32464adda112SMark Bloch 					   int num_entries, int num_groups,
32474adda112SMark Bloch 					   u32 flags)
3248d4be3f44SYishai Hadas {
3249d4be3f44SYishai Hadas 	struct mlx5_flow_table *ft;
3250d4be3f44SYishai Hadas 
3251d4be3f44SYishai Hadas 	ft = mlx5_create_auto_grouped_flow_table(ns, priority,
3252d4be3f44SYishai Hadas 						 num_entries,
3253d4be3f44SYishai Hadas 						 num_groups,
32544adda112SMark Bloch 						 0, flags);
3255d4be3f44SYishai Hadas 	if (IS_ERR(ft))
3256d4be3f44SYishai Hadas 		return ERR_CAST(ft);
3257d4be3f44SYishai Hadas 
3258d4be3f44SYishai Hadas 	prio->flow_table = ft;
3259d4be3f44SYishai Hadas 	prio->refcount = 0;
3260d4be3f44SYishai Hadas 	return prio;
3261d4be3f44SYishai Hadas }
3262d4be3f44SYishai Hadas 
3263038d2ef8SMaor Gottlieb static struct mlx5_ib_flow_prio *get_flow_table(struct mlx5_ib_dev *dev,
3264cc0e5d42SMaor Gottlieb 						struct ib_flow_attr *flow_attr,
3265cc0e5d42SMaor Gottlieb 						enum flow_table_type ft_type)
3266038d2ef8SMaor Gottlieb {
326735d19011SMaor Gottlieb 	bool dont_trap = flow_attr->flags & IB_FLOW_ATTR_FLAGS_DONT_TRAP;
3268038d2ef8SMaor Gottlieb 	struct mlx5_flow_namespace *ns = NULL;
3269038d2ef8SMaor Gottlieb 	struct mlx5_ib_flow_prio *prio;
3270038d2ef8SMaor Gottlieb 	struct mlx5_flow_table *ft;
3271dac388efSMaor Gottlieb 	int max_table_size;
3272038d2ef8SMaor Gottlieb 	int num_entries;
3273038d2ef8SMaor Gottlieb 	int num_groups;
3274cecae747SMaor Gottlieb 	bool esw_encap;
32754adda112SMark Bloch 	u32 flags = 0;
3276038d2ef8SMaor Gottlieb 	int priority;
3277038d2ef8SMaor Gottlieb 
3278dac388efSMaor Gottlieb 	max_table_size = BIT(MLX5_CAP_FLOWTABLE_NIC_RX(dev->mdev,
3279dac388efSMaor Gottlieb 						       log_max_ft_size));
3280cecae747SMaor Gottlieb 	esw_encap = mlx5_eswitch_get_encap_mode(dev->mdev) !=
3281cecae747SMaor Gottlieb 		DEVLINK_ESWITCH_ENCAP_MODE_NONE;
3282038d2ef8SMaor Gottlieb 	if (flow_attr->type == IB_FLOW_ATTR_NORMAL) {
328378dd0c43SMark Bloch 		enum mlx5_flow_namespace_type fn_type;
328478dd0c43SMark Bloch 
328578dd0c43SMark Bloch 		if (flow_is_multicast_only(flow_attr) &&
328635d19011SMaor Gottlieb 		    !dont_trap)
3287038d2ef8SMaor Gottlieb 			priority = MLX5_IB_FLOW_MCAST_PRIO;
3288038d2ef8SMaor Gottlieb 		else
328935d19011SMaor Gottlieb 			priority = ib_prio_to_core_prio(flow_attr->priority,
329035d19011SMaor Gottlieb 							dont_trap);
329178dd0c43SMark Bloch 		if (ft_type == MLX5_IB_FT_RX) {
329278dd0c43SMark Bloch 			fn_type = MLX5_FLOW_NAMESPACE_BYPASS;
329378dd0c43SMark Bloch 			prio = &dev->flow_db->prios[priority];
3294cecae747SMaor Gottlieb 			if (!dev->is_rep && !esw_encap &&
32954adda112SMark Bloch 			    MLX5_CAP_FLOWTABLE_NIC_RX(dev->mdev, decap))
32964adda112SMark Bloch 				flags |= MLX5_FLOW_TABLE_TUNNEL_EN_DECAP;
3297cecae747SMaor Gottlieb 			if (!dev->is_rep && !esw_encap &&
32985c2db53fSMark Bloch 			    MLX5_CAP_FLOWTABLE_NIC_RX(dev->mdev,
32995c2db53fSMark Bloch 					reformat_l3_tunnel_to_l2))
33005c2db53fSMark Bloch 				flags |= MLX5_FLOW_TABLE_TUNNEL_EN_REFORMAT;
330178dd0c43SMark Bloch 		} else {
330278dd0c43SMark Bloch 			max_table_size =
330378dd0c43SMark Bloch 				BIT(MLX5_CAP_FLOWTABLE_NIC_TX(dev->mdev,
330478dd0c43SMark Bloch 							      log_max_ft_size));
330578dd0c43SMark Bloch 			fn_type = MLX5_FLOW_NAMESPACE_EGRESS;
330678dd0c43SMark Bloch 			prio = &dev->flow_db->egress_prios[priority];
3307cecae747SMaor Gottlieb 			if (!dev->is_rep && !esw_encap &&
33084adda112SMark Bloch 			    MLX5_CAP_FLOWTABLE_NIC_TX(dev->mdev, reformat))
33094adda112SMark Bloch 				flags |= MLX5_FLOW_TABLE_TUNNEL_EN_REFORMAT;
331078dd0c43SMark Bloch 		}
331178dd0c43SMark Bloch 		ns = mlx5_get_flow_namespace(dev->mdev, fn_type);
3312038d2ef8SMaor Gottlieb 		num_entries = MLX5_FS_MAX_ENTRIES;
3313038d2ef8SMaor Gottlieb 		num_groups = MLX5_FS_MAX_TYPES;
3314038d2ef8SMaor Gottlieb 	} else if (flow_attr->type == IB_FLOW_ATTR_ALL_DEFAULT ||
3315038d2ef8SMaor Gottlieb 		   flow_attr->type == IB_FLOW_ATTR_MC_DEFAULT) {
3316038d2ef8SMaor Gottlieb 		ns = mlx5_get_flow_namespace(dev->mdev,
3317038d2ef8SMaor Gottlieb 					     MLX5_FLOW_NAMESPACE_LEFTOVERS);
3318038d2ef8SMaor Gottlieb 		build_leftovers_ft_param(&priority,
3319038d2ef8SMaor Gottlieb 					 &num_entries,
3320038d2ef8SMaor Gottlieb 					 &num_groups);
33219a4ca38dSMark Bloch 		prio = &dev->flow_db->prios[MLX5_IB_FLOW_LEFTOVERS_PRIO];
3322cc0e5d42SMaor Gottlieb 	} else if (flow_attr->type == IB_FLOW_ATTR_SNIFFER) {
3323cc0e5d42SMaor Gottlieb 		if (!MLX5_CAP_FLOWTABLE(dev->mdev,
3324cc0e5d42SMaor Gottlieb 					allow_sniffer_and_nic_rx_shared_tir))
3325cc0e5d42SMaor Gottlieb 			return ERR_PTR(-ENOTSUPP);
3326cc0e5d42SMaor Gottlieb 
3327cc0e5d42SMaor Gottlieb 		ns = mlx5_get_flow_namespace(dev->mdev, ft_type == MLX5_IB_FT_RX ?
3328cc0e5d42SMaor Gottlieb 					     MLX5_FLOW_NAMESPACE_SNIFFER_RX :
3329cc0e5d42SMaor Gottlieb 					     MLX5_FLOW_NAMESPACE_SNIFFER_TX);
3330cc0e5d42SMaor Gottlieb 
33319a4ca38dSMark Bloch 		prio = &dev->flow_db->sniffer[ft_type];
3332cc0e5d42SMaor Gottlieb 		priority = 0;
3333cc0e5d42SMaor Gottlieb 		num_entries = 1;
3334cc0e5d42SMaor Gottlieb 		num_groups = 1;
3335038d2ef8SMaor Gottlieb 	}
3336038d2ef8SMaor Gottlieb 
3337038d2ef8SMaor Gottlieb 	if (!ns)
3338038d2ef8SMaor Gottlieb 		return ERR_PTR(-ENOTSUPP);
3339038d2ef8SMaor Gottlieb 
33403b70508aSMark Bloch 	max_table_size = min_t(int, num_entries, max_table_size);
3341dac388efSMaor Gottlieb 
3342038d2ef8SMaor Gottlieb 	ft = prio->flow_table;
3343d4be3f44SYishai Hadas 	if (!ft)
33443b70508aSMark Bloch 		return _get_prio(ns, prio, priority, max_table_size, num_groups,
33454adda112SMark Bloch 				 flags);
3346038d2ef8SMaor Gottlieb 
3347d4be3f44SYishai Hadas 	return prio;
3348038d2ef8SMaor Gottlieb }
3349038d2ef8SMaor Gottlieb 
3350a550ddfcSYishai Hadas static void set_underlay_qp(struct mlx5_ib_dev *dev,
3351a550ddfcSYishai Hadas 			    struct mlx5_flow_spec *spec,
3352a550ddfcSYishai Hadas 			    u32 underlay_qpn)
3353a550ddfcSYishai Hadas {
3354a550ddfcSYishai Hadas 	void *misc_params_c = MLX5_ADDR_OF(fte_match_param,
3355a550ddfcSYishai Hadas 					   spec->match_criteria,
3356a550ddfcSYishai Hadas 					   misc_parameters);
3357a550ddfcSYishai Hadas 	void *misc_params_v = MLX5_ADDR_OF(fte_match_param, spec->match_value,
3358a550ddfcSYishai Hadas 					   misc_parameters);
3359a550ddfcSYishai Hadas 
3360a550ddfcSYishai Hadas 	if (underlay_qpn &&
3361a550ddfcSYishai Hadas 	    MLX5_CAP_FLOWTABLE_NIC_RX(dev->mdev,
3362a550ddfcSYishai Hadas 				      ft_field_support.bth_dst_qp)) {
3363a550ddfcSYishai Hadas 		MLX5_SET(fte_match_set_misc,
3364a550ddfcSYishai Hadas 			 misc_params_v, bth_dst_qp, underlay_qpn);
3365a550ddfcSYishai Hadas 		MLX5_SET(fte_match_set_misc,
3366a550ddfcSYishai Hadas 			 misc_params_c, bth_dst_qp, 0xffffff);
3367a550ddfcSYishai Hadas 	}
3368a550ddfcSYishai Hadas }
3369a550ddfcSYishai Hadas 
33705e95af5fSRaed Salem static int read_flow_counters(struct ib_device *ibdev,
33715e95af5fSRaed Salem 			      struct mlx5_read_counters_attr *read_attr)
33725e95af5fSRaed Salem {
33735e95af5fSRaed Salem 	struct mlx5_fc *fc = read_attr->hw_cntrs_hndl;
33745e95af5fSRaed Salem 	struct mlx5_ib_dev *dev = to_mdev(ibdev);
33755e95af5fSRaed Salem 
33765e95af5fSRaed Salem 	return mlx5_fc_query(dev->mdev, fc,
33775e95af5fSRaed Salem 			     &read_attr->out[IB_COUNTER_PACKETS],
33785e95af5fSRaed Salem 			     &read_attr->out[IB_COUNTER_BYTES]);
33795e95af5fSRaed Salem }
33805e95af5fSRaed Salem 
33815e95af5fSRaed Salem /* flow counters currently expose two counters packets and bytes */
33825e95af5fSRaed Salem #define FLOW_COUNTERS_NUM 2
33833b3233fbSRaed Salem static int counters_set_description(struct ib_counters *counters,
33843b3233fbSRaed Salem 				    enum mlx5_ib_counters_type counters_type,
33853b3233fbSRaed Salem 				    struct mlx5_ib_flow_counters_desc *desc_data,
33863b3233fbSRaed Salem 				    u32 ncounters)
33873b3233fbSRaed Salem {
33883b3233fbSRaed Salem 	struct mlx5_ib_mcounters *mcounters = to_mcounters(counters);
33893b3233fbSRaed Salem 	u32 cntrs_max_index = 0;
33903b3233fbSRaed Salem 	int i;
33913b3233fbSRaed Salem 
33923b3233fbSRaed Salem 	if (counters_type != MLX5_IB_COUNTERS_FLOW)
33933b3233fbSRaed Salem 		return -EINVAL;
33943b3233fbSRaed Salem 
33953b3233fbSRaed Salem 	/* init the fields for the object */
33963b3233fbSRaed Salem 	mcounters->type = counters_type;
33975e95af5fSRaed Salem 	mcounters->read_counters = read_flow_counters;
33985e95af5fSRaed Salem 	mcounters->counters_num = FLOW_COUNTERS_NUM;
33993b3233fbSRaed Salem 	mcounters->ncounters = ncounters;
34003b3233fbSRaed Salem 	/* each counter entry have both description and index pair */
34013b3233fbSRaed Salem 	for (i = 0; i < ncounters; i++) {
34023b3233fbSRaed Salem 		if (desc_data[i].description > IB_COUNTER_BYTES)
34033b3233fbSRaed Salem 			return -EINVAL;
34043b3233fbSRaed Salem 
34053b3233fbSRaed Salem 		if (cntrs_max_index <= desc_data[i].index)
34063b3233fbSRaed Salem 			cntrs_max_index = desc_data[i].index + 1;
34073b3233fbSRaed Salem 	}
34083b3233fbSRaed Salem 
34093b3233fbSRaed Salem 	mutex_lock(&mcounters->mcntrs_mutex);
34103b3233fbSRaed Salem 	mcounters->counters_data = desc_data;
34113b3233fbSRaed Salem 	mcounters->cntrs_max_index = cntrs_max_index;
34123b3233fbSRaed Salem 	mutex_unlock(&mcounters->mcntrs_mutex);
34133b3233fbSRaed Salem 
34143b3233fbSRaed Salem 	return 0;
34153b3233fbSRaed Salem }
34163b3233fbSRaed Salem 
34173b3233fbSRaed Salem #define MAX_COUNTERS_NUM (USHRT_MAX / (sizeof(u32) * 2))
34183b3233fbSRaed Salem static int flow_counters_set_data(struct ib_counters *ibcounters,
34193b3233fbSRaed Salem 				  struct mlx5_ib_create_flow *ucmd)
34203b3233fbSRaed Salem {
34213b3233fbSRaed Salem 	struct mlx5_ib_mcounters *mcounters = to_mcounters(ibcounters);
34223b3233fbSRaed Salem 	struct mlx5_ib_flow_counters_data *cntrs_data = NULL;
34233b3233fbSRaed Salem 	struct mlx5_ib_flow_counters_desc *desc_data = NULL;
34243b3233fbSRaed Salem 	bool hw_hndl = false;
34253b3233fbSRaed Salem 	int ret = 0;
34263b3233fbSRaed Salem 
34273b3233fbSRaed Salem 	if (ucmd && ucmd->ncounters_data != 0) {
34283b3233fbSRaed Salem 		cntrs_data = ucmd->data;
34293b3233fbSRaed Salem 		if (cntrs_data->ncounters > MAX_COUNTERS_NUM)
34303b3233fbSRaed Salem 			return -EINVAL;
34313b3233fbSRaed Salem 
34323b3233fbSRaed Salem 		desc_data = kcalloc(cntrs_data->ncounters,
34333b3233fbSRaed Salem 				    sizeof(*desc_data),
34343b3233fbSRaed Salem 				    GFP_KERNEL);
34353b3233fbSRaed Salem 		if (!desc_data)
34363b3233fbSRaed Salem 			return  -ENOMEM;
34373b3233fbSRaed Salem 
34383b3233fbSRaed Salem 		if (copy_from_user(desc_data,
34393b3233fbSRaed Salem 				   u64_to_user_ptr(cntrs_data->counters_data),
34403b3233fbSRaed Salem 				   sizeof(*desc_data) * cntrs_data->ncounters)) {
34413b3233fbSRaed Salem 			ret = -EFAULT;
34423b3233fbSRaed Salem 			goto free;
34433b3233fbSRaed Salem 		}
34443b3233fbSRaed Salem 	}
34453b3233fbSRaed Salem 
34463b3233fbSRaed Salem 	if (!mcounters->hw_cntrs_hndl) {
34473b3233fbSRaed Salem 		mcounters->hw_cntrs_hndl = mlx5_fc_create(
34483b3233fbSRaed Salem 			to_mdev(ibcounters->device)->mdev, false);
3449e31abf76Sweiyongjun (A) 		if (IS_ERR(mcounters->hw_cntrs_hndl)) {
3450e31abf76Sweiyongjun (A) 			ret = PTR_ERR(mcounters->hw_cntrs_hndl);
34513b3233fbSRaed Salem 			goto free;
34523b3233fbSRaed Salem 		}
34533b3233fbSRaed Salem 		hw_hndl = true;
34543b3233fbSRaed Salem 	}
34553b3233fbSRaed Salem 
34563b3233fbSRaed Salem 	if (desc_data) {
34573b3233fbSRaed Salem 		/* counters already bound to at least one flow */
34583b3233fbSRaed Salem 		if (mcounters->cntrs_max_index) {
34593b3233fbSRaed Salem 			ret = -EINVAL;
34603b3233fbSRaed Salem 			goto free_hndl;
34613b3233fbSRaed Salem 		}
34623b3233fbSRaed Salem 
34633b3233fbSRaed Salem 		ret = counters_set_description(ibcounters,
34643b3233fbSRaed Salem 					       MLX5_IB_COUNTERS_FLOW,
34653b3233fbSRaed Salem 					       desc_data,
34663b3233fbSRaed Salem 					       cntrs_data->ncounters);
34673b3233fbSRaed Salem 		if (ret)
34683b3233fbSRaed Salem 			goto free_hndl;
34693b3233fbSRaed Salem 
34703b3233fbSRaed Salem 	} else if (!mcounters->cntrs_max_index) {
34713b3233fbSRaed Salem 		/* counters not bound yet, must have udata passed */
34723b3233fbSRaed Salem 		ret = -EINVAL;
34733b3233fbSRaed Salem 		goto free_hndl;
34743b3233fbSRaed Salem 	}
34753b3233fbSRaed Salem 
34763b3233fbSRaed Salem 	return 0;
34773b3233fbSRaed Salem 
34783b3233fbSRaed Salem free_hndl:
34793b3233fbSRaed Salem 	if (hw_hndl) {
34803b3233fbSRaed Salem 		mlx5_fc_destroy(to_mdev(ibcounters->device)->mdev,
34813b3233fbSRaed Salem 				mcounters->hw_cntrs_hndl);
34823b3233fbSRaed Salem 		mcounters->hw_cntrs_hndl = NULL;
34833b3233fbSRaed Salem 	}
34843b3233fbSRaed Salem free:
34853b3233fbSRaed Salem 	kfree(desc_data);
34863b3233fbSRaed Salem 	return ret;
34873b3233fbSRaed Salem }
34883b3233fbSRaed Salem 
3489669ff1e3SJianbo Liu static void mlx5_ib_set_rule_source_port(struct mlx5_ib_dev *dev,
3490669ff1e3SJianbo Liu 					 struct mlx5_flow_spec *spec,
3491669ff1e3SJianbo Liu 					 struct mlx5_eswitch_rep *rep)
3492669ff1e3SJianbo Liu {
3493669ff1e3SJianbo Liu 	struct mlx5_eswitch *esw = dev->mdev->priv.eswitch;
3494669ff1e3SJianbo Liu 	void *misc;
3495669ff1e3SJianbo Liu 
3496669ff1e3SJianbo Liu 	if (mlx5_eswitch_vport_match_metadata_enabled(esw)) {
3497669ff1e3SJianbo Liu 		misc = MLX5_ADDR_OF(fte_match_param, spec->match_value,
3498669ff1e3SJianbo Liu 				    misc_parameters_2);
3499669ff1e3SJianbo Liu 
3500669ff1e3SJianbo Liu 		MLX5_SET(fte_match_set_misc2, misc, metadata_reg_c_0,
3501669ff1e3SJianbo Liu 			 mlx5_eswitch_get_vport_metadata_for_match(esw,
3502669ff1e3SJianbo Liu 								   rep->vport));
3503669ff1e3SJianbo Liu 		misc = MLX5_ADDR_OF(fte_match_param, spec->match_criteria,
3504669ff1e3SJianbo Liu 				    misc_parameters_2);
3505669ff1e3SJianbo Liu 
3506669ff1e3SJianbo Liu 		MLX5_SET_TO_ONES(fte_match_set_misc2, misc, metadata_reg_c_0);
3507669ff1e3SJianbo Liu 	} else {
3508669ff1e3SJianbo Liu 		misc = MLX5_ADDR_OF(fte_match_param, spec->match_value,
3509669ff1e3SJianbo Liu 				    misc_parameters);
3510669ff1e3SJianbo Liu 
3511669ff1e3SJianbo Liu 		MLX5_SET(fte_match_set_misc, misc, source_port, rep->vport);
3512669ff1e3SJianbo Liu 
3513669ff1e3SJianbo Liu 		misc = MLX5_ADDR_OF(fte_match_param, spec->match_criteria,
3514669ff1e3SJianbo Liu 				    misc_parameters);
3515669ff1e3SJianbo Liu 
3516669ff1e3SJianbo Liu 		MLX5_SET_TO_ONES(fte_match_set_misc, misc, source_port);
3517669ff1e3SJianbo Liu 	}
3518669ff1e3SJianbo Liu }
3519669ff1e3SJianbo Liu 
3520a550ddfcSYishai Hadas static struct mlx5_ib_flow_handler *_create_flow_rule(struct mlx5_ib_dev *dev,
3521038d2ef8SMaor Gottlieb 						      struct mlx5_ib_flow_prio *ft_prio,
3522dd063d0eSMaor Gottlieb 						      const struct ib_flow_attr *flow_attr,
3523a550ddfcSYishai Hadas 						      struct mlx5_flow_destination *dst,
35243b3233fbSRaed Salem 						      u32 underlay_qpn,
35253b3233fbSRaed Salem 						      struct mlx5_ib_create_flow *ucmd)
3526038d2ef8SMaor Gottlieb {
3527038d2ef8SMaor Gottlieb 	struct mlx5_flow_table	*ft = ft_prio->flow_table;
3528038d2ef8SMaor Gottlieb 	struct mlx5_ib_flow_handler *handler;
3529bb0ee7dcSJianbo Liu 	struct mlx5_flow_act flow_act = {};
3530c5bb1730SMaor Gottlieb 	struct mlx5_flow_spec *spec;
35313b3233fbSRaed Salem 	struct mlx5_flow_destination dest_arr[2] = {};
35323b3233fbSRaed Salem 	struct mlx5_flow_destination *rule_dst = dest_arr;
3533dd063d0eSMaor Gottlieb 	const void *ib_flow = (const void *)flow_attr + sizeof(*flow_attr);
3534038d2ef8SMaor Gottlieb 	unsigned int spec_index;
353571c6e863SAriel Levkovich 	u32 prev_type = 0;
3536038d2ef8SMaor Gottlieb 	int err = 0;
35373b3233fbSRaed Salem 	int dest_num = 0;
3538802c2125SAviad Yehezkel 	bool is_egress = flow_attr->flags & IB_FLOW_ATTR_FLAGS_EGRESS;
3539038d2ef8SMaor Gottlieb 
354019cc7524SAriel Levkovich 	if (!is_valid_attr(dev->mdev, flow_attr))
3541038d2ef8SMaor Gottlieb 		return ERR_PTR(-EINVAL);
3542038d2ef8SMaor Gottlieb 
35436a4d00beSMark Bloch 	if (dev->is_rep && is_egress)
354478dd0c43SMark Bloch 		return ERR_PTR(-EINVAL);
354578dd0c43SMark Bloch 
35461b9a07eeSLeon Romanovsky 	spec = kvzalloc(sizeof(*spec), GFP_KERNEL);
3547038d2ef8SMaor Gottlieb 	handler = kzalloc(sizeof(*handler), GFP_KERNEL);
3548c5bb1730SMaor Gottlieb 	if (!handler || !spec) {
3549038d2ef8SMaor Gottlieb 		err = -ENOMEM;
3550038d2ef8SMaor Gottlieb 		goto free;
3551038d2ef8SMaor Gottlieb 	}
3552038d2ef8SMaor Gottlieb 
3553038d2ef8SMaor Gottlieb 	INIT_LIST_HEAD(&handler->list);
35543b3233fbSRaed Salem 	if (dst) {
35553b3233fbSRaed Salem 		memcpy(&dest_arr[0], dst, sizeof(*dst));
35563b3233fbSRaed Salem 		dest_num++;
35573b3233fbSRaed Salem 	}
3558038d2ef8SMaor Gottlieb 
3559038d2ef8SMaor Gottlieb 	for (spec_index = 0; spec_index < flow_attr->num_of_specs; spec_index++) {
3560bb0ee7dcSJianbo Liu 		err = parse_flow_attr(dev->mdev, spec,
356171c6e863SAriel Levkovich 				      ib_flow, flow_attr, &flow_act,
356271c6e863SAriel Levkovich 				      prev_type);
3563038d2ef8SMaor Gottlieb 		if (err < 0)
3564038d2ef8SMaor Gottlieb 			goto free;
3565038d2ef8SMaor Gottlieb 
356671c6e863SAriel Levkovich 		prev_type = ((union ib_flow_spec *)ib_flow)->type;
3567038d2ef8SMaor Gottlieb 		ib_flow += ((union ib_flow_spec *)ib_flow)->size;
3568038d2ef8SMaor Gottlieb 	}
3569038d2ef8SMaor Gottlieb 
3570a550ddfcSYishai Hadas 	if (!flow_is_multicast_only(flow_attr))
3571a550ddfcSYishai Hadas 		set_underlay_qp(dev, spec, underlay_qpn);
3572a550ddfcSYishai Hadas 
35736a4d00beSMark Bloch 	if (dev->is_rep) {
3574669ff1e3SJianbo Liu 		struct mlx5_eswitch_rep *rep;
3575018a94eeSMark Bloch 
3576669ff1e3SJianbo Liu 		rep = dev->port[flow_attr->port - 1].rep;
3577669ff1e3SJianbo Liu 		if (!rep) {
35786a4d00beSMark Bloch 			err = -EINVAL;
35796a4d00beSMark Bloch 			goto free;
35806a4d00beSMark Bloch 		}
3581669ff1e3SJianbo Liu 
3582669ff1e3SJianbo Liu 		mlx5_ib_set_rule_source_port(dev, spec, rep);
3583018a94eeSMark Bloch 	}
3584018a94eeSMark Bloch 
3585466fa6d2SMaor Gottlieb 	spec->match_criteria_enable = get_match_criteria_enable(spec->match_criteria);
3586802c2125SAviad Yehezkel 
3587802c2125SAviad Yehezkel 	if (is_egress &&
3588802c2125SAviad Yehezkel 	    !is_valid_spec(dev->mdev, spec, &flow_act, is_egress)) {
3589802c2125SAviad Yehezkel 		err = -EINVAL;
3590802c2125SAviad Yehezkel 		goto free;
3591802c2125SAviad Yehezkel 	}
3592802c2125SAviad Yehezkel 
35933b3233fbSRaed Salem 	if (flow_act.action & MLX5_FLOW_CONTEXT_ACTION_COUNT) {
3594171c7625SMark Bloch 		struct mlx5_ib_mcounters *mcounters;
3595171c7625SMark Bloch 
35963b3233fbSRaed Salem 		err = flow_counters_set_data(flow_act.counters, ucmd);
35973b3233fbSRaed Salem 		if (err)
35983b3233fbSRaed Salem 			goto free;
35993b3233fbSRaed Salem 
3600171c7625SMark Bloch 		mcounters = to_mcounters(flow_act.counters);
36013b3233fbSRaed Salem 		handler->ibcounters = flow_act.counters;
36023b3233fbSRaed Salem 		dest_arr[dest_num].type =
36033b3233fbSRaed Salem 			MLX5_FLOW_DESTINATION_TYPE_COUNTER;
3604171c7625SMark Bloch 		dest_arr[dest_num].counter_id =
3605171c7625SMark Bloch 			mlx5_fc_id(mcounters->hw_cntrs_hndl);
36063b3233fbSRaed Salem 		dest_num++;
36073b3233fbSRaed Salem 	}
36083b3233fbSRaed Salem 
3609075572d4SBoris Pismenny 	if (flow_act.action & MLX5_FLOW_CONTEXT_ACTION_DROP) {
36103b3233fbSRaed Salem 		if (!(flow_act.action & MLX5_FLOW_CONTEXT_ACTION_COUNT)) {
3611a22ed86cSSlava Shwartsman 			rule_dst = NULL;
3612a22ed86cSSlava Shwartsman 			dest_num = 0;
36133b3233fbSRaed Salem 		}
3614a22ed86cSSlava Shwartsman 	} else {
3615802c2125SAviad Yehezkel 		if (is_egress)
3616802c2125SAviad Yehezkel 			flow_act.action |= MLX5_FLOW_CONTEXT_ACTION_ALLOW;
3617802c2125SAviad Yehezkel 		else
3618802c2125SAviad Yehezkel 			flow_act.action |=
36193b3233fbSRaed Salem 				dest_num ?  MLX5_FLOW_CONTEXT_ACTION_FWD_DEST :
362035d19011SMaor Gottlieb 					MLX5_FLOW_CONTEXT_ACTION_FWD_NEXT_PRIO;
3621a22ed86cSSlava Shwartsman 	}
36222ac693f9SMoses Reuben 
3623bb0ee7dcSJianbo Liu 	if ((spec->flow_context.flags & FLOW_CONTEXT_HAS_TAG)  &&
36242ac693f9SMoses Reuben 	    (flow_attr->type == IB_FLOW_ATTR_ALL_DEFAULT ||
36252ac693f9SMoses Reuben 	     flow_attr->type == IB_FLOW_ATTR_MC_DEFAULT)) {
36262ac693f9SMoses Reuben 		mlx5_ib_warn(dev, "Flow tag %u and attribute type %x isn't allowed in leftovers\n",
3627bb0ee7dcSJianbo Liu 			     spec->flow_context.flow_tag, flow_attr->type);
36282ac693f9SMoses Reuben 		err = -EINVAL;
36292ac693f9SMoses Reuben 		goto free;
36302ac693f9SMoses Reuben 	}
363174491de9SMark Bloch 	handler->rule = mlx5_add_flow_rules(ft, spec,
363266958ed9SHadar Hen Zion 					    &flow_act,
3633a22ed86cSSlava Shwartsman 					    rule_dst, dest_num);
3634038d2ef8SMaor Gottlieb 
3635038d2ef8SMaor Gottlieb 	if (IS_ERR(handler->rule)) {
3636038d2ef8SMaor Gottlieb 		err = PTR_ERR(handler->rule);
3637038d2ef8SMaor Gottlieb 		goto free;
3638038d2ef8SMaor Gottlieb 	}
3639038d2ef8SMaor Gottlieb 
3640d9d4980aSMaor Gottlieb 	ft_prio->refcount++;
36415497adc6SMaor Gottlieb 	handler->prio = ft_prio;
3642d4be3f44SYishai Hadas 	handler->dev = dev;
3643038d2ef8SMaor Gottlieb 
3644038d2ef8SMaor Gottlieb 	ft_prio->flow_table = ft;
3645038d2ef8SMaor Gottlieb free:
36463b3233fbSRaed Salem 	if (err && handler) {
36473b3233fbSRaed Salem 		if (handler->ibcounters &&
36483b3233fbSRaed Salem 		    atomic_read(&handler->ibcounters->usecnt) == 1)
36493b3233fbSRaed Salem 			counters_clear_description(handler->ibcounters);
3650038d2ef8SMaor Gottlieb 		kfree(handler);
36513b3233fbSRaed Salem 	}
3652c5bb1730SMaor Gottlieb 	kvfree(spec);
3653038d2ef8SMaor Gottlieb 	return err ? ERR_PTR(err) : handler;
3654038d2ef8SMaor Gottlieb }
3655038d2ef8SMaor Gottlieb 
3656a550ddfcSYishai Hadas static struct mlx5_ib_flow_handler *create_flow_rule(struct mlx5_ib_dev *dev,
3657a550ddfcSYishai Hadas 						     struct mlx5_ib_flow_prio *ft_prio,
3658a550ddfcSYishai Hadas 						     const struct ib_flow_attr *flow_attr,
3659a550ddfcSYishai Hadas 						     struct mlx5_flow_destination *dst)
3660a550ddfcSYishai Hadas {
36613b3233fbSRaed Salem 	return _create_flow_rule(dev, ft_prio, flow_attr, dst, 0, NULL);
3662a550ddfcSYishai Hadas }
3663a550ddfcSYishai Hadas 
366435d19011SMaor Gottlieb static struct mlx5_ib_flow_handler *create_dont_trap_rule(struct mlx5_ib_dev *dev,
366535d19011SMaor Gottlieb 							  struct mlx5_ib_flow_prio *ft_prio,
366635d19011SMaor Gottlieb 							  struct ib_flow_attr *flow_attr,
366735d19011SMaor Gottlieb 							  struct mlx5_flow_destination *dst)
366835d19011SMaor Gottlieb {
366935d19011SMaor Gottlieb 	struct mlx5_ib_flow_handler *handler_dst = NULL;
367035d19011SMaor Gottlieb 	struct mlx5_ib_flow_handler *handler = NULL;
367135d19011SMaor Gottlieb 
367235d19011SMaor Gottlieb 	handler = create_flow_rule(dev, ft_prio, flow_attr, NULL);
367335d19011SMaor Gottlieb 	if (!IS_ERR(handler)) {
367435d19011SMaor Gottlieb 		handler_dst = create_flow_rule(dev, ft_prio,
367535d19011SMaor Gottlieb 					       flow_attr, dst);
367635d19011SMaor Gottlieb 		if (IS_ERR(handler_dst)) {
367774491de9SMark Bloch 			mlx5_del_flow_rules(handler->rule);
3678d9d4980aSMaor Gottlieb 			ft_prio->refcount--;
367935d19011SMaor Gottlieb 			kfree(handler);
368035d19011SMaor Gottlieb 			handler = handler_dst;
368135d19011SMaor Gottlieb 		} else {
368235d19011SMaor Gottlieb 			list_add(&handler_dst->list, &handler->list);
368335d19011SMaor Gottlieb 		}
368435d19011SMaor Gottlieb 	}
368535d19011SMaor Gottlieb 
368635d19011SMaor Gottlieb 	return handler;
368735d19011SMaor Gottlieb }
/* Indices into the leftovers_specs[] table of create_leftovers_rule(). */
enum {
	LEFTOVERS_MC = 0,
	LEFTOVERS_UC = 1,
};
3692038d2ef8SMaor Gottlieb 
3693038d2ef8SMaor Gottlieb static struct mlx5_ib_flow_handler *create_leftovers_rule(struct mlx5_ib_dev *dev,
3694038d2ef8SMaor Gottlieb 							  struct mlx5_ib_flow_prio *ft_prio,
3695038d2ef8SMaor Gottlieb 							  struct ib_flow_attr *flow_attr,
3696038d2ef8SMaor Gottlieb 							  struct mlx5_flow_destination *dst)
3697038d2ef8SMaor Gottlieb {
3698038d2ef8SMaor Gottlieb 	struct mlx5_ib_flow_handler *handler_ucast = NULL;
3699038d2ef8SMaor Gottlieb 	struct mlx5_ib_flow_handler *handler = NULL;
3700038d2ef8SMaor Gottlieb 
3701038d2ef8SMaor Gottlieb 	static struct {
3702038d2ef8SMaor Gottlieb 		struct ib_flow_attr	flow_attr;
3703038d2ef8SMaor Gottlieb 		struct ib_flow_spec_eth eth_flow;
3704038d2ef8SMaor Gottlieb 	} leftovers_specs[] = {
3705038d2ef8SMaor Gottlieb 		[LEFTOVERS_MC] = {
3706038d2ef8SMaor Gottlieb 			.flow_attr = {
3707038d2ef8SMaor Gottlieb 				.num_of_specs = 1,
3708038d2ef8SMaor Gottlieb 				.size = sizeof(leftovers_specs[0])
3709038d2ef8SMaor Gottlieb 			},
3710038d2ef8SMaor Gottlieb 			.eth_flow = {
3711038d2ef8SMaor Gottlieb 				.type = IB_FLOW_SPEC_ETH,
3712038d2ef8SMaor Gottlieb 				.size = sizeof(struct ib_flow_spec_eth),
3713038d2ef8SMaor Gottlieb 				.mask = {.dst_mac = {0x1} },
3714038d2ef8SMaor Gottlieb 				.val =  {.dst_mac = {0x1} }
3715038d2ef8SMaor Gottlieb 			}
3716038d2ef8SMaor Gottlieb 		},
3717038d2ef8SMaor Gottlieb 		[LEFTOVERS_UC] = {
3718038d2ef8SMaor Gottlieb 			.flow_attr = {
3719038d2ef8SMaor Gottlieb 				.num_of_specs = 1,
3720038d2ef8SMaor Gottlieb 				.size = sizeof(leftovers_specs[0])
3721038d2ef8SMaor Gottlieb 			},
3722038d2ef8SMaor Gottlieb 			.eth_flow = {
3723038d2ef8SMaor Gottlieb 				.type = IB_FLOW_SPEC_ETH,
3724038d2ef8SMaor Gottlieb 				.size = sizeof(struct ib_flow_spec_eth),
3725038d2ef8SMaor Gottlieb 				.mask = {.dst_mac = {0x1} },
3726038d2ef8SMaor Gottlieb 				.val = {.dst_mac = {} }
3727038d2ef8SMaor Gottlieb 			}
3728038d2ef8SMaor Gottlieb 		}
3729038d2ef8SMaor Gottlieb 	};
3730038d2ef8SMaor Gottlieb 
3731038d2ef8SMaor Gottlieb 	handler = create_flow_rule(dev, ft_prio,
3732038d2ef8SMaor Gottlieb 				   &leftovers_specs[LEFTOVERS_MC].flow_attr,
3733038d2ef8SMaor Gottlieb 				   dst);
3734038d2ef8SMaor Gottlieb 	if (!IS_ERR(handler) &&
3735038d2ef8SMaor Gottlieb 	    flow_attr->type == IB_FLOW_ATTR_ALL_DEFAULT) {
3736038d2ef8SMaor Gottlieb 		handler_ucast = create_flow_rule(dev, ft_prio,
3737038d2ef8SMaor Gottlieb 						 &leftovers_specs[LEFTOVERS_UC].flow_attr,
3738038d2ef8SMaor Gottlieb 						 dst);
3739038d2ef8SMaor Gottlieb 		if (IS_ERR(handler_ucast)) {
374074491de9SMark Bloch 			mlx5_del_flow_rules(handler->rule);
3741d9d4980aSMaor Gottlieb 			ft_prio->refcount--;
3742038d2ef8SMaor Gottlieb 			kfree(handler);
3743038d2ef8SMaor Gottlieb 			handler = handler_ucast;
3744038d2ef8SMaor Gottlieb 		} else {
3745038d2ef8SMaor Gottlieb 			list_add(&handler_ucast->list, &handler->list);
3746038d2ef8SMaor Gottlieb 		}
3747038d2ef8SMaor Gottlieb 	}
3748038d2ef8SMaor Gottlieb 
3749038d2ef8SMaor Gottlieb 	return handler;
3750038d2ef8SMaor Gottlieb }
3751038d2ef8SMaor Gottlieb 
3752cc0e5d42SMaor Gottlieb static struct mlx5_ib_flow_handler *create_sniffer_rule(struct mlx5_ib_dev *dev,
3753cc0e5d42SMaor Gottlieb 							struct mlx5_ib_flow_prio *ft_rx,
3754cc0e5d42SMaor Gottlieb 							struct mlx5_ib_flow_prio *ft_tx,
3755cc0e5d42SMaor Gottlieb 							struct mlx5_flow_destination *dst)
3756cc0e5d42SMaor Gottlieb {
3757cc0e5d42SMaor Gottlieb 	struct mlx5_ib_flow_handler *handler_rx;
3758cc0e5d42SMaor Gottlieb 	struct mlx5_ib_flow_handler *handler_tx;
3759cc0e5d42SMaor Gottlieb 	int err;
3760cc0e5d42SMaor Gottlieb 	static const struct ib_flow_attr flow_attr  = {
3761cc0e5d42SMaor Gottlieb 		.num_of_specs = 0,
3762cc0e5d42SMaor Gottlieb 		.size = sizeof(flow_attr)
3763cc0e5d42SMaor Gottlieb 	};
3764cc0e5d42SMaor Gottlieb 
3765cc0e5d42SMaor Gottlieb 	handler_rx = create_flow_rule(dev, ft_rx, &flow_attr, dst);
3766cc0e5d42SMaor Gottlieb 	if (IS_ERR(handler_rx)) {
3767cc0e5d42SMaor Gottlieb 		err = PTR_ERR(handler_rx);
3768cc0e5d42SMaor Gottlieb 		goto err;
3769cc0e5d42SMaor Gottlieb 	}
3770cc0e5d42SMaor Gottlieb 
3771cc0e5d42SMaor Gottlieb 	handler_tx = create_flow_rule(dev, ft_tx, &flow_attr, dst);
3772cc0e5d42SMaor Gottlieb 	if (IS_ERR(handler_tx)) {
3773cc0e5d42SMaor Gottlieb 		err = PTR_ERR(handler_tx);
3774cc0e5d42SMaor Gottlieb 		goto err_tx;
3775cc0e5d42SMaor Gottlieb 	}
3776cc0e5d42SMaor Gottlieb 
3777cc0e5d42SMaor Gottlieb 	list_add(&handler_tx->list, &handler_rx->list);
3778cc0e5d42SMaor Gottlieb 
3779cc0e5d42SMaor Gottlieb 	return handler_rx;
3780cc0e5d42SMaor Gottlieb 
3781cc0e5d42SMaor Gottlieb err_tx:
378274491de9SMark Bloch 	mlx5_del_flow_rules(handler_rx->rule);
3783cc0e5d42SMaor Gottlieb 	ft_rx->refcount--;
3784cc0e5d42SMaor Gottlieb 	kfree(handler_rx);
3785cc0e5d42SMaor Gottlieb err:
3786cc0e5d42SMaor Gottlieb 	return ERR_PTR(err);
3787cc0e5d42SMaor Gottlieb }
3788cc0e5d42SMaor Gottlieb 
3789038d2ef8SMaor Gottlieb static struct ib_flow *mlx5_ib_create_flow(struct ib_qp *qp,
3790038d2ef8SMaor Gottlieb 					   struct ib_flow_attr *flow_attr,
379159082a32SMatan Barak 					   int domain,
379259082a32SMatan Barak 					   struct ib_udata *udata)
3793038d2ef8SMaor Gottlieb {
3794038d2ef8SMaor Gottlieb 	struct mlx5_ib_dev *dev = to_mdev(qp->device);
3795d9f88e5aSYishai Hadas 	struct mlx5_ib_qp *mqp = to_mqp(qp);
3796038d2ef8SMaor Gottlieb 	struct mlx5_ib_flow_handler *handler = NULL;
3797038d2ef8SMaor Gottlieb 	struct mlx5_flow_destination *dst = NULL;
3798cc0e5d42SMaor Gottlieb 	struct mlx5_ib_flow_prio *ft_prio_tx = NULL;
3799038d2ef8SMaor Gottlieb 	struct mlx5_ib_flow_prio *ft_prio;
3800802c2125SAviad Yehezkel 	bool is_egress = flow_attr->flags & IB_FLOW_ATTR_FLAGS_EGRESS;
38013b3233fbSRaed Salem 	struct mlx5_ib_create_flow *ucmd = NULL, ucmd_hdr;
38023b3233fbSRaed Salem 	size_t min_ucmd_sz, required_ucmd_sz;
3803038d2ef8SMaor Gottlieb 	int err;
3804a550ddfcSYishai Hadas 	int underlay_qpn;
3805038d2ef8SMaor Gottlieb 
38063b3233fbSRaed Salem 	if (udata && udata->inlen) {
38073b3233fbSRaed Salem 		min_ucmd_sz = offsetof(typeof(ucmd_hdr), reserved) +
38083b3233fbSRaed Salem 				sizeof(ucmd_hdr.reserved);
38093b3233fbSRaed Salem 		if (udata->inlen < min_ucmd_sz)
381059082a32SMatan Barak 			return ERR_PTR(-EOPNOTSUPP);
381159082a32SMatan Barak 
38123b3233fbSRaed Salem 		err = ib_copy_from_udata(&ucmd_hdr, udata, min_ucmd_sz);
38133b3233fbSRaed Salem 		if (err)
38143b3233fbSRaed Salem 			return ERR_PTR(err);
38153b3233fbSRaed Salem 
38163b3233fbSRaed Salem 		/* currently supports only one counters data */
38173b3233fbSRaed Salem 		if (ucmd_hdr.ncounters_data > 1)
38183b3233fbSRaed Salem 			return ERR_PTR(-EINVAL);
38193b3233fbSRaed Salem 
38203b3233fbSRaed Salem 		required_ucmd_sz = min_ucmd_sz +
38213b3233fbSRaed Salem 			sizeof(struct mlx5_ib_flow_counters_data) *
38223b3233fbSRaed Salem 			ucmd_hdr.ncounters_data;
38233b3233fbSRaed Salem 		if (udata->inlen > required_ucmd_sz &&
38243b3233fbSRaed Salem 		    !ib_is_udata_cleared(udata, required_ucmd_sz,
38253b3233fbSRaed Salem 					 udata->inlen - required_ucmd_sz))
38263b3233fbSRaed Salem 			return ERR_PTR(-EOPNOTSUPP);
38273b3233fbSRaed Salem 
38283b3233fbSRaed Salem 		ucmd = kzalloc(required_ucmd_sz, GFP_KERNEL);
38293b3233fbSRaed Salem 		if (!ucmd)
38303b3233fbSRaed Salem 			return ERR_PTR(-ENOMEM);
38313b3233fbSRaed Salem 
38323b3233fbSRaed Salem 		err = ib_copy_from_udata(ucmd, udata, required_ucmd_sz);
3833299eafeeSGustavo A. R. Silva 		if (err)
3834299eafeeSGustavo A. R. Silva 			goto free_ucmd;
38353b3233fbSRaed Salem 	}
38363b3233fbSRaed Salem 
3837299eafeeSGustavo A. R. Silva 	if (flow_attr->priority > MLX5_IB_FLOW_LAST_PRIO) {
3838299eafeeSGustavo A. R. Silva 		err = -ENOMEM;
3839299eafeeSGustavo A. R. Silva 		goto free_ucmd;
3840299eafeeSGustavo A. R. Silva 	}
3841038d2ef8SMaor Gottlieb 
3842038d2ef8SMaor Gottlieb 	if (domain != IB_FLOW_DOMAIN_USER ||
3843508562d6SDaniel Jurgens 	    flow_attr->port > dev->num_ports ||
3844802c2125SAviad Yehezkel 	    (flow_attr->flags & ~(IB_FLOW_ATTR_FLAGS_DONT_TRAP |
3845299eafeeSGustavo A. R. Silva 				  IB_FLOW_ATTR_FLAGS_EGRESS))) {
3846299eafeeSGustavo A. R. Silva 		err = -EINVAL;
3847299eafeeSGustavo A. R. Silva 		goto free_ucmd;
3848299eafeeSGustavo A. R. Silva 	}
3849802c2125SAviad Yehezkel 
3850802c2125SAviad Yehezkel 	if (is_egress &&
3851802c2125SAviad Yehezkel 	    (flow_attr->type == IB_FLOW_ATTR_ALL_DEFAULT ||
3852299eafeeSGustavo A. R. Silva 	     flow_attr->type == IB_FLOW_ATTR_MC_DEFAULT)) {
3853299eafeeSGustavo A. R. Silva 		err = -EINVAL;
3854299eafeeSGustavo A. R. Silva 		goto free_ucmd;
3855299eafeeSGustavo A. R. Silva 	}
3856038d2ef8SMaor Gottlieb 
3857038d2ef8SMaor Gottlieb 	dst = kzalloc(sizeof(*dst), GFP_KERNEL);
3858299eafeeSGustavo A. R. Silva 	if (!dst) {
3859299eafeeSGustavo A. R. Silva 		err = -ENOMEM;
3860299eafeeSGustavo A. R. Silva 		goto free_ucmd;
3861299eafeeSGustavo A. R. Silva 	}
3862038d2ef8SMaor Gottlieb 
38639a4ca38dSMark Bloch 	mutex_lock(&dev->flow_db->lock);
3864038d2ef8SMaor Gottlieb 
3865802c2125SAviad Yehezkel 	ft_prio = get_flow_table(dev, flow_attr,
3866802c2125SAviad Yehezkel 				 is_egress ? MLX5_IB_FT_TX : MLX5_IB_FT_RX);
3867038d2ef8SMaor Gottlieb 	if (IS_ERR(ft_prio)) {
3868038d2ef8SMaor Gottlieb 		err = PTR_ERR(ft_prio);
3869038d2ef8SMaor Gottlieb 		goto unlock;
3870038d2ef8SMaor Gottlieb 	}
3871cc0e5d42SMaor Gottlieb 	if (flow_attr->type == IB_FLOW_ATTR_SNIFFER) {
3872cc0e5d42SMaor Gottlieb 		ft_prio_tx = get_flow_table(dev, flow_attr, MLX5_IB_FT_TX);
3873cc0e5d42SMaor Gottlieb 		if (IS_ERR(ft_prio_tx)) {
3874cc0e5d42SMaor Gottlieb 			err = PTR_ERR(ft_prio_tx);
3875cc0e5d42SMaor Gottlieb 			ft_prio_tx = NULL;
3876cc0e5d42SMaor Gottlieb 			goto destroy_ft;
3877cc0e5d42SMaor Gottlieb 		}
3878cc0e5d42SMaor Gottlieb 	}
3879038d2ef8SMaor Gottlieb 
3880802c2125SAviad Yehezkel 	if (is_egress) {
3881802c2125SAviad Yehezkel 		dst->type = MLX5_FLOW_DESTINATION_TYPE_PORT;
3882802c2125SAviad Yehezkel 	} else {
3883038d2ef8SMaor Gottlieb 		dst->type = MLX5_FLOW_DESTINATION_TYPE_TIR;
3884d9f88e5aSYishai Hadas 		if (mqp->flags & MLX5_IB_QP_RSS)
3885d9f88e5aSYishai Hadas 			dst->tir_num = mqp->rss_qp.tirn;
3886d9f88e5aSYishai Hadas 		else
3887d9f88e5aSYishai Hadas 			dst->tir_num = mqp->raw_packet_qp.rq.tirn;
3888802c2125SAviad Yehezkel 	}
3889038d2ef8SMaor Gottlieb 
3890038d2ef8SMaor Gottlieb 	if (flow_attr->type == IB_FLOW_ATTR_NORMAL) {
389135d19011SMaor Gottlieb 		if (flow_attr->flags & IB_FLOW_ATTR_FLAGS_DONT_TRAP)  {
389235d19011SMaor Gottlieb 			handler = create_dont_trap_rule(dev, ft_prio,
389335d19011SMaor Gottlieb 							flow_attr, dst);
389435d19011SMaor Gottlieb 		} else {
3895a550ddfcSYishai Hadas 			underlay_qpn = (mqp->flags & MLX5_IB_QP_UNDERLAY) ?
3896a550ddfcSYishai Hadas 					mqp->underlay_qpn : 0;
3897a550ddfcSYishai Hadas 			handler = _create_flow_rule(dev, ft_prio, flow_attr,
38983b3233fbSRaed Salem 						    dst, underlay_qpn, ucmd);
389935d19011SMaor Gottlieb 		}
3900038d2ef8SMaor Gottlieb 	} else if (flow_attr->type == IB_FLOW_ATTR_ALL_DEFAULT ||
3901038d2ef8SMaor Gottlieb 		   flow_attr->type == IB_FLOW_ATTR_MC_DEFAULT) {
3902038d2ef8SMaor Gottlieb 		handler = create_leftovers_rule(dev, ft_prio, flow_attr,
3903038d2ef8SMaor Gottlieb 						dst);
3904cc0e5d42SMaor Gottlieb 	} else if (flow_attr->type == IB_FLOW_ATTR_SNIFFER) {
3905cc0e5d42SMaor Gottlieb 		handler = create_sniffer_rule(dev, ft_prio, ft_prio_tx, dst);
3906038d2ef8SMaor Gottlieb 	} else {
3907038d2ef8SMaor Gottlieb 		err = -EINVAL;
3908038d2ef8SMaor Gottlieb 		goto destroy_ft;
3909038d2ef8SMaor Gottlieb 	}
3910038d2ef8SMaor Gottlieb 
3911038d2ef8SMaor Gottlieb 	if (IS_ERR(handler)) {
3912038d2ef8SMaor Gottlieb 		err = PTR_ERR(handler);
3913038d2ef8SMaor Gottlieb 		handler = NULL;
3914038d2ef8SMaor Gottlieb 		goto destroy_ft;
3915038d2ef8SMaor Gottlieb 	}
3916038d2ef8SMaor Gottlieb 
39179a4ca38dSMark Bloch 	mutex_unlock(&dev->flow_db->lock);
3918038d2ef8SMaor Gottlieb 	kfree(dst);
39193b3233fbSRaed Salem 	kfree(ucmd);
3920038d2ef8SMaor Gottlieb 
3921038d2ef8SMaor Gottlieb 	return &handler->ibflow;
3922038d2ef8SMaor Gottlieb 
3923038d2ef8SMaor Gottlieb destroy_ft:
3924038d2ef8SMaor Gottlieb 	put_flow_table(dev, ft_prio, false);
3925cc0e5d42SMaor Gottlieb 	if (ft_prio_tx)
3926cc0e5d42SMaor Gottlieb 		put_flow_table(dev, ft_prio_tx, false);
3927038d2ef8SMaor Gottlieb unlock:
39289a4ca38dSMark Bloch 	mutex_unlock(&dev->flow_db->lock);
3929038d2ef8SMaor Gottlieb 	kfree(dst);
3930299eafeeSGustavo A. R. Silva free_ucmd:
39313b3233fbSRaed Salem 	kfree(ucmd);
3932038d2ef8SMaor Gottlieb 	return ERR_PTR(err);
3933038d2ef8SMaor Gottlieb }
3934038d2ef8SMaor Gottlieb 
3935b47fd4ffSMark Bloch static struct mlx5_ib_flow_prio *
3936b47fd4ffSMark Bloch _get_flow_table(struct mlx5_ib_dev *dev,
3937b47fd4ffSMark Bloch 		struct mlx5_ib_flow_matcher *fs_matcher,
3938b47fd4ffSMark Bloch 		bool mcast)
3939d4be3f44SYishai Hadas {
3940d4be3f44SYishai Hadas 	struct mlx5_flow_namespace *ns = NULL;
394113a43765SMark Bloch 	struct mlx5_ib_flow_prio *prio = NULL;
394213a43765SMark Bloch 	int max_table_size = 0;
3943cecae747SMaor Gottlieb 	bool esw_encap;
3944b47fd4ffSMark Bloch 	u32 flags = 0;
3945b47fd4ffSMark Bloch 	int priority;
3946d4be3f44SYishai Hadas 
394713a43765SMark Bloch 	if (mcast)
394813a43765SMark Bloch 		priority = MLX5_IB_FLOW_MCAST_PRIO;
394913a43765SMark Bloch 	else
395013a43765SMark Bloch 		priority = ib_prio_to_core_prio(fs_matcher->priority, false);
395113a43765SMark Bloch 
3952cecae747SMaor Gottlieb 	esw_encap = mlx5_eswitch_get_encap_mode(dev->mdev) !=
3953cecae747SMaor Gottlieb 		DEVLINK_ESWITCH_ENCAP_MODE_NONE;
3954b47fd4ffSMark Bloch 	if (fs_matcher->ns_type == MLX5_FLOW_NAMESPACE_BYPASS) {
3955d4be3f44SYishai Hadas 		max_table_size = BIT(MLX5_CAP_FLOWTABLE_NIC_RX(dev->mdev,
3956d4be3f44SYishai Hadas 					log_max_ft_size));
3957cecae747SMaor Gottlieb 		if (MLX5_CAP_FLOWTABLE_NIC_RX(dev->mdev, decap) && !esw_encap)
3958b47fd4ffSMark Bloch 			flags |= MLX5_FLOW_TABLE_TUNNEL_EN_DECAP;
3959b47fd4ffSMark Bloch 		if (MLX5_CAP_FLOWTABLE_NIC_RX(dev->mdev,
3960cecae747SMaor Gottlieb 					      reformat_l3_tunnel_to_l2) &&
3961cecae747SMaor Gottlieb 		    !esw_encap)
3962b47fd4ffSMark Bloch 			flags |= MLX5_FLOW_TABLE_TUNNEL_EN_REFORMAT;
396313a43765SMark Bloch 	} else if (fs_matcher->ns_type == MLX5_FLOW_NAMESPACE_EGRESS) {
396413a43765SMark Bloch 		max_table_size = BIT(
396513a43765SMark Bloch 			MLX5_CAP_FLOWTABLE_NIC_TX(dev->mdev, log_max_ft_size));
3966cecae747SMaor Gottlieb 		if (MLX5_CAP_FLOWTABLE_NIC_TX(dev->mdev, reformat) && !esw_encap)
3967b47fd4ffSMark Bloch 			flags |= MLX5_FLOW_TABLE_TUNNEL_EN_REFORMAT;
396813a43765SMark Bloch 	} else if (fs_matcher->ns_type == MLX5_FLOW_NAMESPACE_FDB) {
396913a43765SMark Bloch 		max_table_size = BIT(
397013a43765SMark Bloch 			MLX5_CAP_ESW_FLOWTABLE_FDB(dev->mdev, log_max_ft_size));
397109d985beSMaor Gottlieb 		if (MLX5_CAP_ESW_FLOWTABLE_FDB(dev->mdev, decap) && esw_encap)
397209d985beSMaor Gottlieb 			flags |= MLX5_FLOW_TABLE_TUNNEL_EN_DECAP;
397309d985beSMaor Gottlieb 		if (MLX5_CAP_ESW_FLOWTABLE_FDB(dev->mdev, reformat_l3_tunnel_to_l2) &&
397409d985beSMaor Gottlieb 		    esw_encap)
397509d985beSMaor Gottlieb 			flags |= MLX5_FLOW_TABLE_TUNNEL_EN_REFORMAT;
397613a43765SMark Bloch 		priority = FDB_BYPASS_PATH;
3977d8abe884SMark Zhang 	} else if (fs_matcher->ns_type == MLX5_FLOW_NAMESPACE_RDMA_RX) {
3978d8abe884SMark Zhang 		max_table_size =
3979d8abe884SMark Zhang 			BIT(MLX5_CAP_FLOWTABLE_RDMA_RX(dev->mdev,
3980d8abe884SMark Zhang 						       log_max_ft_size));
3981d8abe884SMark Zhang 		priority = fs_matcher->priority;
3982b47fd4ffSMark Bloch 	}
3983b47fd4ffSMark Bloch 
39843b70508aSMark Bloch 	max_table_size = min_t(int, max_table_size, MLX5_FS_MAX_ENTRIES);
3985d4be3f44SYishai Hadas 
3986b47fd4ffSMark Bloch 	ns = mlx5_get_flow_namespace(dev->mdev, fs_matcher->ns_type);
3987d4be3f44SYishai Hadas 	if (!ns)
3988d4be3f44SYishai Hadas 		return ERR_PTR(-ENOTSUPP);
3989d4be3f44SYishai Hadas 
3990b47fd4ffSMark Bloch 	if (fs_matcher->ns_type == MLX5_FLOW_NAMESPACE_BYPASS)
3991d4be3f44SYishai Hadas 		prio = &dev->flow_db->prios[priority];
399213a43765SMark Bloch 	else if (fs_matcher->ns_type == MLX5_FLOW_NAMESPACE_EGRESS)
3993b47fd4ffSMark Bloch 		prio = &dev->flow_db->egress_prios[priority];
399413a43765SMark Bloch 	else if (fs_matcher->ns_type == MLX5_FLOW_NAMESPACE_FDB)
399513a43765SMark Bloch 		prio = &dev->flow_db->fdb;
3996d8abe884SMark Zhang 	else if (fs_matcher->ns_type == MLX5_FLOW_NAMESPACE_RDMA_RX)
3997d8abe884SMark Zhang 		prio = &dev->flow_db->rdma_rx[priority];
399813a43765SMark Bloch 
399913a43765SMark Bloch 	if (!prio)
400013a43765SMark Bloch 		return ERR_PTR(-EINVAL);
4001d4be3f44SYishai Hadas 
4002d4be3f44SYishai Hadas 	if (prio->flow_table)
4003d4be3f44SYishai Hadas 		return prio;
4004d4be3f44SYishai Hadas 
40053b70508aSMark Bloch 	return _get_prio(ns, prio, priority, max_table_size,
4006b47fd4ffSMark Bloch 			 MLX5_FS_MAX_TYPES, flags);
4007d4be3f44SYishai Hadas }
4008d4be3f44SYishai Hadas 
4009d4be3f44SYishai Hadas static struct mlx5_ib_flow_handler *
4010d4be3f44SYishai Hadas _create_raw_flow_rule(struct mlx5_ib_dev *dev,
4011d4be3f44SYishai Hadas 		      struct mlx5_ib_flow_prio *ft_prio,
4012d4be3f44SYishai Hadas 		      struct mlx5_flow_destination *dst,
4013d4be3f44SYishai Hadas 		      struct mlx5_ib_flow_matcher  *fs_matcher,
4014bb0ee7dcSJianbo Liu 		      struct mlx5_flow_context *flow_context,
4015b823dd6dSMark Bloch 		      struct mlx5_flow_act *flow_act,
4016bfc5d839SMark Bloch 		      void *cmd_in, int inlen,
4017bfc5d839SMark Bloch 		      int dst_num)
4018d4be3f44SYishai Hadas {
4019d4be3f44SYishai Hadas 	struct mlx5_ib_flow_handler *handler;
4020d4be3f44SYishai Hadas 	struct mlx5_flow_spec *spec;
4021d4be3f44SYishai Hadas 	struct mlx5_flow_table *ft = ft_prio->flow_table;
4022d4be3f44SYishai Hadas 	int err = 0;
4023d4be3f44SYishai Hadas 
4024d4be3f44SYishai Hadas 	spec = kvzalloc(sizeof(*spec), GFP_KERNEL);
4025d4be3f44SYishai Hadas 	handler = kzalloc(sizeof(*handler), GFP_KERNEL);
4026d4be3f44SYishai Hadas 	if (!handler || !spec) {
4027d4be3f44SYishai Hadas 		err = -ENOMEM;
4028d4be3f44SYishai Hadas 		goto free;
4029d4be3f44SYishai Hadas 	}
4030d4be3f44SYishai Hadas 
4031d4be3f44SYishai Hadas 	INIT_LIST_HEAD(&handler->list);
4032d4be3f44SYishai Hadas 
4033d4be3f44SYishai Hadas 	memcpy(spec->match_value, cmd_in, inlen);
4034d4be3f44SYishai Hadas 	memcpy(spec->match_criteria, fs_matcher->matcher_mask.match_params,
4035d4be3f44SYishai Hadas 	       fs_matcher->mask_len);
4036d4be3f44SYishai Hadas 	spec->match_criteria_enable = fs_matcher->match_criteria_enable;
4037bb0ee7dcSJianbo Liu 	spec->flow_context = *flow_context;
4038d4be3f44SYishai Hadas 
4039d4be3f44SYishai Hadas 	handler->rule = mlx5_add_flow_rules(ft, spec,
4040bfc5d839SMark Bloch 					    flow_act, dst, dst_num);
4041d4be3f44SYishai Hadas 
4042d4be3f44SYishai Hadas 	if (IS_ERR(handler->rule)) {
4043d4be3f44SYishai Hadas 		err = PTR_ERR(handler->rule);
4044d4be3f44SYishai Hadas 		goto free;
4045d4be3f44SYishai Hadas 	}
4046d4be3f44SYishai Hadas 
4047d4be3f44SYishai Hadas 	ft_prio->refcount++;
4048d4be3f44SYishai Hadas 	handler->prio = ft_prio;
4049d4be3f44SYishai Hadas 	handler->dev = dev;
4050d4be3f44SYishai Hadas 	ft_prio->flow_table = ft;
4051d4be3f44SYishai Hadas 
4052d4be3f44SYishai Hadas free:
4053d4be3f44SYishai Hadas 	if (err)
4054d4be3f44SYishai Hadas 		kfree(handler);
4055d4be3f44SYishai Hadas 	kvfree(spec);
4056d4be3f44SYishai Hadas 	return err ? ERR_PTR(err) : handler;
4057d4be3f44SYishai Hadas }
4058d4be3f44SYishai Hadas 
4059d4be3f44SYishai Hadas static bool raw_fs_is_multicast(struct mlx5_ib_flow_matcher *fs_matcher,
4060d4be3f44SYishai Hadas 				void *match_v)
4061d4be3f44SYishai Hadas {
4062d4be3f44SYishai Hadas 	void *match_c;
4063d4be3f44SYishai Hadas 	void *match_v_set_lyr_2_4, *match_c_set_lyr_2_4;
4064d4be3f44SYishai Hadas 	void *dmac, *dmac_mask;
4065d4be3f44SYishai Hadas 	void *ipv4, *ipv4_mask;
4066d4be3f44SYishai Hadas 
4067d4be3f44SYishai Hadas 	if (!(fs_matcher->match_criteria_enable &
4068d4be3f44SYishai Hadas 	      (1 << MATCH_CRITERIA_ENABLE_OUTER_BIT)))
4069d4be3f44SYishai Hadas 		return false;
4070d4be3f44SYishai Hadas 
4071d4be3f44SYishai Hadas 	match_c = fs_matcher->matcher_mask.match_params;
4072d4be3f44SYishai Hadas 	match_v_set_lyr_2_4 = MLX5_ADDR_OF(fte_match_param, match_v,
4073d4be3f44SYishai Hadas 					   outer_headers);
4074d4be3f44SYishai Hadas 	match_c_set_lyr_2_4 = MLX5_ADDR_OF(fte_match_param, match_c,
4075d4be3f44SYishai Hadas 					   outer_headers);
4076d4be3f44SYishai Hadas 
4077d4be3f44SYishai Hadas 	dmac = MLX5_ADDR_OF(fte_match_set_lyr_2_4, match_v_set_lyr_2_4,
4078d4be3f44SYishai Hadas 			    dmac_47_16);
4079d4be3f44SYishai Hadas 	dmac_mask = MLX5_ADDR_OF(fte_match_set_lyr_2_4, match_c_set_lyr_2_4,
4080d4be3f44SYishai Hadas 				 dmac_47_16);
4081d4be3f44SYishai Hadas 
4082d4be3f44SYishai Hadas 	if (is_multicast_ether_addr(dmac) &&
4083d4be3f44SYishai Hadas 	    is_multicast_ether_addr(dmac_mask))
4084d4be3f44SYishai Hadas 		return true;
4085d4be3f44SYishai Hadas 
4086d4be3f44SYishai Hadas 	ipv4 = MLX5_ADDR_OF(fte_match_set_lyr_2_4, match_v_set_lyr_2_4,
4087d4be3f44SYishai Hadas 			    dst_ipv4_dst_ipv6.ipv4_layout.ipv4);
4088d4be3f44SYishai Hadas 
4089d4be3f44SYishai Hadas 	ipv4_mask = MLX5_ADDR_OF(fte_match_set_lyr_2_4, match_c_set_lyr_2_4,
4090d4be3f44SYishai Hadas 				 dst_ipv4_dst_ipv6.ipv4_layout.ipv4);
4091d4be3f44SYishai Hadas 
4092d4be3f44SYishai Hadas 	if (ipv4_is_multicast(*(__be32 *)(ipv4)) &&
4093d4be3f44SYishai Hadas 	    ipv4_is_multicast(*(__be32 *)(ipv4_mask)))
4094d4be3f44SYishai Hadas 		return true;
4095d4be3f44SYishai Hadas 
4096d4be3f44SYishai Hadas 	return false;
4097d4be3f44SYishai Hadas }
4098d4be3f44SYishai Hadas 
409932269441SYishai Hadas struct mlx5_ib_flow_handler *
410032269441SYishai Hadas mlx5_ib_raw_fs_rule_add(struct mlx5_ib_dev *dev,
410132269441SYishai Hadas 			struct mlx5_ib_flow_matcher *fs_matcher,
4102bb0ee7dcSJianbo Liu 			struct mlx5_flow_context *flow_context,
4103b823dd6dSMark Bloch 			struct mlx5_flow_act *flow_act,
4104bfc5d839SMark Bloch 			u32 counter_id,
410532269441SYishai Hadas 			void *cmd_in, int inlen, int dest_id,
410632269441SYishai Hadas 			int dest_type)
410732269441SYishai Hadas {
4108d4be3f44SYishai Hadas 	struct mlx5_flow_destination *dst;
4109d4be3f44SYishai Hadas 	struct mlx5_ib_flow_prio *ft_prio;
4110d4be3f44SYishai Hadas 	struct mlx5_ib_flow_handler *handler;
4111bfc5d839SMark Bloch 	int dst_num = 0;
4112d4be3f44SYishai Hadas 	bool mcast;
4113d4be3f44SYishai Hadas 	int err;
4114d4be3f44SYishai Hadas 
4115d4be3f44SYishai Hadas 	if (fs_matcher->flow_type != MLX5_IB_FLOW_TYPE_NORMAL)
411632269441SYishai Hadas 		return ERR_PTR(-EOPNOTSUPP);
4117d4be3f44SYishai Hadas 
4118d4be3f44SYishai Hadas 	if (fs_matcher->priority > MLX5_IB_FLOW_LAST_PRIO)
4119d4be3f44SYishai Hadas 		return ERR_PTR(-ENOMEM);
4120d4be3f44SYishai Hadas 
41218e8aa145SGustavo A. R. Silva 	dst = kcalloc(2, sizeof(*dst), GFP_KERNEL);
4122d4be3f44SYishai Hadas 	if (!dst)
4123d4be3f44SYishai Hadas 		return ERR_PTR(-ENOMEM);
4124d4be3f44SYishai Hadas 
4125d4be3f44SYishai Hadas 	mcast = raw_fs_is_multicast(fs_matcher, cmd_in);
4126d4be3f44SYishai Hadas 	mutex_lock(&dev->flow_db->lock);
4127d4be3f44SYishai Hadas 
4128b47fd4ffSMark Bloch 	ft_prio = _get_flow_table(dev, fs_matcher, mcast);
4129d4be3f44SYishai Hadas 	if (IS_ERR(ft_prio)) {
4130d4be3f44SYishai Hadas 		err = PTR_ERR(ft_prio);
4131d4be3f44SYishai Hadas 		goto unlock;
4132d4be3f44SYishai Hadas 	}
4133d4be3f44SYishai Hadas 
41346346f0bfSYishai Hadas 	if (dest_type == MLX5_FLOW_DESTINATION_TYPE_TIR) {
4135bfc5d839SMark Bloch 		dst[dst_num].type = dest_type;
4136bfc5d839SMark Bloch 		dst[dst_num].tir_num = dest_id;
4137b823dd6dSMark Bloch 		flow_act->action |= MLX5_FLOW_CONTEXT_ACTION_FWD_DEST;
4138a7ee18bdSMark Bloch 	} else if (dest_type == MLX5_FLOW_DESTINATION_TYPE_FLOW_TABLE) {
4139bfc5d839SMark Bloch 		dst[dst_num].type = MLX5_FLOW_DESTINATION_TYPE_FLOW_TABLE_NUM;
4140bfc5d839SMark Bloch 		dst[dst_num].ft_num = dest_id;
4141b823dd6dSMark Bloch 		flow_act->action |= MLX5_FLOW_CONTEXT_ACTION_FWD_DEST;
4142a7ee18bdSMark Bloch 	} else {
4143bfc5d839SMark Bloch 		dst[dst_num].type = MLX5_FLOW_DESTINATION_TYPE_PORT;
4144a7ee18bdSMark Bloch 		flow_act->action |= MLX5_FLOW_CONTEXT_ACTION_ALLOW;
41456346f0bfSYishai Hadas 	}
41466346f0bfSYishai Hadas 
4147bfc5d839SMark Bloch 	dst_num++;
4148bfc5d839SMark Bloch 
4149bfc5d839SMark Bloch 	if (flow_act->action & MLX5_FLOW_CONTEXT_ACTION_COUNT) {
4150bfc5d839SMark Bloch 		dst[dst_num].type = MLX5_FLOW_DESTINATION_TYPE_COUNTER;
4151bfc5d839SMark Bloch 		dst[dst_num].counter_id = counter_id;
4152bfc5d839SMark Bloch 		dst_num++;
4153bfc5d839SMark Bloch 	}
4154bfc5d839SMark Bloch 
4155bb0ee7dcSJianbo Liu 	handler = _create_raw_flow_rule(dev, ft_prio, dst, fs_matcher,
4156bb0ee7dcSJianbo Liu 					flow_context, flow_act,
4157bfc5d839SMark Bloch 					cmd_in, inlen, dst_num);
4158d4be3f44SYishai Hadas 
4159d4be3f44SYishai Hadas 	if (IS_ERR(handler)) {
4160d4be3f44SYishai Hadas 		err = PTR_ERR(handler);
4161d4be3f44SYishai Hadas 		goto destroy_ft;
4162d4be3f44SYishai Hadas 	}
4163d4be3f44SYishai Hadas 
4164d4be3f44SYishai Hadas 	mutex_unlock(&dev->flow_db->lock);
4165d4be3f44SYishai Hadas 	atomic_inc(&fs_matcher->usecnt);
4166d4be3f44SYishai Hadas 	handler->flow_matcher = fs_matcher;
4167d4be3f44SYishai Hadas 
4168d4be3f44SYishai Hadas 	kfree(dst);
4169d4be3f44SYishai Hadas 
4170d4be3f44SYishai Hadas 	return handler;
4171d4be3f44SYishai Hadas 
4172d4be3f44SYishai Hadas destroy_ft:
4173d4be3f44SYishai Hadas 	put_flow_table(dev, ft_prio, false);
4174d4be3f44SYishai Hadas unlock:
4175d4be3f44SYishai Hadas 	mutex_unlock(&dev->flow_db->lock);
4176d4be3f44SYishai Hadas 	kfree(dst);
4177d4be3f44SYishai Hadas 
4178d4be3f44SYishai Hadas 	return ERR_PTR(err);
417932269441SYishai Hadas }
418032269441SYishai Hadas 
4181c6475a0bSAviad Yehezkel static u32 mlx5_ib_flow_action_flags_to_accel_xfrm_flags(u32 mlx5_flags)
4182c6475a0bSAviad Yehezkel {
4183c6475a0bSAviad Yehezkel 	u32 flags = 0;
4184c6475a0bSAviad Yehezkel 
4185c6475a0bSAviad Yehezkel 	if (mlx5_flags & MLX5_IB_UAPI_FLOW_ACTION_FLAGS_REQUIRE_METADATA)
4186c6475a0bSAviad Yehezkel 		flags |= MLX5_ACCEL_XFRM_FLAG_REQUIRE_METADATA;
4187c6475a0bSAviad Yehezkel 
4188c6475a0bSAviad Yehezkel 	return flags;
4189c6475a0bSAviad Yehezkel }
4190c6475a0bSAviad Yehezkel 
4191c6475a0bSAviad Yehezkel #define MLX5_FLOW_ACTION_ESP_CREATE_LAST_SUPPORTED	MLX5_IB_UAPI_FLOW_ACTION_FLAGS_REQUIRE_METADATA
4192c6475a0bSAviad Yehezkel static struct ib_flow_action *
4193c6475a0bSAviad Yehezkel mlx5_ib_create_flow_action_esp(struct ib_device *device,
4194c6475a0bSAviad Yehezkel 			       const struct ib_flow_action_attrs_esp *attr,
4195c6475a0bSAviad Yehezkel 			       struct uverbs_attr_bundle *attrs)
4196c6475a0bSAviad Yehezkel {
4197c6475a0bSAviad Yehezkel 	struct mlx5_ib_dev *mdev = to_mdev(device);
4198c6475a0bSAviad Yehezkel 	struct ib_uverbs_flow_action_esp_keymat_aes_gcm *aes_gcm;
4199c6475a0bSAviad Yehezkel 	struct mlx5_accel_esp_xfrm_attrs accel_attrs = {};
4200c6475a0bSAviad Yehezkel 	struct mlx5_ib_flow_action *action;
4201c6475a0bSAviad Yehezkel 	u64 action_flags;
4202c6475a0bSAviad Yehezkel 	u64 flags;
4203c6475a0bSAviad Yehezkel 	int err = 0;
4204c6475a0bSAviad Yehezkel 
4205bccd0622SJason Gunthorpe 	err = uverbs_get_flags64(
4206bccd0622SJason Gunthorpe 		&action_flags, attrs, MLX5_IB_ATTR_CREATE_FLOW_ACTION_FLAGS,
4207bccd0622SJason Gunthorpe 		((MLX5_FLOW_ACTION_ESP_CREATE_LAST_SUPPORTED << 1) - 1));
4208bccd0622SJason Gunthorpe 	if (err)
4209bccd0622SJason Gunthorpe 		return ERR_PTR(err);
4210c6475a0bSAviad Yehezkel 
4211c6475a0bSAviad Yehezkel 	flags = mlx5_ib_flow_action_flags_to_accel_xfrm_flags(action_flags);
4212c6475a0bSAviad Yehezkel 
4213c6475a0bSAviad Yehezkel 	/* We current only support a subset of the standard features. Only a
4214c6475a0bSAviad Yehezkel 	 * keymat of type AES_GCM, with icv_len == 16, iv_algo == SEQ and esn
4215c6475a0bSAviad Yehezkel 	 * (with overlap). Full offload mode isn't supported.
4216c6475a0bSAviad Yehezkel 	 */
4217c6475a0bSAviad Yehezkel 	if (!attr->keymat || attr->replay || attr->encap ||
4218c6475a0bSAviad Yehezkel 	    attr->spi || attr->seq || attr->tfc_pad ||
4219c6475a0bSAviad Yehezkel 	    attr->hard_limit_pkts ||
4220c6475a0bSAviad Yehezkel 	    (attr->flags & ~(IB_FLOW_ACTION_ESP_FLAGS_ESN_TRIGGERED |
4221c6475a0bSAviad Yehezkel 			     IB_UVERBS_FLOW_ACTION_ESP_FLAGS_ENCRYPT)))
4222c6475a0bSAviad Yehezkel 		return ERR_PTR(-EOPNOTSUPP);
4223c6475a0bSAviad Yehezkel 
4224c6475a0bSAviad Yehezkel 	if (attr->keymat->protocol !=
4225c6475a0bSAviad Yehezkel 	    IB_UVERBS_FLOW_ACTION_ESP_KEYMAT_AES_GCM)
4226c6475a0bSAviad Yehezkel 		return ERR_PTR(-EOPNOTSUPP);
4227c6475a0bSAviad Yehezkel 
4228c6475a0bSAviad Yehezkel 	aes_gcm = &attr->keymat->keymat.aes_gcm;
4229c6475a0bSAviad Yehezkel 
4230c6475a0bSAviad Yehezkel 	if (aes_gcm->icv_len != 16 ||
4231c6475a0bSAviad Yehezkel 	    aes_gcm->iv_algo != IB_UVERBS_FLOW_ACTION_IV_ALGO_SEQ)
4232c6475a0bSAviad Yehezkel 		return ERR_PTR(-EOPNOTSUPP);
4233c6475a0bSAviad Yehezkel 
4234c6475a0bSAviad Yehezkel 	action = kmalloc(sizeof(*action), GFP_KERNEL);
4235c6475a0bSAviad Yehezkel 	if (!action)
4236c6475a0bSAviad Yehezkel 		return ERR_PTR(-ENOMEM);
4237c6475a0bSAviad Yehezkel 
4238c6475a0bSAviad Yehezkel 	action->esp_aes_gcm.ib_flags = attr->flags;
4239c6475a0bSAviad Yehezkel 	memcpy(&accel_attrs.keymat.aes_gcm.aes_key, &aes_gcm->aes_key,
4240c6475a0bSAviad Yehezkel 	       sizeof(accel_attrs.keymat.aes_gcm.aes_key));
4241c6475a0bSAviad Yehezkel 	accel_attrs.keymat.aes_gcm.key_len = aes_gcm->key_len * 8;
4242c6475a0bSAviad Yehezkel 	memcpy(&accel_attrs.keymat.aes_gcm.salt, &aes_gcm->salt,
4243c6475a0bSAviad Yehezkel 	       sizeof(accel_attrs.keymat.aes_gcm.salt));
4244c6475a0bSAviad Yehezkel 	memcpy(&accel_attrs.keymat.aes_gcm.seq_iv, &aes_gcm->iv,
4245c6475a0bSAviad Yehezkel 	       sizeof(accel_attrs.keymat.aes_gcm.seq_iv));
4246c6475a0bSAviad Yehezkel 	accel_attrs.keymat.aes_gcm.icv_len = aes_gcm->icv_len * 8;
4247c6475a0bSAviad Yehezkel 	accel_attrs.keymat.aes_gcm.iv_algo = MLX5_ACCEL_ESP_AES_GCM_IV_ALGO_SEQ;
4248c6475a0bSAviad Yehezkel 	accel_attrs.keymat_type = MLX5_ACCEL_ESP_KEYMAT_AES_GCM;
4249c6475a0bSAviad Yehezkel 
4250c6475a0bSAviad Yehezkel 	accel_attrs.esn = attr->esn;
4251c6475a0bSAviad Yehezkel 	if (attr->flags & IB_FLOW_ACTION_ESP_FLAGS_ESN_TRIGGERED)
4252c6475a0bSAviad Yehezkel 		accel_attrs.flags |= MLX5_ACCEL_ESP_FLAGS_ESN_TRIGGERED;
4253c6475a0bSAviad Yehezkel 	if (attr->flags & IB_UVERBS_FLOW_ACTION_ESP_FLAGS_ESN_NEW_WINDOW)
4254c6475a0bSAviad Yehezkel 		accel_attrs.flags |= MLX5_ACCEL_ESP_FLAGS_ESN_STATE_OVERLAP;
4255c6475a0bSAviad Yehezkel 
4256c6475a0bSAviad Yehezkel 	if (attr->flags & IB_UVERBS_FLOW_ACTION_ESP_FLAGS_ENCRYPT)
4257c6475a0bSAviad Yehezkel 		accel_attrs.action |= MLX5_ACCEL_ESP_ACTION_ENCRYPT;
4258c6475a0bSAviad Yehezkel 
4259c6475a0bSAviad Yehezkel 	action->esp_aes_gcm.ctx =
4260c6475a0bSAviad Yehezkel 		mlx5_accel_esp_create_xfrm(mdev->mdev, &accel_attrs, flags);
4261c6475a0bSAviad Yehezkel 	if (IS_ERR(action->esp_aes_gcm.ctx)) {
4262c6475a0bSAviad Yehezkel 		err = PTR_ERR(action->esp_aes_gcm.ctx);
4263c6475a0bSAviad Yehezkel 		goto err_parse;
4264c6475a0bSAviad Yehezkel 	}
4265c6475a0bSAviad Yehezkel 
4266c6475a0bSAviad Yehezkel 	action->esp_aes_gcm.ib_flags = attr->flags;
4267c6475a0bSAviad Yehezkel 
4268c6475a0bSAviad Yehezkel 	return &action->ib_action;
4269c6475a0bSAviad Yehezkel 
4270c6475a0bSAviad Yehezkel err_parse:
4271c6475a0bSAviad Yehezkel 	kfree(action);
4272c6475a0bSAviad Yehezkel 	return ERR_PTR(err);
4273c6475a0bSAviad Yehezkel }
4274c6475a0bSAviad Yehezkel 
4275349705c1SMatan Barak static int
4276349705c1SMatan Barak mlx5_ib_modify_flow_action_esp(struct ib_flow_action *action,
4277349705c1SMatan Barak 			       const struct ib_flow_action_attrs_esp *attr,
4278349705c1SMatan Barak 			       struct uverbs_attr_bundle *attrs)
4279349705c1SMatan Barak {
4280349705c1SMatan Barak 	struct mlx5_ib_flow_action *maction = to_mflow_act(action);
4281349705c1SMatan Barak 	struct mlx5_accel_esp_xfrm_attrs accel_attrs;
4282349705c1SMatan Barak 	int err = 0;
4283349705c1SMatan Barak 
4284349705c1SMatan Barak 	if (attr->keymat || attr->replay || attr->encap ||
4285349705c1SMatan Barak 	    attr->spi || attr->seq || attr->tfc_pad ||
4286349705c1SMatan Barak 	    attr->hard_limit_pkts ||
4287349705c1SMatan Barak 	    (attr->flags & ~(IB_FLOW_ACTION_ESP_FLAGS_ESN_TRIGGERED |
4288349705c1SMatan Barak 			     IB_FLOW_ACTION_ESP_FLAGS_MOD_ESP_ATTRS |
4289349705c1SMatan Barak 			     IB_UVERBS_FLOW_ACTION_ESP_FLAGS_ESN_NEW_WINDOW)))
4290349705c1SMatan Barak 		return -EOPNOTSUPP;
4291349705c1SMatan Barak 
4292349705c1SMatan Barak 	/* Only the ESN value or the MLX5_ACCEL_ESP_FLAGS_ESN_STATE_OVERLAP can
4293349705c1SMatan Barak 	 * be modified.
4294349705c1SMatan Barak 	 */
4295349705c1SMatan Barak 	if (!(maction->esp_aes_gcm.ib_flags &
4296349705c1SMatan Barak 	      IB_FLOW_ACTION_ESP_FLAGS_ESN_TRIGGERED) &&
4297349705c1SMatan Barak 	    attr->flags & (IB_FLOW_ACTION_ESP_FLAGS_ESN_TRIGGERED |
4298349705c1SMatan Barak 			   IB_UVERBS_FLOW_ACTION_ESP_FLAGS_ESN_NEW_WINDOW))
4299349705c1SMatan Barak 		return -EINVAL;
4300349705c1SMatan Barak 
4301349705c1SMatan Barak 	memcpy(&accel_attrs, &maction->esp_aes_gcm.ctx->attrs,
4302349705c1SMatan Barak 	       sizeof(accel_attrs));
4303349705c1SMatan Barak 
4304349705c1SMatan Barak 	accel_attrs.esn = attr->esn;
4305349705c1SMatan Barak 	if (attr->flags & IB_UVERBS_FLOW_ACTION_ESP_FLAGS_ESN_NEW_WINDOW)
4306349705c1SMatan Barak 		accel_attrs.flags |= MLX5_ACCEL_ESP_FLAGS_ESN_STATE_OVERLAP;
4307349705c1SMatan Barak 	else
4308349705c1SMatan Barak 		accel_attrs.flags &= ~MLX5_ACCEL_ESP_FLAGS_ESN_STATE_OVERLAP;
4309349705c1SMatan Barak 
4310349705c1SMatan Barak 	err = mlx5_accel_esp_modify_xfrm(maction->esp_aes_gcm.ctx,
4311349705c1SMatan Barak 					 &accel_attrs);
4312349705c1SMatan Barak 	if (err)
4313349705c1SMatan Barak 		return err;
4314349705c1SMatan Barak 
4315349705c1SMatan Barak 	maction->esp_aes_gcm.ib_flags &=
4316349705c1SMatan Barak 		~IB_UVERBS_FLOW_ACTION_ESP_FLAGS_ESN_NEW_WINDOW;
4317349705c1SMatan Barak 	maction->esp_aes_gcm.ib_flags |=
4318349705c1SMatan Barak 		attr->flags & IB_UVERBS_FLOW_ACTION_ESP_FLAGS_ESN_NEW_WINDOW;
4319349705c1SMatan Barak 
4320349705c1SMatan Barak 	return 0;
4321349705c1SMatan Barak }
4322349705c1SMatan Barak 
4323c6475a0bSAviad Yehezkel static int mlx5_ib_destroy_flow_action(struct ib_flow_action *action)
4324c6475a0bSAviad Yehezkel {
4325c6475a0bSAviad Yehezkel 	struct mlx5_ib_flow_action *maction = to_mflow_act(action);
4326c6475a0bSAviad Yehezkel 
4327c6475a0bSAviad Yehezkel 	switch (action->type) {
4328c6475a0bSAviad Yehezkel 	case IB_FLOW_ACTION_ESP:
4329c6475a0bSAviad Yehezkel 		/*
4330c6475a0bSAviad Yehezkel 		 * We only support aes_gcm by now, so we implicitly know this is
4331c6475a0bSAviad Yehezkel 		 * the underline crypto.
4332c6475a0bSAviad Yehezkel 		 */
4333c6475a0bSAviad Yehezkel 		mlx5_accel_esp_destroy_xfrm(maction->esp_aes_gcm.ctx);
4334c6475a0bSAviad Yehezkel 		break;
4335b4749bf2SMark Bloch 	case IB_FLOW_ACTION_UNSPECIFIED:
4336b4749bf2SMark Bloch 		mlx5_ib_destroy_flow_action_raw(maction);
4337b4749bf2SMark Bloch 		break;
4338c6475a0bSAviad Yehezkel 	default:
4339c6475a0bSAviad Yehezkel 		WARN_ON(true);
4340c6475a0bSAviad Yehezkel 		break;
4341c6475a0bSAviad Yehezkel 	}
4342c6475a0bSAviad Yehezkel 
4343c6475a0bSAviad Yehezkel 	kfree(maction);
4344c6475a0bSAviad Yehezkel 	return 0;
4345c6475a0bSAviad Yehezkel }
4346c6475a0bSAviad Yehezkel 
4347e126ba97SEli Cohen static int mlx5_ib_mcg_attach(struct ib_qp *ibqp, union ib_gid *gid, u16 lid)
4348e126ba97SEli Cohen {
4349e126ba97SEli Cohen 	struct mlx5_ib_dev *dev = to_mdev(ibqp->device);
435081e30880SYishai Hadas 	struct mlx5_ib_qp *mqp = to_mqp(ibqp);
4351e126ba97SEli Cohen 	int err;
4352539ec982SYishai Hadas 	u16 uid;
4353539ec982SYishai Hadas 
4354539ec982SYishai Hadas 	uid = ibqp->pd ?
4355539ec982SYishai Hadas 		to_mpd(ibqp->pd)->uid : 0;
4356e126ba97SEli Cohen 
435781e30880SYishai Hadas 	if (mqp->flags & MLX5_IB_QP_UNDERLAY) {
435881e30880SYishai Hadas 		mlx5_ib_dbg(dev, "Attaching a multi cast group to underlay QP is not supported\n");
435981e30880SYishai Hadas 		return -EOPNOTSUPP;
436081e30880SYishai Hadas 	}
436181e30880SYishai Hadas 
4362539ec982SYishai Hadas 	err = mlx5_cmd_attach_mcg(dev->mdev, gid, ibqp->qp_num, uid);
4363e126ba97SEli Cohen 	if (err)
4364e126ba97SEli Cohen 		mlx5_ib_warn(dev, "failed attaching QPN 0x%x, MGID %pI6\n",
4365e126ba97SEli Cohen 			     ibqp->qp_num, gid->raw);
4366e126ba97SEli Cohen 
4367e126ba97SEli Cohen 	return err;
4368e126ba97SEli Cohen }
4369e126ba97SEli Cohen 
4370e126ba97SEli Cohen static int mlx5_ib_mcg_detach(struct ib_qp *ibqp, union ib_gid *gid, u16 lid)
4371e126ba97SEli Cohen {
4372e126ba97SEli Cohen 	struct mlx5_ib_dev *dev = to_mdev(ibqp->device);
4373e126ba97SEli Cohen 	int err;
4374539ec982SYishai Hadas 	u16 uid;
4375e126ba97SEli Cohen 
4376539ec982SYishai Hadas 	uid = ibqp->pd ?
4377539ec982SYishai Hadas 		to_mpd(ibqp->pd)->uid : 0;
4378539ec982SYishai Hadas 	err = mlx5_cmd_detach_mcg(dev->mdev, gid, ibqp->qp_num, uid);
4379e126ba97SEli Cohen 	if (err)
4380e126ba97SEli Cohen 		mlx5_ib_warn(dev, "failed detaching QPN 0x%x, MGID %pI6\n",
4381e126ba97SEli Cohen 			     ibqp->qp_num, gid->raw);
4382e126ba97SEli Cohen 
4383e126ba97SEli Cohen 	return err;
4384e126ba97SEli Cohen }
4385e126ba97SEli Cohen 
4386e126ba97SEli Cohen static int init_node_data(struct mlx5_ib_dev *dev)
4387e126ba97SEli Cohen {
43881b5daf11SMajd Dibbiny 	int err;
4389e126ba97SEli Cohen 
43901b5daf11SMajd Dibbiny 	err = mlx5_query_node_desc(dev, dev->ib_dev.node_desc);
4391e126ba97SEli Cohen 	if (err)
4392e126ba97SEli Cohen 		return err;
43931b5daf11SMajd Dibbiny 
43941b5daf11SMajd Dibbiny 	dev->mdev->rev_id = dev->mdev->pdev->revision;
43951b5daf11SMajd Dibbiny 
43961b5daf11SMajd Dibbiny 	return mlx5_query_node_guid(dev, &dev->ib_dev.node_guid);
4397e126ba97SEli Cohen }
4398e126ba97SEli Cohen 
4399508a523fSParav Pandit static ssize_t fw_pages_show(struct device *device,
4400508a523fSParav Pandit 			     struct device_attribute *attr, char *buf)
4401e126ba97SEli Cohen {
4402e126ba97SEli Cohen 	struct mlx5_ib_dev *dev =
440354747231SParav Pandit 		rdma_device_to_drv_device(device, struct mlx5_ib_dev, ib_dev);
4404e126ba97SEli Cohen 
44059603b61dSJack Morgenstein 	return sprintf(buf, "%d\n", dev->mdev->priv.fw_pages);
4406e126ba97SEli Cohen }
4407508a523fSParav Pandit static DEVICE_ATTR_RO(fw_pages);
4408e126ba97SEli Cohen 
4409508a523fSParav Pandit static ssize_t reg_pages_show(struct device *device,
4410e126ba97SEli Cohen 			      struct device_attribute *attr, char *buf)
4411e126ba97SEli Cohen {
4412e126ba97SEli Cohen 	struct mlx5_ib_dev *dev =
441354747231SParav Pandit 		rdma_device_to_drv_device(device, struct mlx5_ib_dev, ib_dev);
4414e126ba97SEli Cohen 
44156aec21f6SHaggai Eran 	return sprintf(buf, "%d\n", atomic_read(&dev->mdev->priv.reg_pages));
4416e126ba97SEli Cohen }
4417508a523fSParav Pandit static DEVICE_ATTR_RO(reg_pages);
4418e126ba97SEli Cohen 
4419508a523fSParav Pandit static ssize_t hca_type_show(struct device *device,
4420508a523fSParav Pandit 			     struct device_attribute *attr, char *buf)
4421e126ba97SEli Cohen {
4422e126ba97SEli Cohen 	struct mlx5_ib_dev *dev =
442354747231SParav Pandit 		rdma_device_to_drv_device(device, struct mlx5_ib_dev, ib_dev);
442454747231SParav Pandit 
44259603b61dSJack Morgenstein 	return sprintf(buf, "MT%d\n", dev->mdev->pdev->device);
4426e126ba97SEli Cohen }
4427508a523fSParav Pandit static DEVICE_ATTR_RO(hca_type);
4428e126ba97SEli Cohen 
4429508a523fSParav Pandit static ssize_t hw_rev_show(struct device *device,
4430508a523fSParav Pandit 			   struct device_attribute *attr, char *buf)
4431e126ba97SEli Cohen {
4432e126ba97SEli Cohen 	struct mlx5_ib_dev *dev =
443354747231SParav Pandit 		rdma_device_to_drv_device(device, struct mlx5_ib_dev, ib_dev);
443454747231SParav Pandit 
44359603b61dSJack Morgenstein 	return sprintf(buf, "%x\n", dev->mdev->rev_id);
4436e126ba97SEli Cohen }
4437508a523fSParav Pandit static DEVICE_ATTR_RO(hw_rev);
4438e126ba97SEli Cohen 
4439508a523fSParav Pandit static ssize_t board_id_show(struct device *device,
4440508a523fSParav Pandit 			     struct device_attribute *attr, char *buf)
4441e126ba97SEli Cohen {
4442e126ba97SEli Cohen 	struct mlx5_ib_dev *dev =
444354747231SParav Pandit 		rdma_device_to_drv_device(device, struct mlx5_ib_dev, ib_dev);
444454747231SParav Pandit 
4445e126ba97SEli Cohen 	return sprintf(buf, "%.*s\n", MLX5_BOARD_ID_LEN,
44469603b61dSJack Morgenstein 		       dev->mdev->board_id);
4447e126ba97SEli Cohen }
4448508a523fSParav Pandit static DEVICE_ATTR_RO(board_id);
4449e126ba97SEli Cohen 
4450508a523fSParav Pandit static struct attribute *mlx5_class_attributes[] = {
4451508a523fSParav Pandit 	&dev_attr_hw_rev.attr,
4452508a523fSParav Pandit 	&dev_attr_hca_type.attr,
4453508a523fSParav Pandit 	&dev_attr_board_id.attr,
4454508a523fSParav Pandit 	&dev_attr_fw_pages.attr,
4455508a523fSParav Pandit 	&dev_attr_reg_pages.attr,
4456508a523fSParav Pandit 	NULL,
4457508a523fSParav Pandit };
4458e126ba97SEli Cohen 
4459508a523fSParav Pandit static const struct attribute_group mlx5_attr_group = {
4460508a523fSParav Pandit 	.attrs = mlx5_class_attributes,
4461e126ba97SEli Cohen };
4462e126ba97SEli Cohen 
44637722f47eSHaggai Eran static void pkey_change_handler(struct work_struct *work)
44647722f47eSHaggai Eran {
44657722f47eSHaggai Eran 	struct mlx5_ib_port_resources *ports =
44667722f47eSHaggai Eran 		container_of(work, struct mlx5_ib_port_resources,
44677722f47eSHaggai Eran 			     pkey_change_work);
44687722f47eSHaggai Eran 
44697722f47eSHaggai Eran 	mutex_lock(&ports->devr->mutex);
44707722f47eSHaggai Eran 	mlx5_ib_gsi_pkey_change(ports->gsi);
44717722f47eSHaggai Eran 	mutex_unlock(&ports->devr->mutex);
44727722f47eSHaggai Eran }
44737722f47eSHaggai Eran 
447489ea94a7SMaor Gottlieb static void mlx5_ib_handle_internal_error(struct mlx5_ib_dev *ibdev)
447589ea94a7SMaor Gottlieb {
447689ea94a7SMaor Gottlieb 	struct mlx5_ib_qp *mqp;
447789ea94a7SMaor Gottlieb 	struct mlx5_ib_cq *send_mcq, *recv_mcq;
447889ea94a7SMaor Gottlieb 	struct mlx5_core_cq *mcq;
447989ea94a7SMaor Gottlieb 	struct list_head cq_armed_list;
448089ea94a7SMaor Gottlieb 	unsigned long flags_qp;
448189ea94a7SMaor Gottlieb 	unsigned long flags_cq;
448289ea94a7SMaor Gottlieb 	unsigned long flags;
448389ea94a7SMaor Gottlieb 
448489ea94a7SMaor Gottlieb 	INIT_LIST_HEAD(&cq_armed_list);
448589ea94a7SMaor Gottlieb 
448689ea94a7SMaor Gottlieb 	/* Go over qp list reside on that ibdev, sync with create/destroy qp.*/
448789ea94a7SMaor Gottlieb 	spin_lock_irqsave(&ibdev->reset_flow_resource_lock, flags);
448889ea94a7SMaor Gottlieb 	list_for_each_entry(mqp, &ibdev->qp_list, qps_list) {
448989ea94a7SMaor Gottlieb 		spin_lock_irqsave(&mqp->sq.lock, flags_qp);
449089ea94a7SMaor Gottlieb 		if (mqp->sq.tail != mqp->sq.head) {
449189ea94a7SMaor Gottlieb 			send_mcq = to_mcq(mqp->ibqp.send_cq);
449289ea94a7SMaor Gottlieb 			spin_lock_irqsave(&send_mcq->lock, flags_cq);
449389ea94a7SMaor Gottlieb 			if (send_mcq->mcq.comp &&
449489ea94a7SMaor Gottlieb 			    mqp->ibqp.send_cq->comp_handler) {
449589ea94a7SMaor Gottlieb 				if (!send_mcq->mcq.reset_notify_added) {
449689ea94a7SMaor Gottlieb 					send_mcq->mcq.reset_notify_added = 1;
449789ea94a7SMaor Gottlieb 					list_add_tail(&send_mcq->mcq.reset_notify,
449889ea94a7SMaor Gottlieb 						      &cq_armed_list);
449989ea94a7SMaor Gottlieb 				}
450089ea94a7SMaor Gottlieb 			}
450189ea94a7SMaor Gottlieb 			spin_unlock_irqrestore(&send_mcq->lock, flags_cq);
450289ea94a7SMaor Gottlieb 		}
450389ea94a7SMaor Gottlieb 		spin_unlock_irqrestore(&mqp->sq.lock, flags_qp);
450489ea94a7SMaor Gottlieb 		spin_lock_irqsave(&mqp->rq.lock, flags_qp);
450589ea94a7SMaor Gottlieb 		/* no handling is needed for SRQ */
450689ea94a7SMaor Gottlieb 		if (!mqp->ibqp.srq) {
450789ea94a7SMaor Gottlieb 			if (mqp->rq.tail != mqp->rq.head) {
450889ea94a7SMaor Gottlieb 				recv_mcq = to_mcq(mqp->ibqp.recv_cq);
450989ea94a7SMaor Gottlieb 				spin_lock_irqsave(&recv_mcq->lock, flags_cq);
451089ea94a7SMaor Gottlieb 				if (recv_mcq->mcq.comp &&
451189ea94a7SMaor Gottlieb 				    mqp->ibqp.recv_cq->comp_handler) {
451289ea94a7SMaor Gottlieb 					if (!recv_mcq->mcq.reset_notify_added) {
451389ea94a7SMaor Gottlieb 						recv_mcq->mcq.reset_notify_added = 1;
451489ea94a7SMaor Gottlieb 						list_add_tail(&recv_mcq->mcq.reset_notify,
451589ea94a7SMaor Gottlieb 							      &cq_armed_list);
451689ea94a7SMaor Gottlieb 					}
451789ea94a7SMaor Gottlieb 				}
451889ea94a7SMaor Gottlieb 				spin_unlock_irqrestore(&recv_mcq->lock,
451989ea94a7SMaor Gottlieb 						       flags_cq);
452089ea94a7SMaor Gottlieb 			}
452189ea94a7SMaor Gottlieb 		}
452289ea94a7SMaor Gottlieb 		spin_unlock_irqrestore(&mqp->rq.lock, flags_qp);
452389ea94a7SMaor Gottlieb 	}
452489ea94a7SMaor Gottlieb 	/*At that point all inflight post send were put to be executed as of we
452589ea94a7SMaor Gottlieb 	 * lock/unlock above locks Now need to arm all involved CQs.
452689ea94a7SMaor Gottlieb 	 */
452789ea94a7SMaor Gottlieb 	list_for_each_entry(mcq, &cq_armed_list, reset_notify) {
45284e0e2ea1SYishai Hadas 		mcq->comp(mcq, NULL);
452989ea94a7SMaor Gottlieb 	}
453089ea94a7SMaor Gottlieb 	spin_unlock_irqrestore(&ibdev->reset_flow_resource_lock, flags);
453189ea94a7SMaor Gottlieb }
453289ea94a7SMaor Gottlieb 
453303404e8aSMaor Gottlieb static void delay_drop_handler(struct work_struct *work)
453403404e8aSMaor Gottlieb {
453503404e8aSMaor Gottlieb 	int err;
453603404e8aSMaor Gottlieb 	struct mlx5_ib_delay_drop *delay_drop =
453703404e8aSMaor Gottlieb 		container_of(work, struct mlx5_ib_delay_drop,
453803404e8aSMaor Gottlieb 			     delay_drop_work);
453903404e8aSMaor Gottlieb 
4540fe248c3aSMaor Gottlieb 	atomic_inc(&delay_drop->events_cnt);
4541fe248c3aSMaor Gottlieb 
454203404e8aSMaor Gottlieb 	mutex_lock(&delay_drop->lock);
454303404e8aSMaor Gottlieb 	err = mlx5_core_set_delay_drop(delay_drop->dev->mdev,
454403404e8aSMaor Gottlieb 				       delay_drop->timeout);
454503404e8aSMaor Gottlieb 	if (err) {
454603404e8aSMaor Gottlieb 		mlx5_ib_warn(delay_drop->dev, "Failed to set delay drop, timeout=%u\n",
454703404e8aSMaor Gottlieb 			     delay_drop->timeout);
454803404e8aSMaor Gottlieb 		delay_drop->activate = false;
454903404e8aSMaor Gottlieb 	}
455003404e8aSMaor Gottlieb 	mutex_unlock(&delay_drop->lock);
455103404e8aSMaor Gottlieb }
455203404e8aSMaor Gottlieb 
455309e574faSSaeed Mahameed static void handle_general_event(struct mlx5_ib_dev *ibdev, struct mlx5_eqe *eqe,
455409e574faSSaeed Mahameed 				 struct ib_event *ibev)
455509e574faSSaeed Mahameed {
45566cfdc7e4SAya Levin 	u8 port = (eqe->data.port.port >> 4) & 0xf;
45576cfdc7e4SAya Levin 
455809e574faSSaeed Mahameed 	switch (eqe->sub_type) {
455909e574faSSaeed Mahameed 	case MLX5_GENERAL_SUBTYPE_DELAY_DROP_TIMEOUT:
45606cfdc7e4SAya Levin 		if (mlx5_ib_port_link_layer(&ibdev->ib_dev, port) ==
45616cfdc7e4SAya Levin 					    IB_LINK_LAYER_ETHERNET)
456209e574faSSaeed Mahameed 			schedule_work(&ibdev->delay_drop.delay_drop_work);
456309e574faSSaeed Mahameed 		break;
456409e574faSSaeed Mahameed 	default: /* do nothing */
456509e574faSSaeed Mahameed 		return;
456609e574faSSaeed Mahameed 	}
456709e574faSSaeed Mahameed }
456809e574faSSaeed Mahameed 
4569134e9349SSaeed Mahameed static int handle_port_change(struct mlx5_ib_dev *ibdev, struct mlx5_eqe *eqe,
4570134e9349SSaeed Mahameed 			      struct ib_event *ibev)
4571134e9349SSaeed Mahameed {
4572134e9349SSaeed Mahameed 	u8 port = (eqe->data.port.port >> 4) & 0xf;
4573134e9349SSaeed Mahameed 
4574134e9349SSaeed Mahameed 	ibev->element.port_num = port;
4575134e9349SSaeed Mahameed 
4576134e9349SSaeed Mahameed 	switch (eqe->sub_type) {
4577134e9349SSaeed Mahameed 	case MLX5_PORT_CHANGE_SUBTYPE_ACTIVE:
4578134e9349SSaeed Mahameed 	case MLX5_PORT_CHANGE_SUBTYPE_DOWN:
4579134e9349SSaeed Mahameed 	case MLX5_PORT_CHANGE_SUBTYPE_INITIALIZED:
4580134e9349SSaeed Mahameed 		/* In RoCE, port up/down events are handled in
4581134e9349SSaeed Mahameed 		 * mlx5_netdev_event().
4582134e9349SSaeed Mahameed 		 */
4583134e9349SSaeed Mahameed 		if (mlx5_ib_port_link_layer(&ibdev->ib_dev, port) ==
4584134e9349SSaeed Mahameed 					    IB_LINK_LAYER_ETHERNET)
4585134e9349SSaeed Mahameed 			return -EINVAL;
4586134e9349SSaeed Mahameed 
4587134e9349SSaeed Mahameed 		ibev->event = (eqe->sub_type == MLX5_PORT_CHANGE_SUBTYPE_ACTIVE) ?
4588134e9349SSaeed Mahameed 				IB_EVENT_PORT_ACTIVE : IB_EVENT_PORT_ERR;
4589134e9349SSaeed Mahameed 		break;
4590134e9349SSaeed Mahameed 
4591134e9349SSaeed Mahameed 	case MLX5_PORT_CHANGE_SUBTYPE_LID:
4592134e9349SSaeed Mahameed 		ibev->event = IB_EVENT_LID_CHANGE;
4593134e9349SSaeed Mahameed 		break;
4594134e9349SSaeed Mahameed 
4595134e9349SSaeed Mahameed 	case MLX5_PORT_CHANGE_SUBTYPE_PKEY:
4596134e9349SSaeed Mahameed 		ibev->event = IB_EVENT_PKEY_CHANGE;
4597134e9349SSaeed Mahameed 		schedule_work(&ibdev->devr.ports[port - 1].pkey_change_work);
4598134e9349SSaeed Mahameed 		break;
4599134e9349SSaeed Mahameed 
4600134e9349SSaeed Mahameed 	case MLX5_PORT_CHANGE_SUBTYPE_GUID:
4601134e9349SSaeed Mahameed 		ibev->event = IB_EVENT_GID_CHANGE;
4602134e9349SSaeed Mahameed 		break;
4603134e9349SSaeed Mahameed 
4604134e9349SSaeed Mahameed 	case MLX5_PORT_CHANGE_SUBTYPE_CLIENT_REREG:
4605134e9349SSaeed Mahameed 		ibev->event = IB_EVENT_CLIENT_REREGISTER;
4606134e9349SSaeed Mahameed 		break;
4607134e9349SSaeed Mahameed 	default:
4608134e9349SSaeed Mahameed 		return -EINVAL;
4609134e9349SSaeed Mahameed 	}
4610134e9349SSaeed Mahameed 
4611134e9349SSaeed Mahameed 	return 0;
4612134e9349SSaeed Mahameed }
4613134e9349SSaeed Mahameed 
4614d69a24e0SDaniel Jurgens static void mlx5_ib_handle_event(struct work_struct *_work)
4615e126ba97SEli Cohen {
4616d69a24e0SDaniel Jurgens 	struct mlx5_ib_event_work *work =
4617d69a24e0SDaniel Jurgens 		container_of(_work, struct mlx5_ib_event_work, work);
4618d69a24e0SDaniel Jurgens 	struct mlx5_ib_dev *ibdev;
4619e126ba97SEli Cohen 	struct ib_event ibev;
4620dbaaff2aSEli Cohen 	bool fatal = false;
4621e126ba97SEli Cohen 
4622df097a27SSaeed Mahameed 	if (work->is_slave) {
4623df097a27SSaeed Mahameed 		ibdev = mlx5_ib_get_ibdev_from_mpi(work->mpi);
4624d69a24e0SDaniel Jurgens 		if (!ibdev)
4625d69a24e0SDaniel Jurgens 			goto out;
4626d69a24e0SDaniel Jurgens 	} else {
4627df097a27SSaeed Mahameed 		ibdev = work->dev;
4628d69a24e0SDaniel Jurgens 	}
4629d69a24e0SDaniel Jurgens 
4630d69a24e0SDaniel Jurgens 	switch (work->event) {
4631e126ba97SEli Cohen 	case MLX5_DEV_EVENT_SYS_ERROR:
4632e126ba97SEli Cohen 		ibev.event = IB_EVENT_DEVICE_FATAL;
463389ea94a7SMaor Gottlieb 		mlx5_ib_handle_internal_error(ibdev);
4634134e9349SSaeed Mahameed 		ibev.element.port_num  = (u8)(unsigned long)work->param;
4635dbaaff2aSEli Cohen 		fatal = true;
4636e126ba97SEli Cohen 		break;
4637134e9349SSaeed Mahameed 	case MLX5_EVENT_TYPE_PORT_CHANGE:
4638134e9349SSaeed Mahameed 		if (handle_port_change(ibdev, work->param, &ibev))
4639d69a24e0SDaniel Jurgens 			goto out;
4640e126ba97SEli Cohen 		break;
464109e574faSSaeed Mahameed 	case MLX5_EVENT_TYPE_GENERAL_EVENT:
464209e574faSSaeed Mahameed 		handle_general_event(ibdev, work->param, &ibev);
464309e574faSSaeed Mahameed 		/* fall through */
4644bdc37924SSaeed Mahameed 	default:
464503404e8aSMaor Gottlieb 		goto out;
4646e126ba97SEli Cohen 	}
4647e126ba97SEli Cohen 
4648e126ba97SEli Cohen 	ibev.device = &ibdev->ib_dev;
4649e126ba97SEli Cohen 
4650134e9349SSaeed Mahameed 	if (!rdma_is_port_valid(&ibdev->ib_dev, ibev.element.port_num)) {
4651134e9349SSaeed Mahameed 		mlx5_ib_warn(ibdev, "warning: event on port %d\n",  ibev.element.port_num);
465203404e8aSMaor Gottlieb 		goto out;
4653a0c84c32SEli Cohen 	}
4654a0c84c32SEli Cohen 
4655e126ba97SEli Cohen 	if (ibdev->ib_active)
4656e126ba97SEli Cohen 		ib_dispatch_event(&ibev);
4657dbaaff2aSEli Cohen 
4658dbaaff2aSEli Cohen 	if (fatal)
4659dbaaff2aSEli Cohen 		ibdev->ib_active = false;
466003404e8aSMaor Gottlieb out:
4661d69a24e0SDaniel Jurgens 	kfree(work);
4662d69a24e0SDaniel Jurgens }
4663d69a24e0SDaniel Jurgens 
4664df097a27SSaeed Mahameed static int mlx5_ib_event(struct notifier_block *nb,
4665df097a27SSaeed Mahameed 			 unsigned long event, void *param)
4666d69a24e0SDaniel Jurgens {
4667d69a24e0SDaniel Jurgens 	struct mlx5_ib_event_work *work;
4668d69a24e0SDaniel Jurgens 
4669d69a24e0SDaniel Jurgens 	work = kmalloc(sizeof(*work), GFP_ATOMIC);
467010bea9c8SLeon Romanovsky 	if (!work)
4671df097a27SSaeed Mahameed 		return NOTIFY_DONE;
467210bea9c8SLeon Romanovsky 
4673d69a24e0SDaniel Jurgens 	INIT_WORK(&work->work, mlx5_ib_handle_event);
4674df097a27SSaeed Mahameed 	work->dev = container_of(nb, struct mlx5_ib_dev, mdev_events);
4675df097a27SSaeed Mahameed 	work->is_slave = false;
4676d69a24e0SDaniel Jurgens 	work->param = param;
4677d69a24e0SDaniel Jurgens 	work->event = event;
4678d69a24e0SDaniel Jurgens 
4679d69a24e0SDaniel Jurgens 	queue_work(mlx5_ib_event_wq, &work->work);
4680df097a27SSaeed Mahameed 
4681df097a27SSaeed Mahameed 	return NOTIFY_OK;
4682df097a27SSaeed Mahameed }
4683df097a27SSaeed Mahameed 
4684df097a27SSaeed Mahameed static int mlx5_ib_event_slave_port(struct notifier_block *nb,
4685df097a27SSaeed Mahameed 				    unsigned long event, void *param)
4686df097a27SSaeed Mahameed {
4687df097a27SSaeed Mahameed 	struct mlx5_ib_event_work *work;
4688df097a27SSaeed Mahameed 
4689df097a27SSaeed Mahameed 	work = kmalloc(sizeof(*work), GFP_ATOMIC);
4690df097a27SSaeed Mahameed 	if (!work)
4691df097a27SSaeed Mahameed 		return NOTIFY_DONE;
4692df097a27SSaeed Mahameed 
4693df097a27SSaeed Mahameed 	INIT_WORK(&work->work, mlx5_ib_handle_event);
4694df097a27SSaeed Mahameed 	work->mpi = container_of(nb, struct mlx5_ib_multiport_info, mdev_events);
4695df097a27SSaeed Mahameed 	work->is_slave = true;
4696df097a27SSaeed Mahameed 	work->param = param;
4697df097a27SSaeed Mahameed 	work->event = event;
4698df097a27SSaeed Mahameed 	queue_work(mlx5_ib_event_wq, &work->work);
4699df097a27SSaeed Mahameed 
4700df097a27SSaeed Mahameed 	return NOTIFY_OK;
4701d69a24e0SDaniel Jurgens }
4702d69a24e0SDaniel Jurgens 
4703c43f1112SMaor Gottlieb static int set_has_smi_cap(struct mlx5_ib_dev *dev)
4704c43f1112SMaor Gottlieb {
4705c43f1112SMaor Gottlieb 	struct mlx5_hca_vport_context vport_ctx;
4706c43f1112SMaor Gottlieb 	int err;
4707c43f1112SMaor Gottlieb 	int port;
4708c43f1112SMaor Gottlieb 
4709a989ea01SMark Bloch 	for (port = 1; port <= ARRAY_SIZE(dev->mdev->port_caps); port++) {
4710c43f1112SMaor Gottlieb 		dev->mdev->port_caps[port - 1].has_smi = false;
4711c43f1112SMaor Gottlieb 		if (MLX5_CAP_GEN(dev->mdev, port_type) ==
4712c43f1112SMaor Gottlieb 		    MLX5_CAP_PORT_TYPE_IB) {
4713c43f1112SMaor Gottlieb 			if (MLX5_CAP_GEN(dev->mdev, ib_virt)) {
4714c43f1112SMaor Gottlieb 				err = mlx5_query_hca_vport_context(dev->mdev, 0,
4715c43f1112SMaor Gottlieb 								   port, 0,
4716c43f1112SMaor Gottlieb 								   &vport_ctx);
4717c43f1112SMaor Gottlieb 				if (err) {
4718c43f1112SMaor Gottlieb 					mlx5_ib_err(dev, "query_hca_vport_context for port=%d failed %d\n",
4719c43f1112SMaor Gottlieb 						    port, err);
4720c43f1112SMaor Gottlieb 					return err;
4721c43f1112SMaor Gottlieb 				}
4722c43f1112SMaor Gottlieb 				dev->mdev->port_caps[port - 1].has_smi =
4723c43f1112SMaor Gottlieb 					vport_ctx.has_smi;
4724c43f1112SMaor Gottlieb 			} else {
4725c43f1112SMaor Gottlieb 				dev->mdev->port_caps[port - 1].has_smi = true;
4726c43f1112SMaor Gottlieb 			}
4727c43f1112SMaor Gottlieb 		}
4728c43f1112SMaor Gottlieb 	}
4729c43f1112SMaor Gottlieb 	return 0;
4730c43f1112SMaor Gottlieb }
4731c43f1112SMaor Gottlieb 
4732e126ba97SEli Cohen static void get_ext_port_caps(struct mlx5_ib_dev *dev)
4733e126ba97SEli Cohen {
4734e126ba97SEli Cohen 	int port;
4735e126ba97SEli Cohen 
4736508562d6SDaniel Jurgens 	for (port = 1; port <= dev->num_ports; port++)
4737e126ba97SEli Cohen 		mlx5_query_ext_port_caps(dev, port);
4738e126ba97SEli Cohen }
4739e126ba97SEli Cohen 
474026628e2dSMark Bloch static int __get_port_caps(struct mlx5_ib_dev *dev, u8 port)
4741e126ba97SEli Cohen {
4742e126ba97SEli Cohen 	struct ib_device_attr *dprops = NULL;
4743e126ba97SEli Cohen 	struct ib_port_attr *pprops = NULL;
4744f614fc15SDan Carpenter 	int err = -ENOMEM;
47452528e33eSMatan Barak 	struct ib_udata uhw = {.inlen = 0, .outlen = 0};
4746e126ba97SEli Cohen 
474750ba3c18SLeon Romanovsky 	pprops = kzalloc(sizeof(*pprops), GFP_KERNEL);
4748e126ba97SEli Cohen 	if (!pprops)
4749e126ba97SEli Cohen 		goto out;
4750e126ba97SEli Cohen 
4751e126ba97SEli Cohen 	dprops = kmalloc(sizeof(*dprops), GFP_KERNEL);
4752e126ba97SEli Cohen 	if (!dprops)
4753e126ba97SEli Cohen 		goto out;
4754e126ba97SEli Cohen 
47552528e33eSMatan Barak 	err = mlx5_ib_query_device(&dev->ib_dev, dprops, &uhw);
4756e126ba97SEli Cohen 	if (err) {
4757e126ba97SEli Cohen 		mlx5_ib_warn(dev, "query_device failed %d\n", err);
4758e126ba97SEli Cohen 		goto out;
4759e126ba97SEli Cohen 	}
4760e126ba97SEli Cohen 
4761e126ba97SEli Cohen 	err = mlx5_ib_query_port(&dev->ib_dev, port, pprops);
4762e126ba97SEli Cohen 	if (err) {
4763938fe83cSSaeed Mahameed 		mlx5_ib_warn(dev, "query_port %d failed %d\n",
4764938fe83cSSaeed Mahameed 			     port, err);
476532f69e4bSDaniel Jurgens 		goto out;
4766e126ba97SEli Cohen 	}
476732f69e4bSDaniel Jurgens 
4768938fe83cSSaeed Mahameed 	dev->mdev->port_caps[port - 1].pkey_table_len =
4769938fe83cSSaeed Mahameed 					dprops->max_pkeys;
4770938fe83cSSaeed Mahameed 	dev->mdev->port_caps[port - 1].gid_table_len =
4771938fe83cSSaeed Mahameed 					pprops->gid_tbl_len;
477232f69e4bSDaniel Jurgens 	mlx5_ib_dbg(dev, "port %d: pkey_table_len %d, gid_table_len %d\n",
477332f69e4bSDaniel Jurgens 		    port, dprops->max_pkeys, pprops->gid_tbl_len);
4774e126ba97SEli Cohen 
4775e126ba97SEli Cohen out:
4776e126ba97SEli Cohen 	kfree(pprops);
4777e126ba97SEli Cohen 	kfree(dprops);
4778e126ba97SEli Cohen 
4779e126ba97SEli Cohen 	return err;
4780e126ba97SEli Cohen }
4781e126ba97SEli Cohen 
478226628e2dSMark Bloch static int get_port_caps(struct mlx5_ib_dev *dev, u8 port)
478326628e2dSMark Bloch {
478426628e2dSMark Bloch 	/* For representors use port 1, is this is the only native
478526628e2dSMark Bloch 	 * port
478626628e2dSMark Bloch 	 */
478726628e2dSMark Bloch 	if (dev->is_rep)
478826628e2dSMark Bloch 		return __get_port_caps(dev, 1);
478926628e2dSMark Bloch 	return __get_port_caps(dev, port);
479026628e2dSMark Bloch }
479126628e2dSMark Bloch 
4792e126ba97SEli Cohen static void destroy_umrc_res(struct mlx5_ib_dev *dev)
4793e126ba97SEli Cohen {
4794e126ba97SEli Cohen 	int err;
4795e126ba97SEli Cohen 
4796e126ba97SEli Cohen 	err = mlx5_mr_cache_cleanup(dev);
4797e126ba97SEli Cohen 	if (err)
4798e126ba97SEli Cohen 		mlx5_ib_warn(dev, "mr cache cleanup failed\n");
4799e126ba97SEli Cohen 
480032927e28SMark Bloch 	if (dev->umrc.qp)
4801c4367a26SShamir Rabinovitch 		mlx5_ib_destroy_qp(dev->umrc.qp, NULL);
480232927e28SMark Bloch 	if (dev->umrc.cq)
4803add08d76SChristoph Hellwig 		ib_free_cq(dev->umrc.cq);
480432927e28SMark Bloch 	if (dev->umrc.pd)
4805e126ba97SEli Cohen 		ib_dealloc_pd(dev->umrc.pd);
4806e126ba97SEli Cohen }
4807e126ba97SEli Cohen 
/*
 * Used by create_umr_res() as the send queue depth of the UMR QP and as the
 * initial count of the dev->umrc.sem semaphore.
 */
enum { MAX_UMR_WR = 128 };
4811e126ba97SEli Cohen 
4812e126ba97SEli Cohen static int create_umr_res(struct mlx5_ib_dev *dev)
4813e126ba97SEli Cohen {
4814e126ba97SEli Cohen 	struct ib_qp_init_attr *init_attr = NULL;
4815e126ba97SEli Cohen 	struct ib_qp_attr *attr = NULL;
4816e126ba97SEli Cohen 	struct ib_pd *pd;
4817e126ba97SEli Cohen 	struct ib_cq *cq;
4818e126ba97SEli Cohen 	struct ib_qp *qp;
4819e126ba97SEli Cohen 	int ret;
4820e126ba97SEli Cohen 
4821e126ba97SEli Cohen 	attr = kzalloc(sizeof(*attr), GFP_KERNEL);
4822e126ba97SEli Cohen 	init_attr = kzalloc(sizeof(*init_attr), GFP_KERNEL);
4823e126ba97SEli Cohen 	if (!attr || !init_attr) {
4824e126ba97SEli Cohen 		ret = -ENOMEM;
4825e126ba97SEli Cohen 		goto error_0;
4826e126ba97SEli Cohen 	}
4827e126ba97SEli Cohen 
4828ed082d36SChristoph Hellwig 	pd = ib_alloc_pd(&dev->ib_dev, 0);
4829e126ba97SEli Cohen 	if (IS_ERR(pd)) {
4830e126ba97SEli Cohen 		mlx5_ib_dbg(dev, "Couldn't create PD for sync UMR QP\n");
4831e126ba97SEli Cohen 		ret = PTR_ERR(pd);
4832e126ba97SEli Cohen 		goto error_0;
4833e126ba97SEli Cohen 	}
4834e126ba97SEli Cohen 
4835add08d76SChristoph Hellwig 	cq = ib_alloc_cq(&dev->ib_dev, NULL, 128, 0, IB_POLL_SOFTIRQ);
4836e126ba97SEli Cohen 	if (IS_ERR(cq)) {
4837e126ba97SEli Cohen 		mlx5_ib_dbg(dev, "Couldn't create CQ for sync UMR QP\n");
4838e126ba97SEli Cohen 		ret = PTR_ERR(cq);
4839e126ba97SEli Cohen 		goto error_2;
4840e126ba97SEli Cohen 	}
4841e126ba97SEli Cohen 
4842e126ba97SEli Cohen 	init_attr->send_cq = cq;
4843e126ba97SEli Cohen 	init_attr->recv_cq = cq;
4844e126ba97SEli Cohen 	init_attr->sq_sig_type = IB_SIGNAL_ALL_WR;
4845e126ba97SEli Cohen 	init_attr->cap.max_send_wr = MAX_UMR_WR;
4846e126ba97SEli Cohen 	init_attr->cap.max_send_sge = 1;
4847e126ba97SEli Cohen 	init_attr->qp_type = MLX5_IB_QPT_REG_UMR;
4848e126ba97SEli Cohen 	init_attr->port_num = 1;
4849e126ba97SEli Cohen 	qp = mlx5_ib_create_qp(pd, init_attr, NULL);
4850e126ba97SEli Cohen 	if (IS_ERR(qp)) {
4851e126ba97SEli Cohen 		mlx5_ib_dbg(dev, "Couldn't create sync UMR QP\n");
4852e126ba97SEli Cohen 		ret = PTR_ERR(qp);
4853e126ba97SEli Cohen 		goto error_3;
4854e126ba97SEli Cohen 	}
4855e126ba97SEli Cohen 	qp->device     = &dev->ib_dev;
4856e126ba97SEli Cohen 	qp->real_qp    = qp;
4857e126ba97SEli Cohen 	qp->uobject    = NULL;
4858e126ba97SEli Cohen 	qp->qp_type    = MLX5_IB_QPT_REG_UMR;
485931fde034SMajd Dibbiny 	qp->send_cq    = init_attr->send_cq;
486031fde034SMajd Dibbiny 	qp->recv_cq    = init_attr->recv_cq;
4861e126ba97SEli Cohen 
4862e126ba97SEli Cohen 	attr->qp_state = IB_QPS_INIT;
4863e126ba97SEli Cohen 	attr->port_num = 1;
4864e126ba97SEli Cohen 	ret = mlx5_ib_modify_qp(qp, attr, IB_QP_STATE | IB_QP_PKEY_INDEX |
4865e126ba97SEli Cohen 				IB_QP_PORT, NULL);
4866e126ba97SEli Cohen 	if (ret) {
4867e126ba97SEli Cohen 		mlx5_ib_dbg(dev, "Couldn't modify UMR QP\n");
4868e126ba97SEli Cohen 		goto error_4;
4869e126ba97SEli Cohen 	}
4870e126ba97SEli Cohen 
4871e126ba97SEli Cohen 	memset(attr, 0, sizeof(*attr));
4872e126ba97SEli Cohen 	attr->qp_state = IB_QPS_RTR;
4873e126ba97SEli Cohen 	attr->path_mtu = IB_MTU_256;
4874e126ba97SEli Cohen 
4875e126ba97SEli Cohen 	ret = mlx5_ib_modify_qp(qp, attr, IB_QP_STATE, NULL);
4876e126ba97SEli Cohen 	if (ret) {
4877e126ba97SEli Cohen 		mlx5_ib_dbg(dev, "Couldn't modify umr QP to rtr\n");
4878e126ba97SEli Cohen 		goto error_4;
4879e126ba97SEli Cohen 	}
4880e126ba97SEli Cohen 
4881e126ba97SEli Cohen 	memset(attr, 0, sizeof(*attr));
4882e126ba97SEli Cohen 	attr->qp_state = IB_QPS_RTS;
4883e126ba97SEli Cohen 	ret = mlx5_ib_modify_qp(qp, attr, IB_QP_STATE, NULL);
4884e126ba97SEli Cohen 	if (ret) {
4885e126ba97SEli Cohen 		mlx5_ib_dbg(dev, "Couldn't modify umr QP to rts\n");
4886e126ba97SEli Cohen 		goto error_4;
4887e126ba97SEli Cohen 	}
4888e126ba97SEli Cohen 
4889e126ba97SEli Cohen 	dev->umrc.qp = qp;
4890e126ba97SEli Cohen 	dev->umrc.cq = cq;
4891e126ba97SEli Cohen 	dev->umrc.pd = pd;
4892e126ba97SEli Cohen 
4893e126ba97SEli Cohen 	sema_init(&dev->umrc.sem, MAX_UMR_WR);
4894e126ba97SEli Cohen 	ret = mlx5_mr_cache_init(dev);
4895e126ba97SEli Cohen 	if (ret) {
4896e126ba97SEli Cohen 		mlx5_ib_warn(dev, "mr cache init failed %d\n", ret);
4897e126ba97SEli Cohen 		goto error_4;
4898e126ba97SEli Cohen 	}
4899e126ba97SEli Cohen 
4900e126ba97SEli Cohen 	kfree(attr);
4901e126ba97SEli Cohen 	kfree(init_attr);
4902e126ba97SEli Cohen 
4903e126ba97SEli Cohen 	return 0;
4904e126ba97SEli Cohen 
4905e126ba97SEli Cohen error_4:
4906c4367a26SShamir Rabinovitch 	mlx5_ib_destroy_qp(qp, NULL);
490732927e28SMark Bloch 	dev->umrc.qp = NULL;
4908e126ba97SEli Cohen 
4909e126ba97SEli Cohen error_3:
4910add08d76SChristoph Hellwig 	ib_free_cq(cq);
491132927e28SMark Bloch 	dev->umrc.cq = NULL;
4912e126ba97SEli Cohen 
4913e126ba97SEli Cohen error_2:
4914e126ba97SEli Cohen 	ib_dealloc_pd(pd);
491532927e28SMark Bloch 	dev->umrc.pd = NULL;
4916e126ba97SEli Cohen 
4917e126ba97SEli Cohen error_0:
4918e126ba97SEli Cohen 	kfree(attr);
4919e126ba97SEli Cohen 	kfree(init_attr);
4920e126ba97SEli Cohen 	return ret;
4921e126ba97SEli Cohen }
4922e126ba97SEli Cohen 
49236e8484c5SMax Gurtovoy static u8 mlx5_get_umr_fence(u8 umr_fence_cap)
49246e8484c5SMax Gurtovoy {
49256e8484c5SMax Gurtovoy 	switch (umr_fence_cap) {
49266e8484c5SMax Gurtovoy 	case MLX5_CAP_UMR_FENCE_NONE:
49276e8484c5SMax Gurtovoy 		return MLX5_FENCE_MODE_NONE;
49286e8484c5SMax Gurtovoy 	case MLX5_CAP_UMR_FENCE_SMALL:
49296e8484c5SMax Gurtovoy 		return MLX5_FENCE_MODE_INITIATOR_SMALL;
49306e8484c5SMax Gurtovoy 	default:
49316e8484c5SMax Gurtovoy 		return MLX5_FENCE_MODE_STRONG_ORDERING;
49326e8484c5SMax Gurtovoy 	}
49336e8484c5SMax Gurtovoy }
49346e8484c5SMax Gurtovoy 
4935e126ba97SEli Cohen static int create_dev_resources(struct mlx5_ib_resources *devr)
4936e126ba97SEli Cohen {
4937e126ba97SEli Cohen 	struct ib_srq_init_attr attr;
4938e126ba97SEli Cohen 	struct mlx5_ib_dev *dev;
493921a428a0SLeon Romanovsky 	struct ib_device *ibdev;
4940bcf4c1eaSMatan Barak 	struct ib_cq_init_attr cq_attr = {.cqe = 1};
49417722f47eSHaggai Eran 	int port;
4942e126ba97SEli Cohen 	int ret = 0;
4943e126ba97SEli Cohen 
4944e126ba97SEli Cohen 	dev = container_of(devr, struct mlx5_ib_dev, devr);
494521a428a0SLeon Romanovsky 	ibdev = &dev->ib_dev;
4946e126ba97SEli Cohen 
4947d16e91daSHaggai Eran 	mutex_init(&devr->mutex);
4948d16e91daSHaggai Eran 
494921a428a0SLeon Romanovsky 	devr->p0 = rdma_zalloc_drv_obj(ibdev, ib_pd);
495021a428a0SLeon Romanovsky 	if (!devr->p0)
495121a428a0SLeon Romanovsky 		return -ENOMEM;
495221a428a0SLeon Romanovsky 
495321a428a0SLeon Romanovsky 	devr->p0->device  = ibdev;
4954e126ba97SEli Cohen 	devr->p0->uobject = NULL;
4955e126ba97SEli Cohen 	atomic_set(&devr->p0->usecnt, 0);
4956e126ba97SEli Cohen 
4957ff23dfa1SShamir Rabinovitch 	ret = mlx5_ib_alloc_pd(devr->p0, NULL);
495821a428a0SLeon Romanovsky 	if (ret)
495921a428a0SLeon Romanovsky 		goto error0;
496021a428a0SLeon Romanovsky 
4961e39afe3dSLeon Romanovsky 	devr->c0 = rdma_zalloc_drv_obj(ibdev, ib_cq);
4962e39afe3dSLeon Romanovsky 	if (!devr->c0) {
4963e39afe3dSLeon Romanovsky 		ret = -ENOMEM;
4964e126ba97SEli Cohen 		goto error1;
4965e126ba97SEli Cohen 	}
4966e39afe3dSLeon Romanovsky 
4967e126ba97SEli Cohen 	devr->c0->device = &dev->ib_dev;
4968e126ba97SEli Cohen 	atomic_set(&devr->c0->usecnt, 0);
4969e126ba97SEli Cohen 
4970e39afe3dSLeon Romanovsky 	ret = mlx5_ib_create_cq(devr->c0, &cq_attr, NULL);
4971e39afe3dSLeon Romanovsky 	if (ret)
4972e39afe3dSLeon Romanovsky 		goto err_create_cq;
4973e39afe3dSLeon Romanovsky 
4974ff23dfa1SShamir Rabinovitch 	devr->x0 = mlx5_ib_alloc_xrcd(&dev->ib_dev, NULL);
4975e126ba97SEli Cohen 	if (IS_ERR(devr->x0)) {
4976e126ba97SEli Cohen 		ret = PTR_ERR(devr->x0);
4977e126ba97SEli Cohen 		goto error2;
4978e126ba97SEli Cohen 	}
4979e126ba97SEli Cohen 	devr->x0->device = &dev->ib_dev;
4980e126ba97SEli Cohen 	devr->x0->inode = NULL;
4981e126ba97SEli Cohen 	atomic_set(&devr->x0->usecnt, 0);
4982e126ba97SEli Cohen 	mutex_init(&devr->x0->tgt_qp_mutex);
4983e126ba97SEli Cohen 	INIT_LIST_HEAD(&devr->x0->tgt_qp_list);
4984e126ba97SEli Cohen 
4985ff23dfa1SShamir Rabinovitch 	devr->x1 = mlx5_ib_alloc_xrcd(&dev->ib_dev, NULL);
4986e126ba97SEli Cohen 	if (IS_ERR(devr->x1)) {
4987e126ba97SEli Cohen 		ret = PTR_ERR(devr->x1);
4988e126ba97SEli Cohen 		goto error3;
4989e126ba97SEli Cohen 	}
4990e126ba97SEli Cohen 	devr->x1->device = &dev->ib_dev;
4991e126ba97SEli Cohen 	devr->x1->inode = NULL;
4992e126ba97SEli Cohen 	atomic_set(&devr->x1->usecnt, 0);
4993e126ba97SEli Cohen 	mutex_init(&devr->x1->tgt_qp_mutex);
4994e126ba97SEli Cohen 	INIT_LIST_HEAD(&devr->x1->tgt_qp_list);
4995e126ba97SEli Cohen 
4996e126ba97SEli Cohen 	memset(&attr, 0, sizeof(attr));
4997e126ba97SEli Cohen 	attr.attr.max_sge = 1;
4998e126ba97SEli Cohen 	attr.attr.max_wr = 1;
4999e126ba97SEli Cohen 	attr.srq_type = IB_SRQT_XRC;
50001a56ff6dSArtemy Kovalyov 	attr.ext.cq = devr->c0;
5001e126ba97SEli Cohen 	attr.ext.xrc.xrcd = devr->x0;
5002e126ba97SEli Cohen 
500368e326deSLeon Romanovsky 	devr->s0 = rdma_zalloc_drv_obj(ibdev, ib_srq);
500468e326deSLeon Romanovsky 	if (!devr->s0) {
500568e326deSLeon Romanovsky 		ret = -ENOMEM;
5006e126ba97SEli Cohen 		goto error4;
5007e126ba97SEli Cohen 	}
500868e326deSLeon Romanovsky 
5009e126ba97SEli Cohen 	devr->s0->device	= &dev->ib_dev;
5010e126ba97SEli Cohen 	devr->s0->pd		= devr->p0;
5011e126ba97SEli Cohen 	devr->s0->srq_type      = IB_SRQT_XRC;
5012e126ba97SEli Cohen 	devr->s0->ext.xrc.xrcd	= devr->x0;
50131a56ff6dSArtemy Kovalyov 	devr->s0->ext.cq	= devr->c0;
501468e326deSLeon Romanovsky 	ret = mlx5_ib_create_srq(devr->s0, &attr, NULL);
501568e326deSLeon Romanovsky 	if (ret)
501668e326deSLeon Romanovsky 		goto err_create;
501768e326deSLeon Romanovsky 
5018e126ba97SEli Cohen 	atomic_inc(&devr->s0->ext.xrc.xrcd->usecnt);
50191a56ff6dSArtemy Kovalyov 	atomic_inc(&devr->s0->ext.cq->usecnt);
5020e126ba97SEli Cohen 	atomic_inc(&devr->p0->usecnt);
5021e126ba97SEli Cohen 	atomic_set(&devr->s0->usecnt, 0);
5022e126ba97SEli Cohen 
50234aa17b28SHaggai Abramonvsky 	memset(&attr, 0, sizeof(attr));
50244aa17b28SHaggai Abramonvsky 	attr.attr.max_sge = 1;
50254aa17b28SHaggai Abramonvsky 	attr.attr.max_wr = 1;
50264aa17b28SHaggai Abramonvsky 	attr.srq_type = IB_SRQT_BASIC;
502768e326deSLeon Romanovsky 	devr->s1 = rdma_zalloc_drv_obj(ibdev, ib_srq);
502868e326deSLeon Romanovsky 	if (!devr->s1) {
502968e326deSLeon Romanovsky 		ret = -ENOMEM;
50304aa17b28SHaggai Abramonvsky 		goto error5;
50314aa17b28SHaggai Abramonvsky 	}
503268e326deSLeon Romanovsky 
50334aa17b28SHaggai Abramonvsky 	devr->s1->device	= &dev->ib_dev;
50344aa17b28SHaggai Abramonvsky 	devr->s1->pd		= devr->p0;
50354aa17b28SHaggai Abramonvsky 	devr->s1->srq_type      = IB_SRQT_BASIC;
50361a56ff6dSArtemy Kovalyov 	devr->s1->ext.cq	= devr->c0;
503768e326deSLeon Romanovsky 
503868e326deSLeon Romanovsky 	ret = mlx5_ib_create_srq(devr->s1, &attr, NULL);
503968e326deSLeon Romanovsky 	if (ret)
504068e326deSLeon Romanovsky 		goto error6;
504168e326deSLeon Romanovsky 
50424aa17b28SHaggai Abramonvsky 	atomic_inc(&devr->p0->usecnt);
50431a56ff6dSArtemy Kovalyov 	atomic_set(&devr->s1->usecnt, 0);
50444aa17b28SHaggai Abramonvsky 
50457722f47eSHaggai Eran 	for (port = 0; port < ARRAY_SIZE(devr->ports); ++port) {
50467722f47eSHaggai Eran 		INIT_WORK(&devr->ports[port].pkey_change_work,
50477722f47eSHaggai Eran 			  pkey_change_handler);
50487722f47eSHaggai Eran 		devr->ports[port].devr = devr;
50497722f47eSHaggai Eran 	}
50507722f47eSHaggai Eran 
5051e126ba97SEli Cohen 	return 0;
5052e126ba97SEli Cohen 
505368e326deSLeon Romanovsky error6:
505468e326deSLeon Romanovsky 	kfree(devr->s1);
50554aa17b28SHaggai Abramonvsky error5:
5056c4367a26SShamir Rabinovitch 	mlx5_ib_destroy_srq(devr->s0, NULL);
505768e326deSLeon Romanovsky err_create:
505868e326deSLeon Romanovsky 	kfree(devr->s0);
5059e126ba97SEli Cohen error4:
5060c4367a26SShamir Rabinovitch 	mlx5_ib_dealloc_xrcd(devr->x1, NULL);
5061e126ba97SEli Cohen error3:
5062c4367a26SShamir Rabinovitch 	mlx5_ib_dealloc_xrcd(devr->x0, NULL);
5063e126ba97SEli Cohen error2:
5064c4367a26SShamir Rabinovitch 	mlx5_ib_destroy_cq(devr->c0, NULL);
5065e39afe3dSLeon Romanovsky err_create_cq:
5066e39afe3dSLeon Romanovsky 	kfree(devr->c0);
5067e126ba97SEli Cohen error1:
5068c4367a26SShamir Rabinovitch 	mlx5_ib_dealloc_pd(devr->p0, NULL);
5069e126ba97SEli Cohen error0:
507021a428a0SLeon Romanovsky 	kfree(devr->p0);
5071e126ba97SEli Cohen 	return ret;
5072e126ba97SEli Cohen }
5073e126ba97SEli Cohen 
5074e126ba97SEli Cohen static void destroy_dev_resources(struct mlx5_ib_resources *devr)
5075e126ba97SEli Cohen {
50767722f47eSHaggai Eran 	int port;
50777722f47eSHaggai Eran 
5078c4367a26SShamir Rabinovitch 	mlx5_ib_destroy_srq(devr->s1, NULL);
507968e326deSLeon Romanovsky 	kfree(devr->s1);
5080c4367a26SShamir Rabinovitch 	mlx5_ib_destroy_srq(devr->s0, NULL);
508168e326deSLeon Romanovsky 	kfree(devr->s0);
5082c4367a26SShamir Rabinovitch 	mlx5_ib_dealloc_xrcd(devr->x0, NULL);
5083c4367a26SShamir Rabinovitch 	mlx5_ib_dealloc_xrcd(devr->x1, NULL);
5084c4367a26SShamir Rabinovitch 	mlx5_ib_destroy_cq(devr->c0, NULL);
5085e39afe3dSLeon Romanovsky 	kfree(devr->c0);
5086c4367a26SShamir Rabinovitch 	mlx5_ib_dealloc_pd(devr->p0, NULL);
508721a428a0SLeon Romanovsky 	kfree(devr->p0);
50887722f47eSHaggai Eran 
50897722f47eSHaggai Eran 	/* Make sure no change P_Key work items are still executing */
50905d8f6a0eSMark Bloch 	for (port = 0; port < ARRAY_SIZE(devr->ports); ++port)
50917722f47eSHaggai Eran 		cancel_work_sync(&devr->ports[port].pkey_change_work);
5092e126ba97SEli Cohen }
5093e126ba97SEli Cohen 
5094b02289b3SArtemy Kovalyov static u32 get_core_cap_flags(struct ib_device *ibdev,
5095b02289b3SArtemy Kovalyov 			      struct mlx5_hca_vport_context *rep)
5096e53505a8SAchiad Shochat {
5097e53505a8SAchiad Shochat 	struct mlx5_ib_dev *dev = to_mdev(ibdev);
5098e53505a8SAchiad Shochat 	enum rdma_link_layer ll = mlx5_ib_port_link_layer(ibdev, 1);
5099e53505a8SAchiad Shochat 	u8 l3_type_cap = MLX5_CAP_ROCE(dev->mdev, l3_type);
5100e53505a8SAchiad Shochat 	u8 roce_version_cap = MLX5_CAP_ROCE(dev->mdev, roce_version);
510185c7c014SDaniel Jurgens 	bool raw_support = !mlx5_core_mp_enabled(dev->mdev);
5102e53505a8SAchiad Shochat 	u32 ret = 0;
5103e53505a8SAchiad Shochat 
5104b02289b3SArtemy Kovalyov 	if (rep->grh_required)
5105b02289b3SArtemy Kovalyov 		ret |= RDMA_CORE_CAP_IB_GRH_REQUIRED;
5106b02289b3SArtemy Kovalyov 
5107e53505a8SAchiad Shochat 	if (ll == IB_LINK_LAYER_INFINIBAND)
5108b02289b3SArtemy Kovalyov 		return ret | RDMA_CORE_PORT_IBA_IB;
5109e53505a8SAchiad Shochat 
511085c7c014SDaniel Jurgens 	if (raw_support)
5111b02289b3SArtemy Kovalyov 		ret |= RDMA_CORE_PORT_RAW_PACKET;
511272cd5717SOr Gerlitz 
5113e53505a8SAchiad Shochat 	if (!(l3_type_cap & MLX5_ROCE_L3_TYPE_IPV4_CAP))
511472cd5717SOr Gerlitz 		return ret;
5115e53505a8SAchiad Shochat 
5116e53505a8SAchiad Shochat 	if (!(l3_type_cap & MLX5_ROCE_L3_TYPE_IPV6_CAP))
511772cd5717SOr Gerlitz 		return ret;
5118e53505a8SAchiad Shochat 
5119e53505a8SAchiad Shochat 	if (roce_version_cap & MLX5_ROCE_VERSION_1_CAP)
5120e53505a8SAchiad Shochat 		ret |= RDMA_CORE_PORT_IBA_ROCE;
5121e53505a8SAchiad Shochat 
5122e53505a8SAchiad Shochat 	if (roce_version_cap & MLX5_ROCE_VERSION_2_CAP)
5123e53505a8SAchiad Shochat 		ret |= RDMA_CORE_PORT_IBA_ROCE_UDP_ENCAP;
5124e53505a8SAchiad Shochat 
5125e53505a8SAchiad Shochat 	return ret;
5126e53505a8SAchiad Shochat }
5127e53505a8SAchiad Shochat 
51287738613eSIra Weiny static int mlx5_port_immutable(struct ib_device *ibdev, u8 port_num,
51297738613eSIra Weiny 			       struct ib_port_immutable *immutable)
51307738613eSIra Weiny {
51317738613eSIra Weiny 	struct ib_port_attr attr;
5132ca5b91d6SOr Gerlitz 	struct mlx5_ib_dev *dev = to_mdev(ibdev);
5133ca5b91d6SOr Gerlitz 	enum rdma_link_layer ll = mlx5_ib_port_link_layer(ibdev, port_num);
5134b02289b3SArtemy Kovalyov 	struct mlx5_hca_vport_context rep = {0};
51357738613eSIra Weiny 	int err;
51367738613eSIra Weiny 
5137c4550c63SOr Gerlitz 	err = ib_query_port(ibdev, port_num, &attr);
51387738613eSIra Weiny 	if (err)
51397738613eSIra Weiny 		return err;
51407738613eSIra Weiny 
5141b02289b3SArtemy Kovalyov 	if (ll == IB_LINK_LAYER_INFINIBAND) {
5142b02289b3SArtemy Kovalyov 		err = mlx5_query_hca_vport_context(dev->mdev, 0, port_num, 0,
5143b02289b3SArtemy Kovalyov 						   &rep);
5144b02289b3SArtemy Kovalyov 		if (err)
5145b02289b3SArtemy Kovalyov 			return err;
5146b02289b3SArtemy Kovalyov 	}
5147b02289b3SArtemy Kovalyov 
51487738613eSIra Weiny 	immutable->pkey_tbl_len = attr.pkey_tbl_len;
51497738613eSIra Weiny 	immutable->gid_tbl_len = attr.gid_tbl_len;
5150b02289b3SArtemy Kovalyov 	immutable->core_cap_flags = get_core_cap_flags(ibdev, &rep);
5151ca5b91d6SOr Gerlitz 	if ((ll == IB_LINK_LAYER_INFINIBAND) || MLX5_CAP_GEN(dev->mdev, roce))
5152337877a4SIra Weiny 		immutable->max_mad_size = IB_MGMT_MAD_SIZE;
51537738613eSIra Weiny 
51547738613eSIra Weiny 	return 0;
51557738613eSIra Weiny }
51567738613eSIra Weiny 
51578e6efa3aSMark Bloch static int mlx5_port_rep_immutable(struct ib_device *ibdev, u8 port_num,
51588e6efa3aSMark Bloch 				   struct ib_port_immutable *immutable)
51598e6efa3aSMark Bloch {
51608e6efa3aSMark Bloch 	struct ib_port_attr attr;
51618e6efa3aSMark Bloch 	int err;
51628e6efa3aSMark Bloch 
51638e6efa3aSMark Bloch 	immutable->core_cap_flags = RDMA_CORE_PORT_RAW_PACKET;
51648e6efa3aSMark Bloch 
51658e6efa3aSMark Bloch 	err = ib_query_port(ibdev, port_num, &attr);
51668e6efa3aSMark Bloch 	if (err)
51678e6efa3aSMark Bloch 		return err;
51688e6efa3aSMark Bloch 
51698e6efa3aSMark Bloch 	immutable->pkey_tbl_len = attr.pkey_tbl_len;
51708e6efa3aSMark Bloch 	immutable->gid_tbl_len = attr.gid_tbl_len;
51718e6efa3aSMark Bloch 	immutable->core_cap_flags = RDMA_CORE_PORT_RAW_PACKET;
51728e6efa3aSMark Bloch 
51738e6efa3aSMark Bloch 	return 0;
51748e6efa3aSMark Bloch }
51758e6efa3aSMark Bloch 
51769abb0d1bSLeon Romanovsky static void get_dev_fw_str(struct ib_device *ibdev, char *str)
5177c7342823SIra Weiny {
5178c7342823SIra Weiny 	struct mlx5_ib_dev *dev =
5179c7342823SIra Weiny 		container_of(ibdev, struct mlx5_ib_dev, ib_dev);
51809abb0d1bSLeon Romanovsky 	snprintf(str, IB_FW_VERSION_NAME_MAX, "%d.%d.%04d",
51819abb0d1bSLeon Romanovsky 		 fw_rev_maj(dev->mdev), fw_rev_min(dev->mdev),
51829abb0d1bSLeon Romanovsky 		 fw_rev_sub(dev->mdev));
5183c7342823SIra Weiny }
5184c7342823SIra Weiny 
518545f95acdSOr Gerlitz static int mlx5_eth_lag_init(struct mlx5_ib_dev *dev)
51869ef9c640SAviv Heller {
51879ef9c640SAviv Heller 	struct mlx5_core_dev *mdev = dev->mdev;
51889ef9c640SAviv Heller 	struct mlx5_flow_namespace *ns = mlx5_get_flow_namespace(mdev,
51899ef9c640SAviv Heller 								 MLX5_FLOW_NAMESPACE_LAG);
51909ef9c640SAviv Heller 	struct mlx5_flow_table *ft;
51919ef9c640SAviv Heller 	int err;
51929ef9c640SAviv Heller 
51937c34ec19SAviv Heller 	if (!ns || !mlx5_lag_is_roce(mdev))
51949ef9c640SAviv Heller 		return 0;
51959ef9c640SAviv Heller 
51969ef9c640SAviv Heller 	err = mlx5_cmd_create_vport_lag(mdev);
51979ef9c640SAviv Heller 	if (err)
51989ef9c640SAviv Heller 		return err;
51999ef9c640SAviv Heller 
52009ef9c640SAviv Heller 	ft = mlx5_create_lag_demux_flow_table(ns, 0, 0);
52019ef9c640SAviv Heller 	if (IS_ERR(ft)) {
52029ef9c640SAviv Heller 		err = PTR_ERR(ft);
52039ef9c640SAviv Heller 		goto err_destroy_vport_lag;
52049ef9c640SAviv Heller 	}
52059ef9c640SAviv Heller 
52069a4ca38dSMark Bloch 	dev->flow_db->lag_demux_ft = ft;
52077c34ec19SAviv Heller 	dev->lag_active = true;
52089ef9c640SAviv Heller 	return 0;
52099ef9c640SAviv Heller 
52109ef9c640SAviv Heller err_destroy_vport_lag:
52119ef9c640SAviv Heller 	mlx5_cmd_destroy_vport_lag(mdev);
52129ef9c640SAviv Heller 	return err;
52139ef9c640SAviv Heller }
52149ef9c640SAviv Heller 
521545f95acdSOr Gerlitz static void mlx5_eth_lag_cleanup(struct mlx5_ib_dev *dev)
52169ef9c640SAviv Heller {
52179ef9c640SAviv Heller 	struct mlx5_core_dev *mdev = dev->mdev;
52189ef9c640SAviv Heller 
52197c34ec19SAviv Heller 	if (dev->lag_active) {
52207c34ec19SAviv Heller 		dev->lag_active = false;
52217c34ec19SAviv Heller 
52229a4ca38dSMark Bloch 		mlx5_destroy_flow_table(dev->flow_db->lag_demux_ft);
52239a4ca38dSMark Bloch 		dev->flow_db->lag_demux_ft = NULL;
52249ef9c640SAviv Heller 
52259ef9c640SAviv Heller 		mlx5_cmd_destroy_vport_lag(mdev);
52269ef9c640SAviv Heller 	}
52279ef9c640SAviv Heller }
52289ef9c640SAviv Heller 
52297fd8aefbSDaniel Jurgens static int mlx5_add_netdev_notifier(struct mlx5_ib_dev *dev, u8 port_num)
5230fc24fc5eSAchiad Shochat {
5231e53505a8SAchiad Shochat 	int err;
5232e53505a8SAchiad Shochat 
523395579e78SMark Bloch 	dev->port[port_num].roce.nb.notifier_call = mlx5_netdev_event;
523495579e78SMark Bloch 	err = register_netdevice_notifier(&dev->port[port_num].roce.nb);
52355ec8c83eSAviv Heller 	if (err) {
523695579e78SMark Bloch 		dev->port[port_num].roce.nb.notifier_call = NULL;
5237e53505a8SAchiad Shochat 		return err;
52385ec8c83eSAviv Heller 	}
5239e53505a8SAchiad Shochat 
5240d012f5d6SOr Gerlitz 	return 0;
5241d012f5d6SOr Gerlitz }
5242d012f5d6SOr Gerlitz 
52437fd8aefbSDaniel Jurgens static void mlx5_remove_netdev_notifier(struct mlx5_ib_dev *dev, u8 port_num)
5244e126ba97SEli Cohen {
524595579e78SMark Bloch 	if (dev->port[port_num].roce.nb.notifier_call) {
524695579e78SMark Bloch 		unregister_netdevice_notifier(&dev->port[port_num].roce.nb);
524795579e78SMark Bloch 		dev->port[port_num].roce.nb.notifier_call = NULL;
5248e126ba97SEli Cohen 	}
5249e126ba97SEli Cohen }
5250e126ba97SEli Cohen 
5251e3f1ed1fSLeon Romanovsky static int mlx5_enable_eth(struct mlx5_ib_dev *dev)
5252e126ba97SEli Cohen {
5253e126ba97SEli Cohen 	int err;
5254e126ba97SEli Cohen 
5255ca5b91d6SOr Gerlitz 	if (MLX5_CAP_GEN(dev->mdev, roce)) {
5256e53505a8SAchiad Shochat 		err = mlx5_nic_vport_enable_roce(dev->mdev);
5257e53505a8SAchiad Shochat 		if (err)
52588e6efa3aSMark Bloch 			return err;
5259ca5b91d6SOr Gerlitz 	}
5260e53505a8SAchiad Shochat 
526145f95acdSOr Gerlitz 	err = mlx5_eth_lag_init(dev);
52629ef9c640SAviv Heller 	if (err)
52639ef9c640SAviv Heller 		goto err_disable_roce;
52649ef9c640SAviv Heller 
5265e53505a8SAchiad Shochat 	return 0;
5266e53505a8SAchiad Shochat 
52679ef9c640SAviv Heller err_disable_roce:
5268ca5b91d6SOr Gerlitz 	if (MLX5_CAP_GEN(dev->mdev, roce))
52699ef9c640SAviv Heller 		mlx5_nic_vport_disable_roce(dev->mdev);
52709ef9c640SAviv Heller 
5271e53505a8SAchiad Shochat 	return err;
5272fc24fc5eSAchiad Shochat }
5273fc24fc5eSAchiad Shochat 
527445f95acdSOr Gerlitz static void mlx5_disable_eth(struct mlx5_ib_dev *dev)
5275fc24fc5eSAchiad Shochat {
527645f95acdSOr Gerlitz 	mlx5_eth_lag_cleanup(dev);
5277ca5b91d6SOr Gerlitz 	if (MLX5_CAP_GEN(dev->mdev, roce))
5278e53505a8SAchiad Shochat 		mlx5_nic_vport_disable_roce(dev->mdev);
5279fc24fc5eSAchiad Shochat }
5280fc24fc5eSAchiad Shochat 
/* Descriptor of one hardware counter exposed by the driver. */
struct mlx5_ib_counter {
	/* Counter name, the stringified field name in the tables below */
	const char *name;
	/* Byte offset of the counter in the firmware layout it is read from */
	size_t offset;
};
52857c16f477SKamal Heib 
/*
 * Initialiser for a struct mlx5_ib_counter describing field @_name of the
 * query_q_counter_out layout.
 */
#define INIT_Q_COUNTER(_name)						\
	{								\
		.name = #_name,						\
		.offset = MLX5_BYTE_OFF(query_q_counter_out, _name)	\
	}
52887c16f477SKamal Heib 
5289e1f24a79SParav Pandit static const struct mlx5_ib_counter basic_q_cnts[] = {
52907c16f477SKamal Heib 	INIT_Q_COUNTER(rx_write_requests),
52917c16f477SKamal Heib 	INIT_Q_COUNTER(rx_read_requests),
52927c16f477SKamal Heib 	INIT_Q_COUNTER(rx_atomic_requests),
52937c16f477SKamal Heib 	INIT_Q_COUNTER(out_of_buffer),
52947c16f477SKamal Heib };
52957c16f477SKamal Heib 
5296e1f24a79SParav Pandit static const struct mlx5_ib_counter out_of_seq_q_cnts[] = {
52977c16f477SKamal Heib 	INIT_Q_COUNTER(out_of_sequence),
52987c16f477SKamal Heib };
52997c16f477SKamal Heib 
5300e1f24a79SParav Pandit static const struct mlx5_ib_counter retrans_q_cnts[] = {
53017c16f477SKamal Heib 	INIT_Q_COUNTER(duplicate_request),
53027c16f477SKamal Heib 	INIT_Q_COUNTER(rnr_nak_retry_err),
53037c16f477SKamal Heib 	INIT_Q_COUNTER(packet_seq_err),
53047c16f477SKamal Heib 	INIT_Q_COUNTER(implied_nak_seq_err),
53057c16f477SKamal Heib 	INIT_Q_COUNTER(local_ack_timeout_err),
53067c16f477SKamal Heib };
53077c16f477SKamal Heib 
/*
 * Initialiser for a struct mlx5_ib_counter describing a congestion counter.
 * The offset is that of the <_name>_high field of the
 * query_cong_statistics_out layout.
 */
#define INIT_CONG_COUNTER(_name)					\
	{								\
		.name = #_name,						\
		.offset = MLX5_BYTE_OFF(query_cong_statistics_out,	\
					_name ## _high)			\
	}
5311e1f24a79SParav Pandit 
5312e1f24a79SParav Pandit static const struct mlx5_ib_counter cong_cnts[] = {
5313e1f24a79SParav Pandit 	INIT_CONG_COUNTER(rp_cnp_ignored),
5314e1f24a79SParav Pandit 	INIT_CONG_COUNTER(rp_cnp_handled),
5315e1f24a79SParav Pandit 	INIT_CONG_COUNTER(np_ecn_marked_roce_packets),
5316e1f24a79SParav Pandit 	INIT_CONG_COUNTER(np_cnp_sent),
5317e1f24a79SParav Pandit };
5318e1f24a79SParav Pandit 
531958dcb60aSParav Pandit static const struct mlx5_ib_counter extended_err_cnts[] = {
532058dcb60aSParav Pandit 	INIT_Q_COUNTER(resp_local_length_error),
532158dcb60aSParav Pandit 	INIT_Q_COUNTER(resp_cqe_error),
532258dcb60aSParav Pandit 	INIT_Q_COUNTER(req_cqe_error),
532358dcb60aSParav Pandit 	INIT_Q_COUNTER(req_remote_invalid_request),
532458dcb60aSParav Pandit 	INIT_Q_COUNTER(req_remote_access_errors),
532558dcb60aSParav Pandit 	INIT_Q_COUNTER(resp_remote_access_errors),
532658dcb60aSParav Pandit 	INIT_Q_COUNTER(resp_cqe_flush_error),
532758dcb60aSParav Pandit 	INIT_Q_COUNTER(req_cqe_flush_error),
532858dcb60aSParav Pandit };
532958dcb60aSParav Pandit 
/*
 * Initialiser for a struct mlx5_ib_counter describing an extended PPCNT
 * counter. The offset is that of the <_name>_high field inside
 * counter_set.eth_extended_cntrs_grp_data_layout of the ppcnt_reg layout.
 */
#define INIT_EXT_PPCNT_COUNTER(_name)					\
	{								\
		.name = #_name,						\
		.offset = MLX5_BYTE_OFF(ppcnt_reg,			\
			counter_set.eth_extended_cntrs_grp_data_layout._name##_high) \
	}
53349f876f3dSTalat Batheesh 
53359f876f3dSTalat Batheesh static const struct mlx5_ib_counter ext_ppcnt_cnts[] = {
53369f876f3dSTalat Batheesh 	INIT_EXT_PPCNT_COUNTER(rx_icrc_encapsulated),
53379f876f3dSTalat Batheesh };
53389f876f3dSTalat Batheesh 
53393e1f000fSParav Pandit static bool is_mdev_switchdev_mode(const struct mlx5_core_dev *mdev)
53403e1f000fSParav Pandit {
53413e1f000fSParav Pandit 	return MLX5_ESWITCH_MANAGER(mdev) &&
53423e1f000fSParav Pandit 	       mlx5_ib_eswitch_mode(mdev->priv.eswitch) ==
53433e1f000fSParav Pandit 		       MLX5_ESWITCH_OFFLOADS;
53443e1f000fSParav Pandit }
53453e1f000fSParav Pandit 
5346e1f24a79SParav Pandit static void mlx5_ib_dealloc_counters(struct mlx5_ib_dev *dev)
53470837e86aSMark Bloch {
53483e1f000fSParav Pandit 	int num_cnt_ports;
5349aac4492eSDaniel Jurgens 	int i;
53500837e86aSMark Bloch 
53513e1f000fSParav Pandit 	num_cnt_ports = is_mdev_switchdev_mode(dev->mdev) ? 1 : dev->num_ports;
53523e1f000fSParav Pandit 
53533e1f000fSParav Pandit 	for (i = 0; i < num_cnt_ports; i++) {
5354921c0f5bSParav Pandit 		if (dev->port[i].cnts.set_id_valid)
53550837e86aSMark Bloch 			mlx5_core_dealloc_q_counter(dev->mdev,
5356e1f24a79SParav Pandit 						    dev->port[i].cnts.set_id);
5357e1f24a79SParav Pandit 		kfree(dev->port[i].cnts.names);
5358e1f24a79SParav Pandit 		kfree(dev->port[i].cnts.offsets);
53597c16f477SKamal Heib 	}
53607c16f477SKamal Heib }
53617c16f477SKamal Heib 
5362e1f24a79SParav Pandit static int __mlx5_ib_alloc_counters(struct mlx5_ib_dev *dev,
5363e1f24a79SParav Pandit 				    struct mlx5_ib_counters *cnts)
53647c16f477SKamal Heib {
53657c16f477SKamal Heib 	u32 num_counters;
53667c16f477SKamal Heib 
53677c16f477SKamal Heib 	num_counters = ARRAY_SIZE(basic_q_cnts);
53687c16f477SKamal Heib 
53697c16f477SKamal Heib 	if (MLX5_CAP_GEN(dev->mdev, out_of_seq_cnt))
53707c16f477SKamal Heib 		num_counters += ARRAY_SIZE(out_of_seq_q_cnts);
53717c16f477SKamal Heib 
53727c16f477SKamal Heib 	if (MLX5_CAP_GEN(dev->mdev, retransmission_q_counters))
53737c16f477SKamal Heib 		num_counters += ARRAY_SIZE(retrans_q_cnts);
537458dcb60aSParav Pandit 
537558dcb60aSParav Pandit 	if (MLX5_CAP_GEN(dev->mdev, enhanced_error_q_counters))
537658dcb60aSParav Pandit 		num_counters += ARRAY_SIZE(extended_err_cnts);
537758dcb60aSParav Pandit 
5378e1f24a79SParav Pandit 	cnts->num_q_counters = num_counters;
53797c16f477SKamal Heib 
5380e1f24a79SParav Pandit 	if (MLX5_CAP_GEN(dev->mdev, cc_query_allowed)) {
5381e1f24a79SParav Pandit 		cnts->num_cong_counters = ARRAY_SIZE(cong_cnts);
5382e1f24a79SParav Pandit 		num_counters += ARRAY_SIZE(cong_cnts);
5383e1f24a79SParav Pandit 	}
53849f876f3dSTalat Batheesh 	if (MLX5_CAP_PCAM_FEATURE(dev->mdev, rx_icrc_encapsulated_counter)) {
53859f876f3dSTalat Batheesh 		cnts->num_ext_ppcnt_counters = ARRAY_SIZE(ext_ppcnt_cnts);
53869f876f3dSTalat Batheesh 		num_counters += ARRAY_SIZE(ext_ppcnt_cnts);
53879f876f3dSTalat Batheesh 	}
5388e1f24a79SParav Pandit 	cnts->names = kcalloc(num_counters, sizeof(cnts->names), GFP_KERNEL);
5389e1f24a79SParav Pandit 	if (!cnts->names)
53907c16f477SKamal Heib 		return -ENOMEM;
53917c16f477SKamal Heib 
5392e1f24a79SParav Pandit 	cnts->offsets = kcalloc(num_counters,
5393e1f24a79SParav Pandit 				sizeof(cnts->offsets), GFP_KERNEL);
5394e1f24a79SParav Pandit 	if (!cnts->offsets)
53957c16f477SKamal Heib 		goto err_names;
53967c16f477SKamal Heib 
53977c16f477SKamal Heib 	return 0;
53987c16f477SKamal Heib 
53997c16f477SKamal Heib err_names:
5400e1f24a79SParav Pandit 	kfree(cnts->names);
5401aac4492eSDaniel Jurgens 	cnts->names = NULL;
54027c16f477SKamal Heib 	return -ENOMEM;
54037c16f477SKamal Heib }
54047c16f477SKamal Heib 
5405e1f24a79SParav Pandit static void mlx5_ib_fill_counters(struct mlx5_ib_dev *dev,
54067c16f477SKamal Heib 				  const char **names,
54077c16f477SKamal Heib 				  size_t *offsets)
54087c16f477SKamal Heib {
54097c16f477SKamal Heib 	int i;
54107c16f477SKamal Heib 	int j = 0;
54117c16f477SKamal Heib 
54127c16f477SKamal Heib 	for (i = 0; i < ARRAY_SIZE(basic_q_cnts); i++, j++) {
54137c16f477SKamal Heib 		names[j] = basic_q_cnts[i].name;
54147c16f477SKamal Heib 		offsets[j] = basic_q_cnts[i].offset;
54157c16f477SKamal Heib 	}
54167c16f477SKamal Heib 
54177c16f477SKamal Heib 	if (MLX5_CAP_GEN(dev->mdev, out_of_seq_cnt)) {
54187c16f477SKamal Heib 		for (i = 0; i < ARRAY_SIZE(out_of_seq_q_cnts); i++, j++) {
54197c16f477SKamal Heib 			names[j] = out_of_seq_q_cnts[i].name;
54207c16f477SKamal Heib 			offsets[j] = out_of_seq_q_cnts[i].offset;
54217c16f477SKamal Heib 		}
54227c16f477SKamal Heib 	}
54237c16f477SKamal Heib 
54247c16f477SKamal Heib 	if (MLX5_CAP_GEN(dev->mdev, retransmission_q_counters)) {
54257c16f477SKamal Heib 		for (i = 0; i < ARRAY_SIZE(retrans_q_cnts); i++, j++) {
54267c16f477SKamal Heib 			names[j] = retrans_q_cnts[i].name;
54277c16f477SKamal Heib 			offsets[j] = retrans_q_cnts[i].offset;
54287c16f477SKamal Heib 		}
54297c16f477SKamal Heib 	}
5430e1f24a79SParav Pandit 
543158dcb60aSParav Pandit 	if (MLX5_CAP_GEN(dev->mdev, enhanced_error_q_counters)) {
543258dcb60aSParav Pandit 		for (i = 0; i < ARRAY_SIZE(extended_err_cnts); i++, j++) {
543358dcb60aSParav Pandit 			names[j] = extended_err_cnts[i].name;
543458dcb60aSParav Pandit 			offsets[j] = extended_err_cnts[i].offset;
543558dcb60aSParav Pandit 		}
543658dcb60aSParav Pandit 	}
543758dcb60aSParav Pandit 
5438e1f24a79SParav Pandit 	if (MLX5_CAP_GEN(dev->mdev, cc_query_allowed)) {
5439e1f24a79SParav Pandit 		for (i = 0; i < ARRAY_SIZE(cong_cnts); i++, j++) {
5440e1f24a79SParav Pandit 			names[j] = cong_cnts[i].name;
5441e1f24a79SParav Pandit 			offsets[j] = cong_cnts[i].offset;
5442e1f24a79SParav Pandit 		}
5443e1f24a79SParav Pandit 	}
54449f876f3dSTalat Batheesh 
54459f876f3dSTalat Batheesh 	if (MLX5_CAP_PCAM_FEATURE(dev->mdev, rx_icrc_encapsulated_counter)) {
54469f876f3dSTalat Batheesh 		for (i = 0; i < ARRAY_SIZE(ext_ppcnt_cnts); i++, j++) {
54479f876f3dSTalat Batheesh 			names[j] = ext_ppcnt_cnts[i].name;
54489f876f3dSTalat Batheesh 			offsets[j] = ext_ppcnt_cnts[i].offset;
54499f876f3dSTalat Batheesh 		}
54509f876f3dSTalat Batheesh 	}
54510837e86aSMark Bloch }
54520837e86aSMark Bloch 
5453e1f24a79SParav Pandit static int mlx5_ib_alloc_counters(struct mlx5_ib_dev *dev)
54540837e86aSMark Bloch {
54553e1f000fSParav Pandit 	int num_cnt_ports;
5456aac4492eSDaniel Jurgens 	int err = 0;
54570837e86aSMark Bloch 	int i;
5458aa74be6eSYishai Hadas 	bool is_shared;
5459aa74be6eSYishai Hadas 
5460aa74be6eSYishai Hadas 	is_shared = MLX5_CAP_GEN(dev->mdev, log_max_uctx) != 0;
54613e1f000fSParav Pandit 	num_cnt_ports = is_mdev_switchdev_mode(dev->mdev) ? 1 : dev->num_ports;
54620837e86aSMark Bloch 
54633e1f000fSParav Pandit 	for (i = 0; i < num_cnt_ports; i++) {
5464aac4492eSDaniel Jurgens 		err = __mlx5_ib_alloc_counters(dev, &dev->port[i].cnts);
5465aac4492eSDaniel Jurgens 		if (err)
5466aac4492eSDaniel Jurgens 			goto err_alloc;
54677c16f477SKamal Heib 
5468aac4492eSDaniel Jurgens 		mlx5_ib_fill_counters(dev, dev->port[i].cnts.names,
5469aac4492eSDaniel Jurgens 				      dev->port[i].cnts.offsets);
5470aac4492eSDaniel Jurgens 
5471aa74be6eSYishai Hadas 		err = mlx5_cmd_alloc_q_counter(dev->mdev,
5472aa74be6eSYishai Hadas 					       &dev->port[i].cnts.set_id,
5473aa74be6eSYishai Hadas 					       is_shared ?
5474aa74be6eSYishai Hadas 					       MLX5_SHARED_RESOURCE_UID : 0);
5475aac4492eSDaniel Jurgens 		if (err) {
54760837e86aSMark Bloch 			mlx5_ib_warn(dev,
54770837e86aSMark Bloch 				     "couldn't allocate queue counter for port %d, err %d\n",
5478aac4492eSDaniel Jurgens 				     i + 1, err);
5479aac4492eSDaniel Jurgens 			goto err_alloc;
54800837e86aSMark Bloch 		}
5481aac4492eSDaniel Jurgens 		dev->port[i].cnts.set_id_valid = true;
54820837e86aSMark Bloch 	}
54830837e86aSMark Bloch 	return 0;
54840837e86aSMark Bloch 
5485aac4492eSDaniel Jurgens err_alloc:
5486aac4492eSDaniel Jurgens 	mlx5_ib_dealloc_counters(dev);
5487aac4492eSDaniel Jurgens 	return err;
54880837e86aSMark Bloch }
54890837e86aSMark Bloch 
54903e1f000fSParav Pandit static const struct mlx5_ib_counters *get_counters(struct mlx5_ib_dev *dev,
54913e1f000fSParav Pandit 						   u8 port_num)
54923e1f000fSParav Pandit {
54933e1f000fSParav Pandit 	return is_mdev_switchdev_mode(dev->mdev) ? &dev->port[0].cnts :
54943e1f000fSParav Pandit 						   &dev->port[port_num].cnts;
54953e1f000fSParav Pandit }
54963e1f000fSParav Pandit 
54973e1f000fSParav Pandit /**
54983e1f000fSParav Pandit  * mlx5_ib_get_counters_id - Returns counters id to use for device+port
54993e1f000fSParav Pandit  * @dev:	Pointer to mlx5 IB device
55003e1f000fSParav Pandit  * @port_num:	Zero based port number
55013e1f000fSParav Pandit  *
55023e1f000fSParav Pandit  * mlx5_ib_get_counters_id() Returns counters set id to use for given
55033e1f000fSParav Pandit  * device port combination in switchdev and non switchdev mode of the
55043e1f000fSParav Pandit  * parent device.
55053e1f000fSParav Pandit  */
55063e1f000fSParav Pandit u16 mlx5_ib_get_counters_id(struct mlx5_ib_dev *dev, u8 port_num)
55073e1f000fSParav Pandit {
55083e1f000fSParav Pandit 	const struct mlx5_ib_counters *cnts = get_counters(dev, port_num);
55093e1f000fSParav Pandit 
55103e1f000fSParav Pandit 	return cnts->set_id;
55113e1f000fSParav Pandit }
55123e1f000fSParav Pandit 
55130ad17a8fSMark Bloch static struct rdma_hw_stats *mlx5_ib_alloc_hw_stats(struct ib_device *ibdev,
55140ad17a8fSMark Bloch 						    u8 port_num)
55150ad17a8fSMark Bloch {
55167c16f477SKamal Heib 	struct mlx5_ib_dev *dev = to_mdev(ibdev);
55173e1f000fSParav Pandit 	const struct mlx5_ib_counters *cnts;
55183e1f000fSParav Pandit 	bool is_switchdev = is_mdev_switchdev_mode(dev->mdev);
55190ad17a8fSMark Bloch 
55203e1f000fSParav Pandit 	if ((is_switchdev && port_num) || (!is_switchdev && !port_num))
55210ad17a8fSMark Bloch 		return NULL;
55220ad17a8fSMark Bloch 
55233e1f000fSParav Pandit 	cnts = get_counters(dev, port_num - 1);
55243e1f000fSParav Pandit 
55255dcecbc9SParav Pandit 	return rdma_alloc_hw_stats_struct(cnts->names,
55265dcecbc9SParav Pandit 					  cnts->num_q_counters +
55275dcecbc9SParav Pandit 					  cnts->num_cong_counters +
55285dcecbc9SParav Pandit 					  cnts->num_ext_ppcnt_counters,
55290ad17a8fSMark Bloch 					  RDMA_HW_STATS_DEFAULT_LIFESPAN);
55300ad17a8fSMark Bloch }
55310ad17a8fSMark Bloch 
5532aac4492eSDaniel Jurgens static int mlx5_ib_query_q_counters(struct mlx5_core_dev *mdev,
55335dcecbc9SParav Pandit 				    const struct mlx5_ib_counters *cnts,
5534318d535cSMark Zhang 				    struct rdma_hw_stats *stats,
5535318d535cSMark Zhang 				    u16 set_id)
5536e1f24a79SParav Pandit {
5537e1f24a79SParav Pandit 	int outlen = MLX5_ST_SZ_BYTES(query_q_counter_out);
5538e1f24a79SParav Pandit 	void *out;
5539e1f24a79SParav Pandit 	__be32 val;
5540e1f24a79SParav Pandit 	int ret, i;
5541e1f24a79SParav Pandit 
55421b9a07eeSLeon Romanovsky 	out = kvzalloc(outlen, GFP_KERNEL);
5543e1f24a79SParav Pandit 	if (!out)
5544e1f24a79SParav Pandit 		return -ENOMEM;
5545e1f24a79SParav Pandit 
5546318d535cSMark Zhang 	ret = mlx5_core_query_q_counter(mdev, set_id, 0, out, outlen);
5547e1f24a79SParav Pandit 	if (ret)
5548e1f24a79SParav Pandit 		goto free;
5549e1f24a79SParav Pandit 
55505dcecbc9SParav Pandit 	for (i = 0; i < cnts->num_q_counters; i++) {
55515dcecbc9SParav Pandit 		val = *(__be32 *)(out + cnts->offsets[i]);
5552e1f24a79SParav Pandit 		stats->value[i] = (u64)be32_to_cpu(val);
5553e1f24a79SParav Pandit 	}
5554e1f24a79SParav Pandit 
5555e1f24a79SParav Pandit free:
5556e1f24a79SParav Pandit 	kvfree(out);
5557e1f24a79SParav Pandit 	return ret;
5558e1f24a79SParav Pandit }
5559e1f24a79SParav Pandit 
55609f876f3dSTalat Batheesh static int mlx5_ib_query_ext_ppcnt_counters(struct mlx5_ib_dev *dev,
55615dcecbc9SParav Pandit 					    const struct mlx5_ib_counters *cnts,
55629f876f3dSTalat Batheesh 					    struct rdma_hw_stats *stats)
55639f876f3dSTalat Batheesh {
55645dcecbc9SParav Pandit 	int offset = cnts->num_q_counters + cnts->num_cong_counters;
55659f876f3dSTalat Batheesh 	int sz = MLX5_ST_SZ_BYTES(ppcnt_reg);
55669f876f3dSTalat Batheesh 	int ret, i;
55679f876f3dSTalat Batheesh 	void *out;
55689f876f3dSTalat Batheesh 
55699f876f3dSTalat Batheesh 	out = kvzalloc(sz, GFP_KERNEL);
55709f876f3dSTalat Batheesh 	if (!out)
55719f876f3dSTalat Batheesh 		return -ENOMEM;
55729f876f3dSTalat Batheesh 
55739f876f3dSTalat Batheesh 	ret = mlx5_cmd_query_ext_ppcnt_counters(dev->mdev, out);
55749f876f3dSTalat Batheesh 	if (ret)
55759f876f3dSTalat Batheesh 		goto free;
55769f876f3dSTalat Batheesh 
55775dcecbc9SParav Pandit 	for (i = 0; i < cnts->num_ext_ppcnt_counters; i++)
55789f876f3dSTalat Batheesh 		stats->value[i + offset] =
55799f876f3dSTalat Batheesh 			be64_to_cpup((__be64 *)(out +
55805dcecbc9SParav Pandit 				    cnts->offsets[i + offset]));
55819f876f3dSTalat Batheesh free:
55829f876f3dSTalat Batheesh 	kvfree(out);
55839f876f3dSTalat Batheesh 	return ret;
55849f876f3dSTalat Batheesh }
55859f876f3dSTalat Batheesh 
55860ad17a8fSMark Bloch static int mlx5_ib_get_hw_stats(struct ib_device *ibdev,
55870ad17a8fSMark Bloch 				struct rdma_hw_stats *stats,
55887c16f477SKamal Heib 				u8 port_num, int index)
55890ad17a8fSMark Bloch {
55900ad17a8fSMark Bloch 	struct mlx5_ib_dev *dev = to_mdev(ibdev);
55913e1f000fSParav Pandit 	const struct mlx5_ib_counters *cnts = get_counters(dev, port_num - 1);
5592aac4492eSDaniel Jurgens 	struct mlx5_core_dev *mdev;
5593e1f24a79SParav Pandit 	int ret, num_counters;
5594aac4492eSDaniel Jurgens 	u8 mdev_port_num;
55950ad17a8fSMark Bloch 
55967c16f477SKamal Heib 	if (!stats)
5597e1f24a79SParav Pandit 		return -EINVAL;
55980ad17a8fSMark Bloch 
55995dcecbc9SParav Pandit 	num_counters = cnts->num_q_counters +
56005dcecbc9SParav Pandit 		       cnts->num_cong_counters +
56015dcecbc9SParav Pandit 		       cnts->num_ext_ppcnt_counters;
5602aac4492eSDaniel Jurgens 
5603aac4492eSDaniel Jurgens 	/* q_counters are per IB device, query the master mdev */
56045dcecbc9SParav Pandit 	ret = mlx5_ib_query_q_counters(dev->mdev, cnts, stats, cnts->set_id);
56050ad17a8fSMark Bloch 	if (ret)
5606e1f24a79SParav Pandit 		return ret;
56070ad17a8fSMark Bloch 
56089f876f3dSTalat Batheesh 	if (MLX5_CAP_PCAM_FEATURE(dev->mdev, rx_icrc_encapsulated_counter)) {
56095dcecbc9SParav Pandit 		ret =  mlx5_ib_query_ext_ppcnt_counters(dev, cnts, stats);
56109f876f3dSTalat Batheesh 		if (ret)
56119f876f3dSTalat Batheesh 			return ret;
56129f876f3dSTalat Batheesh 	}
56139f876f3dSTalat Batheesh 
5614e1f24a79SParav Pandit 	if (MLX5_CAP_GEN(dev->mdev, cc_query_allowed)) {
5615aac4492eSDaniel Jurgens 		mdev = mlx5_ib_get_native_port_mdev(dev, port_num,
5616aac4492eSDaniel Jurgens 						    &mdev_port_num);
5617aac4492eSDaniel Jurgens 		if (!mdev) {
5618aac4492eSDaniel Jurgens 			/* If port is not affiliated yet, its in down state
5619aac4492eSDaniel Jurgens 			 * which doesn't have any counters yet, so it would be
5620aac4492eSDaniel Jurgens 			 * zero. So no need to read from the HCA.
5621aac4492eSDaniel Jurgens 			 */
5622aac4492eSDaniel Jurgens 			goto done;
5623aac4492eSDaniel Jurgens 		}
562471a0ff65SMajd Dibbiny 		ret = mlx5_lag_query_cong_counters(dev->mdev,
562571a0ff65SMajd Dibbiny 						   stats->value +
56265dcecbc9SParav Pandit 						   cnts->num_q_counters,
56275dcecbc9SParav Pandit 						   cnts->num_cong_counters,
56285dcecbc9SParav Pandit 						   cnts->offsets +
56295dcecbc9SParav Pandit 						   cnts->num_q_counters);
5630aac4492eSDaniel Jurgens 
5631aac4492eSDaniel Jurgens 		mlx5_ib_put_native_port_mdev(dev, port_num);
5632e1f24a79SParav Pandit 		if (ret)
5633e1f24a79SParav Pandit 			return ret;
56340ad17a8fSMark Bloch 	}
56357c16f477SKamal Heib 
5636aac4492eSDaniel Jurgens done:
5637e1f24a79SParav Pandit 	return num_counters;
56380ad17a8fSMark Bloch }
56390ad17a8fSMark Bloch 
564018d422ceSMark Zhang static struct rdma_hw_stats *
564118d422ceSMark Zhang mlx5_ib_counter_alloc_stats(struct rdma_counter *counter)
564218d422ceSMark Zhang {
564318d422ceSMark Zhang 	struct mlx5_ib_dev *dev = to_mdev(counter->device);
56445dcecbc9SParav Pandit 	const struct mlx5_ib_counters *cnts =
56453e1f000fSParav Pandit 		get_counters(dev, counter->port - 1);
564618d422ceSMark Zhang 
564718d422ceSMark Zhang 	/* Q counters are in the beginning of all counters */
56485dcecbc9SParav Pandit 	return rdma_alloc_hw_stats_struct(cnts->names,
56495dcecbc9SParav Pandit 					  cnts->num_q_counters,
565018d422ceSMark Zhang 					  RDMA_HW_STATS_DEFAULT_LIFESPAN);
565118d422ceSMark Zhang }
565218d422ceSMark Zhang 
565318d422ceSMark Zhang static int mlx5_ib_counter_update_stats(struct rdma_counter *counter)
565418d422ceSMark Zhang {
565518d422ceSMark Zhang 	struct mlx5_ib_dev *dev = to_mdev(counter->device);
56563e1f000fSParav Pandit 	const struct mlx5_ib_counters *cnts =
56573e1f000fSParav Pandit 		get_counters(dev, counter->port - 1);
565818d422ceSMark Zhang 
56595dcecbc9SParav Pandit 	return mlx5_ib_query_q_counters(dev->mdev, cnts,
566018d422ceSMark Zhang 					counter->stats, counter->id);
566118d422ceSMark Zhang }
566218d422ceSMark Zhang 
566345842fc6SMark Zhang static int mlx5_ib_counter_bind_qp(struct rdma_counter *counter,
566445842fc6SMark Zhang 				   struct ib_qp *qp)
566545842fc6SMark Zhang {
566645842fc6SMark Zhang 	struct mlx5_ib_dev *dev = to_mdev(qp->device);
566745842fc6SMark Zhang 	u16 cnt_set_id = 0;
566845842fc6SMark Zhang 	int err;
566945842fc6SMark Zhang 
567045842fc6SMark Zhang 	if (!counter->id) {
567145842fc6SMark Zhang 		err = mlx5_cmd_alloc_q_counter(dev->mdev,
567245842fc6SMark Zhang 					       &cnt_set_id,
567345842fc6SMark Zhang 					       MLX5_SHARED_RESOURCE_UID);
567445842fc6SMark Zhang 		if (err)
567545842fc6SMark Zhang 			return err;
567645842fc6SMark Zhang 		counter->id = cnt_set_id;
567745842fc6SMark Zhang 	}
567845842fc6SMark Zhang 
567945842fc6SMark Zhang 	err = mlx5_ib_qp_set_counter(qp, counter);
568045842fc6SMark Zhang 	if (err)
568145842fc6SMark Zhang 		goto fail_set_counter;
568245842fc6SMark Zhang 
568345842fc6SMark Zhang 	return 0;
568445842fc6SMark Zhang 
568545842fc6SMark Zhang fail_set_counter:
568645842fc6SMark Zhang 	mlx5_core_dealloc_q_counter(dev->mdev, cnt_set_id);
568745842fc6SMark Zhang 	counter->id = 0;
568845842fc6SMark Zhang 
568945842fc6SMark Zhang 	return err;
569045842fc6SMark Zhang }
569145842fc6SMark Zhang 
569245842fc6SMark Zhang static int mlx5_ib_counter_unbind_qp(struct ib_qp *qp)
569345842fc6SMark Zhang {
569445842fc6SMark Zhang 	return mlx5_ib_qp_set_counter(qp, NULL);
569545842fc6SMark Zhang }
569645842fc6SMark Zhang 
569745842fc6SMark Zhang static int mlx5_ib_counter_dealloc(struct rdma_counter *counter)
569845842fc6SMark Zhang {
569945842fc6SMark Zhang 	struct mlx5_ib_dev *dev = to_mdev(counter->device);
570045842fc6SMark Zhang 
570145842fc6SMark Zhang 	return mlx5_core_dealloc_q_counter(dev->mdev, counter->id);
570245842fc6SMark Zhang }
570345842fc6SMark Zhang 
5704f6a8a19bSDenis Drozdov static int mlx5_ib_rn_get_params(struct ib_device *device, u8 port_num,
5705693dfd5aSErez Shitrit 				 enum rdma_netdev_t type,
5706f6a8a19bSDenis Drozdov 				 struct rdma_netdev_alloc_params *params)
5707693dfd5aSErez Shitrit {
5708693dfd5aSErez Shitrit 	if (type != RDMA_NETDEV_IPOIB)
5709f6a8a19bSDenis Drozdov 		return -EOPNOTSUPP;
5710693dfd5aSErez Shitrit 
5711f6a8a19bSDenis Drozdov 	return mlx5_rdma_rn_get_params(to_mdev(device)->mdev, device, params);
5712693dfd5aSErez Shitrit }
5713693dfd5aSErez Shitrit 
5714fe248c3aSMaor Gottlieb static void delay_drop_debugfs_cleanup(struct mlx5_ib_dev *dev)
5715fe248c3aSMaor Gottlieb {
5716fe248c3aSMaor Gottlieb 	if (!dev->delay_drop.dbg)
5717fe248c3aSMaor Gottlieb 		return;
5718fe248c3aSMaor Gottlieb 	debugfs_remove_recursive(dev->delay_drop.dbg->dir_debugfs);
5719fe248c3aSMaor Gottlieb 	kfree(dev->delay_drop.dbg);
5720fe248c3aSMaor Gottlieb 	dev->delay_drop.dbg = NULL;
5721fe248c3aSMaor Gottlieb }
5722fe248c3aSMaor Gottlieb 
572303404e8aSMaor Gottlieb static void cancel_delay_drop(struct mlx5_ib_dev *dev)
572403404e8aSMaor Gottlieb {
572503404e8aSMaor Gottlieb 	if (!(dev->ib_dev.attrs.raw_packet_caps & IB_RAW_PACKET_CAP_DELAY_DROP))
572603404e8aSMaor Gottlieb 		return;
572703404e8aSMaor Gottlieb 
572803404e8aSMaor Gottlieb 	cancel_work_sync(&dev->delay_drop.delay_drop_work);
5729fe248c3aSMaor Gottlieb 	delay_drop_debugfs_cleanup(dev);
5730fe248c3aSMaor Gottlieb }
5731fe248c3aSMaor Gottlieb 
5732fe248c3aSMaor Gottlieb static ssize_t delay_drop_timeout_read(struct file *filp, char __user *buf,
5733fe248c3aSMaor Gottlieb 				       size_t count, loff_t *pos)
5734fe248c3aSMaor Gottlieb {
5735fe248c3aSMaor Gottlieb 	struct mlx5_ib_delay_drop *delay_drop = filp->private_data;
5736fe248c3aSMaor Gottlieb 	char lbuf[20];
5737fe248c3aSMaor Gottlieb 	int len;
5738fe248c3aSMaor Gottlieb 
5739fe248c3aSMaor Gottlieb 	len = snprintf(lbuf, sizeof(lbuf), "%u\n", delay_drop->timeout);
5740fe248c3aSMaor Gottlieb 	return simple_read_from_buffer(buf, count, pos, lbuf, len);
5741fe248c3aSMaor Gottlieb }
5742fe248c3aSMaor Gottlieb 
5743fe248c3aSMaor Gottlieb static ssize_t delay_drop_timeout_write(struct file *filp, const char __user *buf,
5744fe248c3aSMaor Gottlieb 					size_t count, loff_t *pos)
5745fe248c3aSMaor Gottlieb {
5746fe248c3aSMaor Gottlieb 	struct mlx5_ib_delay_drop *delay_drop = filp->private_data;
5747fe248c3aSMaor Gottlieb 	u32 timeout;
5748fe248c3aSMaor Gottlieb 	u32 var;
5749fe248c3aSMaor Gottlieb 
5750fe248c3aSMaor Gottlieb 	if (kstrtouint_from_user(buf, count, 0, &var))
5751fe248c3aSMaor Gottlieb 		return -EFAULT;
5752fe248c3aSMaor Gottlieb 
5753fe248c3aSMaor Gottlieb 	timeout = min_t(u32, roundup(var, 100), MLX5_MAX_DELAY_DROP_TIMEOUT_MS *
5754fe248c3aSMaor Gottlieb 			1000);
5755fe248c3aSMaor Gottlieb 	if (timeout != var)
5756fe248c3aSMaor Gottlieb 		mlx5_ib_dbg(delay_drop->dev, "Round delay drop timeout to %u usec\n",
5757fe248c3aSMaor Gottlieb 			    timeout);
5758fe248c3aSMaor Gottlieb 
5759fe248c3aSMaor Gottlieb 	delay_drop->timeout = timeout;
5760fe248c3aSMaor Gottlieb 
5761fe248c3aSMaor Gottlieb 	return count;
5762fe248c3aSMaor Gottlieb }
5763fe248c3aSMaor Gottlieb 
5764fe248c3aSMaor Gottlieb static const struct file_operations fops_delay_drop_timeout = {
5765fe248c3aSMaor Gottlieb 	.owner	= THIS_MODULE,
5766fe248c3aSMaor Gottlieb 	.open	= simple_open,
5767fe248c3aSMaor Gottlieb 	.write	= delay_drop_timeout_write,
5768fe248c3aSMaor Gottlieb 	.read	= delay_drop_timeout_read,
5769fe248c3aSMaor Gottlieb };
5770fe248c3aSMaor Gottlieb 
5771fe248c3aSMaor Gottlieb static int delay_drop_debugfs_init(struct mlx5_ib_dev *dev)
5772fe248c3aSMaor Gottlieb {
5773fe248c3aSMaor Gottlieb 	struct mlx5_ib_dbg_delay_drop *dbg;
5774fe248c3aSMaor Gottlieb 
5775fe248c3aSMaor Gottlieb 	if (!mlx5_debugfs_root)
5776fe248c3aSMaor Gottlieb 		return 0;
5777fe248c3aSMaor Gottlieb 
5778fe248c3aSMaor Gottlieb 	dbg = kzalloc(sizeof(*dbg), GFP_KERNEL);
5779fe248c3aSMaor Gottlieb 	if (!dbg)
5780fe248c3aSMaor Gottlieb 		return -ENOMEM;
5781fe248c3aSMaor Gottlieb 
5782cbafad87SSudip Mukherjee 	dev->delay_drop.dbg = dbg;
5783cbafad87SSudip Mukherjee 
5784fe248c3aSMaor Gottlieb 	dbg->dir_debugfs =
5785fe248c3aSMaor Gottlieb 		debugfs_create_dir("delay_drop",
5786fe248c3aSMaor Gottlieb 				   dev->mdev->priv.dbg_root);
5787fe248c3aSMaor Gottlieb 	if (!dbg->dir_debugfs)
5788cbafad87SSudip Mukherjee 		goto out_debugfs;
5789fe248c3aSMaor Gottlieb 
5790fe248c3aSMaor Gottlieb 	dbg->events_cnt_debugfs =
5791fe248c3aSMaor Gottlieb 		debugfs_create_atomic_t("num_timeout_events", 0400,
5792fe248c3aSMaor Gottlieb 					dbg->dir_debugfs,
5793fe248c3aSMaor Gottlieb 					&dev->delay_drop.events_cnt);
5794fe248c3aSMaor Gottlieb 	if (!dbg->events_cnt_debugfs)
5795fe248c3aSMaor Gottlieb 		goto out_debugfs;
5796fe248c3aSMaor Gottlieb 
5797fe248c3aSMaor Gottlieb 	dbg->rqs_cnt_debugfs =
5798fe248c3aSMaor Gottlieb 		debugfs_create_atomic_t("num_rqs", 0400,
5799fe248c3aSMaor Gottlieb 					dbg->dir_debugfs,
5800fe248c3aSMaor Gottlieb 					&dev->delay_drop.rqs_cnt);
5801fe248c3aSMaor Gottlieb 	if (!dbg->rqs_cnt_debugfs)
5802fe248c3aSMaor Gottlieb 		goto out_debugfs;
5803fe248c3aSMaor Gottlieb 
5804fe248c3aSMaor Gottlieb 	dbg->timeout_debugfs =
5805fe248c3aSMaor Gottlieb 		debugfs_create_file("timeout", 0600,
5806fe248c3aSMaor Gottlieb 				    dbg->dir_debugfs,
5807fe248c3aSMaor Gottlieb 				    &dev->delay_drop,
5808fe248c3aSMaor Gottlieb 				    &fops_delay_drop_timeout);
5809fe248c3aSMaor Gottlieb 	if (!dbg->timeout_debugfs)
5810fe248c3aSMaor Gottlieb 		goto out_debugfs;
5811fe248c3aSMaor Gottlieb 
5812fe248c3aSMaor Gottlieb 	return 0;
5813fe248c3aSMaor Gottlieb 
5814fe248c3aSMaor Gottlieb out_debugfs:
5815fe248c3aSMaor Gottlieb 	delay_drop_debugfs_cleanup(dev);
5816fe248c3aSMaor Gottlieb 	return -ENOMEM;
581703404e8aSMaor Gottlieb }
581803404e8aSMaor Gottlieb 
581903404e8aSMaor Gottlieb static void init_delay_drop(struct mlx5_ib_dev *dev)
582003404e8aSMaor Gottlieb {
582103404e8aSMaor Gottlieb 	if (!(dev->ib_dev.attrs.raw_packet_caps & IB_RAW_PACKET_CAP_DELAY_DROP))
582203404e8aSMaor Gottlieb 		return;
582303404e8aSMaor Gottlieb 
582403404e8aSMaor Gottlieb 	mutex_init(&dev->delay_drop.lock);
582503404e8aSMaor Gottlieb 	dev->delay_drop.dev = dev;
582603404e8aSMaor Gottlieb 	dev->delay_drop.activate = false;
582703404e8aSMaor Gottlieb 	dev->delay_drop.timeout = MLX5_MAX_DELAY_DROP_TIMEOUT_MS * 1000;
582803404e8aSMaor Gottlieb 	INIT_WORK(&dev->delay_drop.delay_drop_work, delay_drop_handler);
5829fe248c3aSMaor Gottlieb 	atomic_set(&dev->delay_drop.rqs_cnt, 0);
5830fe248c3aSMaor Gottlieb 	atomic_set(&dev->delay_drop.events_cnt, 0);
5831fe248c3aSMaor Gottlieb 
5832fe248c3aSMaor Gottlieb 	if (delay_drop_debugfs_init(dev))
5833fe248c3aSMaor Gottlieb 		mlx5_ib_warn(dev, "Failed to init delay drop debugfs\n");
583403404e8aSMaor Gottlieb }
583503404e8aSMaor Gottlieb 
583632f69e4bSDaniel Jurgens static void mlx5_ib_unbind_slave_port(struct mlx5_ib_dev *ibdev,
583732f69e4bSDaniel Jurgens 				      struct mlx5_ib_multiport_info *mpi)
583832f69e4bSDaniel Jurgens {
583932f69e4bSDaniel Jurgens 	u8 port_num = mlx5_core_native_port_num(mpi->mdev) - 1;
584032f69e4bSDaniel Jurgens 	struct mlx5_ib_port *port = &ibdev->port[port_num];
584132f69e4bSDaniel Jurgens 	int comps;
584232f69e4bSDaniel Jurgens 	int err;
584332f69e4bSDaniel Jurgens 	int i;
584432f69e4bSDaniel Jurgens 
58459dc4cfffSLeon Romanovsky 	lockdep_assert_held(&mlx5_ib_multiport_mutex);
58469dc4cfffSLeon Romanovsky 
5847a9e546e7SParav Pandit 	mlx5_ib_cleanup_cong_debugfs(ibdev, port_num);
5848a9e546e7SParav Pandit 
584932f69e4bSDaniel Jurgens 	spin_lock(&port->mp.mpi_lock);
585032f69e4bSDaniel Jurgens 	if (!mpi->ibdev) {
585132f69e4bSDaniel Jurgens 		spin_unlock(&port->mp.mpi_lock);
585232f69e4bSDaniel Jurgens 		return;
585332f69e4bSDaniel Jurgens 	}
5854df097a27SSaeed Mahameed 
585532f69e4bSDaniel Jurgens 	mpi->ibdev = NULL;
585632f69e4bSDaniel Jurgens 
585732f69e4bSDaniel Jurgens 	spin_unlock(&port->mp.mpi_lock);
585823eaf3b5SLeon Romanovsky 	if (mpi->mdev_events.notifier_call)
585923eaf3b5SLeon Romanovsky 		mlx5_notifier_unregister(mpi->mdev, &mpi->mdev_events);
586023eaf3b5SLeon Romanovsky 	mpi->mdev_events.notifier_call = NULL;
586132f69e4bSDaniel Jurgens 	mlx5_remove_netdev_notifier(ibdev, port_num);
586232f69e4bSDaniel Jurgens 	spin_lock(&port->mp.mpi_lock);
586332f69e4bSDaniel Jurgens 
586432f69e4bSDaniel Jurgens 	comps = mpi->mdev_refcnt;
586532f69e4bSDaniel Jurgens 	if (comps) {
586632f69e4bSDaniel Jurgens 		mpi->unaffiliate = true;
586732f69e4bSDaniel Jurgens 		init_completion(&mpi->unref_comp);
586832f69e4bSDaniel Jurgens 		spin_unlock(&port->mp.mpi_lock);
586932f69e4bSDaniel Jurgens 
587032f69e4bSDaniel Jurgens 		for (i = 0; i < comps; i++)
587132f69e4bSDaniel Jurgens 			wait_for_completion(&mpi->unref_comp);
587232f69e4bSDaniel Jurgens 
587332f69e4bSDaniel Jurgens 		spin_lock(&port->mp.mpi_lock);
587432f69e4bSDaniel Jurgens 		mpi->unaffiliate = false;
587532f69e4bSDaniel Jurgens 	}
587632f69e4bSDaniel Jurgens 
587732f69e4bSDaniel Jurgens 	port->mp.mpi = NULL;
587832f69e4bSDaniel Jurgens 
587932f69e4bSDaniel Jurgens 	list_add_tail(&mpi->list, &mlx5_ib_unaffiliated_port_list);
588032f69e4bSDaniel Jurgens 
588132f69e4bSDaniel Jurgens 	spin_unlock(&port->mp.mpi_lock);
588232f69e4bSDaniel Jurgens 
588332f69e4bSDaniel Jurgens 	err = mlx5_nic_vport_unaffiliate_multiport(mpi->mdev);
588432f69e4bSDaniel Jurgens 
588532f69e4bSDaniel Jurgens 	mlx5_ib_dbg(ibdev, "unaffiliated port %d\n", port_num + 1);
588632f69e4bSDaniel Jurgens 	/* Log an error, still needed to cleanup the pointers and add
588732f69e4bSDaniel Jurgens 	 * it back to the list.
588832f69e4bSDaniel Jurgens 	 */
588932f69e4bSDaniel Jurgens 	if (err)
589032f69e4bSDaniel Jurgens 		mlx5_ib_err(ibdev, "Failed to unaffiliate port %u\n",
589132f69e4bSDaniel Jurgens 			    port_num + 1);
589232f69e4bSDaniel Jurgens 
589395579e78SMark Bloch 	ibdev->port[port_num].roce.last_port_state = IB_PORT_DOWN;
589432f69e4bSDaniel Jurgens }
589532f69e4bSDaniel Jurgens 
589632f69e4bSDaniel Jurgens static bool mlx5_ib_bind_slave_port(struct mlx5_ib_dev *ibdev,
589732f69e4bSDaniel Jurgens 				    struct mlx5_ib_multiport_info *mpi)
589832f69e4bSDaniel Jurgens {
589932f69e4bSDaniel Jurgens 	u8 port_num = mlx5_core_native_port_num(mpi->mdev) - 1;
590032f69e4bSDaniel Jurgens 	int err;
590132f69e4bSDaniel Jurgens 
59029dc4cfffSLeon Romanovsky 	lockdep_assert_held(&mlx5_ib_multiport_mutex);
59039dc4cfffSLeon Romanovsky 
590432f69e4bSDaniel Jurgens 	spin_lock(&ibdev->port[port_num].mp.mpi_lock);
590532f69e4bSDaniel Jurgens 	if (ibdev->port[port_num].mp.mpi) {
59062577188eSQing Huang 		mlx5_ib_dbg(ibdev, "port %d already affiliated.\n",
590732f69e4bSDaniel Jurgens 			    port_num + 1);
590832f69e4bSDaniel Jurgens 		spin_unlock(&ibdev->port[port_num].mp.mpi_lock);
590932f69e4bSDaniel Jurgens 		return false;
591032f69e4bSDaniel Jurgens 	}
591132f69e4bSDaniel Jurgens 
591232f69e4bSDaniel Jurgens 	ibdev->port[port_num].mp.mpi = mpi;
591332f69e4bSDaniel Jurgens 	mpi->ibdev = ibdev;
5914df097a27SSaeed Mahameed 	mpi->mdev_events.notifier_call = NULL;
591532f69e4bSDaniel Jurgens 	spin_unlock(&ibdev->port[port_num].mp.mpi_lock);
591632f69e4bSDaniel Jurgens 
591732f69e4bSDaniel Jurgens 	err = mlx5_nic_vport_affiliate_multiport(ibdev->mdev, mpi->mdev);
591832f69e4bSDaniel Jurgens 	if (err)
591932f69e4bSDaniel Jurgens 		goto unbind;
592032f69e4bSDaniel Jurgens 
592132f69e4bSDaniel Jurgens 	err = get_port_caps(ibdev, mlx5_core_native_port_num(mpi->mdev));
592232f69e4bSDaniel Jurgens 	if (err)
592332f69e4bSDaniel Jurgens 		goto unbind;
592432f69e4bSDaniel Jurgens 
592532f69e4bSDaniel Jurgens 	err = mlx5_add_netdev_notifier(ibdev, port_num);
592632f69e4bSDaniel Jurgens 	if (err) {
592732f69e4bSDaniel Jurgens 		mlx5_ib_err(ibdev, "failed adding netdev notifier for port %u\n",
592832f69e4bSDaniel Jurgens 			    port_num + 1);
592932f69e4bSDaniel Jurgens 		goto unbind;
593032f69e4bSDaniel Jurgens 	}
593132f69e4bSDaniel Jurgens 
5932df097a27SSaeed Mahameed 	mpi->mdev_events.notifier_call = mlx5_ib_event_slave_port;
5933df097a27SSaeed Mahameed 	mlx5_notifier_register(mpi->mdev, &mpi->mdev_events);
5934df097a27SSaeed Mahameed 
593573eb8f03SGreg Kroah-Hartman 	mlx5_ib_init_cong_debugfs(ibdev, port_num);
5936a9e546e7SParav Pandit 
593732f69e4bSDaniel Jurgens 	return true;
593832f69e4bSDaniel Jurgens 
593932f69e4bSDaniel Jurgens unbind:
594032f69e4bSDaniel Jurgens 	mlx5_ib_unbind_slave_port(ibdev, mpi);
594132f69e4bSDaniel Jurgens 	return false;
594232f69e4bSDaniel Jurgens }
594332f69e4bSDaniel Jurgens 
594432f69e4bSDaniel Jurgens static int mlx5_ib_init_multiport_master(struct mlx5_ib_dev *dev)
594532f69e4bSDaniel Jurgens {
594632f69e4bSDaniel Jurgens 	int port_num = mlx5_core_native_port_num(dev->mdev) - 1;
594732f69e4bSDaniel Jurgens 	enum rdma_link_layer ll = mlx5_ib_port_link_layer(&dev->ib_dev,
594832f69e4bSDaniel Jurgens 							  port_num + 1);
594932f69e4bSDaniel Jurgens 	struct mlx5_ib_multiport_info *mpi;
595032f69e4bSDaniel Jurgens 	int err;
595132f69e4bSDaniel Jurgens 	int i;
595232f69e4bSDaniel Jurgens 
595332f69e4bSDaniel Jurgens 	if (!mlx5_core_is_mp_master(dev->mdev) || ll != IB_LINK_LAYER_ETHERNET)
595432f69e4bSDaniel Jurgens 		return 0;
595532f69e4bSDaniel Jurgens 
595632f69e4bSDaniel Jurgens 	err = mlx5_query_nic_vport_system_image_guid(dev->mdev,
595732f69e4bSDaniel Jurgens 						     &dev->sys_image_guid);
595832f69e4bSDaniel Jurgens 	if (err)
595932f69e4bSDaniel Jurgens 		return err;
596032f69e4bSDaniel Jurgens 
596132f69e4bSDaniel Jurgens 	err = mlx5_nic_vport_enable_roce(dev->mdev);
596232f69e4bSDaniel Jurgens 	if (err)
596332f69e4bSDaniel Jurgens 		return err;
596432f69e4bSDaniel Jurgens 
596532f69e4bSDaniel Jurgens 	mutex_lock(&mlx5_ib_multiport_mutex);
596632f69e4bSDaniel Jurgens 	for (i = 0; i < dev->num_ports; i++) {
596732f69e4bSDaniel Jurgens 		bool bound = false;
596832f69e4bSDaniel Jurgens 
596932f69e4bSDaniel Jurgens 		/* build a stub multiport info struct for the native port. */
597032f69e4bSDaniel Jurgens 		if (i == port_num) {
597132f69e4bSDaniel Jurgens 			mpi = kzalloc(sizeof(*mpi), GFP_KERNEL);
597232f69e4bSDaniel Jurgens 			if (!mpi) {
597332f69e4bSDaniel Jurgens 				mutex_unlock(&mlx5_ib_multiport_mutex);
597432f69e4bSDaniel Jurgens 				mlx5_nic_vport_disable_roce(dev->mdev);
597532f69e4bSDaniel Jurgens 				return -ENOMEM;
597632f69e4bSDaniel Jurgens 			}
597732f69e4bSDaniel Jurgens 
597832f69e4bSDaniel Jurgens 			mpi->is_master = true;
597932f69e4bSDaniel Jurgens 			mpi->mdev = dev->mdev;
598032f69e4bSDaniel Jurgens 			mpi->sys_image_guid = dev->sys_image_guid;
598132f69e4bSDaniel Jurgens 			dev->port[i].mp.mpi = mpi;
598232f69e4bSDaniel Jurgens 			mpi->ibdev = dev;
598332f69e4bSDaniel Jurgens 			mpi = NULL;
598432f69e4bSDaniel Jurgens 			continue;
598532f69e4bSDaniel Jurgens 		}
598632f69e4bSDaniel Jurgens 
598732f69e4bSDaniel Jurgens 		list_for_each_entry(mpi, &mlx5_ib_unaffiliated_port_list,
598832f69e4bSDaniel Jurgens 				    list) {
598932f69e4bSDaniel Jurgens 			if (dev->sys_image_guid == mpi->sys_image_guid &&
599032f69e4bSDaniel Jurgens 			    (mlx5_core_native_port_num(mpi->mdev) - 1) == i) {
599132f69e4bSDaniel Jurgens 				bound = mlx5_ib_bind_slave_port(dev, mpi);
599232f69e4bSDaniel Jurgens 			}
599332f69e4bSDaniel Jurgens 
599432f69e4bSDaniel Jurgens 			if (bound) {
5995c42260f1SVu Pham 				dev_dbg(mpi->mdev->device,
5996c42260f1SVu Pham 					"removing port from unaffiliated list.\n");
599732f69e4bSDaniel Jurgens 				mlx5_ib_dbg(dev, "port %d bound\n", i + 1);
599832f69e4bSDaniel Jurgens 				list_del(&mpi->list);
599932f69e4bSDaniel Jurgens 				break;
600032f69e4bSDaniel Jurgens 			}
600132f69e4bSDaniel Jurgens 		}
600232f69e4bSDaniel Jurgens 		if (!bound) {
600332f69e4bSDaniel Jurgens 			get_port_caps(dev, i + 1);
600432f69e4bSDaniel Jurgens 			mlx5_ib_dbg(dev, "no free port found for port %d\n",
600532f69e4bSDaniel Jurgens 				    i + 1);
600632f69e4bSDaniel Jurgens 		}
600732f69e4bSDaniel Jurgens 	}
600832f69e4bSDaniel Jurgens 
600932f69e4bSDaniel Jurgens 	list_add_tail(&dev->ib_dev_list, &mlx5_ib_dev_list);
601032f69e4bSDaniel Jurgens 	mutex_unlock(&mlx5_ib_multiport_mutex);
601132f69e4bSDaniel Jurgens 	return err;
601232f69e4bSDaniel Jurgens }
601332f69e4bSDaniel Jurgens 
601432f69e4bSDaniel Jurgens static void mlx5_ib_cleanup_multiport_master(struct mlx5_ib_dev *dev)
601532f69e4bSDaniel Jurgens {
601632f69e4bSDaniel Jurgens 	int port_num = mlx5_core_native_port_num(dev->mdev) - 1;
601732f69e4bSDaniel Jurgens 	enum rdma_link_layer ll = mlx5_ib_port_link_layer(&dev->ib_dev,
601832f69e4bSDaniel Jurgens 							  port_num + 1);
601932f69e4bSDaniel Jurgens 	int i;
602032f69e4bSDaniel Jurgens 
602132f69e4bSDaniel Jurgens 	if (!mlx5_core_is_mp_master(dev->mdev) || ll != IB_LINK_LAYER_ETHERNET)
602232f69e4bSDaniel Jurgens 		return;
602332f69e4bSDaniel Jurgens 
602432f69e4bSDaniel Jurgens 	mutex_lock(&mlx5_ib_multiport_mutex);
602532f69e4bSDaniel Jurgens 	for (i = 0; i < dev->num_ports; i++) {
602632f69e4bSDaniel Jurgens 		if (dev->port[i].mp.mpi) {
602732f69e4bSDaniel Jurgens 			/* Destroy the native port stub */
602832f69e4bSDaniel Jurgens 			if (i == port_num) {
602932f69e4bSDaniel Jurgens 				kfree(dev->port[i].mp.mpi);
603032f69e4bSDaniel Jurgens 				dev->port[i].mp.mpi = NULL;
603132f69e4bSDaniel Jurgens 			} else {
603232f69e4bSDaniel Jurgens 				mlx5_ib_dbg(dev, "unbinding port_num: %d\n", i + 1);
603332f69e4bSDaniel Jurgens 				mlx5_ib_unbind_slave_port(dev, dev->port[i].mp.mpi);
603432f69e4bSDaniel Jurgens 			}
603532f69e4bSDaniel Jurgens 		}
603632f69e4bSDaniel Jurgens 	}
603732f69e4bSDaniel Jurgens 
603832f69e4bSDaniel Jurgens 	mlx5_ib_dbg(dev, "removing from devlist\n");
603932f69e4bSDaniel Jurgens 	list_del(&dev->ib_dev_list);
604032f69e4bSDaniel Jurgens 	mutex_unlock(&mlx5_ib_multiport_mutex);
604132f69e4bSDaniel Jurgens 
604232f69e4bSDaniel Jurgens 	mlx5_nic_vport_disable_roce(dev->mdev);
604332f69e4bSDaniel Jurgens }
604432f69e4bSDaniel Jurgens 
60459a119cd5SJason Gunthorpe ADD_UVERBS_ATTRIBUTES_SIMPLE(
60469a119cd5SJason Gunthorpe 	mlx5_ib_dm,
60479a119cd5SJason Gunthorpe 	UVERBS_OBJECT_DM,
604824da0016SAriel Levkovich 	UVERBS_METHOD_DM_ALLOC,
60499a119cd5SJason Gunthorpe 	UVERBS_ATTR_PTR_OUT(MLX5_IB_ATTR_ALLOC_DM_RESP_START_OFFSET,
605024da0016SAriel Levkovich 			    UVERBS_ATTR_TYPE(u64),
605183bb4442SJason Gunthorpe 			    UA_MANDATORY),
60529a119cd5SJason Gunthorpe 	UVERBS_ATTR_PTR_OUT(MLX5_IB_ATTR_ALLOC_DM_RESP_PAGE_INDEX,
605324da0016SAriel Levkovich 			    UVERBS_ATTR_TYPE(u16),
60543b113a1eSAriel Levkovich 			    UA_OPTIONAL),
60553b113a1eSAriel Levkovich 	UVERBS_ATTR_CONST_IN(MLX5_IB_ATTR_ALLOC_DM_REQ_TYPE,
60563b113a1eSAriel Levkovich 			     enum mlx5_ib_uapi_dm_type,
60573b113a1eSAriel Levkovich 			     UA_OPTIONAL));
605824da0016SAriel Levkovich 
60599a119cd5SJason Gunthorpe ADD_UVERBS_ATTRIBUTES_SIMPLE(
60609a119cd5SJason Gunthorpe 	mlx5_ib_flow_action,
60619a119cd5SJason Gunthorpe 	UVERBS_OBJECT_FLOW_ACTION,
6062c6475a0bSAviad Yehezkel 	UVERBS_METHOD_FLOW_ACTION_ESP_CREATE,
6063bccd0622SJason Gunthorpe 	UVERBS_ATTR_FLAGS_IN(MLX5_IB_ATTR_CREATE_FLOW_ACTION_FLAGS,
6064bccd0622SJason Gunthorpe 			     enum mlx5_ib_uapi_flow_action_flags));
6065c6475a0bSAviad Yehezkel 
60660cbf432dSJason Gunthorpe static const struct uapi_definition mlx5_ib_defs[] = {
60670cbf432dSJason Gunthorpe #if IS_ENABLED(CONFIG_INFINIBAND_USER_ACCESS)
606836e235c8SJason Gunthorpe 	UAPI_DEF_CHAIN(mlx5_ib_devx_defs),
60690cbf432dSJason Gunthorpe 	UAPI_DEF_CHAIN(mlx5_ib_flow_defs),
60700cbf432dSJason Gunthorpe #endif
60718c84660bSMatan Barak 
60720cbf432dSJason Gunthorpe 	UAPI_DEF_CHAIN_OBJ_TREE(UVERBS_OBJECT_FLOW_ACTION,
60730cbf432dSJason Gunthorpe 				&mlx5_ib_flow_action),
60740cbf432dSJason Gunthorpe 	UAPI_DEF_CHAIN_OBJ_TREE(UVERBS_OBJECT_DM, &mlx5_ib_dm),
60750cbf432dSJason Gunthorpe 	{}
60760cbf432dSJason Gunthorpe };
60778c84660bSMatan Barak 
60781a1e03dcSRaed Salem static int mlx5_ib_read_counters(struct ib_counters *counters,
60791a1e03dcSRaed Salem 				 struct ib_counters_read_attr *read_attr,
60801a1e03dcSRaed Salem 				 struct uverbs_attr_bundle *attrs)
60811a1e03dcSRaed Salem {
60821a1e03dcSRaed Salem 	struct mlx5_ib_mcounters *mcounters = to_mcounters(counters);
60831a1e03dcSRaed Salem 	struct mlx5_read_counters_attr mread_attr = {};
60841a1e03dcSRaed Salem 	struct mlx5_ib_flow_counters_desc *desc;
60851a1e03dcSRaed Salem 	int ret, i;
60861a1e03dcSRaed Salem 
60871a1e03dcSRaed Salem 	mutex_lock(&mcounters->mcntrs_mutex);
60881a1e03dcSRaed Salem 	if (mcounters->cntrs_max_index > read_attr->ncounters) {
60891a1e03dcSRaed Salem 		ret = -EINVAL;
60901a1e03dcSRaed Salem 		goto err_bound;
60911a1e03dcSRaed Salem 	}
60921a1e03dcSRaed Salem 
60931a1e03dcSRaed Salem 	mread_attr.out = kcalloc(mcounters->counters_num, sizeof(u64),
60941a1e03dcSRaed Salem 				 GFP_KERNEL);
60951a1e03dcSRaed Salem 	if (!mread_attr.out) {
60961a1e03dcSRaed Salem 		ret = -ENOMEM;
60971a1e03dcSRaed Salem 		goto err_bound;
60981a1e03dcSRaed Salem 	}
60991a1e03dcSRaed Salem 
61001a1e03dcSRaed Salem 	mread_attr.hw_cntrs_hndl = mcounters->hw_cntrs_hndl;
61011a1e03dcSRaed Salem 	mread_attr.flags = read_attr->flags;
61021a1e03dcSRaed Salem 	ret = mcounters->read_counters(counters->device, &mread_attr);
61031a1e03dcSRaed Salem 	if (ret)
61041a1e03dcSRaed Salem 		goto err_read;
61051a1e03dcSRaed Salem 
61061a1e03dcSRaed Salem 	/* do the pass over the counters data array to assign according to the
61071a1e03dcSRaed Salem 	 * descriptions and indexing pairs
61081a1e03dcSRaed Salem 	 */
61091a1e03dcSRaed Salem 	desc = mcounters->counters_data;
61101a1e03dcSRaed Salem 	for (i = 0; i < mcounters->ncounters; i++)
61111a1e03dcSRaed Salem 		read_attr->counters_buff[desc[i].index] += mread_attr.out[desc[i].description];
61121a1e03dcSRaed Salem 
61131a1e03dcSRaed Salem err_read:
61141a1e03dcSRaed Salem 	kfree(mread_attr.out);
61151a1e03dcSRaed Salem err_bound:
61161a1e03dcSRaed Salem 	mutex_unlock(&mcounters->mcntrs_mutex);
61171a1e03dcSRaed Salem 	return ret;
61181a1e03dcSRaed Salem }
61191a1e03dcSRaed Salem 
6120b29e2a13SRaed Salem static int mlx5_ib_destroy_counters(struct ib_counters *counters)
6121b29e2a13SRaed Salem {
6122b29e2a13SRaed Salem 	struct mlx5_ib_mcounters *mcounters = to_mcounters(counters);
6123b29e2a13SRaed Salem 
61243b3233fbSRaed Salem 	counters_clear_description(counters);
61253b3233fbSRaed Salem 	if (mcounters->hw_cntrs_hndl)
61263b3233fbSRaed Salem 		mlx5_fc_destroy(to_mdev(counters->device)->mdev,
61273b3233fbSRaed Salem 				mcounters->hw_cntrs_hndl);
61283b3233fbSRaed Salem 
6129b29e2a13SRaed Salem 	kfree(mcounters);
6130b29e2a13SRaed Salem 
6131b29e2a13SRaed Salem 	return 0;
6132b29e2a13SRaed Salem }
6133b29e2a13SRaed Salem 
6134b29e2a13SRaed Salem static struct ib_counters *mlx5_ib_create_counters(struct ib_device *device,
6135b29e2a13SRaed Salem 						   struct uverbs_attr_bundle *attrs)
6136b29e2a13SRaed Salem {
6137b29e2a13SRaed Salem 	struct mlx5_ib_mcounters *mcounters;
6138b29e2a13SRaed Salem 
6139b29e2a13SRaed Salem 	mcounters = kzalloc(sizeof(*mcounters), GFP_KERNEL);
6140b29e2a13SRaed Salem 	if (!mcounters)
6141b29e2a13SRaed Salem 		return ERR_PTR(-ENOMEM);
6142b29e2a13SRaed Salem 
61433b3233fbSRaed Salem 	mutex_init(&mcounters->mcntrs_mutex);
61443b3233fbSRaed Salem 
6145b29e2a13SRaed Salem 	return &mcounters->ibcntrs;
6146b29e2a13SRaed Salem }
6147b29e2a13SRaed Salem 
6148fb652d32SMark Bloch static void mlx5_ib_stage_init_cleanup(struct mlx5_ib_dev *dev)
6149e126ba97SEli Cohen {
615032f69e4bSDaniel Jurgens 	mlx5_ib_cleanup_multiport_master(dev);
615113859d5dSLeon Romanovsky 	if (IS_ENABLED(CONFIG_INFINIBAND_ON_DEMAND_PAGING)) {
6152534fd7aaSYishai Hadas 		srcu_barrier(&dev->mr_srcu);
61533cc297dbSMark Bloch 		cleanup_srcu_struct(&dev->mr_srcu);
615413859d5dSLeon Romanovsky 	}
61554056b12eSAriel Levkovich 
61564056b12eSAriel Levkovich 	WARN_ON(!bitmap_empty(dev->dm.memic_alloc_pages, MLX5_MAX_MEMIC_PAGES));
615716c1975fSMark Bloch }
615816c1975fSMark Bloch 
6159fb652d32SMark Bloch static int mlx5_ib_stage_init_init(struct mlx5_ib_dev *dev)
616016c1975fSMark Bloch {
616116c1975fSMark Bloch 	struct mlx5_core_dev *mdev = dev->mdev;
6162e126ba97SEli Cohen 	int err;
616332f69e4bSDaniel Jurgens 	int i;
6164e126ba97SEli Cohen 
616532f69e4bSDaniel Jurgens 	for (i = 0; i < dev->num_ports; i++) {
616632f69e4bSDaniel Jurgens 		spin_lock_init(&dev->port[i].mp.mpi_lock);
616795579e78SMark Bloch 		rwlock_init(&dev->port[i].roce.netdev_lock);
6168d3b5cc1cSMark Bloch 		dev->port[i].roce.dev = dev;
6169d3b5cc1cSMark Bloch 		dev->port[i].roce.native_port_num = i + 1;
6170d3b5cc1cSMark Bloch 		dev->port[i].roce.last_port_state = IB_PORT_DOWN;
617132f69e4bSDaniel Jurgens 	}
617232f69e4bSDaniel Jurgens 
617300815752SMoni Shoua 	mlx5_ib_internal_fill_odp_caps(dev);
617400815752SMoni Shoua 
617532f69e4bSDaniel Jurgens 	err = mlx5_ib_init_multiport_master(dev);
6176e126ba97SEli Cohen 	if (err)
6177da796ccbSMark Bloch 		return err;
6178e126ba97SEli Cohen 
6179a989ea01SMark Bloch 	err = set_has_smi_cap(dev);
6180a989ea01SMark Bloch 	if (err)
6181a989ea01SMark Bloch 		return err;
6182e126ba97SEli Cohen 
618332f69e4bSDaniel Jurgens 	if (!mlx5_core_mp_enabled(mdev)) {
618432f69e4bSDaniel Jurgens 		for (i = 1; i <= dev->num_ports; i++) {
618532f69e4bSDaniel Jurgens 			err = get_port_caps(dev, i);
618632f69e4bSDaniel Jurgens 			if (err)
618732f69e4bSDaniel Jurgens 				break;
618832f69e4bSDaniel Jurgens 		}
618932f69e4bSDaniel Jurgens 	} else {
619032f69e4bSDaniel Jurgens 		err = get_port_caps(dev, mlx5_core_native_port_num(mdev));
619132f69e4bSDaniel Jurgens 	}
619232f69e4bSDaniel Jurgens 	if (err)
619332f69e4bSDaniel Jurgens 		goto err_mp;
619432f69e4bSDaniel Jurgens 
61951b5daf11SMajd Dibbiny 	if (mlx5_use_mad_ifc(dev))
6196e126ba97SEli Cohen 		get_ext_port_caps(dev);
6197e126ba97SEli Cohen 
6198e126ba97SEli Cohen 	dev->ib_dev.node_type		= RDMA_NODE_IB_CA;
6199c6790aa9SSagi Grimberg 	dev->ib_dev.local_dma_lkey	= 0 /* not supported for now */;
6200e126ba97SEli Cohen 	dev->ib_dev.phys_port_cnt	= dev->num_ports;
6201f2f3df55SSaeed Mahameed 	dev->ib_dev.num_comp_vectors    = mlx5_comp_vectors_count(mdev);
6202c42260f1SVu Pham 	dev->ib_dev.dev.parent		= mdev->device;
6203e126ba97SEli Cohen 
62043cc297dbSMark Bloch 	mutex_init(&dev->cap_mask_mutex);
62053cc297dbSMark Bloch 	INIT_LIST_HEAD(&dev->qp_list);
62063cc297dbSMark Bloch 	spin_lock_init(&dev->reset_flow_resource_lock);
62073cc297dbSMark Bloch 
62083b113a1eSAriel Levkovich 	spin_lock_init(&dev->dm.lock);
62093b113a1eSAriel Levkovich 	dev->dm.dev = mdev;
621024da0016SAriel Levkovich 
621113859d5dSLeon Romanovsky 	if (IS_ENABLED(CONFIG_INFINIBAND_ON_DEMAND_PAGING)) {
62123cc297dbSMark Bloch 		err = init_srcu_struct(&dev->mr_srcu);
6213a6bc3875SMoni Shoua 		if (err)
6214c9b9dcb4SAriel Levkovich 			goto err_mp;
6215623d1543SJason Gunthorpe 	}
62163cc297dbSMark Bloch 
621716c1975fSMark Bloch 	return 0;
621825c13324SAriel Levkovich 
621932f69e4bSDaniel Jurgens err_mp:
622032f69e4bSDaniel Jurgens 	mlx5_ib_cleanup_multiport_master(dev);
622116c1975fSMark Bloch 
622216c1975fSMark Bloch 	return -ENOMEM;
622316c1975fSMark Bloch }
622416c1975fSMark Bloch 
62259a4ca38dSMark Bloch static int mlx5_ib_stage_flow_db_init(struct mlx5_ib_dev *dev)
62269a4ca38dSMark Bloch {
62279a4ca38dSMark Bloch 	dev->flow_db = kzalloc(sizeof(*dev->flow_db), GFP_KERNEL);
62289a4ca38dSMark Bloch 
62299a4ca38dSMark Bloch 	if (!dev->flow_db)
62309a4ca38dSMark Bloch 		return -ENOMEM;
62319a4ca38dSMark Bloch 
62329a4ca38dSMark Bloch 	mutex_init(&dev->flow_db->lock);
62339a4ca38dSMark Bloch 
62349a4ca38dSMark Bloch 	return 0;
62359a4ca38dSMark Bloch }
62369a4ca38dSMark Bloch 
62379a4ca38dSMark Bloch static void mlx5_ib_stage_flow_db_cleanup(struct mlx5_ib_dev *dev)
62389a4ca38dSMark Bloch {
62399a4ca38dSMark Bloch 	kfree(dev->flow_db);
62409a4ca38dSMark Bloch }
62419a4ca38dSMark Bloch 
624296458233SKamal Heib static const struct ib_device_ops mlx5_ib_dev_ops = {
62437a154142SJason Gunthorpe 	.owner = THIS_MODULE,
6244b9560a41SJason Gunthorpe 	.driver_id = RDMA_DRIVER_MLX5,
624572c6ec18SJason Gunthorpe 	.uverbs_abi_ver	= MLX5_IB_UVERBS_ABI_VERSION,
6246b9560a41SJason Gunthorpe 
624796458233SKamal Heib 	.add_gid = mlx5_ib_add_gid,
624896458233SKamal Heib 	.alloc_mr = mlx5_ib_alloc_mr,
62496c984472SMax Gurtovoy 	.alloc_mr_integrity = mlx5_ib_alloc_mr_integrity,
625096458233SKamal Heib 	.alloc_pd = mlx5_ib_alloc_pd,
625196458233SKamal Heib 	.alloc_ucontext = mlx5_ib_alloc_ucontext,
625296458233SKamal Heib 	.attach_mcast = mlx5_ib_mcg_attach,
625396458233SKamal Heib 	.check_mr_status = mlx5_ib_check_mr_status,
625496458233SKamal Heib 	.create_ah = mlx5_ib_create_ah,
625596458233SKamal Heib 	.create_counters = mlx5_ib_create_counters,
625696458233SKamal Heib 	.create_cq = mlx5_ib_create_cq,
625796458233SKamal Heib 	.create_flow = mlx5_ib_create_flow,
625896458233SKamal Heib 	.create_qp = mlx5_ib_create_qp,
625996458233SKamal Heib 	.create_srq = mlx5_ib_create_srq,
626096458233SKamal Heib 	.dealloc_pd = mlx5_ib_dealloc_pd,
626196458233SKamal Heib 	.dealloc_ucontext = mlx5_ib_dealloc_ucontext,
626296458233SKamal Heib 	.del_gid = mlx5_ib_del_gid,
626396458233SKamal Heib 	.dereg_mr = mlx5_ib_dereg_mr,
626496458233SKamal Heib 	.destroy_ah = mlx5_ib_destroy_ah,
626596458233SKamal Heib 	.destroy_counters = mlx5_ib_destroy_counters,
626696458233SKamal Heib 	.destroy_cq = mlx5_ib_destroy_cq,
626796458233SKamal Heib 	.destroy_flow = mlx5_ib_destroy_flow,
626896458233SKamal Heib 	.destroy_flow_action = mlx5_ib_destroy_flow_action,
626996458233SKamal Heib 	.destroy_qp = mlx5_ib_destroy_qp,
627096458233SKamal Heib 	.destroy_srq = mlx5_ib_destroy_srq,
627196458233SKamal Heib 	.detach_mcast = mlx5_ib_mcg_detach,
627296458233SKamal Heib 	.disassociate_ucontext = mlx5_ib_disassociate_ucontext,
627396458233SKamal Heib 	.drain_rq = mlx5_ib_drain_rq,
627496458233SKamal Heib 	.drain_sq = mlx5_ib_drain_sq,
6275e1b95ae0SErez Alfasi 	.fill_res_entry = mlx5_ib_fill_res_entry,
6276*4061ff7aSErez Alfasi 	.fill_stat_entry = mlx5_ib_fill_stat_entry,
627796458233SKamal Heib 	.get_dev_fw_str = get_dev_fw_str,
627896458233SKamal Heib 	.get_dma_mr = mlx5_ib_get_dma_mr,
627996458233SKamal Heib 	.get_link_layer = mlx5_ib_port_link_layer,
628096458233SKamal Heib 	.map_mr_sg = mlx5_ib_map_mr_sg,
62816c984472SMax Gurtovoy 	.map_mr_sg_pi = mlx5_ib_map_mr_sg_pi,
628296458233SKamal Heib 	.mmap = mlx5_ib_mmap,
628396458233SKamal Heib 	.modify_cq = mlx5_ib_modify_cq,
628496458233SKamal Heib 	.modify_device = mlx5_ib_modify_device,
628596458233SKamal Heib 	.modify_port = mlx5_ib_modify_port,
628696458233SKamal Heib 	.modify_qp = mlx5_ib_modify_qp,
628796458233SKamal Heib 	.modify_srq = mlx5_ib_modify_srq,
628896458233SKamal Heib 	.poll_cq = mlx5_ib_poll_cq,
628996458233SKamal Heib 	.post_recv = mlx5_ib_post_recv,
629096458233SKamal Heib 	.post_send = mlx5_ib_post_send,
629196458233SKamal Heib 	.post_srq_recv = mlx5_ib_post_srq_recv,
629296458233SKamal Heib 	.process_mad = mlx5_ib_process_mad,
629396458233SKamal Heib 	.query_ah = mlx5_ib_query_ah,
629496458233SKamal Heib 	.query_device = mlx5_ib_query_device,
629596458233SKamal Heib 	.query_gid = mlx5_ib_query_gid,
629696458233SKamal Heib 	.query_pkey = mlx5_ib_query_pkey,
629796458233SKamal Heib 	.query_qp = mlx5_ib_query_qp,
629896458233SKamal Heib 	.query_srq = mlx5_ib_query_srq,
629996458233SKamal Heib 	.read_counters = mlx5_ib_read_counters,
630096458233SKamal Heib 	.reg_user_mr = mlx5_ib_reg_user_mr,
630196458233SKamal Heib 	.req_notify_cq = mlx5_ib_arm_cq,
630296458233SKamal Heib 	.rereg_user_mr = mlx5_ib_rereg_user_mr,
630396458233SKamal Heib 	.resize_cq = mlx5_ib_resize_cq,
6304d3456914SLeon Romanovsky 
6305d3456914SLeon Romanovsky 	INIT_RDMA_OBJ_SIZE(ib_ah, mlx5_ib_ah, ibah),
6306e39afe3dSLeon Romanovsky 	INIT_RDMA_OBJ_SIZE(ib_cq, mlx5_ib_cq, ibcq),
630721a428a0SLeon Romanovsky 	INIT_RDMA_OBJ_SIZE(ib_pd, mlx5_ib_pd, ibpd),
630868e326deSLeon Romanovsky 	INIT_RDMA_OBJ_SIZE(ib_srq, mlx5_ib_srq, ibsrq),
6309a2a074efSLeon Romanovsky 	INIT_RDMA_OBJ_SIZE(ib_ucontext, mlx5_ib_ucontext, ibucontext),
631096458233SKamal Heib };
631196458233SKamal Heib 
631296458233SKamal Heib static const struct ib_device_ops mlx5_ib_dev_flow_ipsec_ops = {
631396458233SKamal Heib 	.create_flow_action_esp = mlx5_ib_create_flow_action_esp,
631496458233SKamal Heib 	.modify_flow_action_esp = mlx5_ib_modify_flow_action_esp,
631596458233SKamal Heib };
631696458233SKamal Heib 
631796458233SKamal Heib static const struct ib_device_ops mlx5_ib_dev_ipoib_enhanced_ops = {
631896458233SKamal Heib 	.rdma_netdev_get_params = mlx5_ib_rn_get_params,
631996458233SKamal Heib };
632096458233SKamal Heib 
632196458233SKamal Heib static const struct ib_device_ops mlx5_ib_dev_sriov_ops = {
632296458233SKamal Heib 	.get_vf_config = mlx5_ib_get_vf_config,
632396458233SKamal Heib 	.get_vf_stats = mlx5_ib_get_vf_stats,
632496458233SKamal Heib 	.set_vf_guid = mlx5_ib_set_vf_guid,
632596458233SKamal Heib 	.set_vf_link_state = mlx5_ib_set_vf_link_state,
632696458233SKamal Heib };
632796458233SKamal Heib 
632896458233SKamal Heib static const struct ib_device_ops mlx5_ib_dev_mw_ops = {
632996458233SKamal Heib 	.alloc_mw = mlx5_ib_alloc_mw,
633096458233SKamal Heib 	.dealloc_mw = mlx5_ib_dealloc_mw,
633196458233SKamal Heib };
633296458233SKamal Heib 
633396458233SKamal Heib static const struct ib_device_ops mlx5_ib_dev_xrc_ops = {
633496458233SKamal Heib 	.alloc_xrcd = mlx5_ib_alloc_xrcd,
633596458233SKamal Heib 	.dealloc_xrcd = mlx5_ib_dealloc_xrcd,
633696458233SKamal Heib };
633796458233SKamal Heib 
633896458233SKamal Heib static const struct ib_device_ops mlx5_ib_dev_dm_ops = {
633996458233SKamal Heib 	.alloc_dm = mlx5_ib_alloc_dm,
634096458233SKamal Heib 	.dealloc_dm = mlx5_ib_dealloc_dm,
634196458233SKamal Heib 	.reg_dm_mr = mlx5_ib_reg_dm_mr,
634296458233SKamal Heib };
634396458233SKamal Heib 
6344fb652d32SMark Bloch static int mlx5_ib_stage_caps_init(struct mlx5_ib_dev *dev)
634516c1975fSMark Bloch {
634616c1975fSMark Bloch 	struct mlx5_core_dev *mdev = dev->mdev;
634716c1975fSMark Bloch 	int err;
634816c1975fSMark Bloch 
6349e126ba97SEli Cohen 	dev->ib_dev.uverbs_cmd_mask	=
6350e126ba97SEli Cohen 		(1ull << IB_USER_VERBS_CMD_GET_CONTEXT)		|
6351e126ba97SEli Cohen 		(1ull << IB_USER_VERBS_CMD_QUERY_DEVICE)	|
6352e126ba97SEli Cohen 		(1ull << IB_USER_VERBS_CMD_QUERY_PORT)		|
6353e126ba97SEli Cohen 		(1ull << IB_USER_VERBS_CMD_ALLOC_PD)		|
6354e126ba97SEli Cohen 		(1ull << IB_USER_VERBS_CMD_DEALLOC_PD)		|
635541c450fdSMoni Shoua 		(1ull << IB_USER_VERBS_CMD_CREATE_AH)		|
635641c450fdSMoni Shoua 		(1ull << IB_USER_VERBS_CMD_DESTROY_AH)		|
6357e126ba97SEli Cohen 		(1ull << IB_USER_VERBS_CMD_REG_MR)		|
635856e11d62SNoa Osherovich 		(1ull << IB_USER_VERBS_CMD_REREG_MR)		|
6359e126ba97SEli Cohen 		(1ull << IB_USER_VERBS_CMD_DEREG_MR)		|
6360e126ba97SEli Cohen 		(1ull << IB_USER_VERBS_CMD_CREATE_COMP_CHANNEL)	|
6361e126ba97SEli Cohen 		(1ull << IB_USER_VERBS_CMD_CREATE_CQ)		|
6362e126ba97SEli Cohen 		(1ull << IB_USER_VERBS_CMD_RESIZE_CQ)		|
6363e126ba97SEli Cohen 		(1ull << IB_USER_VERBS_CMD_DESTROY_CQ)		|
6364e126ba97SEli Cohen 		(1ull << IB_USER_VERBS_CMD_CREATE_QP)		|
6365e126ba97SEli Cohen 		(1ull << IB_USER_VERBS_CMD_MODIFY_QP)		|
6366e126ba97SEli Cohen 		(1ull << IB_USER_VERBS_CMD_QUERY_QP)		|
6367e126ba97SEli Cohen 		(1ull << IB_USER_VERBS_CMD_DESTROY_QP)		|
6368e126ba97SEli Cohen 		(1ull << IB_USER_VERBS_CMD_ATTACH_MCAST)	|
6369e126ba97SEli Cohen 		(1ull << IB_USER_VERBS_CMD_DETACH_MCAST)	|
6370e126ba97SEli Cohen 		(1ull << IB_USER_VERBS_CMD_CREATE_SRQ)		|
6371e126ba97SEli Cohen 		(1ull << IB_USER_VERBS_CMD_MODIFY_SRQ)		|
6372e126ba97SEli Cohen 		(1ull << IB_USER_VERBS_CMD_QUERY_SRQ)		|
6373e126ba97SEli Cohen 		(1ull << IB_USER_VERBS_CMD_DESTROY_SRQ)		|
6374e126ba97SEli Cohen 		(1ull << IB_USER_VERBS_CMD_CREATE_XSRQ)		|
6375e126ba97SEli Cohen 		(1ull << IB_USER_VERBS_CMD_OPEN_QP);
63761707cb4aSHaggai Eran 	dev->ib_dev.uverbs_ex_cmd_mask =
6377d4584ddfSMatan Barak 		(1ull << IB_USER_VERBS_EX_CMD_QUERY_DEVICE)	|
6378d4584ddfSMatan Barak 		(1ull << IB_USER_VERBS_EX_CMD_CREATE_CQ)	|
63797d29f349SBodong Wang 		(1ull << IB_USER_VERBS_EX_CMD_CREATE_QP)	|
6380b0e9df6dSYonatan Cohen 		(1ull << IB_USER_VERBS_EX_CMD_MODIFY_QP)	|
638196458233SKamal Heib 		(1ull << IB_USER_VERBS_EX_CMD_MODIFY_CQ)	|
638296458233SKamal Heib 		(1ull << IB_USER_VERBS_EX_CMD_CREATE_FLOW)	|
638396458233SKamal Heib 		(1ull << IB_USER_VERBS_EX_CMD_DESTROY_FLOW);
6384e126ba97SEli Cohen 
6385f6a8a19bSDenis Drozdov 	if (MLX5_CAP_GEN(mdev, ipoib_enhanced_offloads) &&
6386f6a8a19bSDenis Drozdov 	    IS_ENABLED(CONFIG_MLX5_CORE_IPOIB))
638796458233SKamal Heib 		ib_set_device_ops(&dev->ib_dev,
638896458233SKamal Heib 				  &mlx5_ib_dev_ipoib_enhanced_ops);
63898e959601SNiranjana Vishwanathapura 
639096458233SKamal Heib 	if (mlx5_core_is_pf(mdev))
639196458233SKamal Heib 		ib_set_device_ops(&dev->ib_dev, &mlx5_ib_dev_sriov_ops);
63927c2344c3SMaor Gottlieb 
63936e8484c5SMax Gurtovoy 	dev->umr_fence = mlx5_get_umr_fence(MLX5_CAP_GEN(mdev, umr_fence));
63946e8484c5SMax Gurtovoy 
6395d2370e0aSMatan Barak 	if (MLX5_CAP_GEN(mdev, imaicl)) {
6396d2370e0aSMatan Barak 		dev->ib_dev.uverbs_cmd_mask |=
6397d2370e0aSMatan Barak 			(1ull << IB_USER_VERBS_CMD_ALLOC_MW)	|
6398d2370e0aSMatan Barak 			(1ull << IB_USER_VERBS_CMD_DEALLOC_MW);
639996458233SKamal Heib 		ib_set_device_ops(&dev->ib_dev, &mlx5_ib_dev_mw_ops);
6400d2370e0aSMatan Barak 	}
6401d2370e0aSMatan Barak 
6402938fe83cSSaeed Mahameed 	if (MLX5_CAP_GEN(mdev, xrc)) {
6403e126ba97SEli Cohen 		dev->ib_dev.uverbs_cmd_mask |=
6404e126ba97SEli Cohen 			(1ull << IB_USER_VERBS_CMD_OPEN_XRCD) |
6405e126ba97SEli Cohen 			(1ull << IB_USER_VERBS_CMD_CLOSE_XRCD);
640696458233SKamal Heib 		ib_set_device_ops(&dev->ib_dev, &mlx5_ib_dev_xrc_ops);
6407e126ba97SEli Cohen 	}
6408e126ba97SEli Cohen 
640925c13324SAriel Levkovich 	if (MLX5_CAP_DEV_MEM(mdev, memic) ||
641025c13324SAriel Levkovich 	    MLX5_CAP_GEN_64(dev->mdev, general_obj_types) &
641125c13324SAriel Levkovich 	    MLX5_GENERAL_OBJ_TYPES_CAP_SW_ICM)
641296458233SKamal Heib 		ib_set_device_ops(&dev->ib_dev, &mlx5_ib_dev_dm_ops);
641324da0016SAriel Levkovich 
6414dfb631a1SJason Gunthorpe 	if (mlx5_accel_ipsec_device_caps(dev->mdev) &
641596458233SKamal Heib 	    MLX5_ACCEL_IPSEC_CAP_DEVICE)
641696458233SKamal Heib 		ib_set_device_ops(&dev->ib_dev, &mlx5_ib_dev_flow_ipsec_ops);
641796458233SKamal Heib 	ib_set_device_ops(&dev->ib_dev, &mlx5_ib_dev_ops);
641881e30880SYishai Hadas 
641936e235c8SJason Gunthorpe 	if (IS_ENABLED(CONFIG_INFINIBAND_USER_ACCESS))
642036e235c8SJason Gunthorpe 		dev->ib_dev.driver_def = mlx5_ib_defs;
642181e30880SYishai Hadas 
6422e126ba97SEli Cohen 	err = init_node_data(dev);
6423e126ba97SEli Cohen 	if (err)
642416c1975fSMark Bloch 		return err;
6425e126ba97SEli Cohen 
6426c8b89924SMark Bloch 	if ((MLX5_CAP_GEN(dev->mdev, port_type) == MLX5_CAP_PORT_TYPE_ETH) &&
6427e7996a9aSJason Gunthorpe 	    (MLX5_CAP_GEN(dev->mdev, disable_local_lb_uc) ||
6428e7996a9aSJason Gunthorpe 	     MLX5_CAP_GEN(dev->mdev, disable_local_lb_mc)))
6429a560f1d9SMark Bloch 		mutex_init(&dev->lb.mutex);
6430c8b89924SMark Bloch 
643196e2fd73SLeon Romanovsky 	dev->ib_dev.use_cq_dim = true;
643296e2fd73SLeon Romanovsky 
643316c1975fSMark Bloch 	return 0;
643416c1975fSMark Bloch }
643516c1975fSMark Bloch 
643696458233SKamal Heib static const struct ib_device_ops mlx5_ib_dev_port_ops = {
643796458233SKamal Heib 	.get_port_immutable = mlx5_port_immutable,
643896458233SKamal Heib 	.query_port = mlx5_ib_query_port,
643996458233SKamal Heib };
644096458233SKamal Heib 
64418e6efa3aSMark Bloch static int mlx5_ib_stage_non_default_cb(struct mlx5_ib_dev *dev)
644216c1975fSMark Bloch {
644396458233SKamal Heib 	ib_set_device_ops(&dev->ib_dev, &mlx5_ib_dev_port_ops);
64448e6efa3aSMark Bloch 	return 0;
64458e6efa3aSMark Bloch }
64468e6efa3aSMark Bloch 
644796458233SKamal Heib static const struct ib_device_ops mlx5_ib_dev_port_rep_ops = {
644896458233SKamal Heib 	.get_port_immutable = mlx5_port_rep_immutable,
644996458233SKamal Heib 	.query_port = mlx5_ib_rep_query_port,
645096458233SKamal Heib };
645196458233SKamal Heib 
6452fb652d32SMark Bloch static int mlx5_ib_stage_rep_non_default_cb(struct mlx5_ib_dev *dev)
64538e6efa3aSMark Bloch {
645496458233SKamal Heib 	ib_set_device_ops(&dev->ib_dev, &mlx5_ib_dev_port_rep_ops);
64558e6efa3aSMark Bloch 	return 0;
64568e6efa3aSMark Bloch }
64578e6efa3aSMark Bloch 
645896458233SKamal Heib static const struct ib_device_ops mlx5_ib_dev_common_roce_ops = {
645996458233SKamal Heib 	.create_rwq_ind_table = mlx5_ib_create_rwq_ind_table,
646096458233SKamal Heib 	.create_wq = mlx5_ib_create_wq,
646196458233SKamal Heib 	.destroy_rwq_ind_table = mlx5_ib_destroy_rwq_ind_table,
646296458233SKamal Heib 	.destroy_wq = mlx5_ib_destroy_wq,
646396458233SKamal Heib 	.get_netdev = mlx5_ib_get_netdev,
646496458233SKamal Heib 	.modify_wq = mlx5_ib_modify_wq,
646596458233SKamal Heib };
646696458233SKamal Heib 
6467e3f1ed1fSLeon Romanovsky static int mlx5_ib_stage_common_roce_init(struct mlx5_ib_dev *dev)
64688e6efa3aSMark Bloch {
6469e3f1ed1fSLeon Romanovsky 	u8 port_num;
64707fd8aefbSDaniel Jurgens 
6471c11a226aSMark Bloch 	dev->ib_dev.uverbs_ex_cmd_mask |=
6472c11a226aSMark Bloch 			(1ull << IB_USER_VERBS_EX_CMD_CREATE_WQ) |
6473c11a226aSMark Bloch 			(1ull << IB_USER_VERBS_EX_CMD_MODIFY_WQ) |
6474c11a226aSMark Bloch 			(1ull << IB_USER_VERBS_EX_CMD_DESTROY_WQ) |
6475c11a226aSMark Bloch 			(1ull << IB_USER_VERBS_EX_CMD_CREATE_RWQ_IND_TBL) |
6476c11a226aSMark Bloch 			(1ull << IB_USER_VERBS_EX_CMD_DESTROY_RWQ_IND_TBL);
647796458233SKamal Heib 	ib_set_device_ops(&dev->ib_dev, &mlx5_ib_dev_common_roce_ops);
64788e6efa3aSMark Bloch 
6479e3f1ed1fSLeon Romanovsky 	port_num = mlx5_core_native_port_num(dev->mdev) - 1;
6480e3f1ed1fSLeon Romanovsky 
648126628e2dSMark Bloch 	/* Register only for native ports */
64828e6efa3aSMark Bloch 	return mlx5_add_netdev_notifier(dev, port_num);
64838e6efa3aSMark Bloch }
64848e6efa3aSMark Bloch 
64858e6efa3aSMark Bloch static void mlx5_ib_stage_common_roce_cleanup(struct mlx5_ib_dev *dev)
64868e6efa3aSMark Bloch {
64878e6efa3aSMark Bloch 	u8 port_num = mlx5_core_native_port_num(dev->mdev) - 1;
64888e6efa3aSMark Bloch 
64898e6efa3aSMark Bloch 	mlx5_remove_netdev_notifier(dev, port_num);
64908e6efa3aSMark Bloch }
64918e6efa3aSMark Bloch 
6492fb652d32SMark Bloch static int mlx5_ib_stage_rep_roce_init(struct mlx5_ib_dev *dev)
64938e6efa3aSMark Bloch {
64948e6efa3aSMark Bloch 	struct mlx5_core_dev *mdev = dev->mdev;
64958e6efa3aSMark Bloch 	enum rdma_link_layer ll;
64968e6efa3aSMark Bloch 	int port_type_cap;
64978e6efa3aSMark Bloch 	int err = 0;
64988e6efa3aSMark Bloch 
64998e6efa3aSMark Bloch 	port_type_cap = MLX5_CAP_GEN(mdev, port_type);
65008e6efa3aSMark Bloch 	ll = mlx5_port_type_cap_to_rdma_ll(port_type_cap);
65018e6efa3aSMark Bloch 
65028e6efa3aSMark Bloch 	if (ll == IB_LINK_LAYER_ETHERNET)
6503e3f1ed1fSLeon Romanovsky 		err = mlx5_ib_stage_common_roce_init(dev);
65048e6efa3aSMark Bloch 
650516c1975fSMark Bloch 	return err;
6506fc24fc5eSAchiad Shochat }
6507fc24fc5eSAchiad Shochat 
/*
 * Cleanup of the representor RoCE stage: delegates to the common RoCE
 * cleanup.
 */
static void mlx5_ib_stage_rep_roce_cleanup(struct mlx5_ib_dev *dev)
{
	mlx5_ib_stage_common_roce_cleanup(dev);
}
65128e6efa3aSMark Bloch 
65138e6efa3aSMark Bloch static int mlx5_ib_stage_roce_init(struct mlx5_ib_dev *dev)
65148e6efa3aSMark Bloch {
65158e6efa3aSMark Bloch 	struct mlx5_core_dev *mdev = dev->mdev;
65168e6efa3aSMark Bloch 	enum rdma_link_layer ll;
65178e6efa3aSMark Bloch 	int port_type_cap;
65188e6efa3aSMark Bloch 	int err;
65198e6efa3aSMark Bloch 
65208e6efa3aSMark Bloch 	port_type_cap = MLX5_CAP_GEN(mdev, port_type);
65218e6efa3aSMark Bloch 	ll = mlx5_port_type_cap_to_rdma_ll(port_type_cap);
65228e6efa3aSMark Bloch 
65238e6efa3aSMark Bloch 	if (ll == IB_LINK_LAYER_ETHERNET) {
6524e3f1ed1fSLeon Romanovsky 		err = mlx5_ib_stage_common_roce_init(dev);
65258e6efa3aSMark Bloch 		if (err)
65268e6efa3aSMark Bloch 			return err;
65278e6efa3aSMark Bloch 
6528e3f1ed1fSLeon Romanovsky 		err = mlx5_enable_eth(dev);
65298e6efa3aSMark Bloch 		if (err)
65308e6efa3aSMark Bloch 			goto cleanup;
65318e6efa3aSMark Bloch 	}
65328e6efa3aSMark Bloch 
653316c1975fSMark Bloch 	return 0;
65348e6efa3aSMark Bloch cleanup:
65358e6efa3aSMark Bloch 	mlx5_ib_stage_common_roce_cleanup(dev);
65368e6efa3aSMark Bloch 
65378e6efa3aSMark Bloch 	return err;
653845bded2cSKamal Heib }
65396aec21f6SHaggai Eran 
654016c1975fSMark Bloch static void mlx5_ib_stage_roce_cleanup(struct mlx5_ib_dev *dev)
654116c1975fSMark Bloch {
654216c1975fSMark Bloch 	struct mlx5_core_dev *mdev = dev->mdev;
654316c1975fSMark Bloch 	enum rdma_link_layer ll;
654416c1975fSMark Bloch 	int port_type_cap;
65454a2da0b8SParav Pandit 
654616c1975fSMark Bloch 	port_type_cap = MLX5_CAP_GEN(mdev, port_type);
654716c1975fSMark Bloch 	ll = mlx5_port_type_cap_to_rdma_ll(port_type_cap);
654816c1975fSMark Bloch 
654916c1975fSMark Bloch 	if (ll == IB_LINK_LAYER_ETHERNET) {
655016c1975fSMark Bloch 		mlx5_disable_eth(dev);
65518e6efa3aSMark Bloch 		mlx5_ib_stage_common_roce_cleanup(dev);
655216c1975fSMark Bloch 	}
655316c1975fSMark Bloch }
655416c1975fSMark Bloch 
6555fb652d32SMark Bloch static int mlx5_ib_stage_dev_res_init(struct mlx5_ib_dev *dev)
655616c1975fSMark Bloch {
655716c1975fSMark Bloch 	return create_dev_resources(&dev->devr);
655816c1975fSMark Bloch }
655916c1975fSMark Bloch 
6560fb652d32SMark Bloch static void mlx5_ib_stage_dev_res_cleanup(struct mlx5_ib_dev *dev)
656116c1975fSMark Bloch {
656216c1975fSMark Bloch 	destroy_dev_resources(&dev->devr);
656316c1975fSMark Bloch }
656416c1975fSMark Bloch 
/* ODP stage: returns the result of mlx5_ib_odp_init_one(). */
static int mlx5_ib_stage_odp_init(struct mlx5_ib_dev *dev)
{
	int err = mlx5_ib_odp_init_one(dev);

	return err;
}
656916c1975fSMark Bloch 
/* Cleanup of the ODP stage: delegates to mlx5_ib_odp_cleanup_one(). */
static void mlx5_ib_stage_odp_cleanup(struct mlx5_ib_dev *dev)
{
	mlx5_ib_odp_cleanup_one(dev);
}
6574d5d284b8SSaeed Mahameed 
657596458233SKamal Heib static const struct ib_device_ops mlx5_ib_dev_hw_stats_ops = {
657696458233SKamal Heib 	.alloc_hw_stats = mlx5_ib_alloc_hw_stats,
657796458233SKamal Heib 	.get_hw_stats = mlx5_ib_get_hw_stats,
657845842fc6SMark Zhang 	.counter_bind_qp = mlx5_ib_counter_bind_qp,
657945842fc6SMark Zhang 	.counter_unbind_qp = mlx5_ib_counter_unbind_qp,
658045842fc6SMark Zhang 	.counter_dealloc = mlx5_ib_counter_dealloc,
658118d422ceSMark Zhang 	.counter_alloc_stats = mlx5_ib_counter_alloc_stats,
658218d422ceSMark Zhang 	.counter_update_stats = mlx5_ib_counter_update_stats,
658396458233SKamal Heib };
658496458233SKamal Heib 
6585fb652d32SMark Bloch static int mlx5_ib_stage_counters_init(struct mlx5_ib_dev *dev)
658616c1975fSMark Bloch {
65875e1e7612SMark Bloch 	if (MLX5_CAP_GEN(dev->mdev, max_qp_cnt)) {
658896458233SKamal Heib 		ib_set_device_ops(&dev->ib_dev, &mlx5_ib_dev_hw_stats_ops);
65895e1e7612SMark Bloch 
659016c1975fSMark Bloch 		return mlx5_ib_alloc_counters(dev);
65915e1e7612SMark Bloch 	}
659216c1975fSMark Bloch 
659316c1975fSMark Bloch 	return 0;
659416c1975fSMark Bloch }
659516c1975fSMark Bloch 
6596fb652d32SMark Bloch static void mlx5_ib_stage_counters_cleanup(struct mlx5_ib_dev *dev)
659716c1975fSMark Bloch {
659816c1975fSMark Bloch 	if (MLX5_CAP_GEN(dev->mdev, max_qp_cnt))
659916c1975fSMark Bloch 		mlx5_ib_dealloc_counters(dev);
660016c1975fSMark Bloch }
660116c1975fSMark Bloch 
660216c1975fSMark Bloch static int mlx5_ib_stage_cong_debugfs_init(struct mlx5_ib_dev *dev)
660316c1975fSMark Bloch {
660473eb8f03SGreg Kroah-Hartman 	mlx5_ib_init_cong_debugfs(dev,
6605a9e546e7SParav Pandit 				  mlx5_core_native_port_num(dev->mdev) - 1);
660673eb8f03SGreg Kroah-Hartman 	return 0;
660716c1975fSMark Bloch }
660816c1975fSMark Bloch 
660916c1975fSMark Bloch static void mlx5_ib_stage_cong_debugfs_cleanup(struct mlx5_ib_dev *dev)
661016c1975fSMark Bloch {
6611a9e546e7SParav Pandit 	mlx5_ib_cleanup_cong_debugfs(dev,
6612a9e546e7SParav Pandit 				     mlx5_core_native_port_num(dev->mdev) - 1);
661316c1975fSMark Bloch }
661416c1975fSMark Bloch 
661516c1975fSMark Bloch static int mlx5_ib_stage_uar_init(struct mlx5_ib_dev *dev)
661616c1975fSMark Bloch {
66175fe9dec0SEli Cohen 	dev->mdev->priv.uar = mlx5_get_uars_page(dev->mdev);
6618444261caSLeon Romanovsky 	return PTR_ERR_OR_ZERO(dev->mdev->priv.uar);
661916c1975fSMark Bloch }
662016c1975fSMark Bloch 
662116c1975fSMark Bloch static void mlx5_ib_stage_uar_cleanup(struct mlx5_ib_dev *dev)
662216c1975fSMark Bloch {
662316c1975fSMark Bloch 	mlx5_put_uars_page(dev->mdev, dev->mdev->priv.uar);
662416c1975fSMark Bloch }
662516c1975fSMark Bloch 
6626fb652d32SMark Bloch static int mlx5_ib_stage_bfrag_init(struct mlx5_ib_dev *dev)
662716c1975fSMark Bloch {
662816c1975fSMark Bloch 	int err;
66295fe9dec0SEli Cohen 
66305fe9dec0SEli Cohen 	err = mlx5_alloc_bfreg(dev->mdev, &dev->bfreg, false, false);
66315fe9dec0SEli Cohen 	if (err)
663216c1975fSMark Bloch 		return err;
66335fe9dec0SEli Cohen 
66345fe9dec0SEli Cohen 	err = mlx5_alloc_bfreg(dev->mdev, &dev->fp_bfreg, false, true);
66355fe9dec0SEli Cohen 	if (err)
663616c1975fSMark Bloch 		mlx5_free_bfreg(dev->mdev, &dev->fp_bfreg);
66375fe9dec0SEli Cohen 
663816c1975fSMark Bloch 	return err;
663916c1975fSMark Bloch }
66400837e86aSMark Bloch 
6641fb652d32SMark Bloch static void mlx5_ib_stage_bfrag_cleanup(struct mlx5_ib_dev *dev)
664216c1975fSMark Bloch {
664316c1975fSMark Bloch 	mlx5_free_bfreg(dev->mdev, &dev->fp_bfreg);
664416c1975fSMark Bloch 	mlx5_free_bfreg(dev->mdev, &dev->bfreg);
664516c1975fSMark Bloch }
6646e126ba97SEli Cohen 
6647fb652d32SMark Bloch static int mlx5_ib_stage_ib_reg_init(struct mlx5_ib_dev *dev)
664816c1975fSMark Bloch {
6649e349f858SJason Gunthorpe 	const char *name;
6650e349f858SJason Gunthorpe 
6651508a523fSParav Pandit 	rdma_set_device_sysfs_group(&dev->ib_dev, &mlx5_attr_group);
66527c34ec19SAviv Heller 	if (!mlx5_lag_is_roce(dev->mdev))
6653e349f858SJason Gunthorpe 		name = "mlx5_%d";
6654e349f858SJason Gunthorpe 	else
6655e349f858SJason Gunthorpe 		name = "mlx5_bond_%d";
6656ea4baf7fSParav Pandit 	return ib_register_device(&dev->ib_dev, name);
665716c1975fSMark Bloch }
665816c1975fSMark Bloch 
/*
 * Cleanup callback of the PRE_IB_REG_UMR stage: destroys the UMR resources.
 *
 * The stage has no init callback in the profiles of this file; the matching
 * create_umr_res() call lives in the POST_IB_REG_UMR stage init.
 */
static void mlx5_ib_stage_pre_ib_reg_umr_cleanup(struct mlx5_ib_dev *dev)
{
	destroy_umrc_res(dev);
}
666342cea83fSMark Bloch 
6664fb652d32SMark Bloch static void mlx5_ib_stage_ib_reg_cleanup(struct mlx5_ib_dev *dev)
666516c1975fSMark Bloch {
666616c1975fSMark Bloch 	ib_unregister_device(&dev->ib_dev);
666716c1975fSMark Bloch }
666816c1975fSMark Bloch 
/*
 * Init callback of the POST_IB_REG_UMR stage: creates the UMR resources.
 *
 * Returns the result of create_umr_res(). The resources are destroyed by
 * the PRE_IB_REG_UMR stage cleanup callback, not by a cleanup of this stage.
 */
static int mlx5_ib_stage_post_ib_reg_umr_init(struct mlx5_ib_dev *dev)
{
	return create_umr_res(dev);
}
667316c1975fSMark Bloch 
/*
 * Delay-drop stage init: runs init_delay_drop() for the device.
 *
 * Always returns 0; no status is taken from init_delay_drop().
 */
static int mlx5_ib_stage_delay_drop_init(struct mlx5_ib_dev *dev)
{
	init_delay_drop(dev);
	return 0;
}
668016c1975fSMark Bloch 
/* Delay-drop stage cleanup: runs cancel_delay_drop() for the device. */
static void mlx5_ib_stage_delay_drop_cleanup(struct mlx5_ib_dev *dev)
{
	cancel_delay_drop(dev);
}
668516c1975fSMark Bloch 
6686df097a27SSaeed Mahameed static int mlx5_ib_stage_dev_notifier_init(struct mlx5_ib_dev *dev)
6687df097a27SSaeed Mahameed {
6688df097a27SSaeed Mahameed 	dev->mdev_events.notifier_call = mlx5_ib_event;
6689df097a27SSaeed Mahameed 	mlx5_notifier_register(dev->mdev, &dev->mdev_events);
6690df097a27SSaeed Mahameed 	return 0;
6691df097a27SSaeed Mahameed }
6692df097a27SSaeed Mahameed 
6693df097a27SSaeed Mahameed static void mlx5_ib_stage_dev_notifier_cleanup(struct mlx5_ib_dev *dev)
6694df097a27SSaeed Mahameed {
6695df097a27SSaeed Mahameed 	mlx5_notifier_unregister(dev->mdev, &dev->mdev_events);
6696df097a27SSaeed Mahameed }
6697df097a27SSaeed Mahameed 
669881773ce5SLeon Romanovsky static int mlx5_ib_stage_devx_init(struct mlx5_ib_dev *dev)
669981773ce5SLeon Romanovsky {
670081773ce5SLeon Romanovsky 	int uid;
670181773ce5SLeon Romanovsky 
6702fb98153bSYishai Hadas 	uid = mlx5_ib_devx_create(dev, false);
6703e337dd53SYishai Hadas 	if (uid > 0) {
670481773ce5SLeon Romanovsky 		dev->devx_whitelist_uid = uid;
6705e337dd53SYishai Hadas 		mlx5_ib_devx_init_event_table(dev);
6706e337dd53SYishai Hadas 	}
670781773ce5SLeon Romanovsky 
670881773ce5SLeon Romanovsky 	return 0;
670981773ce5SLeon Romanovsky }
671081773ce5SLeon Romanovsky static void mlx5_ib_stage_devx_cleanup(struct mlx5_ib_dev *dev)
671181773ce5SLeon Romanovsky {
6712e337dd53SYishai Hadas 	if (dev->devx_whitelist_uid) {
6713e337dd53SYishai Hadas 		mlx5_ib_devx_cleanup_event_table(dev);
671481773ce5SLeon Romanovsky 		mlx5_ib_devx_destroy(dev, dev->devx_whitelist_uid);
671581773ce5SLeon Romanovsky 	}
6716e337dd53SYishai Hadas }
671781773ce5SLeon Romanovsky 
6718b5ca15adSMark Bloch void __mlx5_ib_remove(struct mlx5_ib_dev *dev,
671916c1975fSMark Bloch 		      const struct mlx5_ib_profile *profile,
672016c1975fSMark Bloch 		      int stage)
672116c1975fSMark Bloch {
672216c1975fSMark Bloch 	/* Number of stages to cleanup */
672316c1975fSMark Bloch 	while (stage) {
672416c1975fSMark Bloch 		stage--;
672516c1975fSMark Bloch 		if (profile->stage[stage].cleanup)
672616c1975fSMark Bloch 			profile->stage[stage].cleanup(dev);
672716c1975fSMark Bloch 	}
67284a6dc855SMark Bloch 
6729da796ccbSMark Bloch 	kfree(dev->port);
67304a6dc855SMark Bloch 	ib_dealloc_device(&dev->ib_dev);
673116c1975fSMark Bloch }
673216c1975fSMark Bloch 
6733b5ca15adSMark Bloch void *__mlx5_ib_add(struct mlx5_ib_dev *dev,
673416c1975fSMark Bloch 		    const struct mlx5_ib_profile *profile)
673516c1975fSMark Bloch {
673616c1975fSMark Bloch 	int err;
673716c1975fSMark Bloch 	int i;
673816c1975fSMark Bloch 
673916c1975fSMark Bloch 	for (i = 0; i < MLX5_IB_STAGE_MAX; i++) {
674016c1975fSMark Bloch 		if (profile->stage[i].init) {
674116c1975fSMark Bloch 			err = profile->stage[i].init(dev);
674216c1975fSMark Bloch 			if (err)
674316c1975fSMark Bloch 				goto err_out;
674416c1975fSMark Bloch 		}
674516c1975fSMark Bloch 	}
674616c1975fSMark Bloch 
674716c1975fSMark Bloch 	dev->profile = profile;
6748e126ba97SEli Cohen 	dev->ib_active = true;
6749e126ba97SEli Cohen 
67509603b61dSJack Morgenstein 	return dev;
6751e126ba97SEli Cohen 
675216c1975fSMark Bloch err_out:
675316c1975fSMark Bloch 	__mlx5_ib_remove(dev, profile, i);
6754e126ba97SEli Cohen 
67559603b61dSJack Morgenstein 	return NULL;
6756e126ba97SEli Cohen }
6757e126ba97SEli Cohen 
675816c1975fSMark Bloch static const struct mlx5_ib_profile pf_profile = {
675916c1975fSMark Bloch 	STAGE_CREATE(MLX5_IB_STAGE_INIT,
676016c1975fSMark Bloch 		     mlx5_ib_stage_init_init,
676116c1975fSMark Bloch 		     mlx5_ib_stage_init_cleanup),
67629a4ca38dSMark Bloch 	STAGE_CREATE(MLX5_IB_STAGE_FLOW_DB,
67639a4ca38dSMark Bloch 		     mlx5_ib_stage_flow_db_init,
67649a4ca38dSMark Bloch 		     mlx5_ib_stage_flow_db_cleanup),
676516c1975fSMark Bloch 	STAGE_CREATE(MLX5_IB_STAGE_CAPS,
676616c1975fSMark Bloch 		     mlx5_ib_stage_caps_init,
676716c1975fSMark Bloch 		     NULL),
67688e6efa3aSMark Bloch 	STAGE_CREATE(MLX5_IB_STAGE_NON_DEFAULT_CB,
67698e6efa3aSMark Bloch 		     mlx5_ib_stage_non_default_cb,
67708e6efa3aSMark Bloch 		     NULL),
677116c1975fSMark Bloch 	STAGE_CREATE(MLX5_IB_STAGE_ROCE,
677216c1975fSMark Bloch 		     mlx5_ib_stage_roce_init,
677316c1975fSMark Bloch 		     mlx5_ib_stage_roce_cleanup),
6774f3da6577SLeon Romanovsky 	STAGE_CREATE(MLX5_IB_STAGE_SRQ,
6775f3da6577SLeon Romanovsky 		     mlx5_init_srq_table,
6776f3da6577SLeon Romanovsky 		     mlx5_cleanup_srq_table),
677716c1975fSMark Bloch 	STAGE_CREATE(MLX5_IB_STAGE_DEVICE_RESOURCES,
677816c1975fSMark Bloch 		     mlx5_ib_stage_dev_res_init,
677916c1975fSMark Bloch 		     mlx5_ib_stage_dev_res_cleanup),
6780df097a27SSaeed Mahameed 	STAGE_CREATE(MLX5_IB_STAGE_DEVICE_NOTIFIER,
6781df097a27SSaeed Mahameed 		     mlx5_ib_stage_dev_notifier_init,
6782df097a27SSaeed Mahameed 		     mlx5_ib_stage_dev_notifier_cleanup),
678316c1975fSMark Bloch 	STAGE_CREATE(MLX5_IB_STAGE_ODP,
678416c1975fSMark Bloch 		     mlx5_ib_stage_odp_init,
6785d5d284b8SSaeed Mahameed 		     mlx5_ib_stage_odp_cleanup),
678616c1975fSMark Bloch 	STAGE_CREATE(MLX5_IB_STAGE_COUNTERS,
678716c1975fSMark Bloch 		     mlx5_ib_stage_counters_init,
678816c1975fSMark Bloch 		     mlx5_ib_stage_counters_cleanup),
678916c1975fSMark Bloch 	STAGE_CREATE(MLX5_IB_STAGE_CONG_DEBUGFS,
679016c1975fSMark Bloch 		     mlx5_ib_stage_cong_debugfs_init,
679116c1975fSMark Bloch 		     mlx5_ib_stage_cong_debugfs_cleanup),
679216c1975fSMark Bloch 	STAGE_CREATE(MLX5_IB_STAGE_UAR,
679316c1975fSMark Bloch 		     mlx5_ib_stage_uar_init,
679416c1975fSMark Bloch 		     mlx5_ib_stage_uar_cleanup),
679516c1975fSMark Bloch 	STAGE_CREATE(MLX5_IB_STAGE_BFREG,
679616c1975fSMark Bloch 		     mlx5_ib_stage_bfrag_init,
679716c1975fSMark Bloch 		     mlx5_ib_stage_bfrag_cleanup),
679842cea83fSMark Bloch 	STAGE_CREATE(MLX5_IB_STAGE_PRE_IB_REG_UMR,
679942cea83fSMark Bloch 		     NULL,
680042cea83fSMark Bloch 		     mlx5_ib_stage_pre_ib_reg_umr_cleanup),
680181773ce5SLeon Romanovsky 	STAGE_CREATE(MLX5_IB_STAGE_WHITELIST_UID,
680281773ce5SLeon Romanovsky 		     mlx5_ib_stage_devx_init,
680381773ce5SLeon Romanovsky 		     mlx5_ib_stage_devx_cleanup),
680416c1975fSMark Bloch 	STAGE_CREATE(MLX5_IB_STAGE_IB_REG,
680516c1975fSMark Bloch 		     mlx5_ib_stage_ib_reg_init,
680616c1975fSMark Bloch 		     mlx5_ib_stage_ib_reg_cleanup),
680742cea83fSMark Bloch 	STAGE_CREATE(MLX5_IB_STAGE_POST_IB_REG_UMR,
680842cea83fSMark Bloch 		     mlx5_ib_stage_post_ib_reg_umr_init,
680942cea83fSMark Bloch 		     NULL),
681016c1975fSMark Bloch 	STAGE_CREATE(MLX5_IB_STAGE_DELAY_DROP,
681116c1975fSMark Bloch 		     mlx5_ib_stage_delay_drop_init,
681216c1975fSMark Bloch 		     mlx5_ib_stage_delay_drop_cleanup),
681316c1975fSMark Bloch };
681416c1975fSMark Bloch 
6815f0666f1fSBodong Wang const struct mlx5_ib_profile uplink_rep_profile = {
6816b5ca15adSMark Bloch 	STAGE_CREATE(MLX5_IB_STAGE_INIT,
6817b5ca15adSMark Bloch 		     mlx5_ib_stage_init_init,
6818b5ca15adSMark Bloch 		     mlx5_ib_stage_init_cleanup),
6819b5ca15adSMark Bloch 	STAGE_CREATE(MLX5_IB_STAGE_FLOW_DB,
6820b5ca15adSMark Bloch 		     mlx5_ib_stage_flow_db_init,
6821b5ca15adSMark Bloch 		     mlx5_ib_stage_flow_db_cleanup),
6822b5ca15adSMark Bloch 	STAGE_CREATE(MLX5_IB_STAGE_CAPS,
6823b5ca15adSMark Bloch 		     mlx5_ib_stage_caps_init,
6824b5ca15adSMark Bloch 		     NULL),
6825b5ca15adSMark Bloch 	STAGE_CREATE(MLX5_IB_STAGE_NON_DEFAULT_CB,
6826b5ca15adSMark Bloch 		     mlx5_ib_stage_rep_non_default_cb,
6827b5ca15adSMark Bloch 		     NULL),
6828b5ca15adSMark Bloch 	STAGE_CREATE(MLX5_IB_STAGE_ROCE,
6829b5ca15adSMark Bloch 		     mlx5_ib_stage_rep_roce_init,
6830b5ca15adSMark Bloch 		     mlx5_ib_stage_rep_roce_cleanup),
6831f3da6577SLeon Romanovsky 	STAGE_CREATE(MLX5_IB_STAGE_SRQ,
6832f3da6577SLeon Romanovsky 		     mlx5_init_srq_table,
6833f3da6577SLeon Romanovsky 		     mlx5_cleanup_srq_table),
6834b5ca15adSMark Bloch 	STAGE_CREATE(MLX5_IB_STAGE_DEVICE_RESOURCES,
6835b5ca15adSMark Bloch 		     mlx5_ib_stage_dev_res_init,
6836b5ca15adSMark Bloch 		     mlx5_ib_stage_dev_res_cleanup),
6837df097a27SSaeed Mahameed 	STAGE_CREATE(MLX5_IB_STAGE_DEVICE_NOTIFIER,
6838df097a27SSaeed Mahameed 		     mlx5_ib_stage_dev_notifier_init,
6839df097a27SSaeed Mahameed 		     mlx5_ib_stage_dev_notifier_cleanup),
6840b5ca15adSMark Bloch 	STAGE_CREATE(MLX5_IB_STAGE_COUNTERS,
6841b5ca15adSMark Bloch 		     mlx5_ib_stage_counters_init,
6842b5ca15adSMark Bloch 		     mlx5_ib_stage_counters_cleanup),
6843b5ca15adSMark Bloch 	STAGE_CREATE(MLX5_IB_STAGE_UAR,
6844b5ca15adSMark Bloch 		     mlx5_ib_stage_uar_init,
6845b5ca15adSMark Bloch 		     mlx5_ib_stage_uar_cleanup),
6846b5ca15adSMark Bloch 	STAGE_CREATE(MLX5_IB_STAGE_BFREG,
6847b5ca15adSMark Bloch 		     mlx5_ib_stage_bfrag_init,
6848b5ca15adSMark Bloch 		     mlx5_ib_stage_bfrag_cleanup),
684903fe2debSDavid S. Miller 	STAGE_CREATE(MLX5_IB_STAGE_PRE_IB_REG_UMR,
685003fe2debSDavid S. Miller 		     NULL,
685103fe2debSDavid S. Miller 		     mlx5_ib_stage_pre_ib_reg_umr_cleanup),
68527f575103SMark Bloch 	STAGE_CREATE(MLX5_IB_STAGE_WHITELIST_UID,
68537f575103SMark Bloch 		     mlx5_ib_stage_devx_init,
68547f575103SMark Bloch 		     mlx5_ib_stage_devx_cleanup),
6855b5ca15adSMark Bloch 	STAGE_CREATE(MLX5_IB_STAGE_IB_REG,
6856b5ca15adSMark Bloch 		     mlx5_ib_stage_ib_reg_init,
6857b5ca15adSMark Bloch 		     mlx5_ib_stage_ib_reg_cleanup),
685803fe2debSDavid S. Miller 	STAGE_CREATE(MLX5_IB_STAGE_POST_IB_REG_UMR,
685903fe2debSDavid S. Miller 		     mlx5_ib_stage_post_ib_reg_umr_init,
686003fe2debSDavid S. Miller 		     NULL),
6861b5ca15adSMark Bloch };
6862b5ca15adSMark Bloch 
6863e3f1ed1fSLeon Romanovsky static void *mlx5_ib_add_slave_port(struct mlx5_core_dev *mdev)
686432f69e4bSDaniel Jurgens {
686532f69e4bSDaniel Jurgens 	struct mlx5_ib_multiport_info *mpi;
686632f69e4bSDaniel Jurgens 	struct mlx5_ib_dev *dev;
686732f69e4bSDaniel Jurgens 	bool bound = false;
686832f69e4bSDaniel Jurgens 	int err;
686932f69e4bSDaniel Jurgens 
687032f69e4bSDaniel Jurgens 	mpi = kzalloc(sizeof(*mpi), GFP_KERNEL);
687132f69e4bSDaniel Jurgens 	if (!mpi)
687232f69e4bSDaniel Jurgens 		return NULL;
687332f69e4bSDaniel Jurgens 
687432f69e4bSDaniel Jurgens 	mpi->mdev = mdev;
687532f69e4bSDaniel Jurgens 
687632f69e4bSDaniel Jurgens 	err = mlx5_query_nic_vport_system_image_guid(mdev,
687732f69e4bSDaniel Jurgens 						     &mpi->sys_image_guid);
687832f69e4bSDaniel Jurgens 	if (err) {
687932f69e4bSDaniel Jurgens 		kfree(mpi);
688032f69e4bSDaniel Jurgens 		return NULL;
688132f69e4bSDaniel Jurgens 	}
688232f69e4bSDaniel Jurgens 
688332f69e4bSDaniel Jurgens 	mutex_lock(&mlx5_ib_multiport_mutex);
688432f69e4bSDaniel Jurgens 	list_for_each_entry(dev, &mlx5_ib_dev_list, ib_dev_list) {
688532f69e4bSDaniel Jurgens 		if (dev->sys_image_guid == mpi->sys_image_guid)
688632f69e4bSDaniel Jurgens 			bound = mlx5_ib_bind_slave_port(dev, mpi);
688732f69e4bSDaniel Jurgens 
688832f69e4bSDaniel Jurgens 		if (bound) {
688932f69e4bSDaniel Jurgens 			rdma_roce_rescan_device(&dev->ib_dev);
689032f69e4bSDaniel Jurgens 			break;
689132f69e4bSDaniel Jurgens 		}
689232f69e4bSDaniel Jurgens 	}
689332f69e4bSDaniel Jurgens 
689432f69e4bSDaniel Jurgens 	if (!bound) {
689532f69e4bSDaniel Jurgens 		list_add_tail(&mpi->list, &mlx5_ib_unaffiliated_port_list);
6896c42260f1SVu Pham 		dev_dbg(mdev->device,
6897c42260f1SVu Pham 			"no suitable IB device found to bind to, added to unaffiliated list.\n");
689832f69e4bSDaniel Jurgens 	}
689932f69e4bSDaniel Jurgens 	mutex_unlock(&mlx5_ib_multiport_mutex);
690032f69e4bSDaniel Jurgens 
690132f69e4bSDaniel Jurgens 	return mpi;
690232f69e4bSDaniel Jurgens }
690332f69e4bSDaniel Jurgens 
690416c1975fSMark Bloch static void *mlx5_ib_add(struct mlx5_core_dev *mdev)
690516c1975fSMark Bloch {
690632f69e4bSDaniel Jurgens 	enum rdma_link_layer ll;
6907b5ca15adSMark Bloch 	struct mlx5_ib_dev *dev;
690832f69e4bSDaniel Jurgens 	int port_type_cap;
6909da796ccbSMark Bloch 	int num_ports;
691032f69e4bSDaniel Jurgens 
6911b5ca15adSMark Bloch 	printk_once(KERN_INFO "%s", mlx5_version);
6912b5ca15adSMark Bloch 
6913f0666f1fSBodong Wang 	if (MLX5_ESWITCH_MANAGER(mdev) &&
6914f6455de0SBodong Wang 	    mlx5_ib_eswitch_mode(mdev->priv.eswitch) == MLX5_ESWITCH_OFFLOADS) {
69155fb58c9eSMark Bloch 		if (!mlx5_core_mp_enabled(mdev))
6916f0666f1fSBodong Wang 			mlx5_ib_register_vport_reps(mdev);
6917f0666f1fSBodong Wang 		return mdev;
6918f0666f1fSBodong Wang 	}
6919f0666f1fSBodong Wang 
692032f69e4bSDaniel Jurgens 	port_type_cap = MLX5_CAP_GEN(mdev, port_type);
692132f69e4bSDaniel Jurgens 	ll = mlx5_port_type_cap_to_rdma_ll(port_type_cap);
692232f69e4bSDaniel Jurgens 
6923e3f1ed1fSLeon Romanovsky 	if (mlx5_core_is_mp_slave(mdev) && ll == IB_LINK_LAYER_ETHERNET)
6924e3f1ed1fSLeon Romanovsky 		return mlx5_ib_add_slave_port(mdev);
692532f69e4bSDaniel Jurgens 
6926da796ccbSMark Bloch 	num_ports = max(MLX5_CAP_GEN(mdev, num_ports),
6927da796ccbSMark Bloch 			MLX5_CAP_GEN(mdev, num_vhca_ports));
6928459cc69fSLeon Romanovsky 	dev = ib_alloc_device(mlx5_ib_dev, ib_dev);
6929b5ca15adSMark Bloch 	if (!dev)
6930b5ca15adSMark Bloch 		return NULL;
6931da796ccbSMark Bloch 	dev->port = kcalloc(num_ports, sizeof(*dev->port),
6932da796ccbSMark Bloch 			     GFP_KERNEL);
6933da796ccbSMark Bloch 	if (!dev->port) {
6934a5c9c299SParav Pandit 		ib_dealloc_device(&dev->ib_dev);
6935da796ccbSMark Bloch 		return NULL;
6936da796ccbSMark Bloch 	}
6937b5ca15adSMark Bloch 
6938b5ca15adSMark Bloch 	dev->mdev = mdev;
6939da796ccbSMark Bloch 	dev->num_ports = num_ports;
6940b5ca15adSMark Bloch 
6941b5ca15adSMark Bloch 	return __mlx5_ib_add(dev, &pf_profile);
694216c1975fSMark Bloch }
694316c1975fSMark Bloch 
69449603b61dSJack Morgenstein static void mlx5_ib_remove(struct mlx5_core_dev *mdev, void *context)
6945e126ba97SEli Cohen {
694632f69e4bSDaniel Jurgens 	struct mlx5_ib_multiport_info *mpi;
694732f69e4bSDaniel Jurgens 	struct mlx5_ib_dev *dev;
69486aec21f6SHaggai Eran 
6949f0666f1fSBodong Wang 	if (MLX5_ESWITCH_MANAGER(mdev) && context == mdev) {
6950f0666f1fSBodong Wang 		mlx5_ib_unregister_vport_reps(mdev);
6951f0666f1fSBodong Wang 		return;
6952f0666f1fSBodong Wang 	}
6953f0666f1fSBodong Wang 
695432f69e4bSDaniel Jurgens 	if (mlx5_core_is_mp_slave(mdev)) {
695532f69e4bSDaniel Jurgens 		mpi = context;
695632f69e4bSDaniel Jurgens 		mutex_lock(&mlx5_ib_multiport_mutex);
695732f69e4bSDaniel Jurgens 		if (mpi->ibdev)
695832f69e4bSDaniel Jurgens 			mlx5_ib_unbind_slave_port(mpi->ibdev, mpi);
695932f69e4bSDaniel Jurgens 		list_del(&mpi->list);
696032f69e4bSDaniel Jurgens 		mutex_unlock(&mlx5_ib_multiport_mutex);
69615d44adebSDanit Goldberg 		kfree(mpi);
696232f69e4bSDaniel Jurgens 		return;
696332f69e4bSDaniel Jurgens 	}
696432f69e4bSDaniel Jurgens 
696532f69e4bSDaniel Jurgens 	dev = context;
696616c1975fSMark Bloch 	__mlx5_ib_remove(dev, dev->profile, MLX5_IB_STAGE_MAX);
6967e126ba97SEli Cohen }
6968e126ba97SEli Cohen 
69699603b61dSJack Morgenstein static struct mlx5_interface mlx5_ib_interface = {
69709603b61dSJack Morgenstein 	.add            = mlx5_ib_add,
69719603b61dSJack Morgenstein 	.remove         = mlx5_ib_remove,
697264613d94SSaeed Mahameed 	.protocol	= MLX5_INTERFACE_PROTOCOL_IB,
6973e126ba97SEli Cohen };
6974e126ba97SEli Cohen 
6975c44ef998SIlya Lesokhin unsigned long mlx5_ib_get_xlt_emergency_page(void)
6976c44ef998SIlya Lesokhin {
6977c44ef998SIlya Lesokhin 	mutex_lock(&xlt_emergency_page_mutex);
6978c44ef998SIlya Lesokhin 	return xlt_emergency_page;
6979c44ef998SIlya Lesokhin }
6980c44ef998SIlya Lesokhin 
6981c44ef998SIlya Lesokhin void mlx5_ib_put_xlt_emergency_page(void)
6982c44ef998SIlya Lesokhin {
6983c44ef998SIlya Lesokhin 	mutex_unlock(&xlt_emergency_page_mutex);
6984c44ef998SIlya Lesokhin }
6985c44ef998SIlya Lesokhin 
6986e126ba97SEli Cohen static int __init mlx5_ib_init(void)
6987e126ba97SEli Cohen {
69886aec21f6SHaggai Eran 	int err;
69896aec21f6SHaggai Eran 
6990c44ef998SIlya Lesokhin 	xlt_emergency_page = __get_free_page(GFP_KERNEL);
6991c44ef998SIlya Lesokhin 	if (!xlt_emergency_page)
6992d69a24e0SDaniel Jurgens 		return -ENOMEM;
6993d69a24e0SDaniel Jurgens 
6994c44ef998SIlya Lesokhin 	mutex_init(&xlt_emergency_page_mutex);
6995c44ef998SIlya Lesokhin 
6996c44ef998SIlya Lesokhin 	mlx5_ib_event_wq = alloc_ordered_workqueue("mlx5_ib_event_wq", 0);
6997c44ef998SIlya Lesokhin 	if (!mlx5_ib_event_wq) {
6998c44ef998SIlya Lesokhin 		free_page(xlt_emergency_page);
6999c44ef998SIlya Lesokhin 		return -ENOMEM;
7000c44ef998SIlya Lesokhin 	}
7001c44ef998SIlya Lesokhin 
700281713d37SArtemy Kovalyov 	mlx5_ib_odp_init();
70039603b61dSJack Morgenstein 
70046aec21f6SHaggai Eran 	err = mlx5_register_interface(&mlx5_ib_interface);
70056aec21f6SHaggai Eran 
70066aec21f6SHaggai Eran 	return err;
7007e126ba97SEli Cohen }
7008e126ba97SEli Cohen 
7009e126ba97SEli Cohen static void __exit mlx5_ib_cleanup(void)
7010e126ba97SEli Cohen {
70119603b61dSJack Morgenstein 	mlx5_unregister_interface(&mlx5_ib_interface);
7012d69a24e0SDaniel Jurgens 	destroy_workqueue(mlx5_ib_event_wq);
7013c44ef998SIlya Lesokhin 	mutex_destroy(&xlt_emergency_page_mutex);
7014c44ef998SIlya Lesokhin 	free_page(xlt_emergency_page);
7015e126ba97SEli Cohen }
7016e126ba97SEli Cohen 
7017e126ba97SEli Cohen module_init(mlx5_ib_init);
7018e126ba97SEli Cohen module_exit(mlx5_ib_cleanup);
7019