xref: /openbmc/linux/drivers/block/rnbd/rnbd-srv.c (revision 5b9ea86e)
12de6c8deSJack Wang // SPDX-License-Identifier: GPL-2.0-or-later
22de6c8deSJack Wang /*
32de6c8deSJack Wang  * RDMA Network Block Driver
42de6c8deSJack Wang  *
52de6c8deSJack Wang  * Copyright (c) 2014 - 2018 ProfitBricks GmbH. All rights reserved.
62de6c8deSJack Wang  * Copyright (c) 2018 - 2019 1&1 IONOS Cloud GmbH. All rights reserved.
72de6c8deSJack Wang  * Copyright (c) 2019 - 2020 1&1 IONOS SE. All rights reserved.
82de6c8deSJack Wang  */
92de6c8deSJack Wang #undef pr_fmt
102de6c8deSJack Wang #define pr_fmt(fmt) KBUILD_MODNAME " L" __stringify(__LINE__) ": " fmt
112de6c8deSJack Wang 
122de6c8deSJack Wang #include <linux/module.h>
132de6c8deSJack Wang #include <linux/blkdev.h>
142de6c8deSJack Wang 
152de6c8deSJack Wang #include "rnbd-srv.h"
1674e237b6SSantosh Pradhan #include "rnbd-srv-trace.h"
172de6c8deSJack Wang 
182de6c8deSJack Wang MODULE_DESCRIPTION("RDMA Network Block Device Server");
192de6c8deSJack Wang MODULE_LICENSE("GPL");
202de6c8deSJack Wang 
212de6c8deSJack Wang static u16 port_nr = RTRS_PORT;
222de6c8deSJack Wang 
232de6c8deSJack Wang module_param_named(port_nr, port_nr, ushort, 0444);
242de6c8deSJack Wang MODULE_PARM_DESC(port_nr,
252de6c8deSJack Wang 		 "The port number the server is listening on (default: "
262de6c8deSJack Wang 		 __stringify(RTRS_PORT)")");
272de6c8deSJack Wang 
282de6c8deSJack Wang #define DEFAULT_DEV_SEARCH_PATH "/"
292de6c8deSJack Wang 
302de6c8deSJack Wang static char dev_search_path[PATH_MAX] = DEFAULT_DEV_SEARCH_PATH;
312de6c8deSJack Wang 
dev_search_path_set(const char * val,const struct kernel_param * kp)322de6c8deSJack Wang static int dev_search_path_set(const char *val, const struct kernel_param *kp)
332de6c8deSJack Wang {
342de6c8deSJack Wang 	const char *p = strrchr(val, '\n') ? : val + strlen(val);
352de6c8deSJack Wang 
362de6c8deSJack Wang 	if (strlen(val) >= sizeof(dev_search_path))
372de6c8deSJack Wang 		return -EINVAL;
382de6c8deSJack Wang 
392de6c8deSJack Wang 	snprintf(dev_search_path, sizeof(dev_search_path), "%.*s",
402de6c8deSJack Wang 		 (int)(p - val), val);
412de6c8deSJack Wang 
422de6c8deSJack Wang 	pr_info("dev_search_path changed to '%s'\n", dev_search_path);
432de6c8deSJack Wang 
442de6c8deSJack Wang 	return 0;
452de6c8deSJack Wang }
462de6c8deSJack Wang 
472de6c8deSJack Wang static struct kparam_string dev_search_path_kparam_str = {
482de6c8deSJack Wang 	.maxlen	= sizeof(dev_search_path),
492de6c8deSJack Wang 	.string	= dev_search_path
502de6c8deSJack Wang };
512de6c8deSJack Wang 
522de6c8deSJack Wang static const struct kernel_param_ops dev_search_path_ops = {
532de6c8deSJack Wang 	.set	= dev_search_path_set,
542de6c8deSJack Wang 	.get	= param_get_string,
552de6c8deSJack Wang };
562de6c8deSJack Wang 
572de6c8deSJack Wang module_param_cb(dev_search_path, &dev_search_path_ops,
582de6c8deSJack Wang 		&dev_search_path_kparam_str, 0444);
592de6c8deSJack Wang MODULE_PARM_DESC(dev_search_path,
602de6c8deSJack Wang 		 "Sets the dev_search_path. When a device is mapped this path is prepended to the device path from the map device operation.  If %SESSNAME% is specified in a path, then device will be searched in a session namespace. (default: "
612de6c8deSJack Wang 		 DEFAULT_DEV_SEARCH_PATH ")");
622de6c8deSJack Wang 
/* sess_list is modified under sess_lock (create_sess()/destroy_sess()). */
static LIST_HEAD(sess_list);
static DEFINE_MUTEX(sess_lock);

/* dev_list is walked and modified under dev_lock. */
static LIST_HEAD(dev_list);
static DEFINE_SPINLOCK(dev_lock);

/*
 * Per-I/O context: attached to a bio as bi_private in process_rdma() and
 * freed in rnbd_dev_bi_end_io().
 */
struct rnbd_io_private {
	/* operation handle passed to rtrs_srv_resp_rdma() on completion */
	struct rtrs_srv_op		*id;
	/* session device whose reference is held for the I/O's lifetime */
	struct rnbd_srv_sess_dev	*sess_dev;
};
732de6c8deSJack Wang 
rnbd_sess_dev_release(struct kref * kref)742de6c8deSJack Wang static void rnbd_sess_dev_release(struct kref *kref)
752de6c8deSJack Wang {
762de6c8deSJack Wang 	struct rnbd_srv_sess_dev *sess_dev;
772de6c8deSJack Wang 
782de6c8deSJack Wang 	sess_dev = container_of(kref, struct rnbd_srv_sess_dev, kref);
792de6c8deSJack Wang 	complete(sess_dev->destroy_comp);
802de6c8deSJack Wang }
812de6c8deSJack Wang 
rnbd_put_sess_dev(struct rnbd_srv_sess_dev * sess_dev)822de6c8deSJack Wang static inline void rnbd_put_sess_dev(struct rnbd_srv_sess_dev *sess_dev)
832de6c8deSJack Wang {
842de6c8deSJack Wang 	kref_put(&sess_dev->kref, rnbd_sess_dev_release);
852de6c8deSJack Wang }
862de6c8deSJack Wang 
872de6c8deSJack Wang static struct rnbd_srv_sess_dev *
rnbd_get_sess_dev(int dev_id,struct rnbd_srv_session * srv_sess)882de6c8deSJack Wang rnbd_get_sess_dev(int dev_id, struct rnbd_srv_session *srv_sess)
892de6c8deSJack Wang {
902de6c8deSJack Wang 	struct rnbd_srv_sess_dev *sess_dev;
912de6c8deSJack Wang 	int ret = 0;
922de6c8deSJack Wang 
932de6c8deSJack Wang 	rcu_read_lock();
942de6c8deSJack Wang 	sess_dev = xa_load(&srv_sess->index_idr, dev_id);
951e31016bSGioh Kim 	if (sess_dev)
962de6c8deSJack Wang 		ret = kref_get_unless_zero(&sess_dev->kref);
972de6c8deSJack Wang 	rcu_read_unlock();
982de6c8deSJack Wang 
99ba2eed1cSGuoqing Jiang 	if (!ret)
1002de6c8deSJack Wang 		return ERR_PTR(-ENXIO);
1012de6c8deSJack Wang 
1022de6c8deSJack Wang 	return sess_dev;
1032de6c8deSJack Wang }
1042de6c8deSJack Wang 
rnbd_dev_bi_end_io(struct bio * bio)1051fe0640fSChristoph Hellwig static void rnbd_dev_bi_end_io(struct bio *bio)
1061fe0640fSChristoph Hellwig {
1072ecaa581SChristoph Hellwig 	struct rnbd_io_private *rnbd_priv = bio->bi_private;
1082ecaa581SChristoph Hellwig 	struct rnbd_srv_sess_dev *sess_dev = rnbd_priv->sess_dev;
1092ecaa581SChristoph Hellwig 
1102ecaa581SChristoph Hellwig 	rnbd_put_sess_dev(sess_dev);
1112ecaa581SChristoph Hellwig 	rtrs_srv_resp_rdma(rnbd_priv->id, blk_status_to_errno(bio->bi_status));
1122ecaa581SChristoph Hellwig 
1132ecaa581SChristoph Hellwig 	kfree(rnbd_priv);
1141fe0640fSChristoph Hellwig 	bio_put(bio);
1151fe0640fSChristoph Hellwig }
1161fe0640fSChristoph Hellwig 
/**
 * process_rdma() - build a bio from an RNBD I/O message and submit it
 * @srv_sess:	session the message arrived on
 * @id:		operation handle, passed to rtrs_srv_resp_rdma() on completion
 * @data:	data buffer to attach to the bio
 * @datalen:	length of @data in bytes
 * @usr:	the I/O message (struct rnbd_msg_io)
 * @usrlen:	length of @usr in bytes
 *
 * On success the bio owns the per-I/O context and the session device
 * reference; both are released in rnbd_dev_bi_end_io().
 *
 * Return: 0 once the bio has been submitted, -ENOMEM if the per-I/O context
 * cannot be allocated, -ENOTCONN if the device id is unknown, -EINVAL if
 * the data buffer cannot be added to the bio.
 */
static int process_rdma(struct rnbd_srv_session *srv_sess,
			struct rtrs_srv_op *id, void *data, u32 datalen,
			const void *usr, size_t usrlen)
{
	const struct rnbd_msg_io *msg = usr;
	struct rnbd_io_private *priv;
	struct rnbd_srv_sess_dev *sess_dev;
	u32 dev_id;
	int err;
	struct bio *bio;
	short prio;

	trace_process_rdma(srv_sess, msg, id, datalen, usrlen);

	priv = kmalloc(sizeof(*priv), GFP_KERNEL);
	if (!priv)
		return -ENOMEM;

	dev_id = le32_to_cpu(msg->device_id);

	sess_dev = rnbd_get_sess_dev(dev_id, srv_sess);
	if (IS_ERR(sess_dev)) {
		/* dev_id is a u32: print it unsigned so large ids are not negative */
		pr_err_ratelimited("Got I/O request on session %s for unknown device id %u\n",
				   srv_sess->sessname, dev_id);
		err = -ENOTCONN;
		goto err;
	}

	priv->sess_dev = sess_dev;
	priv->id = id;

	/*
	 * NOTE(review): the bio_alloc() result is used unchecked; this relies
	 * on GFP_KERNEL bio allocations not failing — confirm.
	 */
	bio = bio_alloc(sess_dev->bdev, 1,
			rnbd_to_bio_flags(le32_to_cpu(msg->rw)), GFP_KERNEL);
	if (bio_add_page(bio, virt_to_page(data), datalen,
			offset_in_page(data)) != datalen) {
		rnbd_srv_err(sess_dev, "Failed to map data to bio\n");
		err = -EINVAL;
		goto bio_put;
	}

	bio->bi_end_io = rnbd_dev_bi_end_io;
	bio->bi_private = priv;
	bio->bi_iter.bi_sector = le64_to_cpu(msg->sector);
	bio->bi_iter.bi_size = le32_to_cpu(msg->bi_size);
	/* priority is taken from the message only if version and length allow */
	prio = srv_sess->ver < RNBD_PROTO_VER_MAJOR ||
	       usrlen < sizeof(*msg) ? 0 : le16_to_cpu(msg->prio);
	bio_set_prio(bio, prio);

	submit_bio(bio);

	return 0;

bio_put:
	bio_put(bio);
	rnbd_put_sess_dev(sess_dev);
err:
	kfree(priv);
	return err;
}
1762de6c8deSJack Wang 
destroy_device(struct kref * kref)177d16b5ac8SGuoqing Jiang static void destroy_device(struct kref *kref)
1782de6c8deSJack Wang {
179d16b5ac8SGuoqing Jiang 	struct rnbd_srv_dev *dev = container_of(kref, struct rnbd_srv_dev, kref);
180d16b5ac8SGuoqing Jiang 
1812de6c8deSJack Wang 	WARN_ONCE(!list_empty(&dev->sess_dev_list),
1822de6c8deSJack Wang 		  "Device %s is being destroyed but still in use!\n",
1833ecdbf91SGuoqing Jiang 		  dev->name);
1842de6c8deSJack Wang 
1852de6c8deSJack Wang 	spin_lock(&dev_lock);
1862de6c8deSJack Wang 	list_del(&dev->list);
1872de6c8deSJack Wang 	spin_unlock(&dev_lock);
1882de6c8deSJack Wang 
1892de6c8deSJack Wang 	mutex_destroy(&dev->lock);
1902de6c8deSJack Wang 	if (dev->dev_kobj.state_in_sysfs)
1912de6c8deSJack Wang 		/*
1922de6c8deSJack Wang 		 * Destroy kobj only if it was really created.
1932de6c8deSJack Wang 		 */
1942de6c8deSJack Wang 		rnbd_srv_destroy_dev_sysfs(dev);
1952de6c8deSJack Wang 	else
1962de6c8deSJack Wang 		kfree(dev);
1972de6c8deSJack Wang }
1982de6c8deSJack Wang 
rnbd_put_srv_dev(struct rnbd_srv_dev * dev)1992de6c8deSJack Wang static void rnbd_put_srv_dev(struct rnbd_srv_dev *dev)
2002de6c8deSJack Wang {
201d16b5ac8SGuoqing Jiang 	kref_put(&dev->kref, destroy_device);
2022de6c8deSJack Wang }
2032de6c8deSJack Wang 
/**
 * rnbd_destroy_sess_dev() - tear down and free a session device
 * @sess_dev:	session device to destroy; freed before returning
 * @keep_id:	when true the index entry is swapped to NULL instead of being
 *		erased
 *
 * Removes @sess_dev from the session index, waits for an RCU grace period,
 * drops a reference and blocks until rnbd_sess_dev_release() signals the
 * on-stack completion. Afterwards the block device is put, @sess_dev is
 * unlinked from its server device, and the server device reference is
 * dropped.
 */
void rnbd_destroy_sess_dev(struct rnbd_srv_sess_dev *sess_dev, bool keep_id)
{
	DECLARE_COMPLETION_ONSTACK(released);

	if (!keep_id)
		xa_erase(&sess_dev->sess->index_idr, sess_dev->device_id);
	else
		/*
		 * Free the resources for the id but don't allow the id itself
		 * to be re-used, because it is still used by the client.
		 */
		xa_cmpxchg(&sess_dev->sess->index_idr, sess_dev->device_id,
			   sess_dev, NULL, 0);
	synchronize_rcu();

	sess_dev->destroy_comp = &released;
	rnbd_put_sess_dev(sess_dev);
	/* wait for inflights to drop to zero */
	wait_for_completion(&released);

	blkdev_put(sess_dev->bdev, NULL);

	mutex_lock(&sess_dev->dev->lock);
	list_del(&sess_dev->dev_list);
	/* only non-readonly opens were counted in open_write_cnt */
	if (!sess_dev->readonly)
		sess_dev->dev->open_write_cnt--;
	mutex_unlock(&sess_dev->dev->lock);

	rnbd_put_srv_dev(sess_dev->dev);

	rnbd_srv_info(sess_dev, "Device closed\n");
	kfree(sess_dev);
}
2342de6c8deSJack Wang 
destroy_sess(struct rnbd_srv_session * srv_sess)2352de6c8deSJack Wang static void destroy_sess(struct rnbd_srv_session *srv_sess)
2362de6c8deSJack Wang {
237ce11bdf9SMd Haris Iqbal 	struct rnbd_srv_sess_dev *sess_dev;
238ce11bdf9SMd Haris Iqbal 	unsigned long index;
2392de6c8deSJack Wang 
240ce11bdf9SMd Haris Iqbal 	if (xa_empty(&srv_sess->index_idr))
2412de6c8deSJack Wang 		goto out;
2422de6c8deSJack Wang 
24374e237b6SSantosh Pradhan 	trace_destroy_sess(srv_sess);
24474e237b6SSantosh Pradhan 
2452de6c8deSJack Wang 	mutex_lock(&srv_sess->lock);
246ce11bdf9SMd Haris Iqbal 	xa_for_each(&srv_sess->index_idr, index, sess_dev)
2472de6c8deSJack Wang 		rnbd_srv_destroy_dev_session_sysfs(sess_dev);
2482de6c8deSJack Wang 	mutex_unlock(&srv_sess->lock);
2492de6c8deSJack Wang 
2502de6c8deSJack Wang out:
2512de6c8deSJack Wang 	xa_destroy(&srv_sess->index_idr);
2522de6c8deSJack Wang 
2532de6c8deSJack Wang 	pr_info("RTRS Session %s disconnected\n", srv_sess->sessname);
2542de6c8deSJack Wang 
2552de6c8deSJack Wang 	mutex_lock(&sess_lock);
2562de6c8deSJack Wang 	list_del(&srv_sess->list);
2572de6c8deSJack Wang 	mutex_unlock(&sess_lock);
2582de6c8deSJack Wang 
2592de6c8deSJack Wang 	mutex_destroy(&srv_sess->lock);
2602de6c8deSJack Wang 	kfree(srv_sess);
2612de6c8deSJack Wang }
2622de6c8deSJack Wang 
create_sess(struct rtrs_srv_sess * rtrs)263f7ecac6aSVaishali Thakkar static int create_sess(struct rtrs_srv_sess *rtrs)
2642de6c8deSJack Wang {
2652de6c8deSJack Wang 	struct rnbd_srv_session *srv_sess;
266ae4c8164SVaishali Thakkar 	char pathname[NAME_MAX];
2672de6c8deSJack Wang 	int err;
2682de6c8deSJack Wang 
269ae4c8164SVaishali Thakkar 	err = rtrs_srv_get_path_name(rtrs, pathname, sizeof(pathname));
2702de6c8deSJack Wang 	if (err) {
271ae4c8164SVaishali Thakkar 		pr_err("rtrs_srv_get_path_name(%s): %d\n", pathname, err);
2722de6c8deSJack Wang 
2732de6c8deSJack Wang 		return err;
2742de6c8deSJack Wang 	}
2752de6c8deSJack Wang 	srv_sess = kzalloc(sizeof(*srv_sess), GFP_KERNEL);
2762de6c8deSJack Wang 	if (!srv_sess)
2772de6c8deSJack Wang 		return -ENOMEM;
2782de6c8deSJack Wang 
2792de6c8deSJack Wang 	srv_sess->queue_depth = rtrs_srv_get_queue_depth(rtrs);
2802de6c8deSJack Wang 	xa_init_flags(&srv_sess->index_idr, XA_FLAGS_ALLOC);
2812de6c8deSJack Wang 	mutex_init(&srv_sess->lock);
2822de6c8deSJack Wang 	mutex_lock(&sess_lock);
2832de6c8deSJack Wang 	list_add(&srv_sess->list, &sess_list);
2842de6c8deSJack Wang 	mutex_unlock(&sess_lock);
2852de6c8deSJack Wang 
2862de6c8deSJack Wang 	srv_sess->rtrs = rtrs;
287ae4c8164SVaishali Thakkar 	strscpy(srv_sess->sessname, pathname, sizeof(srv_sess->sessname));
2882de6c8deSJack Wang 
2892de6c8deSJack Wang 	rtrs_srv_set_sess_priv(rtrs, srv_sess);
2902de6c8deSJack Wang 
29174e237b6SSantosh Pradhan 	trace_create_sess(srv_sess);
29274e237b6SSantosh Pradhan 
2932de6c8deSJack Wang 	return 0;
2942de6c8deSJack Wang }
2952de6c8deSJack Wang 
rnbd_srv_link_ev(struct rtrs_srv_sess * rtrs,enum rtrs_srv_link_ev ev,void * priv)296f7ecac6aSVaishali Thakkar static int rnbd_srv_link_ev(struct rtrs_srv_sess *rtrs,
2972de6c8deSJack Wang 			     enum rtrs_srv_link_ev ev, void *priv)
2982de6c8deSJack Wang {
2992de6c8deSJack Wang 	struct rnbd_srv_session *srv_sess = priv;
3002de6c8deSJack Wang 
3012de6c8deSJack Wang 	switch (ev) {
3022de6c8deSJack Wang 	case RTRS_SRV_LINK_EV_CONNECTED:
3032de6c8deSJack Wang 		return create_sess(rtrs);
3042de6c8deSJack Wang 
3052de6c8deSJack Wang 	case RTRS_SRV_LINK_EV_DISCONNECTED:
3062de6c8deSJack Wang 		if (WARN_ON_ONCE(!srv_sess))
3072de6c8deSJack Wang 			return -EINVAL;
3082de6c8deSJack Wang 
3092de6c8deSJack Wang 		destroy_sess(srv_sess);
3102de6c8deSJack Wang 		return 0;
3112de6c8deSJack Wang 
3122de6c8deSJack Wang 	default:
3132de6c8deSJack Wang 		pr_warn("Received unknown RTRS session event %d from session %s\n",
3142de6c8deSJack Wang 			ev, srv_sess->sessname);
3152de6c8deSJack Wang 		return -EINVAL;
3162de6c8deSJack Wang 	}
3172de6c8deSJack Wang }
3182de6c8deSJack Wang 
rnbd_srv_sess_dev_force_close(struct rnbd_srv_sess_dev * sess_dev,struct kobj_attribute * attr)319c77bfa8fSGioh Kim void rnbd_srv_sess_dev_force_close(struct rnbd_srv_sess_dev *sess_dev,
320c77bfa8fSGioh Kim 				   struct kobj_attribute *attr)
32178699805SLutz Pogrell {
3221a84e7c6SJack Wang 	struct rnbd_srv_session	*sess = sess_dev->sess;
3231a84e7c6SJack Wang 
324b168e1d8SGioh Kim 	/* It is already started to close by client's close message. */
325b168e1d8SGioh Kim 	if (!mutex_trylock(&sess->lock))
326b168e1d8SGioh Kim 		return;
3274bc14f31SMd Haris Iqbal 
3284bc14f31SMd Haris Iqbal 	sess_dev->keep_id = true;
329c77bfa8fSGioh Kim 	/* first remove sysfs itself to avoid deadlock */
330c77bfa8fSGioh Kim 	sysfs_remove_file_self(&sess_dev->kobj, &attr->attr);
3311a84e7c6SJack Wang 	rnbd_srv_destroy_dev_session_sysfs(sess_dev);
3321a84e7c6SJack Wang 	mutex_unlock(&sess->lock);
33378699805SLutz Pogrell }
33478699805SLutz Pogrell 
/*
 * Handle a close message: look up the session device named by the message
 * and, if it exists, destroy its sysfs entries under the session lock.
 * An unknown device id is silently ignored.
 */
static void process_msg_close(struct rnbd_srv_session *srv_sess,
			     void *data, size_t datalen, const void *usr,
			     size_t usrlen)
{
	const struct rnbd_msg_close *close_msg = usr;
	struct rnbd_srv_sess_dev *sess_dev;
	u32 dev_id;

	trace_process_msg_close(srv_sess, close_msg);

	dev_id = le32_to_cpu(close_msg->device_id);
	sess_dev = rnbd_get_sess_dev(dev_id, srv_sess);
	if (IS_ERR(sess_dev))
		return;

	/* the lookup reference is released before the teardown call */
	rnbd_put_sess_dev(sess_dev);

	mutex_lock(&srv_sess->lock);
	rnbd_srv_destroy_dev_session_sysfs(sess_dev);
	mutex_unlock(&srv_sess->lock);
}
3542de6c8deSJack Wang 
355c81cba85SGioh Kim static int process_msg_open(struct rnbd_srv_session *srv_sess,
3562de6c8deSJack Wang 			    const void *msg, size_t len,
3572de6c8deSJack Wang 			    void *data, size_t datalen);
3582de6c8deSJack Wang 
359fece685cSGuoqing Jiang static void process_msg_sess_info(struct rnbd_srv_session *srv_sess,
3602de6c8deSJack Wang 				 const void *msg, size_t len,
3612de6c8deSJack Wang 				 void *data, size_t datalen);
3622de6c8deSJack Wang 
/**
 * rnbd_srv_rdma_ev() - dispatch an incoming RNBD message by type
 * @priv:	the RNBD session (struct rnbd_srv_session)
 * @id:		operation handle used to send the response
 * @data:	data buffer accompanying the message
 * @datalen:	length of @data
 * @usr:	the message; starts with a struct rnbd_msg_hdr
 * @usrlen:	length of @usr
 *
 * I/O messages are handed to process_rdma(), whose result is returned
 * directly. Control messages are answered here via rtrs_srv_resp_rdma().
 *
 * NOTE(review): @usrlen is not compared with sizeof(*hdr) before hdr->type
 * is read — confirm the transport guarantees a full header.
 *
 * Return: -ENODEV without a session, -EINVAL for an unknown message type,
 * the process_rdma() result for I/O, otherwise 0.
 */
static int rnbd_srv_rdma_ev(void *priv, struct rtrs_srv_op *id,
			    void *data, size_t datalen,
			    const void *usr, size_t usrlen)
{
	struct rnbd_srv_session *srv_sess = priv;
	const struct rnbd_msg_hdr *hdr = usr;
	int rsp_status = 0;
	u16 msg_type;

	if (WARN_ON_ONCE(!srv_sess))
		return -ENODEV;

	msg_type = le16_to_cpu(hdr->type);

	/* The I/O path does not send a response from here. */
	if (msg_type == RNBD_MSG_IO)
		return process_rdma(srv_sess, id, data, datalen, usr, usrlen);

	switch (msg_type) {
	case RNBD_MSG_OPEN:
		rsp_status = process_msg_open(srv_sess, usr, usrlen,
					      data, datalen);
		break;
	case RNBD_MSG_CLOSE:
		process_msg_close(srv_sess, data, datalen, usr, usrlen);
		break;
	case RNBD_MSG_SESS_INFO:
		process_msg_sess_info(srv_sess, usr, usrlen, data, datalen);
		break;
	default:
		pr_warn("Received unexpected message type %d from session %s\n",
			msg_type, srv_sess->sessname);
		return -EINVAL;
	}

	/*
	 * The status is passed to rtrs to handle the failure case, so just
	 * return 0 here; otherwise callers in rtrs would call
	 * send_io_resp_imm again and print a redundant error message.
	 */
	rtrs_srv_resp_rdma(id, rsp_status);
	return 0;
}
4032de6c8deSJack Wang 
4042de6c8deSJack Wang static struct rnbd_srv_sess_dev
rnbd_sess_dev_alloc(struct rnbd_srv_session * srv_sess)4052de6c8deSJack Wang *rnbd_sess_dev_alloc(struct rnbd_srv_session *srv_sess)
4062de6c8deSJack Wang {
4072de6c8deSJack Wang 	struct rnbd_srv_sess_dev *sess_dev;
4082de6c8deSJack Wang 	int error;
4092de6c8deSJack Wang 
4102de6c8deSJack Wang 	sess_dev = kzalloc(sizeof(*sess_dev), GFP_KERNEL);
4112de6c8deSJack Wang 	if (!sess_dev)
4122de6c8deSJack Wang 		return ERR_PTR(-ENOMEM);
4132de6c8deSJack Wang 
4142de6c8deSJack Wang 	error = xa_alloc(&srv_sess->index_idr, &sess_dev->device_id, sess_dev,
4152de6c8deSJack Wang 			 xa_limit_32b, GFP_NOWAIT);
4162de6c8deSJack Wang 	if (error < 0) {
4172de6c8deSJack Wang 		pr_warn("Allocating idr failed, err: %d\n", error);
4182de6c8deSJack Wang 		kfree(sess_dev);
4192de6c8deSJack Wang 		return ERR_PTR(error);
4202de6c8deSJack Wang 	}
4212de6c8deSJack Wang 
4222de6c8deSJack Wang 	return sess_dev;
4232de6c8deSJack Wang }
4242de6c8deSJack Wang 
rnbd_srv_init_srv_dev(struct block_device * bdev)4256e880cf5SChristoph Hellwig static struct rnbd_srv_dev *rnbd_srv_init_srv_dev(struct block_device *bdev)
4262de6c8deSJack Wang {
4272de6c8deSJack Wang 	struct rnbd_srv_dev *dev;
4282de6c8deSJack Wang 
4292de6c8deSJack Wang 	dev = kzalloc(sizeof(*dev), GFP_KERNEL);
4302de6c8deSJack Wang 	if (!dev)
4312de6c8deSJack Wang 		return ERR_PTR(-ENOMEM);
4322de6c8deSJack Wang 
4333ecdbf91SGuoqing Jiang 	snprintf(dev->name, sizeof(dev->name), "%pg", bdev);
4342de6c8deSJack Wang 	kref_init(&dev->kref);
4352de6c8deSJack Wang 	INIT_LIST_HEAD(&dev->sess_dev_list);
4362de6c8deSJack Wang 	mutex_init(&dev->lock);
4372de6c8deSJack Wang 
4382de6c8deSJack Wang 	return dev;
4392de6c8deSJack Wang }
4402de6c8deSJack Wang 
4412de6c8deSJack Wang static struct rnbd_srv_dev *
rnbd_srv_find_or_add_srv_dev(struct rnbd_srv_dev * new_dev)4422de6c8deSJack Wang rnbd_srv_find_or_add_srv_dev(struct rnbd_srv_dev *new_dev)
4432de6c8deSJack Wang {
4442de6c8deSJack Wang 	struct rnbd_srv_dev *dev;
4452de6c8deSJack Wang 
4462de6c8deSJack Wang 	spin_lock(&dev_lock);
4472de6c8deSJack Wang 	list_for_each_entry(dev, &dev_list, list) {
4483ecdbf91SGuoqing Jiang 		if (!strncmp(dev->name, new_dev->name, sizeof(dev->name))) {
4492de6c8deSJack Wang 			if (!kref_get_unless_zero(&dev->kref))
4502de6c8deSJack Wang 				/*
4512de6c8deSJack Wang 				 * We lost the race, device is almost dead.
4522de6c8deSJack Wang 				 *  Continue traversing to find a valid one.
4532de6c8deSJack Wang 				 */
4542de6c8deSJack Wang 				continue;
4552de6c8deSJack Wang 			spin_unlock(&dev_lock);
4562de6c8deSJack Wang 			return dev;
4572de6c8deSJack Wang 		}
4582de6c8deSJack Wang 	}
4592de6c8deSJack Wang 	list_add(&new_dev->list, &dev_list);
4602de6c8deSJack Wang 	spin_unlock(&dev_lock);
4612de6c8deSJack Wang 
4622de6c8deSJack Wang 	return new_dev;
4632de6c8deSJack Wang }
4642de6c8deSJack Wang 
rnbd_srv_check_update_open_perm(struct rnbd_srv_dev * srv_dev,struct rnbd_srv_session * srv_sess,enum rnbd_access_mode access_mode)4652de6c8deSJack Wang static int rnbd_srv_check_update_open_perm(struct rnbd_srv_dev *srv_dev,
4662de6c8deSJack Wang 					    struct rnbd_srv_session *srv_sess,
4672de6c8deSJack Wang 					    enum rnbd_access_mode access_mode)
4682de6c8deSJack Wang {
4696a12d537SGuoqing Jiang 	int ret = 0;
4702de6c8deSJack Wang 
4712de6c8deSJack Wang 	mutex_lock(&srv_dev->lock);
4722de6c8deSJack Wang 
4732de6c8deSJack Wang 	switch (access_mode) {
4742de6c8deSJack Wang 	case RNBD_ACCESS_RO:
4752de6c8deSJack Wang 		break;
4762de6c8deSJack Wang 	case RNBD_ACCESS_RW:
4772de6c8deSJack Wang 		if (srv_dev->open_write_cnt == 0)  {
4782de6c8deSJack Wang 			srv_dev->open_write_cnt++;
4792de6c8deSJack Wang 		} else {
4802de6c8deSJack Wang 			pr_err("Mapping device '%s' for session %s with RW permissions failed. Device already opened as 'RW' by %d client(s), access mode %s.\n",
4813ecdbf91SGuoqing Jiang 			       srv_dev->name, srv_sess->sessname,
4822de6c8deSJack Wang 			       srv_dev->open_write_cnt,
483d6e94913SGuoqing Jiang 			       rnbd_access_modes[access_mode].str);
4846a12d537SGuoqing Jiang 			ret = -EPERM;
4852de6c8deSJack Wang 		}
4862de6c8deSJack Wang 		break;
4872de6c8deSJack Wang 	case RNBD_ACCESS_MIGRATION:
4882de6c8deSJack Wang 		if (srv_dev->open_write_cnt < 2) {
4892de6c8deSJack Wang 			srv_dev->open_write_cnt++;
4902de6c8deSJack Wang 		} else {
4912de6c8deSJack Wang 			pr_err("Mapping device '%s' for session %s with migration permissions failed. Device already opened as 'RW' by %d client(s), access mode %s.\n",
4923ecdbf91SGuoqing Jiang 			       srv_dev->name, srv_sess->sessname,
4932de6c8deSJack Wang 			       srv_dev->open_write_cnt,
494d6e94913SGuoqing Jiang 			       rnbd_access_modes[access_mode].str);
4956a12d537SGuoqing Jiang 			ret = -EPERM;
4962de6c8deSJack Wang 		}
4972de6c8deSJack Wang 		break;
4982de6c8deSJack Wang 	default:
4992de6c8deSJack Wang 		pr_err("Received mapping request for device '%s' on session %s with invalid access mode: %d\n",
5003ecdbf91SGuoqing Jiang 		       srv_dev->name, srv_sess->sessname, access_mode);
5012de6c8deSJack Wang 		ret = -EINVAL;
5022de6c8deSJack Wang 	}
5032de6c8deSJack Wang 
5042de6c8deSJack Wang 	mutex_unlock(&srv_dev->lock);
5052de6c8deSJack Wang 
5062de6c8deSJack Wang 	return ret;
5072de6c8deSJack Wang }
5082de6c8deSJack Wang 
5092de6c8deSJack Wang static struct rnbd_srv_dev *
rnbd_srv_get_or_create_srv_dev(struct block_device * bdev,struct rnbd_srv_session * srv_sess,enum rnbd_access_mode access_mode)510f7de4886SChristoph Hellwig rnbd_srv_get_or_create_srv_dev(struct block_device *bdev,
5112de6c8deSJack Wang 				struct rnbd_srv_session *srv_sess,
5122de6c8deSJack Wang 				enum rnbd_access_mode access_mode)
5132de6c8deSJack Wang {
5142de6c8deSJack Wang 	int ret;
5152de6c8deSJack Wang 	struct rnbd_srv_dev *new_dev, *dev;
5162de6c8deSJack Wang 
517f7de4886SChristoph Hellwig 	new_dev = rnbd_srv_init_srv_dev(bdev);
5182de6c8deSJack Wang 	if (IS_ERR(new_dev))
5192de6c8deSJack Wang 		return new_dev;
5202de6c8deSJack Wang 
5212de6c8deSJack Wang 	dev = rnbd_srv_find_or_add_srv_dev(new_dev);
5222de6c8deSJack Wang 	if (dev != new_dev)
5232de6c8deSJack Wang 		kfree(new_dev);
5242de6c8deSJack Wang 
5252de6c8deSJack Wang 	ret = rnbd_srv_check_update_open_perm(dev, srv_sess, access_mode);
5262de6c8deSJack Wang 	if (ret) {
5272de6c8deSJack Wang 		rnbd_put_srv_dev(dev);
5282de6c8deSJack Wang 		return ERR_PTR(ret);
5292de6c8deSJack Wang 	}
5302de6c8deSJack Wang 
5312de6c8deSJack Wang 	return dev;
5322de6c8deSJack Wang }
5332de6c8deSJack Wang 
rnbd_srv_fill_msg_open_rsp(struct rnbd_msg_open_rsp * rsp,struct rnbd_srv_sess_dev * sess_dev)5342de6c8deSJack Wang static void rnbd_srv_fill_msg_open_rsp(struct rnbd_msg_open_rsp *rsp,
5352de6c8deSJack Wang 					struct rnbd_srv_sess_dev *sess_dev)
5362de6c8deSJack Wang {
537f7de4886SChristoph Hellwig 	struct block_device *bdev = sess_dev->bdev;
5382de6c8deSJack Wang 
5392de6c8deSJack Wang 	rsp->hdr.type = cpu_to_le16(RNBD_MSG_OPEN_RSP);
5409ad15320SChristoph Hellwig 	rsp->device_id = cpu_to_le32(sess_dev->device_id);
5419ad15320SChristoph Hellwig 	rsp->nsectors = cpu_to_le64(bdev_nr_sectors(bdev));
5429ad15320SChristoph Hellwig 	rsp->logical_block_size	= cpu_to_le16(bdev_logical_block_size(bdev));
5439ad15320SChristoph Hellwig 	rsp->physical_block_size = cpu_to_le16(bdev_physical_block_size(bdev));
5449ad15320SChristoph Hellwig 	rsp->max_segments = cpu_to_le16(bdev_max_segments(bdev));
5452de6c8deSJack Wang 	rsp->max_hw_sectors =
5469ad15320SChristoph Hellwig 		cpu_to_le32(queue_max_hw_sectors(bdev_get_queue(bdev)));
547ebd04737SChristoph Hellwig 	rsp->max_write_same_sectors = 0;
5489ad15320SChristoph Hellwig 	rsp->max_discard_sectors = cpu_to_le32(bdev_max_discard_sectors(bdev));
5499ad15320SChristoph Hellwig 	rsp->discard_granularity = cpu_to_le32(bdev_discard_granularity(bdev));
5509ad15320SChristoph Hellwig 	rsp->discard_alignment = cpu_to_le32(bdev_discard_alignment(bdev));
5519ad15320SChristoph Hellwig 	rsp->secure_discard = cpu_to_le16(bdev_max_secure_erase_sectors(bdev));
552512c781fSGioh Kim 	rsp->cache_policy = 0;
5539ad15320SChristoph Hellwig 	if (bdev_write_cache(bdev))
554512c781fSGioh Kim 		rsp->cache_policy |= RNBD_WRITEBACK;
5559ad15320SChristoph Hellwig 	if (bdev_fua(bdev))
556512c781fSGioh Kim 		rsp->cache_policy |= RNBD_FUA;
5572de6c8deSJack Wang }
5582de6c8deSJack Wang 
5592de6c8deSJack Wang static struct rnbd_srv_sess_dev *
rnbd_srv_create_set_sess_dev(struct rnbd_srv_session * srv_sess,const struct rnbd_msg_open * open_msg,struct block_device * bdev,bool readonly,struct rnbd_srv_dev * srv_dev)5602de6c8deSJack Wang rnbd_srv_create_set_sess_dev(struct rnbd_srv_session *srv_sess,
5612de6c8deSJack Wang 			      const struct rnbd_msg_open *open_msg,
56299b07780SChristoph Hellwig 			      struct block_device *bdev, bool readonly,
5632de6c8deSJack Wang 			      struct rnbd_srv_dev *srv_dev)
5642de6c8deSJack Wang {
5652de6c8deSJack Wang 	struct rnbd_srv_sess_dev *sdev = rnbd_sess_dev_alloc(srv_sess);
5662de6c8deSJack Wang 
5672de6c8deSJack Wang 	if (IS_ERR(sdev))
5682de6c8deSJack Wang 		return sdev;
5692de6c8deSJack Wang 
5702de6c8deSJack Wang 	kref_init(&sdev->kref);
5712de6c8deSJack Wang 
57257b93ed4SDima Stepanov 	strscpy(sdev->pathname, open_msg->dev_name, sizeof(sdev->pathname));
5732de6c8deSJack Wang 
574f7de4886SChristoph Hellwig 	sdev->bdev		= bdev;
5752de6c8deSJack Wang 	sdev->sess		= srv_sess;
5762de6c8deSJack Wang 	sdev->dev		= srv_dev;
57799b07780SChristoph Hellwig 	sdev->readonly		= readonly;
5782de6c8deSJack Wang 	sdev->access_mode	= open_msg->access_mode;
5792de6c8deSJack Wang 
5802de6c8deSJack Wang 	return sdev;
5812de6c8deSJack Wang }
5822de6c8deSJack Wang 
rnbd_srv_get_full_path(struct rnbd_srv_session * srv_sess,const char * dev_name)5832de6c8deSJack Wang static char *rnbd_srv_get_full_path(struct rnbd_srv_session *srv_sess,
5842de6c8deSJack Wang 				     const char *dev_name)
5852de6c8deSJack Wang {
5862de6c8deSJack Wang 	char *full_path;
5872de6c8deSJack Wang 	char *a, *b;
588*5b9ea86eSKees Cook 	int len;
5892de6c8deSJack Wang 
5902de6c8deSJack Wang 	full_path = kmalloc(PATH_MAX, GFP_KERNEL);
5912de6c8deSJack Wang 	if (!full_path)
5922de6c8deSJack Wang 		return ERR_PTR(-ENOMEM);
5932de6c8deSJack Wang 
5942de6c8deSJack Wang 	/*
5952de6c8deSJack Wang 	 * Replace %SESSNAME% with a real session name in order to
5962de6c8deSJack Wang 	 * create device namespace.
5972de6c8deSJack Wang 	 */
5982de6c8deSJack Wang 	a = strnstr(dev_search_path, "%SESSNAME%", sizeof(dev_search_path));
5992de6c8deSJack Wang 	if (a) {
600*5b9ea86eSKees Cook 		len = a - dev_search_path;
6012de6c8deSJack Wang 
6022de6c8deSJack Wang 		len = snprintf(full_path, PATH_MAX, "%.*s/%s/%s", len,
6032de6c8deSJack Wang 			       dev_search_path, srv_sess->sessname, dev_name);
604*5b9ea86eSKees Cook 	} else {
605*5b9ea86eSKees Cook 		len = snprintf(full_path, PATH_MAX, "%s/%s",
606*5b9ea86eSKees Cook 			       dev_search_path, dev_name);
607*5b9ea86eSKees Cook 	}
6082de6c8deSJack Wang 	if (len >= PATH_MAX) {
6092de6c8deSJack Wang 		pr_err("Too long path: %s, %s, %s\n",
6102de6c8deSJack Wang 		       dev_search_path, srv_sess->sessname, dev_name);
6112de6c8deSJack Wang 		kfree(full_path);
6122de6c8deSJack Wang 		return ERR_PTR(-EINVAL);
6132de6c8deSJack Wang 	}
6142de6c8deSJack Wang 
6152de6c8deSJack Wang 	/* eliminitate duplicated slashes */
6162de6c8deSJack Wang 	a = strchr(full_path, '/');
6172de6c8deSJack Wang 	b = a;
6182de6c8deSJack Wang 	while (*b != '\0') {
6192de6c8deSJack Wang 		if (*b == '/' && *a == '/') {
6202de6c8deSJack Wang 			b++;
6212de6c8deSJack Wang 		} else {
6222de6c8deSJack Wang 			a++;
6232de6c8deSJack Wang 			*a = *b;
6242de6c8deSJack Wang 			b++;
6252de6c8deSJack Wang 		}
6262de6c8deSJack Wang 	}
6272de6c8deSJack Wang 	a++;
6282de6c8deSJack Wang 	*a = '\0';
6292de6c8deSJack Wang 
6302de6c8deSJack Wang 	return full_path;
6312de6c8deSJack Wang }
6322de6c8deSJack Wang 
process_msg_sess_info(struct rnbd_srv_session * srv_sess,const void * msg,size_t len,void * data,size_t datalen)633fece685cSGuoqing Jiang static void process_msg_sess_info(struct rnbd_srv_session *srv_sess,
6342de6c8deSJack Wang 				 const void *msg, size_t len,
6352de6c8deSJack Wang 				 void *data, size_t datalen)
6362de6c8deSJack Wang {
6372de6c8deSJack Wang 	const struct rnbd_msg_sess_info *sess_info_msg = msg;
6382de6c8deSJack Wang 	struct rnbd_msg_sess_info_rsp *rsp = data;
6392de6c8deSJack Wang 
6402de6c8deSJack Wang 	srv_sess->ver = min_t(u8, sess_info_msg->ver, RNBD_PROTO_VER_MAJOR);
64174e237b6SSantosh Pradhan 
64274e237b6SSantosh Pradhan 	trace_process_msg_sess_info(srv_sess, sess_info_msg);
6432de6c8deSJack Wang 
6442de6c8deSJack Wang 	rsp->hdr.type = cpu_to_le16(RNBD_MSG_SESS_INFO_RSP);
6452de6c8deSJack Wang 	rsp->ver = srv_sess->ver;
6462de6c8deSJack Wang }
6472de6c8deSJack Wang 
6482de6c8deSJack Wang /**
6492de6c8deSJack Wang  * find_srv_sess_dev() - a dev is already opened by this name
6502de6c8deSJack Wang  * @srv_sess:	the session to search.
6512de6c8deSJack Wang  * @dev_name:	string containing the name of the device.
6522de6c8deSJack Wang  *
6532de6c8deSJack Wang  * Return struct rnbd_srv_sess_dev if srv_sess already opened the dev_name
6542de6c8deSJack Wang  * NULL if the session didn't open the device yet.
6552de6c8deSJack Wang  */
6562de6c8deSJack Wang static struct rnbd_srv_sess_dev *
find_srv_sess_dev(struct rnbd_srv_session * srv_sess,const char * dev_name)6572de6c8deSJack Wang find_srv_sess_dev(struct rnbd_srv_session *srv_sess, const char *dev_name)
6582de6c8deSJack Wang {
6592de6c8deSJack Wang 	struct rnbd_srv_sess_dev *sess_dev;
660ce11bdf9SMd Haris Iqbal 	unsigned long index;
6612de6c8deSJack Wang 
662ce11bdf9SMd Haris Iqbal 	if (xa_empty(&srv_sess->index_idr))
6632de6c8deSJack Wang 		return NULL;
6642de6c8deSJack Wang 
665ce11bdf9SMd Haris Iqbal 	xa_for_each(&srv_sess->index_idr, index, sess_dev)
6662de6c8deSJack Wang 		if (!strcmp(sess_dev->pathname, dev_name))
6672de6c8deSJack Wang 			return sess_dev;
6682de6c8deSJack Wang 
6692de6c8deSJack Wang 	return NULL;
6702de6c8deSJack Wang }
6712de6c8deSJack Wang 
process_msg_open(struct rnbd_srv_session * srv_sess,const void * msg,size_t len,void * data,size_t datalen)672c81cba85SGioh Kim static int process_msg_open(struct rnbd_srv_session *srv_sess,
6732de6c8deSJack Wang 			    const void *msg, size_t len,
6742de6c8deSJack Wang 			    void *data, size_t datalen)
6752de6c8deSJack Wang {
6762de6c8deSJack Wang 	int ret;
6772de6c8deSJack Wang 	struct rnbd_srv_dev *srv_dev;
6782de6c8deSJack Wang 	struct rnbd_srv_sess_dev *srv_sess_dev;
6792de6c8deSJack Wang 	const struct rnbd_msg_open *open_msg = msg;
680f7de4886SChristoph Hellwig 	struct block_device *bdev;
68105bdb996SChristoph Hellwig 	blk_mode_t open_flags = BLK_OPEN_READ;
6822de6c8deSJack Wang 	char *full_path;
6832de6c8deSJack Wang 	struct rnbd_msg_open_rsp *rsp = data;
6842de6c8deSJack Wang 
68574e237b6SSantosh Pradhan 	trace_process_msg_open(srv_sess, open_msg);
68674e237b6SSantosh Pradhan 
6872de6c8deSJack Wang 	if (open_msg->access_mode != RNBD_ACCESS_RO)
68805bdb996SChristoph Hellwig 		open_flags |= BLK_OPEN_WRITE;
6892de6c8deSJack Wang 
6902de6c8deSJack Wang 	mutex_lock(&srv_sess->lock);
6912de6c8deSJack Wang 
6922de6c8deSJack Wang 	srv_sess_dev = find_srv_sess_dev(srv_sess, open_msg->dev_name);
6932de6c8deSJack Wang 	if (srv_sess_dev)
6942de6c8deSJack Wang 		goto fill_response;
6952de6c8deSJack Wang 
6962de6c8deSJack Wang 	if ((strlen(dev_search_path) + strlen(open_msg->dev_name))
6972de6c8deSJack Wang 	    >= PATH_MAX) {
6982de6c8deSJack Wang 		pr_err("Opening device for session %s failed, device path too long. '%s/%s' is longer than PATH_MAX (%d)\n",
6992de6c8deSJack Wang 		       srv_sess->sessname, dev_search_path, open_msg->dev_name,
7002de6c8deSJack Wang 		       PATH_MAX);
7012de6c8deSJack Wang 		ret = -EINVAL;
7022de6c8deSJack Wang 		goto reject;
7032de6c8deSJack Wang 	}
7042de6c8deSJack Wang 	if (strstr(open_msg->dev_name, "..")) {
7052de6c8deSJack Wang 		pr_err("Opening device for session %s failed, device path %s contains relative path ..\n",
7062de6c8deSJack Wang 		       srv_sess->sessname, open_msg->dev_name);
7072de6c8deSJack Wang 		ret = -EINVAL;
7082de6c8deSJack Wang 		goto reject;
7092de6c8deSJack Wang 	}
7102de6c8deSJack Wang 	full_path = rnbd_srv_get_full_path(srv_sess, open_msg->dev_name);
7112de6c8deSJack Wang 	if (IS_ERR(full_path)) {
7122de6c8deSJack Wang 		ret = PTR_ERR(full_path);
7132de6c8deSJack Wang 		pr_err("Opening device '%s' for client %s failed, failed to get device full path, err: %d\n",
7142de6c8deSJack Wang 		       open_msg->dev_name, srv_sess->sessname, ret);
7152de6c8deSJack Wang 		goto reject;
7162de6c8deSJack Wang 	}
7172de6c8deSJack Wang 
7185ee60767SChristoph Hellwig 	bdev = blkdev_get_by_path(full_path, open_flags, NULL, NULL);
719f7de4886SChristoph Hellwig 	if (IS_ERR(bdev)) {
720f7de4886SChristoph Hellwig 		ret = PTR_ERR(bdev);
7216856b194SChristoph Hellwig 		pr_err("Opening device '%s' on session %s failed, failed to open the block device, err: %d\n",
7226856b194SChristoph Hellwig 		       full_path, srv_sess->sessname, ret);
7232de6c8deSJack Wang 		goto free_path;
7242de6c8deSJack Wang 	}
7252de6c8deSJack Wang 
726f7de4886SChristoph Hellwig 	srv_dev = rnbd_srv_get_or_create_srv_dev(bdev, srv_sess,
7272de6c8deSJack Wang 						  open_msg->access_mode);
7282de6c8deSJack Wang 	if (IS_ERR(srv_dev)) {
7292de6c8deSJack Wang 		pr_err("Opening device '%s' on session %s failed, creating srv_dev failed, err: %ld\n",
7302de6c8deSJack Wang 		       full_path, srv_sess->sessname, PTR_ERR(srv_dev));
7312de6c8deSJack Wang 		ret = PTR_ERR(srv_dev);
732f7de4886SChristoph Hellwig 		goto blkdev_put;
7332de6c8deSJack Wang 	}
7342de6c8deSJack Wang 
73599b07780SChristoph Hellwig 	srv_sess_dev = rnbd_srv_create_set_sess_dev(srv_sess, open_msg, bdev,
73699b07780SChristoph Hellwig 				open_msg->access_mode == RNBD_ACCESS_RO,
7372de6c8deSJack Wang 				srv_dev);
7382de6c8deSJack Wang 	if (IS_ERR(srv_sess_dev)) {
7392de6c8deSJack Wang 		pr_err("Opening device '%s' on session %s failed, creating sess_dev failed, err: %ld\n",
7402de6c8deSJack Wang 		       full_path, srv_sess->sessname, PTR_ERR(srv_sess_dev));
7412de6c8deSJack Wang 		ret = PTR_ERR(srv_sess_dev);
7422de6c8deSJack Wang 		goto srv_dev_put;
7432de6c8deSJack Wang 	}
7442de6c8deSJack Wang 
7452de6c8deSJack Wang 	/* Create the srv_dev sysfs files if they haven't been created yet. The
7462de6c8deSJack Wang 	 * reason to delay the creation is not to create the sysfs files before
7472de6c8deSJack Wang 	 * we are sure the device can be opened.
7482de6c8deSJack Wang 	 */
7492de6c8deSJack Wang 	mutex_lock(&srv_dev->lock);
7502de6c8deSJack Wang 	if (!srv_dev->dev_kobj.state_in_sysfs) {
751f7de4886SChristoph Hellwig 		ret = rnbd_srv_create_dev_sysfs(srv_dev, bdev);
7522de6c8deSJack Wang 		if (ret) {
7532de6c8deSJack Wang 			mutex_unlock(&srv_dev->lock);
7542de6c8deSJack Wang 			rnbd_srv_err(srv_sess_dev,
7552de6c8deSJack Wang 				      "Opening device failed, failed to create device sysfs files, err: %d\n",
7562de6c8deSJack Wang 				      ret);
7572de6c8deSJack Wang 			goto free_srv_sess_dev;
7582de6c8deSJack Wang 		}
7592de6c8deSJack Wang 	}
7602de6c8deSJack Wang 
7612de6c8deSJack Wang 	ret = rnbd_srv_create_dev_session_sysfs(srv_sess_dev);
7622de6c8deSJack Wang 	if (ret) {
7632de6c8deSJack Wang 		mutex_unlock(&srv_dev->lock);
7642de6c8deSJack Wang 		rnbd_srv_err(srv_sess_dev,
7652de6c8deSJack Wang 			      "Opening device failed, failed to create dev client sysfs files, err: %d\n",
7662de6c8deSJack Wang 			      ret);
7672de6c8deSJack Wang 		goto free_srv_sess_dev;
7682de6c8deSJack Wang 	}
7692de6c8deSJack Wang 
7702de6c8deSJack Wang 	list_add(&srv_sess_dev->dev_list, &srv_dev->sess_dev_list);
7712de6c8deSJack Wang 	mutex_unlock(&srv_dev->lock);
7722de6c8deSJack Wang 
7733ecdbf91SGuoqing Jiang 	rnbd_srv_info(srv_sess_dev, "Opened device '%s'\n", srv_dev->name);
7742de6c8deSJack Wang 
7752de6c8deSJack Wang 	kfree(full_path);
7762de6c8deSJack Wang 
7772de6c8deSJack Wang fill_response:
7782de6c8deSJack Wang 	rnbd_srv_fill_msg_open_rsp(rsp, srv_sess_dev);
7792de6c8deSJack Wang 	mutex_unlock(&srv_sess->lock);
7802de6c8deSJack Wang 	return 0;
7812de6c8deSJack Wang 
7822de6c8deSJack Wang free_srv_sess_dev:
7832de6c8deSJack Wang 	xa_erase(&srv_sess->index_idr, srv_sess_dev->device_id);
7842de6c8deSJack Wang 	synchronize_rcu();
7852de6c8deSJack Wang 	kfree(srv_sess_dev);
7862de6c8deSJack Wang srv_dev_put:
7872de6c8deSJack Wang 	if (open_msg->access_mode != RNBD_ACCESS_RO) {
7882de6c8deSJack Wang 		mutex_lock(&srv_dev->lock);
7892de6c8deSJack Wang 		srv_dev->open_write_cnt--;
7902de6c8deSJack Wang 		mutex_unlock(&srv_dev->lock);
7912de6c8deSJack Wang 	}
7922de6c8deSJack Wang 	rnbd_put_srv_dev(srv_dev);
793f7de4886SChristoph Hellwig blkdev_put:
7942736e8eeSChristoph Hellwig 	blkdev_put(bdev, NULL);
7952de6c8deSJack Wang free_path:
7962de6c8deSJack Wang 	kfree(full_path);
7972de6c8deSJack Wang reject:
7982de6c8deSJack Wang 	mutex_unlock(&srv_sess->lock);
7992de6c8deSJack Wang 	return ret;
8002de6c8deSJack Wang }
8012de6c8deSJack Wang 
8022de6c8deSJack Wang static struct rtrs_srv_ctx *rtrs_ctx;
8032de6c8deSJack Wang 
8042de6c8deSJack Wang static struct rtrs_srv_ops rtrs_ops;
rnbd_srv_init_module(void)8052de6c8deSJack Wang static int __init rnbd_srv_init_module(void)
8062de6c8deSJack Wang {
807d3fc0b46SGuoqing Jiang 	int err = 0;
8082de6c8deSJack Wang 
8092de6c8deSJack Wang 	BUILD_BUG_ON(sizeof(struct rnbd_msg_hdr) != 4);
8102de6c8deSJack Wang 	BUILD_BUG_ON(sizeof(struct rnbd_msg_sess_info) != 36);
8112de6c8deSJack Wang 	BUILD_BUG_ON(sizeof(struct rnbd_msg_sess_info_rsp) != 36);
8122de6c8deSJack Wang 	BUILD_BUG_ON(sizeof(struct rnbd_msg_open) != 264);
8132de6c8deSJack Wang 	BUILD_BUG_ON(sizeof(struct rnbd_msg_close) != 8);
8142de6c8deSJack Wang 	BUILD_BUG_ON(sizeof(struct rnbd_msg_open_rsp) != 56);
8152de6c8deSJack Wang 	rtrs_ops = (struct rtrs_srv_ops) {
8162de6c8deSJack Wang 		.rdma_ev = rnbd_srv_rdma_ev,
8172de6c8deSJack Wang 		.link_ev = rnbd_srv_link_ev,
8182de6c8deSJack Wang 	};
8192de6c8deSJack Wang 	rtrs_ctx = rtrs_srv_open(&rtrs_ops, port_nr);
8202de6c8deSJack Wang 	if (IS_ERR(rtrs_ctx)) {
8212de6c8deSJack Wang 		pr_err("rtrs_srv_open(), err: %d\n", err);
822d3fc0b46SGuoqing Jiang 		return PTR_ERR(rtrs_ctx);
8232de6c8deSJack Wang 	}
8242de6c8deSJack Wang 
8252de6c8deSJack Wang 	err = rnbd_srv_create_sysfs_files();
8262de6c8deSJack Wang 	if (err) {
8272de6c8deSJack Wang 		pr_err("rnbd_srv_create_sysfs_files(), err: %d\n", err);
8282de6c8deSJack Wang 		rtrs_srv_close(rtrs_ctx);
8292de6c8deSJack Wang 	}
8302de6c8deSJack Wang 
831d3fc0b46SGuoqing Jiang 	return err;
8322de6c8deSJack Wang }
8332de6c8deSJack Wang 
rnbd_srv_cleanup_module(void)8342de6c8deSJack Wang static void __exit rnbd_srv_cleanup_module(void)
8352de6c8deSJack Wang {
8362de6c8deSJack Wang 	rtrs_srv_close(rtrs_ctx);
8372de6c8deSJack Wang 	WARN_ON(!list_empty(&sess_list));
8382de6c8deSJack Wang 	rnbd_srv_destroy_sysfs_files();
8392de6c8deSJack Wang }
8402de6c8deSJack Wang 
8412de6c8deSJack Wang module_init(rnbd_srv_init_module);
8422de6c8deSJack Wang module_exit(rnbd_srv_cleanup_module);
843