xref: /openbmc/linux/drivers/block/rnbd/rnbd-proto.h (revision 1ac731c529cd4d6adbce134754b51ff7d822b145)
/* SPDX-License-Identifier: GPL-2.0-or-later */
/*
 * RDMA Network Block Driver
 *
 * Copyright (c) 2014 - 2018 ProfitBricks GmbH. All rights reserved.
 * Copyright (c) 2018 - 2019 1&1 IONOS Cloud GmbH. All rights reserved.
 * Copyright (c) 2019 - 2020 1&1 IONOS SE. All rights reserved.
 */
9219ace60SJack Wang #ifndef RNBD_PROTO_H
10219ace60SJack Wang #define RNBD_PROTO_H
11219ace60SJack Wang 
12219ace60SJack Wang #include <linux/types.h>
1324b83debSChristoph Hellwig #include <linux/blk-mq.h>
14219ace60SJack Wang #include <linux/limits.h>
15219ace60SJack Wang #include <linux/inet.h>
16219ace60SJack Wang #include <linux/in.h>
17219ace60SJack Wang #include <linux/in6.h>
18219ace60SJack Wang #include <rdma/ib.h>
19219ace60SJack Wang 
/* RNBD protocol version, split into a major and a minor number. */
#define RNBD_PROTO_VER_MAJOR 2
#define RNBD_PROTO_VER_MINOR 0

/* The default port number the RTRS server is listening on. */
#define RTRS_PORT 1234
25219ace60SJack Wang 
/**
 * enum rnbd_msg_type - RNBD message types
 * @RNBD_MSG_SESS_INFO:		initial session info from client to server
 * @RNBD_MSG_SESS_INFO_RSP:	initial session info from server to client
 * @RNBD_MSG_OPEN:		open (map) device request
 * @RNBD_MSG_OPEN_RSP:		response to an @RNBD_MSG_OPEN
 * @RNBD_MSG_IO:		block IO request operation
 * @RNBD_MSG_CLOSE:		close (unmap) device request
 *
 * The enumerators are numbered implicitly from 0 in declaration order.
 */
enum rnbd_msg_type {
	RNBD_MSG_SESS_INFO,
	RNBD_MSG_SESS_INFO_RSP,
	RNBD_MSG_OPEN,
	RNBD_MSG_OPEN_RSP,
	RNBD_MSG_IO,
	RNBD_MSG_CLOSE,
};
43219ace60SJack Wang 
44219ace60SJack Wang /**
45219ace60SJack Wang  * struct rnbd_msg_hdr - header of RNBD messages
46219ace60SJack Wang  * @type:	Message type, valid values see: enum rnbd_msg_types
47219ace60SJack Wang  */
48219ace60SJack Wang struct rnbd_msg_hdr {
49219ace60SJack Wang 	__le16		type;
50219ace60SJack Wang 	__le16		__padding;
51219ace60SJack Wang };
52219ace60SJack Wang 
/**
 * enum rnbd_access_mode - access mode requested when mapping a device
 * @RNBD_ACCESS_RO:		read-only mapping
 * @RNBD_ACCESS_RW:		read-write mapping
 * @RNBD_ACCESS_MIGRATION:	additional read-write mapping, see below
 *
 * We allow to map RO many times and RW only once. We allow to map yet another
 * time RW, if MIGRATION is provided (second RW export can be required for
 * example for VM migration)
 */
enum rnbd_access_mode {
	RNBD_ACCESS_RO,
	RNBD_ACCESS_RW,
	RNBD_ACCESS_MIGRATION,
};
63219ace60SJack Wang 
64219ace60SJack Wang static const __maybe_unused struct {
65219ace60SJack Wang 	enum rnbd_access_mode mode;
66219ace60SJack Wang 	const char *str;
67219ace60SJack Wang } rnbd_access_modes[] = {
68219ace60SJack Wang 	[RNBD_ACCESS_RO] = {RNBD_ACCESS_RO, "ro"},
69219ace60SJack Wang 	[RNBD_ACCESS_RW] = {RNBD_ACCESS_RW, "rw"},
70219ace60SJack Wang 	[RNBD_ACCESS_MIGRATION] = {RNBD_ACCESS_MIGRATION, "migration"},
71219ace60SJack Wang };
72219ace60SJack Wang 
73219ace60SJack Wang /**
74219ace60SJack Wang  * struct rnbd_msg_sess_info - initial session info from client to server
75219ace60SJack Wang  * @hdr:		message header
76219ace60SJack Wang  * @ver:		RNBD protocol version
77219ace60SJack Wang  */
78219ace60SJack Wang struct rnbd_msg_sess_info {
79219ace60SJack Wang 	struct rnbd_msg_hdr hdr;
80219ace60SJack Wang 	u8		ver;
81219ace60SJack Wang 	u8		reserved[31];
82219ace60SJack Wang };
83219ace60SJack Wang 
84219ace60SJack Wang /**
85219ace60SJack Wang  * struct rnbd_msg_sess_info_rsp - initial session info from server to client
86219ace60SJack Wang  * @hdr:		message header
87219ace60SJack Wang  * @ver:		RNBD protocol version
88219ace60SJack Wang  */
89219ace60SJack Wang struct rnbd_msg_sess_info_rsp {
90219ace60SJack Wang 	struct rnbd_msg_hdr hdr;
91219ace60SJack Wang 	u8		ver;
92219ace60SJack Wang 	u8		reserved[31];
93219ace60SJack Wang };
94219ace60SJack Wang 
95219ace60SJack Wang /**
96219ace60SJack Wang  * struct rnbd_msg_open - request to open a remote device.
97219ace60SJack Wang  * @hdr:		message header
98219ace60SJack Wang  * @access_mode:	the mode to open remote device, valid values see:
99219ace60SJack Wang  *			enum rnbd_access_mode
100219ace60SJack Wang  * @device_name:	device path on remote side
101219ace60SJack Wang  */
102219ace60SJack Wang struct rnbd_msg_open {
103219ace60SJack Wang 	struct rnbd_msg_hdr hdr;
104219ace60SJack Wang 	u8		access_mode;
105219ace60SJack Wang 	u8		resv1;
106219ace60SJack Wang 	s8		dev_name[NAME_MAX];
107219ace60SJack Wang 	u8		reserved[3];
108219ace60SJack Wang };
109219ace60SJack Wang 
110219ace60SJack Wang /**
111512c781fSGioh Kim  * struct rnbd_msg_close - request to close a remote device.
112512c781fSGioh Kim  * @hdr:	message header
113512c781fSGioh Kim  * @device_id:	device_id on server side to identify the device
114512c781fSGioh Kim  */
115512c781fSGioh Kim struct rnbd_msg_close {
116219ace60SJack Wang 	struct rnbd_msg_hdr hdr;
117219ace60SJack Wang 	__le32		device_id;
118219ace60SJack Wang };
119219ace60SJack Wang 
/**
 * enum rnbd_cache_policy - cache capability bits
 * @RNBD_FUA:		bit 0
 * @RNBD_WRITEBACK:	bit 1
 *
 * Each value is a distinct single bit, so the values can be OR-ed together.
 * NOTE(review): presumably the bits carried in the cache_policy field of
 * struct rnbd_msg_open_rsp ("support write-back caching or FUA?") - confirm.
 */
enum rnbd_cache_policy {
	RNBD_FUA	= 1 << 0,
	RNBD_WRITEBACK	= 1 << 1,
};
124219ace60SJack Wang 
125219ace60SJack Wang /**
126219ace60SJack Wang  * struct rnbd_msg_open_rsp - response message to RNBD_MSG_OPEN
127219ace60SJack Wang  * @hdr:		message header
128219ace60SJack Wang  * @device_id:		device_id on server side to identify the device
129219ace60SJack Wang  * @nsectors:		number of sectors in the usual 512b unit
130219ace60SJack Wang  * @max_hw_sectors:	max hardware sectors in the usual 512b unit
131030ce8baSGioh Kim  * @max_write_same_sectors: max sectors for WRITE SAME in the 512b unit
132512c781fSGioh Kim  * @max_discard_sectors: max. sectors that can be discarded at once in 512b
133219ace60SJack Wang  * unit.
134219ace60SJack Wang  * @discard_granularity: size of the internal discard allocation unit in bytes
135219ace60SJack Wang  * @discard_alignment: offset from internal allocation assignment in bytes
136219ace60SJack Wang  * @physical_block_size: physical block size device supports in bytes
137219ace60SJack Wang  * @logical_block_size: logical block size device supports in bytes
138219ace60SJack Wang  * @max_segments:	max segments hardware support in one transfer
139219ace60SJack Wang  * @secure_discard:	supports secure discard
140219ace60SJack Wang  * @obsolete_rotational: obsolete, not in used.
141219ace60SJack Wang  * @cache_policy: 	support write-back caching or FUA?
142219ace60SJack Wang  */
143219ace60SJack Wang struct rnbd_msg_open_rsp {
144219ace60SJack Wang 	struct rnbd_msg_hdr	hdr;
145219ace60SJack Wang 	__le32			device_id;
146219ace60SJack Wang 	__le64			nsectors;
147030ce8baSGioh Kim 	__le32			max_hw_sectors;
148512c781fSGioh Kim 	__le32			max_write_same_sectors;
149512c781fSGioh Kim 	__le32			max_discard_sectors;
150219ace60SJack Wang 	__le32			discard_granularity;
151219ace60SJack Wang 	__le32			discard_alignment;
152219ace60SJack Wang 	__le16			physical_block_size;
153219ace60SJack Wang 	__le16			logical_block_size;
154219ace60SJack Wang 	__le16			max_segments;
155219ace60SJack Wang 	__le16			secure_discard;
156219ace60SJack Wang 	u8			obsolete_rotational;
157219ace60SJack Wang 	u8			cache_policy;
158219ace60SJack Wang 	u8			reserved[10];
159219ace60SJack Wang };
160219ace60SJack Wang 
161219ace60SJack Wang /**
162219ace60SJack Wang  * struct rnbd_msg_io - message for I/O read/write
163219ace60SJack Wang  * @hdr:	message header
164219ace60SJack Wang  * @device_id:	device_id on server side to find the right device
165219ace60SJack Wang  * @sector:	bi_sector attribute from struct bio
166219ace60SJack Wang  * @rw:		valid values are defined in enum rnbd_io_flags
167219ace60SJack Wang  * @bi_size:    number of bytes for I/O read/write
168219ace60SJack Wang  * @prio:       priority
169219ace60SJack Wang  */
170219ace60SJack Wang struct rnbd_msg_io {
171219ace60SJack Wang 	struct rnbd_msg_hdr hdr;
172219ace60SJack Wang 	__le32		device_id;
173219ace60SJack Wang 	__le64		sector;
174219ace60SJack Wang 	__le32		rw;
175219ace60SJack Wang 	__le32		bi_size;
176219ace60SJack Wang 	__le16		prio;
177219ace60SJack Wang };
178219ace60SJack Wang 
/*
 * The low RNBD_OP_BITS bits of an RNBD flags word hold the operation code;
 * RNBD_OP_MASK selects exactly those bits.
 */
#define RNBD_OP_BITS  8
#define RNBD_OP_MASK  ((1 << RNBD_OP_BITS) - 1)
181219ace60SJack Wang 
182219ace60SJack Wang /**
183219ace60SJack Wang  * enum rnbd_io_flags - RNBD request types from rq_flag_bits
184219ace60SJack Wang  * @RNBD_OP_READ:	     read sectors from the device
185219ace60SJack Wang  * @RNBD_OP_WRITE:	     write sectors to the device
186219ace60SJack Wang  * @RNBD_OP_FLUSH:	     flush the volatile write cache
187219ace60SJack Wang  * @RNBD_OP_DISCARD:        discard sectors
188219ace60SJack Wang  * @RNBD_OP_SECURE_ERASE:   securely erase sectors
189219ace60SJack Wang  * @RNBD_OP_WRITE_SAME:     write the same sectors many times
190219ace60SJack Wang 
191219ace60SJack Wang  * @RNBD_F_SYNC:	     request is sync (sync write or read)
192219ace60SJack Wang  * @RNBD_F_FUA:             forced unit access
193219ace60SJack Wang  */
194219ace60SJack Wang enum rnbd_io_flags {
195219ace60SJack Wang 
196219ace60SJack Wang 	/* Operations */
197219ace60SJack Wang 	RNBD_OP_READ		= 0,
198219ace60SJack Wang 	RNBD_OP_WRITE		= 1,
199219ace60SJack Wang 	RNBD_OP_FLUSH		= 2,
200219ace60SJack Wang 	RNBD_OP_DISCARD	= 3,
201219ace60SJack Wang 	RNBD_OP_SECURE_ERASE	= 4,
202219ace60SJack Wang 	RNBD_OP_WRITE_SAME	= 5,
203219ace60SJack Wang 
204219ace60SJack Wang 	/* Flags */
205219ace60SJack Wang 	RNBD_F_SYNC  = 1<<(RNBD_OP_BITS + 0),
206219ace60SJack Wang 	RNBD_F_FUA   = 1<<(RNBD_OP_BITS + 1),
207219ace60SJack Wang };
208219ace60SJack Wang 
/**
 * rnbd_op() - extract the operation code from an RNBD flags word
 * @flags:	combined operation and flag bits
 *
 * Return: @flags with everything except the RNBD_OP_MASK bits cleared.
 */
static inline u32 rnbd_op(u32 flags)
{
	return flags & RNBD_OP_MASK;
}
213219ace60SJack Wang 
/**
 * rnbd_flags() - extract the flag bits from an RNBD flags word
 * @flags:	combined operation and flag bits
 *
 * Return: @flags with the RNBD_OP_MASK bits cleared.
 */
static inline u32 rnbd_flags(u32 flags)
{
	return flags & ~RNBD_OP_MASK;
}
218219ace60SJack Wang 
rnbd_to_bio_flags(u32 rnbd_opf)219219ace60SJack Wang static inline blk_opf_t rnbd_to_bio_flags(u32 rnbd_opf)
220219ace60SJack Wang {
221219ace60SJack Wang 	blk_opf_t bio_opf;
222219ace60SJack Wang 
223219ace60SJack Wang 	switch (rnbd_op(rnbd_opf)) {
224219ace60SJack Wang 	case RNBD_OP_READ:
225219ace60SJack Wang 		bio_opf = REQ_OP_READ;
226219ace60SJack Wang 		break;
227219ace60SJack Wang 	case RNBD_OP_WRITE:
228219ace60SJack Wang 		bio_opf = REQ_OP_WRITE;
229219ace60SJack Wang 		break;
230219ace60SJack Wang 	case RNBD_OP_FLUSH:
231219ace60SJack Wang 		bio_opf = REQ_OP_WRITE | REQ_PREFLUSH;
23203df83acSBart Van Assche 		break;
233219ace60SJack Wang 	case RNBD_OP_DISCARD:
23403df83acSBart Van Assche 		bio_opf = REQ_OP_DISCARD;
235219ace60SJack Wang 		break;
236219ace60SJack Wang 	case RNBD_OP_SECURE_ERASE:
237219ace60SJack Wang 		bio_opf = REQ_OP_SECURE_ERASE;
238219ace60SJack Wang 		break;
239219ace60SJack Wang 	default:
240219ace60SJack Wang 		WARN(1, "Unknown RNBD type: %d (flags %d)\n",
241219ace60SJack Wang 		     rnbd_op(rnbd_opf), rnbd_opf);
242219ace60SJack Wang 		bio_opf = 0;
243219ace60SJack Wang 	}
244*5e6e0808SGuoqing Jiang 
245219ace60SJack Wang 	if (rnbd_opf & RNBD_F_SYNC)
246219ace60SJack Wang 		bio_opf |= REQ_SYNC;
247219ace60SJack Wang 
248219ace60SJack Wang 	if (rnbd_opf & RNBD_F_FUA)
249219ace60SJack Wang 		bio_opf |= REQ_FUA;
250219ace60SJack Wang 
251219ace60SJack Wang 	return bio_opf;
252219ace60SJack Wang }
253219ace60SJack Wang 
rq_to_rnbd_flags(struct request * rq)254219ace60SJack Wang static inline u32 rq_to_rnbd_flags(struct request *rq)
255219ace60SJack Wang {
256219ace60SJack Wang 	u32 rnbd_opf;
257219ace60SJack Wang 
258219ace60SJack Wang 	switch (req_op(rq)) {
259219ace60SJack Wang 	case REQ_OP_READ:
260219ace60SJack Wang 		rnbd_opf = RNBD_OP_READ;
261219ace60SJack Wang 		break;
262219ace60SJack Wang 	case REQ_OP_WRITE:
263219ace60SJack Wang 		rnbd_opf = RNBD_OP_WRITE;
264219ace60SJack Wang 		break;
265219ace60SJack Wang 	case REQ_OP_DISCARD:
266219ace60SJack Wang 		rnbd_opf = RNBD_OP_DISCARD;
267219ace60SJack Wang 		break;
268219ace60SJack Wang 	case REQ_OP_SECURE_ERASE:
269219ace60SJack Wang 		rnbd_opf = RNBD_OP_SECURE_ERASE;
270219ace60SJack Wang 		break;
271219ace60SJack Wang 	case REQ_OP_FLUSH:
272219ace60SJack Wang 		rnbd_opf = RNBD_OP_FLUSH;
273219ace60SJack Wang 		break;
274219ace60SJack Wang 	default:
275219ace60SJack Wang 		WARN(1, "Unknown request type %d (flags %llu)\n",
276219ace60SJack Wang 		     (__force u32)req_op(rq),
277219ace60SJack Wang 		     (__force unsigned long long)rq->cmd_flags);
278219ace60SJack Wang 		rnbd_opf = 0;
279219ace60SJack Wang 	}
280219ace60SJack Wang 
281219ace60SJack Wang 	if (op_is_sync(rq->cmd_flags))
282219ace60SJack Wang 		rnbd_opf |= RNBD_F_SYNC;
283219ace60SJack Wang 
284219ace60SJack Wang 	if (op_is_flush(rq->cmd_flags))
285219ace60SJack Wang 		rnbd_opf |= RNBD_F_FUA;
286219ace60SJack Wang 
287219ace60SJack Wang 	return rnbd_opf;
288219ace60SJack Wang }
28903df83acSBart Van Assche 
/*
 * Declared here, defined outside this header.
 * NOTE(review): presumably returns the textual name of @mode (cf. the
 * rnbd_access_modes table) - confirm against the definition.
 */
const char *rnbd_access_mode_str(enum rnbd_access_mode mode);
291219ace60SJack Wang 
292219ace60SJack Wang #endif /* RNBD_PROTO_H */
293219ace60SJack Wang