/* SPDX-License-Identifier: GPL-2.0-or-later */
/*
 * RDMA Network Block Driver
 *
 * Copyright (c) 2014 - 2018 ProfitBricks GmbH. All rights reserved.
 * Copyright (c) 2018 - 2019 1&1 IONOS Cloud GmbH. All rights reserved.
 * Copyright (c) 2019 - 2020 1&1 IONOS SE. All rights reserved.
 */
#ifndef RNBD_PROTO_H
#define RNBD_PROTO_H

#include <linux/types.h>
#include <linux/blk-mq.h>
#include <linux/limits.h>
#include <linux/inet.h>
#include <linux/in.h>
#include <linux/in6.h>
#include <rdma/ib.h>

/* RNBD protocol version, split into its major and minor parts. */
#define RNBD_PROTO_VER_MAJOR 2
#define RNBD_PROTO_VER_MINOR 0

/* The default port number the RTRS server is listening on. */
#define RTRS_PORT 1234

/**
 * enum rnbd_msg_type - RNBD message types
 * @RNBD_MSG_SESS_INFO:	initial session info from client to server
 * @RNBD_MSG_SESS_INFO_RSP:	initial session info from server to client
 * @RNBD_MSG_OPEN:		open (map) device request
 * @RNBD_MSG_OPEN_RSP:		response to an @RNBD_MSG_OPEN
 * @RNBD_MSG_IO:		block IO request operation
 * @RNBD_MSG_CLOSE:		close (unmap) device request
 *
 * The enumerators rely on implicit numbering starting at 0, so their order
 * determines their numeric values.
 */
enum rnbd_msg_type {
	RNBD_MSG_SESS_INFO,
	RNBD_MSG_SESS_INFO_RSP,
	RNBD_MSG_OPEN,
	RNBD_MSG_OPEN_RSP,
	RNBD_MSG_IO,
	RNBD_MSG_CLOSE,
};

44219ace60SJack Wang /**
45219ace60SJack Wang * struct rnbd_msg_hdr - header of RNBD messages
46219ace60SJack Wang * @type: Message type, valid values see: enum rnbd_msg_types
47219ace60SJack Wang */
48219ace60SJack Wang struct rnbd_msg_hdr {
49219ace60SJack Wang __le16 type;
50219ace60SJack Wang __le16 __padding;
51219ace60SJack Wang };
52219ace60SJack Wang
/**
 * enum rnbd_access_mode - mode in which a remote device is mapped
 * @RNBD_ACCESS_RO:		read-only; a device may be mapped RO many times
 * @RNBD_ACCESS_RW:		read-write; a device may be mapped RW only once
 * @RNBD_ACCESS_MIGRATION:	allows mapping the device RW yet another time
 *				(a second RW export can be required, for
 *				example, for VM migration)
 */
enum rnbd_access_mode {
	RNBD_ACCESS_RO,
	RNBD_ACCESS_RW,
	RNBD_ACCESS_MIGRATION,
};

64219ace60SJack Wang static const __maybe_unused struct {
65219ace60SJack Wang enum rnbd_access_mode mode;
66219ace60SJack Wang const char *str;
67219ace60SJack Wang } rnbd_access_modes[] = {
68219ace60SJack Wang [RNBD_ACCESS_RO] = {RNBD_ACCESS_RO, "ro"},
69219ace60SJack Wang [RNBD_ACCESS_RW] = {RNBD_ACCESS_RW, "rw"},
70219ace60SJack Wang [RNBD_ACCESS_MIGRATION] = {RNBD_ACCESS_MIGRATION, "migration"},
71219ace60SJack Wang };
72219ace60SJack Wang
73219ace60SJack Wang /**
74219ace60SJack Wang * struct rnbd_msg_sess_info - initial session info from client to server
75219ace60SJack Wang * @hdr: message header
76219ace60SJack Wang * @ver: RNBD protocol version
77219ace60SJack Wang */
78219ace60SJack Wang struct rnbd_msg_sess_info {
79219ace60SJack Wang struct rnbd_msg_hdr hdr;
80219ace60SJack Wang u8 ver;
81219ace60SJack Wang u8 reserved[31];
82219ace60SJack Wang };
83219ace60SJack Wang
84219ace60SJack Wang /**
85219ace60SJack Wang * struct rnbd_msg_sess_info_rsp - initial session info from server to client
86219ace60SJack Wang * @hdr: message header
87219ace60SJack Wang * @ver: RNBD protocol version
88219ace60SJack Wang */
89219ace60SJack Wang struct rnbd_msg_sess_info_rsp {
90219ace60SJack Wang struct rnbd_msg_hdr hdr;
91219ace60SJack Wang u8 ver;
92219ace60SJack Wang u8 reserved[31];
93219ace60SJack Wang };
94219ace60SJack Wang
95219ace60SJack Wang /**
96219ace60SJack Wang * struct rnbd_msg_open - request to open a remote device.
97219ace60SJack Wang * @hdr: message header
98219ace60SJack Wang * @access_mode: the mode to open remote device, valid values see:
99219ace60SJack Wang * enum rnbd_access_mode
100219ace60SJack Wang * @device_name: device path on remote side
101219ace60SJack Wang */
102219ace60SJack Wang struct rnbd_msg_open {
103219ace60SJack Wang struct rnbd_msg_hdr hdr;
104219ace60SJack Wang u8 access_mode;
105219ace60SJack Wang u8 resv1;
106219ace60SJack Wang s8 dev_name[NAME_MAX];
107219ace60SJack Wang u8 reserved[3];
108219ace60SJack Wang };
109219ace60SJack Wang
110219ace60SJack Wang /**
111512c781fSGioh Kim * struct rnbd_msg_close - request to close a remote device.
112512c781fSGioh Kim * @hdr: message header
113512c781fSGioh Kim * @device_id: device_id on server side to identify the device
114512c781fSGioh Kim */
115512c781fSGioh Kim struct rnbd_msg_close {
116219ace60SJack Wang struct rnbd_msg_hdr hdr;
117219ace60SJack Wang __le32 device_id;
118219ace60SJack Wang };
119219ace60SJack Wang
/**
 * enum rnbd_cache_policy - cache policy bits
 * @RNBD_FUA:		bit 0, FUA
 * @RNBD_WRITEBACK:	bit 1, write-back caching
 *
 * Each value is a distinct single bit, so the two can be OR-ed together.
 * These appear to be the values reported in the cache_policy field of
 * struct rnbd_msg_open_rsp ("support write-back caching or FUA?").
 */
enum rnbd_cache_policy {
	RNBD_FUA = 1 << 0,
	RNBD_WRITEBACK = 1 << 1,
};

125219ace60SJack Wang /**
126219ace60SJack Wang * struct rnbd_msg_open_rsp - response message to RNBD_MSG_OPEN
127219ace60SJack Wang * @hdr: message header
128219ace60SJack Wang * @device_id: device_id on server side to identify the device
129219ace60SJack Wang * @nsectors: number of sectors in the usual 512b unit
130219ace60SJack Wang * @max_hw_sectors: max hardware sectors in the usual 512b unit
131030ce8baSGioh Kim * @max_write_same_sectors: max sectors for WRITE SAME in the 512b unit
132512c781fSGioh Kim * @max_discard_sectors: max. sectors that can be discarded at once in 512b
133219ace60SJack Wang * unit.
134219ace60SJack Wang * @discard_granularity: size of the internal discard allocation unit in bytes
135219ace60SJack Wang * @discard_alignment: offset from internal allocation assignment in bytes
136219ace60SJack Wang * @physical_block_size: physical block size device supports in bytes
137219ace60SJack Wang * @logical_block_size: logical block size device supports in bytes
138219ace60SJack Wang * @max_segments: max segments hardware support in one transfer
139219ace60SJack Wang * @secure_discard: supports secure discard
140219ace60SJack Wang * @obsolete_rotational: obsolete, not in used.
141219ace60SJack Wang * @cache_policy: support write-back caching or FUA?
142219ace60SJack Wang */
143219ace60SJack Wang struct rnbd_msg_open_rsp {
144219ace60SJack Wang struct rnbd_msg_hdr hdr;
145219ace60SJack Wang __le32 device_id;
146219ace60SJack Wang __le64 nsectors;
147030ce8baSGioh Kim __le32 max_hw_sectors;
148512c781fSGioh Kim __le32 max_write_same_sectors;
149512c781fSGioh Kim __le32 max_discard_sectors;
150219ace60SJack Wang __le32 discard_granularity;
151219ace60SJack Wang __le32 discard_alignment;
152219ace60SJack Wang __le16 physical_block_size;
153219ace60SJack Wang __le16 logical_block_size;
154219ace60SJack Wang __le16 max_segments;
155219ace60SJack Wang __le16 secure_discard;
156219ace60SJack Wang u8 obsolete_rotational;
157219ace60SJack Wang u8 cache_policy;
158219ace60SJack Wang u8 reserved[10];
159219ace60SJack Wang };
160219ace60SJack Wang
161219ace60SJack Wang /**
162219ace60SJack Wang * struct rnbd_msg_io - message for I/O read/write
163219ace60SJack Wang * @hdr: message header
164219ace60SJack Wang * @device_id: device_id on server side to find the right device
165219ace60SJack Wang * @sector: bi_sector attribute from struct bio
166219ace60SJack Wang * @rw: valid values are defined in enum rnbd_io_flags
167219ace60SJack Wang * @bi_size: number of bytes for I/O read/write
168219ace60SJack Wang * @prio: priority
169219ace60SJack Wang */
170219ace60SJack Wang struct rnbd_msg_io {
171219ace60SJack Wang struct rnbd_msg_hdr hdr;
172219ace60SJack Wang __le32 device_id;
173219ace60SJack Wang __le64 sector;
174219ace60SJack Wang __le32 rw;
175219ace60SJack Wang __le32 bi_size;
176219ace60SJack Wang __le16 prio;
177219ace60SJack Wang };
178219ace60SJack Wang
/*
 * The low RNBD_OP_BITS bits of an RNBD I/O flags word hold the operation;
 * the bits above them hold the modifier flags.
 */
#define RNBD_OP_BITS  8
#define RNBD_OP_MASK  ((1 << RNBD_OP_BITS) - 1)

182219ace60SJack Wang /**
183219ace60SJack Wang * enum rnbd_io_flags - RNBD request types from rq_flag_bits
184219ace60SJack Wang * @RNBD_OP_READ: read sectors from the device
185219ace60SJack Wang * @RNBD_OP_WRITE: write sectors to the device
186219ace60SJack Wang * @RNBD_OP_FLUSH: flush the volatile write cache
187219ace60SJack Wang * @RNBD_OP_DISCARD: discard sectors
188219ace60SJack Wang * @RNBD_OP_SECURE_ERASE: securely erase sectors
189219ace60SJack Wang * @RNBD_OP_WRITE_SAME: write the same sectors many times
190219ace60SJack Wang
191219ace60SJack Wang * @RNBD_F_SYNC: request is sync (sync write or read)
192219ace60SJack Wang * @RNBD_F_FUA: forced unit access
193219ace60SJack Wang */
194219ace60SJack Wang enum rnbd_io_flags {
195219ace60SJack Wang
196219ace60SJack Wang /* Operations */
197219ace60SJack Wang RNBD_OP_READ = 0,
198219ace60SJack Wang RNBD_OP_WRITE = 1,
199219ace60SJack Wang RNBD_OP_FLUSH = 2,
200219ace60SJack Wang RNBD_OP_DISCARD = 3,
201219ace60SJack Wang RNBD_OP_SECURE_ERASE = 4,
202219ace60SJack Wang RNBD_OP_WRITE_SAME = 5,
203219ace60SJack Wang
204219ace60SJack Wang /* Flags */
205219ace60SJack Wang RNBD_F_SYNC = 1<<(RNBD_OP_BITS + 0),
206219ace60SJack Wang RNBD_F_FUA = 1<<(RNBD_OP_BITS + 1),
207219ace60SJack Wang };
208219ace60SJack Wang
/**
 * rnbd_op() - extract the operation from an RNBD flags word
 * @flags:	RNBD operation and flags, see enum rnbd_io_flags
 *
 * Return: the bits of @flags selected by RNBD_OP_MASK.
 */
static inline u32 rnbd_op(u32 flags)
{
	return flags & RNBD_OP_MASK;
}

/**
 * rnbd_flags() - extract the modifier flags from an RNBD flags word
 * @flags:	RNBD operation and flags, see enum rnbd_io_flags
 *
 * Return: @flags with the bits selected by RNBD_OP_MASK cleared.
 */
static inline u32 rnbd_flags(u32 flags)
{
	return flags & ~RNBD_OP_MASK;
}

rnbd_to_bio_flags(u32 rnbd_opf)219219ace60SJack Wang static inline blk_opf_t rnbd_to_bio_flags(u32 rnbd_opf)
220219ace60SJack Wang {
221219ace60SJack Wang blk_opf_t bio_opf;
222219ace60SJack Wang
223219ace60SJack Wang switch (rnbd_op(rnbd_opf)) {
224219ace60SJack Wang case RNBD_OP_READ:
225219ace60SJack Wang bio_opf = REQ_OP_READ;
226219ace60SJack Wang break;
227219ace60SJack Wang case RNBD_OP_WRITE:
228219ace60SJack Wang bio_opf = REQ_OP_WRITE;
229219ace60SJack Wang break;
230219ace60SJack Wang case RNBD_OP_FLUSH:
231219ace60SJack Wang bio_opf = REQ_OP_WRITE | REQ_PREFLUSH;
23203df83acSBart Van Assche break;
233219ace60SJack Wang case RNBD_OP_DISCARD:
23403df83acSBart Van Assche bio_opf = REQ_OP_DISCARD;
235219ace60SJack Wang break;
236219ace60SJack Wang case RNBD_OP_SECURE_ERASE:
237219ace60SJack Wang bio_opf = REQ_OP_SECURE_ERASE;
238219ace60SJack Wang break;
239219ace60SJack Wang default:
240219ace60SJack Wang WARN(1, "Unknown RNBD type: %d (flags %d)\n",
241219ace60SJack Wang rnbd_op(rnbd_opf), rnbd_opf);
242219ace60SJack Wang bio_opf = 0;
243219ace60SJack Wang }
244*5e6e0808SGuoqing Jiang
245219ace60SJack Wang if (rnbd_opf & RNBD_F_SYNC)
246219ace60SJack Wang bio_opf |= REQ_SYNC;
247219ace60SJack Wang
248219ace60SJack Wang if (rnbd_opf & RNBD_F_FUA)
249219ace60SJack Wang bio_opf |= REQ_FUA;
250219ace60SJack Wang
251219ace60SJack Wang return bio_opf;
252219ace60SJack Wang }
253219ace60SJack Wang
rq_to_rnbd_flags(struct request * rq)254219ace60SJack Wang static inline u32 rq_to_rnbd_flags(struct request *rq)
255219ace60SJack Wang {
256219ace60SJack Wang u32 rnbd_opf;
257219ace60SJack Wang
258219ace60SJack Wang switch (req_op(rq)) {
259219ace60SJack Wang case REQ_OP_READ:
260219ace60SJack Wang rnbd_opf = RNBD_OP_READ;
261219ace60SJack Wang break;
262219ace60SJack Wang case REQ_OP_WRITE:
263219ace60SJack Wang rnbd_opf = RNBD_OP_WRITE;
264219ace60SJack Wang break;
265219ace60SJack Wang case REQ_OP_DISCARD:
266219ace60SJack Wang rnbd_opf = RNBD_OP_DISCARD;
267219ace60SJack Wang break;
268219ace60SJack Wang case REQ_OP_SECURE_ERASE:
269219ace60SJack Wang rnbd_opf = RNBD_OP_SECURE_ERASE;
270219ace60SJack Wang break;
271219ace60SJack Wang case REQ_OP_FLUSH:
272219ace60SJack Wang rnbd_opf = RNBD_OP_FLUSH;
273219ace60SJack Wang break;
274219ace60SJack Wang default:
275219ace60SJack Wang WARN(1, "Unknown request type %d (flags %llu)\n",
276219ace60SJack Wang (__force u32)req_op(rq),
277219ace60SJack Wang (__force unsigned long long)rq->cmd_flags);
278219ace60SJack Wang rnbd_opf = 0;
279219ace60SJack Wang }
280219ace60SJack Wang
281219ace60SJack Wang if (op_is_sync(rq->cmd_flags))
282219ace60SJack Wang rnbd_opf |= RNBD_F_SYNC;
283219ace60SJack Wang
284219ace60SJack Wang if (op_is_flush(rq->cmd_flags))
285219ace60SJack Wang rnbd_opf |= RNBD_F_FUA;
286219ace60SJack Wang
287219ace60SJack Wang return rnbd_opf;
288219ace60SJack Wang }
28903df83acSBart Van Assche
/*
 * Returns a string for the given access mode. Only declared here; the
 * implementation lives outside this header.
 */
const char *rnbd_access_mode_str(enum rnbd_access_mode mode);

#endif /* RNBD_PROTO_H */