xref: /openbmc/linux/fs/smb/client/smbdirect.h (revision 1ac731c529cd4d6adbce134754b51ff7d822b145)
1*38c8a9a5SSteve French /* SPDX-License-Identifier: GPL-2.0-or-later */
2*38c8a9a5SSteve French /*
3*38c8a9a5SSteve French  *   Copyright (C) 2017, Microsoft Corporation.
4*38c8a9a5SSteve French  *
5*38c8a9a5SSteve French  *   Author(s): Long Li <longli@microsoft.com>
6*38c8a9a5SSteve French  */
7*38c8a9a5SSteve French #ifndef _SMBDIRECT_H
8*38c8a9a5SSteve French #define _SMBDIRECT_H
9*38c8a9a5SSteve French 
10*38c8a9a5SSteve French #ifdef CONFIG_CIFS_SMB_DIRECT
/*
 * Evaluates to the "rdma" member of the object that "server" points to.
 * The argument is parenthesized so any pointer expression can be passed.
 */
#define cifs_rdma_enabled(server)	((server)->rdma)
12*38c8a9a5SSteve French 
13*38c8a9a5SSteve French #include "cifsglob.h"
14*38c8a9a5SSteve French #include <rdma/ib_verbs.h>
15*38c8a9a5SSteve French #include <rdma/rdma_cm.h>
16*38c8a9a5SSteve French #include <linux/mempool.h>
17*38c8a9a5SSteve French 
/*
 * Integer variables that are defined outside this header.
 * NOTE(review): several share their names with fields of
 * struct smbd_connection; presumably they are the values those fields are
 * initialized from -- confirm against the definitions.
 */
extern int rdma_readwrite_threshold;
extern int smbd_max_frmr_depth;
extern int smbd_keep_alive_interval;
extern int smbd_max_receive_size;
extern int smbd_max_fragmented_recv_size;
extern int smbd_max_send_size;
extern int smbd_send_credit_target;
extern int smbd_receive_credit_max;
26*38c8a9a5SSteve French 
/*
 * Keep-alive state; this is the type of the keep_alive_requested field of
 * struct smbd_connection.
 */
enum keep_alive_status {
	KEEP_ALIVE_NONE,
	KEEP_ALIVE_PENDING,
	KEEP_ALIVE_SENT,
};
32*38c8a9a5SSteve French 
/*
 * Transport state; this is the type of the transport_status field of
 * struct smbd_connection.
 */
enum smbd_connection_status {
	SMBD_CREATED,
	SMBD_CONNECTING,
	SMBD_CONNECTED,
	SMBD_NEGOTIATE_FAILED,
	SMBD_DISCONNECTING,
	SMBD_DISCONNECTED,
	SMBD_DESTROYED
};
42*38c8a9a5SSteve French 
43*38c8a9a5SSteve French /*
44*38c8a9a5SSteve French  * The context for the SMBDirect transport
45*38c8a9a5SSteve French  * Everything related to the transport is here. It has several logical parts
46*38c8a9a5SSteve French  * 1. RDMA related structures
47*38c8a9a5SSteve French  * 2. SMBDirect connection parameters
48*38c8a9a5SSteve French  * 3. Memory registrations
49*38c8a9a5SSteve French  * 4. Receive and reassembly queues for data receive path
50*38c8a9a5SSteve French  * 5. mempools for allocating packets
51*38c8a9a5SSteve French  */
52*38c8a9a5SSteve French struct smbd_connection {
53*38c8a9a5SSteve French 	enum smbd_connection_status transport_status;
54*38c8a9a5SSteve French 
55*38c8a9a5SSteve French 	/* RDMA related */
56*38c8a9a5SSteve French 	struct rdma_cm_id *id;
57*38c8a9a5SSteve French 	struct ib_qp_init_attr qp_attr;
58*38c8a9a5SSteve French 	struct ib_pd *pd;
59*38c8a9a5SSteve French 	struct ib_cq *send_cq, *recv_cq;
60*38c8a9a5SSteve French 	struct ib_device_attr dev_attr;
61*38c8a9a5SSteve French 	int ri_rc;
62*38c8a9a5SSteve French 	struct completion ri_done;
63*38c8a9a5SSteve French 	wait_queue_head_t conn_wait;
64*38c8a9a5SSteve French 	wait_queue_head_t disconn_wait;
65*38c8a9a5SSteve French 
66*38c8a9a5SSteve French 	struct completion negotiate_completion;
67*38c8a9a5SSteve French 	bool negotiate_done;
68*38c8a9a5SSteve French 
69*38c8a9a5SSteve French 	struct work_struct disconnect_work;
70*38c8a9a5SSteve French 	struct work_struct post_send_credits_work;
71*38c8a9a5SSteve French 
72*38c8a9a5SSteve French 	spinlock_t lock_new_credits_offered;
73*38c8a9a5SSteve French 	int new_credits_offered;
74*38c8a9a5SSteve French 
75*38c8a9a5SSteve French 	/* Connection parameters defined in [MS-SMBD] 3.1.1.1 */
76*38c8a9a5SSteve French 	int receive_credit_max;
77*38c8a9a5SSteve French 	int send_credit_target;
78*38c8a9a5SSteve French 	int max_send_size;
79*38c8a9a5SSteve French 	int max_fragmented_recv_size;
80*38c8a9a5SSteve French 	int max_fragmented_send_size;
81*38c8a9a5SSteve French 	int max_receive_size;
82*38c8a9a5SSteve French 	int keep_alive_interval;
83*38c8a9a5SSteve French 	int max_readwrite_size;
84*38c8a9a5SSteve French 	enum keep_alive_status keep_alive_requested;
85*38c8a9a5SSteve French 	int protocol;
86*38c8a9a5SSteve French 	atomic_t send_credits;
87*38c8a9a5SSteve French 	atomic_t receive_credits;
88*38c8a9a5SSteve French 	int receive_credit_target;
89*38c8a9a5SSteve French 	int fragment_reassembly_remaining;
90*38c8a9a5SSteve French 
91*38c8a9a5SSteve French 	/* Memory registrations */
92*38c8a9a5SSteve French 	/* Maximum number of RDMA read/write outstanding on this connection */
93*38c8a9a5SSteve French 	int responder_resources;
94*38c8a9a5SSteve French 	/* Maximum number of pages in a single RDMA write/read on this connection */
95*38c8a9a5SSteve French 	int max_frmr_depth;
96*38c8a9a5SSteve French 	/*
97*38c8a9a5SSteve French 	 * If payload is less than or equal to the threshold,
98*38c8a9a5SSteve French 	 * use RDMA send/recv to send upper layer I/O.
99*38c8a9a5SSteve French 	 * If payload is more than the threshold,
100*38c8a9a5SSteve French 	 * use RDMA read/write through memory registration for I/O.
101*38c8a9a5SSteve French 	 */
102*38c8a9a5SSteve French 	int rdma_readwrite_threshold;
103*38c8a9a5SSteve French 	enum ib_mr_type mr_type;
104*38c8a9a5SSteve French 	struct list_head mr_list;
105*38c8a9a5SSteve French 	spinlock_t mr_list_lock;
106*38c8a9a5SSteve French 	/* The number of available MRs ready for memory registration */
107*38c8a9a5SSteve French 	atomic_t mr_ready_count;
108*38c8a9a5SSteve French 	atomic_t mr_used_count;
109*38c8a9a5SSteve French 	wait_queue_head_t wait_mr;
110*38c8a9a5SSteve French 	struct work_struct mr_recovery_work;
111*38c8a9a5SSteve French 	/* Used by transport to wait until all MRs are returned */
112*38c8a9a5SSteve French 	wait_queue_head_t wait_for_mr_cleanup;
113*38c8a9a5SSteve French 
114*38c8a9a5SSteve French 	/* Activity accoutning */
115*38c8a9a5SSteve French 	atomic_t send_pending;
116*38c8a9a5SSteve French 	wait_queue_head_t wait_send_pending;
117*38c8a9a5SSteve French 	wait_queue_head_t wait_post_send;
118*38c8a9a5SSteve French 
119*38c8a9a5SSteve French 	/* Receive queue */
120*38c8a9a5SSteve French 	struct list_head receive_queue;
121*38c8a9a5SSteve French 	int count_receive_queue;
122*38c8a9a5SSteve French 	spinlock_t receive_queue_lock;
123*38c8a9a5SSteve French 
124*38c8a9a5SSteve French 	struct list_head empty_packet_queue;
125*38c8a9a5SSteve French 	int count_empty_packet_queue;
126*38c8a9a5SSteve French 	spinlock_t empty_packet_queue_lock;
127*38c8a9a5SSteve French 
128*38c8a9a5SSteve French 	wait_queue_head_t wait_receive_queues;
129*38c8a9a5SSteve French 
130*38c8a9a5SSteve French 	/* Reassembly queue */
131*38c8a9a5SSteve French 	struct list_head reassembly_queue;
132*38c8a9a5SSteve French 	spinlock_t reassembly_queue_lock;
133*38c8a9a5SSteve French 	wait_queue_head_t wait_reassembly_queue;
134*38c8a9a5SSteve French 
135*38c8a9a5SSteve French 	/* total data length of reassembly queue */
136*38c8a9a5SSteve French 	int reassembly_data_length;
137*38c8a9a5SSteve French 	int reassembly_queue_length;
138*38c8a9a5SSteve French 	/* the offset to first buffer in reassembly queue */
139*38c8a9a5SSteve French 	int first_entry_offset;
140*38c8a9a5SSteve French 
141*38c8a9a5SSteve French 	bool send_immediate;
142*38c8a9a5SSteve French 
143*38c8a9a5SSteve French 	wait_queue_head_t wait_send_queue;
144*38c8a9a5SSteve French 
145*38c8a9a5SSteve French 	/*
146*38c8a9a5SSteve French 	 * Indicate if we have received a full packet on the connection
147*38c8a9a5SSteve French 	 * This is used to identify the first SMBD packet of a assembled
148*38c8a9a5SSteve French 	 * payload (SMB packet) in reassembly queue so we can return a
149*38c8a9a5SSteve French 	 * RFC1002 length to upper layer to indicate the length of the SMB
150*38c8a9a5SSteve French 	 * packet received
151*38c8a9a5SSteve French 	 */
152*38c8a9a5SSteve French 	bool full_packet_received;
153*38c8a9a5SSteve French 
154*38c8a9a5SSteve French 	struct workqueue_struct *workqueue;
155*38c8a9a5SSteve French 	struct delayed_work idle_timer_work;
156*38c8a9a5SSteve French 
157*38c8a9a5SSteve French 	/* Memory pool for preallocating buffers */
158*38c8a9a5SSteve French 	/* request pool for RDMA send */
159*38c8a9a5SSteve French 	struct kmem_cache *request_cache;
160*38c8a9a5SSteve French 	mempool_t *request_mempool;
161*38c8a9a5SSteve French 
162*38c8a9a5SSteve French 	/* response pool for RDMA receive */
163*38c8a9a5SSteve French 	struct kmem_cache *response_cache;
164*38c8a9a5SSteve French 	mempool_t *response_mempool;
165*38c8a9a5SSteve French 
166*38c8a9a5SSteve French 	/* for debug purposes */
167*38c8a9a5SSteve French 	unsigned int count_get_receive_buffer;
168*38c8a9a5SSteve French 	unsigned int count_put_receive_buffer;
169*38c8a9a5SSteve French 	unsigned int count_reassembly_queue;
170*38c8a9a5SSteve French 	unsigned int count_enqueue_reassembly_queue;
171*38c8a9a5SSteve French 	unsigned int count_dequeue_reassembly_queue;
172*38c8a9a5SSteve French 	unsigned int count_send_empty;
173*38c8a9a5SSteve French };
174*38c8a9a5SSteve French 
/*
 * Kind of message held by a receive context; this is the type of the
 * "type" field of struct smbd_response.
 */
enum smbd_message_type {
	SMBD_NEGOTIATE_RESP,
	SMBD_TRANSFER_DATA,
};
179*38c8a9a5SSteve French 
/*
 * NOTE(review): presumably a bit for the "flags" field of
 * struct smbd_data_transfer ([MS-SMBD] 2.2.3) -- confirm against the users.
 */
#define SMB_DIRECT_RESPONSE_REQUESTED 0x0001
181*38c8a9a5SSteve French 
182*38c8a9a5SSteve French /* SMBD negotiation request packet [MS-SMBD] 2.2.1 */
183*38c8a9a5SSteve French struct smbd_negotiate_req {
184*38c8a9a5SSteve French 	__le16 min_version;
185*38c8a9a5SSteve French 	__le16 max_version;
186*38c8a9a5SSteve French 	__le16 reserved;
187*38c8a9a5SSteve French 	__le16 credits_requested;
188*38c8a9a5SSteve French 	__le32 preferred_send_size;
189*38c8a9a5SSteve French 	__le32 max_receive_size;
190*38c8a9a5SSteve French 	__le32 max_fragmented_size;
191*38c8a9a5SSteve French } __packed;
192*38c8a9a5SSteve French 
193*38c8a9a5SSteve French /* SMBD negotiation response packet [MS-SMBD] 2.2.2 */
194*38c8a9a5SSteve French struct smbd_negotiate_resp {
195*38c8a9a5SSteve French 	__le16 min_version;
196*38c8a9a5SSteve French 	__le16 max_version;
197*38c8a9a5SSteve French 	__le16 negotiated_version;
198*38c8a9a5SSteve French 	__le16 reserved;
199*38c8a9a5SSteve French 	__le16 credits_requested;
200*38c8a9a5SSteve French 	__le16 credits_granted;
201*38c8a9a5SSteve French 	__le32 status;
202*38c8a9a5SSteve French 	__le32 max_readwrite_size;
203*38c8a9a5SSteve French 	__le32 preferred_send_size;
204*38c8a9a5SSteve French 	__le32 max_receive_size;
205*38c8a9a5SSteve French 	__le32 max_fragmented_size;
206*38c8a9a5SSteve French } __packed;
207*38c8a9a5SSteve French 
208*38c8a9a5SSteve French /* SMBD data transfer packet with payload [MS-SMBD] 2.2.3 */
209*38c8a9a5SSteve French struct smbd_data_transfer {
210*38c8a9a5SSteve French 	__le16 credits_requested;
211*38c8a9a5SSteve French 	__le16 credits_granted;
212*38c8a9a5SSteve French 	__le16 flags;
213*38c8a9a5SSteve French 	__le16 reserved;
214*38c8a9a5SSteve French 	__le32 remaining_data_length;
215*38c8a9a5SSteve French 	__le32 data_offset;
216*38c8a9a5SSteve French 	__le32 data_length;
217*38c8a9a5SSteve French 	__le32 padding;
218*38c8a9a5SSteve French 	__u8 buffer[];
219*38c8a9a5SSteve French } __packed;
220*38c8a9a5SSteve French 
221*38c8a9a5SSteve French /* The packet fields for a registered RDMA buffer */
222*38c8a9a5SSteve French struct smbd_buffer_descriptor_v1 {
223*38c8a9a5SSteve French 	__le64 offset;
224*38c8a9a5SSteve French 	__le32 token;
225*38c8a9a5SSteve French 	__le32 length;
226*38c8a9a5SSteve French } __packed;
227*38c8a9a5SSteve French 
228*38c8a9a5SSteve French /* Maximum number of SGEs used by smbdirect.c in any send work request */
229*38c8a9a5SSteve French #define SMBDIRECT_MAX_SEND_SGE	6
230*38c8a9a5SSteve French 
231*38c8a9a5SSteve French /* The context for a SMBD request */
232*38c8a9a5SSteve French struct smbd_request {
233*38c8a9a5SSteve French 	struct smbd_connection *info;
234*38c8a9a5SSteve French 	struct ib_cqe cqe;
235*38c8a9a5SSteve French 
236*38c8a9a5SSteve French 	/* the SGE entries for this work request */
237*38c8a9a5SSteve French 	struct ib_sge sge[SMBDIRECT_MAX_SEND_SGE];
238*38c8a9a5SSteve French 	int num_sge;
239*38c8a9a5SSteve French 
240*38c8a9a5SSteve French 	/* SMBD packet header follows this structure */
241*38c8a9a5SSteve French 	u8 packet[];
242*38c8a9a5SSteve French };
243*38c8a9a5SSteve French 
244*38c8a9a5SSteve French /* Maximum number of SGEs used by smbdirect.c in any receive work request */
245*38c8a9a5SSteve French #define SMBDIRECT_MAX_RECV_SGE	1
246*38c8a9a5SSteve French 
247*38c8a9a5SSteve French /* The context for a SMBD response */
248*38c8a9a5SSteve French struct smbd_response {
249*38c8a9a5SSteve French 	struct smbd_connection *info;
250*38c8a9a5SSteve French 	struct ib_cqe cqe;
251*38c8a9a5SSteve French 	struct ib_sge sge;
252*38c8a9a5SSteve French 
253*38c8a9a5SSteve French 	enum smbd_message_type type;
254*38c8a9a5SSteve French 
255*38c8a9a5SSteve French 	/* Link to receive queue or reassembly queue */
256*38c8a9a5SSteve French 	struct list_head list;
257*38c8a9a5SSteve French 
258*38c8a9a5SSteve French 	/* Indicate if this is the 1st packet of a payload */
259*38c8a9a5SSteve French 	bool first_segment;
260*38c8a9a5SSteve French 
261*38c8a9a5SSteve French 	/* SMBD packet header and payload follows this structure */
262*38c8a9a5SSteve French 	u8 packet[];
263*38c8a9a5SSteve French };
264*38c8a9a5SSteve French 
/*
 * Create a SMBDirect session.
 * NOTE(review): failure is presumably reported as NULL (the stub used when
 * CONFIG_CIFS_SMB_DIRECT is not set returns NULL) -- confirm in smbdirect.c.
 */
struct smbd_connection *smbd_get_connection(
	struct TCP_Server_Info *server, struct sockaddr *dstaddr);

/* Reconnect SMBDirect session */
int smbd_reconnect(struct TCP_Server_Info *server);

/* Destroy SMBDirect session */
void smbd_destroy(struct TCP_Server_Info *server);

/* Interface for carrying upper layer I/O through send/recv */
int smbd_recv(struct smbd_connection *info, struct msghdr *msg);
int smbd_send(struct TCP_Server_Info *server,
	int num_rqst, struct smb_rqst *rqst);
278*38c8a9a5SSteve French 
/* State of a memory registration; the type of the "state" field of struct smbd_mr. */
enum mr_state {
	MR_READY,
	MR_REGISTERED,
	MR_INVALIDATED,
	MR_ERROR
};
285*38c8a9a5SSteve French 
286*38c8a9a5SSteve French struct smbd_mr {
287*38c8a9a5SSteve French 	struct smbd_connection	*conn;
288*38c8a9a5SSteve French 	struct list_head	list;
289*38c8a9a5SSteve French 	enum mr_state		state;
290*38c8a9a5SSteve French 	struct ib_mr		*mr;
291*38c8a9a5SSteve French 	struct sg_table		sgt;
292*38c8a9a5SSteve French 	enum dma_data_direction	dir;
293*38c8a9a5SSteve French 	union {
294*38c8a9a5SSteve French 		struct ib_reg_wr	wr;
295*38c8a9a5SSteve French 		struct ib_send_wr	inv_wr;
296*38c8a9a5SSteve French 	};
297*38c8a9a5SSteve French 	struct ib_cqe		cqe;
298*38c8a9a5SSteve French 	bool			need_invalidate;
299*38c8a9a5SSteve French 	struct completion	invalidate_done;
300*38c8a9a5SSteve French };
301*38c8a9a5SSteve French 
302*38c8a9a5SSteve French /* Interfaces to register and deregister MR for RDMA read/write */
303*38c8a9a5SSteve French struct smbd_mr *smbd_register_mr(
304*38c8a9a5SSteve French 	struct smbd_connection *info, struct iov_iter *iter,
305*38c8a9a5SSteve French 	bool writing, bool need_invalidate);
306*38c8a9a5SSteve French int smbd_deregister_mr(struct smbd_mr *mr);
307*38c8a9a5SSteve French 
308*38c8a9a5SSteve French #else
/*
 * Stubs used when CONFIG_CIFS_SMB_DIRECT is not set: RDMA is reported as
 * disabled, no connection is ever created, and every operation that returns
 * a status fails with -1.
 */
#define cifs_rdma_enabled(server)	0

/*
 * This branch does not include cifsglob.h, so declare the struct tags used
 * in the parameter lists below instead of relying on the includer.
 */
struct TCP_Server_Info;
struct sockaddr;
struct msghdr;
struct smb_rqst;

struct smbd_connection {};

/* Same return type as the real prototype; always yields NULL. */
static inline struct smbd_connection *smbd_get_connection(
	struct TCP_Server_Info *server, struct sockaddr *dstaddr)
{
	return NULL;
}

/* Always fails with -1. */
static inline int smbd_reconnect(struct TCP_Server_Info *server)
{
	return -1;
}

/* Nothing to tear down. */
static inline void smbd_destroy(struct TCP_Server_Info *server)
{
}

/* Always fails with -1. */
static inline int smbd_recv(struct smbd_connection *info, struct msghdr *msg)
{
	return -1;
}

/* Always fails with -1. */
static inline int smbd_send(struct TCP_Server_Info *server, int num_rqst,
			    struct smb_rqst *rqst)
{
	return -1;
}
317*38c8a9a5SSteve French #endif
318*38c8a9a5SSteve French 
319*38c8a9a5SSteve French #endif
320