xref: /openbmc/linux/net/mptcp/protocol.h (revision 36db6e8484ed455bbb320d89a119378897ae991c)
1f870fa0bSMat Martineau /* SPDX-License-Identifier: GPL-2.0 */
2f870fa0bSMat Martineau /* Multipath TCP
3f870fa0bSMat Martineau  *
4f870fa0bSMat Martineau  * Copyright (c) 2017 - 2019, Intel Corporation.
5f870fa0bSMat Martineau  */
6f870fa0bSMat Martineau 
7f870fa0bSMat Martineau #ifndef __MPTCP_PROTOCOL_H
8f870fa0bSMat Martineau #define __MPTCP_PROTOCOL_H
9f870fa0bSMat Martineau 
1079c0949eSPeter Krystad #include <linux/random.h>
1179c0949eSPeter Krystad #include <net/tcp.h>
1279c0949eSPeter Krystad #include <net/inet_connection_sock.h>
13b911c97cSFlorian Westphal #include <uapi/linux/mptcp.h>
149ab4807cSKishen Maloor #include <net/genetlink.h>
1579c0949eSPeter Krystad 
/* MPTCP protocol version supported by this implementation */
#define MPTCP_SUPPORTED_VERSION	1

/* MPTCP option bits: every suboption kind gets its own bit, so that several
 * of them can be OR-ed together into a single mask.
 */
#define OPTION_MPTCP_MPC_SYN	BIT(0)
#define OPTION_MPTCP_MPC_SYNACK	BIT(1)
#define OPTION_MPTCP_MPC_ACK	BIT(2)
#define OPTION_MPTCP_MPJ_SYN	BIT(3)
#define OPTION_MPTCP_MPJ_SYNACK	BIT(4)
#define OPTION_MPTCP_MPJ_ACK	BIT(5)
#define OPTION_MPTCP_ADD_ADDR	BIT(6)
#define OPTION_MPTCP_RM_ADDR	BIT(7)
#define OPTION_MPTCP_FASTCLOSE	BIT(8)
#define OPTION_MPTCP_PRIO	BIT(9)
#define OPTION_MPTCP_RST	BIT(10)
#define OPTION_MPTCP_DSS	BIT(11)
#define OPTION_MPTCP_FAIL	BIT(12)

#define OPTION_MPTCP_CSUMREQD	BIT(13)

/* Mask matching any of the three MP_CAPABLE option bits */
#define OPTIONS_MPTCP_MPC	(OPTION_MPTCP_MPC_SYN | OPTION_MPTCP_MPC_SYNACK | \
				 OPTION_MPTCP_MPC_ACK)
/* Mask matching any of the three MP_JOIN option bits */
#define OPTIONS_MPTCP_MPJ	(OPTION_MPTCP_MPJ_SYN | OPTION_MPTCP_MPJ_SYNACK | \
				 OPTION_MPTCP_MPJ_ACK)
3974c7dfbeSPaolo Abeni 
/* MPTCP option subtypes: the value carried in the subtype field of the
 * first option word (the 'subopt' argument of mptcp_option()).
 */
#define MPTCPOPT_MP_CAPABLE	0
#define MPTCPOPT_MP_JOIN	1
#define MPTCPOPT_DSS		2
#define MPTCPOPT_ADD_ADDR	3
#define MPTCPOPT_RM_ADDR	4
#define MPTCPOPT_MP_PRIO	5
#define MPTCPOPT_MP_FAIL	6
#define MPTCPOPT_MP_FASTCLOSE	7
#define MPTCPOPT_RST		8
50eda7acddSPeter Krystad 
/* MPTCP suboption lengths */
#define TCPOLEN_MPTCP_MPC_SYN		4
#define TCPOLEN_MPTCP_MPC_SYNACK	12
#define TCPOLEN_MPTCP_MPC_ACK		20
#define TCPOLEN_MPTCP_MPC_ACK_DATA	22
#define TCPOLEN_MPTCP_MPJ_SYN		12
#define TCPOLEN_MPTCP_MPJ_SYNACK	16
#define TCPOLEN_MPTCP_MPJ_ACK		24
#define TCPOLEN_MPTCP_DSS_BASE		4
#define TCPOLEN_MPTCP_DSS_ACK32		4
#define TCPOLEN_MPTCP_DSS_ACK64		8
#define TCPOLEN_MPTCP_DSS_MAP32		10
#define TCPOLEN_MPTCP_DSS_MAP64		14
#define TCPOLEN_MPTCP_DSS_CHECKSUM	2
#define TCPOLEN_MPTCP_ADD_ADDR		16
#define TCPOLEN_MPTCP_ADD_ADDR_PORT	18
#define TCPOLEN_MPTCP_ADD_ADDR_BASE	8
#define TCPOLEN_MPTCP_ADD_ADDR_BASE_PORT	10
#define TCPOLEN_MPTCP_ADD_ADDR6		28
#define TCPOLEN_MPTCP_ADD_ADDR6_PORT	30
#define TCPOLEN_MPTCP_ADD_ADDR6_BASE	20
#define TCPOLEN_MPTCP_ADD_ADDR6_BASE_PORT	22
#define TCPOLEN_MPTCP_PORT_LEN		2
#define TCPOLEN_MPTCP_PORT_ALIGN	2
#define TCPOLEN_MPTCP_RM_ADDR_BASE	3
#define TCPOLEN_MPTCP_PRIO		3
#define TCPOLEN_MPTCP_PRIO_ALIGN	4
#define TCPOLEN_MPTCP_FASTCLOSE		12
#define TCPOLEN_MPTCP_RST		4
#define TCPOLEN_MPTCP_FAIL		12

/* MPC_ACK_DATA length plus the room taken by the DSS checksum */
#define TCPOLEN_MPTCP_MPC_ACK_DATA_CSUM	(TCPOLEN_MPTCP_DSS_CHECKSUM + TCPOLEN_MPTCP_MPC_ACK_DATA)
83208e8f66SGeliang Tang 
/* MPTCP MP_JOIN flags */
#define MPTCPOPT_BACKUP		BIT(0)
#define MPTCPOPT_THMAC_LEN	8

/* MPTCP MP_CAPABLE flags */
#define MPTCP_VERSION_MASK	(0x0F)
#define MPTCP_CAP_CHECKSUM_REQD	BIT(7)
#define MPTCP_CAP_EXTENSIBILITY	BIT(6)
#define MPTCP_CAP_DENY_JOIN_ID0	BIT(5)
#define MPTCP_CAP_HMAC_SHA256	BIT(0)
#define MPTCP_CAP_FLAG_MASK	(0x1F)

/* MPTCP DSS flags */
#define MPTCP_DSS_DATA_FIN	BIT(4)
#define MPTCP_DSS_DSN64		BIT(3)
#define MPTCP_DSS_HAS_MAP	BIT(2)
#define MPTCP_DSS_ACK64		BIT(1)
#define MPTCP_DSS_HAS_ACK	BIT(0)
/* covers the five DSS flag bits defined above (bits 0..4) */
#define MPTCP_DSS_FLAG_MASK	(0x1F)

/* MPTCP ADD_ADDR flags */
#define MPTCP_ADDR_ECHO		BIT(0)

/* MPTCP MP_PRIO flags */
#define MPTCP_PRIO_BKUP		BIT(0)

/* MPTCP TCPRST flags */
#define MPTCP_RST_TRANSIENT	BIT(0)
112dc87efdbSFlorian Westphal 
/* MPTCP socket atomic flags (plain bit numbers, not masks;
 * presumably indexes into mptcp_sock::flags - confirm against users)
 */
#define MPTCP_NOSPACE		1
#define MPTCP_WORK_RTX		2
#define MPTCP_FALLBACK_DONE	4
#define MPTCP_WORK_CLOSE_SUBFLOW 5

/* MPTCP socket release cb flags (plain bit numbers, not masks;
 * presumably indexes into mptcp_sock::cb_flags - confirm against users)
 */
#define MPTCP_PUSH_PENDING	1
#define MPTCP_CLEAN_UNA		2
#define MPTCP_ERROR_REPORT	3
#define MPTCP_RETRANSMIT	4
#define MPTCP_FLUSH_JOIN_LIST	5
#define MPTCP_SYNC_STATE	6
#define MPTCP_SYNC_SNDBUF	7
1276d0060f6SMat Martineau 
128dfc8d060SDmytro Shytyi struct mptcp_skb_cb {
129dfc8d060SDmytro Shytyi 	u64 map_seq;
130dfc8d060SDmytro Shytyi 	u64 end_seq;
131dfc8d060SDmytro Shytyi 	u32 offset;
132dfc8d060SDmytro Shytyi 	u8  has_rxtstamp:1;
133dfc8d060SDmytro Shytyi };
134dfc8d060SDmytro Shytyi 
135dfc8d060SDmytro Shytyi #define MPTCP_SKB_CB(__skb)	((struct mptcp_skb_cb *)&((__skb)->cb[0]))
136dfc8d060SDmytro Shytyi 
/* Wrap-around safe comparison of 64-bit sequence numbers: returns true
 * when the difference seq1 - seq2, reinterpreted as a signed 64-bit
 * value, is negative, i.e. seq1 comes before seq2.
 */
static inline bool before64(__u64 seq1, __u64 seq2)
{
	return (__s64)(seq1 - seq2) < 0;
}

/* after64(a, b) is true exactly when before64(b, a) is */
#define after64(seq2, seq1)	before64(seq1, seq2)
143eaa2ffabSPaolo Abeni 
144cfde141eSPaolo Abeni struct mptcp_options_received {
145cfde141eSPaolo Abeni 	u64	sndr_key;
146cfde141eSPaolo Abeni 	u64	rcvr_key;
147cfde141eSPaolo Abeni 	u64	data_ack;
148cfde141eSPaolo Abeni 	u64	data_seq;
149cfde141eSPaolo Abeni 	u32	subflow_seq;
150cfde141eSPaolo Abeni 	u16	data_len;
151208e8f66SGeliang Tang 	__sum16	csum;
1527f6c72b8SPaolo Abeni 	struct_group(status,
15374c7dfbeSPaolo Abeni 		u16 suboptions;
154a086aebaSPaolo Abeni 		u16 use_map:1,
155cfde141eSPaolo Abeni 		    dsn64:1,
156cfde141eSPaolo Abeni 		    data_fin:1,
157cfde141eSPaolo Abeni 		    use_ack:1,
158cfde141eSPaolo Abeni 		    ack64:1,
159cfde141eSPaolo Abeni 		    mpc_map:1,
160a086aebaSPaolo Abeni 		    reset_reason:4,
161a086aebaSPaolo Abeni 		    reset_transient:1,
162a086aebaSPaolo Abeni 		    echo:1,
163a086aebaSPaolo Abeni 		    backup:1,
164a086aebaSPaolo Abeni 		    deny_join_id0:1,
165cfde141eSPaolo Abeni 		    __unused:2;
1667f6c72b8SPaolo Abeni 	);
167a086aebaSPaolo Abeni 	u8	join_id;
1687f6c72b8SPaolo Abeni 	u32	token;
1697f6c72b8SPaolo Abeni 	u32	nonce;
170a086aebaSPaolo Abeni 	u64	thmac;
171a086aebaSPaolo Abeni 	u8	hmac[MPTCPOPT_HMAC_LEN];
172f7dafee1SGeliang Tang 	struct mptcp_addr_info addr;
1735c4a824dSGeliang Tang 	struct mptcp_rm_list rm_list;
174cfde141eSPaolo Abeni 	u64	ahmac;
1755580d41bSGeliang Tang 	u64	fail_seq;
176cfde141eSPaolo Abeni };
177cfde141eSPaolo Abeni 
mptcp_option(u8 subopt,u8 len,u8 nib,u8 field)1783df523abSPeter Krystad static inline __be32 mptcp_option(u8 subopt, u8 len, u8 nib, u8 field)
1793df523abSPeter Krystad {
1803df523abSPeter Krystad 	return htonl((TCPOPT_MPTCP << 24) | (len << 16) | (subopt << 12) |
1813df523abSPeter Krystad 		     ((nib & 0xF) << 8) | field);
1823df523abSPeter Krystad }
1833df523abSPeter Krystad 
/* Path manager status, as bit numbers */
enum mptcp_pm_status {
	MPTCP_PM_ADD_ADDR_RECEIVED,
	MPTCP_PM_ADD_ADDR_SEND_ACK,
	MPTCP_PM_RM_ADDR_RECEIVED,
	MPTCP_PM_ESTABLISHED,
	MPTCP_PM_SUBFLOW_ESTABLISHED,
	MPTCP_PM_ALREADY_ESTABLISHED,	/* persistent status, set after ESTABLISHED event */
	MPTCP_PM_MPC_ENDPOINT_ACCOUNTED /* persistent status, set after MPC local address is
					 * accounted in id_avail_bitmap
					 */
};

/* Path manager flavours; __MPTCP_PM_TYPE_MAX is the highest valid value */
enum mptcp_pm_type {
	MPTCP_PM_TYPE_KERNEL = 0,
	MPTCP_PM_TYPE_USERSPACE,

	__MPTCP_PM_TYPE_NR,
	__MPTCP_PM_TYPE_MAX = __MPTCP_PM_TYPE_NR - 1,
};

/* Status bits below MPTCP_PM_ALREADY_ESTABLISHED need pm worker actions */
#define MPTCP_PM_WORK_MASK ((1 << MPTCP_PM_ALREADY_ESTABLISHED) - 1)
20686e39e04SPaolo Abeni 
/* Address signalling states; presumably used as bit numbers in
 * mptcp_pm_data::addr_signal - confirm against users
 */
enum mptcp_addr_signal_status {
	MPTCP_ADD_ADDR_SIGNAL,
	MPTCP_ADD_ADDR_ECHO,
	MPTCP_RM_ADDR_SIGNAL,
};

/* max value of mptcp_addr_info.id */
#define MPTCP_PM_MAX_ADDR_ID		U8_MAX
21586e39e04SPaolo Abeni 
2161b1c7a0eSPeter Krystad struct mptcp_pm_data {
2171b1c7a0eSPeter Krystad 	struct mptcp_addr_info local;
2181b1c7a0eSPeter Krystad 	struct mptcp_addr_info remote;
219b6c08380SGeliang Tang 	struct list_head anno_list;
2204638de5aSKishen Maloor 	struct list_head userspace_pm_local_addr_list;
2211b1c7a0eSPeter Krystad 
2221b1c7a0eSPeter Krystad 	spinlock_t	lock;		/*protects the whole PM data */
2231b1c7a0eSPeter Krystad 
22413ad9f01SGeliang Tang 	u8		addr_signal;
2251b1c7a0eSPeter Krystad 	bool		server_side;
2261b1c7a0eSPeter Krystad 	bool		work_pending;
2271b1c7a0eSPeter Krystad 	bool		accept_addr;
2281b1c7a0eSPeter Krystad 	bool		accept_subflow;
229df377be3SGeliang Tang 	bool		remote_deny_join_id0;
2301b1c7a0eSPeter Krystad 	u8		add_addr_signaled;
2311b1c7a0eSPeter Krystad 	u8		add_addr_accepted;
2321b1c7a0eSPeter Krystad 	u8		local_addr_used;
233d85a8fdeSMat Martineau 	u8		pm_type;
2341b1c7a0eSPeter Krystad 	u8		subflows;
2351b1c7a0eSPeter Krystad 	u8		status;
23686e39e04SPaolo Abeni 	DECLARE_BITMAP(id_avail_bitmap, MPTCP_PM_MAX_ADDR_ID + 1);
237cbde2787SGeliang Tang 	struct mptcp_rm_list rm_list_tx;
238b5c55f33SGeliang Tang 	struct mptcp_rm_list rm_list_rx;
2391b1c7a0eSPeter Krystad };
2401b1c7a0eSPeter Krystad 
2414638de5aSKishen Maloor struct mptcp_pm_addr_entry {
2424638de5aSKishen Maloor 	struct list_head	list;
2434638de5aSKishen Maloor 	struct mptcp_addr_info	addr;
2444638de5aSKishen Maloor 	u8			flags;
2454638de5aSKishen Maloor 	int			ifindex;
2464638de5aSKishen Maloor 	struct socket		*lsk;
2474638de5aSKishen Maloor };
2484638de5aSKishen Maloor 
24918b683bfSPaolo Abeni struct mptcp_data_frag {
25018b683bfSPaolo Abeni 	struct list_head list;
25118b683bfSPaolo Abeni 	u64 data_seq;
252f0e6a4cfSPaolo Abeni 	u16 data_len;
253f0e6a4cfSPaolo Abeni 	u16 offset;
254f0e6a4cfSPaolo Abeni 	u16 overhead;
255f0e6a4cfSPaolo Abeni 	u16 already_sent;
25618b683bfSPaolo Abeni 	struct page *page;
25718b683bfSPaolo Abeni };
25818b683bfSPaolo Abeni 
259f870fa0bSMat Martineau /* MPTCP connection sock */
260f870fa0bSMat Martineau struct mptcp_sock {
261f870fa0bSMat Martineau 	/* inet_connection_sock must be the first member */
262f870fa0bSMat Martineau 	struct inet_connection_sock sk;
263cec37a6eSPeter Krystad 	u64		local_key;
264cec37a6eSPeter Krystad 	u64		remote_key;
2656d0060f6SMat Martineau 	u64		write_seq;
26638967f42SPaolo Abeni 	u64		bytes_sent;
267eaa2ffabSPaolo Abeni 	u64		snd_nxt;
26838967f42SPaolo Abeni 	u64		bytes_received;
2696d0060f6SMat Martineau 	u64		ack_seq;
270f3589be0SPaolo Abeni 	atomic64_t	rcv_wnd_sent;
2713721b9b6SMat Martineau 	u64		rcv_data_fin_seq;
27238967f42SPaolo Abeni 	u64		bytes_retrans;
273124a4885SPaolo Abeni 	u64		bytes_consumed;
2746511882cSPaolo Abeni 	int		rmem_fwd_alloc;
275d5f49190SPaolo Abeni 	int		snd_burst;
276ea4ca586SPaolo Abeni 	int		old_wspace;
2771e1d9d6fSPaolo Abeni 	u64		recovery_snd_nxt;	/* in recovery mode accept up to this seq;
2781e1d9d6fSPaolo Abeni 						 * recovery related fields are under data_lock
2791e1d9d6fSPaolo Abeni 						 * protection
2801e1d9d6fSPaolo Abeni 						 */
28138967f42SPaolo Abeni 	u64		bytes_acked;
2827439d687SPaolo Abeni 	u64		snd_una;
2837439d687SPaolo Abeni 	u64		wnd_end;
284b51f9b80SPaolo Abeni 	unsigned long	timer_ival;
28579c0949eSPeter Krystad 	u32		token;
28687952603SPaolo Abeni 	int		rmem_released;
287648ef4b8SMat Martineau 	unsigned long	flags;
288e9d09bacSPaolo Abeni 	unsigned long	cb_flags;
2891e1d9d6fSPaolo Abeni 	bool		recovery;		/* closing subflow write queue reinjected */
290d22f4988SChristoph Paasch 	bool		can_ack;
291b93df08cSPaolo Abeni 	bool		fully_established;
2923721b9b6SMat Martineau 	bool		rcv_data_fin;
2937279da61SMat Martineau 	bool		snd_data_fin_enable;
29450c504a2SFlorian Westphal 	bool		rcv_fastclose;
29537198e93SDavide Caratti 	bool		use_64bit_ack; /* Set when we received a 64-bit DSN */
296752e9067SGeliang Tang 	bool		csum_enabled;
2970530020aSGeliang Tang 	bool		allow_infinite_fallback;
298cf742d09SPaolo Abeni 	u8		pending_state; /* A subflow asked to set this sk_state,
299cf742d09SPaolo Abeni 					* protected by the msk data lock
300cf742d09SPaolo Abeni 					*/
3013ad14f54SPaolo Abeni 	u8		mpc_endpoint_id;
3024f6e14bdSMaxim Galaganov 	u8		recvmsg_inq:1,
3034f6e14bdSMaxim Galaganov 			cork:1,
30454f1944eSPaolo Abeni 			nodelay:1,
305b6985b9bSPaolo Abeni 			fastopening:1,
30639880bd8SPaolo Abeni 			in_accept_queue:1,
307a2d74374SPaolo Abeni 			free_first:1,
308a2d74374SPaolo Abeni 			rcvspace_init:1;
309184873afSMatthieu Baerts (NGI0) 	int		keepalive_cnt;
310184873afSMatthieu Baerts (NGI0) 	int		keepalive_idle;
311184873afSMatthieu Baerts (NGI0) 	int		keepalive_intvl;
31280992017SPaolo Abeni 	struct work_struct work;
313ab174ad8SPaolo Abeni 	struct sk_buff  *ooo_last_skb;
314ab174ad8SPaolo Abeni 	struct rb_root  out_of_order_queue;
31587952603SPaolo Abeni 	struct sk_buff_head receive_queue;
316cec37a6eSPeter Krystad 	struct list_head conn_list;
31718b683bfSPaolo Abeni 	struct list_head rtx_queue;
318f0e6a4cfSPaolo Abeni 	struct mptcp_data_frag *first_pending;
319ec3edaa7SPeter Krystad 	struct list_head join_list;
32039880bd8SPaolo Abeni 	struct sock	*first; /* The mptcp ops can safely dereference, using suitable
3215b825727SPaolo Abeni 				 * ONCE annotation, the subflow outside the socket
3225b825727SPaolo Abeni 				 * lock as such sock is freed after close().
3235b825727SPaolo Abeni 				 */
3241b1c7a0eSPeter Krystad 	struct mptcp_pm_data	pm;
3251730b2b2SGeliang Tang 	struct mptcp_sched_ops	*sched;
326a6b118feSFlorian Westphal 	struct {
327a6b118feSFlorian Westphal 		u32	space;	/* bytes copied in last measurement window */
328a6b118feSFlorian Westphal 		u32	copied; /* bytes copied in this measurement window */
329a6b118feSFlorian Westphal 		u64	time;	/* start time of measurement window */
330a6b118feSFlorian Westphal 		u64	rtt_us; /* last maximum rtt of subflows */
331a6b118feSFlorian Westphal 	} rcvq_space;
332b8dc6d6cSPaolo Abeni 	u8		scaling_ratio;
333df00b087SFlorian Westphal 
3346f06b4d4SPaolo Abeni 	u32		subflow_id;
335df00b087SFlorian Westphal 	u32		setsockopt_seq;
33620b5759fSPaolo Abeni 	char		ca_name[TCP_CA_NAME_MAX];
337f870fa0bSMat Martineau };
338f870fa0bSMat Martineau 
/* The msk data lock is the socket spinlock (sk_lock.slock), taken with
 * bottom halves disabled.
 */
#define mptcp_data_lock(sk) spin_lock_bh(&(sk)->sk_lock.slock)
#define mptcp_data_unlock(sk) spin_unlock_bh(&(sk)->sk_lock.slock)

/* Walk every subflow context linked into __msk->conn_list */
#define mptcp_for_each_subflow(__msk, __subflow)			\
	list_for_each_entry(__subflow, &((__msk)->conn_list), node)
/* Same walk using list_for_each_entry_safe(), with __tmp as the extra cursor */
#define mptcp_for_each_subflow_safe(__msk, __subflow, __tmp)			\
	list_for_each_entry_safe(__subflow, __tmp, &((__msk)->conn_list), node)
346cec37a6eSPeter Krystad 
/* Forward to sock_owned_by_me() on the sock embedded at the start of @msk */
static inline void msk_owned_by_me(const struct mptcp_sock *msk)
{
	sock_owned_by_me((const struct sock *)msk);
}

/* Map a struct sock pointer to the enclosing struct mptcp_sock, preserving
 * the constness of @ptr.
 */
#define mptcp_sk(ptr) container_of_const(ptr, struct mptcp_sock, sk.icsk_inet.sk)
353f870fa0bSMat Martineau 
354ce599c51SPaolo Abeni /* the msk socket don't use the backlog, also account for the bulk
355ce599c51SPaolo Abeni  * free memory
356ce599c51SPaolo Abeni  */
__mptcp_rmem(const struct sock * sk)357ce599c51SPaolo Abeni static inline int __mptcp_rmem(const struct sock *sk)
358ce599c51SPaolo Abeni {
359ce599c51SPaolo Abeni 	return atomic_read(&sk->sk_rmem_alloc) - READ_ONCE(mptcp_sk(sk)->rmem_released);
360ce599c51SPaolo Abeni }
361ce599c51SPaolo Abeni 
mptcp_win_from_space(const struct sock * sk,int space)362b8dc6d6cSPaolo Abeni static inline int mptcp_win_from_space(const struct sock *sk, int space)
363b8dc6d6cSPaolo Abeni {
364b8dc6d6cSPaolo Abeni 	return __tcp_win_from_space(mptcp_sk(sk)->scaling_ratio, space);
365b8dc6d6cSPaolo Abeni }
366b8dc6d6cSPaolo Abeni 
__mptcp_space(const struct sock * sk)367ea4ca586SPaolo Abeni static inline int __mptcp_space(const struct sock *sk)
368ea4ca586SPaolo Abeni {
369b8dc6d6cSPaolo Abeni 	return mptcp_win_from_space(sk, READ_ONCE(sk->sk_rcvbuf) - __mptcp_rmem(sk));
370ea4ca586SPaolo Abeni }
371ea4ca586SPaolo Abeni 
mptcp_send_head(const struct sock * sk)372f0e6a4cfSPaolo Abeni static inline struct mptcp_data_frag *mptcp_send_head(const struct sock *sk)
373f0e6a4cfSPaolo Abeni {
374f0e6a4cfSPaolo Abeni 	const struct mptcp_sock *msk = mptcp_sk(sk);
375f0e6a4cfSPaolo Abeni 
376f0e6a4cfSPaolo Abeni 	return READ_ONCE(msk->first_pending);
377f0e6a4cfSPaolo Abeni }
378f0e6a4cfSPaolo Abeni 
mptcp_send_next(struct sock * sk)379f0e6a4cfSPaolo Abeni static inline struct mptcp_data_frag *mptcp_send_next(struct sock *sk)
380f0e6a4cfSPaolo Abeni {
381f0e6a4cfSPaolo Abeni 	struct mptcp_sock *msk = mptcp_sk(sk);
382f0e6a4cfSPaolo Abeni 	struct mptcp_data_frag *cur;
383f0e6a4cfSPaolo Abeni 
384f0e6a4cfSPaolo Abeni 	cur = msk->first_pending;
385f0e6a4cfSPaolo Abeni 	return list_is_last(&cur->list, &msk->rtx_queue) ? NULL :
386f0e6a4cfSPaolo Abeni 						     list_next_entry(cur, list);
387f0e6a4cfSPaolo Abeni }
388f0e6a4cfSPaolo Abeni 
mptcp_pending_tail(const struct sock * sk)389f0e6a4cfSPaolo Abeni static inline struct mptcp_data_frag *mptcp_pending_tail(const struct sock *sk)
390f0e6a4cfSPaolo Abeni {
391403a40f2SEric Dumazet 	const struct mptcp_sock *msk = mptcp_sk(sk);
392f0e6a4cfSPaolo Abeni 
393f0e6a4cfSPaolo Abeni 	if (!msk->first_pending)
394f0e6a4cfSPaolo Abeni 		return NULL;
395f0e6a4cfSPaolo Abeni 
396f0e6a4cfSPaolo Abeni 	if (WARN_ON_ONCE(list_empty(&msk->rtx_queue)))
397f0e6a4cfSPaolo Abeni 		return NULL;
398f0e6a4cfSPaolo Abeni 
399f0e6a4cfSPaolo Abeni 	return list_last_entry(&msk->rtx_queue, struct mptcp_data_frag, list);
400f0e6a4cfSPaolo Abeni }
401f0e6a4cfSPaolo Abeni 
mptcp_rtx_head(struct sock * sk)402403a40f2SEric Dumazet static inline struct mptcp_data_frag *mptcp_rtx_head(struct sock *sk)
4037948f6ccSFlorian Westphal {
4047948f6ccSFlorian Westphal 	struct mptcp_sock *msk = mptcp_sk(sk);
4057948f6ccSFlorian Westphal 
40664b9cea7SPaolo Abeni 	if (msk->snd_una == READ_ONCE(msk->snd_nxt))
40764b9cea7SPaolo Abeni 		return NULL;
40864b9cea7SPaolo Abeni 
409a386bc5bSGeliang Tang 	return list_first_entry_or_null(&msk->rtx_queue, struct mptcp_data_frag, list);
4107948f6ccSFlorian Westphal }
4117948f6ccSFlorian Westphal 
/* Pseudo header for the checksum; all fields are stored big-endian */
struct csum_pseudo_header {
	__be64 data_seq;
	__be32 subflow_seq;
	__be16 data_len;
	__sum16 csum;
};
418d0cc2987SGeliang Tang 
419cec37a6eSPeter Krystad struct mptcp_subflow_request_sock {
420cec37a6eSPeter Krystad 	struct	tcp_request_sock sk;
421d22f4988SChristoph Paasch 	u16	mp_capable : 1,
422cec37a6eSPeter Krystad 		mp_join : 1,
42306fe1719SGeliang Tang 		backup : 1,
4248ed3e34cSMatthieu Baerts (NGI0) 		request_bkup : 1,
425bab6b88eSGeliang Tang 		csum_reqd : 1,
426bab6b88eSGeliang Tang 		allow_join_id0 : 1;
4271b1c7a0eSPeter Krystad 	u8	local_id;
428f296234cSPeter Krystad 	u8	remote_id;
429cec37a6eSPeter Krystad 	u64	local_key;
43079c0949eSPeter Krystad 	u64	idsn;
43179c0949eSPeter Krystad 	u32	token;
432648ef4b8SMat Martineau 	u32	ssn_offset;
433f296234cSPeter Krystad 	u64	thmac;
434f296234cSPeter Krystad 	u32	local_nonce;
435f296234cSPeter Krystad 	u32	remote_nonce;
4368fd4de12SPaolo Abeni 	struct mptcp_sock	*msk;
4372c5ebd00SPaolo Abeni 	struct hlist_nulls_node token_node;
438cec37a6eSPeter Krystad };
439cec37a6eSPeter Krystad 
/* Cast @rsk to the MPTCP subflow request sock.
 * Note that the cast also drops the const qualifier of @rsk.
 */
static inline struct mptcp_subflow_request_sock *
mptcp_subflow_rsk(const struct request_sock *rsk)
{
	return (struct mptcp_subflow_request_sock *)rsk;
}
445cec37a6eSPeter Krystad 
/* Values stored in mptcp_subflow_context::data_avail */
enum mptcp_data_avail {
	MPTCP_SUBFLOW_NODATA,
	MPTCP_SUBFLOW_DATA_AVAIL,
};
4506719331cSPaolo Abeni 
451b19bc294SPaolo Abeni struct mptcp_delegated_action {
452b19bc294SPaolo Abeni 	struct napi_struct napi;
453b19bc294SPaolo Abeni 	struct list_head head;
454b19bc294SPaolo Abeni };
455b19bc294SPaolo Abeni 
456b19bc294SPaolo Abeni DECLARE_PER_CPU(struct mptcp_delegated_action, mptcp_delegated_actions);
457b19bc294SPaolo Abeni 
/* Bit numbers for mptcp_subflow_context::delegated_status */
#define MPTCP_DELEGATE_SCHEDULED	0
#define MPTCP_DELEGATE_SEND		1
#define MPTCP_DELEGATE_ACK		2
#define MPTCP_DELEGATE_SNDBUF		3

/* Every delegated_status bit except the SCHEDULED marker */
#define MPTCP_DELEGATE_ACTIONS_MASK	(~BIT(MPTCP_DELEGATE_SCHEDULED))
4642303f994SPeter Krystad /* MPTCP subflow context */
4652303f994SPeter Krystad struct mptcp_subflow_context {
466cec37a6eSPeter Krystad 	struct	list_head node;/* conn_list of subflows */
467b29fcfb5SPaolo Abeni 
46863ec72bdSKees Cook 	struct_group(reset,
469b29fcfb5SPaolo Abeni 
4703ce0852cSPaolo Abeni 	unsigned long avg_pacing_rate; /* protected by msk socket lock */
471cec37a6eSPeter Krystad 	u64	local_key;
472cec37a6eSPeter Krystad 	u64	remote_key;
47379c0949eSPeter Krystad 	u64	idsn;
474648ef4b8SMat Martineau 	u64	map_seq;
475cc7972eaSChristoph Paasch 	u32	snd_isn;
47679c0949eSPeter Krystad 	u32	token;
4776d0060f6SMat Martineau 	u32	rel_write_seq;
478648ef4b8SMat Martineau 	u32	map_subflow_seq;
479648ef4b8SMat Martineau 	u32	ssn_offset;
480648ef4b8SMat Martineau 	u32	map_data_len;
481dd8bcd17SPaolo Abeni 	__wsum	map_data_csum;
482dd8bcd17SPaolo Abeni 	u32	map_csum_len;
483cec37a6eSPeter Krystad 	u32	request_mptcp : 1,  /* send MP_CAPABLE */
484ec3edaa7SPeter Krystad 		request_join : 1,   /* send MP_JOIN */
485ec3edaa7SPeter Krystad 		request_bkup : 1,
486cec37a6eSPeter Krystad 		mp_capable : 1,	    /* remote is MPTCP capable */
487f296234cSPeter Krystad 		mp_join : 1,	    /* remote is JOINing */
4880be534f5SPaolo Abeni 		fully_established : 1,	    /* path validated */
489f296234cSPeter Krystad 		pm_notified : 1,    /* PM hook called for established status */
490648ef4b8SMat Martineau 		conn_finished : 1,
491648ef4b8SMat Martineau 		map_valid : 1,
492dd8bcd17SPaolo Abeni 		map_csum_reqd : 1,
493dd8bcd17SPaolo Abeni 		map_data_fin : 1,
494d22f4988SChristoph Paasch 		mpc_map : 1,
495f296234cSPeter Krystad 		backup : 1,
49606706542SGeliang Tang 		send_mp_prio : 1,
497c25aeb4eSGeliang Tang 		send_mp_fail : 1,
498f284c0c7SPaolo Abeni 		send_fastclose : 1,
4991e39e5a3SGeliang Tang 		send_infinite_map : 1,
500b3ea6b27SPaolo Abeni 		remote_key_valid : 1,        /* received the peer key from */
501ff5a0b42SPaolo Abeni 		disposable : 1,	    /* ctx can be free at ulp release time */
5024cf86ae8SPaolo Abeni 		stale : 1,	    /* unable to snd/rcv data, do not use for xmit */
503dfc8d060SDmytro Shytyi 		valid_csum_seen : 1,        /* at least one csum validated */
504dfc8d060SDmytro Shytyi 		is_mptfo : 1,	    /* subflow is doing TFO */
505a088190fSMatthieu Baerts (NGI0) 		close_event_done : 1,       /* has done the post-closed part */
506a088190fSMatthieu Baerts (NGI0) 		__unused : 9;
5076719331cSPaolo Abeni 	enum mptcp_data_avail data_avail;
508fce68b03SGeliang Tang 	bool	scheduled;
50937d9305cSPaolo Abeni 	bool	pm_listener;	    /* a listener managed by the kernel PM? */
510f296234cSPeter Krystad 	u32	remote_nonce;
511f296234cSPeter Krystad 	u64	thmac;
512f296234cSPeter Krystad 	u32	local_nonce;
513ec3edaa7SPeter Krystad 	u32	remote_token;
514b3ea6b27SPaolo Abeni 	union {
515b3ea6b27SPaolo Abeni 		u8	hmac[MPTCPOPT_HMAC_LEN]; /* MPJ subflow only */
516b3ea6b27SPaolo Abeni 		u64	iasn;	    /* initial ack sequence number, MPC subflows only */
517b3ea6b27SPaolo Abeni 	};
518ba2cf922SPaolo Abeni 	s16	local_id;	    /* if negative not initialized yet */
519f296234cSPeter Krystad 	u8	remote_id;
520dc87efdbSFlorian Westphal 	u8	reset_seen:1;
521dc87efdbSFlorian Westphal 	u8	reset_transient:1;
522dc87efdbSFlorian Westphal 	u8	reset_reason:4;
52371b7dec2SPaolo Abeni 	u8	stale_count;
524648ef4b8SMat Martineau 
5256f06b4d4SPaolo Abeni 	u32	subflow_id;
5266f06b4d4SPaolo Abeni 
527b19bc294SPaolo Abeni 	long	delegated_status;
52876a13b31SGeliang Tang 	unsigned long	fail_tout;
529b29fcfb5SPaolo Abeni 
53063ec72bdSKees Cook 	);
531b29fcfb5SPaolo Abeni 
532b19bc294SPaolo Abeni 	struct	list_head delegated_node;   /* link into delegated_action, protected by local BH */
533b19bc294SPaolo Abeni 
534df00b087SFlorian Westphal 	u32	setsockopt_seq;
53571b7dec2SPaolo Abeni 	u32	stale_rcv_tstamp;
53634c7757aSPaolo Abeni 	int     cached_sndbuf;	    /* sndbuf size when last synced with the msk sndbuf,
53734c7757aSPaolo Abeni 				     * protected by the msk socket lock
53834c7757aSPaolo Abeni 				     */
539df00b087SFlorian Westphal 
5402303f994SPeter Krystad 	struct	sock *tcp_sock;	    /* tcp sk backpointer */
5412303f994SPeter Krystad 	struct	sock *conn;	    /* parent mptcp_sock */
542cec37a6eSPeter Krystad 	const	struct inet_connection_sock_af_ops *icsk_af_ops;
543648ef4b8SMat Martineau 	void	(*tcp_state_change)(struct sock *sk);
54415cc1045SPaolo Abeni 	void	(*tcp_error_report)(struct sock *sk);
545648ef4b8SMat Martineau 
5462303f994SPeter Krystad 	struct	rcu_head rcu;
5472303f994SPeter Krystad };
5482303f994SPeter Krystad 
5492303f994SPeter Krystad static inline struct mptcp_subflow_context *
mptcp_subflow_ctx(const struct sock * sk)5502303f994SPeter Krystad mptcp_subflow_ctx(const struct sock *sk)
5512303f994SPeter Krystad {
5522303f994SPeter Krystad 	struct inet_connection_sock *icsk = inet_csk(sk);
5532303f994SPeter Krystad 
5542303f994SPeter Krystad 	/* Use RCU on icsk_ulp_data only for sock diag code */
5552303f994SPeter Krystad 	return (__force struct mptcp_subflow_context *)icsk->icsk_ulp_data;
5562303f994SPeter Krystad }
5572303f994SPeter Krystad 
5582303f994SPeter Krystad static inline struct sock *
mptcp_subflow_tcp_sock(const struct mptcp_subflow_context * subflow)5592303f994SPeter Krystad mptcp_subflow_tcp_sock(const struct mptcp_subflow_context *subflow)
5602303f994SPeter Krystad {
5612303f994SPeter Krystad 	return subflow->tcp_sock;
5622303f994SPeter Krystad }
5632303f994SPeter Krystad 
564b29fcfb5SPaolo Abeni static inline void
mptcp_subflow_ctx_reset(struct mptcp_subflow_context * subflow)565b29fcfb5SPaolo Abeni mptcp_subflow_ctx_reset(struct mptcp_subflow_context *subflow)
566b29fcfb5SPaolo Abeni {
56763ec72bdSKees Cook 	memset(&subflow->reset, 0, sizeof(subflow->reset));
568b29fcfb5SPaolo Abeni 	subflow->request_mptcp = 1;
569ba2cf922SPaolo Abeni 	WRITE_ONCE(subflow->local_id, -1);
570b29fcfb5SPaolo Abeni }
571b29fcfb5SPaolo Abeni 
572648ef4b8SMat Martineau static inline u64
mptcp_subflow_get_map_offset(const struct mptcp_subflow_context * subflow)573648ef4b8SMat Martineau mptcp_subflow_get_map_offset(const struct mptcp_subflow_context *subflow)
574648ef4b8SMat Martineau {
575648ef4b8SMat Martineau 	return tcp_sk(mptcp_subflow_tcp_sock(subflow))->copied_seq -
576648ef4b8SMat Martineau 		      subflow->ssn_offset -
577648ef4b8SMat Martineau 		      subflow->map_subflow_seq;
578648ef4b8SMat Martineau }
579648ef4b8SMat Martineau 
580648ef4b8SMat Martineau static inline u64
mptcp_subflow_get_mapped_dsn(const struct mptcp_subflow_context * subflow)581648ef4b8SMat Martineau mptcp_subflow_get_mapped_dsn(const struct mptcp_subflow_context *subflow)
582648ef4b8SMat Martineau {
583648ef4b8SMat Martineau 	return subflow->map_seq + mptcp_subflow_get_map_offset(subflow);
584648ef4b8SMat Martineau }
585648ef4b8SMat Martineau 
586a5efdbceSPaolo Abeni void mptcp_subflow_process_delegated(struct sock *ssk, long actions);
587b19bc294SPaolo Abeni 
mptcp_subflow_delegate(struct mptcp_subflow_context * subflow,int action)588bcd97734SPaolo Abeni static inline void mptcp_subflow_delegate(struct mptcp_subflow_context *subflow, int action)
589b19bc294SPaolo Abeni {
590a5efdbceSPaolo Abeni 	long old, set_bits = BIT(MPTCP_DELEGATE_SCHEDULED) | BIT(action);
591b19bc294SPaolo Abeni 	struct mptcp_delegated_action *delegated;
592b19bc294SPaolo Abeni 	bool schedule;
593b19bc294SPaolo Abeni 
594bcd97734SPaolo Abeni 	/* the caller held the subflow bh socket lock */
595bcd97734SPaolo Abeni 	lockdep_assert_in_softirq();
596bcd97734SPaolo Abeni 
597a5efdbceSPaolo Abeni 	/* The implied barrier pairs with tcp_release_cb_override()
598a5efdbceSPaolo Abeni 	 * mptcp_napi_poll(), and ensures the below list check sees list
599a5efdbceSPaolo Abeni 	 * updates done prior to delegated status bits changes
600b19bc294SPaolo Abeni 	 */
601a5efdbceSPaolo Abeni 	old = set_mask_bits(&subflow->delegated_status, 0, set_bits);
602a5efdbceSPaolo Abeni 	if (!(old & BIT(MPTCP_DELEGATE_SCHEDULED))) {
603a5efdbceSPaolo Abeni 		if (WARN_ON_ONCE(!list_empty(&subflow->delegated_node)))
604b19bc294SPaolo Abeni 			return;
605b19bc294SPaolo Abeni 
606b19bc294SPaolo Abeni 		delegated = this_cpu_ptr(&mptcp_delegated_actions);
607b19bc294SPaolo Abeni 		schedule = list_empty(&delegated->head);
608b19bc294SPaolo Abeni 		list_add_tail(&subflow->delegated_node, &delegated->head);
609b19bc294SPaolo Abeni 		sock_hold(mptcp_subflow_tcp_sock(subflow));
610b19bc294SPaolo Abeni 		if (schedule)
611b19bc294SPaolo Abeni 			napi_schedule(&delegated->napi);
612b19bc294SPaolo Abeni 	}
613b19bc294SPaolo Abeni }
614b19bc294SPaolo Abeni 
615b19bc294SPaolo Abeni static inline struct mptcp_subflow_context *
mptcp_subflow_delegated_next(struct mptcp_delegated_action * delegated)616b19bc294SPaolo Abeni mptcp_subflow_delegated_next(struct mptcp_delegated_action *delegated)
617b19bc294SPaolo Abeni {
618b19bc294SPaolo Abeni 	struct mptcp_subflow_context *ret;
619b19bc294SPaolo Abeni 
620b19bc294SPaolo Abeni 	if (list_empty(&delegated->head))
621b19bc294SPaolo Abeni 		return NULL;
622b19bc294SPaolo Abeni 
623b19bc294SPaolo Abeni 	ret = list_first_entry(&delegated->head, struct mptcp_subflow_context, delegated_node);
624b19bc294SPaolo Abeni 	list_del_init(&ret->delegated_node);
625b19bc294SPaolo Abeni 	return ret;
626b19bc294SPaolo Abeni }
627b19bc294SPaolo Abeni 
6286da14d74SPaolo Abeni int mptcp_is_enabled(const struct net *net);
6296da14d74SPaolo Abeni unsigned int mptcp_get_add_addr_timeout(const struct net *net);
6306da14d74SPaolo Abeni int mptcp_is_checksum_enabled(const struct net *net);
6316da14d74SPaolo Abeni int mptcp_allow_join_id0(const struct net *net);
632ff5a0b42SPaolo Abeni unsigned int mptcp_stale_loss_cnt(const struct net *net);
6336bb63cccSMat Martineau int mptcp_get_pm_type(const struct net *net);
634e3b2870bSGeliang Tang const char *mptcp_get_scheduler(const struct net *net);
635b45df837SPaolo Abeni void __mptcp_subflow_fully_established(struct mptcp_sock *msk,
636b45df837SPaolo Abeni 				       struct mptcp_subflow_context *subflow,
637b3ea6b27SPaolo Abeni 				       const struct mptcp_options_received *mp_opt);
6381e1d9d6fSPaolo Abeni bool __mptcp_retransmit_pending_data(struct sock *sk);
6398b38217aSMaxim Galaganov void mptcp_check_and_set_pending(struct sock *sk);
640ff5a0b42SPaolo Abeni void __mptcp_push_pending(struct sock *sk, unsigned int flags);
641648ef4b8SMat Martineau bool mptcp_subflow_data_available(struct sock *sk);
642d39dcecaSPaolo Abeni void __init mptcp_subflow_init(void);
643d0876b22SGeliang Tang void mptcp_subflow_shutdown(struct sock *sk, struct sock *ssk, int how);
644a141e02eSFlorian Westphal void mptcp_close_ssk(struct sock *sk, struct sock *ssk,
645e16163b6SPaolo Abeni 		     struct mptcp_subflow_context *subflow);
646a6574302SMat Martineau void __mptcp_subflow_send_ack(struct sock *ssk);
647d5824847SPaolo Abeni void mptcp_subflow_reset(struct sock *ssk);
6482a6a870eSPaolo Abeni void mptcp_subflow_queue_clean(struct sock *sk, struct sock *ssk);
649866f26f2SPaolo Abeni void mptcp_sock_graft(struct sock *sk, struct socket *parent);
6503f326a82SPaolo Abeni struct sock *__mptcp_nmpc_sk(struct mptcp_sock *msk);
65126d3e21cSMenglong Dong bool __mptcp_close(struct sock *sk, long timeout);
65230e51b92SMenglong Dong void mptcp_cancel_work(struct sock *sk);
65363740448SPaolo Abeni void __mptcp_unaccepted_force_close(struct sock *sk);
65436b122baSDmytro Shytyi void mptcp_set_owner_r(struct sk_buff *skb, struct sock *sk);
65556557547SGeliang Tang void mptcp_set_state(struct sock *sk, int state);
656ec3edaa7SPeter Krystad 
6574638de5aSKishen Maloor bool mptcp_addresses_equal(const struct mptcp_addr_info *a,
6584638de5aSKishen Maloor 			   const struct mptcp_addr_info *b, bool use_port);
659dc886bceSGeliang Tang void mptcp_local_address(const struct sock_common *skc, struct mptcp_addr_info *addr);
6604638de5aSKishen Maloor 
661ec3edaa7SPeter Krystad /* called with sk socket lock held */
662ef0da3b8SPaolo Abeni int __mptcp_subflow_connect(struct sock *sk, const struct mptcp_addr_info *loc,
663ee285257SGeliang Tang 			    const struct mptcp_addr_info *remote);
6646bc1fe7dSPaolo Abeni int mptcp_subflow_create_socket(struct sock *sk, unsigned short family,
6656bc1fe7dSPaolo Abeni 				struct socket **new_sock);
6661729cf18SGeliang Tang void mptcp_info2sockaddr(const struct mptcp_addr_info *info,
6671729cf18SGeliang Tang 			 struct sockaddr_storage *addr,
6681729cf18SGeliang Tang 			 unsigned short family);
669740ebe35SGeliang Tang struct mptcp_sched_ops *mptcp_sched_find(const char *name);
670740ebe35SGeliang Tang int mptcp_register_scheduler(struct mptcp_sched_ops *sched);
671740ebe35SGeliang Tang void mptcp_unregister_scheduler(struct mptcp_sched_ops *sched);
672ed1ad86bSGeliang Tang void mptcp_sched_init(void);
6731730b2b2SGeliang Tang int mptcp_init_sched(struct mptcp_sock *msk,
6741730b2b2SGeliang Tang 		     struct mptcp_sched_ops *sched);
6751730b2b2SGeliang Tang void mptcp_release_sched(struct mptcp_sock *msk);
676fce68b03SGeliang Tang void mptcp_subflow_set_scheduled(struct mptcp_subflow_context *subflow,
677fce68b03SGeliang Tang 				 bool scheduled);
67807336a87SGeliang Tang struct sock *mptcp_subflow_get_send(struct mptcp_sock *msk);
67907336a87SGeliang Tang struct sock *mptcp_subflow_get_retrans(struct mptcp_sock *msk);
68007336a87SGeliang Tang int mptcp_sched_get_send(struct mptcp_sock *msk);
68107336a87SGeliang Tang int mptcp_sched_get_retrans(struct mptcp_sock *msk);
6822303f994SPeter Krystad 
mptcp_data_avail(const struct mptcp_sock * msk)683124a4885SPaolo Abeni static inline u64 mptcp_data_avail(const struct mptcp_sock *msk)
684124a4885SPaolo Abeni {
685124a4885SPaolo Abeni 	return READ_ONCE(msk->bytes_received) - READ_ONCE(msk->bytes_consumed);
686124a4885SPaolo Abeni }
687124a4885SPaolo Abeni 
mptcp_epollin_ready(const struct sock * sk)688124a4885SPaolo Abeni static inline bool mptcp_epollin_ready(const struct sock *sk)
689124a4885SPaolo Abeni {
690d09d17c1SPaolo Abeni 	u64 data_avail = mptcp_data_avail(mptcp_sk(sk));
691d09d17c1SPaolo Abeni 
692d09d17c1SPaolo Abeni 	if (!data_avail)
693d09d17c1SPaolo Abeni 		return false;
694d09d17c1SPaolo Abeni 
695124a4885SPaolo Abeni 	/* mptcp doesn't have to deal with small skbs in the receive queue,
696d09d17c1SPaolo Abeni 	 * as it can always coalesce them
697124a4885SPaolo Abeni 	 */
698d09d17c1SPaolo Abeni 	return (data_avail >= sk->sk_rcvlowat) ||
699124a4885SPaolo Abeni 	       (mem_cgroup_sockets_enabled && sk->sk_memcg &&
700124a4885SPaolo Abeni 		mem_cgroup_under_socket_pressure(sk->sk_memcg)) ||
701124a4885SPaolo Abeni 	       READ_ONCE(tcp_memory_pressure);
702124a4885SPaolo Abeni }
703124a4885SPaolo Abeni 
704124a4885SPaolo Abeni int mptcp_set_rcvlowat(struct sock *sk, int val);
705124a4885SPaolo Abeni 
__tcp_can_send(const struct sock * ssk)706c886d702SPaolo Abeni static inline bool __tcp_can_send(const struct sock *ssk)
707c886d702SPaolo Abeni {
708c886d702SPaolo Abeni 	/* only send if our side has not closed yet */
709c886d702SPaolo Abeni 	return ((1 << inet_sk_state_load(ssk)) & (TCPF_ESTABLISHED | TCPF_CLOSE_WAIT));
710c886d702SPaolo Abeni }
711c886d702SPaolo Abeni 
__mptcp_subflow_active(struct mptcp_subflow_context * subflow)712ff5a0b42SPaolo Abeni static inline bool __mptcp_subflow_active(struct mptcp_subflow_context *subflow)
71343f1140bSGeliang Tang {
71443f1140bSGeliang Tang 	/* can't send if JOIN hasn't completed yet (i.e. is usable for mptcp) */
71543f1140bSGeliang Tang 	if (subflow->request_join && !subflow->fully_established)
71643f1140bSGeliang Tang 		return false;
71743f1140bSGeliang Tang 
718c886d702SPaolo Abeni 	return __tcp_can_send(mptcp_subflow_tcp_sock(subflow));
71943f1140bSGeliang Tang }
72043f1140bSGeliang Tang 
721ff5a0b42SPaolo Abeni void mptcp_subflow_set_active(struct mptcp_subflow_context *subflow);
722ff5a0b42SPaolo Abeni 
723ff5a0b42SPaolo Abeni bool mptcp_subflow_active(struct mptcp_subflow_context *subflow);
724ff5a0b42SPaolo Abeni 
725b6985b9bSPaolo Abeni void mptcp_subflow_drop_ctx(struct sock *ssk);
726b6985b9bSPaolo Abeni 
mptcp_subflow_tcp_fallback(struct sock * sk,struct mptcp_subflow_context * ctx)727648ef4b8SMat Martineau static inline void mptcp_subflow_tcp_fallback(struct sock *sk,
728648ef4b8SMat Martineau 					      struct mptcp_subflow_context *ctx)
729648ef4b8SMat Martineau {
730952382c6SFlorian Westphal 	sk->sk_data_ready = sock_def_readable;
731648ef4b8SMat Martineau 	sk->sk_state_change = ctx->tcp_state_change;
732952382c6SFlorian Westphal 	sk->sk_write_space = sk_stream_write_space;
73315cc1045SPaolo Abeni 	sk->sk_error_report = ctx->tcp_error_report;
734648ef4b8SMat Martineau 
735648ef4b8SMat Martineau 	inet_csk(sk)->icsk_af_ops = ctx->icsk_af_ops;
736648ef4b8SMat Martineau }
737648ef4b8SMat Martineau 
738d39dcecaSPaolo Abeni void __init mptcp_proto_init(void);
739784325e9SMatthieu Baerts #if IS_ENABLED(CONFIG_MPTCP_IPV6)
740d39dcecaSPaolo Abeni int __init mptcp_proto_v6_init(void);
741784325e9SMatthieu Baerts #endif
742648ef4b8SMat Martineau 
7437e8b88ecSPaolo Abeni struct sock *mptcp_sk_clone_init(const struct sock *sk,
744cfde141eSPaolo Abeni 				 const struct mptcp_options_received *mp_opt,
7457e8b88ecSPaolo Abeni 				 struct sock *ssk,
746fca5c82cSPaolo Abeni 				 struct request_sock *req);
7470799e21bSGeliang Tang void mptcp_get_options(const struct sk_buff *skb,
748cfde141eSPaolo Abeni 		       struct mptcp_options_received *mp_opt);
749cec37a6eSPeter Krystad 
750cec37a6eSPeter Krystad void mptcp_finish_connect(struct sock *sk);
751cf742d09SPaolo Abeni void __mptcp_sync_state(struct sock *sk, int state);
752f6909dc1SPaolo Abeni void mptcp_reset_tout_timer(struct mptcp_sock *msk, unsigned long fail_tout);
75327e5ccc2SPaolo Abeni 
mptcp_stop_tout_timer(struct sock * sk)75427e5ccc2SPaolo Abeni static inline void mptcp_stop_tout_timer(struct sock *sk)
75527e5ccc2SPaolo Abeni {
75627e5ccc2SPaolo Abeni 	if (!inet_csk(sk)->icsk_mtup.probe_timestamp)
75727e5ccc2SPaolo Abeni 		return;
75827e5ccc2SPaolo Abeni 
75927e5ccc2SPaolo Abeni 	sk_stop_timer(sk, &sk->sk_timer);
76027e5ccc2SPaolo Abeni 	inet_csk(sk)->icsk_mtup.probe_timestamp = 0;
76127e5ccc2SPaolo Abeni }
76227e5ccc2SPaolo Abeni 
mptcp_set_close_tout(struct sock * sk,unsigned long tout)76327e5ccc2SPaolo Abeni static inline void mptcp_set_close_tout(struct sock *sk, unsigned long tout)
76427e5ccc2SPaolo Abeni {
76527e5ccc2SPaolo Abeni 	/* avoid 0 timestamp, as that means no close timeout */
76627e5ccc2SPaolo Abeni 	inet_csk(sk)->icsk_mtup.probe_timestamp = tout ? : 1;
76727e5ccc2SPaolo Abeni }
76827e5ccc2SPaolo Abeni 
mptcp_start_tout_timer(struct sock * sk)76927e5ccc2SPaolo Abeni static inline void mptcp_start_tout_timer(struct sock *sk)
77027e5ccc2SPaolo Abeni {
77127e5ccc2SPaolo Abeni 	mptcp_set_close_tout(sk, tcp_jiffies32);
77227e5ccc2SPaolo Abeni 	mptcp_reset_tout_timer(mptcp_sk(sk), 0);
77327e5ccc2SPaolo Abeni }
77427e5ccc2SPaolo Abeni 
mptcp_is_fully_established(struct sock * sk)775b93df08cSPaolo Abeni static inline bool mptcp_is_fully_established(struct sock *sk)
776b93df08cSPaolo Abeni {
777b93df08cSPaolo Abeni 	return inet_sk_state_load(sk) == TCP_ESTABLISHED &&
778b93df08cSPaolo Abeni 	       READ_ONCE(mptcp_sk(sk)->fully_established);
779b93df08cSPaolo Abeni }
780124a4885SPaolo Abeni 
781a6b118feSFlorian Westphal void mptcp_rcv_space_init(struct mptcp_sock *msk, const struct sock *ssk);
7822e52213cSFlorian Westphal void mptcp_data_ready(struct sock *sk, struct sock *ssk);
783f296234cSPeter Krystad bool mptcp_finish_join(struct sock *sk);
784ba8f48f7SPaolo Abeni bool mptcp_schedule_work(struct sock *sk);
7850abdde82SPaolo Abeni int mptcp_setsockopt(struct sock *sk, int level, int optname,
7860abdde82SPaolo Abeni 		     sockptr_t optval, unsigned int optlen);
7870abdde82SPaolo Abeni int mptcp_getsockopt(struct sock *sk, int level, int optname,
7880abdde82SPaolo Abeni 		     char __user *optval, int __user *option);
7890abdde82SPaolo Abeni 
7901502328fSPaolo Abeni u64 __mptcp_expand_seq(u64 old_seq, u64 cur_seq);
/* Return @cur_seq unchanged when @use_64bit is set; otherwise return the
 * result of __mptcp_expand_seq(@old_seq, @cur_seq).
 */
static inline u64 mptcp_expand_seq(u64 old_seq, u64 cur_seq, bool use_64bit)
{
	return use_64bit ? cur_seq : __mptcp_expand_seq(old_seq, cur_seq);
}
798219d0499SPaolo Abeni void __mptcp_check_push(struct sock *sk, struct sock *ssk);
7997439d687SPaolo Abeni void __mptcp_data_acked(struct sock *sk);
80015cc1045SPaolo Abeni void __mptcp_error_report(struct sock *sk);
8011a49b2c2SMat Martineau bool mptcp_update_rcv_data_fin(struct mptcp_sock *msk, u64 data_fin_seq, bool use_64bit);
mptcp_data_fin_enabled(const struct mptcp_sock * msk)802e16163b6SPaolo Abeni static inline bool mptcp_data_fin_enabled(const struct mptcp_sock *msk)
803e16163b6SPaolo Abeni {
804e16163b6SPaolo Abeni 	return READ_ONCE(msk->snd_data_fin_enable) &&
805e16163b6SPaolo Abeni 	       READ_ONCE(msk->write_seq) == READ_ONCE(msk->snd_nxt);
806e16163b6SPaolo Abeni }
807e16163b6SPaolo Abeni 
mptcp_write_space(struct sock * sk)808b609ecdaSPaolo Abeni static inline void mptcp_write_space(struct sock *sk)
809b609ecdaSPaolo Abeni {
810b609ecdaSPaolo Abeni 	if (sk_stream_is_writeable(sk)) {
811b609ecdaSPaolo Abeni 		/* pairs with memory barrier in mptcp_poll */
812b609ecdaSPaolo Abeni 		smp_mb();
813b609ecdaSPaolo Abeni 		if (test_and_clear_bit(MPTCP_NOSPACE, &mptcp_sk(sk)->flags))
814b609ecdaSPaolo Abeni 			sk_stream_write_space(sk);
815b609ecdaSPaolo Abeni 	}
816b609ecdaSPaolo Abeni }
817b609ecdaSPaolo Abeni 
__mptcp_sync_sndbuf(struct sock * sk)81834c7757aSPaolo Abeni static inline void __mptcp_sync_sndbuf(struct sock *sk)
8195cf92bbaSPaolo Abeni {
82034c7757aSPaolo Abeni 	struct mptcp_subflow_context *subflow;
82134c7757aSPaolo Abeni 	int ssk_sndbuf, new_sndbuf;
8225cf92bbaSPaolo Abeni 
82334c7757aSPaolo Abeni 	if (sk->sk_userlocks & SOCK_SNDBUF_LOCK)
82434c7757aSPaolo Abeni 		return;
82534c7757aSPaolo Abeni 
82634c7757aSPaolo Abeni 	new_sndbuf = sock_net(sk)->ipv4.sysctl_tcp_wmem[0];
82734c7757aSPaolo Abeni 	mptcp_for_each_subflow(mptcp_sk(sk), subflow) {
82834c7757aSPaolo Abeni 		ssk_sndbuf =  READ_ONCE(mptcp_subflow_tcp_sock(subflow)->sk_sndbuf);
82934c7757aSPaolo Abeni 
83034c7757aSPaolo Abeni 		subflow->cached_sndbuf = ssk_sndbuf;
83134c7757aSPaolo Abeni 		new_sndbuf += ssk_sndbuf;
83234c7757aSPaolo Abeni 	}
83334c7757aSPaolo Abeni 
83434c7757aSPaolo Abeni 	/* the msk max wmem limit is <nr_subflows> * tcp wmem[2] */
83534c7757aSPaolo Abeni 	WRITE_ONCE(sk->sk_sndbuf, new_sndbuf);
836b609ecdaSPaolo Abeni 	mptcp_write_space(sk);
83734c7757aSPaolo Abeni }
83834c7757aSPaolo Abeni 
/* The caller held both the msk socket and the subflow socket locks,
 * possibly under BH
 */
__mptcp_propagate_sndbuf(struct sock * sk,struct sock * ssk)84234c7757aSPaolo Abeni static inline void __mptcp_propagate_sndbuf(struct sock *sk, struct sock *ssk)
84334c7757aSPaolo Abeni {
84434c7757aSPaolo Abeni 	struct mptcp_subflow_context *subflow = mptcp_subflow_ctx(ssk);
84534c7757aSPaolo Abeni 
84634c7757aSPaolo Abeni 	if (READ_ONCE(ssk->sk_sndbuf) != subflow->cached_sndbuf)
84734c7757aSPaolo Abeni 		__mptcp_sync_sndbuf(sk);
84834c7757aSPaolo Abeni }
84934c7757aSPaolo Abeni 
/* the caller held only the subflow socket lock, either in process or
 * BH context. Additionally this can be called under the msk data lock,
 * so we can't acquire such lock here: let the delegated action acquire
 * the needed locks in a suitable order.
 */
mptcp_propagate_sndbuf(struct sock * sk,struct sock * ssk)85534c7757aSPaolo Abeni static inline void mptcp_propagate_sndbuf(struct sock *sk, struct sock *ssk)
85634c7757aSPaolo Abeni {
85734c7757aSPaolo Abeni 	struct mptcp_subflow_context *subflow = mptcp_subflow_ctx(ssk);
85834c7757aSPaolo Abeni 
85934c7757aSPaolo Abeni 	if (likely(READ_ONCE(ssk->sk_sndbuf) == subflow->cached_sndbuf))
86034c7757aSPaolo Abeni 		return;
86134c7757aSPaolo Abeni 
86234c7757aSPaolo Abeni 	local_bh_disable();
86334c7757aSPaolo Abeni 	mptcp_subflow_delegate(subflow, MPTCP_DELEGATE_SNDBUF);
86434c7757aSPaolo Abeni 	local_bh_enable();
8655cf92bbaSPaolo Abeni }
8665cf92bbaSPaolo Abeni 
867c0bf3c6aSPaolo Abeni void mptcp_destroy_common(struct mptcp_sock *msk, unsigned int flags);
868cec37a6eSPeter Krystad 
869c68a0cd1SJianguo Wu #define MPTCP_TOKEN_MAX_RETRIES	4
870c68a0cd1SJianguo Wu 
8712c5ebd00SPaolo Abeni void __init mptcp_token_init(void);
mptcp_token_init_request(struct request_sock * req)8722c5ebd00SPaolo Abeni static inline void mptcp_token_init_request(struct request_sock *req)
8732c5ebd00SPaolo Abeni {
8742c5ebd00SPaolo Abeni 	mptcp_subflow_rsk(req)->token_node.pprev = NULL;
8752c5ebd00SPaolo Abeni }
8762c5ebd00SPaolo Abeni 
87779c0949eSPeter Krystad int mptcp_token_new_request(struct request_sock *req);
8782c5ebd00SPaolo Abeni void mptcp_token_destroy_request(struct request_sock *req);
879294de909SMenglong Dong int mptcp_token_new_connect(struct sock *ssk);
8802c5ebd00SPaolo Abeni void mptcp_token_accept(struct mptcp_subflow_request_sock *r,
8812c5ebd00SPaolo Abeni 			struct mptcp_sock *msk);
882c83a47e5SFlorian Westphal bool mptcp_token_exists(u32 token);
883ea1300b9SFlorian Westphal struct mptcp_sock *mptcp_token_get_sock(struct net *net, u32 token);
88496d890daSPaolo Abeni struct mptcp_sock *mptcp_token_iter_next(const struct net *net, long *s_slot,
88596d890daSPaolo Abeni 					 long *s_num);
8862c5ebd00SPaolo Abeni void mptcp_token_destroy(struct mptcp_sock *msk);
88779c0949eSPeter Krystad 
88879c0949eSPeter Krystad void mptcp_crypto_key_sha(u64 key, u32 *token, u64 *idsn);
88979c0949eSPeter Krystad 
8903df523abSPeter Krystad void mptcp_crypto_hmac_sha(u64 key1, u64 key2, u8 *msg, int len, void *hmac);
891ba2c89e0SPaolo Abeni __sum16 __mptcp_make_csum(u64 data_seq, u32 subflow_seq, u16 data_len, __wsum sum);
89279c0949eSPeter Krystad 
893d39dcecaSPaolo Abeni void __init mptcp_pm_init(void);
8941b1c7a0eSPeter Krystad void mptcp_pm_data_init(struct mptcp_sock *msk);
895b29fcfb5SPaolo Abeni void mptcp_pm_data_reset(struct mptcp_sock *msk);
896702c2f64SFlorian Westphal int mptcp_pm_parse_addr(struct nlattr *attr, struct genl_info *info,
897702c2f64SFlorian Westphal 			struct mptcp_addr_info *addr);
8989ab4807cSKishen Maloor int mptcp_pm_parse_entry(struct nlattr *attr, struct genl_info *info,
8999ab4807cSKishen Maloor 			 bool require_family,
9009ab4807cSKishen Maloor 			 struct mptcp_pm_addr_entry *entry);
901fb00ee4fSMatthieu Baerts bool mptcp_pm_addr_families_match(const struct sock *sk,
902fb00ee4fSMatthieu Baerts 				  const struct mptcp_addr_info *loc,
903fb00ee4fSMatthieu Baerts 				  const struct mptcp_addr_info *rem);
90471b7dec2SPaolo Abeni void mptcp_pm_subflow_chk_stale(const struct mptcp_sock *msk, struct sock *ssk);
905ff5a0b42SPaolo Abeni void mptcp_pm_nl_subflow_chk_stale(const struct mptcp_sock *msk, struct sock *ssk);
9066c714f1bSFlorian Westphal void mptcp_pm_new_connection(struct mptcp_sock *msk, const struct sock *ssk, int server_side);
9077a486c44SPaolo Abeni void mptcp_pm_fully_established(struct mptcp_sock *msk, const struct sock *ssk);
9081b1c7a0eSPeter Krystad bool mptcp_pm_allow_new_subflow(struct mptcp_sock *msk);
9091b1c7a0eSPeter Krystad void mptcp_pm_connection_closed(struct mptcp_sock *msk);
91062535200SGeliang Tang void mptcp_pm_subflow_established(struct mptcp_sock *msk);
911a88c9e49SPaolo Abeni bool mptcp_pm_nl_check_work_pending(struct mptcp_sock *msk);
912a88c9e49SPaolo Abeni void mptcp_pm_subflow_check_next(struct mptcp_sock *msk, const struct sock *ssk,
913a88c9e49SPaolo Abeni 				 const struct mptcp_subflow_context *subflow);
914d1ace2d9SKishen Maloor void mptcp_pm_add_addr_received(const struct sock *ssk,
9151b1c7a0eSPeter Krystad 				const struct mptcp_addr_info *addr);
916557963c3SGeliang Tang void mptcp_pm_add_addr_echoed(struct mptcp_sock *msk,
91790d93088SPaolo Abeni 			      const struct mptcp_addr_info *addr);
91884dfe367SGeliang Tang void mptcp_pm_add_addr_send_ack(struct mptcp_sock *msk);
919dc14d542SMatthieu Baerts (NGI0) bool mptcp_pm_nl_is_init_remote_addr(struct mptcp_sock *msk,
920dc14d542SMatthieu Baerts (NGI0) 				     const struct mptcp_addr_info *remote);
921b46a0238SGeliang Tang void mptcp_pm_nl_addr_send_ack(struct mptcp_sock *msk);
9225c4a824dSGeliang Tang void mptcp_pm_rm_addr_received(struct mptcp_sock *msk,
9235c4a824dSGeliang Tang 			       const struct mptcp_rm_list *rm_list);
92440453a5cSGeliang Tang void mptcp_pm_mp_prio_received(struct sock *sk, u8 bkup);
9255580d41bSGeliang Tang void mptcp_pm_mp_fail_received(struct sock *sk, u64 fail_seq);
926892f396cSKishen Maloor int mptcp_pm_nl_mp_prio_send_ack(struct mptcp_sock *msk,
927892f396cSKishen Maloor 				 struct mptcp_addr_info *addr,
928892f396cSKishen Maloor 				 struct mptcp_addr_info *rem,
929892f396cSKishen Maloor 				 u8 bkup);
9309ab4807cSKishen Maloor bool mptcp_pm_alloc_anno_list(struct mptcp_sock *msk,
931528cb5f2SGeliang Tang 			      const struct mptcp_addr_info *addr);
932b6c08380SGeliang Tang void mptcp_pm_free_anno_list(struct mptcp_sock *msk);
9335bc56388SGeliang Tang bool mptcp_pm_sport_in_anno_list(struct mptcp_sock *msk, const struct sock *sk);
93400cfd77bSGeliang Tang struct mptcp_pm_add_entry *
93500cfd77bSGeliang Tang mptcp_pm_del_add_timer(struct mptcp_sock *msk,
93690d93088SPaolo Abeni 		       const struct mptcp_addr_info *addr, bool check_id);
937d88c476fSGeliang Tang struct mptcp_pm_add_entry *
93890d93088SPaolo Abeni mptcp_lookup_anno_list_by_saddr(const struct mptcp_sock *msk,
93990d93088SPaolo Abeni 				const struct mptcp_addr_info *addr);
9408b201370SKishen Maloor int mptcp_pm_get_flags_and_ifindex_by_id(struct mptcp_sock *msk,
9418b201370SKishen Maloor 					 unsigned int id,
9428b201370SKishen Maloor 					 u8 *flags, int *ifindex);
943f40be0dbSGeliang Tang int mptcp_pm_nl_get_flags_and_ifindex_by_id(struct mptcp_sock *msk, unsigned int id,
944f40be0dbSGeliang Tang 					    u8 *flags, int *ifindex);
9458b201370SKishen Maloor int mptcp_userspace_pm_get_flags_and_ifindex_by_id(struct mptcp_sock *msk,
9468b201370SKishen Maloor 						   unsigned int id,
947ee285257SGeliang Tang 						   u8 *flags, int *ifindex);
9486ba7ce89SGeliang Tang int mptcp_pm_set_flags(struct net *net, struct nlattr *token,
9496ba7ce89SGeliang Tang 		       struct mptcp_pm_addr_entry *loc,
9506ba7ce89SGeliang Tang 		       struct mptcp_pm_addr_entry *rem, u8 bkup);
9516ba7ce89SGeliang Tang int mptcp_pm_nl_set_flags(struct net *net, struct mptcp_pm_addr_entry *addr, u8 bkup);
952892f396cSKishen Maloor int mptcp_userspace_pm_set_flags(struct net *net, struct nlattr *token,
953892f396cSKishen Maloor 				 struct mptcp_pm_addr_entry *loc,
954892f396cSKishen Maloor 				 struct mptcp_pm_addr_entry *rem, u8 bkup);
9551b1c7a0eSPeter Krystad int mptcp_pm_announce_addr(struct mptcp_sock *msk,
9566a6c05a8SGeliang Tang 			   const struct mptcp_addr_info *addr,
957f7efc777SGeliang Tang 			   bool echo);
958cbde2787SGeliang Tang int mptcp_pm_remove_addr(struct mptcp_sock *msk, const struct mptcp_rm_list *rm_list);
9598b1c94daSGeliang Tang void mptcp_pm_remove_addrs(struct mptcp_sock *msk, struct list_head *rm_list);
960d9a4594eSKishen Maloor 
9614638de5aSKishen Maloor void mptcp_free_local_addr_list(struct mptcp_sock *msk);
9629ab4807cSKishen Maloor int mptcp_nl_cmd_announce(struct sk_buff *skb, struct genl_info *info);
963d9a4594eSKishen Maloor int mptcp_nl_cmd_remove(struct sk_buff *skb, struct genl_info *info);
964702c2f64SFlorian Westphal int mptcp_nl_cmd_sf_create(struct sk_buff *skb, struct genl_info *info);
965702c2f64SFlorian Westphal int mptcp_nl_cmd_sf_destroy(struct sk_buff *skb, struct genl_info *info);
9661b1c7a0eSPeter Krystad 
967b911c97cSFlorian Westphal void mptcp_event(enum mptcp_event_type type, const struct mptcp_sock *msk,
968b911c97cSFlorian Westphal 		 const struct sock *ssk, gfp_t gfp);
969d1ace2d9SKishen Maloor void mptcp_event_addr_announced(const struct sock *ssk, const struct mptcp_addr_info *info);
970b911c97cSFlorian Westphal void mptcp_event_addr_removed(const struct mptcp_sock *msk, u8 id);
971f8c9dfbdSGeliang Tang void mptcp_event_pm_listener(const struct sock *ssk,
972f8c9dfbdSGeliang Tang 			     enum mptcp_event_type event);
9734d25247dSKishen Maloor bool mptcp_userspace_pm_active(const struct mptcp_sock *msk);
974b911c97cSFlorian Westphal 
975b45df837SPaolo Abeni void __mptcp_fastopen_gen_msk_ackseq(struct mptcp_sock *msk, struct mptcp_subflow_context *subflow,
976dfc8d060SDmytro Shytyi 				     const struct mptcp_options_received *mp_opt);
97736b122baSDmytro Shytyi void mptcp_fastopen_subflow_synack_set_params(struct mptcp_subflow_context *subflow,
97836b122baSDmytro Shytyi 					      struct request_sock *req);
979dfc8d060SDmytro Shytyi 
mptcp_pm_should_add_signal(struct mptcp_sock * msk)980f643b803SGeliang Tang static inline bool mptcp_pm_should_add_signal(struct mptcp_sock *msk)
9811b1c7a0eSPeter Krystad {
98218fc1a92SYonglong Li 	return READ_ONCE(msk->pm.addr_signal) &
98318fc1a92SYonglong Li 		(BIT(MPTCP_ADD_ADDR_SIGNAL) | BIT(MPTCP_ADD_ADDR_ECHO));
98418fc1a92SYonglong Li }
98518fc1a92SYonglong Li 
mptcp_pm_should_add_signal_addr(struct mptcp_sock * msk)98618fc1a92SYonglong Li static inline bool mptcp_pm_should_add_signal_addr(struct mptcp_sock *msk)
98718fc1a92SYonglong Li {
98813ad9f01SGeliang Tang 	return READ_ONCE(msk->pm.addr_signal) & BIT(MPTCP_ADD_ADDR_SIGNAL);
989d91d322aSGeliang Tang }
990d91d322aSGeliang Tang 
mptcp_pm_should_add_signal_echo(struct mptcp_sock * msk)991d91d322aSGeliang Tang static inline bool mptcp_pm_should_add_signal_echo(struct mptcp_sock *msk)
992d91d322aSGeliang Tang {
99313ad9f01SGeliang Tang 	return READ_ONCE(msk->pm.addr_signal) & BIT(MPTCP_ADD_ADDR_ECHO);
9941b1c7a0eSPeter Krystad }
9951b1c7a0eSPeter Krystad 
mptcp_pm_should_rm_signal(struct mptcp_sock * msk)9965cb104aeSGeliang Tang static inline bool mptcp_pm_should_rm_signal(struct mptcp_sock *msk)
9975cb104aeSGeliang Tang {
99813ad9f01SGeliang Tang 	return READ_ONCE(msk->pm.addr_signal) & BIT(MPTCP_RM_ADDR_SIGNAL);
9995cb104aeSGeliang Tang }
10005cb104aeSGeliang Tang 
mptcp_pm_is_userspace(const struct mptcp_sock * msk)100114b06811SMat Martineau static inline bool mptcp_pm_is_userspace(const struct mptcp_sock *msk)
100214b06811SMat Martineau {
100314b06811SMat Martineau 	return READ_ONCE(msk->pm.pm_type) == MPTCP_PM_TYPE_USERSPACE;
100414b06811SMat Martineau }
100514b06811SMat Martineau 
mptcp_pm_is_kernel(const struct mptcp_sock * msk)10064d25247dSKishen Maloor static inline bool mptcp_pm_is_kernel(const struct mptcp_sock *msk)
10074d25247dSKishen Maloor {
10084d25247dSKishen Maloor 	return READ_ONCE(msk->pm.pm_type) == MPTCP_PM_TYPE_KERNEL;
10094d25247dSKishen Maloor }
10104d25247dSKishen Maloor 
/* Compute the length of an ADD_ADDR option.
 *
 * @family: AF_INET6 selects the IPv6 base length, anything else the
 *          default base length
 * @echo:   when false, MPTCPOPT_THMAC_LEN is added
 * @port:   when true, the port length plus its alignment are added
 */
static inline unsigned int mptcp_add_addr_len(int family, bool echo, bool port)
{
	u8 len = (family == AF_INET6) ? TCPOLEN_MPTCP_ADD_ADDR6_BASE :
					TCPOLEN_MPTCP_ADD_ADDR_BASE;

	if (!echo)
		len += MPTCPOPT_THMAC_LEN;

	/* account for 2 trailing 'nop' options */
	if (port)
		len += TCPOLEN_MPTCP_PORT_LEN + TCPOLEN_MPTCP_PORT_ALIGN;

	return len;
}
10251b1c7a0eSPeter Krystad 
mptcp_rm_addr_len(const struct mptcp_rm_list * rm_list)10266445e17aSGeliang Tang static inline int mptcp_rm_addr_len(const struct mptcp_rm_list *rm_list)
10276445e17aSGeliang Tang {
10286445e17aSGeliang Tang 	if (rm_list->nr == 0 || rm_list->nr > MPTCP_RM_IDS_MAX)
10296445e17aSGeliang Tang 		return -EINVAL;
10306445e17aSGeliang Tang 
10316445e17aSGeliang Tang 	return TCPOLEN_MPTCP_RM_ADDR_BASE + roundup(rm_list->nr - 1, 4) + 1;
10326445e17aSGeliang Tang }
10336445e17aSGeliang Tang 
103490d93088SPaolo Abeni bool mptcp_pm_add_addr_signal(struct mptcp_sock *msk, const struct sk_buff *skb,
10351f5e9e2fSYonglong Li 			      unsigned int opt_size, unsigned int remaining,
1036f462a446SYonglong Li 			      struct mptcp_addr_info *addr, bool *echo,
1037af7939f3SGeliang Tang 			      bool *drop_other_suboptions);
10385cb104aeSGeliang Tang bool mptcp_pm_rm_addr_signal(struct mptcp_sock *msk, unsigned int remaining,
10396445e17aSGeliang Tang 			     struct mptcp_rm_list *rm_list);
10401b1c7a0eSPeter Krystad int mptcp_pm_get_local_id(struct mptcp_sock *msk, struct sock_common *skc);
10419bbec87eSGeliang Tang int mptcp_pm_nl_get_local_id(struct mptcp_sock *msk, struct mptcp_addr_info *skc);
10428b201370SKishen Maloor int mptcp_userspace_pm_get_local_id(struct mptcp_sock *msk, struct mptcp_addr_info *skc);
1043fff9b920SMatthieu Baerts (NGI0) bool mptcp_pm_is_backup(struct mptcp_sock *msk, struct sock_common *skc);
1044fff9b920SMatthieu Baerts (NGI0) bool mptcp_pm_nl_is_backup(struct mptcp_sock *msk, struct mptcp_addr_info *skc);
1045fff9b920SMatthieu Baerts (NGI0) bool mptcp_userspace_pm_is_backup(struct mptcp_sock *msk, struct mptcp_addr_info *skc);
10461b1c7a0eSPeter Krystad 
subflow_get_local_id(const struct mptcp_subflow_context * subflow)1047ba2cf922SPaolo Abeni static inline u8 subflow_get_local_id(const struct mptcp_subflow_context *subflow)
1048ba2cf922SPaolo Abeni {
1049ba2cf922SPaolo Abeni 	int local_id = READ_ONCE(subflow->local_id);
1050ba2cf922SPaolo Abeni 
1051ba2cf922SPaolo Abeni 	if (local_id < 0)
1052ba2cf922SPaolo Abeni 		return 0;
1053ba2cf922SPaolo Abeni 	return local_id;
1054ba2cf922SPaolo Abeni }
1055ba2cf922SPaolo Abeni 
1056d39dcecaSPaolo Abeni void __init mptcp_pm_nl_init(void);
1057e9801430SFlorian Westphal void mptcp_pm_nl_work(struct mptcp_sock *msk);
105890d93088SPaolo Abeni unsigned int mptcp_pm_get_add_addr_signal_max(const struct mptcp_sock *msk);
105990d93088SPaolo Abeni unsigned int mptcp_pm_get_add_addr_accept_max(const struct mptcp_sock *msk);
106090d93088SPaolo Abeni unsigned int mptcp_pm_get_subflows_max(const struct mptcp_sock *msk);
106190d93088SPaolo Abeni unsigned int mptcp_pm_get_local_addr_max(const struct mptcp_sock *msk);
106201cacb00SPaolo Abeni 
106395d68651SPaolo Abeni /* called under PM lock */
__mptcp_pm_close_subflow(struct mptcp_sock * msk)106495d68651SPaolo Abeni static inline void __mptcp_pm_close_subflow(struct mptcp_sock *msk)
106595d68651SPaolo Abeni {
106695d68651SPaolo Abeni 	if (--msk->pm.subflows < mptcp_pm_get_subflows_max(msk))
106795d68651SPaolo Abeni 		WRITE_ONCE(msk->pm.accept_subflow, true);
106895d68651SPaolo Abeni }
106995d68651SPaolo Abeni 
mptcp_pm_close_subflow(struct mptcp_sock * msk)107095d68651SPaolo Abeni static inline void mptcp_pm_close_subflow(struct mptcp_sock *msk)
107195d68651SPaolo Abeni {
107295d68651SPaolo Abeni 	spin_lock_bh(&msk->pm.lock);
107395d68651SPaolo Abeni 	__mptcp_pm_close_subflow(msk);
107495d68651SPaolo Abeni 	spin_unlock_bh(&msk->pm.lock);
107595d68651SPaolo Abeni }
107695d68651SPaolo Abeni 
107778962489SFlorian Westphal void mptcp_sockopt_sync(struct mptcp_sock *msk, struct sock *ssk);
10783e501490SPaolo Abeni void mptcp_sockopt_sync_locked(struct mptcp_sock *msk, struct sock *ssk);
107978962489SFlorian Westphal 
mptcp_get_ext(const struct sk_buff * skb)1080dc87efdbSFlorian Westphal static inline struct mptcp_ext *mptcp_get_ext(const struct sk_buff *skb)
10816d0060f6SMat Martineau {
10826d0060f6SMat Martineau 	return (struct mptcp_ext *)skb_ext_find(skb, SKB_EXT_MPTCP);
10836d0060f6SMat Martineau }
10846d0060f6SMat Martineau 
10855147dfb5SDavide Caratti void mptcp_diag_subflow_init(struct tcp_ulp_ops *ops);
10865147dfb5SDavide Caratti 
__mptcp_check_fallback(const struct mptcp_sock * msk)1087d5f49190SPaolo Abeni static inline bool __mptcp_check_fallback(const struct mptcp_sock *msk)
1088e1ff9e82SDavide Caratti {
1089e1ff9e82SDavide Caratti 	return test_bit(MPTCP_FALLBACK_DONE, &msk->flags);
1090e1ff9e82SDavide Caratti }
1091e1ff9e82SDavide Caratti 
mptcp_check_fallback(const struct sock * sk)1092d5f49190SPaolo Abeni static inline bool mptcp_check_fallback(const struct sock *sk)
1093e1ff9e82SDavide Caratti {
1094e1ff9e82SDavide Caratti 	struct mptcp_subflow_context *subflow = mptcp_subflow_ctx(sk);
1095e1ff9e82SDavide Caratti 	struct mptcp_sock *msk = mptcp_sk(subflow->conn);
1096e1ff9e82SDavide Caratti 
1097e1ff9e82SDavide Caratti 	return __mptcp_check_fallback(msk);
1098e1ff9e82SDavide Caratti }
1099e1ff9e82SDavide Caratti 
__mptcp_do_fallback(struct mptcp_sock * msk)1100e1ff9e82SDavide Caratti static inline void __mptcp_do_fallback(struct mptcp_sock *msk)
1101e1ff9e82SDavide Caratti {
1102e1ff9e82SDavide Caratti 	if (test_bit(MPTCP_FALLBACK_DONE, &msk->flags)) {
11033d2e1b82SMatthieu Baerts (NGI0) 		pr_debug("TCP fallback already done (msk=%p)\n", msk);
1104e1ff9e82SDavide Caratti 		return;
1105e1ff9e82SDavide Caratti 	}
1106*47f42722SMatthieu Baerts (NGI0) 	if (WARN_ON_ONCE(!READ_ONCE(msk->allow_infinite_fallback)))
1107*47f42722SMatthieu Baerts (NGI0) 		return;
1108e1ff9e82SDavide Caratti 	set_bit(MPTCP_FALLBACK_DONE, &msk->flags);
1109e1ff9e82SDavide Caratti }
1110e1ff9e82SDavide Caratti 
1111d51991e2SPaolo Abeni static inline void mptcp_do_fallback(struct sock *ssk)
1112e1ff9e82SDavide Caratti {
1113d51991e2SPaolo Abeni 	struct mptcp_subflow_context *subflow = mptcp_subflow_ctx(ssk);
1114d51991e2SPaolo Abeni 	struct sock *sk = subflow->conn;
1115d51991e2SPaolo Abeni 	struct mptcp_sock *msk;
1116e1ff9e82SDavide Caratti 
1117d51991e2SPaolo Abeni 	msk = mptcp_sk(sk);
1118e1ff9e82SDavide Caratti 	__mptcp_do_fallback(msk);
1119d51991e2SPaolo Abeni 	if (READ_ONCE(msk->snd_data_fin_enable) && !(ssk->sk_shutdown & SEND_SHUTDOWN)) {
1120d51991e2SPaolo Abeni 		gfp_t saved_allocation = ssk->sk_allocation;
1121d51991e2SPaolo Abeni 
1122d51991e2SPaolo Abeni 		/* we are in a atomic (BH) scope, override ssk default for data
1123d51991e2SPaolo Abeni 		 * fin allocation
1124d51991e2SPaolo Abeni 		 */
1125d51991e2SPaolo Abeni 		ssk->sk_allocation = GFP_ATOMIC;
1126d51991e2SPaolo Abeni 		ssk->sk_shutdown |= SEND_SHUTDOWN;
1127d51991e2SPaolo Abeni 		tcp_shutdown(ssk, SEND_SHUTDOWN);
1128d51991e2SPaolo Abeni 		ssk->sk_allocation = saved_allocation;
1129d51991e2SPaolo Abeni 	}
1130e1ff9e82SDavide Caratti }
1131e1ff9e82SDavide Caratti 
/* Debug trace: prints the calling function's name and the given msk pointer. */
#define pr_fallback(msk) pr_debug("%s:fallback to TCP (msk=%p)\n", __func__, msk)
1133e1ff9e82SDavide Caratti 
11341e39e5a3SGeliang Tang static inline bool mptcp_check_infinite_map(struct sk_buff *skb)
11351e39e5a3SGeliang Tang {
11361e39e5a3SGeliang Tang 	struct mptcp_ext *mpext;
11371e39e5a3SGeliang Tang 
11381e39e5a3SGeliang Tang 	mpext = skb ? mptcp_get_ext(skb) : NULL;
11391e39e5a3SGeliang Tang 	if (mpext && mpext->infinite_map)
11401e39e5a3SGeliang Tang 		return true;
11411e39e5a3SGeliang Tang 
11421e39e5a3SGeliang Tang 	return false;
11431e39e5a3SGeliang Tang }
11441e39e5a3SGeliang Tang 
114570c708e8SKishen Maloor static inline bool is_active_ssk(struct mptcp_subflow_context *subflow)
114670c708e8SKishen Maloor {
114770c708e8SKishen Maloor 	return (subflow->request_mptcp || subflow->request_join);
subflow_simultaneous_connect(struct sock * sk)114870c708e8SKishen Maloor }
114970c708e8SKishen Maloor 
11508fd73804SDavide Caratti static inline bool subflow_simultaneous_connect(struct sock *sk)
11518fd73804SDavide Caratti {
11528fd73804SDavide Caratti 	struct mptcp_subflow_context *subflow = mptcp_subflow_ctx(sk);
11538fd73804SDavide Caratti 
11544bfe217eSPaolo Abeni 	return (1 << sk->sk_state) &
11554bfe217eSPaolo Abeni 	       (TCPF_ESTABLISHED | TCPF_FIN_WAIT1 | TCPF_FIN_WAIT2 | TCPF_CLOSING) &&
115670c708e8SKishen Maloor 	       is_active_ssk(subflow) &&
11578fd73804SDavide Caratti 	       !subflow->conn_finished;
11588fd73804SDavide Caratti }
11598fd73804SDavide Caratti 
11609466a1ccSFlorian Westphal #ifdef CONFIG_SYN_COOKIES
11619466a1ccSFlorian Westphal void subflow_init_req_cookie_join_save(const struct mptcp_subflow_request_sock *subflow_req,
11629466a1ccSFlorian Westphal 				       struct sk_buff *skb);
11639466a1ccSFlorian Westphal bool mptcp_token_join_cookie_init_state(struct mptcp_subflow_request_sock *subflow_req,
11649466a1ccSFlorian Westphal 					struct sk_buff *skb);
11659466a1ccSFlorian Westphal void __init mptcp_join_cookie_init(void);
subflow_init_req_cookie_join_save(const struct mptcp_subflow_request_sock * subflow_req,struct sk_buff * skb)11669466a1ccSFlorian Westphal #else
11679466a1ccSFlorian Westphal static inline void
11689466a1ccSFlorian Westphal subflow_init_req_cookie_join_save(const struct mptcp_subflow_request_sock *subflow_req,
11699466a1ccSFlorian Westphal 				  struct sk_buff *skb) {}
11709466a1ccSFlorian Westphal static inline bool
11719466a1ccSFlorian Westphal mptcp_token_join_cookie_init_state(struct mptcp_subflow_request_sock *subflow_req,
11729466a1ccSFlorian Westphal 				   struct sk_buff *skb)
11739466a1ccSFlorian Westphal {
11749466a1ccSFlorian Westphal 	return false;
mptcp_join_cookie_init(void)11759466a1ccSFlorian Westphal }
11769466a1ccSFlorian Westphal 
11779466a1ccSFlorian Westphal static inline void mptcp_join_cookie_init(void) {}
11789466a1ccSFlorian Westphal #endif
11799466a1ccSFlorian Westphal 
1180f870fa0bSMat Martineau #endif /* __MPTCP_PROTOCOL_H */
1181