/* SPDX-License-Identifier: GPL-2.0 */
/* Multipath TCP
 *
 * Copyright (c) 2017 - 2019, Intel Corporation.
 */
6f870fa0bSMat Martineau
7f870fa0bSMat Martineau #ifndef __MPTCP_PROTOCOL_H
8f870fa0bSMat Martineau #define __MPTCP_PROTOCOL_H
9f870fa0bSMat Martineau
1079c0949eSPeter Krystad #include <linux/random.h>
1179c0949eSPeter Krystad #include <net/tcp.h>
1279c0949eSPeter Krystad #include <net/inet_connection_sock.h>
13b911c97cSFlorian Westphal #include <uapi/linux/mptcp.h>
149ab4807cSKishen Maloor #include <net/genetlink.h>
1579c0949eSPeter Krystad
/* Protocol version number advertised/accepted by this implementation. */
#define MPTCP_SUPPORTED_VERSION	1

/* MPTCP option bits: one bit per suboption kind, so that several can be
 * combined in a single mask (bits 0..13 are used here).
 */
#define OPTION_MPTCP_MPC_SYN	BIT(0)
#define OPTION_MPTCP_MPC_SYNACK	BIT(1)
#define OPTION_MPTCP_MPC_ACK	BIT(2)
#define OPTION_MPTCP_MPJ_SYN	BIT(3)
#define OPTION_MPTCP_MPJ_SYNACK	BIT(4)
#define OPTION_MPTCP_MPJ_ACK	BIT(5)
#define OPTION_MPTCP_ADD_ADDR	BIT(6)
#define OPTION_MPTCP_RM_ADDR	BIT(7)
#define OPTION_MPTCP_FASTCLOSE	BIT(8)
#define OPTION_MPTCP_PRIO	BIT(9)
#define OPTION_MPTCP_RST	BIT(10)
#define OPTION_MPTCP_DSS	BIT(11)
#define OPTION_MPTCP_FAIL	BIT(12)

#define OPTION_MPTCP_CSUMREQD	BIT(13)

/* Any of the three MP_CAPABLE handshake variants. */
#define OPTIONS_MPTCP_MPC	(OPTION_MPTCP_MPC_SYN | OPTION_MPTCP_MPC_SYNACK | \
				 OPTION_MPTCP_MPC_ACK)
/* Any of the three MP_JOIN handshake variants. */
#define OPTIONS_MPTCP_MPJ	(OPTION_MPTCP_MPJ_SYN | OPTION_MPTCP_MPJ_SYNACK | \
				 OPTION_MPTCP_MPJ_ACK)
3974c7dfbeSPaolo Abeni
/* MPTCP option subtypes (value of the 4-bit subtype field; see
 * mptcp_option(), which places it in bits 12..15 of the first option word)
 */
#define MPTCPOPT_MP_CAPABLE	0
#define MPTCPOPT_MP_JOIN	1
#define MPTCPOPT_DSS		2
#define MPTCPOPT_ADD_ADDR	3
#define MPTCPOPT_RM_ADDR	4
#define MPTCPOPT_MP_PRIO	5
#define MPTCPOPT_MP_FAIL	6
#define MPTCPOPT_MP_FASTCLOSE	7
#define MPTCPOPT_RST		8
50eda7acddSPeter Krystad
/* MPTCP suboption lengths, in bytes */
#define TCPOLEN_MPTCP_MPC_SYN		4
#define TCPOLEN_MPTCP_MPC_SYNACK	12
#define TCPOLEN_MPTCP_MPC_ACK		20
#define TCPOLEN_MPTCP_MPC_ACK_DATA	22
#define TCPOLEN_MPTCP_MPJ_SYN		12
#define TCPOLEN_MPTCP_MPJ_SYNACK	16
#define TCPOLEN_MPTCP_MPJ_ACK		24
#define TCPOLEN_MPTCP_DSS_BASE		4
#define TCPOLEN_MPTCP_DSS_ACK32		4
#define TCPOLEN_MPTCP_DSS_ACK64		8
#define TCPOLEN_MPTCP_DSS_MAP32		10
#define TCPOLEN_MPTCP_DSS_MAP64		14
#define TCPOLEN_MPTCP_DSS_CHECKSUM	2
#define TCPOLEN_MPTCP_ADD_ADDR		16
#define TCPOLEN_MPTCP_ADD_ADDR_PORT	18
#define TCPOLEN_MPTCP_ADD_ADDR_BASE	8
#define TCPOLEN_MPTCP_ADD_ADDR_BASE_PORT	10
#define TCPOLEN_MPTCP_ADD_ADDR6		28
#define TCPOLEN_MPTCP_ADD_ADDR6_PORT	30
#define TCPOLEN_MPTCP_ADD_ADDR6_BASE	20
#define TCPOLEN_MPTCP_ADD_ADDR6_BASE_PORT	22
#define TCPOLEN_MPTCP_PORT_LEN		2
#define TCPOLEN_MPTCP_PORT_ALIGN	2
#define TCPOLEN_MPTCP_RM_ADDR_BASE	3
#define TCPOLEN_MPTCP_PRIO		3
#define TCPOLEN_MPTCP_PRIO_ALIGN	4
#define TCPOLEN_MPTCP_FASTCLOSE		12
#define TCPOLEN_MPTCP_RST		4
#define TCPOLEN_MPTCP_FAIL		12

/* MP_CAPABLE ACK carrying data plus the trailing DSS checksum field */
#define TCPOLEN_MPTCP_MPC_ACK_DATA_CSUM	(TCPOLEN_MPTCP_DSS_CHECKSUM + TCPOLEN_MPTCP_MPC_ACK_DATA)
83208e8f66SGeliang Tang
/* MPTCP MP_JOIN flags */
#define MPTCPOPT_BACKUP		BIT(0)
#define MPTCPOPT_THMAC_LEN	8

/* MPTCP MP_CAPABLE flags */
#define MPTCP_VERSION_MASK	(0x0F)
#define MPTCP_CAP_CHECKSUM_REQD	BIT(7)
#define MPTCP_CAP_EXTENSIBILITY	BIT(6)
#define MPTCP_CAP_DENY_JOIN_ID0	BIT(5)
#define MPTCP_CAP_HMAC_SHA256	BIT(0)
#define MPTCP_CAP_FLAG_MASK	(0x1F)

/* MPTCP DSS flags */
#define MPTCP_DSS_DATA_FIN	BIT(4)
#define MPTCP_DSS_DSN64		BIT(3)
#define MPTCP_DSS_HAS_MAP	BIT(2)
#define MPTCP_DSS_ACK64		BIT(1)
#define MPTCP_DSS_HAS_ACK	BIT(0)
/* covers the five DSS flag bits defined above (bits 0..4) */
#define MPTCP_DSS_FLAG_MASK	(0x1F)

/* MPTCP ADD_ADDR flags */
#define MPTCP_ADDR_ECHO		BIT(0)

/* MPTCP MP_PRIO flags */
#define MPTCP_PRIO_BKUP		BIT(0)

/* MPTCP TCPRST flags */
#define MPTCP_RST_TRANSIENT	BIT(0)
112dc87efdbSFlorian Westphal
/* MPTCP socket atomic flags: bit numbers, not masks.
 * NOTE(review): presumably used with the atomic bitops on
 * mptcp_sock.flags - confirm against the callers.
 */
#define MPTCP_NOSPACE		1
#define MPTCP_WORK_RTX		2
#define MPTCP_FALLBACK_DONE	4
#define MPTCP_WORK_CLOSE_SUBFLOW 5

/* MPTCP socket release cb flags: bit numbers, not masks.
 * NOTE(review): presumably stored in mptcp_sock.cb_flags - confirm.
 */
#define MPTCP_PUSH_PENDING	1
#define MPTCP_CLEAN_UNA		2
#define MPTCP_ERROR_REPORT	3
#define MPTCP_RETRANSMIT	4
#define MPTCP_FLUSH_JOIN_LIST	5
#define MPTCP_SYNC_STATE	6
#define MPTCP_SYNC_SNDBUF	7
1276d0060f6SMat Martineau
128dfc8d060SDmytro Shytyi struct mptcp_skb_cb {
129dfc8d060SDmytro Shytyi u64 map_seq;
130dfc8d060SDmytro Shytyi u64 end_seq;
131dfc8d060SDmytro Shytyi u32 offset;
132dfc8d060SDmytro Shytyi u8 has_rxtstamp:1;
133dfc8d060SDmytro Shytyi };
134dfc8d060SDmytro Shytyi
135dfc8d060SDmytro Shytyi #define MPTCP_SKB_CB(__skb) ((struct mptcp_skb_cb *)&((__skb)->cb[0]))
136dfc8d060SDmytro Shytyi
/* Wrap-safe comparison of 64-bit sequence numbers.
 *
 * Returns true when @seq1 precedes @seq2: the unsigned difference is
 * reinterpreted as signed, so the result stays correct across a wrap of
 * the sequence space as long as the two values are less than 2^63 apart.
 */
static inline bool before64(__u64 seq1, __u64 seq2)
{
	return (__s64)(seq1 - seq2) < 0;
}

/* after64(a, b) is true when @a follows @b, i.e. before64(b, a) */
#define after64(seq2, seq1)	before64(seq1, seq2)
143eaa2ffabSPaolo Abeni
144cfde141eSPaolo Abeni struct mptcp_options_received {
145cfde141eSPaolo Abeni u64 sndr_key;
146cfde141eSPaolo Abeni u64 rcvr_key;
147cfde141eSPaolo Abeni u64 data_ack;
148cfde141eSPaolo Abeni u64 data_seq;
149cfde141eSPaolo Abeni u32 subflow_seq;
150cfde141eSPaolo Abeni u16 data_len;
151208e8f66SGeliang Tang __sum16 csum;
1527f6c72b8SPaolo Abeni struct_group(status,
15374c7dfbeSPaolo Abeni u16 suboptions;
154a086aebaSPaolo Abeni u16 use_map:1,
155cfde141eSPaolo Abeni dsn64:1,
156cfde141eSPaolo Abeni data_fin:1,
157cfde141eSPaolo Abeni use_ack:1,
158cfde141eSPaolo Abeni ack64:1,
159cfde141eSPaolo Abeni mpc_map:1,
160a086aebaSPaolo Abeni reset_reason:4,
161a086aebaSPaolo Abeni reset_transient:1,
162a086aebaSPaolo Abeni echo:1,
163a086aebaSPaolo Abeni backup:1,
164a086aebaSPaolo Abeni deny_join_id0:1,
165cfde141eSPaolo Abeni __unused:2;
1667f6c72b8SPaolo Abeni );
167a086aebaSPaolo Abeni u8 join_id;
1687f6c72b8SPaolo Abeni u32 token;
1697f6c72b8SPaolo Abeni u32 nonce;
170a086aebaSPaolo Abeni u64 thmac;
171a086aebaSPaolo Abeni u8 hmac[MPTCPOPT_HMAC_LEN];
172f7dafee1SGeliang Tang struct mptcp_addr_info addr;
1735c4a824dSGeliang Tang struct mptcp_rm_list rm_list;
174cfde141eSPaolo Abeni u64 ahmac;
1755580d41bSGeliang Tang u64 fail_seq;
176cfde141eSPaolo Abeni };
177cfde141eSPaolo Abeni
mptcp_option(u8 subopt,u8 len,u8 nib,u8 field)1783df523abSPeter Krystad static inline __be32 mptcp_option(u8 subopt, u8 len, u8 nib, u8 field)
1793df523abSPeter Krystad {
1803df523abSPeter Krystad return htonl((TCPOPT_MPTCP << 24) | (len << 16) | (subopt << 12) |
1813df523abSPeter Krystad ((nib & 0xF) << 8) | field);
1823df523abSPeter Krystad }
1833df523abSPeter Krystad
/* Path manager status bit numbers.
 *
 * Entries below MPTCP_PM_ALREADY_ESTABLISHED are the ones that need pm
 * worker actions (see MPTCP_PM_WORK_MASK); the last two are persistent.
 */
enum mptcp_pm_status {
	MPTCP_PM_ADD_ADDR_RECEIVED,
	MPTCP_PM_ADD_ADDR_SEND_ACK,
	MPTCP_PM_RM_ADDR_RECEIVED,
	MPTCP_PM_ESTABLISHED,
	MPTCP_PM_SUBFLOW_ESTABLISHED,
	MPTCP_PM_ALREADY_ESTABLISHED,	/* persistent status, set after ESTABLISHED event */
	MPTCP_PM_MPC_ENDPOINT_ACCOUNTED	/* persistent status, set after MPC local address is
					 * accounted into id_avail_bitmap
					 */
};
1951b1c7a0eSPeter Krystad
/* Path manager flavours. __MPTCP_PM_TYPE_NR counts the real entries and
 * __MPTCP_PM_TYPE_MAX is the highest valid value.
 */
enum mptcp_pm_type {
	MPTCP_PM_TYPE_KERNEL = 0,
	MPTCP_PM_TYPE_USERSPACE,

	__MPTCP_PM_TYPE_NR,
	__MPTCP_PM_TYPE_MAX = __MPTCP_PM_TYPE_NR - 1,
};
203d85a8fdeSMat Martineau
/* Status bits below MPTCP_PM_ALREADY_ESTABLISHED need pm worker actions;
 * this mask selects exactly those bits.
 */
#define MPTCP_PM_WORK_MASK	((1 << MPTCP_PM_ALREADY_ESTABLISHED) - 1)
20686e39e04SPaolo Abeni
/* Address signalling bit numbers.
 * NOTE(review): presumably bit positions within mptcp_pm_data.addr_signal -
 * confirm against the users.
 */
enum mptcp_addr_signal_status {
	MPTCP_ADD_ADDR_SIGNAL,
	MPTCP_ADD_ADDR_ECHO,
	MPTCP_RM_ADDR_SIGNAL,
};
212d91d322aSGeliang Tang
/* max value of mptcp_addr_info.id */
#define MPTCP_PM_MAX_ADDR_ID		U8_MAX
21586e39e04SPaolo Abeni
2161b1c7a0eSPeter Krystad struct mptcp_pm_data {
2171b1c7a0eSPeter Krystad struct mptcp_addr_info local;
2181b1c7a0eSPeter Krystad struct mptcp_addr_info remote;
219b6c08380SGeliang Tang struct list_head anno_list;
2204638de5aSKishen Maloor struct list_head userspace_pm_local_addr_list;
2211b1c7a0eSPeter Krystad
2221b1c7a0eSPeter Krystad spinlock_t lock; /*protects the whole PM data */
2231b1c7a0eSPeter Krystad
22413ad9f01SGeliang Tang u8 addr_signal;
2251b1c7a0eSPeter Krystad bool server_side;
2261b1c7a0eSPeter Krystad bool work_pending;
2271b1c7a0eSPeter Krystad bool accept_addr;
2281b1c7a0eSPeter Krystad bool accept_subflow;
229df377be3SGeliang Tang bool remote_deny_join_id0;
2301b1c7a0eSPeter Krystad u8 add_addr_signaled;
2311b1c7a0eSPeter Krystad u8 add_addr_accepted;
2321b1c7a0eSPeter Krystad u8 local_addr_used;
233d85a8fdeSMat Martineau u8 pm_type;
2341b1c7a0eSPeter Krystad u8 subflows;
2351b1c7a0eSPeter Krystad u8 status;
23686e39e04SPaolo Abeni DECLARE_BITMAP(id_avail_bitmap, MPTCP_PM_MAX_ADDR_ID + 1);
237cbde2787SGeliang Tang struct mptcp_rm_list rm_list_tx;
238b5c55f33SGeliang Tang struct mptcp_rm_list rm_list_rx;
2391b1c7a0eSPeter Krystad };
2401b1c7a0eSPeter Krystad
2414638de5aSKishen Maloor struct mptcp_pm_addr_entry {
2424638de5aSKishen Maloor struct list_head list;
2434638de5aSKishen Maloor struct mptcp_addr_info addr;
2444638de5aSKishen Maloor u8 flags;
2454638de5aSKishen Maloor int ifindex;
2464638de5aSKishen Maloor struct socket *lsk;
2474638de5aSKishen Maloor };
2484638de5aSKishen Maloor
24918b683bfSPaolo Abeni struct mptcp_data_frag {
25018b683bfSPaolo Abeni struct list_head list;
25118b683bfSPaolo Abeni u64 data_seq;
252f0e6a4cfSPaolo Abeni u16 data_len;
253f0e6a4cfSPaolo Abeni u16 offset;
254f0e6a4cfSPaolo Abeni u16 overhead;
255f0e6a4cfSPaolo Abeni u16 already_sent;
25618b683bfSPaolo Abeni struct page *page;
25718b683bfSPaolo Abeni };
25818b683bfSPaolo Abeni
259f870fa0bSMat Martineau /* MPTCP connection sock */
260f870fa0bSMat Martineau struct mptcp_sock {
261f870fa0bSMat Martineau /* inet_connection_sock must be the first member */
262f870fa0bSMat Martineau struct inet_connection_sock sk;
263cec37a6eSPeter Krystad u64 local_key;
264cec37a6eSPeter Krystad u64 remote_key;
2656d0060f6SMat Martineau u64 write_seq;
26638967f42SPaolo Abeni u64 bytes_sent;
267eaa2ffabSPaolo Abeni u64 snd_nxt;
26838967f42SPaolo Abeni u64 bytes_received;
2696d0060f6SMat Martineau u64 ack_seq;
270f3589be0SPaolo Abeni atomic64_t rcv_wnd_sent;
2713721b9b6SMat Martineau u64 rcv_data_fin_seq;
27238967f42SPaolo Abeni u64 bytes_retrans;
273124a4885SPaolo Abeni u64 bytes_consumed;
2746511882cSPaolo Abeni int rmem_fwd_alloc;
275d5f49190SPaolo Abeni int snd_burst;
276ea4ca586SPaolo Abeni int old_wspace;
2771e1d9d6fSPaolo Abeni u64 recovery_snd_nxt; /* in recovery mode accept up to this seq;
2781e1d9d6fSPaolo Abeni * recovery related fields are under data_lock
2791e1d9d6fSPaolo Abeni * protection
2801e1d9d6fSPaolo Abeni */
28138967f42SPaolo Abeni u64 bytes_acked;
2827439d687SPaolo Abeni u64 snd_una;
2837439d687SPaolo Abeni u64 wnd_end;
284b51f9b80SPaolo Abeni unsigned long timer_ival;
28579c0949eSPeter Krystad u32 token;
28687952603SPaolo Abeni int rmem_released;
287648ef4b8SMat Martineau unsigned long flags;
288e9d09bacSPaolo Abeni unsigned long cb_flags;
2891e1d9d6fSPaolo Abeni bool recovery; /* closing subflow write queue reinjected */
290d22f4988SChristoph Paasch bool can_ack;
291b93df08cSPaolo Abeni bool fully_established;
2923721b9b6SMat Martineau bool rcv_data_fin;
2937279da61SMat Martineau bool snd_data_fin_enable;
29450c504a2SFlorian Westphal bool rcv_fastclose;
29537198e93SDavide Caratti bool use_64bit_ack; /* Set when we received a 64-bit DSN */
296752e9067SGeliang Tang bool csum_enabled;
2970530020aSGeliang Tang bool allow_infinite_fallback;
298cf742d09SPaolo Abeni u8 pending_state; /* A subflow asked to set this sk_state,
299cf742d09SPaolo Abeni * protected by the msk data lock
300cf742d09SPaolo Abeni */
3013ad14f54SPaolo Abeni u8 mpc_endpoint_id;
3024f6e14bdSMaxim Galaganov u8 recvmsg_inq:1,
3034f6e14bdSMaxim Galaganov cork:1,
30454f1944eSPaolo Abeni nodelay:1,
305b6985b9bSPaolo Abeni fastopening:1,
30639880bd8SPaolo Abeni in_accept_queue:1,
307a2d74374SPaolo Abeni free_first:1,
308a2d74374SPaolo Abeni rcvspace_init:1;
309184873afSMatthieu Baerts (NGI0) int keepalive_cnt;
310184873afSMatthieu Baerts (NGI0) int keepalive_idle;
311184873afSMatthieu Baerts (NGI0) int keepalive_intvl;
31280992017SPaolo Abeni struct work_struct work;
313ab174ad8SPaolo Abeni struct sk_buff *ooo_last_skb;
314ab174ad8SPaolo Abeni struct rb_root out_of_order_queue;
31587952603SPaolo Abeni struct sk_buff_head receive_queue;
316cec37a6eSPeter Krystad struct list_head conn_list;
31718b683bfSPaolo Abeni struct list_head rtx_queue;
318f0e6a4cfSPaolo Abeni struct mptcp_data_frag *first_pending;
319ec3edaa7SPeter Krystad struct list_head join_list;
32039880bd8SPaolo Abeni struct sock *first; /* The mptcp ops can safely dereference, using suitable
3215b825727SPaolo Abeni * ONCE annotation, the subflow outside the socket
3225b825727SPaolo Abeni * lock as such sock is freed after close().
3235b825727SPaolo Abeni */
3241b1c7a0eSPeter Krystad struct mptcp_pm_data pm;
3251730b2b2SGeliang Tang struct mptcp_sched_ops *sched;
326a6b118feSFlorian Westphal struct {
327a6b118feSFlorian Westphal u32 space; /* bytes copied in last measurement window */
328a6b118feSFlorian Westphal u32 copied; /* bytes copied in this measurement window */
329a6b118feSFlorian Westphal u64 time; /* start time of measurement window */
330a6b118feSFlorian Westphal u64 rtt_us; /* last maximum rtt of subflows */
331a6b118feSFlorian Westphal } rcvq_space;
332b8dc6d6cSPaolo Abeni u8 scaling_ratio;
333df00b087SFlorian Westphal
3346f06b4d4SPaolo Abeni u32 subflow_id;
335df00b087SFlorian Westphal u32 setsockopt_seq;
33620b5759fSPaolo Abeni char ca_name[TCP_CA_NAME_MAX];
337f870fa0bSMat Martineau };
338f870fa0bSMat Martineau
/* The msk "data lock" is the socket spinlock (sk_lock.slock), taken with
 * bottom halves disabled.
 */
#define mptcp_data_lock(sk) spin_lock_bh(&(sk)->sk_lock.slock)
#define mptcp_data_unlock(sk) spin_unlock_bh(&(sk)->sk_lock.slock)

/* Iterate over every subflow context linked on @__msk's conn_list;
 * the _safe variant tolerates removal of the current entry.
 */
#define mptcp_for_each_subflow(__msk, __subflow)			\
	list_for_each_entry(__subflow, &((__msk)->conn_list), node)
#define mptcp_for_each_subflow_safe(__msk, __subflow, __tmp)			\
	list_for_each_entry_safe(__subflow, __tmp, &((__msk)->conn_list), node)
346cec37a6eSPeter Krystad
/* Run the sock_owned_by_me() ownership check on the msk socket.
 * The cast is valid because the embedded sock sits at the very start of
 * struct mptcp_sock (inet_connection_sock is its first member).
 */
static inline void msk_owned_by_me(const struct mptcp_sock *msk)
{
	sock_owned_by_me((const struct sock *)msk);
}
3513abc05d9SFlorian Westphal
/* Convert a struct sock pointer into the enclosing struct mptcp_sock,
 * preserving the const qualifier of @ptr.
 */
#define mptcp_sk(ptr) container_of_const(ptr, struct mptcp_sock, sk.icsk_inet.sk)
353f870fa0bSMat Martineau
354ce599c51SPaolo Abeni /* the msk socket don't use the backlog, also account for the bulk
355ce599c51SPaolo Abeni * free memory
356ce599c51SPaolo Abeni */
__mptcp_rmem(const struct sock * sk)357ce599c51SPaolo Abeni static inline int __mptcp_rmem(const struct sock *sk)
358ce599c51SPaolo Abeni {
359ce599c51SPaolo Abeni return atomic_read(&sk->sk_rmem_alloc) - READ_ONCE(mptcp_sk(sk)->rmem_released);
360ce599c51SPaolo Abeni }
361ce599c51SPaolo Abeni
mptcp_win_from_space(const struct sock * sk,int space)362b8dc6d6cSPaolo Abeni static inline int mptcp_win_from_space(const struct sock *sk, int space)
363b8dc6d6cSPaolo Abeni {
364b8dc6d6cSPaolo Abeni return __tcp_win_from_space(mptcp_sk(sk)->scaling_ratio, space);
365b8dc6d6cSPaolo Abeni }
366b8dc6d6cSPaolo Abeni
__mptcp_space(const struct sock * sk)367ea4ca586SPaolo Abeni static inline int __mptcp_space(const struct sock *sk)
368ea4ca586SPaolo Abeni {
369b8dc6d6cSPaolo Abeni return mptcp_win_from_space(sk, READ_ONCE(sk->sk_rcvbuf) - __mptcp_rmem(sk));
370ea4ca586SPaolo Abeni }
371ea4ca586SPaolo Abeni
mptcp_send_head(const struct sock * sk)372f0e6a4cfSPaolo Abeni static inline struct mptcp_data_frag *mptcp_send_head(const struct sock *sk)
373f0e6a4cfSPaolo Abeni {
374f0e6a4cfSPaolo Abeni const struct mptcp_sock *msk = mptcp_sk(sk);
375f0e6a4cfSPaolo Abeni
376f0e6a4cfSPaolo Abeni return READ_ONCE(msk->first_pending);
377f0e6a4cfSPaolo Abeni }
378f0e6a4cfSPaolo Abeni
mptcp_send_next(struct sock * sk)379f0e6a4cfSPaolo Abeni static inline struct mptcp_data_frag *mptcp_send_next(struct sock *sk)
380f0e6a4cfSPaolo Abeni {
381f0e6a4cfSPaolo Abeni struct mptcp_sock *msk = mptcp_sk(sk);
382f0e6a4cfSPaolo Abeni struct mptcp_data_frag *cur;
383f0e6a4cfSPaolo Abeni
384f0e6a4cfSPaolo Abeni cur = msk->first_pending;
385f0e6a4cfSPaolo Abeni return list_is_last(&cur->list, &msk->rtx_queue) ? NULL :
386f0e6a4cfSPaolo Abeni list_next_entry(cur, list);
387f0e6a4cfSPaolo Abeni }
388f0e6a4cfSPaolo Abeni
mptcp_pending_tail(const struct sock * sk)389f0e6a4cfSPaolo Abeni static inline struct mptcp_data_frag *mptcp_pending_tail(const struct sock *sk)
390f0e6a4cfSPaolo Abeni {
391403a40f2SEric Dumazet const struct mptcp_sock *msk = mptcp_sk(sk);
392f0e6a4cfSPaolo Abeni
393f0e6a4cfSPaolo Abeni if (!msk->first_pending)
394f0e6a4cfSPaolo Abeni return NULL;
395f0e6a4cfSPaolo Abeni
396f0e6a4cfSPaolo Abeni if (WARN_ON_ONCE(list_empty(&msk->rtx_queue)))
397f0e6a4cfSPaolo Abeni return NULL;
398f0e6a4cfSPaolo Abeni
399f0e6a4cfSPaolo Abeni return list_last_entry(&msk->rtx_queue, struct mptcp_data_frag, list);
400f0e6a4cfSPaolo Abeni }
401f0e6a4cfSPaolo Abeni
mptcp_rtx_head(struct sock * sk)402403a40f2SEric Dumazet static inline struct mptcp_data_frag *mptcp_rtx_head(struct sock *sk)
4037948f6ccSFlorian Westphal {
4047948f6ccSFlorian Westphal struct mptcp_sock *msk = mptcp_sk(sk);
4057948f6ccSFlorian Westphal
40664b9cea7SPaolo Abeni if (msk->snd_una == READ_ONCE(msk->snd_nxt))
40764b9cea7SPaolo Abeni return NULL;
40864b9cea7SPaolo Abeni
409a386bc5bSGeliang Tang return list_first_entry_or_null(&msk->rtx_queue, struct mptcp_data_frag, list);
4107948f6ccSFlorian Westphal }
4117948f6ccSFlorian Westphal
/* Pseudo header used for the DSS checksum; all fields are big-endian
 * (network byte order) as their types indicate.
 */
struct csum_pseudo_header {
	__be64 data_seq;
	__be32 subflow_seq;
	__be16 data_len;
	__sum16 csum;
};
418d0cc2987SGeliang Tang
419cec37a6eSPeter Krystad struct mptcp_subflow_request_sock {
420cec37a6eSPeter Krystad struct tcp_request_sock sk;
421d22f4988SChristoph Paasch u16 mp_capable : 1,
422cec37a6eSPeter Krystad mp_join : 1,
42306fe1719SGeliang Tang backup : 1,
4248ed3e34cSMatthieu Baerts (NGI0) request_bkup : 1,
425bab6b88eSGeliang Tang csum_reqd : 1,
426bab6b88eSGeliang Tang allow_join_id0 : 1;
4271b1c7a0eSPeter Krystad u8 local_id;
428f296234cSPeter Krystad u8 remote_id;
429cec37a6eSPeter Krystad u64 local_key;
43079c0949eSPeter Krystad u64 idsn;
43179c0949eSPeter Krystad u32 token;
432648ef4b8SMat Martineau u32 ssn_offset;
433f296234cSPeter Krystad u64 thmac;
434f296234cSPeter Krystad u32 local_nonce;
435f296234cSPeter Krystad u32 remote_nonce;
4368fd4de12SPaolo Abeni struct mptcp_sock *msk;
4372c5ebd00SPaolo Abeni struct hlist_nulls_node token_node;
438cec37a6eSPeter Krystad };
439cec37a6eSPeter Krystad
/* Downcast a generic request_sock to the MPTCP request sock that embeds
 * it. Note that the cast also drops the const qualifier of @rsk.
 */
static inline struct mptcp_subflow_request_sock *
mptcp_subflow_rsk(const struct request_sock *rsk)
{
	return (struct mptcp_subflow_request_sock *)rsk;
}
445cec37a6eSPeter Krystad
4466719331cSPaolo Abeni enum mptcp_data_avail {
4476719331cSPaolo Abeni MPTCP_SUBFLOW_NODATA,
4486719331cSPaolo Abeni MPTCP_SUBFLOW_DATA_AVAIL,
4496719331cSPaolo Abeni };
4506719331cSPaolo Abeni
451b19bc294SPaolo Abeni struct mptcp_delegated_action {
452b19bc294SPaolo Abeni struct napi_struct napi;
453b19bc294SPaolo Abeni struct list_head head;
454b19bc294SPaolo Abeni };
455b19bc294SPaolo Abeni
456b19bc294SPaolo Abeni DECLARE_PER_CPU(struct mptcp_delegated_action, mptcp_delegated_actions);
457b19bc294SPaolo Abeni
/* Bit numbers within mptcp_subflow_context.delegated_status.
 * MPTCP_DELEGATE_SCHEDULED marks the subflow as queued; the remaining
 * bits name the pending actions.
 */
#define MPTCP_DELEGATE_SCHEDULED	0
#define MPTCP_DELEGATE_SEND		1
#define MPTCP_DELEGATE_ACK		2
#define MPTCP_DELEGATE_SNDBUF		3

/* every status bit except the SCHEDULED marker */
#define MPTCP_DELEGATE_ACTIONS_MASK	(~BIT(MPTCP_DELEGATE_SCHEDULED))
4642303f994SPeter Krystad /* MPTCP subflow context */
4652303f994SPeter Krystad struct mptcp_subflow_context {
466cec37a6eSPeter Krystad struct list_head node;/* conn_list of subflows */
467b29fcfb5SPaolo Abeni
46863ec72bdSKees Cook struct_group(reset,
469b29fcfb5SPaolo Abeni
4703ce0852cSPaolo Abeni unsigned long avg_pacing_rate; /* protected by msk socket lock */
471cec37a6eSPeter Krystad u64 local_key;
472cec37a6eSPeter Krystad u64 remote_key;
47379c0949eSPeter Krystad u64 idsn;
474648ef4b8SMat Martineau u64 map_seq;
475cc7972eaSChristoph Paasch u32 snd_isn;
47679c0949eSPeter Krystad u32 token;
4776d0060f6SMat Martineau u32 rel_write_seq;
478648ef4b8SMat Martineau u32 map_subflow_seq;
479648ef4b8SMat Martineau u32 ssn_offset;
480648ef4b8SMat Martineau u32 map_data_len;
481dd8bcd17SPaolo Abeni __wsum map_data_csum;
482dd8bcd17SPaolo Abeni u32 map_csum_len;
483cec37a6eSPeter Krystad u32 request_mptcp : 1, /* send MP_CAPABLE */
484ec3edaa7SPeter Krystad request_join : 1, /* send MP_JOIN */
485ec3edaa7SPeter Krystad request_bkup : 1,
486cec37a6eSPeter Krystad mp_capable : 1, /* remote is MPTCP capable */
487f296234cSPeter Krystad mp_join : 1, /* remote is JOINing */
4880be534f5SPaolo Abeni fully_established : 1, /* path validated */
489f296234cSPeter Krystad pm_notified : 1, /* PM hook called for established status */
490648ef4b8SMat Martineau conn_finished : 1,
491648ef4b8SMat Martineau map_valid : 1,
492dd8bcd17SPaolo Abeni map_csum_reqd : 1,
493dd8bcd17SPaolo Abeni map_data_fin : 1,
494d22f4988SChristoph Paasch mpc_map : 1,
495f296234cSPeter Krystad backup : 1,
49606706542SGeliang Tang send_mp_prio : 1,
497c25aeb4eSGeliang Tang send_mp_fail : 1,
498f284c0c7SPaolo Abeni send_fastclose : 1,
4991e39e5a3SGeliang Tang send_infinite_map : 1,
500b3ea6b27SPaolo Abeni remote_key_valid : 1, /* received the peer key from */
501ff5a0b42SPaolo Abeni disposable : 1, /* ctx can be free at ulp release time */
5024cf86ae8SPaolo Abeni stale : 1, /* unable to snd/rcv data, do not use for xmit */
503dfc8d060SDmytro Shytyi valid_csum_seen : 1, /* at least one csum validated */
504dfc8d060SDmytro Shytyi is_mptfo : 1, /* subflow is doing TFO */
505a088190fSMatthieu Baerts (NGI0) close_event_done : 1, /* has done the post-closed part */
506a088190fSMatthieu Baerts (NGI0) __unused : 9;
5076719331cSPaolo Abeni enum mptcp_data_avail data_avail;
508fce68b03SGeliang Tang bool scheduled;
50937d9305cSPaolo Abeni bool pm_listener; /* a listener managed by the kernel PM? */
510f296234cSPeter Krystad u32 remote_nonce;
511f296234cSPeter Krystad u64 thmac;
512f296234cSPeter Krystad u32 local_nonce;
513ec3edaa7SPeter Krystad u32 remote_token;
514b3ea6b27SPaolo Abeni union {
515b3ea6b27SPaolo Abeni u8 hmac[MPTCPOPT_HMAC_LEN]; /* MPJ subflow only */
516b3ea6b27SPaolo Abeni u64 iasn; /* initial ack sequence number, MPC subflows only */
517b3ea6b27SPaolo Abeni };
518ba2cf922SPaolo Abeni s16 local_id; /* if negative not initialized yet */
519f296234cSPeter Krystad u8 remote_id;
520dc87efdbSFlorian Westphal u8 reset_seen:1;
521dc87efdbSFlorian Westphal u8 reset_transient:1;
522dc87efdbSFlorian Westphal u8 reset_reason:4;
52371b7dec2SPaolo Abeni u8 stale_count;
524648ef4b8SMat Martineau
5256f06b4d4SPaolo Abeni u32 subflow_id;
5266f06b4d4SPaolo Abeni
527b19bc294SPaolo Abeni long delegated_status;
52876a13b31SGeliang Tang unsigned long fail_tout;
529b29fcfb5SPaolo Abeni
53063ec72bdSKees Cook );
531b29fcfb5SPaolo Abeni
532b19bc294SPaolo Abeni struct list_head delegated_node; /* link into delegated_action, protected by local BH */
533b19bc294SPaolo Abeni
534df00b087SFlorian Westphal u32 setsockopt_seq;
53571b7dec2SPaolo Abeni u32 stale_rcv_tstamp;
53634c7757aSPaolo Abeni int cached_sndbuf; /* sndbuf size when last synced with the msk sndbuf,
53734c7757aSPaolo Abeni * protected by the msk socket lock
53834c7757aSPaolo Abeni */
539df00b087SFlorian Westphal
5402303f994SPeter Krystad struct sock *tcp_sock; /* tcp sk backpointer */
5412303f994SPeter Krystad struct sock *conn; /* parent mptcp_sock */
542cec37a6eSPeter Krystad const struct inet_connection_sock_af_ops *icsk_af_ops;
543648ef4b8SMat Martineau void (*tcp_state_change)(struct sock *sk);
54415cc1045SPaolo Abeni void (*tcp_error_report)(struct sock *sk);
545648ef4b8SMat Martineau
5462303f994SPeter Krystad struct rcu_head rcu;
5472303f994SPeter Krystad };
5482303f994SPeter Krystad
5492303f994SPeter Krystad static inline struct mptcp_subflow_context *
mptcp_subflow_ctx(const struct sock * sk)5502303f994SPeter Krystad mptcp_subflow_ctx(const struct sock *sk)
5512303f994SPeter Krystad {
5522303f994SPeter Krystad struct inet_connection_sock *icsk = inet_csk(sk);
5532303f994SPeter Krystad
5542303f994SPeter Krystad /* Use RCU on icsk_ulp_data only for sock diag code */
5552303f994SPeter Krystad return (__force struct mptcp_subflow_context *)icsk->icsk_ulp_data;
5562303f994SPeter Krystad }
5572303f994SPeter Krystad
5582303f994SPeter Krystad static inline struct sock *
mptcp_subflow_tcp_sock(const struct mptcp_subflow_context * subflow)5592303f994SPeter Krystad mptcp_subflow_tcp_sock(const struct mptcp_subflow_context *subflow)
5602303f994SPeter Krystad {
5612303f994SPeter Krystad return subflow->tcp_sock;
5622303f994SPeter Krystad }
5632303f994SPeter Krystad
564b29fcfb5SPaolo Abeni static inline void
mptcp_subflow_ctx_reset(struct mptcp_subflow_context * subflow)565b29fcfb5SPaolo Abeni mptcp_subflow_ctx_reset(struct mptcp_subflow_context *subflow)
566b29fcfb5SPaolo Abeni {
56763ec72bdSKees Cook memset(&subflow->reset, 0, sizeof(subflow->reset));
568b29fcfb5SPaolo Abeni subflow->request_mptcp = 1;
569ba2cf922SPaolo Abeni WRITE_ONCE(subflow->local_id, -1);
570b29fcfb5SPaolo Abeni }
571b29fcfb5SPaolo Abeni
572648ef4b8SMat Martineau static inline u64
mptcp_subflow_get_map_offset(const struct mptcp_subflow_context * subflow)573648ef4b8SMat Martineau mptcp_subflow_get_map_offset(const struct mptcp_subflow_context *subflow)
574648ef4b8SMat Martineau {
575648ef4b8SMat Martineau return tcp_sk(mptcp_subflow_tcp_sock(subflow))->copied_seq -
576648ef4b8SMat Martineau subflow->ssn_offset -
577648ef4b8SMat Martineau subflow->map_subflow_seq;
578648ef4b8SMat Martineau }
579648ef4b8SMat Martineau
580648ef4b8SMat Martineau static inline u64
mptcp_subflow_get_mapped_dsn(const struct mptcp_subflow_context * subflow)581648ef4b8SMat Martineau mptcp_subflow_get_mapped_dsn(const struct mptcp_subflow_context *subflow)
582648ef4b8SMat Martineau {
583648ef4b8SMat Martineau return subflow->map_seq + mptcp_subflow_get_map_offset(subflow);
584648ef4b8SMat Martineau }
585648ef4b8SMat Martineau
/* Declaration only; @actions is presumably a mask of MPTCP_DELEGATE_* bits
 * (NOTE(review): confirm against the definition).
 */
void mptcp_subflow_process_delegated(struct sock *ssk, long actions);
587b19bc294SPaolo Abeni
mptcp_subflow_delegate(struct mptcp_subflow_context * subflow,int action)588bcd97734SPaolo Abeni static inline void mptcp_subflow_delegate(struct mptcp_subflow_context *subflow, int action)
589b19bc294SPaolo Abeni {
590a5efdbceSPaolo Abeni long old, set_bits = BIT(MPTCP_DELEGATE_SCHEDULED) | BIT(action);
591b19bc294SPaolo Abeni struct mptcp_delegated_action *delegated;
592b19bc294SPaolo Abeni bool schedule;
593b19bc294SPaolo Abeni
594bcd97734SPaolo Abeni /* the caller held the subflow bh socket lock */
595bcd97734SPaolo Abeni lockdep_assert_in_softirq();
596bcd97734SPaolo Abeni
597a5efdbceSPaolo Abeni /* The implied barrier pairs with tcp_release_cb_override()
598a5efdbceSPaolo Abeni * mptcp_napi_poll(), and ensures the below list check sees list
599a5efdbceSPaolo Abeni * updates done prior to delegated status bits changes
600b19bc294SPaolo Abeni */
601a5efdbceSPaolo Abeni old = set_mask_bits(&subflow->delegated_status, 0, set_bits);
602a5efdbceSPaolo Abeni if (!(old & BIT(MPTCP_DELEGATE_SCHEDULED))) {
603a5efdbceSPaolo Abeni if (WARN_ON_ONCE(!list_empty(&subflow->delegated_node)))
604b19bc294SPaolo Abeni return;
605b19bc294SPaolo Abeni
606b19bc294SPaolo Abeni delegated = this_cpu_ptr(&mptcp_delegated_actions);
607b19bc294SPaolo Abeni schedule = list_empty(&delegated->head);
608b19bc294SPaolo Abeni list_add_tail(&subflow->delegated_node, &delegated->head);
609b19bc294SPaolo Abeni sock_hold(mptcp_subflow_tcp_sock(subflow));
610b19bc294SPaolo Abeni if (schedule)
611b19bc294SPaolo Abeni napi_schedule(&delegated->napi);
612b19bc294SPaolo Abeni }
613b19bc294SPaolo Abeni }
614b19bc294SPaolo Abeni
615b19bc294SPaolo Abeni static inline struct mptcp_subflow_context *
mptcp_subflow_delegated_next(struct mptcp_delegated_action * delegated)616b19bc294SPaolo Abeni mptcp_subflow_delegated_next(struct mptcp_delegated_action *delegated)
617b19bc294SPaolo Abeni {
618b19bc294SPaolo Abeni struct mptcp_subflow_context *ret;
619b19bc294SPaolo Abeni
620b19bc294SPaolo Abeni if (list_empty(&delegated->head))
621b19bc294SPaolo Abeni return NULL;
622b19bc294SPaolo Abeni
623b19bc294SPaolo Abeni ret = list_first_entry(&delegated->head, struct mptcp_subflow_context, delegated_node);
624b19bc294SPaolo Abeni list_del_init(&ret->delegated_node);
625b19bc294SPaolo Abeni return ret;
626b19bc294SPaolo Abeni }
627b19bc294SPaolo Abeni
6286da14d74SPaolo Abeni int mptcp_is_enabled(const struct net *net);
6296da14d74SPaolo Abeni unsigned int mptcp_get_add_addr_timeout(const struct net *net);
6306da14d74SPaolo Abeni int mptcp_is_checksum_enabled(const struct net *net);
6316da14d74SPaolo Abeni int mptcp_allow_join_id0(const struct net *net);
632ff5a0b42SPaolo Abeni unsigned int mptcp_stale_loss_cnt(const struct net *net);
6336bb63cccSMat Martineau int mptcp_get_pm_type(const struct net *net);
634e3b2870bSGeliang Tang const char *mptcp_get_scheduler(const struct net *net);
635b45df837SPaolo Abeni void __mptcp_subflow_fully_established(struct mptcp_sock *msk,
636b45df837SPaolo Abeni struct mptcp_subflow_context *subflow,
637b3ea6b27SPaolo Abeni const struct mptcp_options_received *mp_opt);
6381e1d9d6fSPaolo Abeni bool __mptcp_retransmit_pending_data(struct sock *sk);
6398b38217aSMaxim Galaganov void mptcp_check_and_set_pending(struct sock *sk);
640ff5a0b42SPaolo Abeni void __mptcp_push_pending(struct sock *sk, unsigned int flags);
641648ef4b8SMat Martineau bool mptcp_subflow_data_available(struct sock *sk);
642d39dcecaSPaolo Abeni void __init mptcp_subflow_init(void);
643d0876b22SGeliang Tang void mptcp_subflow_shutdown(struct sock *sk, struct sock *ssk, int how);
644a141e02eSFlorian Westphal void mptcp_close_ssk(struct sock *sk, struct sock *ssk,
645e16163b6SPaolo Abeni struct mptcp_subflow_context *subflow);
646a6574302SMat Martineau void __mptcp_subflow_send_ack(struct sock *ssk);
647d5824847SPaolo Abeni void mptcp_subflow_reset(struct sock *ssk);
6482a6a870eSPaolo Abeni void mptcp_subflow_queue_clean(struct sock *sk, struct sock *ssk);
649866f26f2SPaolo Abeni void mptcp_sock_graft(struct sock *sk, struct socket *parent);
6503f326a82SPaolo Abeni struct sock *__mptcp_nmpc_sk(struct mptcp_sock *msk);
65126d3e21cSMenglong Dong bool __mptcp_close(struct sock *sk, long timeout);
65230e51b92SMenglong Dong void mptcp_cancel_work(struct sock *sk);
65363740448SPaolo Abeni void __mptcp_unaccepted_force_close(struct sock *sk);
65436b122baSDmytro Shytyi void mptcp_set_owner_r(struct sk_buff *skb, struct sock *sk);
65556557547SGeliang Tang void mptcp_set_state(struct sock *sk, int state);
656ec3edaa7SPeter Krystad
6574638de5aSKishen Maloor bool mptcp_addresses_equal(const struct mptcp_addr_info *a,
6584638de5aSKishen Maloor const struct mptcp_addr_info *b, bool use_port);
659dc886bceSGeliang Tang void mptcp_local_address(const struct sock_common *skc, struct mptcp_addr_info *addr);
6604638de5aSKishen Maloor
661ec3edaa7SPeter Krystad /* called with sk socket lock held */
662ef0da3b8SPaolo Abeni int __mptcp_subflow_connect(struct sock *sk, const struct mptcp_addr_info *loc,
663ee285257SGeliang Tang const struct mptcp_addr_info *remote);
6646bc1fe7dSPaolo Abeni int mptcp_subflow_create_socket(struct sock *sk, unsigned short family,
6656bc1fe7dSPaolo Abeni struct socket **new_sock);
6661729cf18SGeliang Tang void mptcp_info2sockaddr(const struct mptcp_addr_info *info,
6671729cf18SGeliang Tang struct sockaddr_storage *addr,
6681729cf18SGeliang Tang unsigned short family);
669740ebe35SGeliang Tang struct mptcp_sched_ops *mptcp_sched_find(const char *name);
670740ebe35SGeliang Tang int mptcp_register_scheduler(struct mptcp_sched_ops *sched);
671740ebe35SGeliang Tang void mptcp_unregister_scheduler(struct mptcp_sched_ops *sched);
672ed1ad86bSGeliang Tang void mptcp_sched_init(void);
6731730b2b2SGeliang Tang int mptcp_init_sched(struct mptcp_sock *msk,
6741730b2b2SGeliang Tang struct mptcp_sched_ops *sched);
6751730b2b2SGeliang Tang void mptcp_release_sched(struct mptcp_sock *msk);
676fce68b03SGeliang Tang void mptcp_subflow_set_scheduled(struct mptcp_subflow_context *subflow,
677fce68b03SGeliang Tang bool scheduled);
67807336a87SGeliang Tang struct sock *mptcp_subflow_get_send(struct mptcp_sock *msk);
67907336a87SGeliang Tang struct sock *mptcp_subflow_get_retrans(struct mptcp_sock *msk);
68007336a87SGeliang Tang int mptcp_sched_get_send(struct mptcp_sock *msk);
68107336a87SGeliang Tang int mptcp_sched_get_retrans(struct mptcp_sock *msk);
6822303f994SPeter Krystad
mptcp_data_avail(const struct mptcp_sock * msk)683124a4885SPaolo Abeni static inline u64 mptcp_data_avail(const struct mptcp_sock *msk)
684124a4885SPaolo Abeni {
685124a4885SPaolo Abeni return READ_ONCE(msk->bytes_received) - READ_ONCE(msk->bytes_consumed);
686124a4885SPaolo Abeni }
687124a4885SPaolo Abeni
mptcp_epollin_ready(const struct sock * sk)688124a4885SPaolo Abeni static inline bool mptcp_epollin_ready(const struct sock *sk)
689124a4885SPaolo Abeni {
690d09d17c1SPaolo Abeni u64 data_avail = mptcp_data_avail(mptcp_sk(sk));
691d09d17c1SPaolo Abeni
692d09d17c1SPaolo Abeni if (!data_avail)
693d09d17c1SPaolo Abeni return false;
694d09d17c1SPaolo Abeni
695124a4885SPaolo Abeni /* mptcp doesn't have to deal with small skbs in the receive queue,
696d09d17c1SPaolo Abeni * as it can always coalesce them
697124a4885SPaolo Abeni */
698d09d17c1SPaolo Abeni return (data_avail >= sk->sk_rcvlowat) ||
699124a4885SPaolo Abeni (mem_cgroup_sockets_enabled && sk->sk_memcg &&
700124a4885SPaolo Abeni mem_cgroup_under_socket_pressure(sk->sk_memcg)) ||
701124a4885SPaolo Abeni READ_ONCE(tcp_memory_pressure);
702124a4885SPaolo Abeni }
703124a4885SPaolo Abeni
704124a4885SPaolo Abeni int mptcp_set_rcvlowat(struct sock *sk, int val);
705124a4885SPaolo Abeni
__tcp_can_send(const struct sock * ssk)706c886d702SPaolo Abeni static inline bool __tcp_can_send(const struct sock *ssk)
707c886d702SPaolo Abeni {
708c886d702SPaolo Abeni /* only send if our side has not closed yet */
709c886d702SPaolo Abeni return ((1 << inet_sk_state_load(ssk)) & (TCPF_ESTABLISHED | TCPF_CLOSE_WAIT));
710c886d702SPaolo Abeni }
711c886d702SPaolo Abeni
__mptcp_subflow_active(struct mptcp_subflow_context * subflow)712ff5a0b42SPaolo Abeni static inline bool __mptcp_subflow_active(struct mptcp_subflow_context *subflow)
71343f1140bSGeliang Tang {
71443f1140bSGeliang Tang /* can't send if JOIN hasn't completed yet (i.e. is usable for mptcp) */
71543f1140bSGeliang Tang if (subflow->request_join && !subflow->fully_established)
71643f1140bSGeliang Tang return false;
71743f1140bSGeliang Tang
718c886d702SPaolo Abeni return __tcp_can_send(mptcp_subflow_tcp_sock(subflow));
71943f1140bSGeliang Tang }
72043f1140bSGeliang Tang
721ff5a0b42SPaolo Abeni void mptcp_subflow_set_active(struct mptcp_subflow_context *subflow);
722ff5a0b42SPaolo Abeni
723ff5a0b42SPaolo Abeni bool mptcp_subflow_active(struct mptcp_subflow_context *subflow);
724ff5a0b42SPaolo Abeni
725b6985b9bSPaolo Abeni void mptcp_subflow_drop_ctx(struct sock *ssk);
726b6985b9bSPaolo Abeni
mptcp_subflow_tcp_fallback(struct sock * sk,struct mptcp_subflow_context * ctx)727648ef4b8SMat Martineau static inline void mptcp_subflow_tcp_fallback(struct sock *sk,
728648ef4b8SMat Martineau struct mptcp_subflow_context *ctx)
729648ef4b8SMat Martineau {
730952382c6SFlorian Westphal sk->sk_data_ready = sock_def_readable;
731648ef4b8SMat Martineau sk->sk_state_change = ctx->tcp_state_change;
732952382c6SFlorian Westphal sk->sk_write_space = sk_stream_write_space;
73315cc1045SPaolo Abeni sk->sk_error_report = ctx->tcp_error_report;
734648ef4b8SMat Martineau
735648ef4b8SMat Martineau inet_csk(sk)->icsk_af_ops = ctx->icsk_af_ops;
736648ef4b8SMat Martineau }
737648ef4b8SMat Martineau
738d39dcecaSPaolo Abeni void __init mptcp_proto_init(void);
739784325e9SMatthieu Baerts #if IS_ENABLED(CONFIG_MPTCP_IPV6)
740d39dcecaSPaolo Abeni int __init mptcp_proto_v6_init(void);
741784325e9SMatthieu Baerts #endif
742648ef4b8SMat Martineau
7437e8b88ecSPaolo Abeni struct sock *mptcp_sk_clone_init(const struct sock *sk,
744cfde141eSPaolo Abeni const struct mptcp_options_received *mp_opt,
7457e8b88ecSPaolo Abeni struct sock *ssk,
746fca5c82cSPaolo Abeni struct request_sock *req);
7470799e21bSGeliang Tang void mptcp_get_options(const struct sk_buff *skb,
748cfde141eSPaolo Abeni struct mptcp_options_received *mp_opt);
749cec37a6eSPeter Krystad
750cec37a6eSPeter Krystad void mptcp_finish_connect(struct sock *sk);
751cf742d09SPaolo Abeni void __mptcp_sync_state(struct sock *sk, int state);
752f6909dc1SPaolo Abeni void mptcp_reset_tout_timer(struct mptcp_sock *msk, unsigned long fail_tout);
75327e5ccc2SPaolo Abeni
mptcp_stop_tout_timer(struct sock * sk)75427e5ccc2SPaolo Abeni static inline void mptcp_stop_tout_timer(struct sock *sk)
75527e5ccc2SPaolo Abeni {
75627e5ccc2SPaolo Abeni if (!inet_csk(sk)->icsk_mtup.probe_timestamp)
75727e5ccc2SPaolo Abeni return;
75827e5ccc2SPaolo Abeni
75927e5ccc2SPaolo Abeni sk_stop_timer(sk, &sk->sk_timer);
76027e5ccc2SPaolo Abeni inet_csk(sk)->icsk_mtup.probe_timestamp = 0;
76127e5ccc2SPaolo Abeni }
76227e5ccc2SPaolo Abeni
mptcp_set_close_tout(struct sock * sk,unsigned long tout)76327e5ccc2SPaolo Abeni static inline void mptcp_set_close_tout(struct sock *sk, unsigned long tout)
76427e5ccc2SPaolo Abeni {
76527e5ccc2SPaolo Abeni /* avoid 0 timestamp, as that means no close timeout */
76627e5ccc2SPaolo Abeni inet_csk(sk)->icsk_mtup.probe_timestamp = tout ? : 1;
76727e5ccc2SPaolo Abeni }
76827e5ccc2SPaolo Abeni
mptcp_start_tout_timer(struct sock * sk)76927e5ccc2SPaolo Abeni static inline void mptcp_start_tout_timer(struct sock *sk)
77027e5ccc2SPaolo Abeni {
77127e5ccc2SPaolo Abeni mptcp_set_close_tout(sk, tcp_jiffies32);
77227e5ccc2SPaolo Abeni mptcp_reset_tout_timer(mptcp_sk(sk), 0);
77327e5ccc2SPaolo Abeni }
77427e5ccc2SPaolo Abeni
mptcp_is_fully_established(struct sock * sk)775b93df08cSPaolo Abeni static inline bool mptcp_is_fully_established(struct sock *sk)
776b93df08cSPaolo Abeni {
777b93df08cSPaolo Abeni return inet_sk_state_load(sk) == TCP_ESTABLISHED &&
778b93df08cSPaolo Abeni READ_ONCE(mptcp_sk(sk)->fully_established);
779b93df08cSPaolo Abeni }
780124a4885SPaolo Abeni
781a6b118feSFlorian Westphal void mptcp_rcv_space_init(struct mptcp_sock *msk, const struct sock *ssk);
7822e52213cSFlorian Westphal void mptcp_data_ready(struct sock *sk, struct sock *ssk);
783f296234cSPeter Krystad bool mptcp_finish_join(struct sock *sk);
784ba8f48f7SPaolo Abeni bool mptcp_schedule_work(struct sock *sk);
7850abdde82SPaolo Abeni int mptcp_setsockopt(struct sock *sk, int level, int optname,
7860abdde82SPaolo Abeni sockptr_t optval, unsigned int optlen);
7870abdde82SPaolo Abeni int mptcp_getsockopt(struct sock *sk, int level, int optname,
7880abdde82SPaolo Abeni char __user *optval, int __user *option);
7890abdde82SPaolo Abeni
7901502328fSPaolo Abeni u64 __mptcp_expand_seq(u64 old_seq, u64 cur_seq);
/* Return @cur_seq unchanged when @use_64bit is set; otherwise return the
 * result of __mptcp_expand_seq(@old_seq, @cur_seq).
 */
static inline u64 mptcp_expand_seq(u64 old_seq, u64 cur_seq, bool use_64bit)
{
	return use_64bit ? cur_seq : __mptcp_expand_seq(old_seq, cur_seq);
}
798219d0499SPaolo Abeni void __mptcp_check_push(struct sock *sk, struct sock *ssk);
7997439d687SPaolo Abeni void __mptcp_data_acked(struct sock *sk);
80015cc1045SPaolo Abeni void __mptcp_error_report(struct sock *sk);
8011a49b2c2SMat Martineau bool mptcp_update_rcv_data_fin(struct mptcp_sock *msk, u64 data_fin_seq, bool use_64bit);
mptcp_data_fin_enabled(const struct mptcp_sock * msk)802e16163b6SPaolo Abeni static inline bool mptcp_data_fin_enabled(const struct mptcp_sock *msk)
803e16163b6SPaolo Abeni {
804e16163b6SPaolo Abeni return READ_ONCE(msk->snd_data_fin_enable) &&
805e16163b6SPaolo Abeni READ_ONCE(msk->write_seq) == READ_ONCE(msk->snd_nxt);
806e16163b6SPaolo Abeni }
807e16163b6SPaolo Abeni
mptcp_write_space(struct sock * sk)808b609ecdaSPaolo Abeni static inline void mptcp_write_space(struct sock *sk)
809b609ecdaSPaolo Abeni {
810b609ecdaSPaolo Abeni if (sk_stream_is_writeable(sk)) {
811b609ecdaSPaolo Abeni /* pairs with memory barrier in mptcp_poll */
812b609ecdaSPaolo Abeni smp_mb();
813b609ecdaSPaolo Abeni if (test_and_clear_bit(MPTCP_NOSPACE, &mptcp_sk(sk)->flags))
814b609ecdaSPaolo Abeni sk_stream_write_space(sk);
815b609ecdaSPaolo Abeni }
816b609ecdaSPaolo Abeni }
817b609ecdaSPaolo Abeni
__mptcp_sync_sndbuf(struct sock * sk)81834c7757aSPaolo Abeni static inline void __mptcp_sync_sndbuf(struct sock *sk)
8195cf92bbaSPaolo Abeni {
82034c7757aSPaolo Abeni struct mptcp_subflow_context *subflow;
82134c7757aSPaolo Abeni int ssk_sndbuf, new_sndbuf;
8225cf92bbaSPaolo Abeni
82334c7757aSPaolo Abeni if (sk->sk_userlocks & SOCK_SNDBUF_LOCK)
82434c7757aSPaolo Abeni return;
82534c7757aSPaolo Abeni
82634c7757aSPaolo Abeni new_sndbuf = sock_net(sk)->ipv4.sysctl_tcp_wmem[0];
82734c7757aSPaolo Abeni mptcp_for_each_subflow(mptcp_sk(sk), subflow) {
82834c7757aSPaolo Abeni ssk_sndbuf = READ_ONCE(mptcp_subflow_tcp_sock(subflow)->sk_sndbuf);
82934c7757aSPaolo Abeni
83034c7757aSPaolo Abeni subflow->cached_sndbuf = ssk_sndbuf;
83134c7757aSPaolo Abeni new_sndbuf += ssk_sndbuf;
83234c7757aSPaolo Abeni }
83334c7757aSPaolo Abeni
83434c7757aSPaolo Abeni /* the msk max wmem limit is <nr_subflows> * tcp wmem[2] */
83534c7757aSPaolo Abeni WRITE_ONCE(sk->sk_sndbuf, new_sndbuf);
836b609ecdaSPaolo Abeni mptcp_write_space(sk);
83734c7757aSPaolo Abeni }
83834c7757aSPaolo Abeni
83934c7757aSPaolo Abeni /* The called held both the msk socket and the subflow socket locks,
84034c7757aSPaolo Abeni * possibly under BH
84134c7757aSPaolo Abeni */
__mptcp_propagate_sndbuf(struct sock * sk,struct sock * ssk)84234c7757aSPaolo Abeni static inline void __mptcp_propagate_sndbuf(struct sock *sk, struct sock *ssk)
84334c7757aSPaolo Abeni {
84434c7757aSPaolo Abeni struct mptcp_subflow_context *subflow = mptcp_subflow_ctx(ssk);
84534c7757aSPaolo Abeni
84634c7757aSPaolo Abeni if (READ_ONCE(ssk->sk_sndbuf) != subflow->cached_sndbuf)
84734c7757aSPaolo Abeni __mptcp_sync_sndbuf(sk);
84834c7757aSPaolo Abeni }
84934c7757aSPaolo Abeni
85034c7757aSPaolo Abeni /* the caller held only the subflow socket lock, either in process or
85134c7757aSPaolo Abeni * BH context. Additionally this can be called under the msk data lock,
85234c7757aSPaolo Abeni * so we can't acquire such lock here: let the delegate action acquires
85334c7757aSPaolo Abeni * the needed locks in suitable order.
85434c7757aSPaolo Abeni */
mptcp_propagate_sndbuf(struct sock * sk,struct sock * ssk)85534c7757aSPaolo Abeni static inline void mptcp_propagate_sndbuf(struct sock *sk, struct sock *ssk)
85634c7757aSPaolo Abeni {
85734c7757aSPaolo Abeni struct mptcp_subflow_context *subflow = mptcp_subflow_ctx(ssk);
85834c7757aSPaolo Abeni
85934c7757aSPaolo Abeni if (likely(READ_ONCE(ssk->sk_sndbuf) == subflow->cached_sndbuf))
86034c7757aSPaolo Abeni return;
86134c7757aSPaolo Abeni
86234c7757aSPaolo Abeni local_bh_disable();
86334c7757aSPaolo Abeni mptcp_subflow_delegate(subflow, MPTCP_DELEGATE_SNDBUF);
86434c7757aSPaolo Abeni local_bh_enable();
8655cf92bbaSPaolo Abeni }
8665cf92bbaSPaolo Abeni
867c0bf3c6aSPaolo Abeni void mptcp_destroy_common(struct mptcp_sock *msk, unsigned int flags);
868cec37a6eSPeter Krystad
869c68a0cd1SJianguo Wu #define MPTCP_TOKEN_MAX_RETRIES 4
870c68a0cd1SJianguo Wu
8712c5ebd00SPaolo Abeni void __init mptcp_token_init(void);
mptcp_token_init_request(struct request_sock * req)8722c5ebd00SPaolo Abeni static inline void mptcp_token_init_request(struct request_sock *req)
8732c5ebd00SPaolo Abeni {
8742c5ebd00SPaolo Abeni mptcp_subflow_rsk(req)->token_node.pprev = NULL;
8752c5ebd00SPaolo Abeni }
8762c5ebd00SPaolo Abeni
87779c0949eSPeter Krystad int mptcp_token_new_request(struct request_sock *req);
8782c5ebd00SPaolo Abeni void mptcp_token_destroy_request(struct request_sock *req);
879294de909SMenglong Dong int mptcp_token_new_connect(struct sock *ssk);
8802c5ebd00SPaolo Abeni void mptcp_token_accept(struct mptcp_subflow_request_sock *r,
8812c5ebd00SPaolo Abeni struct mptcp_sock *msk);
882c83a47e5SFlorian Westphal bool mptcp_token_exists(u32 token);
883ea1300b9SFlorian Westphal struct mptcp_sock *mptcp_token_get_sock(struct net *net, u32 token);
88496d890daSPaolo Abeni struct mptcp_sock *mptcp_token_iter_next(const struct net *net, long *s_slot,
88596d890daSPaolo Abeni long *s_num);
8862c5ebd00SPaolo Abeni void mptcp_token_destroy(struct mptcp_sock *msk);
88779c0949eSPeter Krystad
88879c0949eSPeter Krystad void mptcp_crypto_key_sha(u64 key, u32 *token, u64 *idsn);
88979c0949eSPeter Krystad
8903df523abSPeter Krystad void mptcp_crypto_hmac_sha(u64 key1, u64 key2, u8 *msg, int len, void *hmac);
891ba2c89e0SPaolo Abeni __sum16 __mptcp_make_csum(u64 data_seq, u32 subflow_seq, u16 data_len, __wsum sum);
89279c0949eSPeter Krystad
893d39dcecaSPaolo Abeni void __init mptcp_pm_init(void);
8941b1c7a0eSPeter Krystad void mptcp_pm_data_init(struct mptcp_sock *msk);
895b29fcfb5SPaolo Abeni void mptcp_pm_data_reset(struct mptcp_sock *msk);
896702c2f64SFlorian Westphal int mptcp_pm_parse_addr(struct nlattr *attr, struct genl_info *info,
897702c2f64SFlorian Westphal struct mptcp_addr_info *addr);
8989ab4807cSKishen Maloor int mptcp_pm_parse_entry(struct nlattr *attr, struct genl_info *info,
8999ab4807cSKishen Maloor bool require_family,
9009ab4807cSKishen Maloor struct mptcp_pm_addr_entry *entry);
901fb00ee4fSMatthieu Baerts bool mptcp_pm_addr_families_match(const struct sock *sk,
902fb00ee4fSMatthieu Baerts const struct mptcp_addr_info *loc,
903fb00ee4fSMatthieu Baerts const struct mptcp_addr_info *rem);
90471b7dec2SPaolo Abeni void mptcp_pm_subflow_chk_stale(const struct mptcp_sock *msk, struct sock *ssk);
905ff5a0b42SPaolo Abeni void mptcp_pm_nl_subflow_chk_stale(const struct mptcp_sock *msk, struct sock *ssk);
9066c714f1bSFlorian Westphal void mptcp_pm_new_connection(struct mptcp_sock *msk, const struct sock *ssk, int server_side);
9077a486c44SPaolo Abeni void mptcp_pm_fully_established(struct mptcp_sock *msk, const struct sock *ssk);
9081b1c7a0eSPeter Krystad bool mptcp_pm_allow_new_subflow(struct mptcp_sock *msk);
9091b1c7a0eSPeter Krystad void mptcp_pm_connection_closed(struct mptcp_sock *msk);
91062535200SGeliang Tang void mptcp_pm_subflow_established(struct mptcp_sock *msk);
911a88c9e49SPaolo Abeni bool mptcp_pm_nl_check_work_pending(struct mptcp_sock *msk);
912a88c9e49SPaolo Abeni void mptcp_pm_subflow_check_next(struct mptcp_sock *msk, const struct sock *ssk,
913a88c9e49SPaolo Abeni const struct mptcp_subflow_context *subflow);
914d1ace2d9SKishen Maloor void mptcp_pm_add_addr_received(const struct sock *ssk,
9151b1c7a0eSPeter Krystad const struct mptcp_addr_info *addr);
916557963c3SGeliang Tang void mptcp_pm_add_addr_echoed(struct mptcp_sock *msk,
91790d93088SPaolo Abeni const struct mptcp_addr_info *addr);
91884dfe367SGeliang Tang void mptcp_pm_add_addr_send_ack(struct mptcp_sock *msk);
919dc14d542SMatthieu Baerts (NGI0) bool mptcp_pm_nl_is_init_remote_addr(struct mptcp_sock *msk,
920dc14d542SMatthieu Baerts (NGI0) const struct mptcp_addr_info *remote);
921b46a0238SGeliang Tang void mptcp_pm_nl_addr_send_ack(struct mptcp_sock *msk);
9225c4a824dSGeliang Tang void mptcp_pm_rm_addr_received(struct mptcp_sock *msk,
9235c4a824dSGeliang Tang const struct mptcp_rm_list *rm_list);
92440453a5cSGeliang Tang void mptcp_pm_mp_prio_received(struct sock *sk, u8 bkup);
9255580d41bSGeliang Tang void mptcp_pm_mp_fail_received(struct sock *sk, u64 fail_seq);
926892f396cSKishen Maloor int mptcp_pm_nl_mp_prio_send_ack(struct mptcp_sock *msk,
927892f396cSKishen Maloor struct mptcp_addr_info *addr,
928892f396cSKishen Maloor struct mptcp_addr_info *rem,
929892f396cSKishen Maloor u8 bkup);
9309ab4807cSKishen Maloor bool mptcp_pm_alloc_anno_list(struct mptcp_sock *msk,
931528cb5f2SGeliang Tang const struct mptcp_addr_info *addr);
932b6c08380SGeliang Tang void mptcp_pm_free_anno_list(struct mptcp_sock *msk);
9335bc56388SGeliang Tang bool mptcp_pm_sport_in_anno_list(struct mptcp_sock *msk, const struct sock *sk);
93400cfd77bSGeliang Tang struct mptcp_pm_add_entry *
93500cfd77bSGeliang Tang mptcp_pm_del_add_timer(struct mptcp_sock *msk,
93690d93088SPaolo Abeni const struct mptcp_addr_info *addr, bool check_id);
937d88c476fSGeliang Tang struct mptcp_pm_add_entry *
93890d93088SPaolo Abeni mptcp_lookup_anno_list_by_saddr(const struct mptcp_sock *msk,
93990d93088SPaolo Abeni const struct mptcp_addr_info *addr);
9408b201370SKishen Maloor int mptcp_pm_get_flags_and_ifindex_by_id(struct mptcp_sock *msk,
9418b201370SKishen Maloor unsigned int id,
9428b201370SKishen Maloor u8 *flags, int *ifindex);
943f40be0dbSGeliang Tang int mptcp_pm_nl_get_flags_and_ifindex_by_id(struct mptcp_sock *msk, unsigned int id,
944f40be0dbSGeliang Tang u8 *flags, int *ifindex);
9458b201370SKishen Maloor int mptcp_userspace_pm_get_flags_and_ifindex_by_id(struct mptcp_sock *msk,
9468b201370SKishen Maloor unsigned int id,
947ee285257SGeliang Tang u8 *flags, int *ifindex);
9486ba7ce89SGeliang Tang int mptcp_pm_set_flags(struct net *net, struct nlattr *token,
9496ba7ce89SGeliang Tang struct mptcp_pm_addr_entry *loc,
9506ba7ce89SGeliang Tang struct mptcp_pm_addr_entry *rem, u8 bkup);
9516ba7ce89SGeliang Tang int mptcp_pm_nl_set_flags(struct net *net, struct mptcp_pm_addr_entry *addr, u8 bkup);
952892f396cSKishen Maloor int mptcp_userspace_pm_set_flags(struct net *net, struct nlattr *token,
953892f396cSKishen Maloor struct mptcp_pm_addr_entry *loc,
954892f396cSKishen Maloor struct mptcp_pm_addr_entry *rem, u8 bkup);
9551b1c7a0eSPeter Krystad int mptcp_pm_announce_addr(struct mptcp_sock *msk,
9566a6c05a8SGeliang Tang const struct mptcp_addr_info *addr,
957f7efc777SGeliang Tang bool echo);
958cbde2787SGeliang Tang int mptcp_pm_remove_addr(struct mptcp_sock *msk, const struct mptcp_rm_list *rm_list);
9598b1c94daSGeliang Tang void mptcp_pm_remove_addrs(struct mptcp_sock *msk, struct list_head *rm_list);
960d9a4594eSKishen Maloor
9614638de5aSKishen Maloor void mptcp_free_local_addr_list(struct mptcp_sock *msk);
9629ab4807cSKishen Maloor int mptcp_nl_cmd_announce(struct sk_buff *skb, struct genl_info *info);
963d9a4594eSKishen Maloor int mptcp_nl_cmd_remove(struct sk_buff *skb, struct genl_info *info);
964702c2f64SFlorian Westphal int mptcp_nl_cmd_sf_create(struct sk_buff *skb, struct genl_info *info);
965702c2f64SFlorian Westphal int mptcp_nl_cmd_sf_destroy(struct sk_buff *skb, struct genl_info *info);
9661b1c7a0eSPeter Krystad
967b911c97cSFlorian Westphal void mptcp_event(enum mptcp_event_type type, const struct mptcp_sock *msk,
968b911c97cSFlorian Westphal const struct sock *ssk, gfp_t gfp);
969d1ace2d9SKishen Maloor void mptcp_event_addr_announced(const struct sock *ssk, const struct mptcp_addr_info *info);
970b911c97cSFlorian Westphal void mptcp_event_addr_removed(const struct mptcp_sock *msk, u8 id);
971f8c9dfbdSGeliang Tang void mptcp_event_pm_listener(const struct sock *ssk,
972f8c9dfbdSGeliang Tang enum mptcp_event_type event);
9734d25247dSKishen Maloor bool mptcp_userspace_pm_active(const struct mptcp_sock *msk);
974b911c97cSFlorian Westphal
975b45df837SPaolo Abeni void __mptcp_fastopen_gen_msk_ackseq(struct mptcp_sock *msk, struct mptcp_subflow_context *subflow,
976dfc8d060SDmytro Shytyi const struct mptcp_options_received *mp_opt);
97736b122baSDmytro Shytyi void mptcp_fastopen_subflow_synack_set_params(struct mptcp_subflow_context *subflow,
97836b122baSDmytro Shytyi struct request_sock *req);
979dfc8d060SDmytro Shytyi
mptcp_pm_should_add_signal(struct mptcp_sock * msk)980f643b803SGeliang Tang static inline bool mptcp_pm_should_add_signal(struct mptcp_sock *msk)
9811b1c7a0eSPeter Krystad {
98218fc1a92SYonglong Li return READ_ONCE(msk->pm.addr_signal) &
98318fc1a92SYonglong Li (BIT(MPTCP_ADD_ADDR_SIGNAL) | BIT(MPTCP_ADD_ADDR_ECHO));
98418fc1a92SYonglong Li }
98518fc1a92SYonglong Li
mptcp_pm_should_add_signal_addr(struct mptcp_sock * msk)98618fc1a92SYonglong Li static inline bool mptcp_pm_should_add_signal_addr(struct mptcp_sock *msk)
98718fc1a92SYonglong Li {
98813ad9f01SGeliang Tang return READ_ONCE(msk->pm.addr_signal) & BIT(MPTCP_ADD_ADDR_SIGNAL);
989d91d322aSGeliang Tang }
990d91d322aSGeliang Tang
mptcp_pm_should_add_signal_echo(struct mptcp_sock * msk)991d91d322aSGeliang Tang static inline bool mptcp_pm_should_add_signal_echo(struct mptcp_sock *msk)
992d91d322aSGeliang Tang {
99313ad9f01SGeliang Tang return READ_ONCE(msk->pm.addr_signal) & BIT(MPTCP_ADD_ADDR_ECHO);
9941b1c7a0eSPeter Krystad }
9951b1c7a0eSPeter Krystad
mptcp_pm_should_rm_signal(struct mptcp_sock * msk)9965cb104aeSGeliang Tang static inline bool mptcp_pm_should_rm_signal(struct mptcp_sock *msk)
9975cb104aeSGeliang Tang {
99813ad9f01SGeliang Tang return READ_ONCE(msk->pm.addr_signal) & BIT(MPTCP_RM_ADDR_SIGNAL);
9995cb104aeSGeliang Tang }
10005cb104aeSGeliang Tang
mptcp_pm_is_userspace(const struct mptcp_sock * msk)100114b06811SMat Martineau static inline bool mptcp_pm_is_userspace(const struct mptcp_sock *msk)
100214b06811SMat Martineau {
100314b06811SMat Martineau return READ_ONCE(msk->pm.pm_type) == MPTCP_PM_TYPE_USERSPACE;
100414b06811SMat Martineau }
100514b06811SMat Martineau
mptcp_pm_is_kernel(const struct mptcp_sock * msk)10064d25247dSKishen Maloor static inline bool mptcp_pm_is_kernel(const struct mptcp_sock *msk)
10074d25247dSKishen Maloor {
10084d25247dSKishen Maloor return READ_ONCE(msk->pm.pm_type) == MPTCP_PM_TYPE_KERNEL;
10094d25247dSKishen Maloor }
10104d25247dSKishen Maloor
mptcp_add_addr_len(int family,bool echo,bool port)10114a2777a8SGeliang Tang static inline unsigned int mptcp_add_addr_len(int family, bool echo, bool port)
10121b1c7a0eSPeter Krystad {
10132ec72faeSGeliang Tang u8 len = TCPOLEN_MPTCP_ADD_ADDR_BASE;
10142ec72faeSGeliang Tang
10152ec72faeSGeliang Tang if (family == AF_INET6)
10162ec72faeSGeliang Tang len = TCPOLEN_MPTCP_ADD_ADDR6_BASE;
10172ec72faeSGeliang Tang if (!echo)
10182ec72faeSGeliang Tang len += MPTCPOPT_THMAC_LEN;
101927ab92d9SDavide Caratti /* account for 2 trailing 'nop' options */
10204a2777a8SGeliang Tang if (port)
102127ab92d9SDavide Caratti len += TCPOLEN_MPTCP_PORT_LEN + TCPOLEN_MPTCP_PORT_ALIGN;
10222ec72faeSGeliang Tang
10232ec72faeSGeliang Tang return len;
10241b1c7a0eSPeter Krystad }
10251b1c7a0eSPeter Krystad
mptcp_rm_addr_len(const struct mptcp_rm_list * rm_list)10266445e17aSGeliang Tang static inline int mptcp_rm_addr_len(const struct mptcp_rm_list *rm_list)
10276445e17aSGeliang Tang {
10286445e17aSGeliang Tang if (rm_list->nr == 0 || rm_list->nr > MPTCP_RM_IDS_MAX)
10296445e17aSGeliang Tang return -EINVAL;
10306445e17aSGeliang Tang
10316445e17aSGeliang Tang return TCPOLEN_MPTCP_RM_ADDR_BASE + roundup(rm_list->nr - 1, 4) + 1;
10326445e17aSGeliang Tang }
10336445e17aSGeliang Tang
103490d93088SPaolo Abeni bool mptcp_pm_add_addr_signal(struct mptcp_sock *msk, const struct sk_buff *skb,
10351f5e9e2fSYonglong Li unsigned int opt_size, unsigned int remaining,
1036f462a446SYonglong Li struct mptcp_addr_info *addr, bool *echo,
1037af7939f3SGeliang Tang bool *drop_other_suboptions);
10385cb104aeSGeliang Tang bool mptcp_pm_rm_addr_signal(struct mptcp_sock *msk, unsigned int remaining,
10396445e17aSGeliang Tang struct mptcp_rm_list *rm_list);
10401b1c7a0eSPeter Krystad int mptcp_pm_get_local_id(struct mptcp_sock *msk, struct sock_common *skc);
10419bbec87eSGeliang Tang int mptcp_pm_nl_get_local_id(struct mptcp_sock *msk, struct mptcp_addr_info *skc);
10428b201370SKishen Maloor int mptcp_userspace_pm_get_local_id(struct mptcp_sock *msk, struct mptcp_addr_info *skc);
1043fff9b920SMatthieu Baerts (NGI0) bool mptcp_pm_is_backup(struct mptcp_sock *msk, struct sock_common *skc);
1044fff9b920SMatthieu Baerts (NGI0) bool mptcp_pm_nl_is_backup(struct mptcp_sock *msk, struct mptcp_addr_info *skc);
1045fff9b920SMatthieu Baerts (NGI0) bool mptcp_userspace_pm_is_backup(struct mptcp_sock *msk, struct mptcp_addr_info *skc);
10461b1c7a0eSPeter Krystad
subflow_get_local_id(const struct mptcp_subflow_context * subflow)1047ba2cf922SPaolo Abeni static inline u8 subflow_get_local_id(const struct mptcp_subflow_context *subflow)
1048ba2cf922SPaolo Abeni {
1049ba2cf922SPaolo Abeni int local_id = READ_ONCE(subflow->local_id);
1050ba2cf922SPaolo Abeni
1051ba2cf922SPaolo Abeni if (local_id < 0)
1052ba2cf922SPaolo Abeni return 0;
1053ba2cf922SPaolo Abeni return local_id;
1054ba2cf922SPaolo Abeni }
1055ba2cf922SPaolo Abeni
1056d39dcecaSPaolo Abeni void __init mptcp_pm_nl_init(void);
1057e9801430SFlorian Westphal void mptcp_pm_nl_work(struct mptcp_sock *msk);
105890d93088SPaolo Abeni unsigned int mptcp_pm_get_add_addr_signal_max(const struct mptcp_sock *msk);
105990d93088SPaolo Abeni unsigned int mptcp_pm_get_add_addr_accept_max(const struct mptcp_sock *msk);
106090d93088SPaolo Abeni unsigned int mptcp_pm_get_subflows_max(const struct mptcp_sock *msk);
106190d93088SPaolo Abeni unsigned int mptcp_pm_get_local_addr_max(const struct mptcp_sock *msk);
106201cacb00SPaolo Abeni
106395d68651SPaolo Abeni /* called under PM lock */
__mptcp_pm_close_subflow(struct mptcp_sock * msk)106495d68651SPaolo Abeni static inline void __mptcp_pm_close_subflow(struct mptcp_sock *msk)
106595d68651SPaolo Abeni {
106695d68651SPaolo Abeni if (--msk->pm.subflows < mptcp_pm_get_subflows_max(msk))
106795d68651SPaolo Abeni WRITE_ONCE(msk->pm.accept_subflow, true);
106895d68651SPaolo Abeni }
106995d68651SPaolo Abeni
mptcp_pm_close_subflow(struct mptcp_sock * msk)107095d68651SPaolo Abeni static inline void mptcp_pm_close_subflow(struct mptcp_sock *msk)
107195d68651SPaolo Abeni {
107295d68651SPaolo Abeni spin_lock_bh(&msk->pm.lock);
107395d68651SPaolo Abeni __mptcp_pm_close_subflow(msk);
107495d68651SPaolo Abeni spin_unlock_bh(&msk->pm.lock);
107595d68651SPaolo Abeni }
107695d68651SPaolo Abeni
107778962489SFlorian Westphal void mptcp_sockopt_sync(struct mptcp_sock *msk, struct sock *ssk);
10783e501490SPaolo Abeni void mptcp_sockopt_sync_locked(struct mptcp_sock *msk, struct sock *ssk);
107978962489SFlorian Westphal
mptcp_get_ext(const struct sk_buff * skb)1080dc87efdbSFlorian Westphal static inline struct mptcp_ext *mptcp_get_ext(const struct sk_buff *skb)
10816d0060f6SMat Martineau {
10826d0060f6SMat Martineau return (struct mptcp_ext *)skb_ext_find(skb, SKB_EXT_MPTCP);
10836d0060f6SMat Martineau }
10846d0060f6SMat Martineau
10855147dfb5SDavide Caratti void mptcp_diag_subflow_init(struct tcp_ulp_ops *ops);
10865147dfb5SDavide Caratti
__mptcp_check_fallback(const struct mptcp_sock * msk)1087d5f49190SPaolo Abeni static inline bool __mptcp_check_fallback(const struct mptcp_sock *msk)
1088e1ff9e82SDavide Caratti {
1089e1ff9e82SDavide Caratti return test_bit(MPTCP_FALLBACK_DONE, &msk->flags);
1090e1ff9e82SDavide Caratti }
1091e1ff9e82SDavide Caratti
mptcp_check_fallback(const struct sock * sk)1092d5f49190SPaolo Abeni static inline bool mptcp_check_fallback(const struct sock *sk)
1093e1ff9e82SDavide Caratti {
1094e1ff9e82SDavide Caratti struct mptcp_subflow_context *subflow = mptcp_subflow_ctx(sk);
1095e1ff9e82SDavide Caratti struct mptcp_sock *msk = mptcp_sk(subflow->conn);
1096e1ff9e82SDavide Caratti
1097e1ff9e82SDavide Caratti return __mptcp_check_fallback(msk);
1098e1ff9e82SDavide Caratti }
1099e1ff9e82SDavide Caratti
__mptcp_do_fallback(struct mptcp_sock * msk)1100e1ff9e82SDavide Caratti static inline void __mptcp_do_fallback(struct mptcp_sock *msk)
1101e1ff9e82SDavide Caratti {
1102e1ff9e82SDavide Caratti if (test_bit(MPTCP_FALLBACK_DONE, &msk->flags)) {
11033d2e1b82SMatthieu Baerts (NGI0) pr_debug("TCP fallback already done (msk=%p)\n", msk);
1104e1ff9e82SDavide Caratti return;
1105e1ff9e82SDavide Caratti }
1106*47f42722SMatthieu Baerts (NGI0) if (WARN_ON_ONCE(!READ_ONCE(msk->allow_infinite_fallback)))
1107*47f42722SMatthieu Baerts (NGI0) return;
1108e1ff9e82SDavide Caratti set_bit(MPTCP_FALLBACK_DONE, &msk->flags);
1109e1ff9e82SDavide Caratti }
1110e1ff9e82SDavide Caratti
1111d51991e2SPaolo Abeni static inline void mptcp_do_fallback(struct sock *ssk)
1112e1ff9e82SDavide Caratti {
1113d51991e2SPaolo Abeni struct mptcp_subflow_context *subflow = mptcp_subflow_ctx(ssk);
1114d51991e2SPaolo Abeni struct sock *sk = subflow->conn;
1115d51991e2SPaolo Abeni struct mptcp_sock *msk;
1116e1ff9e82SDavide Caratti
1117d51991e2SPaolo Abeni msk = mptcp_sk(sk);
1118e1ff9e82SDavide Caratti __mptcp_do_fallback(msk);
1119d51991e2SPaolo Abeni if (READ_ONCE(msk->snd_data_fin_enable) && !(ssk->sk_shutdown & SEND_SHUTDOWN)) {
1120d51991e2SPaolo Abeni gfp_t saved_allocation = ssk->sk_allocation;
1121d51991e2SPaolo Abeni
1122d51991e2SPaolo Abeni /* we are in a atomic (BH) scope, override ssk default for data
1123d51991e2SPaolo Abeni * fin allocation
1124d51991e2SPaolo Abeni */
1125d51991e2SPaolo Abeni ssk->sk_allocation = GFP_ATOMIC;
1126d51991e2SPaolo Abeni ssk->sk_shutdown |= SEND_SHUTDOWN;
1127d51991e2SPaolo Abeni tcp_shutdown(ssk, SEND_SHUTDOWN);
1128d51991e2SPaolo Abeni ssk->sk_allocation = saved_allocation;
1129d51991e2SPaolo Abeni }
1130e1ff9e82SDavide Caratti }
1131e1ff9e82SDavide Caratti
/* Debug trace for a fallback to TCP: prints the calling function's name
 * (__func__) followed by the msk pointer passed as @msk.
 */
#define pr_fallback(msk) \
	pr_debug("%s:fallback to TCP (msk=%p)\n", __func__, (msk))
1133e1ff9e82SDavide Caratti
11341e39e5a3SGeliang Tang static inline bool mptcp_check_infinite_map(struct sk_buff *skb)
11351e39e5a3SGeliang Tang {
11361e39e5a3SGeliang Tang struct mptcp_ext *mpext;
11371e39e5a3SGeliang Tang
11381e39e5a3SGeliang Tang mpext = skb ? mptcp_get_ext(skb) : NULL;
11391e39e5a3SGeliang Tang if (mpext && mpext->infinite_map)
11401e39e5a3SGeliang Tang return true;
11411e39e5a3SGeliang Tang
11421e39e5a3SGeliang Tang return false;
11431e39e5a3SGeliang Tang }
11441e39e5a3SGeliang Tang
114570c708e8SKishen Maloor static inline bool is_active_ssk(struct mptcp_subflow_context *subflow)
114670c708e8SKishen Maloor {
114770c708e8SKishen Maloor return (subflow->request_mptcp || subflow->request_join);
subflow_simultaneous_connect(struct sock * sk)114870c708e8SKishen Maloor }
114970c708e8SKishen Maloor
11508fd73804SDavide Caratti static inline bool subflow_simultaneous_connect(struct sock *sk)
11518fd73804SDavide Caratti {
11528fd73804SDavide Caratti struct mptcp_subflow_context *subflow = mptcp_subflow_ctx(sk);
11538fd73804SDavide Caratti
11544bfe217eSPaolo Abeni return (1 << sk->sk_state) &
11554bfe217eSPaolo Abeni (TCPF_ESTABLISHED | TCPF_FIN_WAIT1 | TCPF_FIN_WAIT2 | TCPF_CLOSING) &&
115670c708e8SKishen Maloor is_active_ssk(subflow) &&
11578fd73804SDavide Caratti !subflow->conn_finished;
11588fd73804SDavide Caratti }
11598fd73804SDavide Caratti
#ifdef CONFIG_SYN_COOKIES
/* CONFIG_SYN_COOKIES enabled: only prototypes here, the implementations
 * live outside this header.
 */
void subflow_init_req_cookie_join_save(const struct mptcp_subflow_request_sock *subflow_req,
				       struct sk_buff *skb);
bool mptcp_token_join_cookie_init_state(struct mptcp_subflow_request_sock *subflow_req,
					struct sk_buff *skb);
void __init mptcp_join_cookie_init(void);
#else
/* CONFIG_SYN_COOKIES disabled: empty stubs with the same signatures, so
 * callers need no conditional compilation of their own. The init_state
 * stub always reports false.
 */
static inline void
subflow_init_req_cookie_join_save(const struct mptcp_subflow_request_sock *subflow_req,
				  struct sk_buff *skb)
{
}

static inline bool
mptcp_token_join_cookie_init_state(struct mptcp_subflow_request_sock *subflow_req,
				   struct sk_buff *skb)
{
	return false;
}

static inline void mptcp_join_cookie_init(void)
{
}
#endif /* CONFIG_SYN_COOKIES */
11799466a1ccSFlorian Westphal
1180f870fa0bSMat Martineau #endif /* __MPTCP_PROTOCOL_H */
1181