xref: /openbmc/linux/net/mptcp/sched.c (revision ac8f933664c3a0e2d42f6ee9a2a6d25f87cb23f6)
// SPDX-License-Identifier: GPL-2.0
/* Multipath TCP
 *
 * Copyright (c) 2022, SUSE.
 */
6740ebe35SGeliang Tang 
7740ebe35SGeliang Tang #define pr_fmt(fmt) "MPTCP: " fmt
8740ebe35SGeliang Tang 
9740ebe35SGeliang Tang #include <linux/kernel.h>
10740ebe35SGeliang Tang #include <linux/module.h>
11740ebe35SGeliang Tang #include <linux/list.h>
12740ebe35SGeliang Tang #include <linux/rculist.h>
13740ebe35SGeliang Tang #include <linux/spinlock.h>
14740ebe35SGeliang Tang #include "protocol.h"
15740ebe35SGeliang Tang 
/* List of registered packet schedulers. */
static LIST_HEAD(mptcp_sched_list);
/* Taken around every addition to and removal from mptcp_sched_list. */
static DEFINE_SPINLOCK(mptcp_sched_list_lock);
18740ebe35SGeliang Tang 
mptcp_sched_default_get_subflow(struct mptcp_sock * msk,struct mptcp_sched_data * data)19ed1ad86bSGeliang Tang static int mptcp_sched_default_get_subflow(struct mptcp_sock *msk,
20ed1ad86bSGeliang Tang 					   struct mptcp_sched_data *data)
21ed1ad86bSGeliang Tang {
22ed1ad86bSGeliang Tang 	struct sock *ssk;
23ed1ad86bSGeliang Tang 
24ed1ad86bSGeliang Tang 	ssk = data->reinject ? mptcp_subflow_get_retrans(msk) :
25ed1ad86bSGeliang Tang 			       mptcp_subflow_get_send(msk);
26ed1ad86bSGeliang Tang 	if (!ssk)
27ed1ad86bSGeliang Tang 		return -EINVAL;
28ed1ad86bSGeliang Tang 
29ed1ad86bSGeliang Tang 	mptcp_subflow_set_scheduled(mptcp_subflow_ctx(ssk), true);
30ed1ad86bSGeliang Tang 	return 0;
31ed1ad86bSGeliang Tang }
32ed1ad86bSGeliang Tang 
33ed1ad86bSGeliang Tang static struct mptcp_sched_ops mptcp_sched_default = {
34ed1ad86bSGeliang Tang 	.get_subflow	= mptcp_sched_default_get_subflow,
35ed1ad86bSGeliang Tang 	.name		= "default",
36ed1ad86bSGeliang Tang 	.owner		= THIS_MODULE,
37ed1ad86bSGeliang Tang };
38ed1ad86bSGeliang Tang 
39740ebe35SGeliang Tang /* Must be called with rcu read lock held */
mptcp_sched_find(const char * name)40740ebe35SGeliang Tang struct mptcp_sched_ops *mptcp_sched_find(const char *name)
41740ebe35SGeliang Tang {
42740ebe35SGeliang Tang 	struct mptcp_sched_ops *sched, *ret = NULL;
43740ebe35SGeliang Tang 
44740ebe35SGeliang Tang 	list_for_each_entry_rcu(sched, &mptcp_sched_list, list) {
45740ebe35SGeliang Tang 		if (!strcmp(sched->name, name)) {
46740ebe35SGeliang Tang 			ret = sched;
47740ebe35SGeliang Tang 			break;
48740ebe35SGeliang Tang 		}
49740ebe35SGeliang Tang 	}
50740ebe35SGeliang Tang 
51740ebe35SGeliang Tang 	return ret;
52740ebe35SGeliang Tang }
53740ebe35SGeliang Tang 
mptcp_register_scheduler(struct mptcp_sched_ops * sched)54740ebe35SGeliang Tang int mptcp_register_scheduler(struct mptcp_sched_ops *sched)
55740ebe35SGeliang Tang {
56740ebe35SGeliang Tang 	if (!sched->get_subflow)
57740ebe35SGeliang Tang 		return -EINVAL;
58740ebe35SGeliang Tang 
59740ebe35SGeliang Tang 	spin_lock(&mptcp_sched_list_lock);
60740ebe35SGeliang Tang 	if (mptcp_sched_find(sched->name)) {
61740ebe35SGeliang Tang 		spin_unlock(&mptcp_sched_list_lock);
62740ebe35SGeliang Tang 		return -EEXIST;
63740ebe35SGeliang Tang 	}
64740ebe35SGeliang Tang 	list_add_tail_rcu(&sched->list, &mptcp_sched_list);
65740ebe35SGeliang Tang 	spin_unlock(&mptcp_sched_list_lock);
66740ebe35SGeliang Tang 
67*3d2e1b82SMatthieu Baerts (NGI0) 	pr_debug("%s registered\n", sched->name);
68740ebe35SGeliang Tang 	return 0;
69740ebe35SGeliang Tang }
70740ebe35SGeliang Tang 
mptcp_unregister_scheduler(struct mptcp_sched_ops * sched)71740ebe35SGeliang Tang void mptcp_unregister_scheduler(struct mptcp_sched_ops *sched)
72740ebe35SGeliang Tang {
73ed1ad86bSGeliang Tang 	if (sched == &mptcp_sched_default)
74ed1ad86bSGeliang Tang 		return;
75ed1ad86bSGeliang Tang 
76740ebe35SGeliang Tang 	spin_lock(&mptcp_sched_list_lock);
77740ebe35SGeliang Tang 	list_del_rcu(&sched->list);
78740ebe35SGeliang Tang 	spin_unlock(&mptcp_sched_list_lock);
79740ebe35SGeliang Tang }
801730b2b2SGeliang Tang 
mptcp_sched_init(void)81ed1ad86bSGeliang Tang void mptcp_sched_init(void)
82ed1ad86bSGeliang Tang {
83ed1ad86bSGeliang Tang 	mptcp_register_scheduler(&mptcp_sched_default);
84ed1ad86bSGeliang Tang }
85ed1ad86bSGeliang Tang 
mptcp_init_sched(struct mptcp_sock * msk,struct mptcp_sched_ops * sched)861730b2b2SGeliang Tang int mptcp_init_sched(struct mptcp_sock *msk,
871730b2b2SGeliang Tang 		     struct mptcp_sched_ops *sched)
881730b2b2SGeliang Tang {
891730b2b2SGeliang Tang 	if (!sched)
90ed1ad86bSGeliang Tang 		sched = &mptcp_sched_default;
911730b2b2SGeliang Tang 
921730b2b2SGeliang Tang 	if (!bpf_try_module_get(sched, sched->owner))
931730b2b2SGeliang Tang 		return -EBUSY;
941730b2b2SGeliang Tang 
951730b2b2SGeliang Tang 	msk->sched = sched;
961730b2b2SGeliang Tang 	if (msk->sched->init)
971730b2b2SGeliang Tang 		msk->sched->init(msk);
981730b2b2SGeliang Tang 
99*3d2e1b82SMatthieu Baerts (NGI0) 	pr_debug("sched=%s\n", msk->sched->name);
1001730b2b2SGeliang Tang 
1011730b2b2SGeliang Tang 	return 0;
1021730b2b2SGeliang Tang }
1031730b2b2SGeliang Tang 
mptcp_release_sched(struct mptcp_sock * msk)1041730b2b2SGeliang Tang void mptcp_release_sched(struct mptcp_sock *msk)
1051730b2b2SGeliang Tang {
1061730b2b2SGeliang Tang 	struct mptcp_sched_ops *sched = msk->sched;
1071730b2b2SGeliang Tang 
1081730b2b2SGeliang Tang 	if (!sched)
1091730b2b2SGeliang Tang 		return;
1101730b2b2SGeliang Tang 
1111730b2b2SGeliang Tang 	msk->sched = NULL;
1121730b2b2SGeliang Tang 	if (sched->release)
1131730b2b2SGeliang Tang 		sched->release(msk);
1141730b2b2SGeliang Tang 
1151730b2b2SGeliang Tang 	bpf_module_put(sched, sched->owner);
1161730b2b2SGeliang Tang }
117fce68b03SGeliang Tang 
/* Store @scheduled into subflow->scheduled using WRITE_ONCE(). */
void mptcp_subflow_set_scheduled(struct mptcp_subflow_context *subflow,
				 bool scheduled)
{
	WRITE_ONCE(subflow->scheduled, scheduled);
}
12307336a87SGeliang Tang 
mptcp_sched_get_send(struct mptcp_sock * msk)12407336a87SGeliang Tang int mptcp_sched_get_send(struct mptcp_sock *msk)
12507336a87SGeliang Tang {
12607336a87SGeliang Tang 	struct mptcp_subflow_context *subflow;
12707336a87SGeliang Tang 	struct mptcp_sched_data data;
12807336a87SGeliang Tang 
1290fa1b378SGeliang Tang 	msk_owned_by_me(msk);
1300fa1b378SGeliang Tang 
1310fa1b378SGeliang Tang 	/* the following check is moved out of mptcp_subflow_get_send */
1320fa1b378SGeliang Tang 	if (__mptcp_check_fallback(msk)) {
1330fa1b378SGeliang Tang 		if (msk->first &&
1340fa1b378SGeliang Tang 		    __tcp_can_send(msk->first) &&
1350fa1b378SGeliang Tang 		    sk_stream_memory_free(msk->first)) {
1360fa1b378SGeliang Tang 			mptcp_subflow_set_scheduled(mptcp_subflow_ctx(msk->first), true);
1370fa1b378SGeliang Tang 			return 0;
1380fa1b378SGeliang Tang 		}
1390fa1b378SGeliang Tang 		return -EINVAL;
1400fa1b378SGeliang Tang 	}
1410fa1b378SGeliang Tang 
14207336a87SGeliang Tang 	mptcp_for_each_subflow(msk, subflow) {
14307336a87SGeliang Tang 		if (READ_ONCE(subflow->scheduled))
14407336a87SGeliang Tang 			return 0;
14507336a87SGeliang Tang 	}
14607336a87SGeliang Tang 
14707336a87SGeliang Tang 	data.reinject = false;
148ed1ad86bSGeliang Tang 	if (msk->sched == &mptcp_sched_default || !msk->sched)
149ed1ad86bSGeliang Tang 		return mptcp_sched_default_get_subflow(msk, &data);
15007336a87SGeliang Tang 	return msk->sched->get_subflow(msk, &data);
15107336a87SGeliang Tang }
15207336a87SGeliang Tang 
mptcp_sched_get_retrans(struct mptcp_sock * msk)15307336a87SGeliang Tang int mptcp_sched_get_retrans(struct mptcp_sock *msk)
15407336a87SGeliang Tang {
15507336a87SGeliang Tang 	struct mptcp_subflow_context *subflow;
15607336a87SGeliang Tang 	struct mptcp_sched_data data;
15707336a87SGeliang Tang 
158ee2708aeSGeliang Tang 	msk_owned_by_me(msk);
159ee2708aeSGeliang Tang 
160ee2708aeSGeliang Tang 	/* the following check is moved out of mptcp_subflow_get_retrans */
161ee2708aeSGeliang Tang 	if (__mptcp_check_fallback(msk))
162ee2708aeSGeliang Tang 		return -EINVAL;
163ee2708aeSGeliang Tang 
16407336a87SGeliang Tang 	mptcp_for_each_subflow(msk, subflow) {
16507336a87SGeliang Tang 		if (READ_ONCE(subflow->scheduled))
16607336a87SGeliang Tang 			return 0;
16707336a87SGeliang Tang 	}
16807336a87SGeliang Tang 
16907336a87SGeliang Tang 	data.reinject = true;
170ed1ad86bSGeliang Tang 	if (msk->sched == &mptcp_sched_default || !msk->sched)
171ed1ad86bSGeliang Tang 		return mptcp_sched_default_get_subflow(msk, &data);
17207336a87SGeliang Tang 	return msk->sched->get_subflow(msk, &data);
17307336a87SGeliang Tang }
174