13b3009eaSChuck Lever // SPDX-License-Identifier: GPL-2.0-only
23b3009eaSChuck Lever /*
33b3009eaSChuck Lever * Generic netlink handshake service
43b3009eaSChuck Lever *
53b3009eaSChuck Lever * Author: Chuck Lever <chuck.lever@oracle.com>
63b3009eaSChuck Lever *
73b3009eaSChuck Lever * Copyright (c) 2023, Oracle and/or its affiliates.
83b3009eaSChuck Lever */
93b3009eaSChuck Lever
103b3009eaSChuck Lever #include <linux/types.h>
113b3009eaSChuck Lever #include <linux/socket.h>
123b3009eaSChuck Lever #include <linux/kernel.h>
133b3009eaSChuck Lever #include <linux/module.h>
143b3009eaSChuck Lever #include <linux/skbuff.h>
153b3009eaSChuck Lever #include <linux/mm.h>
163b3009eaSChuck Lever
173b3009eaSChuck Lever #include <net/sock.h>
183b3009eaSChuck Lever #include <net/genetlink.h>
193b3009eaSChuck Lever #include <net/netns/generic.h>
203b3009eaSChuck Lever
2188232ec1SChuck Lever #include <kunit/visibility.h>
2288232ec1SChuck Lever
233b3009eaSChuck Lever #include <uapi/linux/handshake.h>
243b3009eaSChuck Lever #include "handshake.h"
253b3009eaSChuck Lever #include "genl.h"
263b3009eaSChuck Lever
273b3009eaSChuck Lever #include <trace/events/handshake.h>
283b3009eaSChuck Lever
293b3009eaSChuck Lever /**
303b3009eaSChuck Lever * handshake_genl_notify - Notify handlers that a request is waiting
313b3009eaSChuck Lever * @net: target network namespace
323b3009eaSChuck Lever * @proto: handshake protocol
333b3009eaSChuck Lever * @flags: memory allocation control flags
343b3009eaSChuck Lever *
353b3009eaSChuck Lever * Returns zero on success or a negative errno if notification failed.
363b3009eaSChuck Lever */
handshake_genl_notify(struct net * net,const struct handshake_proto * proto,gfp_t flags)373b3009eaSChuck Lever int handshake_genl_notify(struct net *net, const struct handshake_proto *proto,
383b3009eaSChuck Lever gfp_t flags)
393b3009eaSChuck Lever {
403b3009eaSChuck Lever struct sk_buff *msg;
413b3009eaSChuck Lever void *hdr;
423b3009eaSChuck Lever
4388232ec1SChuck Lever /* Disable notifications during unit testing */
4488232ec1SChuck Lever if (!test_bit(HANDSHAKE_F_PROTO_NOTIFY, &proto->hp_flags))
4588232ec1SChuck Lever return 0;
4688232ec1SChuck Lever
473b3009eaSChuck Lever if (!genl_has_listeners(&handshake_nl_family, net,
483b3009eaSChuck Lever proto->hp_handler_class))
493b3009eaSChuck Lever return -ESRCH;
503b3009eaSChuck Lever
51fc490880SChuck Lever msg = genlmsg_new(GENLMSG_DEFAULT_SIZE, flags);
523b3009eaSChuck Lever if (!msg)
533b3009eaSChuck Lever return -ENOMEM;
543b3009eaSChuck Lever
553b3009eaSChuck Lever hdr = genlmsg_put(msg, 0, 0, &handshake_nl_family, 0,
563b3009eaSChuck Lever HANDSHAKE_CMD_READY);
573b3009eaSChuck Lever if (!hdr)
583b3009eaSChuck Lever goto out_free;
593b3009eaSChuck Lever
603b3009eaSChuck Lever if (nla_put_u32(msg, HANDSHAKE_A_ACCEPT_HANDLER_CLASS,
613b3009eaSChuck Lever proto->hp_handler_class) < 0) {
623b3009eaSChuck Lever genlmsg_cancel(msg, hdr);
633b3009eaSChuck Lever goto out_free;
643b3009eaSChuck Lever }
653b3009eaSChuck Lever
663b3009eaSChuck Lever genlmsg_end(msg, hdr);
673b3009eaSChuck Lever return genlmsg_multicast_netns(&handshake_nl_family, net, msg,
683b3009eaSChuck Lever 0, proto->hp_handler_class, flags);
693b3009eaSChuck Lever
703b3009eaSChuck Lever out_free:
713b3009eaSChuck Lever nlmsg_free(msg);
723b3009eaSChuck Lever return -EMSGSIZE;
733b3009eaSChuck Lever }
743b3009eaSChuck Lever
753b3009eaSChuck Lever /**
763b3009eaSChuck Lever * handshake_genl_put - Create a generic netlink message header
773b3009eaSChuck Lever * @msg: buffer in which to create the header
783b3009eaSChuck Lever * @info: generic netlink message context
793b3009eaSChuck Lever *
803b3009eaSChuck Lever * Returns a ready-to-use header, or NULL.
813b3009eaSChuck Lever */
handshake_genl_put(struct sk_buff * msg,struct genl_info * info)823b3009eaSChuck Lever struct nlmsghdr *handshake_genl_put(struct sk_buff *msg,
833b3009eaSChuck Lever struct genl_info *info)
843b3009eaSChuck Lever {
853b3009eaSChuck Lever return genlmsg_put(msg, info->snd_portid, info->snd_seq,
863b3009eaSChuck Lever &handshake_nl_family, 0, info->genlhdr->cmd);
873b3009eaSChuck Lever }
883b3009eaSChuck Lever EXPORT_SYMBOL(handshake_genl_put);
893b3009eaSChuck Lever
handshake_nl_accept_doit(struct sk_buff * skb,struct genl_info * info)903b3009eaSChuck Lever int handshake_nl_accept_doit(struct sk_buff *skb, struct genl_info *info)
913b3009eaSChuck Lever {
923b3009eaSChuck Lever struct net *net = sock_net(skb->sk);
933b3009eaSChuck Lever struct handshake_net *hn = handshake_pernet(net);
943b3009eaSChuck Lever struct handshake_req *req = NULL;
953b3009eaSChuck Lever struct socket *sock;
963b3009eaSChuck Lever int class, fd, err;
973b3009eaSChuck Lever
983b3009eaSChuck Lever err = -EOPNOTSUPP;
993b3009eaSChuck Lever if (!hn)
1003b3009eaSChuck Lever goto out_status;
1013b3009eaSChuck Lever
1023b3009eaSChuck Lever err = -EINVAL;
1033b3009eaSChuck Lever if (GENL_REQ_ATTR_CHECK(info, HANDSHAKE_A_ACCEPT_HANDLER_CLASS))
1043b3009eaSChuck Lever goto out_status;
1053b3009eaSChuck Lever class = nla_get_u32(info->attrs[HANDSHAKE_A_ACCEPT_HANDLER_CLASS]);
1063b3009eaSChuck Lever
1073b3009eaSChuck Lever err = -EAGAIN;
1083b3009eaSChuck Lever req = handshake_req_next(hn, class);
1093b3009eaSChuck Lever if (!req)
1103b3009eaSChuck Lever goto out_status;
1113b3009eaSChuck Lever
1123b3009eaSChuck Lever sock = req->hr_sk->sk_socket;
113*7798b594SMoritz Wanzenböck fd = get_unused_fd_flags(O_CLOEXEC);
1143b3009eaSChuck Lever if (fd < 0) {
1153b3009eaSChuck Lever err = fd;
1163b3009eaSChuck Lever goto out_complete;
1173b3009eaSChuck Lever }
118*7798b594SMoritz Wanzenböck
1193b3009eaSChuck Lever err = req->hr_proto->hp_accept(req, info, fd);
1207ea9c1ecSChuck Lever if (err) {
121*7798b594SMoritz Wanzenböck put_unused_fd(fd);
1223b3009eaSChuck Lever goto out_complete;
1237ea9c1ecSChuck Lever }
1243b3009eaSChuck Lever
125*7798b594SMoritz Wanzenböck fd_install(fd, get_file(sock->file));
126*7798b594SMoritz Wanzenböck
1273b3009eaSChuck Lever trace_handshake_cmd_accept(net, req, req->hr_sk, fd);
1283b3009eaSChuck Lever return 0;
1293b3009eaSChuck Lever
1303b3009eaSChuck Lever out_complete:
1313b3009eaSChuck Lever handshake_complete(req, -EIO, NULL);
1323b3009eaSChuck Lever out_status:
1333b3009eaSChuck Lever trace_handshake_cmd_accept_err(net, req, NULL, err);
1343b3009eaSChuck Lever return err;
1353b3009eaSChuck Lever }
1363b3009eaSChuck Lever
handshake_nl_done_doit(struct sk_buff * skb,struct genl_info * info)1373b3009eaSChuck Lever int handshake_nl_done_doit(struct sk_buff *skb, struct genl_info *info)
1383b3009eaSChuck Lever {
1393b3009eaSChuck Lever struct net *net = sock_net(skb->sk);
14082ba0ff7SEric Dumazet struct handshake_req *req;
14182ba0ff7SEric Dumazet struct socket *sock;
1423b3009eaSChuck Lever int fd, status, err;
1433b3009eaSChuck Lever
1443b3009eaSChuck Lever if (GENL_REQ_ATTR_CHECK(info, HANDSHAKE_A_DONE_SOCKFD))
1453b3009eaSChuck Lever return -EINVAL;
1463b3009eaSChuck Lever fd = nla_get_u32(info->attrs[HANDSHAKE_A_DONE_SOCKFD]);
1473b3009eaSChuck Lever
1483b3009eaSChuck Lever sock = sockfd_lookup(fd, &err);
14982ba0ff7SEric Dumazet if (!sock)
15082ba0ff7SEric Dumazet return err;
1513b3009eaSChuck Lever
1523b3009eaSChuck Lever req = handshake_req_hash_lookup(sock->sk);
1533b3009eaSChuck Lever if (!req) {
1543b3009eaSChuck Lever err = -EBUSY;
15582ba0ff7SEric Dumazet trace_handshake_cmd_done_err(net, req, sock->sk, err);
1563b3009eaSChuck Lever fput(sock->file);
15782ba0ff7SEric Dumazet return err;
1583b3009eaSChuck Lever }
1593b3009eaSChuck Lever
1603b3009eaSChuck Lever trace_handshake_cmd_done(net, req, sock->sk, fd);
1613b3009eaSChuck Lever
1623b3009eaSChuck Lever status = -EIO;
1633b3009eaSChuck Lever if (info->attrs[HANDSHAKE_A_DONE_STATUS])
1643b3009eaSChuck Lever status = nla_get_u32(info->attrs[HANDSHAKE_A_DONE_STATUS]);
1653b3009eaSChuck Lever
1663b3009eaSChuck Lever handshake_complete(req, status, info);
1673b3009eaSChuck Lever fput(sock->file);
1683b3009eaSChuck Lever return 0;
1693b3009eaSChuck Lever }
1703b3009eaSChuck Lever
1713b3009eaSChuck Lever static unsigned int handshake_net_id;
1723b3009eaSChuck Lever
handshake_net_init(struct net * net)1733b3009eaSChuck Lever static int __net_init handshake_net_init(struct net *net)
1743b3009eaSChuck Lever {
1753b3009eaSChuck Lever struct handshake_net *hn = net_generic(net, handshake_net_id);
1763b3009eaSChuck Lever unsigned long tmp;
1773b3009eaSChuck Lever struct sysinfo si;
1783b3009eaSChuck Lever
1793b3009eaSChuck Lever /*
1803b3009eaSChuck Lever * Arbitrary limit to prevent handshakes that do not make
1813b3009eaSChuck Lever * progress from clogging up the system. The cap scales up
1823b3009eaSChuck Lever * with the amount of physical memory on the system.
1833b3009eaSChuck Lever */
1843b3009eaSChuck Lever si_meminfo(&si);
1853b3009eaSChuck Lever tmp = si.totalram / (25 * si.mem_unit);
1863b3009eaSChuck Lever hn->hn_pending_max = clamp(tmp, 3UL, 50UL);
1873b3009eaSChuck Lever
1883b3009eaSChuck Lever spin_lock_init(&hn->hn_lock);
1893b3009eaSChuck Lever hn->hn_pending = 0;
1903b3009eaSChuck Lever hn->hn_flags = 0;
1913b3009eaSChuck Lever INIT_LIST_HEAD(&hn->hn_requests);
1923b3009eaSChuck Lever return 0;
1933b3009eaSChuck Lever }
1943b3009eaSChuck Lever
handshake_net_exit(struct net * net)1953b3009eaSChuck Lever static void __net_exit handshake_net_exit(struct net *net)
1963b3009eaSChuck Lever {
1973b3009eaSChuck Lever struct handshake_net *hn = net_generic(net, handshake_net_id);
1983b3009eaSChuck Lever struct handshake_req *req;
1993b3009eaSChuck Lever LIST_HEAD(requests);
2003b3009eaSChuck Lever
2013b3009eaSChuck Lever /*
2023b3009eaSChuck Lever * Drain the net's pending list. Requests that have been
2033b3009eaSChuck Lever * accepted and are in progress will be destroyed when
2043b3009eaSChuck Lever * the socket is closed.
2053b3009eaSChuck Lever */
2063b3009eaSChuck Lever spin_lock(&hn->hn_lock);
2073b3009eaSChuck Lever set_bit(HANDSHAKE_F_NET_DRAINING, &hn->hn_flags);
2083b3009eaSChuck Lever list_splice_init(&requests, &hn->hn_requests);
2093b3009eaSChuck Lever spin_unlock(&hn->hn_lock);
2103b3009eaSChuck Lever
2113b3009eaSChuck Lever while (!list_empty(&requests)) {
2123b3009eaSChuck Lever req = list_first_entry(&requests, struct handshake_req, hr_list);
2133b3009eaSChuck Lever list_del(&req->hr_list);
2143b3009eaSChuck Lever
2153b3009eaSChuck Lever /*
2163b3009eaSChuck Lever * Requests on this list have not yet been
2173b3009eaSChuck Lever * accepted, so they do not have an fd to put.
2183b3009eaSChuck Lever */
2193b3009eaSChuck Lever
2203b3009eaSChuck Lever handshake_complete(req, -ETIMEDOUT, NULL);
2213b3009eaSChuck Lever }
2223b3009eaSChuck Lever }
2233b3009eaSChuck Lever
2246aa445e3SGeert Uytterhoeven static struct pernet_operations handshake_genl_net_ops = {
2253b3009eaSChuck Lever .init = handshake_net_init,
2263b3009eaSChuck Lever .exit = handshake_net_exit,
2273b3009eaSChuck Lever .id = &handshake_net_id,
2283b3009eaSChuck Lever .size = sizeof(struct handshake_net),
2293b3009eaSChuck Lever };
2303b3009eaSChuck Lever
2313b3009eaSChuck Lever /**
2323b3009eaSChuck Lever * handshake_pernet - Get the handshake private per-net structure
2333b3009eaSChuck Lever * @net: network namespace
2343b3009eaSChuck Lever *
2353b3009eaSChuck Lever * Returns a pointer to the net's private per-net structure for the
2363b3009eaSChuck Lever * handshake module, or NULL if handshake_init() failed.
2373b3009eaSChuck Lever */
handshake_pernet(struct net * net)2383b3009eaSChuck Lever struct handshake_net *handshake_pernet(struct net *net)
2393b3009eaSChuck Lever {
2403b3009eaSChuck Lever return handshake_net_id ?
2413b3009eaSChuck Lever net_generic(net, handshake_net_id) : NULL;
2423b3009eaSChuck Lever }
24388232ec1SChuck Lever EXPORT_SYMBOL_IF_KUNIT(handshake_pernet);
2443b3009eaSChuck Lever
handshake_init(void)2453b3009eaSChuck Lever static int __init handshake_init(void)
2463b3009eaSChuck Lever {
2473b3009eaSChuck Lever int ret;
2483b3009eaSChuck Lever
2493b3009eaSChuck Lever ret = handshake_req_hash_init();
2503b3009eaSChuck Lever if (ret) {
2513b3009eaSChuck Lever pr_warn("handshake: hash initialization failed (%d)\n", ret);
2523b3009eaSChuck Lever return ret;
2533b3009eaSChuck Lever }
2543b3009eaSChuck Lever
2553b3009eaSChuck Lever ret = genl_register_family(&handshake_nl_family);
2563b3009eaSChuck Lever if (ret) {
2573b3009eaSChuck Lever pr_warn("handshake: netlink registration failed (%d)\n", ret);
2583b3009eaSChuck Lever handshake_req_hash_destroy();
2593b3009eaSChuck Lever return ret;
2603b3009eaSChuck Lever }
2613b3009eaSChuck Lever
2623b3009eaSChuck Lever /*
2633b3009eaSChuck Lever * ORDER: register_pernet_subsys must be done last.
2643b3009eaSChuck Lever *
2653b3009eaSChuck Lever * If initialization does not make it past pernet_subsys
2663b3009eaSChuck Lever * registration, then handshake_net_id will remain 0. That
2673b3009eaSChuck Lever * shunts the handshake consumer API to return ENOTSUPP
2683b3009eaSChuck Lever * to prevent it from dereferencing something that hasn't
2693b3009eaSChuck Lever * been allocated.
2703b3009eaSChuck Lever */
2713b3009eaSChuck Lever ret = register_pernet_subsys(&handshake_genl_net_ops);
2723b3009eaSChuck Lever if (ret) {
2733b3009eaSChuck Lever pr_warn("handshake: pernet registration failed (%d)\n", ret);
2743b3009eaSChuck Lever genl_unregister_family(&handshake_nl_family);
2753b3009eaSChuck Lever handshake_req_hash_destroy();
2763b3009eaSChuck Lever }
2773b3009eaSChuck Lever
2783b3009eaSChuck Lever return ret;
2793b3009eaSChuck Lever }
2803b3009eaSChuck Lever
handshake_exit(void)2813b3009eaSChuck Lever static void __exit handshake_exit(void)
2823b3009eaSChuck Lever {
2833b3009eaSChuck Lever unregister_pernet_subsys(&handshake_genl_net_ops);
2843b3009eaSChuck Lever handshake_net_id = 0;
2853b3009eaSChuck Lever
2863b3009eaSChuck Lever handshake_req_hash_destroy();
2873b3009eaSChuck Lever genl_unregister_family(&handshake_nl_family);
2883b3009eaSChuck Lever }
2893b3009eaSChuck Lever
2903b3009eaSChuck Lever module_init(handshake_init);
2913b3009eaSChuck Lever module_exit(handshake_exit);
292