xref: /openbmc/linux/net/key/af_key.c (revision 5fa1f7680f2728d62561db6d4a9282c4d21f2324)
1 // SPDX-License-Identifier: GPL-2.0-or-later
2 /*
3  * net/key/af_key.c	An implementation of PF_KEYv2 sockets.
4  *
5  * Authors:	Maxim Giryaev	<gem@asplinux.ru>
6  *		David S. Miller	<davem@redhat.com>
7  *		Alexey Kuznetsov <kuznet@ms2.inr.ac.ru>
8  *		Kunihiro Ishiguro <kunihiro@ipinfusion.com>
9  *		Kazunori MIYAZAWA / USAGI Project <miyazawa@linux-ipv6.org>
10  *		Derek Atkins <derek@ihtfp.com>
11  */
12 
13 #include <linux/capability.h>
14 #include <linux/module.h>
15 #include <linux/kernel.h>
16 #include <linux/socket.h>
17 #include <linux/pfkeyv2.h>
18 #include <linux/ipsec.h>
19 #include <linux/skbuff.h>
20 #include <linux/rtnetlink.h>
21 #include <linux/in.h>
22 #include <linux/in6.h>
23 #include <linux/proc_fs.h>
24 #include <linux/init.h>
25 #include <linux/slab.h>
26 #include <net/net_namespace.h>
27 #include <net/netns/generic.h>
28 #include <net/xfrm.h>
29 
30 #include <net/sock.h>
31 
32 #define _X2KEY(x) ((x) == XFRM_INF ? 0 : (x))
33 #define _KEY2X(x) ((x) == 0 ? XFRM_INF : (x))
34 
35 static unsigned int pfkey_net_id __read_mostly;
36 struct netns_pfkey {
37 	/* List of all pfkey sockets. */
38 	struct hlist_head table;
39 	atomic_t socks_nr;
40 };
41 static DEFINE_MUTEX(pfkey_mutex);
42 
43 #define DUMMY_MARK 0
44 static const struct xfrm_mark dummy_mark = {0, 0};
45 struct pfkey_sock {
46 	/* struct sock must be the first member of struct pfkey_sock */
47 	struct sock	sk;
48 	int		registered;
49 	int		promisc;
50 
51 	struct {
52 		uint8_t		msg_version;
53 		uint32_t	msg_portid;
54 		int		(*dump)(struct pfkey_sock *sk);
55 		void		(*done)(struct pfkey_sock *sk);
56 		union {
57 			struct xfrm_policy_walk	policy;
58 			struct xfrm_state_walk	state;
59 		} u;
60 		struct sk_buff	*skb;
61 	} dump;
62 	struct mutex dump_lock;
63 };
64 
65 static int parse_sockaddr_pair(struct sockaddr *sa, int ext_len,
66 			       xfrm_address_t *saddr, xfrm_address_t *daddr,
67 			       u16 *family);
68 
69 static inline struct pfkey_sock *pfkey_sk(struct sock *sk)
70 {
71 	return (struct pfkey_sock *)sk;
72 }
73 
74 static int pfkey_can_dump(const struct sock *sk)
75 {
76 	if (3 * atomic_read(&sk->sk_rmem_alloc) <= 2 * sk->sk_rcvbuf)
77 		return 1;
78 	return 0;
79 }
80 
81 static void pfkey_terminate_dump(struct pfkey_sock *pfk)
82 {
83 	if (pfk->dump.dump) {
84 		if (pfk->dump.skb) {
85 			kfree_skb(pfk->dump.skb);
86 			pfk->dump.skb = NULL;
87 		}
88 		pfk->dump.done(pfk);
89 		pfk->dump.dump = NULL;
90 		pfk->dump.done = NULL;
91 	}
92 }
93 
94 static void pfkey_sock_destruct(struct sock *sk)
95 {
96 	struct net *net = sock_net(sk);
97 	struct netns_pfkey *net_pfkey = net_generic(net, pfkey_net_id);
98 
99 	pfkey_terminate_dump(pfkey_sk(sk));
100 	skb_queue_purge(&sk->sk_receive_queue);
101 
102 	if (!sock_flag(sk, SOCK_DEAD)) {
103 		pr_err("Attempt to release alive pfkey socket: %p\n", sk);
104 		return;
105 	}
106 
107 	WARN_ON(atomic_read(&sk->sk_rmem_alloc));
108 	WARN_ON(refcount_read(&sk->sk_wmem_alloc));
109 
110 	atomic_dec(&net_pfkey->socks_nr);
111 }
112 
113 static const struct proto_ops pfkey_ops;
114 
115 static void pfkey_insert(struct sock *sk)
116 {
117 	struct net *net = sock_net(sk);
118 	struct netns_pfkey *net_pfkey = net_generic(net, pfkey_net_id);
119 
120 	mutex_lock(&pfkey_mutex);
121 	sk_add_node_rcu(sk, &net_pfkey->table);
122 	mutex_unlock(&pfkey_mutex);
123 }
124 
125 static void pfkey_remove(struct sock *sk)
126 {
127 	mutex_lock(&pfkey_mutex);
128 	sk_del_node_init_rcu(sk);
129 	mutex_unlock(&pfkey_mutex);
130 }
131 
132 static struct proto key_proto = {
133 	.name	  = "KEY",
134 	.owner	  = THIS_MODULE,
135 	.obj_size = sizeof(struct pfkey_sock),
136 };
137 
138 static int pfkey_create(struct net *net, struct socket *sock, int protocol,
139 			int kern)
140 {
141 	struct netns_pfkey *net_pfkey = net_generic(net, pfkey_net_id);
142 	struct sock *sk;
143 	struct pfkey_sock *pfk;
144 	int err;
145 
146 	if (!ns_capable(net->user_ns, CAP_NET_ADMIN))
147 		return -EPERM;
148 	if (sock->type != SOCK_RAW)
149 		return -ESOCKTNOSUPPORT;
150 	if (protocol != PF_KEY_V2)
151 		return -EPROTONOSUPPORT;
152 
153 	err = -ENOMEM;
154 	sk = sk_alloc(net, PF_KEY, GFP_KERNEL, &key_proto, kern);
155 	if (sk == NULL)
156 		goto out;
157 
158 	pfk = pfkey_sk(sk);
159 	mutex_init(&pfk->dump_lock);
160 
161 	sock->ops = &pfkey_ops;
162 	sock_init_data(sock, sk);
163 
164 	sk->sk_family = PF_KEY;
165 	sk->sk_destruct = pfkey_sock_destruct;
166 
167 	atomic_inc(&net_pfkey->socks_nr);
168 
169 	pfkey_insert(sk);
170 
171 	return 0;
172 out:
173 	return err;
174 }
175 
176 static int pfkey_release(struct socket *sock)
177 {
178 	struct sock *sk = sock->sk;
179 
180 	if (!sk)
181 		return 0;
182 
183 	pfkey_remove(sk);
184 
185 	sock_orphan(sk);
186 	sock->sk = NULL;
187 	skb_queue_purge(&sk->sk_write_queue);
188 
189 	synchronize_rcu();
190 	sock_put(sk);
191 
192 	return 0;
193 }
194 
195 static int pfkey_broadcast_one(struct sk_buff *skb, gfp_t allocation,
196 			       struct sock *sk)
197 {
198 	int err = -ENOBUFS;
199 
200 	if (atomic_read(&sk->sk_rmem_alloc) > sk->sk_rcvbuf)
201 		return err;
202 
203 	skb = skb_clone(skb, allocation);
204 
205 	if (skb) {
206 		skb_set_owner_r(skb, sk);
207 		skb_queue_tail(&sk->sk_receive_queue, skb);
208 		sk->sk_data_ready(sk);
209 		err = 0;
210 	}
211 	return err;
212 }
213 
214 /* Send SKB to all pfkey sockets matching selected criteria.  */
215 #define BROADCAST_ALL		0
216 #define BROADCAST_ONE		1
217 #define BROADCAST_REGISTERED	2
218 #define BROADCAST_PROMISC_ONLY	4
219 static int pfkey_broadcast(struct sk_buff *skb, gfp_t allocation,
220 			   int broadcast_flags, struct sock *one_sk,
221 			   struct net *net)
222 {
223 	struct netns_pfkey *net_pfkey = net_generic(net, pfkey_net_id);
224 	struct sock *sk;
225 	int err = -ESRCH;
226 
227 	/* XXX Do we need something like netlink_overrun?  I think
228 	 * XXX PF_KEY socket apps will not mind current behavior.
229 	 */
230 	if (!skb)
231 		return -ENOMEM;
232 
233 	rcu_read_lock();
234 	sk_for_each_rcu(sk, &net_pfkey->table) {
235 		struct pfkey_sock *pfk = pfkey_sk(sk);
236 		int err2;
237 
238 		/* Yes, it means that if you are meant to receive this
239 		 * pfkey message you receive it twice as promiscuous
240 		 * socket.
241 		 */
242 		if (pfk->promisc)
243 			pfkey_broadcast_one(skb, GFP_ATOMIC, sk);
244 
245 		/* the exact target will be processed later */
246 		if (sk == one_sk)
247 			continue;
248 		if (broadcast_flags != BROADCAST_ALL) {
249 			if (broadcast_flags & BROADCAST_PROMISC_ONLY)
250 				continue;
251 			if ((broadcast_flags & BROADCAST_REGISTERED) &&
252 			    !pfk->registered)
253 				continue;
254 			if (broadcast_flags & BROADCAST_ONE)
255 				continue;
256 		}
257 
258 		err2 = pfkey_broadcast_one(skb, GFP_ATOMIC, sk);
259 
260 		/* Error is cleared after successful sending to at least one
261 		 * registered KM */
262 		if ((broadcast_flags & BROADCAST_REGISTERED) && err)
263 			err = err2;
264 	}
265 	rcu_read_unlock();
266 
267 	if (one_sk != NULL)
268 		err = pfkey_broadcast_one(skb, allocation, one_sk);
269 
270 	kfree_skb(skb);
271 	return err;
272 }
273 
274 static int pfkey_do_dump(struct pfkey_sock *pfk)
275 {
276 	struct sadb_msg *hdr;
277 	int rc;
278 
279 	mutex_lock(&pfk->dump_lock);
280 	if (!pfk->dump.dump) {
281 		rc = 0;
282 		goto out;
283 	}
284 
285 	rc = pfk->dump.dump(pfk);
286 	if (rc == -ENOBUFS) {
287 		rc = 0;
288 		goto out;
289 	}
290 
291 	if (pfk->dump.skb) {
292 		if (!pfkey_can_dump(&pfk->sk)) {
293 			rc = 0;
294 			goto out;
295 		}
296 
297 		hdr = (struct sadb_msg *) pfk->dump.skb->data;
298 		hdr->sadb_msg_seq = 0;
299 		hdr->sadb_msg_errno = rc;
300 		pfkey_broadcast(pfk->dump.skb, GFP_ATOMIC, BROADCAST_ONE,
301 				&pfk->sk, sock_net(&pfk->sk));
302 		pfk->dump.skb = NULL;
303 	}
304 
305 	pfkey_terminate_dump(pfk);
306 
307 out:
308 	mutex_unlock(&pfk->dump_lock);
309 	return rc;
310 }
311 
312 static inline void pfkey_hdr_dup(struct sadb_msg *new,
313 				 const struct sadb_msg *orig)
314 {
315 	*new = *orig;
316 }
317 
318 static int pfkey_error(const struct sadb_msg *orig, int err, struct sock *sk)
319 {
320 	struct sk_buff *skb = alloc_skb(sizeof(struct sadb_msg) + 16, GFP_KERNEL);
321 	struct sadb_msg *hdr;
322 
323 	if (!skb)
324 		return -ENOBUFS;
325 
326 	/* Woe be to the platform trying to support PFKEY yet
327 	 * having normal errnos outside the 1-255 range, inclusive.
328 	 */
329 	err = -err;
330 	if (err == ERESTARTSYS ||
331 	    err == ERESTARTNOHAND ||
332 	    err == ERESTARTNOINTR)
333 		err = EINTR;
334 	if (err >= 512)
335 		err = EINVAL;
336 	BUG_ON(err <= 0 || err >= 256);
337 
338 	hdr = skb_put(skb, sizeof(struct sadb_msg));
339 	pfkey_hdr_dup(hdr, orig);
340 	hdr->sadb_msg_errno = (uint8_t) err;
341 	hdr->sadb_msg_len = (sizeof(struct sadb_msg) /
342 			     sizeof(uint64_t));
343 
344 	pfkey_broadcast(skb, GFP_KERNEL, BROADCAST_ONE, sk, sock_net(sk));
345 
346 	return 0;
347 }
348 
349 static const u8 sadb_ext_min_len[] = {
350 	[SADB_EXT_RESERVED]		= (u8) 0,
351 	[SADB_EXT_SA]			= (u8) sizeof(struct sadb_sa),
352 	[SADB_EXT_LIFETIME_CURRENT]	= (u8) sizeof(struct sadb_lifetime),
353 	[SADB_EXT_LIFETIME_HARD]	= (u8) sizeof(struct sadb_lifetime),
354 	[SADB_EXT_LIFETIME_SOFT]	= (u8) sizeof(struct sadb_lifetime),
355 	[SADB_EXT_ADDRESS_SRC]		= (u8) sizeof(struct sadb_address),
356 	[SADB_EXT_ADDRESS_DST]		= (u8) sizeof(struct sadb_address),
357 	[SADB_EXT_ADDRESS_PROXY]	= (u8) sizeof(struct sadb_address),
358 	[SADB_EXT_KEY_AUTH]		= (u8) sizeof(struct sadb_key),
359 	[SADB_EXT_KEY_ENCRYPT]		= (u8) sizeof(struct sadb_key),
360 	[SADB_EXT_IDENTITY_SRC]		= (u8) sizeof(struct sadb_ident),
361 	[SADB_EXT_IDENTITY_DST]		= (u8) sizeof(struct sadb_ident),
362 	[SADB_EXT_SENSITIVITY]		= (u8) sizeof(struct sadb_sens),
363 	[SADB_EXT_PROPOSAL]		= (u8) sizeof(struct sadb_prop),
364 	[SADB_EXT_SUPPORTED_AUTH]	= (u8) sizeof(struct sadb_supported),
365 	[SADB_EXT_SUPPORTED_ENCRYPT]	= (u8) sizeof(struct sadb_supported),
366 	[SADB_EXT_SPIRANGE]		= (u8) sizeof(struct sadb_spirange),
367 	[SADB_X_EXT_KMPRIVATE]		= (u8) sizeof(struct sadb_x_kmprivate),
368 	[SADB_X_EXT_POLICY]		= (u8) sizeof(struct sadb_x_policy),
369 	[SADB_X_EXT_SA2]		= (u8) sizeof(struct sadb_x_sa2),
370 	[SADB_X_EXT_NAT_T_TYPE]		= (u8) sizeof(struct sadb_x_nat_t_type),
371 	[SADB_X_EXT_NAT_T_SPORT]	= (u8) sizeof(struct sadb_x_nat_t_port),
372 	[SADB_X_EXT_NAT_T_DPORT]	= (u8) sizeof(struct sadb_x_nat_t_port),
373 	[SADB_X_EXT_NAT_T_OA]		= (u8) sizeof(struct sadb_address),
374 	[SADB_X_EXT_SEC_CTX]		= (u8) sizeof(struct sadb_x_sec_ctx),
375 	[SADB_X_EXT_KMADDRESS]		= (u8) sizeof(struct sadb_x_kmaddress),
376 	[SADB_X_EXT_FILTER]		= (u8) sizeof(struct sadb_x_filter),
377 };
378 
379 /* Verify sadb_address_{len,prefixlen} against sa_family.  */
380 static int verify_address_len(const void *p)
381 {
382 	const struct sadb_address *sp = p;
383 	const struct sockaddr *addr = (const struct sockaddr *)(sp + 1);
384 	const struct sockaddr_in *sin;
385 #if IS_ENABLED(CONFIG_IPV6)
386 	const struct sockaddr_in6 *sin6;
387 #endif
388 	int len;
389 
390 	if (sp->sadb_address_len <
391 	    DIV_ROUND_UP(sizeof(*sp) + offsetofend(typeof(*addr), sa_family),
392 			 sizeof(uint64_t)))
393 		return -EINVAL;
394 
395 	switch (addr->sa_family) {
396 	case AF_INET:
397 		len = DIV_ROUND_UP(sizeof(*sp) + sizeof(*sin), sizeof(uint64_t));
398 		if (sp->sadb_address_len != len ||
399 		    sp->sadb_address_prefixlen > 32)
400 			return -EINVAL;
401 		break;
402 #if IS_ENABLED(CONFIG_IPV6)
403 	case AF_INET6:
404 		len = DIV_ROUND_UP(sizeof(*sp) + sizeof(*sin6), sizeof(uint64_t));
405 		if (sp->sadb_address_len != len ||
406 		    sp->sadb_address_prefixlen > 128)
407 			return -EINVAL;
408 		break;
409 #endif
410 	default:
411 		/* It is user using kernel to keep track of security
412 		 * associations for another protocol, such as
413 		 * OSPF/RSVP/RIPV2/MIP.  It is user's job to verify
414 		 * lengths.
415 		 *
416 		 * XXX Actually, association/policy database is not yet
417 		 * XXX able to cope with arbitrary sockaddr families.
418 		 * XXX When it can, remove this -EINVAL.  -DaveM
419 		 */
420 		return -EINVAL;
421 	}
422 
423 	return 0;
424 }
425 
426 static inline int sadb_key_len(const struct sadb_key *key)
427 {
428 	int key_bytes = DIV_ROUND_UP(key->sadb_key_bits, 8);
429 
430 	return DIV_ROUND_UP(sizeof(struct sadb_key) + key_bytes,
431 			    sizeof(uint64_t));
432 }
433 
434 static int verify_key_len(const void *p)
435 {
436 	const struct sadb_key *key = p;
437 
438 	if (sadb_key_len(key) > key->sadb_key_len)
439 		return -EINVAL;
440 
441 	return 0;
442 }
443 
444 static inline int pfkey_sec_ctx_len(const struct sadb_x_sec_ctx *sec_ctx)
445 {
446 	return DIV_ROUND_UP(sizeof(struct sadb_x_sec_ctx) +
447 			    sec_ctx->sadb_x_ctx_len,
448 			    sizeof(uint64_t));
449 }
450 
451 static inline int verify_sec_ctx_len(const void *p)
452 {
453 	const struct sadb_x_sec_ctx *sec_ctx = p;
454 	int len = sec_ctx->sadb_x_ctx_len;
455 
456 	if (len > PAGE_SIZE)
457 		return -EINVAL;
458 
459 	len = pfkey_sec_ctx_len(sec_ctx);
460 
461 	if (sec_ctx->sadb_x_sec_len != len)
462 		return -EINVAL;
463 
464 	return 0;
465 }
466 
467 static inline struct xfrm_user_sec_ctx *pfkey_sadb2xfrm_user_sec_ctx(const struct sadb_x_sec_ctx *sec_ctx,
468 								     gfp_t gfp)
469 {
470 	struct xfrm_user_sec_ctx *uctx = NULL;
471 	int ctx_size = sec_ctx->sadb_x_ctx_len;
472 
473 	uctx = kmalloc((sizeof(*uctx)+ctx_size), gfp);
474 
475 	if (!uctx)
476 		return NULL;
477 
478 	uctx->len = pfkey_sec_ctx_len(sec_ctx);
479 	uctx->exttype = sec_ctx->sadb_x_sec_exttype;
480 	uctx->ctx_doi = sec_ctx->sadb_x_ctx_doi;
481 	uctx->ctx_alg = sec_ctx->sadb_x_ctx_alg;
482 	uctx->ctx_len = sec_ctx->sadb_x_ctx_len;
483 	memcpy(uctx + 1, sec_ctx + 1,
484 	       uctx->ctx_len);
485 
486 	return uctx;
487 }
488 
489 static int present_and_same_family(const struct sadb_address *src,
490 				   const struct sadb_address *dst)
491 {
492 	const struct sockaddr *s_addr, *d_addr;
493 
494 	if (!src || !dst)
495 		return 0;
496 
497 	s_addr = (const struct sockaddr *)(src + 1);
498 	d_addr = (const struct sockaddr *)(dst + 1);
499 	if (s_addr->sa_family != d_addr->sa_family)
500 		return 0;
501 	if (s_addr->sa_family != AF_INET
502 #if IS_ENABLED(CONFIG_IPV6)
503 	    && s_addr->sa_family != AF_INET6
504 #endif
505 		)
506 		return 0;
507 
508 	return 1;
509 }
510 
511 static int parse_exthdrs(struct sk_buff *skb, const struct sadb_msg *hdr, void **ext_hdrs)
512 {
513 	const char *p = (char *) hdr;
514 	int len = skb->len;
515 
516 	len -= sizeof(*hdr);
517 	p += sizeof(*hdr);
518 	while (len > 0) {
519 		const struct sadb_ext *ehdr = (const struct sadb_ext *) p;
520 		uint16_t ext_type;
521 		int ext_len;
522 
523 		if (len < sizeof(*ehdr))
524 			return -EINVAL;
525 
526 		ext_len  = ehdr->sadb_ext_len;
527 		ext_len *= sizeof(uint64_t);
528 		ext_type = ehdr->sadb_ext_type;
529 		if (ext_len < sizeof(uint64_t) ||
530 		    ext_len > len ||
531 		    ext_type == SADB_EXT_RESERVED)
532 			return -EINVAL;
533 
534 		if (ext_type <= SADB_EXT_MAX) {
535 			int min = (int) sadb_ext_min_len[ext_type];
536 			if (ext_len < min)
537 				return -EINVAL;
538 			if (ext_hdrs[ext_type-1] != NULL)
539 				return -EINVAL;
540 			switch (ext_type) {
541 			case SADB_EXT_ADDRESS_SRC:
542 			case SADB_EXT_ADDRESS_DST:
543 			case SADB_EXT_ADDRESS_PROXY:
544 			case SADB_X_EXT_NAT_T_OA:
545 				if (verify_address_len(p))
546 					return -EINVAL;
547 				break;
548 			case SADB_X_EXT_SEC_CTX:
549 				if (verify_sec_ctx_len(p))
550 					return -EINVAL;
551 				break;
552 			case SADB_EXT_KEY_AUTH:
553 			case SADB_EXT_KEY_ENCRYPT:
554 				if (verify_key_len(p))
555 					return -EINVAL;
556 				break;
557 			default:
558 				break;
559 			}
560 			ext_hdrs[ext_type-1] = (void *) p;
561 		}
562 		p   += ext_len;
563 		len -= ext_len;
564 	}
565 
566 	return 0;
567 }
568 
569 static uint16_t
570 pfkey_satype2proto(uint8_t satype)
571 {
572 	switch (satype) {
573 	case SADB_SATYPE_UNSPEC:
574 		return IPSEC_PROTO_ANY;
575 	case SADB_SATYPE_AH:
576 		return IPPROTO_AH;
577 	case SADB_SATYPE_ESP:
578 		return IPPROTO_ESP;
579 	case SADB_X_SATYPE_IPCOMP:
580 		return IPPROTO_COMP;
581 	default:
582 		return 0;
583 	}
584 	/* NOTREACHED */
585 }
586 
587 static uint8_t
588 pfkey_proto2satype(uint16_t proto)
589 {
590 	switch (proto) {
591 	case IPPROTO_AH:
592 		return SADB_SATYPE_AH;
593 	case IPPROTO_ESP:
594 		return SADB_SATYPE_ESP;
595 	case IPPROTO_COMP:
596 		return SADB_X_SATYPE_IPCOMP;
597 	default:
598 		return 0;
599 	}
600 	/* NOTREACHED */
601 }
602 
603 /* BTW, this scheme means that there is no way with PFKEY2 sockets to
604  * say specifically 'just raw sockets' as we encode them as 255.
605  */
606 
607 static uint8_t pfkey_proto_to_xfrm(uint8_t proto)
608 {
609 	return proto == IPSEC_PROTO_ANY ? 0 : proto;
610 }
611 
612 static uint8_t pfkey_proto_from_xfrm(uint8_t proto)
613 {
614 	return proto ? proto : IPSEC_PROTO_ANY;
615 }
616 
617 static inline int pfkey_sockaddr_len(sa_family_t family)
618 {
619 	switch (family) {
620 	case AF_INET:
621 		return sizeof(struct sockaddr_in);
622 #if IS_ENABLED(CONFIG_IPV6)
623 	case AF_INET6:
624 		return sizeof(struct sockaddr_in6);
625 #endif
626 	}
627 	return 0;
628 }
629 
630 static
631 int pfkey_sockaddr_extract(const struct sockaddr *sa, xfrm_address_t *xaddr)
632 {
633 	switch (sa->sa_family) {
634 	case AF_INET:
635 		xaddr->a4 =
636 			((struct sockaddr_in *)sa)->sin_addr.s_addr;
637 		return AF_INET;
638 #if IS_ENABLED(CONFIG_IPV6)
639 	case AF_INET6:
640 		memcpy(xaddr->a6,
641 		       &((struct sockaddr_in6 *)sa)->sin6_addr,
642 		       sizeof(struct in6_addr));
643 		return AF_INET6;
644 #endif
645 	}
646 	return 0;
647 }
648 
649 static
650 int pfkey_sadb_addr2xfrm_addr(const struct sadb_address *addr, xfrm_address_t *xaddr)
651 {
652 	return pfkey_sockaddr_extract((struct sockaddr *)(addr + 1),
653 				      xaddr);
654 }
655 
656 static struct  xfrm_state *pfkey_xfrm_state_lookup(struct net *net, const struct sadb_msg *hdr, void * const *ext_hdrs)
657 {
658 	const struct sadb_sa *sa;
659 	const struct sadb_address *addr;
660 	uint16_t proto;
661 	unsigned short family;
662 	xfrm_address_t *xaddr;
663 
664 	sa = ext_hdrs[SADB_EXT_SA - 1];
665 	if (sa == NULL)
666 		return NULL;
667 
668 	proto = pfkey_satype2proto(hdr->sadb_msg_satype);
669 	if (proto == 0)
670 		return NULL;
671 
672 	/* sadb_address_len should be checked by caller */
673 	addr = ext_hdrs[SADB_EXT_ADDRESS_DST - 1];
674 	if (addr == NULL)
675 		return NULL;
676 
677 	family = ((const struct sockaddr *)(addr + 1))->sa_family;
678 	switch (family) {
679 	case AF_INET:
680 		xaddr = (xfrm_address_t *)&((const struct sockaddr_in *)(addr + 1))->sin_addr;
681 		break;
682 #if IS_ENABLED(CONFIG_IPV6)
683 	case AF_INET6:
684 		xaddr = (xfrm_address_t *)&((const struct sockaddr_in6 *)(addr + 1))->sin6_addr;
685 		break;
686 #endif
687 	default:
688 		xaddr = NULL;
689 	}
690 
691 	if (!xaddr)
692 		return NULL;
693 
694 	return xfrm_state_lookup(net, DUMMY_MARK, xaddr, sa->sadb_sa_spi, proto, family);
695 }
696 
697 #define PFKEY_ALIGN8(a) (1 + (((a) - 1) | (8 - 1)))
698 
699 static int
700 pfkey_sockaddr_size(sa_family_t family)
701 {
702 	return PFKEY_ALIGN8(pfkey_sockaddr_len(family));
703 }
704 
705 static inline int pfkey_mode_from_xfrm(int mode)
706 {
707 	switch(mode) {
708 	case XFRM_MODE_TRANSPORT:
709 		return IPSEC_MODE_TRANSPORT;
710 	case XFRM_MODE_TUNNEL:
711 		return IPSEC_MODE_TUNNEL;
712 	case XFRM_MODE_BEET:
713 		return IPSEC_MODE_BEET;
714 	default:
715 		return -1;
716 	}
717 }
718 
719 static inline int pfkey_mode_to_xfrm(int mode)
720 {
721 	switch(mode) {
722 	case IPSEC_MODE_ANY:	/*XXX*/
723 	case IPSEC_MODE_TRANSPORT:
724 		return XFRM_MODE_TRANSPORT;
725 	case IPSEC_MODE_TUNNEL:
726 		return XFRM_MODE_TUNNEL;
727 	case IPSEC_MODE_BEET:
728 		return XFRM_MODE_BEET;
729 	default:
730 		return -1;
731 	}
732 }
733 
734 static unsigned int pfkey_sockaddr_fill(const xfrm_address_t *xaddr, __be16 port,
735 					struct sockaddr *sa,
736 					unsigned short family)
737 {
738 	switch (family) {
739 	case AF_INET:
740 	    {
741 		struct sockaddr_in *sin = (struct sockaddr_in *)sa;
742 		sin->sin_family = AF_INET;
743 		sin->sin_port = port;
744 		sin->sin_addr.s_addr = xaddr->a4;
745 		memset(sin->sin_zero, 0, sizeof(sin->sin_zero));
746 		return 32;
747 	    }
748 #if IS_ENABLED(CONFIG_IPV6)
749 	case AF_INET6:
750 	    {
751 		struct sockaddr_in6 *sin6 = (struct sockaddr_in6 *)sa;
752 		sin6->sin6_family = AF_INET6;
753 		sin6->sin6_port = port;
754 		sin6->sin6_flowinfo = 0;
755 		sin6->sin6_addr = xaddr->in6;
756 		sin6->sin6_scope_id = 0;
757 		return 128;
758 	    }
759 #endif
760 	}
761 	return 0;
762 }
763 
764 static struct sk_buff *__pfkey_xfrm_state2msg(const struct xfrm_state *x,
765 					      int add_keys, int hsc)
766 {
767 	struct sk_buff *skb;
768 	struct sadb_msg *hdr;
769 	struct sadb_sa *sa;
770 	struct sadb_lifetime *lifetime;
771 	struct sadb_address *addr;
772 	struct sadb_key *key;
773 	struct sadb_x_sa2 *sa2;
774 	struct sadb_x_sec_ctx *sec_ctx;
775 	struct xfrm_sec_ctx *xfrm_ctx;
776 	int ctx_size = 0;
777 	int size;
778 	int auth_key_size = 0;
779 	int encrypt_key_size = 0;
780 	int sockaddr_size;
781 	struct xfrm_encap_tmpl *natt = NULL;
782 	int mode;
783 
784 	/* address family check */
785 	sockaddr_size = pfkey_sockaddr_size(x->props.family);
786 	if (!sockaddr_size)
787 		return ERR_PTR(-EINVAL);
788 
789 	/* base, SA, (lifetime (HSC),) address(SD), (address(P),)
790 	   key(AE), (identity(SD),) (sensitivity)> */
791 	size = sizeof(struct sadb_msg) +sizeof(struct sadb_sa) +
792 		sizeof(struct sadb_lifetime) +
793 		((hsc & 1) ? sizeof(struct sadb_lifetime) : 0) +
794 		((hsc & 2) ? sizeof(struct sadb_lifetime) : 0) +
795 			sizeof(struct sadb_address)*2 +
796 				sockaddr_size*2 +
797 					sizeof(struct sadb_x_sa2);
798 
799 	if ((xfrm_ctx = x->security)) {
800 		ctx_size = PFKEY_ALIGN8(xfrm_ctx->ctx_len);
801 		size += sizeof(struct sadb_x_sec_ctx) + ctx_size;
802 	}
803 
804 	/* identity & sensitivity */
805 	if (!xfrm_addr_equal(&x->sel.saddr, &x->props.saddr, x->props.family))
806 		size += sizeof(struct sadb_address) + sockaddr_size;
807 
808 	if (add_keys) {
809 		if (x->aalg && x->aalg->alg_key_len) {
810 			auth_key_size =
811 				PFKEY_ALIGN8((x->aalg->alg_key_len + 7) / 8);
812 			size += sizeof(struct sadb_key) + auth_key_size;
813 		}
814 		if (x->ealg && x->ealg->alg_key_len) {
815 			encrypt_key_size =
816 				PFKEY_ALIGN8((x->ealg->alg_key_len+7) / 8);
817 			size += sizeof(struct sadb_key) + encrypt_key_size;
818 		}
819 	}
820 	if (x->encap)
821 		natt = x->encap;
822 
823 	if (natt && natt->encap_type) {
824 		size += sizeof(struct sadb_x_nat_t_type);
825 		size += sizeof(struct sadb_x_nat_t_port);
826 		size += sizeof(struct sadb_x_nat_t_port);
827 	}
828 
829 	skb =  alloc_skb(size + 16, GFP_ATOMIC);
830 	if (skb == NULL)
831 		return ERR_PTR(-ENOBUFS);
832 
833 	/* call should fill header later */
834 	hdr = skb_put(skb, sizeof(struct sadb_msg));
835 	memset(hdr, 0, size);	/* XXX do we need this ? */
836 	hdr->sadb_msg_len = size / sizeof(uint64_t);
837 
838 	/* sa */
839 	sa = skb_put(skb, sizeof(struct sadb_sa));
840 	sa->sadb_sa_len = sizeof(struct sadb_sa)/sizeof(uint64_t);
841 	sa->sadb_sa_exttype = SADB_EXT_SA;
842 	sa->sadb_sa_spi = x->id.spi;
843 	sa->sadb_sa_replay = x->props.replay_window;
844 	switch (x->km.state) {
845 	case XFRM_STATE_VALID:
846 		sa->sadb_sa_state = x->km.dying ?
847 			SADB_SASTATE_DYING : SADB_SASTATE_MATURE;
848 		break;
849 	case XFRM_STATE_ACQ:
850 		sa->sadb_sa_state = SADB_SASTATE_LARVAL;
851 		break;
852 	default:
853 		sa->sadb_sa_state = SADB_SASTATE_DEAD;
854 		break;
855 	}
856 	sa->sadb_sa_auth = 0;
857 	if (x->aalg) {
858 		struct xfrm_algo_desc *a = xfrm_aalg_get_byname(x->aalg->alg_name, 0);
859 		sa->sadb_sa_auth = (a && a->pfkey_supported) ?
860 					a->desc.sadb_alg_id : 0;
861 	}
862 	sa->sadb_sa_encrypt = 0;
863 	BUG_ON(x->ealg && x->calg);
864 	if (x->ealg) {
865 		struct xfrm_algo_desc *a = xfrm_ealg_get_byname(x->ealg->alg_name, 0);
866 		sa->sadb_sa_encrypt = (a && a->pfkey_supported) ?
867 					a->desc.sadb_alg_id : 0;
868 	}
869 	/* KAME compatible: sadb_sa_encrypt is overloaded with calg id */
870 	if (x->calg) {
871 		struct xfrm_algo_desc *a = xfrm_calg_get_byname(x->calg->alg_name, 0);
872 		sa->sadb_sa_encrypt = (a && a->pfkey_supported) ?
873 					a->desc.sadb_alg_id : 0;
874 	}
875 
876 	sa->sadb_sa_flags = 0;
877 	if (x->props.flags & XFRM_STATE_NOECN)
878 		sa->sadb_sa_flags |= SADB_SAFLAGS_NOECN;
879 	if (x->props.flags & XFRM_STATE_DECAP_DSCP)
880 		sa->sadb_sa_flags |= SADB_SAFLAGS_DECAP_DSCP;
881 	if (x->props.flags & XFRM_STATE_NOPMTUDISC)
882 		sa->sadb_sa_flags |= SADB_SAFLAGS_NOPMTUDISC;
883 
884 	/* hard time */
885 	if (hsc & 2) {
886 		lifetime = skb_put(skb, sizeof(struct sadb_lifetime));
887 		lifetime->sadb_lifetime_len =
888 			sizeof(struct sadb_lifetime)/sizeof(uint64_t);
889 		lifetime->sadb_lifetime_exttype = SADB_EXT_LIFETIME_HARD;
890 		lifetime->sadb_lifetime_allocations =  _X2KEY(x->lft.hard_packet_limit);
891 		lifetime->sadb_lifetime_bytes = _X2KEY(x->lft.hard_byte_limit);
892 		lifetime->sadb_lifetime_addtime = x->lft.hard_add_expires_seconds;
893 		lifetime->sadb_lifetime_usetime = x->lft.hard_use_expires_seconds;
894 	}
895 	/* soft time */
896 	if (hsc & 1) {
897 		lifetime = skb_put(skb, sizeof(struct sadb_lifetime));
898 		lifetime->sadb_lifetime_len =
899 			sizeof(struct sadb_lifetime)/sizeof(uint64_t);
900 		lifetime->sadb_lifetime_exttype = SADB_EXT_LIFETIME_SOFT;
901 		lifetime->sadb_lifetime_allocations =  _X2KEY(x->lft.soft_packet_limit);
902 		lifetime->sadb_lifetime_bytes = _X2KEY(x->lft.soft_byte_limit);
903 		lifetime->sadb_lifetime_addtime = x->lft.soft_add_expires_seconds;
904 		lifetime->sadb_lifetime_usetime = x->lft.soft_use_expires_seconds;
905 	}
906 	/* current time */
907 	lifetime = skb_put(skb, sizeof(struct sadb_lifetime));
908 	lifetime->sadb_lifetime_len =
909 		sizeof(struct sadb_lifetime)/sizeof(uint64_t);
910 	lifetime->sadb_lifetime_exttype = SADB_EXT_LIFETIME_CURRENT;
911 	lifetime->sadb_lifetime_allocations = x->curlft.packets;
912 	lifetime->sadb_lifetime_bytes = x->curlft.bytes;
913 	lifetime->sadb_lifetime_addtime = x->curlft.add_time;
914 	lifetime->sadb_lifetime_usetime = x->curlft.use_time;
915 	/* src address */
916 	addr = skb_put(skb, sizeof(struct sadb_address) + sockaddr_size);
917 	addr->sadb_address_len =
918 		(sizeof(struct sadb_address)+sockaddr_size)/
919 			sizeof(uint64_t);
920 	addr->sadb_address_exttype = SADB_EXT_ADDRESS_SRC;
921 	/* "if the ports are non-zero, then the sadb_address_proto field,
922 	   normally zero, MUST be filled in with the transport
923 	   protocol's number." - RFC2367 */
924 	addr->sadb_address_proto = 0;
925 	addr->sadb_address_reserved = 0;
926 
927 	addr->sadb_address_prefixlen =
928 		pfkey_sockaddr_fill(&x->props.saddr, 0,
929 				    (struct sockaddr *) (addr + 1),
930 				    x->props.family);
931 	BUG_ON(!addr->sadb_address_prefixlen);
932 
933 	/* dst address */
934 	addr = skb_put(skb, sizeof(struct sadb_address) + sockaddr_size);
935 	addr->sadb_address_len =
936 		(sizeof(struct sadb_address)+sockaddr_size)/
937 			sizeof(uint64_t);
938 	addr->sadb_address_exttype = SADB_EXT_ADDRESS_DST;
939 	addr->sadb_address_proto = 0;
940 	addr->sadb_address_reserved = 0;
941 
942 	addr->sadb_address_prefixlen =
943 		pfkey_sockaddr_fill(&x->id.daddr, 0,
944 				    (struct sockaddr *) (addr + 1),
945 				    x->props.family);
946 	BUG_ON(!addr->sadb_address_prefixlen);
947 
948 	if (!xfrm_addr_equal(&x->sel.saddr, &x->props.saddr,
949 			     x->props.family)) {
950 		addr = skb_put(skb,
951 			       sizeof(struct sadb_address) + sockaddr_size);
952 		addr->sadb_address_len =
953 			(sizeof(struct sadb_address)+sockaddr_size)/
954 			sizeof(uint64_t);
955 		addr->sadb_address_exttype = SADB_EXT_ADDRESS_PROXY;
956 		addr->sadb_address_proto =
957 			pfkey_proto_from_xfrm(x->sel.proto);
958 		addr->sadb_address_prefixlen = x->sel.prefixlen_s;
959 		addr->sadb_address_reserved = 0;
960 
961 		pfkey_sockaddr_fill(&x->sel.saddr, x->sel.sport,
962 				    (struct sockaddr *) (addr + 1),
963 				    x->props.family);
964 	}
965 
966 	/* auth key */
967 	if (add_keys && auth_key_size) {
968 		key = skb_put(skb, sizeof(struct sadb_key) + auth_key_size);
969 		key->sadb_key_len = (sizeof(struct sadb_key) + auth_key_size) /
970 			sizeof(uint64_t);
971 		key->sadb_key_exttype = SADB_EXT_KEY_AUTH;
972 		key->sadb_key_bits = x->aalg->alg_key_len;
973 		key->sadb_key_reserved = 0;
974 		memcpy(key + 1, x->aalg->alg_key, (x->aalg->alg_key_len+7)/8);
975 	}
976 	/* encrypt key */
977 	if (add_keys && encrypt_key_size) {
978 		key = skb_put(skb, sizeof(struct sadb_key) + encrypt_key_size);
979 		key->sadb_key_len = (sizeof(struct sadb_key) +
980 				     encrypt_key_size) / sizeof(uint64_t);
981 		key->sadb_key_exttype = SADB_EXT_KEY_ENCRYPT;
982 		key->sadb_key_bits = x->ealg->alg_key_len;
983 		key->sadb_key_reserved = 0;
984 		memcpy(key + 1, x->ealg->alg_key,
985 		       (x->ealg->alg_key_len+7)/8);
986 	}
987 
988 	/* sa */
989 	sa2 = skb_put(skb, sizeof(struct sadb_x_sa2));
990 	sa2->sadb_x_sa2_len = sizeof(struct sadb_x_sa2)/sizeof(uint64_t);
991 	sa2->sadb_x_sa2_exttype = SADB_X_EXT_SA2;
992 	if ((mode = pfkey_mode_from_xfrm(x->props.mode)) < 0) {
993 		kfree_skb(skb);
994 		return ERR_PTR(-EINVAL);
995 	}
996 	sa2->sadb_x_sa2_mode = mode;
997 	sa2->sadb_x_sa2_reserved1 = 0;
998 	sa2->sadb_x_sa2_reserved2 = 0;
999 	sa2->sadb_x_sa2_sequence = 0;
1000 	sa2->sadb_x_sa2_reqid = x->props.reqid;
1001 
1002 	if (natt && natt->encap_type) {
1003 		struct sadb_x_nat_t_type *n_type;
1004 		struct sadb_x_nat_t_port *n_port;
1005 
1006 		/* type */
1007 		n_type = skb_put(skb, sizeof(*n_type));
1008 		n_type->sadb_x_nat_t_type_len = sizeof(*n_type)/sizeof(uint64_t);
1009 		n_type->sadb_x_nat_t_type_exttype = SADB_X_EXT_NAT_T_TYPE;
1010 		n_type->sadb_x_nat_t_type_type = natt->encap_type;
1011 		n_type->sadb_x_nat_t_type_reserved[0] = 0;
1012 		n_type->sadb_x_nat_t_type_reserved[1] = 0;
1013 		n_type->sadb_x_nat_t_type_reserved[2] = 0;
1014 
1015 		/* source port */
1016 		n_port = skb_put(skb, sizeof(*n_port));
1017 		n_port->sadb_x_nat_t_port_len = sizeof(*n_port)/sizeof(uint64_t);
1018 		n_port->sadb_x_nat_t_port_exttype = SADB_X_EXT_NAT_T_SPORT;
1019 		n_port->sadb_x_nat_t_port_port = natt->encap_sport;
1020 		n_port->sadb_x_nat_t_port_reserved = 0;
1021 
1022 		/* dest port */
1023 		n_port = skb_put(skb, sizeof(*n_port));
1024 		n_port->sadb_x_nat_t_port_len = sizeof(*n_port)/sizeof(uint64_t);
1025 		n_port->sadb_x_nat_t_port_exttype = SADB_X_EXT_NAT_T_DPORT;
1026 		n_port->sadb_x_nat_t_port_port = natt->encap_dport;
1027 		n_port->sadb_x_nat_t_port_reserved = 0;
1028 	}
1029 
1030 	/* security context */
1031 	if (xfrm_ctx) {
1032 		sec_ctx = skb_put(skb,
1033 				  sizeof(struct sadb_x_sec_ctx) + ctx_size);
1034 		sec_ctx->sadb_x_sec_len =
1035 		  (sizeof(struct sadb_x_sec_ctx) + ctx_size) / sizeof(uint64_t);
1036 		sec_ctx->sadb_x_sec_exttype = SADB_X_EXT_SEC_CTX;
1037 		sec_ctx->sadb_x_ctx_doi = xfrm_ctx->ctx_doi;
1038 		sec_ctx->sadb_x_ctx_alg = xfrm_ctx->ctx_alg;
1039 		sec_ctx->sadb_x_ctx_len = xfrm_ctx->ctx_len;
1040 		memcpy(sec_ctx + 1, xfrm_ctx->ctx_str,
1041 		       xfrm_ctx->ctx_len);
1042 	}
1043 
1044 	return skb;
1045 }
1046 
1047 
1048 static inline struct sk_buff *pfkey_xfrm_state2msg(const struct xfrm_state *x)
1049 {
1050 	struct sk_buff *skb;
1051 
1052 	skb = __pfkey_xfrm_state2msg(x, 1, 3);
1053 
1054 	return skb;
1055 }
1056 
1057 static inline struct sk_buff *pfkey_xfrm_state2msg_expire(const struct xfrm_state *x,
1058 							  int hsc)
1059 {
1060 	return __pfkey_xfrm_state2msg(x, 0, hsc);
1061 }
1062 
1063 static struct xfrm_state * pfkey_msg2xfrm_state(struct net *net,
1064 						const struct sadb_msg *hdr,
1065 						void * const *ext_hdrs)
1066 {
1067 	struct xfrm_state *x;
1068 	const struct sadb_lifetime *lifetime;
1069 	const struct sadb_sa *sa;
1070 	const struct sadb_key *key;
1071 	const struct sadb_x_sec_ctx *sec_ctx;
1072 	uint16_t proto;
1073 	int err;
1074 
1075 
1076 	sa = ext_hdrs[SADB_EXT_SA - 1];
1077 	if (!sa ||
1078 	    !present_and_same_family(ext_hdrs[SADB_EXT_ADDRESS_SRC-1],
1079 				     ext_hdrs[SADB_EXT_ADDRESS_DST-1]))
1080 		return ERR_PTR(-EINVAL);
1081 	if (hdr->sadb_msg_satype == SADB_SATYPE_ESP &&
1082 	    !ext_hdrs[SADB_EXT_KEY_ENCRYPT-1])
1083 		return ERR_PTR(-EINVAL);
1084 	if (hdr->sadb_msg_satype == SADB_SATYPE_AH &&
1085 	    !ext_hdrs[SADB_EXT_KEY_AUTH-1])
1086 		return ERR_PTR(-EINVAL);
1087 	if (!!ext_hdrs[SADB_EXT_LIFETIME_HARD-1] !=
1088 	    !!ext_hdrs[SADB_EXT_LIFETIME_SOFT-1])
1089 		return ERR_PTR(-EINVAL);
1090 
1091 	proto = pfkey_satype2proto(hdr->sadb_msg_satype);
1092 	if (proto == 0)
1093 		return ERR_PTR(-EINVAL);
1094 
1095 	/* default error is no buffer space */
1096 	err = -ENOBUFS;
1097 
1098 	/* RFC2367:
1099 
1100    Only SADB_SASTATE_MATURE SAs may be submitted in an SADB_ADD message.
1101    SADB_SASTATE_LARVAL SAs are created by SADB_GETSPI and it is not
1102    sensible to add a new SA in the DYING or SADB_SASTATE_DEAD state.
1103    Therefore, the sadb_sa_state field of all submitted SAs MUST be
1104    SADB_SASTATE_MATURE and the kernel MUST return an error if this is
1105    not true.
1106 
1107 	   However, KAME setkey always uses SADB_SASTATE_LARVAL.
1108 	   Hence, we have to _ignore_ sadb_sa_state, which is also reasonable.
1109 	 */
1110 	if (sa->sadb_sa_auth > SADB_AALG_MAX ||
1111 	    (hdr->sadb_msg_satype == SADB_X_SATYPE_IPCOMP &&
1112 	     sa->sadb_sa_encrypt > SADB_X_CALG_MAX) ||
1113 	    sa->sadb_sa_encrypt > SADB_EALG_MAX)
1114 		return ERR_PTR(-EINVAL);
1115 	key = ext_hdrs[SADB_EXT_KEY_AUTH - 1];
1116 	if (key != NULL &&
1117 	    sa->sadb_sa_auth != SADB_X_AALG_NULL &&
1118 	    key->sadb_key_bits == 0)
1119 		return ERR_PTR(-EINVAL);
1120 	key = ext_hdrs[SADB_EXT_KEY_ENCRYPT-1];
1121 	if (key != NULL &&
1122 	    sa->sadb_sa_encrypt != SADB_EALG_NULL &&
1123 	    key->sadb_key_bits == 0)
1124 		return ERR_PTR(-EINVAL);
1125 
1126 	x = xfrm_state_alloc(net);
1127 	if (x == NULL)
1128 		return ERR_PTR(-ENOBUFS);
1129 
1130 	x->id.proto = proto;
1131 	x->id.spi = sa->sadb_sa_spi;
1132 	x->props.replay_window = min_t(unsigned int, sa->sadb_sa_replay,
1133 					(sizeof(x->replay.bitmap) * 8));
1134 	if (sa->sadb_sa_flags & SADB_SAFLAGS_NOECN)
1135 		x->props.flags |= XFRM_STATE_NOECN;
1136 	if (sa->sadb_sa_flags & SADB_SAFLAGS_DECAP_DSCP)
1137 		x->props.flags |= XFRM_STATE_DECAP_DSCP;
1138 	if (sa->sadb_sa_flags & SADB_SAFLAGS_NOPMTUDISC)
1139 		x->props.flags |= XFRM_STATE_NOPMTUDISC;
1140 
1141 	lifetime = ext_hdrs[SADB_EXT_LIFETIME_HARD - 1];
1142 	if (lifetime != NULL) {
1143 		x->lft.hard_packet_limit = _KEY2X(lifetime->sadb_lifetime_allocations);
1144 		x->lft.hard_byte_limit = _KEY2X(lifetime->sadb_lifetime_bytes);
1145 		x->lft.hard_add_expires_seconds = lifetime->sadb_lifetime_addtime;
1146 		x->lft.hard_use_expires_seconds = lifetime->sadb_lifetime_usetime;
1147 	}
1148 	lifetime = ext_hdrs[SADB_EXT_LIFETIME_SOFT - 1];
1149 	if (lifetime != NULL) {
1150 		x->lft.soft_packet_limit = _KEY2X(lifetime->sadb_lifetime_allocations);
1151 		x->lft.soft_byte_limit = _KEY2X(lifetime->sadb_lifetime_bytes);
1152 		x->lft.soft_add_expires_seconds = lifetime->sadb_lifetime_addtime;
1153 		x->lft.soft_use_expires_seconds = lifetime->sadb_lifetime_usetime;
1154 	}
1155 
1156 	sec_ctx = ext_hdrs[SADB_X_EXT_SEC_CTX - 1];
1157 	if (sec_ctx != NULL) {
1158 		struct xfrm_user_sec_ctx *uctx = pfkey_sadb2xfrm_user_sec_ctx(sec_ctx, GFP_KERNEL);
1159 
1160 		if (!uctx)
1161 			goto out;
1162 
1163 		err = security_xfrm_state_alloc(x, uctx);
1164 		kfree(uctx);
1165 
1166 		if (err)
1167 			goto out;
1168 	}
1169 
1170 	err = -ENOBUFS;
1171 	key = ext_hdrs[SADB_EXT_KEY_AUTH - 1];
1172 	if (sa->sadb_sa_auth) {
1173 		int keysize = 0;
1174 		struct xfrm_algo_desc *a = xfrm_aalg_get_byid(sa->sadb_sa_auth);
1175 		if (!a || !a->pfkey_supported) {
1176 			err = -ENOSYS;
1177 			goto out;
1178 		}
1179 		if (key)
1180 			keysize = (key->sadb_key_bits + 7) / 8;
1181 		x->aalg = kmalloc(sizeof(*x->aalg) + keysize, GFP_KERNEL);
1182 		if (!x->aalg) {
1183 			err = -ENOMEM;
1184 			goto out;
1185 		}
1186 		strcpy(x->aalg->alg_name, a->name);
1187 		x->aalg->alg_key_len = 0;
1188 		if (key) {
1189 			x->aalg->alg_key_len = key->sadb_key_bits;
1190 			memcpy(x->aalg->alg_key, key+1, keysize);
1191 		}
1192 		x->aalg->alg_trunc_len = a->uinfo.auth.icv_truncbits;
1193 		x->props.aalgo = sa->sadb_sa_auth;
1194 		/* x->algo.flags = sa->sadb_sa_flags; */
1195 	}
1196 	if (sa->sadb_sa_encrypt) {
1197 		if (hdr->sadb_msg_satype == SADB_X_SATYPE_IPCOMP) {
1198 			struct xfrm_algo_desc *a = xfrm_calg_get_byid(sa->sadb_sa_encrypt);
1199 			if (!a || !a->pfkey_supported) {
1200 				err = -ENOSYS;
1201 				goto out;
1202 			}
1203 			x->calg = kmalloc(sizeof(*x->calg), GFP_KERNEL);
1204 			if (!x->calg) {
1205 				err = -ENOMEM;
1206 				goto out;
1207 			}
1208 			strcpy(x->calg->alg_name, a->name);
1209 			x->props.calgo = sa->sadb_sa_encrypt;
1210 		} else {
1211 			int keysize = 0;
1212 			struct xfrm_algo_desc *a = xfrm_ealg_get_byid(sa->sadb_sa_encrypt);
1213 			if (!a || !a->pfkey_supported) {
1214 				err = -ENOSYS;
1215 				goto out;
1216 			}
1217 			key = (struct sadb_key*) ext_hdrs[SADB_EXT_KEY_ENCRYPT-1];
1218 			if (key)
1219 				keysize = (key->sadb_key_bits + 7) / 8;
1220 			x->ealg = kmalloc(sizeof(*x->ealg) + keysize, GFP_KERNEL);
1221 			if (!x->ealg) {
1222 				err = -ENOMEM;
1223 				goto out;
1224 			}
1225 			strcpy(x->ealg->alg_name, a->name);
1226 			x->ealg->alg_key_len = 0;
1227 			if (key) {
1228 				x->ealg->alg_key_len = key->sadb_key_bits;
1229 				memcpy(x->ealg->alg_key, key+1, keysize);
1230 			}
1231 			x->props.ealgo = sa->sadb_sa_encrypt;
1232 			x->geniv = a->uinfo.encr.geniv;
1233 		}
1234 	}
1235 	/* x->algo.flags = sa->sadb_sa_flags; */
1236 
1237 	x->props.family = pfkey_sadb_addr2xfrm_addr((struct sadb_address *) ext_hdrs[SADB_EXT_ADDRESS_SRC-1],
1238 						    &x->props.saddr);
1239 	pfkey_sadb_addr2xfrm_addr((struct sadb_address *) ext_hdrs[SADB_EXT_ADDRESS_DST-1],
1240 				  &x->id.daddr);
1241 
1242 	if (ext_hdrs[SADB_X_EXT_SA2-1]) {
1243 		const struct sadb_x_sa2 *sa2 = ext_hdrs[SADB_X_EXT_SA2-1];
1244 		int mode = pfkey_mode_to_xfrm(sa2->sadb_x_sa2_mode);
1245 		if (mode < 0) {
1246 			err = -EINVAL;
1247 			goto out;
1248 		}
1249 		x->props.mode = mode;
1250 		x->props.reqid = sa2->sadb_x_sa2_reqid;
1251 	}
1252 
1253 	if (ext_hdrs[SADB_EXT_ADDRESS_PROXY-1]) {
1254 		const struct sadb_address *addr = ext_hdrs[SADB_EXT_ADDRESS_PROXY-1];
1255 
1256 		/* Nobody uses this, but we try. */
1257 		x->sel.family = pfkey_sadb_addr2xfrm_addr(addr, &x->sel.saddr);
1258 		x->sel.prefixlen_s = addr->sadb_address_prefixlen;
1259 	}
1260 
1261 	if (!x->sel.family)
1262 		x->sel.family = x->props.family;
1263 
1264 	if (ext_hdrs[SADB_X_EXT_NAT_T_TYPE-1]) {
1265 		const struct sadb_x_nat_t_type* n_type;
1266 		struct xfrm_encap_tmpl *natt;
1267 
1268 		x->encap = kmalloc(sizeof(*x->encap), GFP_KERNEL);
1269 		if (!x->encap) {
1270 			err = -ENOMEM;
1271 			goto out;
1272 		}
1273 
1274 		natt = x->encap;
1275 		n_type = ext_hdrs[SADB_X_EXT_NAT_T_TYPE-1];
1276 		natt->encap_type = n_type->sadb_x_nat_t_type_type;
1277 
1278 		if (ext_hdrs[SADB_X_EXT_NAT_T_SPORT-1]) {
1279 			const struct sadb_x_nat_t_port *n_port =
1280 				ext_hdrs[SADB_X_EXT_NAT_T_SPORT-1];
1281 			natt->encap_sport = n_port->sadb_x_nat_t_port_port;
1282 		}
1283 		if (ext_hdrs[SADB_X_EXT_NAT_T_DPORT-1]) {
1284 			const struct sadb_x_nat_t_port *n_port =
1285 				ext_hdrs[SADB_X_EXT_NAT_T_DPORT-1];
1286 			natt->encap_dport = n_port->sadb_x_nat_t_port_port;
1287 		}
1288 		memset(&natt->encap_oa, 0, sizeof(natt->encap_oa));
1289 	}
1290 
1291 	err = xfrm_init_state(x);
1292 	if (err)
1293 		goto out;
1294 
1295 	x->km.seq = hdr->sadb_msg_seq;
1296 	return x;
1297 
1298 out:
1299 	x->km.state = XFRM_STATE_DEAD;
1300 	xfrm_state_put(x);
1301 	return ERR_PTR(err);
1302 }
1303 
1304 static int pfkey_reserved(struct sock *sk, struct sk_buff *skb, const struct sadb_msg *hdr, void * const *ext_hdrs)
1305 {
1306 	return -EOPNOTSUPP;
1307 }
1308 
1309 static int pfkey_getspi(struct sock *sk, struct sk_buff *skb, const struct sadb_msg *hdr, void * const *ext_hdrs)
1310 {
1311 	struct net *net = sock_net(sk);
1312 	struct sk_buff *resp_skb;
1313 	struct sadb_x_sa2 *sa2;
1314 	struct sadb_address *saddr, *daddr;
1315 	struct sadb_msg *out_hdr;
1316 	struct sadb_spirange *range;
1317 	struct xfrm_state *x = NULL;
1318 	int mode;
1319 	int err;
1320 	u32 min_spi, max_spi;
1321 	u32 reqid;
1322 	u8 proto;
1323 	unsigned short family;
1324 	xfrm_address_t *xsaddr = NULL, *xdaddr = NULL;
1325 
1326 	if (!present_and_same_family(ext_hdrs[SADB_EXT_ADDRESS_SRC-1],
1327 				     ext_hdrs[SADB_EXT_ADDRESS_DST-1]))
1328 		return -EINVAL;
1329 
1330 	proto = pfkey_satype2proto(hdr->sadb_msg_satype);
1331 	if (proto == 0)
1332 		return -EINVAL;
1333 
1334 	if ((sa2 = ext_hdrs[SADB_X_EXT_SA2-1]) != NULL) {
1335 		mode = pfkey_mode_to_xfrm(sa2->sadb_x_sa2_mode);
1336 		if (mode < 0)
1337 			return -EINVAL;
1338 		reqid = sa2->sadb_x_sa2_reqid;
1339 	} else {
1340 		mode = 0;
1341 		reqid = 0;
1342 	}
1343 
1344 	saddr = ext_hdrs[SADB_EXT_ADDRESS_SRC-1];
1345 	daddr = ext_hdrs[SADB_EXT_ADDRESS_DST-1];
1346 
1347 	family = ((struct sockaddr *)(saddr + 1))->sa_family;
1348 	switch (family) {
1349 	case AF_INET:
1350 		xdaddr = (xfrm_address_t *)&((struct sockaddr_in *)(daddr + 1))->sin_addr.s_addr;
1351 		xsaddr = (xfrm_address_t *)&((struct sockaddr_in *)(saddr + 1))->sin_addr.s_addr;
1352 		break;
1353 #if IS_ENABLED(CONFIG_IPV6)
1354 	case AF_INET6:
1355 		xdaddr = (xfrm_address_t *)&((struct sockaddr_in6 *)(daddr + 1))->sin6_addr;
1356 		xsaddr = (xfrm_address_t *)&((struct sockaddr_in6 *)(saddr + 1))->sin6_addr;
1357 		break;
1358 #endif
1359 	}
1360 
1361 	if (hdr->sadb_msg_seq) {
1362 		x = xfrm_find_acq_byseq(net, DUMMY_MARK, hdr->sadb_msg_seq);
1363 		if (x && !xfrm_addr_equal(&x->id.daddr, xdaddr, family)) {
1364 			xfrm_state_put(x);
1365 			x = NULL;
1366 		}
1367 	}
1368 
1369 	if (!x)
1370 		x = xfrm_find_acq(net, &dummy_mark, mode, reqid, 0, proto, xdaddr, xsaddr, 1, family);
1371 
1372 	if (x == NULL)
1373 		return -ENOENT;
1374 
1375 	min_spi = 0x100;
1376 	max_spi = 0x0fffffff;
1377 
1378 	range = ext_hdrs[SADB_EXT_SPIRANGE-1];
1379 	if (range) {
1380 		min_spi = range->sadb_spirange_min;
1381 		max_spi = range->sadb_spirange_max;
1382 	}
1383 
1384 	err = verify_spi_info(x->id.proto, min_spi, max_spi);
1385 	if (err) {
1386 		xfrm_state_put(x);
1387 		return err;
1388 	}
1389 
1390 	err = xfrm_alloc_spi(x, min_spi, max_spi);
1391 	resp_skb = err ? ERR_PTR(err) : pfkey_xfrm_state2msg(x);
1392 
1393 	if (IS_ERR(resp_skb)) {
1394 		xfrm_state_put(x);
1395 		return  PTR_ERR(resp_skb);
1396 	}
1397 
1398 	out_hdr = (struct sadb_msg *) resp_skb->data;
1399 	out_hdr->sadb_msg_version = hdr->sadb_msg_version;
1400 	out_hdr->sadb_msg_type = SADB_GETSPI;
1401 	out_hdr->sadb_msg_satype = pfkey_proto2satype(proto);
1402 	out_hdr->sadb_msg_errno = 0;
1403 	out_hdr->sadb_msg_reserved = 0;
1404 	out_hdr->sadb_msg_seq = hdr->sadb_msg_seq;
1405 	out_hdr->sadb_msg_pid = hdr->sadb_msg_pid;
1406 
1407 	xfrm_state_put(x);
1408 
1409 	pfkey_broadcast(resp_skb, GFP_KERNEL, BROADCAST_ONE, sk, net);
1410 
1411 	return 0;
1412 }
1413 
1414 static int pfkey_acquire(struct sock *sk, struct sk_buff *skb, const struct sadb_msg *hdr, void * const *ext_hdrs)
1415 {
1416 	struct net *net = sock_net(sk);
1417 	struct xfrm_state *x;
1418 
1419 	if (hdr->sadb_msg_len != sizeof(struct sadb_msg)/8)
1420 		return -EOPNOTSUPP;
1421 
1422 	if (hdr->sadb_msg_seq == 0 || hdr->sadb_msg_errno == 0)
1423 		return 0;
1424 
1425 	x = xfrm_find_acq_byseq(net, DUMMY_MARK, hdr->sadb_msg_seq);
1426 	if (x == NULL)
1427 		return 0;
1428 
1429 	spin_lock_bh(&x->lock);
1430 	if (x->km.state == XFRM_STATE_ACQ)
1431 		x->km.state = XFRM_STATE_ERROR;
1432 
1433 	spin_unlock_bh(&x->lock);
1434 	xfrm_state_put(x);
1435 	return 0;
1436 }
1437 
1438 static inline int event2poltype(int event)
1439 {
1440 	switch (event) {
1441 	case XFRM_MSG_DELPOLICY:
1442 		return SADB_X_SPDDELETE;
1443 	case XFRM_MSG_NEWPOLICY:
1444 		return SADB_X_SPDADD;
1445 	case XFRM_MSG_UPDPOLICY:
1446 		return SADB_X_SPDUPDATE;
1447 	case XFRM_MSG_POLEXPIRE:
1448 	//	return SADB_X_SPDEXPIRE;
1449 	default:
1450 		pr_err("pfkey: Unknown policy event %d\n", event);
1451 		break;
1452 	}
1453 
1454 	return 0;
1455 }
1456 
1457 static inline int event2keytype(int event)
1458 {
1459 	switch (event) {
1460 	case XFRM_MSG_DELSA:
1461 		return SADB_DELETE;
1462 	case XFRM_MSG_NEWSA:
1463 		return SADB_ADD;
1464 	case XFRM_MSG_UPDSA:
1465 		return SADB_UPDATE;
1466 	case XFRM_MSG_EXPIRE:
1467 		return SADB_EXPIRE;
1468 	default:
1469 		pr_err("pfkey: Unknown SA event %d\n", event);
1470 		break;
1471 	}
1472 
1473 	return 0;
1474 }
1475 
1476 /* ADD/UPD/DEL */
1477 static int key_notify_sa(struct xfrm_state *x, const struct km_event *c)
1478 {
1479 	struct sk_buff *skb;
1480 	struct sadb_msg *hdr;
1481 
1482 	skb = pfkey_xfrm_state2msg(x);
1483 
1484 	if (IS_ERR(skb))
1485 		return PTR_ERR(skb);
1486 
1487 	hdr = (struct sadb_msg *) skb->data;
1488 	hdr->sadb_msg_version = PF_KEY_V2;
1489 	hdr->sadb_msg_type = event2keytype(c->event);
1490 	hdr->sadb_msg_satype = pfkey_proto2satype(x->id.proto);
1491 	hdr->sadb_msg_errno = 0;
1492 	hdr->sadb_msg_reserved = 0;
1493 	hdr->sadb_msg_seq = c->seq;
1494 	hdr->sadb_msg_pid = c->portid;
1495 
1496 	pfkey_broadcast(skb, GFP_ATOMIC, BROADCAST_ALL, NULL, xs_net(x));
1497 
1498 	return 0;
1499 }
1500 
1501 static int pfkey_add(struct sock *sk, struct sk_buff *skb, const struct sadb_msg *hdr, void * const *ext_hdrs)
1502 {
1503 	struct net *net = sock_net(sk);
1504 	struct xfrm_state *x;
1505 	int err;
1506 	struct km_event c;
1507 
1508 	x = pfkey_msg2xfrm_state(net, hdr, ext_hdrs);
1509 	if (IS_ERR(x))
1510 		return PTR_ERR(x);
1511 
1512 	xfrm_state_hold(x);
1513 	if (hdr->sadb_msg_type == SADB_ADD)
1514 		err = xfrm_state_add(x);
1515 	else
1516 		err = xfrm_state_update(x);
1517 
1518 	xfrm_audit_state_add(x, err ? 0 : 1, true);
1519 
1520 	if (err < 0) {
1521 		x->km.state = XFRM_STATE_DEAD;
1522 		__xfrm_state_put(x);
1523 		goto out;
1524 	}
1525 
1526 	if (hdr->sadb_msg_type == SADB_ADD)
1527 		c.event = XFRM_MSG_NEWSA;
1528 	else
1529 		c.event = XFRM_MSG_UPDSA;
1530 	c.seq = hdr->sadb_msg_seq;
1531 	c.portid = hdr->sadb_msg_pid;
1532 	km_state_notify(x, &c);
1533 out:
1534 	xfrm_state_put(x);
1535 	return err;
1536 }
1537 
1538 static int pfkey_delete(struct sock *sk, struct sk_buff *skb, const struct sadb_msg *hdr, void * const *ext_hdrs)
1539 {
1540 	struct net *net = sock_net(sk);
1541 	struct xfrm_state *x;
1542 	struct km_event c;
1543 	int err;
1544 
1545 	if (!ext_hdrs[SADB_EXT_SA-1] ||
1546 	    !present_and_same_family(ext_hdrs[SADB_EXT_ADDRESS_SRC-1],
1547 				     ext_hdrs[SADB_EXT_ADDRESS_DST-1]))
1548 		return -EINVAL;
1549 
1550 	x = pfkey_xfrm_state_lookup(net, hdr, ext_hdrs);
1551 	if (x == NULL)
1552 		return -ESRCH;
1553 
1554 	if ((err = security_xfrm_state_delete(x)))
1555 		goto out;
1556 
1557 	if (xfrm_state_kern(x)) {
1558 		err = -EPERM;
1559 		goto out;
1560 	}
1561 
1562 	err = xfrm_state_delete(x);
1563 
1564 	if (err < 0)
1565 		goto out;
1566 
1567 	c.seq = hdr->sadb_msg_seq;
1568 	c.portid = hdr->sadb_msg_pid;
1569 	c.event = XFRM_MSG_DELSA;
1570 	km_state_notify(x, &c);
1571 out:
1572 	xfrm_audit_state_delete(x, err ? 0 : 1, true);
1573 	xfrm_state_put(x);
1574 
1575 	return err;
1576 }
1577 
1578 static int pfkey_get(struct sock *sk, struct sk_buff *skb, const struct sadb_msg *hdr, void * const *ext_hdrs)
1579 {
1580 	struct net *net = sock_net(sk);
1581 	__u8 proto;
1582 	struct sk_buff *out_skb;
1583 	struct sadb_msg *out_hdr;
1584 	struct xfrm_state *x;
1585 
1586 	if (!ext_hdrs[SADB_EXT_SA-1] ||
1587 	    !present_and_same_family(ext_hdrs[SADB_EXT_ADDRESS_SRC-1],
1588 				     ext_hdrs[SADB_EXT_ADDRESS_DST-1]))
1589 		return -EINVAL;
1590 
1591 	x = pfkey_xfrm_state_lookup(net, hdr, ext_hdrs);
1592 	if (x == NULL)
1593 		return -ESRCH;
1594 
1595 	out_skb = pfkey_xfrm_state2msg(x);
1596 	proto = x->id.proto;
1597 	xfrm_state_put(x);
1598 	if (IS_ERR(out_skb))
1599 		return  PTR_ERR(out_skb);
1600 
1601 	out_hdr = (struct sadb_msg *) out_skb->data;
1602 	out_hdr->sadb_msg_version = hdr->sadb_msg_version;
1603 	out_hdr->sadb_msg_type = SADB_GET;
1604 	out_hdr->sadb_msg_satype = pfkey_proto2satype(proto);
1605 	out_hdr->sadb_msg_errno = 0;
1606 	out_hdr->sadb_msg_reserved = 0;
1607 	out_hdr->sadb_msg_seq = hdr->sadb_msg_seq;
1608 	out_hdr->sadb_msg_pid = hdr->sadb_msg_pid;
1609 	pfkey_broadcast(out_skb, GFP_ATOMIC, BROADCAST_ONE, sk, sock_net(sk));
1610 
1611 	return 0;
1612 }
1613 
1614 static struct sk_buff *compose_sadb_supported(const struct sadb_msg *orig,
1615 					      gfp_t allocation)
1616 {
1617 	struct sk_buff *skb;
1618 	struct sadb_msg *hdr;
1619 	int len, auth_len, enc_len, i;
1620 
1621 	auth_len = xfrm_count_pfkey_auth_supported();
1622 	if (auth_len) {
1623 		auth_len *= sizeof(struct sadb_alg);
1624 		auth_len += sizeof(struct sadb_supported);
1625 	}
1626 
1627 	enc_len = xfrm_count_pfkey_enc_supported();
1628 	if (enc_len) {
1629 		enc_len *= sizeof(struct sadb_alg);
1630 		enc_len += sizeof(struct sadb_supported);
1631 	}
1632 
1633 	len = enc_len + auth_len + sizeof(struct sadb_msg);
1634 
1635 	skb = alloc_skb(len + 16, allocation);
1636 	if (!skb)
1637 		goto out_put_algs;
1638 
1639 	hdr = skb_put(skb, sizeof(*hdr));
1640 	pfkey_hdr_dup(hdr, orig);
1641 	hdr->sadb_msg_errno = 0;
1642 	hdr->sadb_msg_len = len / sizeof(uint64_t);
1643 
1644 	if (auth_len) {
1645 		struct sadb_supported *sp;
1646 		struct sadb_alg *ap;
1647 
1648 		sp = skb_put(skb, auth_len);
1649 		ap = (struct sadb_alg *) (sp + 1);
1650 
1651 		sp->sadb_supported_len = auth_len / sizeof(uint64_t);
1652 		sp->sadb_supported_exttype = SADB_EXT_SUPPORTED_AUTH;
1653 
1654 		for (i = 0; ; i++) {
1655 			struct xfrm_algo_desc *aalg = xfrm_aalg_get_byidx(i);
1656 			if (!aalg)
1657 				break;
1658 			if (!aalg->pfkey_supported)
1659 				continue;
1660 			if (aalg->available)
1661 				*ap++ = aalg->desc;
1662 		}
1663 	}
1664 
1665 	if (enc_len) {
1666 		struct sadb_supported *sp;
1667 		struct sadb_alg *ap;
1668 
1669 		sp = skb_put(skb, enc_len);
1670 		ap = (struct sadb_alg *) (sp + 1);
1671 
1672 		sp->sadb_supported_len = enc_len / sizeof(uint64_t);
1673 		sp->sadb_supported_exttype = SADB_EXT_SUPPORTED_ENCRYPT;
1674 
1675 		for (i = 0; ; i++) {
1676 			struct xfrm_algo_desc *ealg = xfrm_ealg_get_byidx(i);
1677 			if (!ealg)
1678 				break;
1679 			if (!ealg->pfkey_supported)
1680 				continue;
1681 			if (ealg->available)
1682 				*ap++ = ealg->desc;
1683 		}
1684 	}
1685 
1686 out_put_algs:
1687 	return skb;
1688 }
1689 
1690 static int pfkey_register(struct sock *sk, struct sk_buff *skb, const struct sadb_msg *hdr, void * const *ext_hdrs)
1691 {
1692 	struct pfkey_sock *pfk = pfkey_sk(sk);
1693 	struct sk_buff *supp_skb;
1694 
1695 	if (hdr->sadb_msg_satype > SADB_SATYPE_MAX)
1696 		return -EINVAL;
1697 
1698 	if (hdr->sadb_msg_satype != SADB_SATYPE_UNSPEC) {
1699 		if (pfk->registered&(1<<hdr->sadb_msg_satype))
1700 			return -EEXIST;
1701 		pfk->registered |= (1<<hdr->sadb_msg_satype);
1702 	}
1703 
1704 	xfrm_probe_algs();
1705 
1706 	supp_skb = compose_sadb_supported(hdr, GFP_KERNEL);
1707 	if (!supp_skb) {
1708 		if (hdr->sadb_msg_satype != SADB_SATYPE_UNSPEC)
1709 			pfk->registered &= ~(1<<hdr->sadb_msg_satype);
1710 
1711 		return -ENOBUFS;
1712 	}
1713 
1714 	pfkey_broadcast(supp_skb, GFP_KERNEL, BROADCAST_REGISTERED, sk,
1715 			sock_net(sk));
1716 	return 0;
1717 }
1718 
1719 static int unicast_flush_resp(struct sock *sk, const struct sadb_msg *ihdr)
1720 {
1721 	struct sk_buff *skb;
1722 	struct sadb_msg *hdr;
1723 
1724 	skb = alloc_skb(sizeof(struct sadb_msg) + 16, GFP_ATOMIC);
1725 	if (!skb)
1726 		return -ENOBUFS;
1727 
1728 	hdr = skb_put_data(skb, ihdr, sizeof(struct sadb_msg));
1729 	hdr->sadb_msg_errno = (uint8_t) 0;
1730 	hdr->sadb_msg_len = (sizeof(struct sadb_msg) / sizeof(uint64_t));
1731 
1732 	return pfkey_broadcast(skb, GFP_ATOMIC, BROADCAST_ONE, sk,
1733 			       sock_net(sk));
1734 }
1735 
1736 static int key_notify_sa_flush(const struct km_event *c)
1737 {
1738 	struct sk_buff *skb;
1739 	struct sadb_msg *hdr;
1740 
1741 	skb = alloc_skb(sizeof(struct sadb_msg) + 16, GFP_ATOMIC);
1742 	if (!skb)
1743 		return -ENOBUFS;
1744 	hdr = skb_put(skb, sizeof(struct sadb_msg));
1745 	hdr->sadb_msg_satype = pfkey_proto2satype(c->data.proto);
1746 	hdr->sadb_msg_type = SADB_FLUSH;
1747 	hdr->sadb_msg_seq = c->seq;
1748 	hdr->sadb_msg_pid = c->portid;
1749 	hdr->sadb_msg_version = PF_KEY_V2;
1750 	hdr->sadb_msg_errno = (uint8_t) 0;
1751 	hdr->sadb_msg_len = (sizeof(struct sadb_msg) / sizeof(uint64_t));
1752 	hdr->sadb_msg_reserved = 0;
1753 
1754 	pfkey_broadcast(skb, GFP_ATOMIC, BROADCAST_ALL, NULL, c->net);
1755 
1756 	return 0;
1757 }
1758 
1759 static int pfkey_flush(struct sock *sk, struct sk_buff *skb, const struct sadb_msg *hdr, void * const *ext_hdrs)
1760 {
1761 	struct net *net = sock_net(sk);
1762 	unsigned int proto;
1763 	struct km_event c;
1764 	int err, err2;
1765 
1766 	proto = pfkey_satype2proto(hdr->sadb_msg_satype);
1767 	if (proto == 0)
1768 		return -EINVAL;
1769 
1770 	err = xfrm_state_flush(net, proto, true, false);
1771 	err2 = unicast_flush_resp(sk, hdr);
1772 	if (err || err2) {
1773 		if (err == -ESRCH) /* empty table - go quietly */
1774 			err = 0;
1775 		return err ? err : err2;
1776 	}
1777 
1778 	c.data.proto = proto;
1779 	c.seq = hdr->sadb_msg_seq;
1780 	c.portid = hdr->sadb_msg_pid;
1781 	c.event = XFRM_MSG_FLUSHSA;
1782 	c.net = net;
1783 	km_state_notify(NULL, &c);
1784 
1785 	return 0;
1786 }
1787 
1788 static int dump_sa(struct xfrm_state *x, int count, void *ptr)
1789 {
1790 	struct pfkey_sock *pfk = ptr;
1791 	struct sk_buff *out_skb;
1792 	struct sadb_msg *out_hdr;
1793 
1794 	if (!pfkey_can_dump(&pfk->sk))
1795 		return -ENOBUFS;
1796 
1797 	out_skb = pfkey_xfrm_state2msg(x);
1798 	if (IS_ERR(out_skb))
1799 		return PTR_ERR(out_skb);
1800 
1801 	out_hdr = (struct sadb_msg *) out_skb->data;
1802 	out_hdr->sadb_msg_version = pfk->dump.msg_version;
1803 	out_hdr->sadb_msg_type = SADB_DUMP;
1804 	out_hdr->sadb_msg_satype = pfkey_proto2satype(x->id.proto);
1805 	out_hdr->sadb_msg_errno = 0;
1806 	out_hdr->sadb_msg_reserved = 0;
1807 	out_hdr->sadb_msg_seq = count + 1;
1808 	out_hdr->sadb_msg_pid = pfk->dump.msg_portid;
1809 
1810 	if (pfk->dump.skb)
1811 		pfkey_broadcast(pfk->dump.skb, GFP_ATOMIC, BROADCAST_ONE,
1812 				&pfk->sk, sock_net(&pfk->sk));
1813 	pfk->dump.skb = out_skb;
1814 
1815 	return 0;
1816 }
1817 
1818 static int pfkey_dump_sa(struct pfkey_sock *pfk)
1819 {
1820 	struct net *net = sock_net(&pfk->sk);
1821 	return xfrm_state_walk(net, &pfk->dump.u.state, dump_sa, (void *) pfk);
1822 }
1823 
1824 static void pfkey_dump_sa_done(struct pfkey_sock *pfk)
1825 {
1826 	struct net *net = sock_net(&pfk->sk);
1827 
1828 	xfrm_state_walk_done(&pfk->dump.u.state, net);
1829 }
1830 
1831 static int pfkey_dump(struct sock *sk, struct sk_buff *skb, const struct sadb_msg *hdr, void * const *ext_hdrs)
1832 {
1833 	u8 proto;
1834 	struct xfrm_address_filter *filter = NULL;
1835 	struct pfkey_sock *pfk = pfkey_sk(sk);
1836 
1837 	mutex_lock(&pfk->dump_lock);
1838 	if (pfk->dump.dump != NULL) {
1839 		mutex_unlock(&pfk->dump_lock);
1840 		return -EBUSY;
1841 	}
1842 
1843 	proto = pfkey_satype2proto(hdr->sadb_msg_satype);
1844 	if (proto == 0) {
1845 		mutex_unlock(&pfk->dump_lock);
1846 		return -EINVAL;
1847 	}
1848 
1849 	if (ext_hdrs[SADB_X_EXT_FILTER - 1]) {
1850 		struct sadb_x_filter *xfilter = ext_hdrs[SADB_X_EXT_FILTER - 1];
1851 
1852 		if ((xfilter->sadb_x_filter_splen >=
1853 			(sizeof(xfrm_address_t) << 3)) ||
1854 		    (xfilter->sadb_x_filter_dplen >=
1855 			(sizeof(xfrm_address_t) << 3))) {
1856 			mutex_unlock(&pfk->dump_lock);
1857 			return -EINVAL;
1858 		}
1859 		filter = kmalloc(sizeof(*filter), GFP_KERNEL);
1860 		if (filter == NULL) {
1861 			mutex_unlock(&pfk->dump_lock);
1862 			return -ENOMEM;
1863 		}
1864 
1865 		memcpy(&filter->saddr, &xfilter->sadb_x_filter_saddr,
1866 		       sizeof(xfrm_address_t));
1867 		memcpy(&filter->daddr, &xfilter->sadb_x_filter_daddr,
1868 		       sizeof(xfrm_address_t));
1869 		filter->family = xfilter->sadb_x_filter_family;
1870 		filter->splen = xfilter->sadb_x_filter_splen;
1871 		filter->dplen = xfilter->sadb_x_filter_dplen;
1872 	}
1873 
1874 	pfk->dump.msg_version = hdr->sadb_msg_version;
1875 	pfk->dump.msg_portid = hdr->sadb_msg_pid;
1876 	pfk->dump.dump = pfkey_dump_sa;
1877 	pfk->dump.done = pfkey_dump_sa_done;
1878 	xfrm_state_walk_init(&pfk->dump.u.state, proto, filter);
1879 	mutex_unlock(&pfk->dump_lock);
1880 
1881 	return pfkey_do_dump(pfk);
1882 }
1883 
1884 static int pfkey_promisc(struct sock *sk, struct sk_buff *skb, const struct sadb_msg *hdr, void * const *ext_hdrs)
1885 {
1886 	struct pfkey_sock *pfk = pfkey_sk(sk);
1887 	int satype = hdr->sadb_msg_satype;
1888 	bool reset_errno = false;
1889 
1890 	if (hdr->sadb_msg_len == (sizeof(*hdr) / sizeof(uint64_t))) {
1891 		reset_errno = true;
1892 		if (satype != 0 && satype != 1)
1893 			return -EINVAL;
1894 		pfk->promisc = satype;
1895 	}
1896 	if (reset_errno && skb_cloned(skb))
1897 		skb = skb_copy(skb, GFP_KERNEL);
1898 	else
1899 		skb = skb_clone(skb, GFP_KERNEL);
1900 
1901 	if (reset_errno && skb) {
1902 		struct sadb_msg *new_hdr = (struct sadb_msg *) skb->data;
1903 		new_hdr->sadb_msg_errno = 0;
1904 	}
1905 
1906 	pfkey_broadcast(skb, GFP_KERNEL, BROADCAST_ALL, NULL, sock_net(sk));
1907 	return 0;
1908 }
1909 
1910 static int check_reqid(struct xfrm_policy *xp, int dir, int count, void *ptr)
1911 {
1912 	int i;
1913 	u32 reqid = *(u32*)ptr;
1914 
1915 	for (i=0; i<xp->xfrm_nr; i++) {
1916 		if (xp->xfrm_vec[i].reqid == reqid)
1917 			return -EEXIST;
1918 	}
1919 	return 0;
1920 }
1921 
1922 static u32 gen_reqid(struct net *net)
1923 {
1924 	struct xfrm_policy_walk walk;
1925 	u32 start;
1926 	int rc;
1927 	static u32 reqid = IPSEC_MANUAL_REQID_MAX;
1928 
1929 	start = reqid;
1930 	do {
1931 		++reqid;
1932 		if (reqid == 0)
1933 			reqid = IPSEC_MANUAL_REQID_MAX+1;
1934 		xfrm_policy_walk_init(&walk, XFRM_POLICY_TYPE_MAIN);
1935 		rc = xfrm_policy_walk(net, &walk, check_reqid, (void*)&reqid);
1936 		xfrm_policy_walk_done(&walk, net);
1937 		if (rc != -EEXIST)
1938 			return reqid;
1939 	} while (reqid != start);
1940 	return 0;
1941 }
1942 
1943 static int
1944 parse_ipsecrequest(struct xfrm_policy *xp, struct sadb_x_ipsecrequest *rq)
1945 {
1946 	struct net *net = xp_net(xp);
1947 	struct xfrm_tmpl *t = xp->xfrm_vec + xp->xfrm_nr;
1948 	int mode;
1949 
1950 	if (xp->xfrm_nr >= XFRM_MAX_DEPTH)
1951 		return -ELOOP;
1952 
1953 	if (rq->sadb_x_ipsecrequest_mode == 0)
1954 		return -EINVAL;
1955 	if (!xfrm_id_proto_valid(rq->sadb_x_ipsecrequest_proto))
1956 		return -EINVAL;
1957 
1958 	t->id.proto = rq->sadb_x_ipsecrequest_proto;
1959 	if ((mode = pfkey_mode_to_xfrm(rq->sadb_x_ipsecrequest_mode)) < 0)
1960 		return -EINVAL;
1961 	t->mode = mode;
1962 	if (rq->sadb_x_ipsecrequest_level == IPSEC_LEVEL_USE)
1963 		t->optional = 1;
1964 	else if (rq->sadb_x_ipsecrequest_level == IPSEC_LEVEL_UNIQUE) {
1965 		t->reqid = rq->sadb_x_ipsecrequest_reqid;
1966 		if (t->reqid > IPSEC_MANUAL_REQID_MAX)
1967 			t->reqid = 0;
1968 		if (!t->reqid && !(t->reqid = gen_reqid(net)))
1969 			return -ENOBUFS;
1970 	}
1971 
1972 	/* addresses present only in tunnel mode */
1973 	if (t->mode == XFRM_MODE_TUNNEL) {
1974 		int err;
1975 
1976 		err = parse_sockaddr_pair(
1977 			(struct sockaddr *)(rq + 1),
1978 			rq->sadb_x_ipsecrequest_len - sizeof(*rq),
1979 			&t->saddr, &t->id.daddr, &t->encap_family);
1980 		if (err)
1981 			return err;
1982 	} else
1983 		t->encap_family = xp->family;
1984 
1985 	/* No way to set this via kame pfkey */
1986 	t->allalgs = 1;
1987 	xp->xfrm_nr++;
1988 	return 0;
1989 }
1990 
1991 static int
1992 parse_ipsecrequests(struct xfrm_policy *xp, struct sadb_x_policy *pol)
1993 {
1994 	int err;
1995 	int len = pol->sadb_x_policy_len*8 - sizeof(struct sadb_x_policy);
1996 	struct sadb_x_ipsecrequest *rq = (void*)(pol+1);
1997 
1998 	if (pol->sadb_x_policy_len * 8 < sizeof(struct sadb_x_policy))
1999 		return -EINVAL;
2000 
2001 	while (len >= sizeof(*rq)) {
2002 		if (len < rq->sadb_x_ipsecrequest_len ||
2003 		    rq->sadb_x_ipsecrequest_len < sizeof(*rq))
2004 			return -EINVAL;
2005 
2006 		if ((err = parse_ipsecrequest(xp, rq)) < 0)
2007 			return err;
2008 		len -= rq->sadb_x_ipsecrequest_len;
2009 		rq = (void*)((u8*)rq + rq->sadb_x_ipsecrequest_len);
2010 	}
2011 	return 0;
2012 }
2013 
2014 static inline int pfkey_xfrm_policy2sec_ctx_size(const struct xfrm_policy *xp)
2015 {
2016 	struct xfrm_sec_ctx *xfrm_ctx = xp->security;
2017 
2018 	if (xfrm_ctx) {
2019 		int len = sizeof(struct sadb_x_sec_ctx);
2020 		len += xfrm_ctx->ctx_len;
2021 		return PFKEY_ALIGN8(len);
2022 	}
2023 	return 0;
2024 }
2025 
2026 static int pfkey_xfrm_policy2msg_size(const struct xfrm_policy *xp)
2027 {
2028 	const struct xfrm_tmpl *t;
2029 	int sockaddr_size = pfkey_sockaddr_size(xp->family);
2030 	int socklen = 0;
2031 	int i;
2032 
2033 	for (i=0; i<xp->xfrm_nr; i++) {
2034 		t = xp->xfrm_vec + i;
2035 		socklen += pfkey_sockaddr_len(t->encap_family);
2036 	}
2037 
2038 	return sizeof(struct sadb_msg) +
2039 		(sizeof(struct sadb_lifetime) * 3) +
2040 		(sizeof(struct sadb_address) * 2) +
2041 		(sockaddr_size * 2) +
2042 		sizeof(struct sadb_x_policy) +
2043 		(xp->xfrm_nr * sizeof(struct sadb_x_ipsecrequest)) +
2044 		(socklen * 2) +
2045 		pfkey_xfrm_policy2sec_ctx_size(xp);
2046 }
2047 
2048 static struct sk_buff * pfkey_xfrm_policy2msg_prep(const struct xfrm_policy *xp)
2049 {
2050 	struct sk_buff *skb;
2051 	int size;
2052 
2053 	size = pfkey_xfrm_policy2msg_size(xp);
2054 
2055 	skb =  alloc_skb(size + 16, GFP_ATOMIC);
2056 	if (skb == NULL)
2057 		return ERR_PTR(-ENOBUFS);
2058 
2059 	return skb;
2060 }
2061 
2062 static int pfkey_xfrm_policy2msg(struct sk_buff *skb, const struct xfrm_policy *xp, int dir)
2063 {
2064 	struct sadb_msg *hdr;
2065 	struct sadb_address *addr;
2066 	struct sadb_lifetime *lifetime;
2067 	struct sadb_x_policy *pol;
2068 	struct sadb_x_sec_ctx *sec_ctx;
2069 	struct xfrm_sec_ctx *xfrm_ctx;
2070 	int i;
2071 	int size;
2072 	int sockaddr_size = pfkey_sockaddr_size(xp->family);
2073 	int socklen = pfkey_sockaddr_len(xp->family);
2074 
2075 	size = pfkey_xfrm_policy2msg_size(xp);
2076 
2077 	/* call should fill header later */
2078 	hdr = skb_put(skb, sizeof(struct sadb_msg));
2079 	memset(hdr, 0, size);	/* XXX do we need this ? */
2080 
2081 	/* src address */
2082 	addr = skb_put(skb, sizeof(struct sadb_address) + sockaddr_size);
2083 	addr->sadb_address_len =
2084 		(sizeof(struct sadb_address)+sockaddr_size)/
2085 			sizeof(uint64_t);
2086 	addr->sadb_address_exttype = SADB_EXT_ADDRESS_SRC;
2087 	addr->sadb_address_proto = pfkey_proto_from_xfrm(xp->selector.proto);
2088 	addr->sadb_address_prefixlen = xp->selector.prefixlen_s;
2089 	addr->sadb_address_reserved = 0;
2090 	if (!pfkey_sockaddr_fill(&xp->selector.saddr,
2091 				 xp->selector.sport,
2092 				 (struct sockaddr *) (addr + 1),
2093 				 xp->family))
2094 		BUG();
2095 
2096 	/* dst address */
2097 	addr = skb_put(skb, sizeof(struct sadb_address) + sockaddr_size);
2098 	addr->sadb_address_len =
2099 		(sizeof(struct sadb_address)+sockaddr_size)/
2100 			sizeof(uint64_t);
2101 	addr->sadb_address_exttype = SADB_EXT_ADDRESS_DST;
2102 	addr->sadb_address_proto = pfkey_proto_from_xfrm(xp->selector.proto);
2103 	addr->sadb_address_prefixlen = xp->selector.prefixlen_d;
2104 	addr->sadb_address_reserved = 0;
2105 
2106 	pfkey_sockaddr_fill(&xp->selector.daddr, xp->selector.dport,
2107 			    (struct sockaddr *) (addr + 1),
2108 			    xp->family);
2109 
2110 	/* hard time */
2111 	lifetime = skb_put(skb, sizeof(struct sadb_lifetime));
2112 	lifetime->sadb_lifetime_len =
2113 		sizeof(struct sadb_lifetime)/sizeof(uint64_t);
2114 	lifetime->sadb_lifetime_exttype = SADB_EXT_LIFETIME_HARD;
2115 	lifetime->sadb_lifetime_allocations =  _X2KEY(xp->lft.hard_packet_limit);
2116 	lifetime->sadb_lifetime_bytes = _X2KEY(xp->lft.hard_byte_limit);
2117 	lifetime->sadb_lifetime_addtime = xp->lft.hard_add_expires_seconds;
2118 	lifetime->sadb_lifetime_usetime = xp->lft.hard_use_expires_seconds;
2119 	/* soft time */
2120 	lifetime = skb_put(skb, sizeof(struct sadb_lifetime));
2121 	lifetime->sadb_lifetime_len =
2122 		sizeof(struct sadb_lifetime)/sizeof(uint64_t);
2123 	lifetime->sadb_lifetime_exttype = SADB_EXT_LIFETIME_SOFT;
2124 	lifetime->sadb_lifetime_allocations =  _X2KEY(xp->lft.soft_packet_limit);
2125 	lifetime->sadb_lifetime_bytes = _X2KEY(xp->lft.soft_byte_limit);
2126 	lifetime->sadb_lifetime_addtime = xp->lft.soft_add_expires_seconds;
2127 	lifetime->sadb_lifetime_usetime = xp->lft.soft_use_expires_seconds;
2128 	/* current time */
2129 	lifetime = skb_put(skb, sizeof(struct sadb_lifetime));
2130 	lifetime->sadb_lifetime_len =
2131 		sizeof(struct sadb_lifetime)/sizeof(uint64_t);
2132 	lifetime->sadb_lifetime_exttype = SADB_EXT_LIFETIME_CURRENT;
2133 	lifetime->sadb_lifetime_allocations = xp->curlft.packets;
2134 	lifetime->sadb_lifetime_bytes = xp->curlft.bytes;
2135 	lifetime->sadb_lifetime_addtime = xp->curlft.add_time;
2136 	lifetime->sadb_lifetime_usetime = xp->curlft.use_time;
2137 
2138 	pol = skb_put(skb, sizeof(struct sadb_x_policy));
2139 	pol->sadb_x_policy_len = sizeof(struct sadb_x_policy)/sizeof(uint64_t);
2140 	pol->sadb_x_policy_exttype = SADB_X_EXT_POLICY;
2141 	pol->sadb_x_policy_type = IPSEC_POLICY_DISCARD;
2142 	if (xp->action == XFRM_POLICY_ALLOW) {
2143 		if (xp->xfrm_nr)
2144 			pol->sadb_x_policy_type = IPSEC_POLICY_IPSEC;
2145 		else
2146 			pol->sadb_x_policy_type = IPSEC_POLICY_NONE;
2147 	}
2148 	pol->sadb_x_policy_dir = dir+1;
2149 	pol->sadb_x_policy_reserved = 0;
2150 	pol->sadb_x_policy_id = xp->index;
2151 	pol->sadb_x_policy_priority = xp->priority;
2152 
2153 	for (i=0; i<xp->xfrm_nr; i++) {
2154 		const struct xfrm_tmpl *t = xp->xfrm_vec + i;
2155 		struct sadb_x_ipsecrequest *rq;
2156 		int req_size;
2157 		int mode;
2158 
2159 		req_size = sizeof(struct sadb_x_ipsecrequest);
2160 		if (t->mode == XFRM_MODE_TUNNEL) {
2161 			socklen = pfkey_sockaddr_len(t->encap_family);
2162 			req_size += socklen * 2;
2163 		} else {
2164 			size -= 2*socklen;
2165 		}
2166 		rq = skb_put(skb, req_size);
2167 		pol->sadb_x_policy_len += req_size/8;
2168 		memset(rq, 0, sizeof(*rq));
2169 		rq->sadb_x_ipsecrequest_len = req_size;
2170 		rq->sadb_x_ipsecrequest_proto = t->id.proto;
2171 		if ((mode = pfkey_mode_from_xfrm(t->mode)) < 0)
2172 			return -EINVAL;
2173 		rq->sadb_x_ipsecrequest_mode = mode;
2174 		rq->sadb_x_ipsecrequest_level = IPSEC_LEVEL_REQUIRE;
2175 		if (t->reqid)
2176 			rq->sadb_x_ipsecrequest_level = IPSEC_LEVEL_UNIQUE;
2177 		if (t->optional)
2178 			rq->sadb_x_ipsecrequest_level = IPSEC_LEVEL_USE;
2179 		rq->sadb_x_ipsecrequest_reqid = t->reqid;
2180 
2181 		if (t->mode == XFRM_MODE_TUNNEL) {
2182 			u8 *sa = (void *)(rq + 1);
2183 			pfkey_sockaddr_fill(&t->saddr, 0,
2184 					    (struct sockaddr *)sa,
2185 					    t->encap_family);
2186 			pfkey_sockaddr_fill(&t->id.daddr, 0,
2187 					    (struct sockaddr *) (sa + socklen),
2188 					    t->encap_family);
2189 		}
2190 	}
2191 
2192 	/* security context */
2193 	if ((xfrm_ctx = xp->security)) {
2194 		int ctx_size = pfkey_xfrm_policy2sec_ctx_size(xp);
2195 
2196 		sec_ctx = skb_put(skb, ctx_size);
2197 		sec_ctx->sadb_x_sec_len = ctx_size / sizeof(uint64_t);
2198 		sec_ctx->sadb_x_sec_exttype = SADB_X_EXT_SEC_CTX;
2199 		sec_ctx->sadb_x_ctx_doi = xfrm_ctx->ctx_doi;
2200 		sec_ctx->sadb_x_ctx_alg = xfrm_ctx->ctx_alg;
2201 		sec_ctx->sadb_x_ctx_len = xfrm_ctx->ctx_len;
2202 		memcpy(sec_ctx + 1, xfrm_ctx->ctx_str,
2203 		       xfrm_ctx->ctx_len);
2204 	}
2205 
2206 	hdr->sadb_msg_len = size / sizeof(uint64_t);
2207 	hdr->sadb_msg_reserved = refcount_read(&xp->refcnt);
2208 
2209 	return 0;
2210 }
2211 
2212 static int key_notify_policy(struct xfrm_policy *xp, int dir, const struct km_event *c)
2213 {
2214 	struct sk_buff *out_skb;
2215 	struct sadb_msg *out_hdr;
2216 	int err;
2217 
2218 	out_skb = pfkey_xfrm_policy2msg_prep(xp);
2219 	if (IS_ERR(out_skb))
2220 		return PTR_ERR(out_skb);
2221 
2222 	err = pfkey_xfrm_policy2msg(out_skb, xp, dir);
2223 	if (err < 0) {
2224 		kfree_skb(out_skb);
2225 		return err;
2226 	}
2227 
2228 	out_hdr = (struct sadb_msg *) out_skb->data;
2229 	out_hdr->sadb_msg_version = PF_KEY_V2;
2230 
2231 	if (c->data.byid && c->event == XFRM_MSG_DELPOLICY)
2232 		out_hdr->sadb_msg_type = SADB_X_SPDDELETE2;
2233 	else
2234 		out_hdr->sadb_msg_type = event2poltype(c->event);
2235 	out_hdr->sadb_msg_errno = 0;
2236 	out_hdr->sadb_msg_seq = c->seq;
2237 	out_hdr->sadb_msg_pid = c->portid;
2238 	pfkey_broadcast(out_skb, GFP_ATOMIC, BROADCAST_ALL, NULL, xp_net(xp));
2239 	return 0;
2240 
2241 }
2242 
2243 static int pfkey_spdadd(struct sock *sk, struct sk_buff *skb, const struct sadb_msg *hdr, void * const *ext_hdrs)
2244 {
2245 	struct net *net = sock_net(sk);
2246 	int err = 0;
2247 	struct sadb_lifetime *lifetime;
2248 	struct sadb_address *sa;
2249 	struct sadb_x_policy *pol;
2250 	struct xfrm_policy *xp;
2251 	struct km_event c;
2252 	struct sadb_x_sec_ctx *sec_ctx;
2253 
2254 	if (!present_and_same_family(ext_hdrs[SADB_EXT_ADDRESS_SRC-1],
2255 				     ext_hdrs[SADB_EXT_ADDRESS_DST-1]) ||
2256 	    !ext_hdrs[SADB_X_EXT_POLICY-1])
2257 		return -EINVAL;
2258 
2259 	pol = ext_hdrs[SADB_X_EXT_POLICY-1];
2260 	if (pol->sadb_x_policy_type > IPSEC_POLICY_IPSEC)
2261 		return -EINVAL;
2262 	if (!pol->sadb_x_policy_dir || pol->sadb_x_policy_dir >= IPSEC_DIR_MAX)
2263 		return -EINVAL;
2264 
2265 	xp = xfrm_policy_alloc(net, GFP_KERNEL);
2266 	if (xp == NULL)
2267 		return -ENOBUFS;
2268 
2269 	xp->action = (pol->sadb_x_policy_type == IPSEC_POLICY_DISCARD ?
2270 		      XFRM_POLICY_BLOCK : XFRM_POLICY_ALLOW);
2271 	xp->priority = pol->sadb_x_policy_priority;
2272 
2273 	sa = ext_hdrs[SADB_EXT_ADDRESS_SRC-1];
2274 	xp->family = pfkey_sadb_addr2xfrm_addr(sa, &xp->selector.saddr);
2275 	xp->selector.family = xp->family;
2276 	xp->selector.prefixlen_s = sa->sadb_address_prefixlen;
2277 	xp->selector.proto = pfkey_proto_to_xfrm(sa->sadb_address_proto);
2278 	xp->selector.sport = ((struct sockaddr_in *)(sa+1))->sin_port;
2279 	if (xp->selector.sport)
2280 		xp->selector.sport_mask = htons(0xffff);
2281 
2282 	sa = ext_hdrs[SADB_EXT_ADDRESS_DST-1];
2283 	pfkey_sadb_addr2xfrm_addr(sa, &xp->selector.daddr);
2284 	xp->selector.prefixlen_d = sa->sadb_address_prefixlen;
2285 
2286 	/* Amusing, we set this twice.  KAME apps appear to set same value
2287 	 * in both addresses.
2288 	 */
2289 	xp->selector.proto = pfkey_proto_to_xfrm(sa->sadb_address_proto);
2290 
2291 	xp->selector.dport = ((struct sockaddr_in *)(sa+1))->sin_port;
2292 	if (xp->selector.dport)
2293 		xp->selector.dport_mask = htons(0xffff);
2294 
2295 	sec_ctx = ext_hdrs[SADB_X_EXT_SEC_CTX - 1];
2296 	if (sec_ctx != NULL) {
2297 		struct xfrm_user_sec_ctx *uctx = pfkey_sadb2xfrm_user_sec_ctx(sec_ctx, GFP_KERNEL);
2298 
2299 		if (!uctx) {
2300 			err = -ENOBUFS;
2301 			goto out;
2302 		}
2303 
2304 		err = security_xfrm_policy_alloc(&xp->security, uctx, GFP_KERNEL);
2305 		kfree(uctx);
2306 
2307 		if (err)
2308 			goto out;
2309 	}
2310 
2311 	xp->lft.soft_byte_limit = XFRM_INF;
2312 	xp->lft.hard_byte_limit = XFRM_INF;
2313 	xp->lft.soft_packet_limit = XFRM_INF;
2314 	xp->lft.hard_packet_limit = XFRM_INF;
2315 	if ((lifetime = ext_hdrs[SADB_EXT_LIFETIME_HARD-1]) != NULL) {
2316 		xp->lft.hard_packet_limit = _KEY2X(lifetime->sadb_lifetime_allocations);
2317 		xp->lft.hard_byte_limit = _KEY2X(lifetime->sadb_lifetime_bytes);
2318 		xp->lft.hard_add_expires_seconds = lifetime->sadb_lifetime_addtime;
2319 		xp->lft.hard_use_expires_seconds = lifetime->sadb_lifetime_usetime;
2320 	}
2321 	if ((lifetime = ext_hdrs[SADB_EXT_LIFETIME_SOFT-1]) != NULL) {
2322 		xp->lft.soft_packet_limit = _KEY2X(lifetime->sadb_lifetime_allocations);
2323 		xp->lft.soft_byte_limit = _KEY2X(lifetime->sadb_lifetime_bytes);
2324 		xp->lft.soft_add_expires_seconds = lifetime->sadb_lifetime_addtime;
2325 		xp->lft.soft_use_expires_seconds = lifetime->sadb_lifetime_usetime;
2326 	}
2327 	xp->xfrm_nr = 0;
2328 	if (pol->sadb_x_policy_type == IPSEC_POLICY_IPSEC &&
2329 	    (err = parse_ipsecrequests(xp, pol)) < 0)
2330 		goto out;
2331 
2332 	err = xfrm_policy_insert(pol->sadb_x_policy_dir-1, xp,
2333 				 hdr->sadb_msg_type != SADB_X_SPDUPDATE);
2334 
2335 	xfrm_audit_policy_add(xp, err ? 0 : 1, true);
2336 
2337 	if (err)
2338 		goto out;
2339 
2340 	if (hdr->sadb_msg_type == SADB_X_SPDUPDATE)
2341 		c.event = XFRM_MSG_UPDPOLICY;
2342 	else
2343 		c.event = XFRM_MSG_NEWPOLICY;
2344 
2345 	c.seq = hdr->sadb_msg_seq;
2346 	c.portid = hdr->sadb_msg_pid;
2347 
2348 	km_policy_notify(xp, pol->sadb_x_policy_dir-1, &c);
2349 	xfrm_pol_put(xp);
2350 	return 0;
2351 
2352 out:
2353 	xp->walk.dead = 1;
2354 	xfrm_policy_destroy(xp);
2355 	return err;
2356 }
2357 
2358 static int pfkey_spddelete(struct sock *sk, struct sk_buff *skb, const struct sadb_msg *hdr, void * const *ext_hdrs)
2359 {
2360 	struct net *net = sock_net(sk);
2361 	int err;
2362 	struct sadb_address *sa;
2363 	struct sadb_x_policy *pol;
2364 	struct xfrm_policy *xp;
2365 	struct xfrm_selector sel;
2366 	struct km_event c;
2367 	struct sadb_x_sec_ctx *sec_ctx;
2368 	struct xfrm_sec_ctx *pol_ctx = NULL;
2369 
2370 	if (!present_and_same_family(ext_hdrs[SADB_EXT_ADDRESS_SRC-1],
2371 				     ext_hdrs[SADB_EXT_ADDRESS_DST-1]) ||
2372 	    !ext_hdrs[SADB_X_EXT_POLICY-1])
2373 		return -EINVAL;
2374 
2375 	pol = ext_hdrs[SADB_X_EXT_POLICY-1];
2376 	if (!pol->sadb_x_policy_dir || pol->sadb_x_policy_dir >= IPSEC_DIR_MAX)
2377 		return -EINVAL;
2378 
2379 	memset(&sel, 0, sizeof(sel));
2380 
2381 	sa = ext_hdrs[SADB_EXT_ADDRESS_SRC-1];
2382 	sel.family = pfkey_sadb_addr2xfrm_addr(sa, &sel.saddr);
2383 	sel.prefixlen_s = sa->sadb_address_prefixlen;
2384 	sel.proto = pfkey_proto_to_xfrm(sa->sadb_address_proto);
2385 	sel.sport = ((struct sockaddr_in *)(sa+1))->sin_port;
2386 	if (sel.sport)
2387 		sel.sport_mask = htons(0xffff);
2388 
2389 	sa = ext_hdrs[SADB_EXT_ADDRESS_DST-1];
2390 	pfkey_sadb_addr2xfrm_addr(sa, &sel.daddr);
2391 	sel.prefixlen_d = sa->sadb_address_prefixlen;
2392 	sel.proto = pfkey_proto_to_xfrm(sa->sadb_address_proto);
2393 	sel.dport = ((struct sockaddr_in *)(sa+1))->sin_port;
2394 	if (sel.dport)
2395 		sel.dport_mask = htons(0xffff);
2396 
2397 	sec_ctx = ext_hdrs[SADB_X_EXT_SEC_CTX - 1];
2398 	if (sec_ctx != NULL) {
2399 		struct xfrm_user_sec_ctx *uctx = pfkey_sadb2xfrm_user_sec_ctx(sec_ctx, GFP_KERNEL);
2400 
2401 		if (!uctx)
2402 			return -ENOMEM;
2403 
2404 		err = security_xfrm_policy_alloc(&pol_ctx, uctx, GFP_KERNEL);
2405 		kfree(uctx);
2406 		if (err)
2407 			return err;
2408 	}
2409 
2410 	xp = xfrm_policy_bysel_ctx(net, &dummy_mark, 0, XFRM_POLICY_TYPE_MAIN,
2411 				   pol->sadb_x_policy_dir - 1, &sel, pol_ctx,
2412 				   1, &err);
2413 	security_xfrm_policy_free(pol_ctx);
2414 	if (xp == NULL)
2415 		return -ENOENT;
2416 
2417 	xfrm_audit_policy_delete(xp, err ? 0 : 1, true);
2418 
2419 	if (err)
2420 		goto out;
2421 
2422 	c.seq = hdr->sadb_msg_seq;
2423 	c.portid = hdr->sadb_msg_pid;
2424 	c.data.byid = 0;
2425 	c.event = XFRM_MSG_DELPOLICY;
2426 	km_policy_notify(xp, pol->sadb_x_policy_dir-1, &c);
2427 
2428 out:
2429 	xfrm_pol_put(xp);
2430 	return err;
2431 }
2432 
2433 static int key_pol_get_resp(struct sock *sk, struct xfrm_policy *xp, const struct sadb_msg *hdr, int dir)
2434 {
2435 	int err;
2436 	struct sk_buff *out_skb;
2437 	struct sadb_msg *out_hdr;
2438 	err = 0;
2439 
2440 	out_skb = pfkey_xfrm_policy2msg_prep(xp);
2441 	if (IS_ERR(out_skb)) {
2442 		err =  PTR_ERR(out_skb);
2443 		goto out;
2444 	}
2445 	err = pfkey_xfrm_policy2msg(out_skb, xp, dir);
2446 	if (err < 0) {
2447 		kfree_skb(out_skb);
2448 		goto out;
2449 	}
2450 
2451 	out_hdr = (struct sadb_msg *) out_skb->data;
2452 	out_hdr->sadb_msg_version = hdr->sadb_msg_version;
2453 	out_hdr->sadb_msg_type = hdr->sadb_msg_type;
2454 	out_hdr->sadb_msg_satype = 0;
2455 	out_hdr->sadb_msg_errno = 0;
2456 	out_hdr->sadb_msg_seq = hdr->sadb_msg_seq;
2457 	out_hdr->sadb_msg_pid = hdr->sadb_msg_pid;
2458 	pfkey_broadcast(out_skb, GFP_ATOMIC, BROADCAST_ONE, sk, xp_net(xp));
2459 	err = 0;
2460 
2461 out:
2462 	return err;
2463 }
2464 
2465 static int pfkey_sockaddr_pair_size(sa_family_t family)
2466 {
2467 	return PFKEY_ALIGN8(pfkey_sockaddr_len(family) * 2);
2468 }
2469 
2470 static int parse_sockaddr_pair(struct sockaddr *sa, int ext_len,
2471 			       xfrm_address_t *saddr, xfrm_address_t *daddr,
2472 			       u16 *family)
2473 {
2474 	int af, socklen;
2475 
2476 	if (ext_len < 2 || ext_len < pfkey_sockaddr_pair_size(sa->sa_family))
2477 		return -EINVAL;
2478 
2479 	af = pfkey_sockaddr_extract(sa, saddr);
2480 	if (!af)
2481 		return -EINVAL;
2482 
2483 	socklen = pfkey_sockaddr_len(af);
2484 	if (pfkey_sockaddr_extract((struct sockaddr *) (((u8 *)sa) + socklen),
2485 				   daddr) != af)
2486 		return -EINVAL;
2487 
2488 	*family = af;
2489 	return 0;
2490 }
2491 
2492 #ifdef CONFIG_NET_KEY_MIGRATE
2493 static int ipsecrequests_to_migrate(struct sadb_x_ipsecrequest *rq1, int len,
2494 				    struct xfrm_migrate *m)
2495 {
2496 	int err;
2497 	struct sadb_x_ipsecrequest *rq2;
2498 	int mode;
2499 
2500 	if (len < sizeof(*rq1) ||
2501 	    len < rq1->sadb_x_ipsecrequest_len ||
2502 	    rq1->sadb_x_ipsecrequest_len < sizeof(*rq1))
2503 		return -EINVAL;
2504 
2505 	/* old endoints */
2506 	err = parse_sockaddr_pair((struct sockaddr *)(rq1 + 1),
2507 				  rq1->sadb_x_ipsecrequest_len - sizeof(*rq1),
2508 				  &m->old_saddr, &m->old_daddr,
2509 				  &m->old_family);
2510 	if (err)
2511 		return err;
2512 
2513 	rq2 = (struct sadb_x_ipsecrequest *)((u8 *)rq1 + rq1->sadb_x_ipsecrequest_len);
2514 	len -= rq1->sadb_x_ipsecrequest_len;
2515 
2516 	if (len <= sizeof(*rq2) ||
2517 	    len < rq2->sadb_x_ipsecrequest_len ||
2518 	    rq2->sadb_x_ipsecrequest_len < sizeof(*rq2))
2519 		return -EINVAL;
2520 
2521 	/* new endpoints */
2522 	err = parse_sockaddr_pair((struct sockaddr *)(rq2 + 1),
2523 				  rq2->sadb_x_ipsecrequest_len - sizeof(*rq2),
2524 				  &m->new_saddr, &m->new_daddr,
2525 				  &m->new_family);
2526 	if (err)
2527 		return err;
2528 
2529 	if (rq1->sadb_x_ipsecrequest_proto != rq2->sadb_x_ipsecrequest_proto ||
2530 	    rq1->sadb_x_ipsecrequest_mode != rq2->sadb_x_ipsecrequest_mode ||
2531 	    rq1->sadb_x_ipsecrequest_reqid != rq2->sadb_x_ipsecrequest_reqid)
2532 		return -EINVAL;
2533 
2534 	m->proto = rq1->sadb_x_ipsecrequest_proto;
2535 	if ((mode = pfkey_mode_to_xfrm(rq1->sadb_x_ipsecrequest_mode)) < 0)
2536 		return -EINVAL;
2537 	m->mode = mode;
2538 	m->reqid = rq1->sadb_x_ipsecrequest_reqid;
2539 
2540 	return ((int)(rq1->sadb_x_ipsecrequest_len +
2541 		      rq2->sadb_x_ipsecrequest_len));
2542 }
2543 
2544 static int pfkey_migrate(struct sock *sk, struct sk_buff *skb,
2545 			 const struct sadb_msg *hdr, void * const *ext_hdrs)
2546 {
2547 	int i, len, ret, err = -EINVAL;
2548 	u8 dir;
2549 	struct sadb_address *sa;
2550 	struct sadb_x_kmaddress *kma;
2551 	struct sadb_x_policy *pol;
2552 	struct sadb_x_ipsecrequest *rq;
2553 	struct xfrm_selector sel;
2554 	struct xfrm_migrate m[XFRM_MAX_DEPTH];
2555 	struct xfrm_kmaddress k;
2556 	struct net *net = sock_net(sk);
2557 
2558 	if (!present_and_same_family(ext_hdrs[SADB_EXT_ADDRESS_SRC - 1],
2559 				     ext_hdrs[SADB_EXT_ADDRESS_DST - 1]) ||
2560 	    !ext_hdrs[SADB_X_EXT_POLICY - 1]) {
2561 		err = -EINVAL;
2562 		goto out;
2563 	}
2564 
2565 	kma = ext_hdrs[SADB_X_EXT_KMADDRESS - 1];
2566 	pol = ext_hdrs[SADB_X_EXT_POLICY - 1];
2567 
2568 	if (pol->sadb_x_policy_dir >= IPSEC_DIR_MAX) {
2569 		err = -EINVAL;
2570 		goto out;
2571 	}
2572 
2573 	if (kma) {
2574 		/* convert sadb_x_kmaddress to xfrm_kmaddress */
2575 		k.reserved = kma->sadb_x_kmaddress_reserved;
2576 		ret = parse_sockaddr_pair((struct sockaddr *)(kma + 1),
2577 					  8*(kma->sadb_x_kmaddress_len) - sizeof(*kma),
2578 					  &k.local, &k.remote, &k.family);
2579 		if (ret < 0) {
2580 			err = ret;
2581 			goto out;
2582 		}
2583 	}
2584 
2585 	dir = pol->sadb_x_policy_dir - 1;
2586 	memset(&sel, 0, sizeof(sel));
2587 
2588 	/* set source address info of selector */
2589 	sa = ext_hdrs[SADB_EXT_ADDRESS_SRC - 1];
2590 	sel.family = pfkey_sadb_addr2xfrm_addr(sa, &sel.saddr);
2591 	sel.prefixlen_s = sa->sadb_address_prefixlen;
2592 	sel.proto = pfkey_proto_to_xfrm(sa->sadb_address_proto);
2593 	sel.sport = ((struct sockaddr_in *)(sa + 1))->sin_port;
2594 	if (sel.sport)
2595 		sel.sport_mask = htons(0xffff);
2596 
2597 	/* set destination address info of selector */
2598 	sa = ext_hdrs[SADB_EXT_ADDRESS_DST - 1];
2599 	pfkey_sadb_addr2xfrm_addr(sa, &sel.daddr);
2600 	sel.prefixlen_d = sa->sadb_address_prefixlen;
2601 	sel.proto = pfkey_proto_to_xfrm(sa->sadb_address_proto);
2602 	sel.dport = ((struct sockaddr_in *)(sa + 1))->sin_port;
2603 	if (sel.dport)
2604 		sel.dport_mask = htons(0xffff);
2605 
2606 	rq = (struct sadb_x_ipsecrequest *)(pol + 1);
2607 
2608 	/* extract ipsecrequests */
2609 	i = 0;
2610 	len = pol->sadb_x_policy_len * 8 - sizeof(struct sadb_x_policy);
2611 
2612 	while (len > 0 && i < XFRM_MAX_DEPTH) {
2613 		ret = ipsecrequests_to_migrate(rq, len, &m[i]);
2614 		if (ret < 0) {
2615 			err = ret;
2616 			goto out;
2617 		} else {
2618 			rq = (struct sadb_x_ipsecrequest *)((u8 *)rq + ret);
2619 			len -= ret;
2620 			i++;
2621 		}
2622 	}
2623 
2624 	if (!i || len > 0) {
2625 		err = -EINVAL;
2626 		goto out;
2627 	}
2628 
2629 	return xfrm_migrate(&sel, dir, XFRM_POLICY_TYPE_MAIN, m, i,
2630 			    kma ? &k : NULL, net, NULL);
2631 
2632  out:
2633 	return err;
2634 }
2635 #else
2636 static int pfkey_migrate(struct sock *sk, struct sk_buff *skb,
2637 			 const struct sadb_msg *hdr, void * const *ext_hdrs)
2638 {
2639 	return -ENOPROTOOPT;
2640 }
2641 #endif
2642 
2643 
2644 static int pfkey_spdget(struct sock *sk, struct sk_buff *skb, const struct sadb_msg *hdr, void * const *ext_hdrs)
2645 {
2646 	struct net *net = sock_net(sk);
2647 	unsigned int dir;
2648 	int err = 0, delete;
2649 	struct sadb_x_policy *pol;
2650 	struct xfrm_policy *xp;
2651 	struct km_event c;
2652 
2653 	if ((pol = ext_hdrs[SADB_X_EXT_POLICY-1]) == NULL)
2654 		return -EINVAL;
2655 
2656 	dir = xfrm_policy_id2dir(pol->sadb_x_policy_id);
2657 	if (dir >= XFRM_POLICY_MAX)
2658 		return -EINVAL;
2659 
2660 	delete = (hdr->sadb_msg_type == SADB_X_SPDDELETE2);
2661 	xp = xfrm_policy_byid(net, &dummy_mark, 0, XFRM_POLICY_TYPE_MAIN,
2662 			      dir, pol->sadb_x_policy_id, delete, &err);
2663 	if (xp == NULL)
2664 		return -ENOENT;
2665 
2666 	if (delete) {
2667 		xfrm_audit_policy_delete(xp, err ? 0 : 1, true);
2668 
2669 		if (err)
2670 			goto out;
2671 		c.seq = hdr->sadb_msg_seq;
2672 		c.portid = hdr->sadb_msg_pid;
2673 		c.data.byid = 1;
2674 		c.event = XFRM_MSG_DELPOLICY;
2675 		km_policy_notify(xp, dir, &c);
2676 	} else {
2677 		err = key_pol_get_resp(sk, xp, hdr, dir);
2678 	}
2679 
2680 out:
2681 	xfrm_pol_put(xp);
2682 	return err;
2683 }
2684 
2685 static int dump_sp(struct xfrm_policy *xp, int dir, int count, void *ptr)
2686 {
2687 	struct pfkey_sock *pfk = ptr;
2688 	struct sk_buff *out_skb;
2689 	struct sadb_msg *out_hdr;
2690 	int err;
2691 
2692 	if (!pfkey_can_dump(&pfk->sk))
2693 		return -ENOBUFS;
2694 
2695 	out_skb = pfkey_xfrm_policy2msg_prep(xp);
2696 	if (IS_ERR(out_skb))
2697 		return PTR_ERR(out_skb);
2698 
2699 	err = pfkey_xfrm_policy2msg(out_skb, xp, dir);
2700 	if (err < 0) {
2701 		kfree_skb(out_skb);
2702 		return err;
2703 	}
2704 
2705 	out_hdr = (struct sadb_msg *) out_skb->data;
2706 	out_hdr->sadb_msg_version = pfk->dump.msg_version;
2707 	out_hdr->sadb_msg_type = SADB_X_SPDDUMP;
2708 	out_hdr->sadb_msg_satype = SADB_SATYPE_UNSPEC;
2709 	out_hdr->sadb_msg_errno = 0;
2710 	out_hdr->sadb_msg_seq = count + 1;
2711 	out_hdr->sadb_msg_pid = pfk->dump.msg_portid;
2712 
2713 	if (pfk->dump.skb)
2714 		pfkey_broadcast(pfk->dump.skb, GFP_ATOMIC, BROADCAST_ONE,
2715 				&pfk->sk, sock_net(&pfk->sk));
2716 	pfk->dump.skb = out_skb;
2717 
2718 	return 0;
2719 }
2720 
2721 static int pfkey_dump_sp(struct pfkey_sock *pfk)
2722 {
2723 	struct net *net = sock_net(&pfk->sk);
2724 	return xfrm_policy_walk(net, &pfk->dump.u.policy, dump_sp, (void *) pfk);
2725 }
2726 
2727 static void pfkey_dump_sp_done(struct pfkey_sock *pfk)
2728 {
2729 	struct net *net = sock_net((struct sock *)pfk);
2730 
2731 	xfrm_policy_walk_done(&pfk->dump.u.policy, net);
2732 }
2733 
2734 static int pfkey_spddump(struct sock *sk, struct sk_buff *skb, const struct sadb_msg *hdr, void * const *ext_hdrs)
2735 {
2736 	struct pfkey_sock *pfk = pfkey_sk(sk);
2737 
2738 	mutex_lock(&pfk->dump_lock);
2739 	if (pfk->dump.dump != NULL) {
2740 		mutex_unlock(&pfk->dump_lock);
2741 		return -EBUSY;
2742 	}
2743 
2744 	pfk->dump.msg_version = hdr->sadb_msg_version;
2745 	pfk->dump.msg_portid = hdr->sadb_msg_pid;
2746 	pfk->dump.dump = pfkey_dump_sp;
2747 	pfk->dump.done = pfkey_dump_sp_done;
2748 	xfrm_policy_walk_init(&pfk->dump.u.policy, XFRM_POLICY_TYPE_MAIN);
2749 	mutex_unlock(&pfk->dump_lock);
2750 
2751 	return pfkey_do_dump(pfk);
2752 }
2753 
2754 static int key_notify_policy_flush(const struct km_event *c)
2755 {
2756 	struct sk_buff *skb_out;
2757 	struct sadb_msg *hdr;
2758 
2759 	skb_out = alloc_skb(sizeof(struct sadb_msg) + 16, GFP_ATOMIC);
2760 	if (!skb_out)
2761 		return -ENOBUFS;
2762 	hdr = skb_put(skb_out, sizeof(struct sadb_msg));
2763 	hdr->sadb_msg_type = SADB_X_SPDFLUSH;
2764 	hdr->sadb_msg_seq = c->seq;
2765 	hdr->sadb_msg_pid = c->portid;
2766 	hdr->sadb_msg_version = PF_KEY_V2;
2767 	hdr->sadb_msg_errno = (uint8_t) 0;
2768 	hdr->sadb_msg_satype = SADB_SATYPE_UNSPEC;
2769 	hdr->sadb_msg_len = (sizeof(struct sadb_msg) / sizeof(uint64_t));
2770 	hdr->sadb_msg_reserved = 0;
2771 	pfkey_broadcast(skb_out, GFP_ATOMIC, BROADCAST_ALL, NULL, c->net);
2772 	return 0;
2773 
2774 }
2775 
2776 static int pfkey_spdflush(struct sock *sk, struct sk_buff *skb, const struct sadb_msg *hdr, void * const *ext_hdrs)
2777 {
2778 	struct net *net = sock_net(sk);
2779 	struct km_event c;
2780 	int err, err2;
2781 
2782 	err = xfrm_policy_flush(net, XFRM_POLICY_TYPE_MAIN, true);
2783 	err2 = unicast_flush_resp(sk, hdr);
2784 	if (err || err2) {
2785 		if (err == -ESRCH) /* empty table - old silent behavior */
2786 			return 0;
2787 		return err;
2788 	}
2789 
2790 	c.data.type = XFRM_POLICY_TYPE_MAIN;
2791 	c.event = XFRM_MSG_FLUSHPOLICY;
2792 	c.portid = hdr->sadb_msg_pid;
2793 	c.seq = hdr->sadb_msg_seq;
2794 	c.net = net;
2795 	km_policy_notify(NULL, 0, &c);
2796 
2797 	return 0;
2798 }
2799 
2800 typedef int (*pfkey_handler)(struct sock *sk, struct sk_buff *skb,
2801 			     const struct sadb_msg *hdr, void * const *ext_hdrs);
2802 static const pfkey_handler pfkey_funcs[SADB_MAX + 1] = {
2803 	[SADB_RESERVED]		= pfkey_reserved,
2804 	[SADB_GETSPI]		= pfkey_getspi,
2805 	[SADB_UPDATE]		= pfkey_add,
2806 	[SADB_ADD]		= pfkey_add,
2807 	[SADB_DELETE]		= pfkey_delete,
2808 	[SADB_GET]		= pfkey_get,
2809 	[SADB_ACQUIRE]		= pfkey_acquire,
2810 	[SADB_REGISTER]		= pfkey_register,
2811 	[SADB_EXPIRE]		= NULL,
2812 	[SADB_FLUSH]		= pfkey_flush,
2813 	[SADB_DUMP]		= pfkey_dump,
2814 	[SADB_X_PROMISC]	= pfkey_promisc,
2815 	[SADB_X_PCHANGE]	= NULL,
2816 	[SADB_X_SPDUPDATE]	= pfkey_spdadd,
2817 	[SADB_X_SPDADD]		= pfkey_spdadd,
2818 	[SADB_X_SPDDELETE]	= pfkey_spddelete,
2819 	[SADB_X_SPDGET]		= pfkey_spdget,
2820 	[SADB_X_SPDACQUIRE]	= NULL,
2821 	[SADB_X_SPDDUMP]	= pfkey_spddump,
2822 	[SADB_X_SPDFLUSH]	= pfkey_spdflush,
2823 	[SADB_X_SPDSETIDX]	= pfkey_spdadd,
2824 	[SADB_X_SPDDELETE2]	= pfkey_spdget,
2825 	[SADB_X_MIGRATE]	= pfkey_migrate,
2826 };
2827 
2828 static int pfkey_process(struct sock *sk, struct sk_buff *skb, const struct sadb_msg *hdr)
2829 {
2830 	void *ext_hdrs[SADB_EXT_MAX];
2831 	int err;
2832 
2833 	pfkey_broadcast(skb_clone(skb, GFP_KERNEL), GFP_KERNEL,
2834 			BROADCAST_PROMISC_ONLY, NULL, sock_net(sk));
2835 
2836 	memset(ext_hdrs, 0, sizeof(ext_hdrs));
2837 	err = parse_exthdrs(skb, hdr, ext_hdrs);
2838 	if (!err) {
2839 		err = -EOPNOTSUPP;
2840 		if (pfkey_funcs[hdr->sadb_msg_type])
2841 			err = pfkey_funcs[hdr->sadb_msg_type](sk, skb, hdr, ext_hdrs);
2842 	}
2843 	return err;
2844 }
2845 
2846 static struct sadb_msg *pfkey_get_base_msg(struct sk_buff *skb, int *errp)
2847 {
2848 	struct sadb_msg *hdr = NULL;
2849 
2850 	if (skb->len < sizeof(*hdr)) {
2851 		*errp = -EMSGSIZE;
2852 	} else {
2853 		hdr = (struct sadb_msg *) skb->data;
2854 		if (hdr->sadb_msg_version != PF_KEY_V2 ||
2855 		    hdr->sadb_msg_reserved != 0 ||
2856 		    (hdr->sadb_msg_type <= SADB_RESERVED ||
2857 		     hdr->sadb_msg_type > SADB_MAX)) {
2858 			hdr = NULL;
2859 			*errp = -EINVAL;
2860 		} else if (hdr->sadb_msg_len != (skb->len /
2861 						 sizeof(uint64_t)) ||
2862 			   hdr->sadb_msg_len < (sizeof(struct sadb_msg) /
2863 						sizeof(uint64_t))) {
2864 			hdr = NULL;
2865 			*errp = -EMSGSIZE;
2866 		} else {
2867 			*errp = 0;
2868 		}
2869 	}
2870 	return hdr;
2871 }
2872 
2873 static inline int aalg_tmpl_set(const struct xfrm_tmpl *t,
2874 				const struct xfrm_algo_desc *d)
2875 {
2876 	unsigned int id = d->desc.sadb_alg_id;
2877 
2878 	if (id >= sizeof(t->aalgos) * 8)
2879 		return 0;
2880 
2881 	return (t->aalgos >> id) & 1;
2882 }
2883 
2884 static inline int ealg_tmpl_set(const struct xfrm_tmpl *t,
2885 				const struct xfrm_algo_desc *d)
2886 {
2887 	unsigned int id = d->desc.sadb_alg_id;
2888 
2889 	if (id >= sizeof(t->ealgos) * 8)
2890 		return 0;
2891 
2892 	return (t->ealgos >> id) & 1;
2893 }
2894 
2895 static int count_ah_combs(const struct xfrm_tmpl *t)
2896 {
2897 	int i, sz = 0;
2898 
2899 	for (i = 0; ; i++) {
2900 		const struct xfrm_algo_desc *aalg = xfrm_aalg_get_byidx(i);
2901 		if (!aalg)
2902 			break;
2903 		if (!aalg->pfkey_supported)
2904 			continue;
2905 		if (aalg_tmpl_set(t, aalg) && aalg->available)
2906 			sz += sizeof(struct sadb_comb);
2907 	}
2908 	return sz + sizeof(struct sadb_prop);
2909 }
2910 
2911 static int count_esp_combs(const struct xfrm_tmpl *t)
2912 {
2913 	int i, k, sz = 0;
2914 
2915 	for (i = 0; ; i++) {
2916 		const struct xfrm_algo_desc *ealg = xfrm_ealg_get_byidx(i);
2917 		if (!ealg)
2918 			break;
2919 
2920 		if (!ealg->pfkey_supported)
2921 			continue;
2922 
2923 		if (!(ealg_tmpl_set(t, ealg) && ealg->available))
2924 			continue;
2925 
2926 		for (k = 1; ; k++) {
2927 			const struct xfrm_algo_desc *aalg = xfrm_aalg_get_byidx(k);
2928 			if (!aalg)
2929 				break;
2930 
2931 			if (!aalg->pfkey_supported)
2932 				continue;
2933 
2934 			if (aalg_tmpl_set(t, aalg) && aalg->available)
2935 				sz += sizeof(struct sadb_comb);
2936 		}
2937 	}
2938 	return sz + sizeof(struct sadb_prop);
2939 }
2940 
2941 static void dump_ah_combs(struct sk_buff *skb, const struct xfrm_tmpl *t)
2942 {
2943 	struct sadb_prop *p;
2944 	int i;
2945 
2946 	p = skb_put(skb, sizeof(struct sadb_prop));
2947 	p->sadb_prop_len = sizeof(struct sadb_prop)/8;
2948 	p->sadb_prop_exttype = SADB_EXT_PROPOSAL;
2949 	p->sadb_prop_replay = 32;
2950 	memset(p->sadb_prop_reserved, 0, sizeof(p->sadb_prop_reserved));
2951 
2952 	for (i = 0; ; i++) {
2953 		const struct xfrm_algo_desc *aalg = xfrm_aalg_get_byidx(i);
2954 		if (!aalg)
2955 			break;
2956 
2957 		if (!aalg->pfkey_supported)
2958 			continue;
2959 
2960 		if (aalg_tmpl_set(t, aalg) && aalg->available) {
2961 			struct sadb_comb *c;
2962 			c = skb_put_zero(skb, sizeof(struct sadb_comb));
2963 			p->sadb_prop_len += sizeof(struct sadb_comb)/8;
2964 			c->sadb_comb_auth = aalg->desc.sadb_alg_id;
2965 			c->sadb_comb_auth_minbits = aalg->desc.sadb_alg_minbits;
2966 			c->sadb_comb_auth_maxbits = aalg->desc.sadb_alg_maxbits;
2967 			c->sadb_comb_hard_addtime = 24*60*60;
2968 			c->sadb_comb_soft_addtime = 20*60*60;
2969 			c->sadb_comb_hard_usetime = 8*60*60;
2970 			c->sadb_comb_soft_usetime = 7*60*60;
2971 		}
2972 	}
2973 }
2974 
2975 static void dump_esp_combs(struct sk_buff *skb, const struct xfrm_tmpl *t)
2976 {
2977 	struct sadb_prop *p;
2978 	int i, k;
2979 
2980 	p = skb_put(skb, sizeof(struct sadb_prop));
2981 	p->sadb_prop_len = sizeof(struct sadb_prop)/8;
2982 	p->sadb_prop_exttype = SADB_EXT_PROPOSAL;
2983 	p->sadb_prop_replay = 32;
2984 	memset(p->sadb_prop_reserved, 0, sizeof(p->sadb_prop_reserved));
2985 
2986 	for (i=0; ; i++) {
2987 		const struct xfrm_algo_desc *ealg = xfrm_ealg_get_byidx(i);
2988 		if (!ealg)
2989 			break;
2990 
2991 		if (!ealg->pfkey_supported)
2992 			continue;
2993 
2994 		if (!(ealg_tmpl_set(t, ealg) && ealg->available))
2995 			continue;
2996 
2997 		for (k = 1; ; k++) {
2998 			struct sadb_comb *c;
2999 			const struct xfrm_algo_desc *aalg = xfrm_aalg_get_byidx(k);
3000 			if (!aalg)
3001 				break;
3002 			if (!aalg->pfkey_supported)
3003 				continue;
3004 			if (!(aalg_tmpl_set(t, aalg) && aalg->available))
3005 				continue;
3006 			c = skb_put(skb, sizeof(struct sadb_comb));
3007 			memset(c, 0, sizeof(*c));
3008 			p->sadb_prop_len += sizeof(struct sadb_comb)/8;
3009 			c->sadb_comb_auth = aalg->desc.sadb_alg_id;
3010 			c->sadb_comb_auth_minbits = aalg->desc.sadb_alg_minbits;
3011 			c->sadb_comb_auth_maxbits = aalg->desc.sadb_alg_maxbits;
3012 			c->sadb_comb_encrypt = ealg->desc.sadb_alg_id;
3013 			c->sadb_comb_encrypt_minbits = ealg->desc.sadb_alg_minbits;
3014 			c->sadb_comb_encrypt_maxbits = ealg->desc.sadb_alg_maxbits;
3015 			c->sadb_comb_hard_addtime = 24*60*60;
3016 			c->sadb_comb_soft_addtime = 20*60*60;
3017 			c->sadb_comb_hard_usetime = 8*60*60;
3018 			c->sadb_comb_soft_usetime = 7*60*60;
3019 		}
3020 	}
3021 }
3022 
3023 static int key_notify_policy_expire(struct xfrm_policy *xp, const struct km_event *c)
3024 {
3025 	return 0;
3026 }
3027 
3028 static int key_notify_sa_expire(struct xfrm_state *x, const struct km_event *c)
3029 {
3030 	struct sk_buff *out_skb;
3031 	struct sadb_msg *out_hdr;
3032 	int hard;
3033 	int hsc;
3034 
3035 	hard = c->data.hard;
3036 	if (hard)
3037 		hsc = 2;
3038 	else
3039 		hsc = 1;
3040 
3041 	out_skb = pfkey_xfrm_state2msg_expire(x, hsc);
3042 	if (IS_ERR(out_skb))
3043 		return PTR_ERR(out_skb);
3044 
3045 	out_hdr = (struct sadb_msg *) out_skb->data;
3046 	out_hdr->sadb_msg_version = PF_KEY_V2;
3047 	out_hdr->sadb_msg_type = SADB_EXPIRE;
3048 	out_hdr->sadb_msg_satype = pfkey_proto2satype(x->id.proto);
3049 	out_hdr->sadb_msg_errno = 0;
3050 	out_hdr->sadb_msg_reserved = 0;
3051 	out_hdr->sadb_msg_seq = 0;
3052 	out_hdr->sadb_msg_pid = 0;
3053 
3054 	pfkey_broadcast(out_skb, GFP_ATOMIC, BROADCAST_REGISTERED, NULL,
3055 			xs_net(x));
3056 	return 0;
3057 }
3058 
3059 static int pfkey_send_notify(struct xfrm_state *x, const struct km_event *c)
3060 {
3061 	struct net *net = x ? xs_net(x) : c->net;
3062 	struct netns_pfkey *net_pfkey = net_generic(net, pfkey_net_id);
3063 
3064 	if (atomic_read(&net_pfkey->socks_nr) == 0)
3065 		return 0;
3066 
3067 	switch (c->event) {
3068 	case XFRM_MSG_EXPIRE:
3069 		return key_notify_sa_expire(x, c);
3070 	case XFRM_MSG_DELSA:
3071 	case XFRM_MSG_NEWSA:
3072 	case XFRM_MSG_UPDSA:
3073 		return key_notify_sa(x, c);
3074 	case XFRM_MSG_FLUSHSA:
3075 		return key_notify_sa_flush(c);
3076 	case XFRM_MSG_NEWAE: /* not yet supported */
3077 		break;
3078 	default:
3079 		pr_err("pfkey: Unknown SA event %d\n", c->event);
3080 		break;
3081 	}
3082 
3083 	return 0;
3084 }
3085 
3086 static int pfkey_send_policy_notify(struct xfrm_policy *xp, int dir, const struct km_event *c)
3087 {
3088 	if (xp && xp->type != XFRM_POLICY_TYPE_MAIN)
3089 		return 0;
3090 
3091 	switch (c->event) {
3092 	case XFRM_MSG_POLEXPIRE:
3093 		return key_notify_policy_expire(xp, c);
3094 	case XFRM_MSG_DELPOLICY:
3095 	case XFRM_MSG_NEWPOLICY:
3096 	case XFRM_MSG_UPDPOLICY:
3097 		return key_notify_policy(xp, dir, c);
3098 	case XFRM_MSG_FLUSHPOLICY:
3099 		if (c->data.type != XFRM_POLICY_TYPE_MAIN)
3100 			break;
3101 		return key_notify_policy_flush(c);
3102 	default:
3103 		pr_err("pfkey: Unknown policy event %d\n", c->event);
3104 		break;
3105 	}
3106 
3107 	return 0;
3108 }
3109 
3110 static u32 get_acqseq(void)
3111 {
3112 	u32 res;
3113 	static atomic_t acqseq;
3114 
3115 	do {
3116 		res = atomic_inc_return(&acqseq);
3117 	} while (!res);
3118 	return res;
3119 }
3120 
3121 static bool pfkey_is_alive(const struct km_event *c)
3122 {
3123 	struct netns_pfkey *net_pfkey = net_generic(c->net, pfkey_net_id);
3124 	struct sock *sk;
3125 	bool is_alive = false;
3126 
3127 	rcu_read_lock();
3128 	sk_for_each_rcu(sk, &net_pfkey->table) {
3129 		if (pfkey_sk(sk)->registered) {
3130 			is_alive = true;
3131 			break;
3132 		}
3133 	}
3134 	rcu_read_unlock();
3135 
3136 	return is_alive;
3137 }
3138 
3139 static int pfkey_send_acquire(struct xfrm_state *x, struct xfrm_tmpl *t, struct xfrm_policy *xp)
3140 {
3141 	struct sk_buff *skb;
3142 	struct sadb_msg *hdr;
3143 	struct sadb_address *addr;
3144 	struct sadb_x_policy *pol;
3145 	int sockaddr_size;
3146 	int size;
3147 	struct sadb_x_sec_ctx *sec_ctx;
3148 	struct xfrm_sec_ctx *xfrm_ctx;
3149 	int ctx_size = 0;
3150 
3151 	sockaddr_size = pfkey_sockaddr_size(x->props.family);
3152 	if (!sockaddr_size)
3153 		return -EINVAL;
3154 
3155 	size = sizeof(struct sadb_msg) +
3156 		(sizeof(struct sadb_address) * 2) +
3157 		(sockaddr_size * 2) +
3158 		sizeof(struct sadb_x_policy);
3159 
3160 	if (x->id.proto == IPPROTO_AH)
3161 		size += count_ah_combs(t);
3162 	else if (x->id.proto == IPPROTO_ESP)
3163 		size += count_esp_combs(t);
3164 
3165 	if ((xfrm_ctx = x->security)) {
3166 		ctx_size = PFKEY_ALIGN8(xfrm_ctx->ctx_len);
3167 		size +=  sizeof(struct sadb_x_sec_ctx) + ctx_size;
3168 	}
3169 
3170 	skb =  alloc_skb(size + 16, GFP_ATOMIC);
3171 	if (skb == NULL)
3172 		return -ENOMEM;
3173 
3174 	hdr = skb_put(skb, sizeof(struct sadb_msg));
3175 	hdr->sadb_msg_version = PF_KEY_V2;
3176 	hdr->sadb_msg_type = SADB_ACQUIRE;
3177 	hdr->sadb_msg_satype = pfkey_proto2satype(x->id.proto);
3178 	hdr->sadb_msg_len = size / sizeof(uint64_t);
3179 	hdr->sadb_msg_errno = 0;
3180 	hdr->sadb_msg_reserved = 0;
3181 	hdr->sadb_msg_seq = x->km.seq = get_acqseq();
3182 	hdr->sadb_msg_pid = 0;
3183 
3184 	/* src address */
3185 	addr = skb_put(skb, sizeof(struct sadb_address) + sockaddr_size);
3186 	addr->sadb_address_len =
3187 		(sizeof(struct sadb_address)+sockaddr_size)/
3188 			sizeof(uint64_t);
3189 	addr->sadb_address_exttype = SADB_EXT_ADDRESS_SRC;
3190 	addr->sadb_address_proto = 0;
3191 	addr->sadb_address_reserved = 0;
3192 	addr->sadb_address_prefixlen =
3193 		pfkey_sockaddr_fill(&x->props.saddr, 0,
3194 				    (struct sockaddr *) (addr + 1),
3195 				    x->props.family);
3196 	if (!addr->sadb_address_prefixlen)
3197 		BUG();
3198 
3199 	/* dst address */
3200 	addr = skb_put(skb, sizeof(struct sadb_address) + sockaddr_size);
3201 	addr->sadb_address_len =
3202 		(sizeof(struct sadb_address)+sockaddr_size)/
3203 			sizeof(uint64_t);
3204 	addr->sadb_address_exttype = SADB_EXT_ADDRESS_DST;
3205 	addr->sadb_address_proto = 0;
3206 	addr->sadb_address_reserved = 0;
3207 	addr->sadb_address_prefixlen =
3208 		pfkey_sockaddr_fill(&x->id.daddr, 0,
3209 				    (struct sockaddr *) (addr + 1),
3210 				    x->props.family);
3211 	if (!addr->sadb_address_prefixlen)
3212 		BUG();
3213 
3214 	pol = skb_put(skb, sizeof(struct sadb_x_policy));
3215 	pol->sadb_x_policy_len = sizeof(struct sadb_x_policy)/sizeof(uint64_t);
3216 	pol->sadb_x_policy_exttype = SADB_X_EXT_POLICY;
3217 	pol->sadb_x_policy_type = IPSEC_POLICY_IPSEC;
3218 	pol->sadb_x_policy_dir = XFRM_POLICY_OUT + 1;
3219 	pol->sadb_x_policy_reserved = 0;
3220 	pol->sadb_x_policy_id = xp->index;
3221 	pol->sadb_x_policy_priority = xp->priority;
3222 
3223 	/* Set sadb_comb's. */
3224 	if (x->id.proto == IPPROTO_AH)
3225 		dump_ah_combs(skb, t);
3226 	else if (x->id.proto == IPPROTO_ESP)
3227 		dump_esp_combs(skb, t);
3228 
3229 	/* security context */
3230 	if (xfrm_ctx) {
3231 		sec_ctx = skb_put(skb,
3232 				  sizeof(struct sadb_x_sec_ctx) + ctx_size);
3233 		sec_ctx->sadb_x_sec_len =
3234 		  (sizeof(struct sadb_x_sec_ctx) + ctx_size) / sizeof(uint64_t);
3235 		sec_ctx->sadb_x_sec_exttype = SADB_X_EXT_SEC_CTX;
3236 		sec_ctx->sadb_x_ctx_doi = xfrm_ctx->ctx_doi;
3237 		sec_ctx->sadb_x_ctx_alg = xfrm_ctx->ctx_alg;
3238 		sec_ctx->sadb_x_ctx_len = xfrm_ctx->ctx_len;
3239 		memcpy(sec_ctx + 1, xfrm_ctx->ctx_str,
3240 		       xfrm_ctx->ctx_len);
3241 	}
3242 
3243 	return pfkey_broadcast(skb, GFP_ATOMIC, BROADCAST_REGISTERED, NULL,
3244 			       xs_net(x));
3245 }
3246 
3247 static struct xfrm_policy *pfkey_compile_policy(struct sock *sk, int opt,
3248 						u8 *data, int len, int *dir)
3249 {
3250 	struct net *net = sock_net(sk);
3251 	struct xfrm_policy *xp;
3252 	struct sadb_x_policy *pol = (struct sadb_x_policy*)data;
3253 	struct sadb_x_sec_ctx *sec_ctx;
3254 
3255 	switch (sk->sk_family) {
3256 	case AF_INET:
3257 		if (opt != IP_IPSEC_POLICY) {
3258 			*dir = -EOPNOTSUPP;
3259 			return NULL;
3260 		}
3261 		break;
3262 #if IS_ENABLED(CONFIG_IPV6)
3263 	case AF_INET6:
3264 		if (opt != IPV6_IPSEC_POLICY) {
3265 			*dir = -EOPNOTSUPP;
3266 			return NULL;
3267 		}
3268 		break;
3269 #endif
3270 	default:
3271 		*dir = -EINVAL;
3272 		return NULL;
3273 	}
3274 
3275 	*dir = -EINVAL;
3276 
3277 	if (len < sizeof(struct sadb_x_policy) ||
3278 	    pol->sadb_x_policy_len*8 > len ||
3279 	    pol->sadb_x_policy_type > IPSEC_POLICY_BYPASS ||
3280 	    (!pol->sadb_x_policy_dir || pol->sadb_x_policy_dir > IPSEC_DIR_OUTBOUND))
3281 		return NULL;
3282 
3283 	xp = xfrm_policy_alloc(net, GFP_ATOMIC);
3284 	if (xp == NULL) {
3285 		*dir = -ENOBUFS;
3286 		return NULL;
3287 	}
3288 
3289 	xp->action = (pol->sadb_x_policy_type == IPSEC_POLICY_DISCARD ?
3290 		      XFRM_POLICY_BLOCK : XFRM_POLICY_ALLOW);
3291 
3292 	xp->lft.soft_byte_limit = XFRM_INF;
3293 	xp->lft.hard_byte_limit = XFRM_INF;
3294 	xp->lft.soft_packet_limit = XFRM_INF;
3295 	xp->lft.hard_packet_limit = XFRM_INF;
3296 	xp->family = sk->sk_family;
3297 
3298 	xp->xfrm_nr = 0;
3299 	if (pol->sadb_x_policy_type == IPSEC_POLICY_IPSEC &&
3300 	    (*dir = parse_ipsecrequests(xp, pol)) < 0)
3301 		goto out;
3302 
3303 	/* security context too */
3304 	if (len >= (pol->sadb_x_policy_len*8 +
3305 	    sizeof(struct sadb_x_sec_ctx))) {
3306 		char *p = (char *)pol;
3307 		struct xfrm_user_sec_ctx *uctx;
3308 
3309 		p += pol->sadb_x_policy_len*8;
3310 		sec_ctx = (struct sadb_x_sec_ctx *)p;
3311 		if (len < pol->sadb_x_policy_len*8 +
3312 		    sec_ctx->sadb_x_sec_len*8) {
3313 			*dir = -EINVAL;
3314 			goto out;
3315 		}
3316 		if ((*dir = verify_sec_ctx_len(p)))
3317 			goto out;
3318 		uctx = pfkey_sadb2xfrm_user_sec_ctx(sec_ctx, GFP_ATOMIC);
3319 		*dir = security_xfrm_policy_alloc(&xp->security, uctx, GFP_ATOMIC);
3320 		kfree(uctx);
3321 
3322 		if (*dir)
3323 			goto out;
3324 	}
3325 
3326 	*dir = pol->sadb_x_policy_dir-1;
3327 	return xp;
3328 
3329 out:
3330 	xp->walk.dead = 1;
3331 	xfrm_policy_destroy(xp);
3332 	return NULL;
3333 }
3334 
3335 static int pfkey_send_new_mapping(struct xfrm_state *x, xfrm_address_t *ipaddr, __be16 sport)
3336 {
3337 	struct sk_buff *skb;
3338 	struct sadb_msg *hdr;
3339 	struct sadb_sa *sa;
3340 	struct sadb_address *addr;
3341 	struct sadb_x_nat_t_port *n_port;
3342 	int sockaddr_size;
3343 	int size;
3344 	__u8 satype = (x->id.proto == IPPROTO_ESP ? SADB_SATYPE_ESP : 0);
3345 	struct xfrm_encap_tmpl *natt = NULL;
3346 
3347 	sockaddr_size = pfkey_sockaddr_size(x->props.family);
3348 	if (!sockaddr_size)
3349 		return -EINVAL;
3350 
3351 	if (!satype)
3352 		return -EINVAL;
3353 
3354 	if (!x->encap)
3355 		return -EINVAL;
3356 
3357 	natt = x->encap;
3358 
3359 	/* Build an SADB_X_NAT_T_NEW_MAPPING message:
3360 	 *
3361 	 * HDR | SA | ADDRESS_SRC (old addr) | NAT_T_SPORT (old port) |
3362 	 * ADDRESS_DST (new addr) | NAT_T_DPORT (new port)
3363 	 */
3364 
3365 	size = sizeof(struct sadb_msg) +
3366 		sizeof(struct sadb_sa) +
3367 		(sizeof(struct sadb_address) * 2) +
3368 		(sockaddr_size * 2) +
3369 		(sizeof(struct sadb_x_nat_t_port) * 2);
3370 
3371 	skb =  alloc_skb(size + 16, GFP_ATOMIC);
3372 	if (skb == NULL)
3373 		return -ENOMEM;
3374 
3375 	hdr = skb_put(skb, sizeof(struct sadb_msg));
3376 	hdr->sadb_msg_version = PF_KEY_V2;
3377 	hdr->sadb_msg_type = SADB_X_NAT_T_NEW_MAPPING;
3378 	hdr->sadb_msg_satype = satype;
3379 	hdr->sadb_msg_len = size / sizeof(uint64_t);
3380 	hdr->sadb_msg_errno = 0;
3381 	hdr->sadb_msg_reserved = 0;
3382 	hdr->sadb_msg_seq = x->km.seq = get_acqseq();
3383 	hdr->sadb_msg_pid = 0;
3384 
3385 	/* SA */
3386 	sa = skb_put(skb, sizeof(struct sadb_sa));
3387 	sa->sadb_sa_len = sizeof(struct sadb_sa)/sizeof(uint64_t);
3388 	sa->sadb_sa_exttype = SADB_EXT_SA;
3389 	sa->sadb_sa_spi = x->id.spi;
3390 	sa->sadb_sa_replay = 0;
3391 	sa->sadb_sa_state = 0;
3392 	sa->sadb_sa_auth = 0;
3393 	sa->sadb_sa_encrypt = 0;
3394 	sa->sadb_sa_flags = 0;
3395 
3396 	/* ADDRESS_SRC (old addr) */
3397 	addr = skb_put(skb, sizeof(struct sadb_address) + sockaddr_size);
3398 	addr->sadb_address_len =
3399 		(sizeof(struct sadb_address)+sockaddr_size)/
3400 			sizeof(uint64_t);
3401 	addr->sadb_address_exttype = SADB_EXT_ADDRESS_SRC;
3402 	addr->sadb_address_proto = 0;
3403 	addr->sadb_address_reserved = 0;
3404 	addr->sadb_address_prefixlen =
3405 		pfkey_sockaddr_fill(&x->props.saddr, 0,
3406 				    (struct sockaddr *) (addr + 1),
3407 				    x->props.family);
3408 	if (!addr->sadb_address_prefixlen)
3409 		BUG();
3410 
3411 	/* NAT_T_SPORT (old port) */
3412 	n_port = skb_put(skb, sizeof(*n_port));
3413 	n_port->sadb_x_nat_t_port_len = sizeof(*n_port)/sizeof(uint64_t);
3414 	n_port->sadb_x_nat_t_port_exttype = SADB_X_EXT_NAT_T_SPORT;
3415 	n_port->sadb_x_nat_t_port_port = natt->encap_sport;
3416 	n_port->sadb_x_nat_t_port_reserved = 0;
3417 
3418 	/* ADDRESS_DST (new addr) */
3419 	addr = skb_put(skb, sizeof(struct sadb_address) + sockaddr_size);
3420 	addr->sadb_address_len =
3421 		(sizeof(struct sadb_address)+sockaddr_size)/
3422 			sizeof(uint64_t);
3423 	addr->sadb_address_exttype = SADB_EXT_ADDRESS_DST;
3424 	addr->sadb_address_proto = 0;
3425 	addr->sadb_address_reserved = 0;
3426 	addr->sadb_address_prefixlen =
3427 		pfkey_sockaddr_fill(ipaddr, 0,
3428 				    (struct sockaddr *) (addr + 1),
3429 				    x->props.family);
3430 	if (!addr->sadb_address_prefixlen)
3431 		BUG();
3432 
3433 	/* NAT_T_DPORT (new port) */
3434 	n_port = skb_put(skb, sizeof(*n_port));
3435 	n_port->sadb_x_nat_t_port_len = sizeof(*n_port)/sizeof(uint64_t);
3436 	n_port->sadb_x_nat_t_port_exttype = SADB_X_EXT_NAT_T_DPORT;
3437 	n_port->sadb_x_nat_t_port_port = sport;
3438 	n_port->sadb_x_nat_t_port_reserved = 0;
3439 
3440 	return pfkey_broadcast(skb, GFP_ATOMIC, BROADCAST_REGISTERED, NULL,
3441 			       xs_net(x));
3442 }
3443 
3444 #ifdef CONFIG_NET_KEY_MIGRATE
3445 static int set_sadb_address(struct sk_buff *skb, int sasize, int type,
3446 			    const struct xfrm_selector *sel)
3447 {
3448 	struct sadb_address *addr;
3449 	addr = skb_put(skb, sizeof(struct sadb_address) + sasize);
3450 	addr->sadb_address_len = (sizeof(struct sadb_address) + sasize)/8;
3451 	addr->sadb_address_exttype = type;
3452 	addr->sadb_address_proto = sel->proto;
3453 	addr->sadb_address_reserved = 0;
3454 
3455 	switch (type) {
3456 	case SADB_EXT_ADDRESS_SRC:
3457 		addr->sadb_address_prefixlen = sel->prefixlen_s;
3458 		pfkey_sockaddr_fill(&sel->saddr, 0,
3459 				    (struct sockaddr *)(addr + 1),
3460 				    sel->family);
3461 		break;
3462 	case SADB_EXT_ADDRESS_DST:
3463 		addr->sadb_address_prefixlen = sel->prefixlen_d;
3464 		pfkey_sockaddr_fill(&sel->daddr, 0,
3465 				    (struct sockaddr *)(addr + 1),
3466 				    sel->family);
3467 		break;
3468 	default:
3469 		return -EINVAL;
3470 	}
3471 
3472 	return 0;
3473 }
3474 
3475 
3476 static int set_sadb_kmaddress(struct sk_buff *skb, const struct xfrm_kmaddress *k)
3477 {
3478 	struct sadb_x_kmaddress *kma;
3479 	u8 *sa;
3480 	int family = k->family;
3481 	int socklen = pfkey_sockaddr_len(family);
3482 	int size_req;
3483 
3484 	size_req = (sizeof(struct sadb_x_kmaddress) +
3485 		    pfkey_sockaddr_pair_size(family));
3486 
3487 	kma = skb_put_zero(skb, size_req);
3488 	kma->sadb_x_kmaddress_len = size_req / 8;
3489 	kma->sadb_x_kmaddress_exttype = SADB_X_EXT_KMADDRESS;
3490 	kma->sadb_x_kmaddress_reserved = k->reserved;
3491 
3492 	sa = (u8 *)(kma + 1);
3493 	if (!pfkey_sockaddr_fill(&k->local, 0, (struct sockaddr *)sa, family) ||
3494 	    !pfkey_sockaddr_fill(&k->remote, 0, (struct sockaddr *)(sa+socklen), family))
3495 		return -EINVAL;
3496 
3497 	return 0;
3498 }
3499 
3500 static int set_ipsecrequest(struct sk_buff *skb,
3501 			    uint8_t proto, uint8_t mode, int level,
3502 			    uint32_t reqid, uint8_t family,
3503 			    const xfrm_address_t *src, const xfrm_address_t *dst)
3504 {
3505 	struct sadb_x_ipsecrequest *rq;
3506 	u8 *sa;
3507 	int socklen = pfkey_sockaddr_len(family);
3508 	int size_req;
3509 
3510 	size_req = sizeof(struct sadb_x_ipsecrequest) +
3511 		   pfkey_sockaddr_pair_size(family);
3512 
3513 	rq = skb_put_zero(skb, size_req);
3514 	rq->sadb_x_ipsecrequest_len = size_req;
3515 	rq->sadb_x_ipsecrequest_proto = proto;
3516 	rq->sadb_x_ipsecrequest_mode = mode;
3517 	rq->sadb_x_ipsecrequest_level = level;
3518 	rq->sadb_x_ipsecrequest_reqid = reqid;
3519 
3520 	sa = (u8 *) (rq + 1);
3521 	if (!pfkey_sockaddr_fill(src, 0, (struct sockaddr *)sa, family) ||
3522 	    !pfkey_sockaddr_fill(dst, 0, (struct sockaddr *)(sa + socklen), family))
3523 		return -EINVAL;
3524 
3525 	return 0;
3526 }
3527 #endif
3528 
3529 #ifdef CONFIG_NET_KEY_MIGRATE
3530 static int pfkey_send_migrate(const struct xfrm_selector *sel, u8 dir, u8 type,
3531 			      const struct xfrm_migrate *m, int num_bundles,
3532 			      const struct xfrm_kmaddress *k,
3533 			      const struct xfrm_encap_tmpl *encap)
3534 {
3535 	int i;
3536 	int sasize_sel;
3537 	int size = 0;
3538 	int size_pol = 0;
3539 	struct sk_buff *skb;
3540 	struct sadb_msg *hdr;
3541 	struct sadb_x_policy *pol;
3542 	const struct xfrm_migrate *mp;
3543 
3544 	if (type != XFRM_POLICY_TYPE_MAIN)
3545 		return 0;
3546 
3547 	if (num_bundles <= 0 || num_bundles > XFRM_MAX_DEPTH)
3548 		return -EINVAL;
3549 
3550 	if (k != NULL) {
3551 		/* addresses for KM */
3552 		size += PFKEY_ALIGN8(sizeof(struct sadb_x_kmaddress) +
3553 				     pfkey_sockaddr_pair_size(k->family));
3554 	}
3555 
3556 	/* selector */
3557 	sasize_sel = pfkey_sockaddr_size(sel->family);
3558 	if (!sasize_sel)
3559 		return -EINVAL;
3560 	size += (sizeof(struct sadb_address) + sasize_sel) * 2;
3561 
3562 	/* policy info */
3563 	size_pol += sizeof(struct sadb_x_policy);
3564 
3565 	/* ipsecrequests */
3566 	for (i = 0, mp = m; i < num_bundles; i++, mp++) {
3567 		/* old locator pair */
3568 		size_pol += sizeof(struct sadb_x_ipsecrequest) +
3569 			    pfkey_sockaddr_pair_size(mp->old_family);
3570 		/* new locator pair */
3571 		size_pol += sizeof(struct sadb_x_ipsecrequest) +
3572 			    pfkey_sockaddr_pair_size(mp->new_family);
3573 	}
3574 
3575 	size += sizeof(struct sadb_msg) + size_pol;
3576 
3577 	/* alloc buffer */
3578 	skb = alloc_skb(size, GFP_ATOMIC);
3579 	if (skb == NULL)
3580 		return -ENOMEM;
3581 
3582 	hdr = skb_put(skb, sizeof(struct sadb_msg));
3583 	hdr->sadb_msg_version = PF_KEY_V2;
3584 	hdr->sadb_msg_type = SADB_X_MIGRATE;
3585 	hdr->sadb_msg_satype = pfkey_proto2satype(m->proto);
3586 	hdr->sadb_msg_len = size / 8;
3587 	hdr->sadb_msg_errno = 0;
3588 	hdr->sadb_msg_reserved = 0;
3589 	hdr->sadb_msg_seq = 0;
3590 	hdr->sadb_msg_pid = 0;
3591 
3592 	/* Addresses to be used by KM for negotiation, if ext is available */
3593 	if (k != NULL && (set_sadb_kmaddress(skb, k) < 0))
3594 		goto err;
3595 
3596 	/* selector src */
3597 	set_sadb_address(skb, sasize_sel, SADB_EXT_ADDRESS_SRC, sel);
3598 
3599 	/* selector dst */
3600 	set_sadb_address(skb, sasize_sel, SADB_EXT_ADDRESS_DST, sel);
3601 
3602 	/* policy information */
3603 	pol = skb_put(skb, sizeof(struct sadb_x_policy));
3604 	pol->sadb_x_policy_len = size_pol / 8;
3605 	pol->sadb_x_policy_exttype = SADB_X_EXT_POLICY;
3606 	pol->sadb_x_policy_type = IPSEC_POLICY_IPSEC;
3607 	pol->sadb_x_policy_dir = dir + 1;
3608 	pol->sadb_x_policy_reserved = 0;
3609 	pol->sadb_x_policy_id = 0;
3610 	pol->sadb_x_policy_priority = 0;
3611 
3612 	for (i = 0, mp = m; i < num_bundles; i++, mp++) {
3613 		/* old ipsecrequest */
3614 		int mode = pfkey_mode_from_xfrm(mp->mode);
3615 		if (mode < 0)
3616 			goto err;
3617 		if (set_ipsecrequest(skb, mp->proto, mode,
3618 				     (mp->reqid ?  IPSEC_LEVEL_UNIQUE : IPSEC_LEVEL_REQUIRE),
3619 				     mp->reqid, mp->old_family,
3620 				     &mp->old_saddr, &mp->old_daddr) < 0)
3621 			goto err;
3622 
3623 		/* new ipsecrequest */
3624 		if (set_ipsecrequest(skb, mp->proto, mode,
3625 				     (mp->reqid ? IPSEC_LEVEL_UNIQUE : IPSEC_LEVEL_REQUIRE),
3626 				     mp->reqid, mp->new_family,
3627 				     &mp->new_saddr, &mp->new_daddr) < 0)
3628 			goto err;
3629 	}
3630 
3631 	/* broadcast migrate message to sockets */
3632 	pfkey_broadcast(skb, GFP_ATOMIC, BROADCAST_ALL, NULL, &init_net);
3633 
3634 	return 0;
3635 
3636 err:
3637 	kfree_skb(skb);
3638 	return -EINVAL;
3639 }
3640 #else
3641 static int pfkey_send_migrate(const struct xfrm_selector *sel, u8 dir, u8 type,
3642 			      const struct xfrm_migrate *m, int num_bundles,
3643 			      const struct xfrm_kmaddress *k,
3644 			      const struct xfrm_encap_tmpl *encap)
3645 {
3646 	return -ENOPROTOOPT;
3647 }
3648 #endif
3649 
3650 static int pfkey_sendmsg(struct socket *sock, struct msghdr *msg, size_t len)
3651 {
3652 	struct sock *sk = sock->sk;
3653 	struct sk_buff *skb = NULL;
3654 	struct sadb_msg *hdr = NULL;
3655 	int err;
3656 	struct net *net = sock_net(sk);
3657 
3658 	err = -EOPNOTSUPP;
3659 	if (msg->msg_flags & MSG_OOB)
3660 		goto out;
3661 
3662 	err = -EMSGSIZE;
3663 	if ((unsigned int)len > sk->sk_sndbuf - 32)
3664 		goto out;
3665 
3666 	err = -ENOBUFS;
3667 	skb = alloc_skb(len, GFP_KERNEL);
3668 	if (skb == NULL)
3669 		goto out;
3670 
3671 	err = -EFAULT;
3672 	if (memcpy_from_msg(skb_put(skb,len), msg, len))
3673 		goto out;
3674 
3675 	hdr = pfkey_get_base_msg(skb, &err);
3676 	if (!hdr)
3677 		goto out;
3678 
3679 	mutex_lock(&net->xfrm.xfrm_cfg_mutex);
3680 	err = pfkey_process(sk, skb, hdr);
3681 	mutex_unlock(&net->xfrm.xfrm_cfg_mutex);
3682 
3683 out:
3684 	if (err && hdr && pfkey_error(hdr, err, sk) == 0)
3685 		err = 0;
3686 	kfree_skb(skb);
3687 
3688 	return err ? : len;
3689 }
3690 
3691 static int pfkey_recvmsg(struct socket *sock, struct msghdr *msg, size_t len,
3692 			 int flags)
3693 {
3694 	struct sock *sk = sock->sk;
3695 	struct pfkey_sock *pfk = pfkey_sk(sk);
3696 	struct sk_buff *skb;
3697 	int copied, err;
3698 
3699 	err = -EINVAL;
3700 	if (flags & ~(MSG_PEEK|MSG_DONTWAIT|MSG_TRUNC|MSG_CMSG_COMPAT))
3701 		goto out;
3702 
3703 	skb = skb_recv_datagram(sk, flags, flags & MSG_DONTWAIT, &err);
3704 	if (skb == NULL)
3705 		goto out;
3706 
3707 	copied = skb->len;
3708 	if (copied > len) {
3709 		msg->msg_flags |= MSG_TRUNC;
3710 		copied = len;
3711 	}
3712 
3713 	skb_reset_transport_header(skb);
3714 	err = skb_copy_datagram_msg(skb, 0, msg, copied);
3715 	if (err)
3716 		goto out_free;
3717 
3718 	sock_recv_ts_and_drops(msg, sk, skb);
3719 
3720 	err = (flags & MSG_TRUNC) ? skb->len : copied;
3721 
3722 	if (pfk->dump.dump != NULL &&
3723 	    3 * atomic_read(&sk->sk_rmem_alloc) <= sk->sk_rcvbuf)
3724 		pfkey_do_dump(pfk);
3725 
3726 out_free:
3727 	skb_free_datagram(sk, skb);
3728 out:
3729 	return err;
3730 }
3731 
3732 static const struct proto_ops pfkey_ops = {
3733 	.family		=	PF_KEY,
3734 	.owner		=	THIS_MODULE,
3735 	/* Operations that make no sense on pfkey sockets. */
3736 	.bind		=	sock_no_bind,
3737 	.connect	=	sock_no_connect,
3738 	.socketpair	=	sock_no_socketpair,
3739 	.accept		=	sock_no_accept,
3740 	.getname	=	sock_no_getname,
3741 	.ioctl		=	sock_no_ioctl,
3742 	.listen		=	sock_no_listen,
3743 	.shutdown	=	sock_no_shutdown,
3744 	.mmap		=	sock_no_mmap,
3745 	.sendpage	=	sock_no_sendpage,
3746 
3747 	/* Now the operations that really occur. */
3748 	.release	=	pfkey_release,
3749 	.poll		=	datagram_poll,
3750 	.sendmsg	=	pfkey_sendmsg,
3751 	.recvmsg	=	pfkey_recvmsg,
3752 };
3753 
3754 static const struct net_proto_family pfkey_family_ops = {
3755 	.family	=	PF_KEY,
3756 	.create	=	pfkey_create,
3757 	.owner	=	THIS_MODULE,
3758 };
3759 
3760 #ifdef CONFIG_PROC_FS
3761 static int pfkey_seq_show(struct seq_file *f, void *v)
3762 {
3763 	struct sock *s = sk_entry(v);
3764 
3765 	if (v == SEQ_START_TOKEN)
3766 		seq_printf(f ,"sk       RefCnt Rmem   Wmem   User   Inode\n");
3767 	else
3768 		seq_printf(f, "%pK %-6d %-6u %-6u %-6u %-6lu\n",
3769 			       s,
3770 			       refcount_read(&s->sk_refcnt),
3771 			       sk_rmem_alloc_get(s),
3772 			       sk_wmem_alloc_get(s),
3773 			       from_kuid_munged(seq_user_ns(f), sock_i_uid(s)),
3774 			       sock_i_ino(s)
3775 			       );
3776 	return 0;
3777 }
3778 
3779 static void *pfkey_seq_start(struct seq_file *f, loff_t *ppos)
3780 	__acquires(rcu)
3781 {
3782 	struct net *net = seq_file_net(f);
3783 	struct netns_pfkey *net_pfkey = net_generic(net, pfkey_net_id);
3784 
3785 	rcu_read_lock();
3786 	return seq_hlist_start_head_rcu(&net_pfkey->table, *ppos);
3787 }
3788 
3789 static void *pfkey_seq_next(struct seq_file *f, void *v, loff_t *ppos)
3790 {
3791 	struct net *net = seq_file_net(f);
3792 	struct netns_pfkey *net_pfkey = net_generic(net, pfkey_net_id);
3793 
3794 	return seq_hlist_next_rcu(v, &net_pfkey->table, ppos);
3795 }
3796 
3797 static void pfkey_seq_stop(struct seq_file *f, void *v)
3798 	__releases(rcu)
3799 {
3800 	rcu_read_unlock();
3801 }
3802 
3803 static const struct seq_operations pfkey_seq_ops = {
3804 	.start	= pfkey_seq_start,
3805 	.next	= pfkey_seq_next,
3806 	.stop	= pfkey_seq_stop,
3807 	.show	= pfkey_seq_show,
3808 };
3809 
3810 static int __net_init pfkey_init_proc(struct net *net)
3811 {
3812 	struct proc_dir_entry *e;
3813 
3814 	e = proc_create_net("pfkey", 0, net->proc_net, &pfkey_seq_ops,
3815 			sizeof(struct seq_net_private));
3816 	if (e == NULL)
3817 		return -ENOMEM;
3818 
3819 	return 0;
3820 }
3821 
3822 static void __net_exit pfkey_exit_proc(struct net *net)
3823 {
3824 	remove_proc_entry("pfkey", net->proc_net);
3825 }
3826 #else
3827 static inline int pfkey_init_proc(struct net *net)
3828 {
3829 	return 0;
3830 }
3831 
3832 static inline void pfkey_exit_proc(struct net *net)
3833 {
3834 }
3835 #endif
3836 
3837 static struct xfrm_mgr pfkeyv2_mgr =
3838 {
3839 	.notify		= pfkey_send_notify,
3840 	.acquire	= pfkey_send_acquire,
3841 	.compile_policy	= pfkey_compile_policy,
3842 	.new_mapping	= pfkey_send_new_mapping,
3843 	.notify_policy	= pfkey_send_policy_notify,
3844 	.migrate	= pfkey_send_migrate,
3845 	.is_alive	= pfkey_is_alive,
3846 };
3847 
3848 static int __net_init pfkey_net_init(struct net *net)
3849 {
3850 	struct netns_pfkey *net_pfkey = net_generic(net, pfkey_net_id);
3851 	int rv;
3852 
3853 	INIT_HLIST_HEAD(&net_pfkey->table);
3854 	atomic_set(&net_pfkey->socks_nr, 0);
3855 
3856 	rv = pfkey_init_proc(net);
3857 
3858 	return rv;
3859 }
3860 
3861 static void __net_exit pfkey_net_exit(struct net *net)
3862 {
3863 	struct netns_pfkey *net_pfkey = net_generic(net, pfkey_net_id);
3864 
3865 	pfkey_exit_proc(net);
3866 	WARN_ON(!hlist_empty(&net_pfkey->table));
3867 }
3868 
3869 static struct pernet_operations pfkey_net_ops = {
3870 	.init = pfkey_net_init,
3871 	.exit = pfkey_net_exit,
3872 	.id   = &pfkey_net_id,
3873 	.size = sizeof(struct netns_pfkey),
3874 };
3875 
3876 static void __exit ipsec_pfkey_exit(void)
3877 {
3878 	xfrm_unregister_km(&pfkeyv2_mgr);
3879 	sock_unregister(PF_KEY);
3880 	unregister_pernet_subsys(&pfkey_net_ops);
3881 	proto_unregister(&key_proto);
3882 }
3883 
3884 static int __init ipsec_pfkey_init(void)
3885 {
3886 	int err = proto_register(&key_proto, 0);
3887 
3888 	if (err != 0)
3889 		goto out;
3890 
3891 	err = register_pernet_subsys(&pfkey_net_ops);
3892 	if (err != 0)
3893 		goto out_unregister_key_proto;
3894 	err = sock_register(&pfkey_family_ops);
3895 	if (err != 0)
3896 		goto out_unregister_pernet;
3897 	err = xfrm_register_km(&pfkeyv2_mgr);
3898 	if (err != 0)
3899 		goto out_sock_unregister;
3900 out:
3901 	return err;
3902 
3903 out_sock_unregister:
3904 	sock_unregister(PF_KEY);
3905 out_unregister_pernet:
3906 	unregister_pernet_subsys(&pfkey_net_ops);
3907 out_unregister_key_proto:
3908 	proto_unregister(&key_proto);
3909 	goto out;
3910 }
3911 
3912 module_init(ipsec_pfkey_init);
3913 module_exit(ipsec_pfkey_exit);
3914 MODULE_LICENSE("GPL");
3915 MODULE_ALIAS_NETPROTO(PF_KEY);
3916