xref: /linux/net/key/af_key.c (revision e9deb406c10f5a73bcfd62f42ca1187b220bc188)
1 // SPDX-License-Identifier: GPL-2.0-or-later
2 /*
3  * net/key/af_key.c	An implementation of PF_KEYv2 sockets.
4  *
5  * Authors:	Maxim Giryaev	<gem@asplinux.ru>
6  *		David S. Miller	<davem@redhat.com>
7  *		Alexey Kuznetsov <kuznet@ms2.inr.ac.ru>
8  *		Kunihiro Ishiguro <kunihiro@ipinfusion.com>
9  *		Kazunori MIYAZAWA / USAGI Project <miyazawa@linux-ipv6.org>
10  *		Derek Atkins <derek@ihtfp.com>
11  */
12 
13 #include <linux/capability.h>
14 #include <linux/module.h>
15 #include <linux/kernel.h>
16 #include <linux/socket.h>
17 #include <linux/pfkeyv2.h>
18 #include <linux/ipsec.h>
19 #include <linux/skbuff.h>
20 #include <linux/rtnetlink.h>
21 #include <linux/in.h>
22 #include <linux/in6.h>
23 #include <linux/proc_fs.h>
24 #include <linux/init.h>
25 #include <linux/slab.h>
26 #include <net/net_namespace.h>
27 #include <net/netns/generic.h>
28 #include <net/xfrm.h>
29 
30 #include <net/sock.h>
31 
32 #define _X2KEY(x) ((x) == XFRM_INF ? 0 : (x))
33 #define _KEY2X(x) ((x) == 0 ? XFRM_INF : (x))
34 
35 static unsigned int pfkey_net_id __read_mostly;
36 struct netns_pfkey {
37 	/* List of all pfkey sockets. */
38 	struct hlist_head table;
39 	atomic_t socks_nr;
40 };
41 static DEFINE_MUTEX(pfkey_mutex);
42 
43 #define DUMMY_MARK 0
44 static const struct xfrm_mark dummy_mark = {0, 0};
45 struct pfkey_sock {
46 	/* struct sock must be the first member of struct pfkey_sock */
47 	struct sock	sk;
48 	int		registered;
49 	int		promisc;
50 
51 	struct {
52 		uint8_t		msg_version;
53 		uint32_t	msg_portid;
54 		int		(*dump)(struct pfkey_sock *sk);
55 		void		(*done)(struct pfkey_sock *sk);
56 		union {
57 			struct xfrm_policy_walk	policy;
58 			struct xfrm_state_walk	state;
59 		} u;
60 		struct sk_buff	*skb;
61 	} dump;
62 	struct mutex dump_lock;
63 };
64 
65 static int parse_sockaddr_pair(struct sockaddr *sa, int ext_len,
66 			       xfrm_address_t *saddr, xfrm_address_t *daddr,
67 			       u16 *family);
68 
69 static inline struct pfkey_sock *pfkey_sk(struct sock *sk)
70 {
71 	return (struct pfkey_sock *)sk;
72 }
73 
74 static int pfkey_can_dump(const struct sock *sk)
75 {
76 	if (3 * atomic_read(&sk->sk_rmem_alloc) <= 2 * sk->sk_rcvbuf)
77 		return 1;
78 	return 0;
79 }
80 
81 static void pfkey_terminate_dump(struct pfkey_sock *pfk)
82 {
83 	if (pfk->dump.dump) {
84 		if (pfk->dump.skb) {
85 			kfree_skb(pfk->dump.skb);
86 			pfk->dump.skb = NULL;
87 		}
88 		pfk->dump.done(pfk);
89 		pfk->dump.dump = NULL;
90 		pfk->dump.done = NULL;
91 	}
92 }
93 
94 static void pfkey_sock_destruct(struct sock *sk)
95 {
96 	struct net *net = sock_net(sk);
97 	struct netns_pfkey *net_pfkey = net_generic(net, pfkey_net_id);
98 
99 	pfkey_terminate_dump(pfkey_sk(sk));
100 	skb_queue_purge(&sk->sk_receive_queue);
101 
102 	if (!sock_flag(sk, SOCK_DEAD)) {
103 		pr_err("Attempt to release alive pfkey socket: %p\n", sk);
104 		return;
105 	}
106 
107 	WARN_ON(atomic_read(&sk->sk_rmem_alloc));
108 	WARN_ON(refcount_read(&sk->sk_wmem_alloc));
109 
110 	atomic_dec(&net_pfkey->socks_nr);
111 }
112 
113 static const struct proto_ops pfkey_ops;
114 
115 static void pfkey_insert(struct sock *sk)
116 {
117 	struct net *net = sock_net(sk);
118 	struct netns_pfkey *net_pfkey = net_generic(net, pfkey_net_id);
119 
120 	mutex_lock(&pfkey_mutex);
121 	sk_add_node_rcu(sk, &net_pfkey->table);
122 	mutex_unlock(&pfkey_mutex);
123 }
124 
125 static void pfkey_remove(struct sock *sk)
126 {
127 	mutex_lock(&pfkey_mutex);
128 	sk_del_node_init_rcu(sk);
129 	mutex_unlock(&pfkey_mutex);
130 }
131 
132 static struct proto key_proto = {
133 	.name	  = "KEY",
134 	.owner	  = THIS_MODULE,
135 	.obj_size = sizeof(struct pfkey_sock),
136 };
137 
138 static int pfkey_create(struct net *net, struct socket *sock, int protocol,
139 			int kern)
140 {
141 	struct netns_pfkey *net_pfkey = net_generic(net, pfkey_net_id);
142 	struct sock *sk;
143 	struct pfkey_sock *pfk;
144 
145 	if (!ns_capable(net->user_ns, CAP_NET_ADMIN))
146 		return -EPERM;
147 	if (sock->type != SOCK_RAW)
148 		return -ESOCKTNOSUPPORT;
149 	if (protocol != PF_KEY_V2)
150 		return -EPROTONOSUPPORT;
151 
152 	sk = sk_alloc(net, PF_KEY, GFP_KERNEL, &key_proto, kern);
153 	if (sk == NULL)
154 		return -ENOMEM;
155 
156 	pfk = pfkey_sk(sk);
157 	mutex_init(&pfk->dump_lock);
158 
159 	sock->ops = &pfkey_ops;
160 	sock_init_data(sock, sk);
161 
162 	sk->sk_family = PF_KEY;
163 	sk->sk_destruct = pfkey_sock_destruct;
164 
165 	atomic_inc(&net_pfkey->socks_nr);
166 
167 	pfkey_insert(sk);
168 
169 	return 0;
170 }
171 
172 static int pfkey_release(struct socket *sock)
173 {
174 	struct sock *sk = sock->sk;
175 
176 	if (!sk)
177 		return 0;
178 
179 	pfkey_remove(sk);
180 
181 	sock_orphan(sk);
182 	sock->sk = NULL;
183 	skb_queue_purge(&sk->sk_write_queue);
184 
185 	synchronize_rcu();
186 	sock_put(sk);
187 
188 	return 0;
189 }
190 
191 static int pfkey_broadcast_one(struct sk_buff *skb, gfp_t allocation,
192 			       struct sock *sk)
193 {
194 	int err = -ENOBUFS;
195 
196 	if (atomic_read(&sk->sk_rmem_alloc) > sk->sk_rcvbuf)
197 		return err;
198 
199 	skb = skb_clone(skb, allocation);
200 
201 	if (skb) {
202 		skb_set_owner_r(skb, sk);
203 		skb_queue_tail(&sk->sk_receive_queue, skb);
204 		sk->sk_data_ready(sk);
205 		err = 0;
206 	}
207 	return err;
208 }
209 
210 /* Send SKB to all pfkey sockets matching selected criteria.  */
211 #define BROADCAST_ALL		0
212 #define BROADCAST_ONE		1
213 #define BROADCAST_REGISTERED	2
214 #define BROADCAST_PROMISC_ONLY	4
215 static int pfkey_broadcast(struct sk_buff *skb, gfp_t allocation,
216 			   int broadcast_flags, struct sock *one_sk,
217 			   struct net *net)
218 {
219 	struct netns_pfkey *net_pfkey = net_generic(net, pfkey_net_id);
220 	struct sock *sk;
221 	int err = -ESRCH;
222 
223 	/* XXX Do we need something like netlink_overrun?  I think
224 	 * XXX PF_KEY socket apps will not mind current behavior.
225 	 */
226 	if (!skb)
227 		return -ENOMEM;
228 
229 	rcu_read_lock();
230 	sk_for_each_rcu(sk, &net_pfkey->table) {
231 		struct pfkey_sock *pfk = pfkey_sk(sk);
232 		int err2;
233 
234 		/* Yes, it means that if you are meant to receive this
235 		 * pfkey message you receive it twice as promiscuous
236 		 * socket.
237 		 */
238 		if (pfk->promisc)
239 			pfkey_broadcast_one(skb, GFP_ATOMIC, sk);
240 
241 		/* the exact target will be processed later */
242 		if (sk == one_sk)
243 			continue;
244 		if (broadcast_flags != BROADCAST_ALL) {
245 			if (broadcast_flags & BROADCAST_PROMISC_ONLY)
246 				continue;
247 			if ((broadcast_flags & BROADCAST_REGISTERED) &&
248 			    !pfk->registered)
249 				continue;
250 			if (broadcast_flags & BROADCAST_ONE)
251 				continue;
252 		}
253 
254 		err2 = pfkey_broadcast_one(skb, GFP_ATOMIC, sk);
255 
256 		/* Error is cleared after successful sending to at least one
257 		 * registered KM */
258 		if ((broadcast_flags & BROADCAST_REGISTERED) && err)
259 			err = err2;
260 	}
261 	rcu_read_unlock();
262 
263 	if (one_sk != NULL)
264 		err = pfkey_broadcast_one(skb, allocation, one_sk);
265 
266 	kfree_skb(skb);
267 	return err;
268 }
269 
270 static int pfkey_do_dump(struct pfkey_sock *pfk)
271 {
272 	struct sadb_msg *hdr;
273 	int rc;
274 
275 	mutex_lock(&pfk->dump_lock);
276 	if (!pfk->dump.dump) {
277 		rc = 0;
278 		goto out;
279 	}
280 
281 	rc = pfk->dump.dump(pfk);
282 	if (rc == -ENOBUFS) {
283 		rc = 0;
284 		goto out;
285 	}
286 
287 	if (pfk->dump.skb) {
288 		if (!pfkey_can_dump(&pfk->sk)) {
289 			rc = 0;
290 			goto out;
291 		}
292 
293 		hdr = (struct sadb_msg *) pfk->dump.skb->data;
294 		hdr->sadb_msg_seq = 0;
295 		hdr->sadb_msg_errno = rc;
296 		pfkey_broadcast(pfk->dump.skb, GFP_ATOMIC, BROADCAST_ONE,
297 				&pfk->sk, sock_net(&pfk->sk));
298 		pfk->dump.skb = NULL;
299 	}
300 
301 	pfkey_terminate_dump(pfk);
302 
303 out:
304 	mutex_unlock(&pfk->dump_lock);
305 	return rc;
306 }
307 
308 static inline void pfkey_hdr_dup(struct sadb_msg *new,
309 				 const struct sadb_msg *orig)
310 {
311 	*new = *orig;
312 }
313 
314 static int pfkey_error(const struct sadb_msg *orig, int err, struct sock *sk)
315 {
316 	struct sk_buff *skb = alloc_skb(sizeof(struct sadb_msg) + 16, GFP_KERNEL);
317 	struct sadb_msg *hdr;
318 
319 	if (!skb)
320 		return -ENOBUFS;
321 
322 	/* Woe be to the platform trying to support PFKEY yet
323 	 * having normal errnos outside the 1-255 range, inclusive.
324 	 */
325 	err = -err;
326 	if (err == ERESTARTSYS ||
327 	    err == ERESTARTNOHAND ||
328 	    err == ERESTARTNOINTR)
329 		err = EINTR;
330 	if (err >= 512)
331 		err = EINVAL;
332 	BUG_ON(err <= 0 || err >= 256);
333 
334 	hdr = skb_put(skb, sizeof(struct sadb_msg));
335 	pfkey_hdr_dup(hdr, orig);
336 	hdr->sadb_msg_errno = (uint8_t) err;
337 	hdr->sadb_msg_len = (sizeof(struct sadb_msg) /
338 			     sizeof(uint64_t));
339 
340 	pfkey_broadcast(skb, GFP_KERNEL, BROADCAST_ONE, sk, sock_net(sk));
341 
342 	return 0;
343 }
344 
345 static const u8 sadb_ext_min_len[] = {
346 	[SADB_EXT_RESERVED]		= (u8) 0,
347 	[SADB_EXT_SA]			= (u8) sizeof(struct sadb_sa),
348 	[SADB_EXT_LIFETIME_CURRENT]	= (u8) sizeof(struct sadb_lifetime),
349 	[SADB_EXT_LIFETIME_HARD]	= (u8) sizeof(struct sadb_lifetime),
350 	[SADB_EXT_LIFETIME_SOFT]	= (u8) sizeof(struct sadb_lifetime),
351 	[SADB_EXT_ADDRESS_SRC]		= (u8) sizeof(struct sadb_address),
352 	[SADB_EXT_ADDRESS_DST]		= (u8) sizeof(struct sadb_address),
353 	[SADB_EXT_ADDRESS_PROXY]	= (u8) sizeof(struct sadb_address),
354 	[SADB_EXT_KEY_AUTH]		= (u8) sizeof(struct sadb_key),
355 	[SADB_EXT_KEY_ENCRYPT]		= (u8) sizeof(struct sadb_key),
356 	[SADB_EXT_IDENTITY_SRC]		= (u8) sizeof(struct sadb_ident),
357 	[SADB_EXT_IDENTITY_DST]		= (u8) sizeof(struct sadb_ident),
358 	[SADB_EXT_SENSITIVITY]		= (u8) sizeof(struct sadb_sens),
359 	[SADB_EXT_PROPOSAL]		= (u8) sizeof(struct sadb_prop),
360 	[SADB_EXT_SUPPORTED_AUTH]	= (u8) sizeof(struct sadb_supported),
361 	[SADB_EXT_SUPPORTED_ENCRYPT]	= (u8) sizeof(struct sadb_supported),
362 	[SADB_EXT_SPIRANGE]		= (u8) sizeof(struct sadb_spirange),
363 	[SADB_X_EXT_KMPRIVATE]		= (u8) sizeof(struct sadb_x_kmprivate),
364 	[SADB_X_EXT_POLICY]		= (u8) sizeof(struct sadb_x_policy),
365 	[SADB_X_EXT_SA2]		= (u8) sizeof(struct sadb_x_sa2),
366 	[SADB_X_EXT_NAT_T_TYPE]		= (u8) sizeof(struct sadb_x_nat_t_type),
367 	[SADB_X_EXT_NAT_T_SPORT]	= (u8) sizeof(struct sadb_x_nat_t_port),
368 	[SADB_X_EXT_NAT_T_DPORT]	= (u8) sizeof(struct sadb_x_nat_t_port),
369 	[SADB_X_EXT_NAT_T_OA]		= (u8) sizeof(struct sadb_address),
370 	[SADB_X_EXT_SEC_CTX]		= (u8) sizeof(struct sadb_x_sec_ctx),
371 	[SADB_X_EXT_KMADDRESS]		= (u8) sizeof(struct sadb_x_kmaddress),
372 	[SADB_X_EXT_FILTER]		= (u8) sizeof(struct sadb_x_filter),
373 };
374 
375 /* Verify sadb_address_{len,prefixlen} against sa_family.  */
376 static int verify_address_len(const void *p)
377 {
378 	const struct sadb_address *sp = p;
379 	const struct sockaddr *addr = (const struct sockaddr *)(sp + 1);
380 	const struct sockaddr_in *sin;
381 #if IS_ENABLED(CONFIG_IPV6)
382 	const struct sockaddr_in6 *sin6;
383 #endif
384 	int len;
385 
386 	if (sp->sadb_address_len <
387 	    DIV_ROUND_UP(sizeof(*sp) + offsetofend(typeof(*addr), sa_family),
388 			 sizeof(uint64_t)))
389 		return -EINVAL;
390 
391 	switch (addr->sa_family) {
392 	case AF_INET:
393 		len = DIV_ROUND_UP(sizeof(*sp) + sizeof(*sin), sizeof(uint64_t));
394 		if (sp->sadb_address_len != len ||
395 		    sp->sadb_address_prefixlen > 32)
396 			return -EINVAL;
397 		break;
398 #if IS_ENABLED(CONFIG_IPV6)
399 	case AF_INET6:
400 		len = DIV_ROUND_UP(sizeof(*sp) + sizeof(*sin6), sizeof(uint64_t));
401 		if (sp->sadb_address_len != len ||
402 		    sp->sadb_address_prefixlen > 128)
403 			return -EINVAL;
404 		break;
405 #endif
406 	default:
407 		/* It is user using kernel to keep track of security
408 		 * associations for another protocol, such as
409 		 * OSPF/RSVP/RIPV2/MIP.  It is user's job to verify
410 		 * lengths.
411 		 *
412 		 * XXX Actually, association/policy database is not yet
413 		 * XXX able to cope with arbitrary sockaddr families.
414 		 * XXX When it can, remove this -EINVAL.  -DaveM
415 		 */
416 		return -EINVAL;
417 	}
418 
419 	return 0;
420 }
421 
422 static inline int sadb_key_len(const struct sadb_key *key)
423 {
424 	int key_bytes = DIV_ROUND_UP(key->sadb_key_bits, 8);
425 
426 	return DIV_ROUND_UP(sizeof(struct sadb_key) + key_bytes,
427 			    sizeof(uint64_t));
428 }
429 
430 static int verify_key_len(const void *p)
431 {
432 	const struct sadb_key *key = p;
433 
434 	if (sadb_key_len(key) > key->sadb_key_len)
435 		return -EINVAL;
436 
437 	return 0;
438 }
439 
440 static inline int pfkey_sec_ctx_len(const struct sadb_x_sec_ctx *sec_ctx)
441 {
442 	return DIV_ROUND_UP(sizeof(struct sadb_x_sec_ctx) +
443 			    sec_ctx->sadb_x_ctx_len,
444 			    sizeof(uint64_t));
445 }
446 
447 static inline int verify_sec_ctx_len(const void *p)
448 {
449 	const struct sadb_x_sec_ctx *sec_ctx = p;
450 	int len = sec_ctx->sadb_x_ctx_len;
451 
452 	if (len > PAGE_SIZE)
453 		return -EINVAL;
454 
455 	len = pfkey_sec_ctx_len(sec_ctx);
456 
457 	if (sec_ctx->sadb_x_sec_len != len)
458 		return -EINVAL;
459 
460 	return 0;
461 }
462 
463 static inline struct xfrm_user_sec_ctx *pfkey_sadb2xfrm_user_sec_ctx(const struct sadb_x_sec_ctx *sec_ctx,
464 								     gfp_t gfp)
465 {
466 	struct xfrm_user_sec_ctx *uctx = NULL;
467 	int ctx_size = sec_ctx->sadb_x_ctx_len;
468 
469 	uctx = kmalloc((sizeof(*uctx)+ctx_size), gfp);
470 
471 	if (!uctx)
472 		return NULL;
473 
474 	uctx->len = pfkey_sec_ctx_len(sec_ctx);
475 	uctx->exttype = sec_ctx->sadb_x_sec_exttype;
476 	uctx->ctx_doi = sec_ctx->sadb_x_ctx_doi;
477 	uctx->ctx_alg = sec_ctx->sadb_x_ctx_alg;
478 	uctx->ctx_len = sec_ctx->sadb_x_ctx_len;
479 	memcpy(uctx + 1, sec_ctx + 1,
480 	       uctx->ctx_len);
481 
482 	return uctx;
483 }
484 
485 static int present_and_same_family(const struct sadb_address *src,
486 				   const struct sadb_address *dst)
487 {
488 	const struct sockaddr *s_addr, *d_addr;
489 
490 	if (!src || !dst)
491 		return 0;
492 
493 	s_addr = (const struct sockaddr *)(src + 1);
494 	d_addr = (const struct sockaddr *)(dst + 1);
495 	if (s_addr->sa_family != d_addr->sa_family)
496 		return 0;
497 	if (s_addr->sa_family != AF_INET
498 #if IS_ENABLED(CONFIG_IPV6)
499 	    && s_addr->sa_family != AF_INET6
500 #endif
501 		)
502 		return 0;
503 
504 	return 1;
505 }
506 
507 static int parse_exthdrs(struct sk_buff *skb, const struct sadb_msg *hdr, void **ext_hdrs)
508 {
509 	const char *p = (char *) hdr;
510 	int len = skb->len;
511 
512 	len -= sizeof(*hdr);
513 	p += sizeof(*hdr);
514 	while (len > 0) {
515 		const struct sadb_ext *ehdr = (const struct sadb_ext *) p;
516 		uint16_t ext_type;
517 		int ext_len;
518 
519 		if (len < sizeof(*ehdr))
520 			return -EINVAL;
521 
522 		ext_len  = ehdr->sadb_ext_len;
523 		ext_len *= sizeof(uint64_t);
524 		ext_type = ehdr->sadb_ext_type;
525 		if (ext_len < sizeof(uint64_t) ||
526 		    ext_len > len ||
527 		    ext_type == SADB_EXT_RESERVED)
528 			return -EINVAL;
529 
530 		if (ext_type <= SADB_EXT_MAX) {
531 			int min = (int) sadb_ext_min_len[ext_type];
532 			if (ext_len < min)
533 				return -EINVAL;
534 			if (ext_hdrs[ext_type-1] != NULL)
535 				return -EINVAL;
536 			switch (ext_type) {
537 			case SADB_EXT_ADDRESS_SRC:
538 			case SADB_EXT_ADDRESS_DST:
539 			case SADB_EXT_ADDRESS_PROXY:
540 			case SADB_X_EXT_NAT_T_OA:
541 				if (verify_address_len(p))
542 					return -EINVAL;
543 				break;
544 			case SADB_X_EXT_SEC_CTX:
545 				if (verify_sec_ctx_len(p))
546 					return -EINVAL;
547 				break;
548 			case SADB_EXT_KEY_AUTH:
549 			case SADB_EXT_KEY_ENCRYPT:
550 				if (verify_key_len(p))
551 					return -EINVAL;
552 				break;
553 			default:
554 				break;
555 			}
556 			ext_hdrs[ext_type-1] = (void *) p;
557 		}
558 		p   += ext_len;
559 		len -= ext_len;
560 	}
561 
562 	return 0;
563 }
564 
565 static uint16_t
566 pfkey_satype2proto(uint8_t satype)
567 {
568 	switch (satype) {
569 	case SADB_SATYPE_UNSPEC:
570 		return IPSEC_PROTO_ANY;
571 	case SADB_SATYPE_AH:
572 		return IPPROTO_AH;
573 	case SADB_SATYPE_ESP:
574 		return IPPROTO_ESP;
575 	case SADB_X_SATYPE_IPCOMP:
576 		return IPPROTO_COMP;
577 	default:
578 		return 0;
579 	}
580 	/* NOTREACHED */
581 }
582 
583 static uint8_t
584 pfkey_proto2satype(uint16_t proto)
585 {
586 	switch (proto) {
587 	case IPPROTO_AH:
588 		return SADB_SATYPE_AH;
589 	case IPPROTO_ESP:
590 		return SADB_SATYPE_ESP;
591 	case IPPROTO_COMP:
592 		return SADB_X_SATYPE_IPCOMP;
593 	default:
594 		return 0;
595 	}
596 	/* NOTREACHED */
597 }
598 
599 /* BTW, this scheme means that there is no way with PFKEY2 sockets to
600  * say specifically 'just raw sockets' as we encode them as 255.
601  */
602 
603 static uint8_t pfkey_proto_to_xfrm(uint8_t proto)
604 {
605 	return proto == IPSEC_PROTO_ANY ? 0 : proto;
606 }
607 
608 static uint8_t pfkey_proto_from_xfrm(uint8_t proto)
609 {
610 	return proto ? proto : IPSEC_PROTO_ANY;
611 }
612 
613 static inline int pfkey_sockaddr_len(sa_family_t family)
614 {
615 	switch (family) {
616 	case AF_INET:
617 		return sizeof(struct sockaddr_in);
618 #if IS_ENABLED(CONFIG_IPV6)
619 	case AF_INET6:
620 		return sizeof(struct sockaddr_in6);
621 #endif
622 	}
623 	return 0;
624 }
625 
626 static
627 int pfkey_sockaddr_extract(const struct sockaddr *sa, xfrm_address_t *xaddr)
628 {
629 	switch (sa->sa_family) {
630 	case AF_INET:
631 		xaddr->a4 =
632 			((struct sockaddr_in *)sa)->sin_addr.s_addr;
633 		return AF_INET;
634 #if IS_ENABLED(CONFIG_IPV6)
635 	case AF_INET6:
636 		memcpy(xaddr->a6,
637 		       &((struct sockaddr_in6 *)sa)->sin6_addr,
638 		       sizeof(struct in6_addr));
639 		return AF_INET6;
640 #endif
641 	}
642 	return 0;
643 }
644 
645 static
646 int pfkey_sadb_addr2xfrm_addr(const struct sadb_address *addr, xfrm_address_t *xaddr)
647 {
648 	return pfkey_sockaddr_extract((struct sockaddr *)(addr + 1),
649 				      xaddr);
650 }
651 
652 static struct  xfrm_state *pfkey_xfrm_state_lookup(struct net *net, const struct sadb_msg *hdr, void * const *ext_hdrs)
653 {
654 	const struct sadb_sa *sa;
655 	const struct sadb_address *addr;
656 	uint16_t proto;
657 	unsigned short family;
658 	xfrm_address_t *xaddr;
659 
660 	sa = ext_hdrs[SADB_EXT_SA - 1];
661 	if (sa == NULL)
662 		return NULL;
663 
664 	proto = pfkey_satype2proto(hdr->sadb_msg_satype);
665 	if (proto == 0)
666 		return NULL;
667 
668 	/* sadb_address_len should be checked by caller */
669 	addr = ext_hdrs[SADB_EXT_ADDRESS_DST - 1];
670 	if (addr == NULL)
671 		return NULL;
672 
673 	family = ((const struct sockaddr *)(addr + 1))->sa_family;
674 	switch (family) {
675 	case AF_INET:
676 		xaddr = (xfrm_address_t *)&((const struct sockaddr_in *)(addr + 1))->sin_addr;
677 		break;
678 #if IS_ENABLED(CONFIG_IPV6)
679 	case AF_INET6:
680 		xaddr = (xfrm_address_t *)&((const struct sockaddr_in6 *)(addr + 1))->sin6_addr;
681 		break;
682 #endif
683 	default:
684 		xaddr = NULL;
685 	}
686 
687 	if (!xaddr)
688 		return NULL;
689 
690 	return xfrm_state_lookup(net, DUMMY_MARK, xaddr, sa->sadb_sa_spi, proto, family);
691 }
692 
693 #define PFKEY_ALIGN8(a) (1 + (((a) - 1) | (8 - 1)))
694 
695 static int
696 pfkey_sockaddr_size(sa_family_t family)
697 {
698 	return PFKEY_ALIGN8(pfkey_sockaddr_len(family));
699 }
700 
701 static inline int pfkey_mode_from_xfrm(int mode)
702 {
703 	switch(mode) {
704 	case XFRM_MODE_TRANSPORT:
705 		return IPSEC_MODE_TRANSPORT;
706 	case XFRM_MODE_TUNNEL:
707 		return IPSEC_MODE_TUNNEL;
708 	case XFRM_MODE_BEET:
709 		return IPSEC_MODE_BEET;
710 	default:
711 		return -1;
712 	}
713 }
714 
715 static inline int pfkey_mode_to_xfrm(int mode)
716 {
717 	switch(mode) {
718 	case IPSEC_MODE_ANY:	/*XXX*/
719 	case IPSEC_MODE_TRANSPORT:
720 		return XFRM_MODE_TRANSPORT;
721 	case IPSEC_MODE_TUNNEL:
722 		return XFRM_MODE_TUNNEL;
723 	case IPSEC_MODE_BEET:
724 		return XFRM_MODE_BEET;
725 	default:
726 		return -1;
727 	}
728 }
729 
730 static unsigned int pfkey_sockaddr_fill(const xfrm_address_t *xaddr, __be16 port,
731 					struct sockaddr *sa,
732 					unsigned short family)
733 {
734 	switch (family) {
735 	case AF_INET:
736 	    {
737 		struct sockaddr_in *sin = (struct sockaddr_in *)sa;
738 		sin->sin_family = AF_INET;
739 		sin->sin_port = port;
740 		sin->sin_addr.s_addr = xaddr->a4;
741 		memset(sin->sin_zero, 0, sizeof(sin->sin_zero));
742 		return 32;
743 	    }
744 #if IS_ENABLED(CONFIG_IPV6)
745 	case AF_INET6:
746 	    {
747 		struct sockaddr_in6 *sin6 = (struct sockaddr_in6 *)sa;
748 		sin6->sin6_family = AF_INET6;
749 		sin6->sin6_port = port;
750 		sin6->sin6_flowinfo = 0;
751 		sin6->sin6_addr = xaddr->in6;
752 		sin6->sin6_scope_id = 0;
753 		return 128;
754 	    }
755 #endif
756 	}
757 	return 0;
758 }
759 
760 static unsigned int pfkey_sockaddr_fill_zero_tail(const xfrm_address_t *xaddr,
761 						  __be16 port,
762 						  struct sockaddr *sa,
763 						  unsigned short family)
764 {
765 	unsigned int prefixlen;
766 	int sockaddr_len = pfkey_sockaddr_len(family);
767 	int sockaddr_size = pfkey_sockaddr_size(family);
768 
769 	prefixlen = pfkey_sockaddr_fill(xaddr, port, sa, family);
770 	if (sockaddr_size > sockaddr_len)
771 		memset((u8 *)sa + sockaddr_len, 0, sockaddr_size - sockaddr_len);
772 
773 	return prefixlen;
774 }
775 
776 static struct sk_buff *__pfkey_xfrm_state2msg(const struct xfrm_state *x,
777 					      int add_keys, int hsc)
778 {
779 	struct sk_buff *skb;
780 	struct sadb_msg *hdr;
781 	struct sadb_sa *sa;
782 	struct sadb_lifetime *lifetime;
783 	struct sadb_address *addr;
784 	struct sadb_key *key;
785 	struct sadb_x_sa2 *sa2;
786 	struct sadb_x_sec_ctx *sec_ctx;
787 	struct xfrm_sec_ctx *xfrm_ctx;
788 	int ctx_size = 0;
789 	int size;
790 	int auth_key_size = 0;
791 	int encrypt_key_size = 0;
792 	int sockaddr_size;
793 	struct xfrm_encap_tmpl *natt = NULL;
794 	int mode;
795 
796 	/* address family check */
797 	sockaddr_size = pfkey_sockaddr_size(x->props.family);
798 	if (!sockaddr_size)
799 		return ERR_PTR(-EINVAL);
800 
801 	/* base, SA, (lifetime (HSC),) address(SD), (address(P),)
802 	   key(AE), (identity(SD),) (sensitivity)> */
803 	size = sizeof(struct sadb_msg) +sizeof(struct sadb_sa) +
804 		sizeof(struct sadb_lifetime) +
805 		((hsc & 1) ? sizeof(struct sadb_lifetime) : 0) +
806 		((hsc & 2) ? sizeof(struct sadb_lifetime) : 0) +
807 			sizeof(struct sadb_address)*2 +
808 				sockaddr_size*2 +
809 					sizeof(struct sadb_x_sa2);
810 
811 	if ((xfrm_ctx = x->security)) {
812 		ctx_size = PFKEY_ALIGN8(xfrm_ctx->ctx_len);
813 		size += sizeof(struct sadb_x_sec_ctx) + ctx_size;
814 	}
815 
816 	/* identity & sensitivity */
817 	if (!xfrm_addr_equal(&x->sel.saddr, &x->props.saddr, x->props.family))
818 		size += sizeof(struct sadb_address) + sockaddr_size;
819 
820 	if (add_keys) {
821 		if (x->aalg && x->aalg->alg_key_len) {
822 			auth_key_size =
823 				PFKEY_ALIGN8((x->aalg->alg_key_len + 7) / 8);
824 			size += sizeof(struct sadb_key) + auth_key_size;
825 		}
826 		if (x->ealg && x->ealg->alg_key_len) {
827 			encrypt_key_size =
828 				PFKEY_ALIGN8((x->ealg->alg_key_len+7) / 8);
829 			size += sizeof(struct sadb_key) + encrypt_key_size;
830 		}
831 	}
832 	if (x->encap)
833 		natt = x->encap;
834 
835 	if (natt && natt->encap_type) {
836 		size += sizeof(struct sadb_x_nat_t_type);
837 		size += sizeof(struct sadb_x_nat_t_port);
838 		size += sizeof(struct sadb_x_nat_t_port);
839 	}
840 
841 	skb =  alloc_skb(size + 16, GFP_ATOMIC);
842 	if (skb == NULL)
843 		return ERR_PTR(-ENOBUFS);
844 
845 	/* call should fill header later */
846 	hdr = skb_put(skb, sizeof(struct sadb_msg));
847 	memset(hdr, 0, size);	/* XXX do we need this ? */
848 	hdr->sadb_msg_len = size / sizeof(uint64_t);
849 
850 	/* sa */
851 	sa = skb_put(skb, sizeof(struct sadb_sa));
852 	sa->sadb_sa_len = sizeof(struct sadb_sa)/sizeof(uint64_t);
853 	sa->sadb_sa_exttype = SADB_EXT_SA;
854 	sa->sadb_sa_spi = x->id.spi;
855 	sa->sadb_sa_replay = x->props.replay_window;
856 	switch (x->km.state) {
857 	case XFRM_STATE_VALID:
858 		sa->sadb_sa_state = x->km.dying ?
859 			SADB_SASTATE_DYING : SADB_SASTATE_MATURE;
860 		break;
861 	case XFRM_STATE_ACQ:
862 		sa->sadb_sa_state = SADB_SASTATE_LARVAL;
863 		break;
864 	default:
865 		sa->sadb_sa_state = SADB_SASTATE_DEAD;
866 		break;
867 	}
868 	sa->sadb_sa_auth = 0;
869 	if (x->aalg) {
870 		struct xfrm_algo_desc *a = xfrm_aalg_get_byname(x->aalg->alg_name, 0);
871 		sa->sadb_sa_auth = (a && a->pfkey_supported) ?
872 					a->desc.sadb_alg_id : 0;
873 	}
874 	sa->sadb_sa_encrypt = 0;
875 	BUG_ON(x->ealg && x->calg);
876 	if (x->ealg) {
877 		struct xfrm_algo_desc *a = xfrm_ealg_get_byname(x->ealg->alg_name, 0);
878 		sa->sadb_sa_encrypt = (a && a->pfkey_supported) ?
879 					a->desc.sadb_alg_id : 0;
880 	}
881 	/* KAME compatible: sadb_sa_encrypt is overloaded with calg id */
882 	if (x->calg) {
883 		struct xfrm_algo_desc *a = xfrm_calg_get_byname(x->calg->alg_name, 0);
884 		sa->sadb_sa_encrypt = (a && a->pfkey_supported) ?
885 					a->desc.sadb_alg_id : 0;
886 	}
887 
888 	sa->sadb_sa_flags = 0;
889 	if (x->props.flags & XFRM_STATE_NOECN)
890 		sa->sadb_sa_flags |= SADB_SAFLAGS_NOECN;
891 	if (x->props.flags & XFRM_STATE_DECAP_DSCP)
892 		sa->sadb_sa_flags |= SADB_SAFLAGS_DECAP_DSCP;
893 	if (x->props.flags & XFRM_STATE_NOPMTUDISC)
894 		sa->sadb_sa_flags |= SADB_SAFLAGS_NOPMTUDISC;
895 
896 	/* hard time */
897 	if (hsc & 2) {
898 		lifetime = skb_put(skb, sizeof(struct sadb_lifetime));
899 		lifetime->sadb_lifetime_len =
900 			sizeof(struct sadb_lifetime)/sizeof(uint64_t);
901 		lifetime->sadb_lifetime_exttype = SADB_EXT_LIFETIME_HARD;
902 		lifetime->sadb_lifetime_allocations =  _X2KEY(x->lft.hard_packet_limit);
903 		lifetime->sadb_lifetime_bytes = _X2KEY(x->lft.hard_byte_limit);
904 		lifetime->sadb_lifetime_addtime = x->lft.hard_add_expires_seconds;
905 		lifetime->sadb_lifetime_usetime = x->lft.hard_use_expires_seconds;
906 	}
907 	/* soft time */
908 	if (hsc & 1) {
909 		lifetime = skb_put(skb, sizeof(struct sadb_lifetime));
910 		lifetime->sadb_lifetime_len =
911 			sizeof(struct sadb_lifetime)/sizeof(uint64_t);
912 		lifetime->sadb_lifetime_exttype = SADB_EXT_LIFETIME_SOFT;
913 		lifetime->sadb_lifetime_allocations =  _X2KEY(x->lft.soft_packet_limit);
914 		lifetime->sadb_lifetime_bytes = _X2KEY(x->lft.soft_byte_limit);
915 		lifetime->sadb_lifetime_addtime = x->lft.soft_add_expires_seconds;
916 		lifetime->sadb_lifetime_usetime = x->lft.soft_use_expires_seconds;
917 	}
918 	/* current time */
919 	lifetime = skb_put(skb, sizeof(struct sadb_lifetime));
920 	lifetime->sadb_lifetime_len =
921 		sizeof(struct sadb_lifetime)/sizeof(uint64_t);
922 	lifetime->sadb_lifetime_exttype = SADB_EXT_LIFETIME_CURRENT;
923 	lifetime->sadb_lifetime_allocations = x->curlft.packets;
924 	lifetime->sadb_lifetime_bytes = x->curlft.bytes;
925 	lifetime->sadb_lifetime_addtime = x->curlft.add_time;
926 	lifetime->sadb_lifetime_usetime = x->curlft.use_time;
927 	/* src address */
928 	addr = skb_put(skb, sizeof(struct sadb_address) + sockaddr_size);
929 	addr->sadb_address_len =
930 		(sizeof(struct sadb_address)+sockaddr_size)/
931 			sizeof(uint64_t);
932 	addr->sadb_address_exttype = SADB_EXT_ADDRESS_SRC;
933 	/* "if the ports are non-zero, then the sadb_address_proto field,
934 	   normally zero, MUST be filled in with the transport
935 	   protocol's number." - RFC2367 */
936 	addr->sadb_address_proto = 0;
937 	addr->sadb_address_reserved = 0;
938 
939 	addr->sadb_address_prefixlen =
940 		pfkey_sockaddr_fill(&x->props.saddr, 0,
941 				    (struct sockaddr *) (addr + 1),
942 				    x->props.family);
943 	BUG_ON(!addr->sadb_address_prefixlen);
944 
945 	/* dst address */
946 	addr = skb_put(skb, sizeof(struct sadb_address) + sockaddr_size);
947 	addr->sadb_address_len =
948 		(sizeof(struct sadb_address)+sockaddr_size)/
949 			sizeof(uint64_t);
950 	addr->sadb_address_exttype = SADB_EXT_ADDRESS_DST;
951 	addr->sadb_address_proto = 0;
952 	addr->sadb_address_reserved = 0;
953 
954 	addr->sadb_address_prefixlen =
955 		pfkey_sockaddr_fill(&x->id.daddr, 0,
956 				    (struct sockaddr *) (addr + 1),
957 				    x->props.family);
958 	BUG_ON(!addr->sadb_address_prefixlen);
959 
960 	if (!xfrm_addr_equal(&x->sel.saddr, &x->props.saddr,
961 			     x->props.family)) {
962 		addr = skb_put(skb,
963 			       sizeof(struct sadb_address) + sockaddr_size);
964 		addr->sadb_address_len =
965 			(sizeof(struct sadb_address)+sockaddr_size)/
966 			sizeof(uint64_t);
967 		addr->sadb_address_exttype = SADB_EXT_ADDRESS_PROXY;
968 		addr->sadb_address_proto =
969 			pfkey_proto_from_xfrm(x->sel.proto);
970 		addr->sadb_address_prefixlen = x->sel.prefixlen_s;
971 		addr->sadb_address_reserved = 0;
972 
973 		pfkey_sockaddr_fill(&x->sel.saddr, x->sel.sport,
974 				    (struct sockaddr *) (addr + 1),
975 				    x->props.family);
976 	}
977 
978 	/* auth key */
979 	if (add_keys && auth_key_size) {
980 		key = skb_put(skb, sizeof(struct sadb_key) + auth_key_size);
981 		key->sadb_key_len = (sizeof(struct sadb_key) + auth_key_size) /
982 			sizeof(uint64_t);
983 		key->sadb_key_exttype = SADB_EXT_KEY_AUTH;
984 		key->sadb_key_bits = x->aalg->alg_key_len;
985 		key->sadb_key_reserved = 0;
986 		memcpy(key + 1, x->aalg->alg_key, (x->aalg->alg_key_len+7)/8);
987 	}
988 	/* encrypt key */
989 	if (add_keys && encrypt_key_size) {
990 		key = skb_put(skb, sizeof(struct sadb_key) + encrypt_key_size);
991 		key->sadb_key_len = (sizeof(struct sadb_key) +
992 				     encrypt_key_size) / sizeof(uint64_t);
993 		key->sadb_key_exttype = SADB_EXT_KEY_ENCRYPT;
994 		key->sadb_key_bits = x->ealg->alg_key_len;
995 		key->sadb_key_reserved = 0;
996 		memcpy(key + 1, x->ealg->alg_key,
997 		       (x->ealg->alg_key_len+7)/8);
998 	}
999 
1000 	/* sa */
1001 	sa2 = skb_put(skb, sizeof(struct sadb_x_sa2));
1002 	sa2->sadb_x_sa2_len = sizeof(struct sadb_x_sa2)/sizeof(uint64_t);
1003 	sa2->sadb_x_sa2_exttype = SADB_X_EXT_SA2;
1004 	if ((mode = pfkey_mode_from_xfrm(x->props.mode)) < 0) {
1005 		kfree_skb(skb);
1006 		return ERR_PTR(-EINVAL);
1007 	}
1008 	sa2->sadb_x_sa2_mode = mode;
1009 	sa2->sadb_x_sa2_reserved1 = 0;
1010 	sa2->sadb_x_sa2_reserved2 = 0;
1011 	sa2->sadb_x_sa2_sequence = 0;
1012 	sa2->sadb_x_sa2_reqid = x->props.reqid;
1013 
1014 	if (natt && natt->encap_type) {
1015 		struct sadb_x_nat_t_type *n_type;
1016 		struct sadb_x_nat_t_port *n_port;
1017 
1018 		/* type */
1019 		n_type = skb_put(skb, sizeof(*n_type));
1020 		n_type->sadb_x_nat_t_type_len = sizeof(*n_type)/sizeof(uint64_t);
1021 		n_type->sadb_x_nat_t_type_exttype = SADB_X_EXT_NAT_T_TYPE;
1022 		n_type->sadb_x_nat_t_type_type = natt->encap_type;
1023 		n_type->sadb_x_nat_t_type_reserved[0] = 0;
1024 		n_type->sadb_x_nat_t_type_reserved[1] = 0;
1025 		n_type->sadb_x_nat_t_type_reserved[2] = 0;
1026 
1027 		/* source port */
1028 		n_port = skb_put(skb, sizeof(*n_port));
1029 		n_port->sadb_x_nat_t_port_len = sizeof(*n_port)/sizeof(uint64_t);
1030 		n_port->sadb_x_nat_t_port_exttype = SADB_X_EXT_NAT_T_SPORT;
1031 		n_port->sadb_x_nat_t_port_port = natt->encap_sport;
1032 		n_port->sadb_x_nat_t_port_reserved = 0;
1033 
1034 		/* dest port */
1035 		n_port = skb_put(skb, sizeof(*n_port));
1036 		n_port->sadb_x_nat_t_port_len = sizeof(*n_port)/sizeof(uint64_t);
1037 		n_port->sadb_x_nat_t_port_exttype = SADB_X_EXT_NAT_T_DPORT;
1038 		n_port->sadb_x_nat_t_port_port = natt->encap_dport;
1039 		n_port->sadb_x_nat_t_port_reserved = 0;
1040 	}
1041 
1042 	/* security context */
1043 	if (xfrm_ctx) {
1044 		sec_ctx = skb_put(skb,
1045 				  sizeof(struct sadb_x_sec_ctx) + ctx_size);
1046 		sec_ctx->sadb_x_sec_len =
1047 		  (sizeof(struct sadb_x_sec_ctx) + ctx_size) / sizeof(uint64_t);
1048 		sec_ctx->sadb_x_sec_exttype = SADB_X_EXT_SEC_CTX;
1049 		sec_ctx->sadb_x_ctx_doi = xfrm_ctx->ctx_doi;
1050 		sec_ctx->sadb_x_ctx_alg = xfrm_ctx->ctx_alg;
1051 		sec_ctx->sadb_x_ctx_len = xfrm_ctx->ctx_len;
1052 		memcpy(sec_ctx + 1, xfrm_ctx->ctx_str,
1053 		       xfrm_ctx->ctx_len);
1054 	}
1055 
1056 	return skb;
1057 }
1058 
1059 
1060 static inline struct sk_buff *pfkey_xfrm_state2msg(const struct xfrm_state *x)
1061 {
1062 	struct sk_buff *skb;
1063 
1064 	skb = __pfkey_xfrm_state2msg(x, 1, 3);
1065 
1066 	return skb;
1067 }
1068 
1069 static inline struct sk_buff *pfkey_xfrm_state2msg_expire(const struct xfrm_state *x,
1070 							  int hsc)
1071 {
1072 	return __pfkey_xfrm_state2msg(x, 0, hsc);
1073 }
1074 
1075 static struct xfrm_state * pfkey_msg2xfrm_state(struct net *net,
1076 						const struct sadb_msg *hdr,
1077 						void * const *ext_hdrs)
1078 {
1079 	struct xfrm_state *x;
1080 	const struct sadb_lifetime *lifetime;
1081 	const struct sadb_sa *sa;
1082 	const struct sadb_key *key;
1083 	const struct sadb_x_sec_ctx *sec_ctx;
1084 	uint16_t proto;
1085 	int err;
1086 
1087 
1088 	sa = ext_hdrs[SADB_EXT_SA - 1];
1089 	if (!sa ||
1090 	    !present_and_same_family(ext_hdrs[SADB_EXT_ADDRESS_SRC-1],
1091 				     ext_hdrs[SADB_EXT_ADDRESS_DST-1]))
1092 		return ERR_PTR(-EINVAL);
1093 	if (hdr->sadb_msg_satype == SADB_SATYPE_ESP &&
1094 	    !ext_hdrs[SADB_EXT_KEY_ENCRYPT-1])
1095 		return ERR_PTR(-EINVAL);
1096 	if (hdr->sadb_msg_satype == SADB_SATYPE_AH &&
1097 	    !ext_hdrs[SADB_EXT_KEY_AUTH-1])
1098 		return ERR_PTR(-EINVAL);
1099 	if (!!ext_hdrs[SADB_EXT_LIFETIME_HARD-1] !=
1100 	    !!ext_hdrs[SADB_EXT_LIFETIME_SOFT-1])
1101 		return ERR_PTR(-EINVAL);
1102 
1103 	proto = pfkey_satype2proto(hdr->sadb_msg_satype);
1104 	if (proto == 0)
1105 		return ERR_PTR(-EINVAL);
1106 
1107 	/* default error is no buffer space */
1108 	err = -ENOBUFS;
1109 
1110 	/* RFC2367:
1111 
1112    Only SADB_SASTATE_MATURE SAs may be submitted in an SADB_ADD message.
1113    SADB_SASTATE_LARVAL SAs are created by SADB_GETSPI and it is not
1114    sensible to add a new SA in the DYING or SADB_SASTATE_DEAD state.
1115    Therefore, the sadb_sa_state field of all submitted SAs MUST be
1116    SADB_SASTATE_MATURE and the kernel MUST return an error if this is
1117    not true.
1118 
1119 	   However, KAME setkey always uses SADB_SASTATE_LARVAL.
1120 	   Hence, we have to _ignore_ sadb_sa_state, which is also reasonable.
1121 	 */
1122 	if (sa->sadb_sa_auth > SADB_AALG_MAX ||
1123 	    (hdr->sadb_msg_satype == SADB_X_SATYPE_IPCOMP &&
1124 	     sa->sadb_sa_encrypt > SADB_X_CALG_MAX) ||
1125 	    sa->sadb_sa_encrypt > SADB_EALG_MAX)
1126 		return ERR_PTR(-EINVAL);
1127 	key = ext_hdrs[SADB_EXT_KEY_AUTH - 1];
1128 	if (key != NULL &&
1129 	    sa->sadb_sa_auth != SADB_X_AALG_NULL &&
1130 	    key->sadb_key_bits == 0)
1131 		return ERR_PTR(-EINVAL);
1132 	key = ext_hdrs[SADB_EXT_KEY_ENCRYPT-1];
1133 	if (key != NULL &&
1134 	    sa->sadb_sa_encrypt != SADB_EALG_NULL &&
1135 	    key->sadb_key_bits == 0)
1136 		return ERR_PTR(-EINVAL);
1137 
1138 	x = xfrm_state_alloc(net);
1139 	if (x == NULL)
1140 		return ERR_PTR(-ENOBUFS);
1141 
1142 	x->id.proto = proto;
1143 	x->id.spi = sa->sadb_sa_spi;
1144 	x->props.replay_window = min_t(unsigned int, sa->sadb_sa_replay,
1145 					(sizeof(x->replay.bitmap) * 8));
1146 	if (sa->sadb_sa_flags & SADB_SAFLAGS_NOECN)
1147 		x->props.flags |= XFRM_STATE_NOECN;
1148 	if (sa->sadb_sa_flags & SADB_SAFLAGS_DECAP_DSCP)
1149 		x->props.flags |= XFRM_STATE_DECAP_DSCP;
1150 	if (sa->sadb_sa_flags & SADB_SAFLAGS_NOPMTUDISC)
1151 		x->props.flags |= XFRM_STATE_NOPMTUDISC;
1152 
1153 	lifetime = ext_hdrs[SADB_EXT_LIFETIME_HARD - 1];
1154 	if (lifetime != NULL) {
1155 		x->lft.hard_packet_limit = _KEY2X(lifetime->sadb_lifetime_allocations);
1156 		x->lft.hard_byte_limit = _KEY2X(lifetime->sadb_lifetime_bytes);
1157 		x->lft.hard_add_expires_seconds = lifetime->sadb_lifetime_addtime;
1158 		x->lft.hard_use_expires_seconds = lifetime->sadb_lifetime_usetime;
1159 	}
1160 	lifetime = ext_hdrs[SADB_EXT_LIFETIME_SOFT - 1];
1161 	if (lifetime != NULL) {
1162 		x->lft.soft_packet_limit = _KEY2X(lifetime->sadb_lifetime_allocations);
1163 		x->lft.soft_byte_limit = _KEY2X(lifetime->sadb_lifetime_bytes);
1164 		x->lft.soft_add_expires_seconds = lifetime->sadb_lifetime_addtime;
1165 		x->lft.soft_use_expires_seconds = lifetime->sadb_lifetime_usetime;
1166 	}
1167 
1168 	sec_ctx = ext_hdrs[SADB_X_EXT_SEC_CTX - 1];
1169 	if (sec_ctx != NULL) {
1170 		struct xfrm_user_sec_ctx *uctx = pfkey_sadb2xfrm_user_sec_ctx(sec_ctx, GFP_KERNEL);
1171 
1172 		if (!uctx)
1173 			goto out;
1174 
1175 		err = security_xfrm_state_alloc(x, uctx);
1176 		kfree(uctx);
1177 
1178 		if (err)
1179 			goto out;
1180 	}
1181 
1182 	err = -ENOBUFS;
1183 	key = ext_hdrs[SADB_EXT_KEY_AUTH - 1];
1184 	if (sa->sadb_sa_auth) {
1185 		int keysize = 0;
1186 		struct xfrm_algo_desc *a = xfrm_aalg_get_byid(sa->sadb_sa_auth);
1187 		if (!a || !a->pfkey_supported) {
1188 			err = -ENOSYS;
1189 			goto out;
1190 		}
1191 		if (key)
1192 			keysize = (key->sadb_key_bits + 7) / 8;
1193 		x->aalg = kmalloc(sizeof(*x->aalg) + keysize, GFP_KERNEL);
1194 		if (!x->aalg) {
1195 			err = -ENOMEM;
1196 			goto out;
1197 		}
1198 		strcpy(x->aalg->alg_name, a->name);
1199 		x->aalg->alg_key_len = 0;
1200 		if (key) {
1201 			x->aalg->alg_key_len = key->sadb_key_bits;
1202 			memcpy(x->aalg->alg_key, key+1, keysize);
1203 		}
1204 		x->aalg->alg_trunc_len = a->uinfo.auth.icv_truncbits;
1205 		x->props.aalgo = sa->sadb_sa_auth;
1206 		/* x->algo.flags = sa->sadb_sa_flags; */
1207 	}
1208 	if (sa->sadb_sa_encrypt) {
1209 		if (hdr->sadb_msg_satype == SADB_X_SATYPE_IPCOMP) {
1210 			struct xfrm_algo_desc *a = xfrm_calg_get_byid(sa->sadb_sa_encrypt);
1211 			if (!a || !a->pfkey_supported) {
1212 				err = -ENOSYS;
1213 				goto out;
1214 			}
1215 			x->calg = kmalloc_obj(*x->calg);
1216 			if (!x->calg) {
1217 				err = -ENOMEM;
1218 				goto out;
1219 			}
1220 			strcpy(x->calg->alg_name, a->name);
1221 			x->calg->alg_key_len = 0;
1222 			x->props.calgo = sa->sadb_sa_encrypt;
1223 		} else {
1224 			int keysize = 0;
1225 			struct xfrm_algo_desc *a = xfrm_ealg_get_byid(sa->sadb_sa_encrypt);
1226 			if (!a || !a->pfkey_supported) {
1227 				err = -ENOSYS;
1228 				goto out;
1229 			}
1230 			key = (struct sadb_key*) ext_hdrs[SADB_EXT_KEY_ENCRYPT-1];
1231 			if (key)
1232 				keysize = (key->sadb_key_bits + 7) / 8;
1233 			x->ealg = kmalloc(sizeof(*x->ealg) + keysize, GFP_KERNEL);
1234 			if (!x->ealg) {
1235 				err = -ENOMEM;
1236 				goto out;
1237 			}
1238 			strcpy(x->ealg->alg_name, a->name);
1239 			x->ealg->alg_key_len = 0;
1240 			if (key) {
1241 				x->ealg->alg_key_len = key->sadb_key_bits;
1242 				memcpy(x->ealg->alg_key, key+1, keysize);
1243 			}
1244 			x->props.ealgo = sa->sadb_sa_encrypt;
1245 			x->geniv = a->uinfo.encr.geniv;
1246 		}
1247 	}
1248 	/* x->algo.flags = sa->sadb_sa_flags; */
1249 
1250 	x->props.family = pfkey_sadb_addr2xfrm_addr((struct sadb_address *) ext_hdrs[SADB_EXT_ADDRESS_SRC-1],
1251 						    &x->props.saddr);
1252 	pfkey_sadb_addr2xfrm_addr((struct sadb_address *) ext_hdrs[SADB_EXT_ADDRESS_DST-1],
1253 				  &x->id.daddr);
1254 
1255 	if (ext_hdrs[SADB_X_EXT_SA2-1]) {
1256 		const struct sadb_x_sa2 *sa2 = ext_hdrs[SADB_X_EXT_SA2-1];
1257 		int mode = pfkey_mode_to_xfrm(sa2->sadb_x_sa2_mode);
1258 		if (mode < 0) {
1259 			err = -EINVAL;
1260 			goto out;
1261 		}
1262 		x->props.mode = mode;
1263 		x->props.reqid = sa2->sadb_x_sa2_reqid;
1264 	}
1265 
1266 	if (ext_hdrs[SADB_EXT_ADDRESS_PROXY-1]) {
1267 		const struct sadb_address *addr = ext_hdrs[SADB_EXT_ADDRESS_PROXY-1];
1268 
1269 		/* Nobody uses this, but we try. */
1270 		x->sel.family = pfkey_sadb_addr2xfrm_addr(addr, &x->sel.saddr);
1271 		x->sel.prefixlen_s = addr->sadb_address_prefixlen;
1272 	}
1273 
1274 	if (!x->sel.family)
1275 		x->sel.family = x->props.family;
1276 
1277 	if (ext_hdrs[SADB_X_EXT_NAT_T_TYPE-1]) {
1278 		const struct sadb_x_nat_t_type* n_type;
1279 		struct xfrm_encap_tmpl *natt;
1280 
1281 		x->encap = kzalloc_obj(*x->encap);
1282 		if (!x->encap) {
1283 			err = -ENOMEM;
1284 			goto out;
1285 		}
1286 
1287 		natt = x->encap;
1288 		n_type = ext_hdrs[SADB_X_EXT_NAT_T_TYPE-1];
1289 		natt->encap_type = n_type->sadb_x_nat_t_type_type;
1290 
1291 		if (ext_hdrs[SADB_X_EXT_NAT_T_SPORT-1]) {
1292 			const struct sadb_x_nat_t_port *n_port =
1293 				ext_hdrs[SADB_X_EXT_NAT_T_SPORT-1];
1294 			natt->encap_sport = n_port->sadb_x_nat_t_port_port;
1295 		}
1296 		if (ext_hdrs[SADB_X_EXT_NAT_T_DPORT-1]) {
1297 			const struct sadb_x_nat_t_port *n_port =
1298 				ext_hdrs[SADB_X_EXT_NAT_T_DPORT-1];
1299 			natt->encap_dport = n_port->sadb_x_nat_t_port_port;
1300 		}
1301 	}
1302 
1303 	err = xfrm_init_state(x, NULL);
1304 	if (err)
1305 		goto out;
1306 
1307 	x->km.seq = hdr->sadb_msg_seq;
1308 	return x;
1309 
1310 out:
1311 	x->km.state = XFRM_STATE_DEAD;
1312 	xfrm_state_put(x);
1313 	return ERR_PTR(err);
1314 }
1315 
1316 static int pfkey_reserved(struct sock *sk, struct sk_buff *skb, const struct sadb_msg *hdr, void * const *ext_hdrs)
1317 {
1318 	return -EOPNOTSUPP;
1319 }
1320 
1321 static int pfkey_getspi(struct sock *sk, struct sk_buff *skb, const struct sadb_msg *hdr, void * const *ext_hdrs)
1322 {
1323 	struct net *net = sock_net(sk);
1324 	struct sk_buff *resp_skb;
1325 	struct sadb_x_sa2 *sa2;
1326 	struct sadb_address *saddr, *daddr;
1327 	struct sadb_msg *out_hdr;
1328 	struct sadb_spirange *range;
1329 	struct xfrm_state *x = NULL;
1330 	int mode;
1331 	int err;
1332 	u32 min_spi, max_spi;
1333 	u32 reqid;
1334 	u8 proto;
1335 	unsigned short family;
1336 	xfrm_address_t *xsaddr = NULL, *xdaddr = NULL;
1337 
1338 	if (!present_and_same_family(ext_hdrs[SADB_EXT_ADDRESS_SRC-1],
1339 				     ext_hdrs[SADB_EXT_ADDRESS_DST-1]))
1340 		return -EINVAL;
1341 
1342 	proto = pfkey_satype2proto(hdr->sadb_msg_satype);
1343 	if (proto == 0)
1344 		return -EINVAL;
1345 
1346 	if ((sa2 = ext_hdrs[SADB_X_EXT_SA2-1]) != NULL) {
1347 		mode = pfkey_mode_to_xfrm(sa2->sadb_x_sa2_mode);
1348 		if (mode < 0)
1349 			return -EINVAL;
1350 		reqid = sa2->sadb_x_sa2_reqid;
1351 	} else {
1352 		mode = 0;
1353 		reqid = 0;
1354 	}
1355 
1356 	saddr = ext_hdrs[SADB_EXT_ADDRESS_SRC-1];
1357 	daddr = ext_hdrs[SADB_EXT_ADDRESS_DST-1];
1358 
1359 	family = ((struct sockaddr *)(saddr + 1))->sa_family;
1360 	switch (family) {
1361 	case AF_INET:
1362 		xdaddr = (xfrm_address_t *)&((struct sockaddr_in *)(daddr + 1))->sin_addr.s_addr;
1363 		xsaddr = (xfrm_address_t *)&((struct sockaddr_in *)(saddr + 1))->sin_addr.s_addr;
1364 		break;
1365 #if IS_ENABLED(CONFIG_IPV6)
1366 	case AF_INET6:
1367 		xdaddr = (xfrm_address_t *)&((struct sockaddr_in6 *)(daddr + 1))->sin6_addr;
1368 		xsaddr = (xfrm_address_t *)&((struct sockaddr_in6 *)(saddr + 1))->sin6_addr;
1369 		break;
1370 #endif
1371 	}
1372 
1373 	if (hdr->sadb_msg_seq) {
1374 		x = xfrm_find_acq_byseq(net, DUMMY_MARK, hdr->sadb_msg_seq, UINT_MAX);
1375 		if (x && !xfrm_addr_equal(&x->id.daddr, xdaddr, family)) {
1376 			xfrm_state_put(x);
1377 			x = NULL;
1378 		}
1379 	}
1380 
1381 	if (!x)
1382 		x = xfrm_find_acq(net, &dummy_mark, mode, reqid, 0, UINT_MAX,
1383 				  proto, xdaddr, xsaddr, 1, family);
1384 
1385 	if (x == NULL)
1386 		return -ENOENT;
1387 
1388 	min_spi = 0x100;
1389 	max_spi = 0x0fffffff;
1390 
1391 	range = ext_hdrs[SADB_EXT_SPIRANGE-1];
1392 	if (range) {
1393 		min_spi = range->sadb_spirange_min;
1394 		max_spi = range->sadb_spirange_max;
1395 	}
1396 
1397 	err = verify_spi_info(x->id.proto, min_spi, max_spi, NULL);
1398 	if (err) {
1399 		xfrm_state_put(x);
1400 		return err;
1401 	}
1402 
1403 	err = xfrm_alloc_spi(x, min_spi, max_spi, NULL);
1404 	resp_skb = err ? ERR_PTR(err) : pfkey_xfrm_state2msg(x);
1405 
1406 	if (IS_ERR(resp_skb)) {
1407 		xfrm_state_put(x);
1408 		return  PTR_ERR(resp_skb);
1409 	}
1410 
1411 	out_hdr = (struct sadb_msg *) resp_skb->data;
1412 	out_hdr->sadb_msg_version = hdr->sadb_msg_version;
1413 	out_hdr->sadb_msg_type = SADB_GETSPI;
1414 	out_hdr->sadb_msg_satype = pfkey_proto2satype(proto);
1415 	out_hdr->sadb_msg_errno = 0;
1416 	out_hdr->sadb_msg_reserved = 0;
1417 	out_hdr->sadb_msg_seq = hdr->sadb_msg_seq;
1418 	out_hdr->sadb_msg_pid = hdr->sadb_msg_pid;
1419 
1420 	xfrm_state_put(x);
1421 
1422 	pfkey_broadcast(resp_skb, GFP_KERNEL, BROADCAST_ONE, sk, net);
1423 
1424 	return 0;
1425 }
1426 
1427 static int pfkey_acquire(struct sock *sk, struct sk_buff *skb, const struct sadb_msg *hdr, void * const *ext_hdrs)
1428 {
1429 	struct net *net = sock_net(sk);
1430 	struct xfrm_state *x;
1431 
1432 	if (hdr->sadb_msg_len != sizeof(struct sadb_msg)/8)
1433 		return -EOPNOTSUPP;
1434 
1435 	if (hdr->sadb_msg_seq == 0 || hdr->sadb_msg_errno == 0)
1436 		return 0;
1437 
1438 	x = xfrm_find_acq_byseq(net, DUMMY_MARK, hdr->sadb_msg_seq, UINT_MAX);
1439 	if (x == NULL)
1440 		return 0;
1441 
1442 	spin_lock_bh(&x->lock);
1443 	if (x->km.state == XFRM_STATE_ACQ)
1444 		x->km.state = XFRM_STATE_ERROR;
1445 
1446 	spin_unlock_bh(&x->lock);
1447 	xfrm_state_put(x);
1448 	return 0;
1449 }
1450 
1451 static inline int event2poltype(int event)
1452 {
1453 	switch (event) {
1454 	case XFRM_MSG_DELPOLICY:
1455 		return SADB_X_SPDDELETE;
1456 	case XFRM_MSG_NEWPOLICY:
1457 		return SADB_X_SPDADD;
1458 	case XFRM_MSG_UPDPOLICY:
1459 		return SADB_X_SPDUPDATE;
1460 	case XFRM_MSG_POLEXPIRE:
1461 	//	return SADB_X_SPDEXPIRE;
1462 	default:
1463 		pr_err("pfkey: Unknown policy event %d\n", event);
1464 		break;
1465 	}
1466 
1467 	return 0;
1468 }
1469 
1470 static inline int event2keytype(int event)
1471 {
1472 	switch (event) {
1473 	case XFRM_MSG_DELSA:
1474 		return SADB_DELETE;
1475 	case XFRM_MSG_NEWSA:
1476 		return SADB_ADD;
1477 	case XFRM_MSG_UPDSA:
1478 		return SADB_UPDATE;
1479 	case XFRM_MSG_EXPIRE:
1480 		return SADB_EXPIRE;
1481 	default:
1482 		pr_err("pfkey: Unknown SA event %d\n", event);
1483 		break;
1484 	}
1485 
1486 	return 0;
1487 }
1488 
1489 /* ADD/UPD/DEL */
1490 static int key_notify_sa(struct xfrm_state *x, const struct km_event *c)
1491 {
1492 	struct sk_buff *skb;
1493 	struct sadb_msg *hdr;
1494 
1495 	skb = pfkey_xfrm_state2msg(x);
1496 
1497 	if (IS_ERR(skb))
1498 		return PTR_ERR(skb);
1499 
1500 	hdr = (struct sadb_msg *) skb->data;
1501 	hdr->sadb_msg_version = PF_KEY_V2;
1502 	hdr->sadb_msg_type = event2keytype(c->event);
1503 	hdr->sadb_msg_satype = pfkey_proto2satype(x->id.proto);
1504 	hdr->sadb_msg_errno = 0;
1505 	hdr->sadb_msg_reserved = 0;
1506 	hdr->sadb_msg_seq = c->seq;
1507 	hdr->sadb_msg_pid = c->portid;
1508 
1509 	pfkey_broadcast(skb, GFP_ATOMIC, BROADCAST_ALL, NULL, xs_net(x));
1510 
1511 	return 0;
1512 }
1513 
1514 static int pfkey_add(struct sock *sk, struct sk_buff *skb, const struct sadb_msg *hdr, void * const *ext_hdrs)
1515 {
1516 	struct net *net = sock_net(sk);
1517 	struct xfrm_state *x;
1518 	int err;
1519 	struct km_event c;
1520 
1521 	x = pfkey_msg2xfrm_state(net, hdr, ext_hdrs);
1522 	if (IS_ERR(x))
1523 		return PTR_ERR(x);
1524 
1525 	xfrm_state_hold(x);
1526 	if (hdr->sadb_msg_type == SADB_ADD)
1527 		err = xfrm_state_add(x);
1528 	else
1529 		err = xfrm_state_update(x);
1530 
1531 	xfrm_audit_state_add(x, err ? 0 : 1, true);
1532 
1533 	if (err < 0) {
1534 		x->km.state = XFRM_STATE_DEAD;
1535 		__xfrm_state_put(x);
1536 		goto out;
1537 	}
1538 
1539 	if (hdr->sadb_msg_type == SADB_ADD)
1540 		c.event = XFRM_MSG_NEWSA;
1541 	else
1542 		c.event = XFRM_MSG_UPDSA;
1543 	c.seq = hdr->sadb_msg_seq;
1544 	c.portid = hdr->sadb_msg_pid;
1545 	km_state_notify(x, &c);
1546 out:
1547 	xfrm_state_put(x);
1548 	return err;
1549 }
1550 
1551 static int pfkey_delete(struct sock *sk, struct sk_buff *skb, const struct sadb_msg *hdr, void * const *ext_hdrs)
1552 {
1553 	struct net *net = sock_net(sk);
1554 	struct xfrm_state *x;
1555 	struct km_event c;
1556 	int err;
1557 
1558 	if (!ext_hdrs[SADB_EXT_SA-1] ||
1559 	    !present_and_same_family(ext_hdrs[SADB_EXT_ADDRESS_SRC-1],
1560 				     ext_hdrs[SADB_EXT_ADDRESS_DST-1]))
1561 		return -EINVAL;
1562 
1563 	x = pfkey_xfrm_state_lookup(net, hdr, ext_hdrs);
1564 	if (x == NULL)
1565 		return -ESRCH;
1566 
1567 	if ((err = security_xfrm_state_delete(x)))
1568 		goto out;
1569 
1570 	if (xfrm_state_kern(x)) {
1571 		err = -EPERM;
1572 		goto out;
1573 	}
1574 
1575 	err = xfrm_state_delete(x);
1576 
1577 	if (err < 0)
1578 		goto out;
1579 
1580 	c.seq = hdr->sadb_msg_seq;
1581 	c.portid = hdr->sadb_msg_pid;
1582 	c.event = XFRM_MSG_DELSA;
1583 	km_state_notify(x, &c);
1584 out:
1585 	xfrm_audit_state_delete(x, err ? 0 : 1, true);
1586 	xfrm_state_put(x);
1587 
1588 	return err;
1589 }
1590 
1591 static int pfkey_get(struct sock *sk, struct sk_buff *skb, const struct sadb_msg *hdr, void * const *ext_hdrs)
1592 {
1593 	struct net *net = sock_net(sk);
1594 	__u8 proto;
1595 	struct sk_buff *out_skb;
1596 	struct sadb_msg *out_hdr;
1597 	struct xfrm_state *x;
1598 
1599 	if (!ext_hdrs[SADB_EXT_SA-1] ||
1600 	    !present_and_same_family(ext_hdrs[SADB_EXT_ADDRESS_SRC-1],
1601 				     ext_hdrs[SADB_EXT_ADDRESS_DST-1]))
1602 		return -EINVAL;
1603 
1604 	x = pfkey_xfrm_state_lookup(net, hdr, ext_hdrs);
1605 	if (x == NULL)
1606 		return -ESRCH;
1607 
1608 	out_skb = pfkey_xfrm_state2msg(x);
1609 	proto = x->id.proto;
1610 	xfrm_state_put(x);
1611 	if (IS_ERR(out_skb))
1612 		return  PTR_ERR(out_skb);
1613 
1614 	out_hdr = (struct sadb_msg *) out_skb->data;
1615 	out_hdr->sadb_msg_version = hdr->sadb_msg_version;
1616 	out_hdr->sadb_msg_type = SADB_GET;
1617 	out_hdr->sadb_msg_satype = pfkey_proto2satype(proto);
1618 	out_hdr->sadb_msg_errno = 0;
1619 	out_hdr->sadb_msg_reserved = 0;
1620 	out_hdr->sadb_msg_seq = hdr->sadb_msg_seq;
1621 	out_hdr->sadb_msg_pid = hdr->sadb_msg_pid;
1622 	pfkey_broadcast(out_skb, GFP_ATOMIC, BROADCAST_ONE, sk, sock_net(sk));
1623 
1624 	return 0;
1625 }
1626 
1627 static struct sk_buff *compose_sadb_supported(const struct sadb_msg *orig,
1628 					      gfp_t allocation)
1629 {
1630 	struct sk_buff *skb;
1631 	struct sadb_msg *hdr;
1632 	int len, auth_len, enc_len, i;
1633 
1634 	auth_len = xfrm_count_pfkey_auth_supported();
1635 	if (auth_len) {
1636 		auth_len *= sizeof(struct sadb_alg);
1637 		auth_len += sizeof(struct sadb_supported);
1638 	}
1639 
1640 	enc_len = xfrm_count_pfkey_enc_supported();
1641 	if (enc_len) {
1642 		enc_len *= sizeof(struct sadb_alg);
1643 		enc_len += sizeof(struct sadb_supported);
1644 	}
1645 
1646 	len = enc_len + auth_len + sizeof(struct sadb_msg);
1647 
1648 	skb = alloc_skb(len + 16, allocation);
1649 	if (!skb)
1650 		goto out_put_algs;
1651 
1652 	hdr = skb_put(skb, sizeof(*hdr));
1653 	pfkey_hdr_dup(hdr, orig);
1654 	hdr->sadb_msg_errno = 0;
1655 	hdr->sadb_msg_len = len / sizeof(uint64_t);
1656 
1657 	if (auth_len) {
1658 		struct sadb_supported *sp;
1659 		struct sadb_alg *ap;
1660 
1661 		sp = skb_put(skb, auth_len);
1662 		ap = (struct sadb_alg *) (sp + 1);
1663 
1664 		sp->sadb_supported_len = auth_len / sizeof(uint64_t);
1665 		sp->sadb_supported_exttype = SADB_EXT_SUPPORTED_AUTH;
1666 
1667 		for (i = 0; ; i++) {
1668 			struct xfrm_algo_desc *aalg = xfrm_aalg_get_byidx(i);
1669 			if (!aalg)
1670 				break;
1671 			if (!aalg->pfkey_supported)
1672 				continue;
1673 			if (aalg->available)
1674 				*ap++ = aalg->desc;
1675 		}
1676 	}
1677 
1678 	if (enc_len) {
1679 		struct sadb_supported *sp;
1680 		struct sadb_alg *ap;
1681 
1682 		sp = skb_put(skb, enc_len);
1683 		ap = (struct sadb_alg *) (sp + 1);
1684 
1685 		sp->sadb_supported_len = enc_len / sizeof(uint64_t);
1686 		sp->sadb_supported_exttype = SADB_EXT_SUPPORTED_ENCRYPT;
1687 
1688 		for (i = 0; ; i++) {
1689 			struct xfrm_algo_desc *ealg = xfrm_ealg_get_byidx(i);
1690 			if (!ealg)
1691 				break;
1692 			if (!ealg->pfkey_supported)
1693 				continue;
1694 			if (ealg->available)
1695 				*ap++ = ealg->desc;
1696 		}
1697 	}
1698 
1699 out_put_algs:
1700 	return skb;
1701 }
1702 
1703 static int pfkey_register(struct sock *sk, struct sk_buff *skb, const struct sadb_msg *hdr, void * const *ext_hdrs)
1704 {
1705 	struct pfkey_sock *pfk = pfkey_sk(sk);
1706 	struct sk_buff *supp_skb;
1707 
1708 	if (hdr->sadb_msg_satype > SADB_SATYPE_MAX)
1709 		return -EINVAL;
1710 
1711 	if (hdr->sadb_msg_satype != SADB_SATYPE_UNSPEC) {
1712 		if (pfk->registered&(1<<hdr->sadb_msg_satype))
1713 			return -EEXIST;
1714 		pfk->registered |= (1<<hdr->sadb_msg_satype);
1715 	}
1716 
1717 	mutex_lock(&pfkey_mutex);
1718 	xfrm_probe_algs();
1719 
1720 	supp_skb = compose_sadb_supported(hdr, GFP_KERNEL | __GFP_ZERO);
1721 	mutex_unlock(&pfkey_mutex);
1722 
1723 	if (!supp_skb) {
1724 		if (hdr->sadb_msg_satype != SADB_SATYPE_UNSPEC)
1725 			pfk->registered &= ~(1<<hdr->sadb_msg_satype);
1726 
1727 		return -ENOBUFS;
1728 	}
1729 
1730 	pfkey_broadcast(supp_skb, GFP_KERNEL, BROADCAST_REGISTERED, sk,
1731 			sock_net(sk));
1732 	return 0;
1733 }
1734 
1735 static int unicast_flush_resp(struct sock *sk, const struct sadb_msg *ihdr)
1736 {
1737 	struct sk_buff *skb;
1738 	struct sadb_msg *hdr;
1739 
1740 	skb = alloc_skb(sizeof(struct sadb_msg) + 16, GFP_ATOMIC);
1741 	if (!skb)
1742 		return -ENOBUFS;
1743 
1744 	hdr = skb_put_data(skb, ihdr, sizeof(struct sadb_msg));
1745 	hdr->sadb_msg_errno = (uint8_t) 0;
1746 	hdr->sadb_msg_len = (sizeof(struct sadb_msg) / sizeof(uint64_t));
1747 
1748 	return pfkey_broadcast(skb, GFP_ATOMIC, BROADCAST_ONE, sk,
1749 			       sock_net(sk));
1750 }
1751 
1752 static int key_notify_sa_flush(const struct km_event *c)
1753 {
1754 	struct sk_buff *skb;
1755 	struct sadb_msg *hdr;
1756 
1757 	skb = alloc_skb(sizeof(struct sadb_msg) + 16, GFP_ATOMIC);
1758 	if (!skb)
1759 		return -ENOBUFS;
1760 	hdr = skb_put(skb, sizeof(struct sadb_msg));
1761 	hdr->sadb_msg_satype = pfkey_proto2satype(c->data.proto);
1762 	hdr->sadb_msg_type = SADB_FLUSH;
1763 	hdr->sadb_msg_seq = c->seq;
1764 	hdr->sadb_msg_pid = c->portid;
1765 	hdr->sadb_msg_version = PF_KEY_V2;
1766 	hdr->sadb_msg_errno = (uint8_t) 0;
1767 	hdr->sadb_msg_len = (sizeof(struct sadb_msg) / sizeof(uint64_t));
1768 	hdr->sadb_msg_reserved = 0;
1769 
1770 	pfkey_broadcast(skb, GFP_ATOMIC, BROADCAST_ALL, NULL, c->net);
1771 
1772 	return 0;
1773 }
1774 
1775 static int pfkey_flush(struct sock *sk, struct sk_buff *skb, const struct sadb_msg *hdr, void * const *ext_hdrs)
1776 {
1777 	struct net *net = sock_net(sk);
1778 	unsigned int proto;
1779 	struct km_event c;
1780 	int err, err2;
1781 
1782 	proto = pfkey_satype2proto(hdr->sadb_msg_satype);
1783 	if (proto == 0)
1784 		return -EINVAL;
1785 
1786 	err = xfrm_state_flush(net, proto, true);
1787 	err2 = unicast_flush_resp(sk, hdr);
1788 	if (err || err2) {
1789 		if (err == -ESRCH) /* empty table - go quietly */
1790 			err = 0;
1791 		return err ? err : err2;
1792 	}
1793 
1794 	c.data.proto = proto;
1795 	c.seq = hdr->sadb_msg_seq;
1796 	c.portid = hdr->sadb_msg_pid;
1797 	c.event = XFRM_MSG_FLUSHSA;
1798 	c.net = net;
1799 	km_state_notify(NULL, &c);
1800 
1801 	return 0;
1802 }
1803 
1804 static int dump_sa(struct xfrm_state *x, int count, void *ptr)
1805 {
1806 	struct pfkey_sock *pfk = ptr;
1807 	struct sk_buff *out_skb;
1808 	struct sadb_msg *out_hdr;
1809 
1810 	if (!pfkey_can_dump(&pfk->sk))
1811 		return -ENOBUFS;
1812 
1813 	out_skb = pfkey_xfrm_state2msg(x);
1814 	if (IS_ERR(out_skb))
1815 		return PTR_ERR(out_skb);
1816 
1817 	out_hdr = (struct sadb_msg *) out_skb->data;
1818 	out_hdr->sadb_msg_version = pfk->dump.msg_version;
1819 	out_hdr->sadb_msg_type = SADB_DUMP;
1820 	out_hdr->sadb_msg_satype = pfkey_proto2satype(x->id.proto);
1821 	out_hdr->sadb_msg_errno = 0;
1822 	out_hdr->sadb_msg_reserved = 0;
1823 	out_hdr->sadb_msg_seq = count + 1;
1824 	out_hdr->sadb_msg_pid = pfk->dump.msg_portid;
1825 
1826 	if (pfk->dump.skb)
1827 		pfkey_broadcast(pfk->dump.skb, GFP_ATOMIC, BROADCAST_ONE,
1828 				&pfk->sk, sock_net(&pfk->sk));
1829 	pfk->dump.skb = out_skb;
1830 
1831 	return 0;
1832 }
1833 
1834 static int pfkey_dump_sa(struct pfkey_sock *pfk)
1835 {
1836 	struct net *net = sock_net(&pfk->sk);
1837 	return xfrm_state_walk(net, &pfk->dump.u.state, dump_sa, (void *) pfk);
1838 }
1839 
1840 static void pfkey_dump_sa_done(struct pfkey_sock *pfk)
1841 {
1842 	struct net *net = sock_net(&pfk->sk);
1843 
1844 	xfrm_state_walk_done(&pfk->dump.u.state, net);
1845 }
1846 
1847 static int pfkey_dump(struct sock *sk, struct sk_buff *skb, const struct sadb_msg *hdr, void * const *ext_hdrs)
1848 {
1849 	u8 proto;
1850 	struct xfrm_address_filter *filter = NULL;
1851 	struct pfkey_sock *pfk = pfkey_sk(sk);
1852 
1853 	mutex_lock(&pfk->dump_lock);
1854 	if (pfk->dump.dump != NULL) {
1855 		mutex_unlock(&pfk->dump_lock);
1856 		return -EBUSY;
1857 	}
1858 
1859 	proto = pfkey_satype2proto(hdr->sadb_msg_satype);
1860 	if (proto == 0) {
1861 		mutex_unlock(&pfk->dump_lock);
1862 		return -EINVAL;
1863 	}
1864 
1865 	if (ext_hdrs[SADB_X_EXT_FILTER - 1]) {
1866 		struct sadb_x_filter *xfilter = ext_hdrs[SADB_X_EXT_FILTER - 1];
1867 
1868 		if ((xfilter->sadb_x_filter_splen >
1869 			(sizeof(xfrm_address_t) << 3)) ||
1870 		    (xfilter->sadb_x_filter_dplen >
1871 			(sizeof(xfrm_address_t) << 3))) {
1872 			mutex_unlock(&pfk->dump_lock);
1873 			return -EINVAL;
1874 		}
1875 		filter = kmalloc_obj(*filter);
1876 		if (filter == NULL) {
1877 			mutex_unlock(&pfk->dump_lock);
1878 			return -ENOMEM;
1879 		}
1880 
1881 		memcpy(&filter->saddr, &xfilter->sadb_x_filter_saddr,
1882 		       sizeof(xfrm_address_t));
1883 		memcpy(&filter->daddr, &xfilter->sadb_x_filter_daddr,
1884 		       sizeof(xfrm_address_t));
1885 		filter->family = xfilter->sadb_x_filter_family;
1886 		filter->splen = xfilter->sadb_x_filter_splen;
1887 		filter->dplen = xfilter->sadb_x_filter_dplen;
1888 	}
1889 
1890 	pfk->dump.msg_version = hdr->sadb_msg_version;
1891 	pfk->dump.msg_portid = hdr->sadb_msg_pid;
1892 	pfk->dump.dump = pfkey_dump_sa;
1893 	pfk->dump.done = pfkey_dump_sa_done;
1894 	xfrm_state_walk_init(&pfk->dump.u.state, proto, filter);
1895 	mutex_unlock(&pfk->dump_lock);
1896 
1897 	return pfkey_do_dump(pfk);
1898 }
1899 
1900 static int pfkey_promisc(struct sock *sk, struct sk_buff *skb, const struct sadb_msg *hdr, void * const *ext_hdrs)
1901 {
1902 	struct pfkey_sock *pfk = pfkey_sk(sk);
1903 	int satype = hdr->sadb_msg_satype;
1904 	bool reset_errno = false;
1905 
1906 	if (hdr->sadb_msg_len == (sizeof(*hdr) / sizeof(uint64_t))) {
1907 		reset_errno = true;
1908 		if (satype != 0 && satype != 1)
1909 			return -EINVAL;
1910 		pfk->promisc = satype;
1911 	}
1912 	if (reset_errno && skb_cloned(skb))
1913 		skb = skb_copy(skb, GFP_KERNEL);
1914 	else
1915 		skb = skb_clone(skb, GFP_KERNEL);
1916 
1917 	if (reset_errno && skb) {
1918 		struct sadb_msg *new_hdr = (struct sadb_msg *) skb->data;
1919 		new_hdr->sadb_msg_errno = 0;
1920 	}
1921 
1922 	pfkey_broadcast(skb, GFP_KERNEL, BROADCAST_ALL, NULL, sock_net(sk));
1923 	return 0;
1924 }
1925 
1926 static int check_reqid(struct xfrm_policy *xp, int dir, int count, void *ptr)
1927 {
1928 	int i;
1929 	u32 reqid = *(u32*)ptr;
1930 
1931 	for (i=0; i<xp->xfrm_nr; i++) {
1932 		if (xp->xfrm_vec[i].reqid == reqid)
1933 			return -EEXIST;
1934 	}
1935 	return 0;
1936 }
1937 
1938 static u32 gen_reqid(struct net *net)
1939 {
1940 	struct xfrm_policy_walk walk;
1941 	u32 start;
1942 	int rc;
1943 	static u32 reqid = IPSEC_MANUAL_REQID_MAX;
1944 
1945 	start = reqid;
1946 	do {
1947 		++reqid;
1948 		if (reqid == 0)
1949 			reqid = IPSEC_MANUAL_REQID_MAX+1;
1950 		xfrm_policy_walk_init(&walk, XFRM_POLICY_TYPE_MAIN);
1951 		rc = xfrm_policy_walk(net, &walk, check_reqid, (void*)&reqid);
1952 		xfrm_policy_walk_done(&walk, net);
1953 		if (rc != -EEXIST)
1954 			return reqid;
1955 	} while (reqid != start);
1956 	return 0;
1957 }
1958 
1959 static int
1960 parse_ipsecrequest(struct xfrm_policy *xp, struct sadb_x_policy *pol,
1961 		   struct sadb_x_ipsecrequest *rq)
1962 {
1963 	struct net *net = xp_net(xp);
1964 	struct xfrm_tmpl *t = xp->xfrm_vec + xp->xfrm_nr;
1965 	int mode;
1966 
1967 	if (xp->xfrm_nr >= XFRM_MAX_DEPTH)
1968 		return -ELOOP;
1969 
1970 	if (rq->sadb_x_ipsecrequest_mode == 0)
1971 		return -EINVAL;
1972 	if (!xfrm_id_proto_valid(rq->sadb_x_ipsecrequest_proto))
1973 		return -EINVAL;
1974 
1975 	t->id.proto = rq->sadb_x_ipsecrequest_proto;
1976 	if ((mode = pfkey_mode_to_xfrm(rq->sadb_x_ipsecrequest_mode)) < 0)
1977 		return -EINVAL;
1978 	t->mode = mode;
1979 	if (rq->sadb_x_ipsecrequest_level == IPSEC_LEVEL_USE) {
1980 		if ((mode == XFRM_MODE_TUNNEL || mode == XFRM_MODE_BEET) &&
1981 		    pol->sadb_x_policy_dir == IPSEC_DIR_OUTBOUND)
1982 			return -EINVAL;
1983 		t->optional = 1;
1984 	} else if (rq->sadb_x_ipsecrequest_level == IPSEC_LEVEL_UNIQUE) {
1985 		t->reqid = rq->sadb_x_ipsecrequest_reqid;
1986 		if (t->reqid > IPSEC_MANUAL_REQID_MAX)
1987 			t->reqid = 0;
1988 		if (!t->reqid && !(t->reqid = gen_reqid(net)))
1989 			return -ENOBUFS;
1990 	}
1991 
1992 	/* addresses present only in tunnel mode */
1993 	if (t->mode == XFRM_MODE_TUNNEL) {
1994 		int err;
1995 
1996 		err = parse_sockaddr_pair(
1997 			(struct sockaddr *)(rq + 1),
1998 			rq->sadb_x_ipsecrequest_len - sizeof(*rq),
1999 			&t->saddr, &t->id.daddr, &t->encap_family);
2000 		if (err)
2001 			return err;
2002 	} else
2003 		t->encap_family = xp->family;
2004 
2005 	/* No way to set this via kame pfkey */
2006 	t->allalgs = 1;
2007 	xp->xfrm_nr++;
2008 	return 0;
2009 }
2010 
2011 static int
2012 parse_ipsecrequests(struct xfrm_policy *xp, struct sadb_x_policy *pol)
2013 {
2014 	int err;
2015 	int len = pol->sadb_x_policy_len*8 - sizeof(struct sadb_x_policy);
2016 	struct sadb_x_ipsecrequest *rq = (void*)(pol+1);
2017 
2018 	if (pol->sadb_x_policy_len * 8 < sizeof(struct sadb_x_policy))
2019 		return -EINVAL;
2020 
2021 	while (len >= sizeof(*rq)) {
2022 		if (len < rq->sadb_x_ipsecrequest_len ||
2023 		    rq->sadb_x_ipsecrequest_len < sizeof(*rq))
2024 			return -EINVAL;
2025 
2026 		if ((err = parse_ipsecrequest(xp, pol, rq)) < 0)
2027 			return err;
2028 		len -= rq->sadb_x_ipsecrequest_len;
2029 		rq = (void*)((u8*)rq + rq->sadb_x_ipsecrequest_len);
2030 	}
2031 	return 0;
2032 }
2033 
2034 static inline int pfkey_xfrm_policy2sec_ctx_size(const struct xfrm_policy *xp)
2035 {
2036 	struct xfrm_sec_ctx *xfrm_ctx = xp->security;
2037 
2038 	if (xfrm_ctx) {
2039 		int len = sizeof(struct sadb_x_sec_ctx);
2040 		len += xfrm_ctx->ctx_len;
2041 		return PFKEY_ALIGN8(len);
2042 	}
2043 	return 0;
2044 }
2045 
2046 static int pfkey_xfrm_policy2msg_size(const struct xfrm_policy *xp)
2047 {
2048 	const struct xfrm_tmpl *t;
2049 	int sockaddr_size = pfkey_sockaddr_size(xp->family);
2050 	int socklen = 0;
2051 	int i;
2052 
2053 	for (i=0; i<xp->xfrm_nr; i++) {
2054 		t = xp->xfrm_vec + i;
2055 		socklen += pfkey_sockaddr_len(t->encap_family);
2056 	}
2057 
2058 	return sizeof(struct sadb_msg) +
2059 		(sizeof(struct sadb_lifetime) * 3) +
2060 		(sizeof(struct sadb_address) * 2) +
2061 		(sockaddr_size * 2) +
2062 		sizeof(struct sadb_x_policy) +
2063 		(xp->xfrm_nr * sizeof(struct sadb_x_ipsecrequest)) +
2064 		(socklen * 2) +
2065 		pfkey_xfrm_policy2sec_ctx_size(xp);
2066 }
2067 
2068 static struct sk_buff * pfkey_xfrm_policy2msg_prep(const struct xfrm_policy *xp)
2069 {
2070 	struct sk_buff *skb;
2071 	int size;
2072 
2073 	size = pfkey_xfrm_policy2msg_size(xp);
2074 
2075 	skb =  alloc_skb(size + 16, GFP_ATOMIC);
2076 	if (skb == NULL)
2077 		return ERR_PTR(-ENOBUFS);
2078 
2079 	return skb;
2080 }
2081 
2082 static int pfkey_xfrm_policy2msg(struct sk_buff *skb, const struct xfrm_policy *xp, int dir)
2083 {
2084 	struct sadb_msg *hdr;
2085 	struct sadb_address *addr;
2086 	struct sadb_lifetime *lifetime;
2087 	struct sadb_x_policy *pol;
2088 	struct sadb_x_sec_ctx *sec_ctx;
2089 	struct xfrm_sec_ctx *xfrm_ctx;
2090 	int i;
2091 	int size;
2092 	int sockaddr_size = pfkey_sockaddr_size(xp->family);
2093 	int socklen = pfkey_sockaddr_len(xp->family);
2094 
2095 	size = pfkey_xfrm_policy2msg_size(xp);
2096 
2097 	/* call should fill header later */
2098 	hdr = skb_put(skb, sizeof(struct sadb_msg));
2099 	memset(hdr, 0, size);	/* XXX do we need this ? */
2100 
2101 	/* src address */
2102 	addr = skb_put(skb, sizeof(struct sadb_address) + sockaddr_size);
2103 	addr->sadb_address_len =
2104 		(sizeof(struct sadb_address)+sockaddr_size)/
2105 			sizeof(uint64_t);
2106 	addr->sadb_address_exttype = SADB_EXT_ADDRESS_SRC;
2107 	addr->sadb_address_proto = pfkey_proto_from_xfrm(xp->selector.proto);
2108 	addr->sadb_address_prefixlen = xp->selector.prefixlen_s;
2109 	addr->sadb_address_reserved = 0;
2110 	if (!pfkey_sockaddr_fill(&xp->selector.saddr,
2111 				 xp->selector.sport,
2112 				 (struct sockaddr *) (addr + 1),
2113 				 xp->family))
2114 		BUG();
2115 
2116 	/* dst address */
2117 	addr = skb_put(skb, sizeof(struct sadb_address) + sockaddr_size);
2118 	addr->sadb_address_len =
2119 		(sizeof(struct sadb_address)+sockaddr_size)/
2120 			sizeof(uint64_t);
2121 	addr->sadb_address_exttype = SADB_EXT_ADDRESS_DST;
2122 	addr->sadb_address_proto = pfkey_proto_from_xfrm(xp->selector.proto);
2123 	addr->sadb_address_prefixlen = xp->selector.prefixlen_d;
2124 	addr->sadb_address_reserved = 0;
2125 
2126 	pfkey_sockaddr_fill(&xp->selector.daddr, xp->selector.dport,
2127 			    (struct sockaddr *) (addr + 1),
2128 			    xp->family);
2129 
2130 	/* hard time */
2131 	lifetime = skb_put(skb, sizeof(struct sadb_lifetime));
2132 	lifetime->sadb_lifetime_len =
2133 		sizeof(struct sadb_lifetime)/sizeof(uint64_t);
2134 	lifetime->sadb_lifetime_exttype = SADB_EXT_LIFETIME_HARD;
2135 	lifetime->sadb_lifetime_allocations =  _X2KEY(xp->lft.hard_packet_limit);
2136 	lifetime->sadb_lifetime_bytes = _X2KEY(xp->lft.hard_byte_limit);
2137 	lifetime->sadb_lifetime_addtime = xp->lft.hard_add_expires_seconds;
2138 	lifetime->sadb_lifetime_usetime = xp->lft.hard_use_expires_seconds;
2139 	/* soft time */
2140 	lifetime = skb_put(skb, sizeof(struct sadb_lifetime));
2141 	lifetime->sadb_lifetime_len =
2142 		sizeof(struct sadb_lifetime)/sizeof(uint64_t);
2143 	lifetime->sadb_lifetime_exttype = SADB_EXT_LIFETIME_SOFT;
2144 	lifetime->sadb_lifetime_allocations =  _X2KEY(xp->lft.soft_packet_limit);
2145 	lifetime->sadb_lifetime_bytes = _X2KEY(xp->lft.soft_byte_limit);
2146 	lifetime->sadb_lifetime_addtime = xp->lft.soft_add_expires_seconds;
2147 	lifetime->sadb_lifetime_usetime = xp->lft.soft_use_expires_seconds;
2148 	/* current time */
2149 	lifetime = skb_put(skb, sizeof(struct sadb_lifetime));
2150 	lifetime->sadb_lifetime_len =
2151 		sizeof(struct sadb_lifetime)/sizeof(uint64_t);
2152 	lifetime->sadb_lifetime_exttype = SADB_EXT_LIFETIME_CURRENT;
2153 	lifetime->sadb_lifetime_allocations = xp->curlft.packets;
2154 	lifetime->sadb_lifetime_bytes = xp->curlft.bytes;
2155 	lifetime->sadb_lifetime_addtime = xp->curlft.add_time;
2156 	lifetime->sadb_lifetime_usetime = xp->curlft.use_time;
2157 
2158 	pol = skb_put(skb, sizeof(struct sadb_x_policy));
2159 	pol->sadb_x_policy_len = sizeof(struct sadb_x_policy)/sizeof(uint64_t);
2160 	pol->sadb_x_policy_exttype = SADB_X_EXT_POLICY;
2161 	pol->sadb_x_policy_type = IPSEC_POLICY_DISCARD;
2162 	if (xp->action == XFRM_POLICY_ALLOW) {
2163 		if (xp->xfrm_nr)
2164 			pol->sadb_x_policy_type = IPSEC_POLICY_IPSEC;
2165 		else
2166 			pol->sadb_x_policy_type = IPSEC_POLICY_NONE;
2167 	}
2168 	pol->sadb_x_policy_dir = dir+1;
2169 	pol->sadb_x_policy_reserved = 0;
2170 	pol->sadb_x_policy_id = xp->index;
2171 	pol->sadb_x_policy_priority = xp->priority;
2172 
2173 	for (i=0; i<xp->xfrm_nr; i++) {
2174 		const struct xfrm_tmpl *t = xp->xfrm_vec + i;
2175 		struct sadb_x_ipsecrequest *rq;
2176 		int req_size;
2177 		int mode;
2178 
2179 		req_size = sizeof(struct sadb_x_ipsecrequest);
2180 		if (t->mode == XFRM_MODE_TUNNEL) {
2181 			socklen = pfkey_sockaddr_len(t->encap_family);
2182 			req_size += socklen * 2;
2183 		} else {
2184 			size -= 2*socklen;
2185 		}
2186 		rq = skb_put(skb, req_size);
2187 		pol->sadb_x_policy_len += req_size/8;
2188 		memset(rq, 0, sizeof(*rq));
2189 		rq->sadb_x_ipsecrequest_len = req_size;
2190 		rq->sadb_x_ipsecrequest_proto = t->id.proto;
2191 		if ((mode = pfkey_mode_from_xfrm(t->mode)) < 0)
2192 			return -EINVAL;
2193 		rq->sadb_x_ipsecrequest_mode = mode;
2194 		rq->sadb_x_ipsecrequest_level = IPSEC_LEVEL_REQUIRE;
2195 		if (t->reqid)
2196 			rq->sadb_x_ipsecrequest_level = IPSEC_LEVEL_UNIQUE;
2197 		if (t->optional)
2198 			rq->sadb_x_ipsecrequest_level = IPSEC_LEVEL_USE;
2199 		rq->sadb_x_ipsecrequest_reqid = t->reqid;
2200 
2201 		if (t->mode == XFRM_MODE_TUNNEL) {
2202 			u8 *sa = (void *)(rq + 1);
2203 			pfkey_sockaddr_fill(&t->saddr, 0,
2204 					    (struct sockaddr *)sa,
2205 					    t->encap_family);
2206 			pfkey_sockaddr_fill(&t->id.daddr, 0,
2207 					    (struct sockaddr *) (sa + socklen),
2208 					    t->encap_family);
2209 		}
2210 	}
2211 
2212 	/* security context */
2213 	if ((xfrm_ctx = xp->security)) {
2214 		int ctx_size = pfkey_xfrm_policy2sec_ctx_size(xp);
2215 
2216 		sec_ctx = skb_put(skb, ctx_size);
2217 		sec_ctx->sadb_x_sec_len = ctx_size / sizeof(uint64_t);
2218 		sec_ctx->sadb_x_sec_exttype = SADB_X_EXT_SEC_CTX;
2219 		sec_ctx->sadb_x_ctx_doi = xfrm_ctx->ctx_doi;
2220 		sec_ctx->sadb_x_ctx_alg = xfrm_ctx->ctx_alg;
2221 		sec_ctx->sadb_x_ctx_len = xfrm_ctx->ctx_len;
2222 		memcpy(sec_ctx + 1, xfrm_ctx->ctx_str,
2223 		       xfrm_ctx->ctx_len);
2224 	}
2225 
2226 	hdr->sadb_msg_len = size / sizeof(uint64_t);
2227 	hdr->sadb_msg_reserved = refcount_read(&xp->refcnt);
2228 
2229 	return 0;
2230 }
2231 
2232 static int key_notify_policy(struct xfrm_policy *xp, int dir, const struct km_event *c)
2233 {
2234 	struct sk_buff *out_skb;
2235 	struct sadb_msg *out_hdr;
2236 	int err;
2237 
2238 	out_skb = pfkey_xfrm_policy2msg_prep(xp);
2239 	if (IS_ERR(out_skb))
2240 		return PTR_ERR(out_skb);
2241 
2242 	err = pfkey_xfrm_policy2msg(out_skb, xp, dir);
2243 	if (err < 0) {
2244 		kfree_skb(out_skb);
2245 		return err;
2246 	}
2247 
2248 	out_hdr = (struct sadb_msg *) out_skb->data;
2249 	out_hdr->sadb_msg_version = PF_KEY_V2;
2250 
2251 	if (c->data.byid && c->event == XFRM_MSG_DELPOLICY)
2252 		out_hdr->sadb_msg_type = SADB_X_SPDDELETE2;
2253 	else
2254 		out_hdr->sadb_msg_type = event2poltype(c->event);
2255 	out_hdr->sadb_msg_errno = 0;
2256 	out_hdr->sadb_msg_seq = c->seq;
2257 	out_hdr->sadb_msg_pid = c->portid;
2258 	pfkey_broadcast(out_skb, GFP_ATOMIC, BROADCAST_ALL, NULL, xp_net(xp));
2259 	return 0;
2260 
2261 }
2262 
2263 static int pfkey_spdadd(struct sock *sk, struct sk_buff *skb, const struct sadb_msg *hdr, void * const *ext_hdrs)
2264 {
2265 	struct net *net = sock_net(sk);
2266 	int err = 0;
2267 	struct sadb_lifetime *lifetime;
2268 	struct sadb_address *sa;
2269 	struct sadb_x_policy *pol;
2270 	struct xfrm_policy *xp;
2271 	struct km_event c;
2272 	struct sadb_x_sec_ctx *sec_ctx;
2273 
2274 	if (!present_and_same_family(ext_hdrs[SADB_EXT_ADDRESS_SRC-1],
2275 				     ext_hdrs[SADB_EXT_ADDRESS_DST-1]) ||
2276 	    !ext_hdrs[SADB_X_EXT_POLICY-1])
2277 		return -EINVAL;
2278 
2279 	pol = ext_hdrs[SADB_X_EXT_POLICY-1];
2280 	if (pol->sadb_x_policy_type > IPSEC_POLICY_IPSEC)
2281 		return -EINVAL;
2282 	if (!pol->sadb_x_policy_dir || pol->sadb_x_policy_dir >= IPSEC_DIR_MAX)
2283 		return -EINVAL;
2284 
2285 	xp = xfrm_policy_alloc(net, GFP_KERNEL);
2286 	if (xp == NULL)
2287 		return -ENOBUFS;
2288 
2289 	xp->action = (pol->sadb_x_policy_type == IPSEC_POLICY_DISCARD ?
2290 		      XFRM_POLICY_BLOCK : XFRM_POLICY_ALLOW);
2291 	xp->priority = pol->sadb_x_policy_priority;
2292 
2293 	sa = ext_hdrs[SADB_EXT_ADDRESS_SRC-1];
2294 	xp->family = pfkey_sadb_addr2xfrm_addr(sa, &xp->selector.saddr);
2295 	xp->selector.family = xp->family;
2296 	xp->selector.prefixlen_s = sa->sadb_address_prefixlen;
2297 	xp->selector.proto = pfkey_proto_to_xfrm(sa->sadb_address_proto);
2298 	xp->selector.sport = ((struct sockaddr_in *)(sa+1))->sin_port;
2299 	if (xp->selector.sport)
2300 		xp->selector.sport_mask = htons(0xffff);
2301 
2302 	sa = ext_hdrs[SADB_EXT_ADDRESS_DST-1];
2303 	pfkey_sadb_addr2xfrm_addr(sa, &xp->selector.daddr);
2304 	xp->selector.prefixlen_d = sa->sadb_address_prefixlen;
2305 
2306 	/* Amusing, we set this twice.  KAME apps appear to set same value
2307 	 * in both addresses.
2308 	 */
2309 	xp->selector.proto = pfkey_proto_to_xfrm(sa->sadb_address_proto);
2310 
2311 	xp->selector.dport = ((struct sockaddr_in *)(sa+1))->sin_port;
2312 	if (xp->selector.dport)
2313 		xp->selector.dport_mask = htons(0xffff);
2314 
2315 	sec_ctx = ext_hdrs[SADB_X_EXT_SEC_CTX - 1];
2316 	if (sec_ctx != NULL) {
2317 		struct xfrm_user_sec_ctx *uctx = pfkey_sadb2xfrm_user_sec_ctx(sec_ctx, GFP_KERNEL);
2318 
2319 		if (!uctx) {
2320 			err = -ENOBUFS;
2321 			goto out;
2322 		}
2323 
2324 		err = security_xfrm_policy_alloc(&xp->security, uctx, GFP_KERNEL);
2325 		kfree(uctx);
2326 
2327 		if (err)
2328 			goto out;
2329 	}
2330 
2331 	xp->lft.soft_byte_limit = XFRM_INF;
2332 	xp->lft.hard_byte_limit = XFRM_INF;
2333 	xp->lft.soft_packet_limit = XFRM_INF;
2334 	xp->lft.hard_packet_limit = XFRM_INF;
2335 	if ((lifetime = ext_hdrs[SADB_EXT_LIFETIME_HARD-1]) != NULL) {
2336 		xp->lft.hard_packet_limit = _KEY2X(lifetime->sadb_lifetime_allocations);
2337 		xp->lft.hard_byte_limit = _KEY2X(lifetime->sadb_lifetime_bytes);
2338 		xp->lft.hard_add_expires_seconds = lifetime->sadb_lifetime_addtime;
2339 		xp->lft.hard_use_expires_seconds = lifetime->sadb_lifetime_usetime;
2340 	}
2341 	if ((lifetime = ext_hdrs[SADB_EXT_LIFETIME_SOFT-1]) != NULL) {
2342 		xp->lft.soft_packet_limit = _KEY2X(lifetime->sadb_lifetime_allocations);
2343 		xp->lft.soft_byte_limit = _KEY2X(lifetime->sadb_lifetime_bytes);
2344 		xp->lft.soft_add_expires_seconds = lifetime->sadb_lifetime_addtime;
2345 		xp->lft.soft_use_expires_seconds = lifetime->sadb_lifetime_usetime;
2346 	}
2347 	xp->xfrm_nr = 0;
2348 	if (pol->sadb_x_policy_type == IPSEC_POLICY_IPSEC &&
2349 	    (err = parse_ipsecrequests(xp, pol)) < 0)
2350 		goto out;
2351 
2352 	err = xfrm_policy_insert(pol->sadb_x_policy_dir-1, xp,
2353 				 hdr->sadb_msg_type != SADB_X_SPDUPDATE);
2354 
2355 	xfrm_audit_policy_add(xp, err ? 0 : 1, true);
2356 
2357 	if (err)
2358 		goto out;
2359 
2360 	if (hdr->sadb_msg_type == SADB_X_SPDUPDATE)
2361 		c.event = XFRM_MSG_UPDPOLICY;
2362 	else
2363 		c.event = XFRM_MSG_NEWPOLICY;
2364 
2365 	c.seq = hdr->sadb_msg_seq;
2366 	c.portid = hdr->sadb_msg_pid;
2367 
2368 	km_policy_notify(xp, pol->sadb_x_policy_dir-1, &c);
2369 	xfrm_pol_put(xp);
2370 	return 0;
2371 
2372 out:
2373 	xp->walk.dead = 1;
2374 	xfrm_policy_destroy(xp);
2375 	return err;
2376 }
2377 
2378 static int pfkey_spddelete(struct sock *sk, struct sk_buff *skb, const struct sadb_msg *hdr, void * const *ext_hdrs)
2379 {
2380 	struct net *net = sock_net(sk);
2381 	int err;
2382 	struct sadb_address *sa;
2383 	struct sadb_x_policy *pol;
2384 	struct xfrm_policy *xp;
2385 	struct xfrm_selector sel;
2386 	struct km_event c;
2387 	struct sadb_x_sec_ctx *sec_ctx;
2388 	struct xfrm_sec_ctx *pol_ctx = NULL;
2389 
2390 	if (!present_and_same_family(ext_hdrs[SADB_EXT_ADDRESS_SRC-1],
2391 				     ext_hdrs[SADB_EXT_ADDRESS_DST-1]) ||
2392 	    !ext_hdrs[SADB_X_EXT_POLICY-1])
2393 		return -EINVAL;
2394 
2395 	pol = ext_hdrs[SADB_X_EXT_POLICY-1];
2396 	if (!pol->sadb_x_policy_dir || pol->sadb_x_policy_dir >= IPSEC_DIR_MAX)
2397 		return -EINVAL;
2398 
2399 	memset(&sel, 0, sizeof(sel));
2400 
2401 	sa = ext_hdrs[SADB_EXT_ADDRESS_SRC-1];
2402 	sel.family = pfkey_sadb_addr2xfrm_addr(sa, &sel.saddr);
2403 	sel.prefixlen_s = sa->sadb_address_prefixlen;
2404 	sel.proto = pfkey_proto_to_xfrm(sa->sadb_address_proto);
2405 	sel.sport = ((struct sockaddr_in *)(sa+1))->sin_port;
2406 	if (sel.sport)
2407 		sel.sport_mask = htons(0xffff);
2408 
2409 	sa = ext_hdrs[SADB_EXT_ADDRESS_DST-1];
2410 	pfkey_sadb_addr2xfrm_addr(sa, &sel.daddr);
2411 	sel.prefixlen_d = sa->sadb_address_prefixlen;
2412 	sel.proto = pfkey_proto_to_xfrm(sa->sadb_address_proto);
2413 	sel.dport = ((struct sockaddr_in *)(sa+1))->sin_port;
2414 	if (sel.dport)
2415 		sel.dport_mask = htons(0xffff);
2416 
2417 	sec_ctx = ext_hdrs[SADB_X_EXT_SEC_CTX - 1];
2418 	if (sec_ctx != NULL) {
2419 		struct xfrm_user_sec_ctx *uctx = pfkey_sadb2xfrm_user_sec_ctx(sec_ctx, GFP_KERNEL);
2420 
2421 		if (!uctx)
2422 			return -ENOMEM;
2423 
2424 		err = security_xfrm_policy_alloc(&pol_ctx, uctx, GFP_KERNEL);
2425 		kfree(uctx);
2426 		if (err)
2427 			return err;
2428 	}
2429 
2430 	xp = xfrm_policy_bysel_ctx(net, &dummy_mark, 0, XFRM_POLICY_TYPE_MAIN,
2431 				   pol->sadb_x_policy_dir - 1, &sel, pol_ctx,
2432 				   1, &err);
2433 	security_xfrm_policy_free(pol_ctx);
2434 	if (xp == NULL)
2435 		return -ENOENT;
2436 
2437 	xfrm_audit_policy_delete(xp, err ? 0 : 1, true);
2438 
2439 	if (err)
2440 		goto out;
2441 
2442 	c.seq = hdr->sadb_msg_seq;
2443 	c.portid = hdr->sadb_msg_pid;
2444 	c.data.byid = 0;
2445 	c.event = XFRM_MSG_DELPOLICY;
2446 	km_policy_notify(xp, pol->sadb_x_policy_dir-1, &c);
2447 
2448 out:
2449 	xfrm_pol_put(xp);
2450 	return err;
2451 }
2452 
2453 static int key_pol_get_resp(struct sock *sk, struct xfrm_policy *xp, const struct sadb_msg *hdr, int dir)
2454 {
2455 	int err;
2456 	struct sk_buff *out_skb;
2457 	struct sadb_msg *out_hdr;
2458 	err = 0;
2459 
2460 	out_skb = pfkey_xfrm_policy2msg_prep(xp);
2461 	if (IS_ERR(out_skb)) {
2462 		err =  PTR_ERR(out_skb);
2463 		goto out;
2464 	}
2465 	err = pfkey_xfrm_policy2msg(out_skb, xp, dir);
2466 	if (err < 0) {
2467 		kfree_skb(out_skb);
2468 		goto out;
2469 	}
2470 
2471 	out_hdr = (struct sadb_msg *) out_skb->data;
2472 	out_hdr->sadb_msg_version = hdr->sadb_msg_version;
2473 	out_hdr->sadb_msg_type = hdr->sadb_msg_type;
2474 	out_hdr->sadb_msg_satype = 0;
2475 	out_hdr->sadb_msg_errno = 0;
2476 	out_hdr->sadb_msg_seq = hdr->sadb_msg_seq;
2477 	out_hdr->sadb_msg_pid = hdr->sadb_msg_pid;
2478 	pfkey_broadcast(out_skb, GFP_ATOMIC, BROADCAST_ONE, sk, xp_net(xp));
2479 	err = 0;
2480 
2481 out:
2482 	return err;
2483 }
2484 
2485 static int pfkey_sockaddr_pair_size(sa_family_t family)
2486 {
2487 	return PFKEY_ALIGN8(pfkey_sockaddr_len(family) * 2);
2488 }
2489 
2490 static int parse_sockaddr_pair(struct sockaddr *sa, int ext_len,
2491 			       xfrm_address_t *saddr, xfrm_address_t *daddr,
2492 			       u16 *family)
2493 {
2494 	int af, socklen;
2495 
2496 	if (ext_len < 2 || ext_len < pfkey_sockaddr_pair_size(sa->sa_family))
2497 		return -EINVAL;
2498 
2499 	af = pfkey_sockaddr_extract(sa, saddr);
2500 	if (!af)
2501 		return -EINVAL;
2502 
2503 	socklen = pfkey_sockaddr_len(af);
2504 	if (pfkey_sockaddr_extract((struct sockaddr *) (((u8 *)sa) + socklen),
2505 				   daddr) != af)
2506 		return -EINVAL;
2507 
2508 	*family = af;
2509 	return 0;
2510 }
2511 
2512 #ifdef CONFIG_NET_KEY_MIGRATE
2513 static int ipsecrequests_to_migrate(struct sadb_x_ipsecrequest *rq1, int len,
2514 				    struct xfrm_migrate *m)
2515 {
2516 	int err;
2517 	struct sadb_x_ipsecrequest *rq2;
2518 	int mode;
2519 
2520 	if (len < sizeof(*rq1) ||
2521 	    len < rq1->sadb_x_ipsecrequest_len ||
2522 	    rq1->sadb_x_ipsecrequest_len < sizeof(*rq1))
2523 		return -EINVAL;
2524 
2525 	/* old endoints */
2526 	err = parse_sockaddr_pair((struct sockaddr *)(rq1 + 1),
2527 				  rq1->sadb_x_ipsecrequest_len - sizeof(*rq1),
2528 				  &m->old_saddr, &m->old_daddr,
2529 				  &m->old_family);
2530 	if (err)
2531 		return err;
2532 
2533 	rq2 = (struct sadb_x_ipsecrequest *)((u8 *)rq1 + rq1->sadb_x_ipsecrequest_len);
2534 	len -= rq1->sadb_x_ipsecrequest_len;
2535 
2536 	if (len <= sizeof(*rq2) ||
2537 	    len < rq2->sadb_x_ipsecrequest_len ||
2538 	    rq2->sadb_x_ipsecrequest_len < sizeof(*rq2))
2539 		return -EINVAL;
2540 
2541 	/* new endpoints */
2542 	err = parse_sockaddr_pair((struct sockaddr *)(rq2 + 1),
2543 				  rq2->sadb_x_ipsecrequest_len - sizeof(*rq2),
2544 				  &m->new_saddr, &m->new_daddr,
2545 				  &m->new_family);
2546 	if (err)
2547 		return err;
2548 
2549 	if (rq1->sadb_x_ipsecrequest_proto != rq2->sadb_x_ipsecrequest_proto ||
2550 	    rq1->sadb_x_ipsecrequest_mode != rq2->sadb_x_ipsecrequest_mode ||
2551 	    rq1->sadb_x_ipsecrequest_reqid != rq2->sadb_x_ipsecrequest_reqid)
2552 		return -EINVAL;
2553 
2554 	m->proto = rq1->sadb_x_ipsecrequest_proto;
2555 	if ((mode = pfkey_mode_to_xfrm(rq1->sadb_x_ipsecrequest_mode)) < 0)
2556 		return -EINVAL;
2557 	m->mode = mode;
2558 	m->old_reqid = rq1->sadb_x_ipsecrequest_reqid;
2559 
2560 	return ((int)(rq1->sadb_x_ipsecrequest_len +
2561 		      rq2->sadb_x_ipsecrequest_len));
2562 }
2563 
2564 static int pfkey_migrate(struct sock *sk, struct sk_buff *skb,
2565 			 const struct sadb_msg *hdr, void * const *ext_hdrs)
2566 {
2567 	int i, len, ret, err = -EINVAL;
2568 	u8 dir;
2569 	struct sadb_address *sa;
2570 	struct sadb_x_kmaddress *kma;
2571 	struct sadb_x_policy *pol;
2572 	struct sadb_x_ipsecrequest *rq;
2573 	struct xfrm_selector sel;
2574 	struct xfrm_migrate m[XFRM_MAX_DEPTH];
2575 	struct xfrm_kmaddress k;
2576 	struct net *net = sock_net(sk);
2577 
2578 	if (!present_and_same_family(ext_hdrs[SADB_EXT_ADDRESS_SRC - 1],
2579 				     ext_hdrs[SADB_EXT_ADDRESS_DST - 1]) ||
2580 	    !ext_hdrs[SADB_X_EXT_POLICY - 1]) {
2581 		err = -EINVAL;
2582 		goto out;
2583 	}
2584 
2585 	kma = ext_hdrs[SADB_X_EXT_KMADDRESS - 1];
2586 	pol = ext_hdrs[SADB_X_EXT_POLICY - 1];
2587 
2588 	if (pol->sadb_x_policy_dir >= IPSEC_DIR_MAX) {
2589 		err = -EINVAL;
2590 		goto out;
2591 	}
2592 
2593 	if (kma) {
2594 		/* convert sadb_x_kmaddress to xfrm_kmaddress */
2595 		k.reserved = kma->sadb_x_kmaddress_reserved;
2596 		ret = parse_sockaddr_pair((struct sockaddr *)(kma + 1),
2597 					  8*(kma->sadb_x_kmaddress_len) - sizeof(*kma),
2598 					  &k.local, &k.remote, &k.family);
2599 		if (ret < 0) {
2600 			err = ret;
2601 			goto out;
2602 		}
2603 	}
2604 
2605 	dir = pol->sadb_x_policy_dir - 1;
2606 	memset(&sel, 0, sizeof(sel));
2607 
2608 	/* set source address info of selector */
2609 	sa = ext_hdrs[SADB_EXT_ADDRESS_SRC - 1];
2610 	sel.family = pfkey_sadb_addr2xfrm_addr(sa, &sel.saddr);
2611 	sel.prefixlen_s = sa->sadb_address_prefixlen;
2612 	sel.proto = pfkey_proto_to_xfrm(sa->sadb_address_proto);
2613 	sel.sport = ((struct sockaddr_in *)(sa + 1))->sin_port;
2614 	if (sel.sport)
2615 		sel.sport_mask = htons(0xffff);
2616 
2617 	/* set destination address info of selector */
2618 	sa = ext_hdrs[SADB_EXT_ADDRESS_DST - 1];
2619 	pfkey_sadb_addr2xfrm_addr(sa, &sel.daddr);
2620 	sel.prefixlen_d = sa->sadb_address_prefixlen;
2621 	sel.proto = pfkey_proto_to_xfrm(sa->sadb_address_proto);
2622 	sel.dport = ((struct sockaddr_in *)(sa + 1))->sin_port;
2623 	if (sel.dport)
2624 		sel.dport_mask = htons(0xffff);
2625 
2626 	rq = (struct sadb_x_ipsecrequest *)(pol + 1);
2627 
2628 	/* extract ipsecrequests */
2629 	i = 0;
2630 	len = pol->sadb_x_policy_len * 8 - sizeof(struct sadb_x_policy);
2631 
2632 	while (len > 0 && i < XFRM_MAX_DEPTH) {
2633 		ret = ipsecrequests_to_migrate(rq, len, &m[i]);
2634 		if (ret < 0) {
2635 			err = ret;
2636 			goto out;
2637 		} else {
2638 			rq = (struct sadb_x_ipsecrequest *)((u8 *)rq + ret);
2639 			len -= ret;
2640 			i++;
2641 		}
2642 	}
2643 
2644 	if (!i || len > 0) {
2645 		err = -EINVAL;
2646 		goto out;
2647 	}
2648 
2649 	return xfrm_migrate(&sel, dir, XFRM_POLICY_TYPE_MAIN, m, i,
2650 			    kma ? &k : NULL, net, NULL, 0, NULL, NULL);
2651 
2652  out:
2653 	return err;
2654 }
2655 #else
2656 static int pfkey_migrate(struct sock *sk, struct sk_buff *skb,
2657 			 const struct sadb_msg *hdr, void * const *ext_hdrs)
2658 {
2659 	return -ENOPROTOOPT;
2660 }
2661 #endif
2662 
2663 
2664 static int pfkey_spdget(struct sock *sk, struct sk_buff *skb, const struct sadb_msg *hdr, void * const *ext_hdrs)
2665 {
2666 	struct net *net = sock_net(sk);
2667 	unsigned int dir;
2668 	int err = 0, delete;
2669 	struct sadb_x_policy *pol;
2670 	struct xfrm_policy *xp;
2671 	struct km_event c;
2672 
2673 	if ((pol = ext_hdrs[SADB_X_EXT_POLICY-1]) == NULL)
2674 		return -EINVAL;
2675 
2676 	dir = xfrm_policy_id2dir(pol->sadb_x_policy_id);
2677 	if (dir >= XFRM_POLICY_MAX)
2678 		return -EINVAL;
2679 
2680 	delete = (hdr->sadb_msg_type == SADB_X_SPDDELETE2);
2681 	xp = xfrm_policy_byid(net, &dummy_mark, 0, XFRM_POLICY_TYPE_MAIN,
2682 			      dir, pol->sadb_x_policy_id, delete, &err);
2683 	if (xp == NULL)
2684 		return -ENOENT;
2685 
2686 	if (delete) {
2687 		xfrm_audit_policy_delete(xp, err ? 0 : 1, true);
2688 
2689 		if (err)
2690 			goto out;
2691 		c.seq = hdr->sadb_msg_seq;
2692 		c.portid = hdr->sadb_msg_pid;
2693 		c.data.byid = 1;
2694 		c.event = XFRM_MSG_DELPOLICY;
2695 		km_policy_notify(xp, dir, &c);
2696 	} else {
2697 		err = key_pol_get_resp(sk, xp, hdr, dir);
2698 	}
2699 
2700 out:
2701 	xfrm_pol_put(xp);
2702 	return err;
2703 }
2704 
2705 static int dump_sp(struct xfrm_policy *xp, int dir, int count, void *ptr)
2706 {
2707 	struct pfkey_sock *pfk = ptr;
2708 	struct sk_buff *out_skb;
2709 	struct sadb_msg *out_hdr;
2710 	int err;
2711 
2712 	if (!pfkey_can_dump(&pfk->sk))
2713 		return -ENOBUFS;
2714 
2715 	out_skb = pfkey_xfrm_policy2msg_prep(xp);
2716 	if (IS_ERR(out_skb))
2717 		return PTR_ERR(out_skb);
2718 
2719 	err = pfkey_xfrm_policy2msg(out_skb, xp, dir);
2720 	if (err < 0) {
2721 		kfree_skb(out_skb);
2722 		return err;
2723 	}
2724 
2725 	out_hdr = (struct sadb_msg *) out_skb->data;
2726 	out_hdr->sadb_msg_version = pfk->dump.msg_version;
2727 	out_hdr->sadb_msg_type = SADB_X_SPDDUMP;
2728 	out_hdr->sadb_msg_satype = SADB_SATYPE_UNSPEC;
2729 	out_hdr->sadb_msg_errno = 0;
2730 	out_hdr->sadb_msg_seq = count + 1;
2731 	out_hdr->sadb_msg_pid = pfk->dump.msg_portid;
2732 
2733 	if (pfk->dump.skb)
2734 		pfkey_broadcast(pfk->dump.skb, GFP_ATOMIC, BROADCAST_ONE,
2735 				&pfk->sk, sock_net(&pfk->sk));
2736 	pfk->dump.skb = out_skb;
2737 
2738 	return 0;
2739 }
2740 
2741 static int pfkey_dump_sp(struct pfkey_sock *pfk)
2742 {
2743 	struct net *net = sock_net(&pfk->sk);
2744 	return xfrm_policy_walk(net, &pfk->dump.u.policy, dump_sp, (void *) pfk);
2745 }
2746 
2747 static void pfkey_dump_sp_done(struct pfkey_sock *pfk)
2748 {
2749 	struct net *net = sock_net((struct sock *)pfk);
2750 
2751 	xfrm_policy_walk_done(&pfk->dump.u.policy, net);
2752 }
2753 
2754 static int pfkey_spddump(struct sock *sk, struct sk_buff *skb, const struct sadb_msg *hdr, void * const *ext_hdrs)
2755 {
2756 	struct pfkey_sock *pfk = pfkey_sk(sk);
2757 
2758 	mutex_lock(&pfk->dump_lock);
2759 	if (pfk->dump.dump != NULL) {
2760 		mutex_unlock(&pfk->dump_lock);
2761 		return -EBUSY;
2762 	}
2763 
2764 	pfk->dump.msg_version = hdr->sadb_msg_version;
2765 	pfk->dump.msg_portid = hdr->sadb_msg_pid;
2766 	pfk->dump.dump = pfkey_dump_sp;
2767 	pfk->dump.done = pfkey_dump_sp_done;
2768 	xfrm_policy_walk_init(&pfk->dump.u.policy, XFRM_POLICY_TYPE_MAIN);
2769 	mutex_unlock(&pfk->dump_lock);
2770 
2771 	return pfkey_do_dump(pfk);
2772 }
2773 
2774 static int key_notify_policy_flush(const struct km_event *c)
2775 {
2776 	struct sk_buff *skb_out;
2777 	struct sadb_msg *hdr;
2778 
2779 	skb_out = alloc_skb(sizeof(struct sadb_msg) + 16, GFP_ATOMIC);
2780 	if (!skb_out)
2781 		return -ENOBUFS;
2782 	hdr = skb_put(skb_out, sizeof(struct sadb_msg));
2783 	hdr->sadb_msg_type = SADB_X_SPDFLUSH;
2784 	hdr->sadb_msg_seq = c->seq;
2785 	hdr->sadb_msg_pid = c->portid;
2786 	hdr->sadb_msg_version = PF_KEY_V2;
2787 	hdr->sadb_msg_errno = (uint8_t) 0;
2788 	hdr->sadb_msg_satype = SADB_SATYPE_UNSPEC;
2789 	hdr->sadb_msg_len = (sizeof(struct sadb_msg) / sizeof(uint64_t));
2790 	hdr->sadb_msg_reserved = 0;
2791 	pfkey_broadcast(skb_out, GFP_ATOMIC, BROADCAST_ALL, NULL, c->net);
2792 	return 0;
2793 
2794 }
2795 
2796 static int pfkey_spdflush(struct sock *sk, struct sk_buff *skb, const struct sadb_msg *hdr, void * const *ext_hdrs)
2797 {
2798 	struct net *net = sock_net(sk);
2799 	struct km_event c;
2800 	int err, err2;
2801 
2802 	err = xfrm_policy_flush(net, XFRM_POLICY_TYPE_MAIN, true);
2803 	err2 = unicast_flush_resp(sk, hdr);
2804 	if (err || err2) {
2805 		if (err == -ESRCH) /* empty table - old silent behavior */
2806 			return 0;
2807 		return err;
2808 	}
2809 
2810 	c.data.type = XFRM_POLICY_TYPE_MAIN;
2811 	c.event = XFRM_MSG_FLUSHPOLICY;
2812 	c.portid = hdr->sadb_msg_pid;
2813 	c.seq = hdr->sadb_msg_seq;
2814 	c.net = net;
2815 	km_policy_notify(NULL, 0, &c);
2816 
2817 	return 0;
2818 }
2819 
2820 typedef int (*pfkey_handler)(struct sock *sk, struct sk_buff *skb,
2821 			     const struct sadb_msg *hdr, void * const *ext_hdrs);
2822 static const pfkey_handler pfkey_funcs[SADB_MAX + 1] = {
2823 	[SADB_RESERVED]		= pfkey_reserved,
2824 	[SADB_GETSPI]		= pfkey_getspi,
2825 	[SADB_UPDATE]		= pfkey_add,
2826 	[SADB_ADD]		= pfkey_add,
2827 	[SADB_DELETE]		= pfkey_delete,
2828 	[SADB_GET]		= pfkey_get,
2829 	[SADB_ACQUIRE]		= pfkey_acquire,
2830 	[SADB_REGISTER]		= pfkey_register,
2831 	[SADB_EXPIRE]		= NULL,
2832 	[SADB_FLUSH]		= pfkey_flush,
2833 	[SADB_DUMP]		= pfkey_dump,
2834 	[SADB_X_PROMISC]	= pfkey_promisc,
2835 	[SADB_X_PCHANGE]	= NULL,
2836 	[SADB_X_SPDUPDATE]	= pfkey_spdadd,
2837 	[SADB_X_SPDADD]		= pfkey_spdadd,
2838 	[SADB_X_SPDDELETE]	= pfkey_spddelete,
2839 	[SADB_X_SPDGET]		= pfkey_spdget,
2840 	[SADB_X_SPDACQUIRE]	= NULL,
2841 	[SADB_X_SPDDUMP]	= pfkey_spddump,
2842 	[SADB_X_SPDFLUSH]	= pfkey_spdflush,
2843 	[SADB_X_SPDSETIDX]	= pfkey_spdadd,
2844 	[SADB_X_SPDDELETE2]	= pfkey_spdget,
2845 	[SADB_X_MIGRATE]	= pfkey_migrate,
2846 };
2847 
2848 static int pfkey_process(struct sock *sk, struct sk_buff *skb, const struct sadb_msg *hdr)
2849 {
2850 	void *ext_hdrs[SADB_EXT_MAX];
2851 	int err;
2852 
2853 	/* Non-zero return value of pfkey_broadcast() does not always signal
2854 	 * an error and even on an actual error we may still want to process
2855 	 * the message so rather ignore the return value.
2856 	 */
2857 	pfkey_broadcast(skb_clone(skb, GFP_KERNEL), GFP_KERNEL,
2858 			BROADCAST_PROMISC_ONLY, NULL, sock_net(sk));
2859 
2860 	memset(ext_hdrs, 0, sizeof(ext_hdrs));
2861 	err = parse_exthdrs(skb, hdr, ext_hdrs);
2862 	if (!err) {
2863 		err = -EOPNOTSUPP;
2864 		if (pfkey_funcs[hdr->sadb_msg_type])
2865 			err = pfkey_funcs[hdr->sadb_msg_type](sk, skb, hdr, ext_hdrs);
2866 	}
2867 	return err;
2868 }
2869 
2870 static struct sadb_msg *pfkey_get_base_msg(struct sk_buff *skb, int *errp)
2871 {
2872 	struct sadb_msg *hdr = NULL;
2873 
2874 	if (skb->len < sizeof(*hdr)) {
2875 		*errp = -EMSGSIZE;
2876 	} else {
2877 		hdr = (struct sadb_msg *) skb->data;
2878 		if (hdr->sadb_msg_version != PF_KEY_V2 ||
2879 		    hdr->sadb_msg_reserved != 0 ||
2880 		    (hdr->sadb_msg_type <= SADB_RESERVED ||
2881 		     hdr->sadb_msg_type > SADB_MAX)) {
2882 			hdr = NULL;
2883 			*errp = -EINVAL;
2884 		} else if (hdr->sadb_msg_len != (skb->len /
2885 						 sizeof(uint64_t)) ||
2886 			   hdr->sadb_msg_len < (sizeof(struct sadb_msg) /
2887 						sizeof(uint64_t))) {
2888 			hdr = NULL;
2889 			*errp = -EMSGSIZE;
2890 		} else {
2891 			*errp = 0;
2892 		}
2893 	}
2894 	return hdr;
2895 }
2896 
2897 static inline int aalg_tmpl_set(const struct xfrm_tmpl *t,
2898 				const struct xfrm_algo_desc *d)
2899 {
2900 	unsigned int id = d->desc.sadb_alg_id;
2901 
2902 	if (id >= sizeof(t->aalgos) * 8)
2903 		return 0;
2904 
2905 	return (t->aalgos >> id) & 1;
2906 }
2907 
2908 static inline int ealg_tmpl_set(const struct xfrm_tmpl *t,
2909 				const struct xfrm_algo_desc *d)
2910 {
2911 	unsigned int id = d->desc.sadb_alg_id;
2912 
2913 	if (id >= sizeof(t->ealgos) * 8)
2914 		return 0;
2915 
2916 	return (t->ealgos >> id) & 1;
2917 }
2918 
2919 static int count_ah_combs(const struct xfrm_tmpl *t)
2920 {
2921 	int i, sz = 0;
2922 
2923 	for (i = 0; ; i++) {
2924 		const struct xfrm_algo_desc *aalg = xfrm_aalg_get_byidx(i);
2925 		if (!aalg)
2926 			break;
2927 		if (!aalg->pfkey_supported)
2928 			continue;
2929 		if (aalg_tmpl_set(t, aalg))
2930 			sz += sizeof(struct sadb_comb);
2931 	}
2932 	return sz + sizeof(struct sadb_prop);
2933 }
2934 
2935 static int count_esp_combs(const struct xfrm_tmpl *t)
2936 {
2937 	int i, k, sz = 0;
2938 
2939 	for (i = 0; ; i++) {
2940 		const struct xfrm_algo_desc *ealg = xfrm_ealg_get_byidx(i);
2941 		if (!ealg)
2942 			break;
2943 
2944 		if (!ealg->pfkey_supported)
2945 			continue;
2946 
2947 		if (!(ealg_tmpl_set(t, ealg)))
2948 			continue;
2949 
2950 		for (k = 1; ; k++) {
2951 			const struct xfrm_algo_desc *aalg = xfrm_aalg_get_byidx(k);
2952 			if (!aalg)
2953 				break;
2954 
2955 			if (!aalg->pfkey_supported)
2956 				continue;
2957 
2958 			if (aalg_tmpl_set(t, aalg))
2959 				sz += sizeof(struct sadb_comb);
2960 		}
2961 	}
2962 	return sz + sizeof(struct sadb_prop);
2963 }
2964 
2965 static int dump_ah_combs(struct sk_buff *skb, const struct xfrm_tmpl *t)
2966 {
2967 	struct sadb_prop *p;
2968 	int sz = 0;
2969 	int i;
2970 
2971 	p = skb_put(skb, sizeof(struct sadb_prop));
2972 	p->sadb_prop_len = sizeof(struct sadb_prop)/8;
2973 	p->sadb_prop_exttype = SADB_EXT_PROPOSAL;
2974 	p->sadb_prop_replay = 32;
2975 	memset(p->sadb_prop_reserved, 0, sizeof(p->sadb_prop_reserved));
2976 
2977 	for (i = 0; ; i++) {
2978 		const struct xfrm_algo_desc *aalg = xfrm_aalg_get_byidx(i);
2979 		if (!aalg)
2980 			break;
2981 
2982 		if (!aalg->pfkey_supported)
2983 			continue;
2984 
2985 		if (aalg_tmpl_set(t, aalg) && aalg->available) {
2986 			struct sadb_comb *c;
2987 			c = skb_put_zero(skb, sizeof(struct sadb_comb));
2988 			p->sadb_prop_len += sizeof(struct sadb_comb)/8;
2989 			c->sadb_comb_auth = aalg->desc.sadb_alg_id;
2990 			c->sadb_comb_auth_minbits = aalg->desc.sadb_alg_minbits;
2991 			c->sadb_comb_auth_maxbits = aalg->desc.sadb_alg_maxbits;
2992 			c->sadb_comb_hard_addtime = 24*60*60;
2993 			c->sadb_comb_soft_addtime = 20*60*60;
2994 			c->sadb_comb_hard_usetime = 8*60*60;
2995 			c->sadb_comb_soft_usetime = 7*60*60;
2996 			sz += sizeof(*c);
2997 		}
2998 	}
2999 
3000 	return sz + sizeof(*p);
3001 }
3002 
3003 static int dump_esp_combs(struct sk_buff *skb, const struct xfrm_tmpl *t)
3004 {
3005 	struct sadb_prop *p;
3006 	int sz = 0;
3007 	int i, k;
3008 
3009 	p = skb_put(skb, sizeof(struct sadb_prop));
3010 	p->sadb_prop_len = sizeof(struct sadb_prop)/8;
3011 	p->sadb_prop_exttype = SADB_EXT_PROPOSAL;
3012 	p->sadb_prop_replay = 32;
3013 	memset(p->sadb_prop_reserved, 0, sizeof(p->sadb_prop_reserved));
3014 
3015 	for (i=0; ; i++) {
3016 		const struct xfrm_algo_desc *ealg = xfrm_ealg_get_byidx(i);
3017 		if (!ealg)
3018 			break;
3019 
3020 		if (!ealg->pfkey_supported)
3021 			continue;
3022 
3023 		if (!(ealg_tmpl_set(t, ealg) && ealg->available))
3024 			continue;
3025 
3026 		for (k = 1; ; k++) {
3027 			struct sadb_comb *c;
3028 			const struct xfrm_algo_desc *aalg = xfrm_aalg_get_byidx(k);
3029 			if (!aalg)
3030 				break;
3031 			if (!aalg->pfkey_supported)
3032 				continue;
3033 			if (!(aalg_tmpl_set(t, aalg) && aalg->available))
3034 				continue;
3035 			c = skb_put(skb, sizeof(struct sadb_comb));
3036 			memset(c, 0, sizeof(*c));
3037 			p->sadb_prop_len += sizeof(struct sadb_comb)/8;
3038 			c->sadb_comb_auth = aalg->desc.sadb_alg_id;
3039 			c->sadb_comb_auth_minbits = aalg->desc.sadb_alg_minbits;
3040 			c->sadb_comb_auth_maxbits = aalg->desc.sadb_alg_maxbits;
3041 			c->sadb_comb_encrypt = ealg->desc.sadb_alg_id;
3042 			c->sadb_comb_encrypt_minbits = ealg->desc.sadb_alg_minbits;
3043 			c->sadb_comb_encrypt_maxbits = ealg->desc.sadb_alg_maxbits;
3044 			c->sadb_comb_hard_addtime = 24*60*60;
3045 			c->sadb_comb_soft_addtime = 20*60*60;
3046 			c->sadb_comb_hard_usetime = 8*60*60;
3047 			c->sadb_comb_soft_usetime = 7*60*60;
3048 			sz += sizeof(*c);
3049 		}
3050 	}
3051 
3052 	return sz + sizeof(*p);
3053 }
3054 
3055 static int key_notify_policy_expire(struct xfrm_policy *xp, const struct km_event *c)
3056 {
3057 	return 0;
3058 }
3059 
3060 static int key_notify_sa_expire(struct xfrm_state *x, const struct km_event *c)
3061 {
3062 	struct sk_buff *out_skb;
3063 	struct sadb_msg *out_hdr;
3064 	int hard;
3065 	int hsc;
3066 
3067 	hard = c->data.hard;
3068 	if (hard)
3069 		hsc = 2;
3070 	else
3071 		hsc = 1;
3072 
3073 	out_skb = pfkey_xfrm_state2msg_expire(x, hsc);
3074 	if (IS_ERR(out_skb))
3075 		return PTR_ERR(out_skb);
3076 
3077 	out_hdr = (struct sadb_msg *) out_skb->data;
3078 	out_hdr->sadb_msg_version = PF_KEY_V2;
3079 	out_hdr->sadb_msg_type = SADB_EXPIRE;
3080 	out_hdr->sadb_msg_satype = pfkey_proto2satype(x->id.proto);
3081 	out_hdr->sadb_msg_errno = 0;
3082 	out_hdr->sadb_msg_reserved = 0;
3083 	out_hdr->sadb_msg_seq = 0;
3084 	out_hdr->sadb_msg_pid = 0;
3085 
3086 	pfkey_broadcast(out_skb, GFP_ATOMIC, BROADCAST_REGISTERED, NULL,
3087 			xs_net(x));
3088 	return 0;
3089 }
3090 
3091 static int pfkey_send_notify(struct xfrm_state *x, const struct km_event *c)
3092 {
3093 	struct net *net = x ? xs_net(x) : c->net;
3094 	struct netns_pfkey *net_pfkey = net_generic(net, pfkey_net_id);
3095 
3096 	if (atomic_read(&net_pfkey->socks_nr) == 0)
3097 		return 0;
3098 
3099 	switch (c->event) {
3100 	case XFRM_MSG_EXPIRE:
3101 		return key_notify_sa_expire(x, c);
3102 	case XFRM_MSG_DELSA:
3103 	case XFRM_MSG_NEWSA:
3104 	case XFRM_MSG_UPDSA:
3105 		return key_notify_sa(x, c);
3106 	case XFRM_MSG_FLUSHSA:
3107 		return key_notify_sa_flush(c);
3108 	case XFRM_MSG_NEWAE: /* not yet supported */
3109 		break;
3110 	default:
3111 		pr_err("pfkey: Unknown SA event %d\n", c->event);
3112 		break;
3113 	}
3114 
3115 	return 0;
3116 }
3117 
3118 static int pfkey_send_policy_notify(struct xfrm_policy *xp, int dir, const struct km_event *c)
3119 {
3120 	if (xp && xp->type != XFRM_POLICY_TYPE_MAIN)
3121 		return 0;
3122 
3123 	switch (c->event) {
3124 	case XFRM_MSG_POLEXPIRE:
3125 		return key_notify_policy_expire(xp, c);
3126 	case XFRM_MSG_DELPOLICY:
3127 	case XFRM_MSG_NEWPOLICY:
3128 	case XFRM_MSG_UPDPOLICY:
3129 		return key_notify_policy(xp, dir, c);
3130 	case XFRM_MSG_FLUSHPOLICY:
3131 		if (c->data.type != XFRM_POLICY_TYPE_MAIN)
3132 			break;
3133 		return key_notify_policy_flush(c);
3134 	default:
3135 		pr_err("pfkey: Unknown policy event %d\n", c->event);
3136 		break;
3137 	}
3138 
3139 	return 0;
3140 }
3141 
3142 static u32 get_acqseq(void)
3143 {
3144 	u32 res;
3145 	static atomic_t acqseq;
3146 
3147 	do {
3148 		res = atomic_inc_return(&acqseq);
3149 	} while (!res);
3150 	return res;
3151 }
3152 
3153 static bool pfkey_is_alive(const struct km_event *c)
3154 {
3155 	struct netns_pfkey *net_pfkey = net_generic(c->net, pfkey_net_id);
3156 	struct sock *sk;
3157 	bool is_alive = false;
3158 
3159 	rcu_read_lock();
3160 	sk_for_each_rcu(sk, &net_pfkey->table) {
3161 		if (pfkey_sk(sk)->registered) {
3162 			is_alive = true;
3163 			break;
3164 		}
3165 	}
3166 	rcu_read_unlock();
3167 
3168 	return is_alive;
3169 }
3170 
3171 static int pfkey_send_acquire(struct xfrm_state *x, struct xfrm_tmpl *t, struct xfrm_policy *xp)
3172 {
3173 	struct sk_buff *skb;
3174 	struct sadb_msg *hdr;
3175 	struct sadb_address *addr;
3176 	struct sadb_x_policy *pol;
3177 	int sockaddr_size;
3178 	int size;
3179 	struct sadb_x_sec_ctx *sec_ctx;
3180 	struct xfrm_sec_ctx *xfrm_ctx;
3181 	int ctx_size = 0;
3182 	int alg_size = 0;
3183 
3184 	sockaddr_size = pfkey_sockaddr_size(x->props.family);
3185 	if (!sockaddr_size)
3186 		return -EINVAL;
3187 
3188 	size = sizeof(struct sadb_msg) +
3189 		(sizeof(struct sadb_address) * 2) +
3190 		(sockaddr_size * 2) +
3191 		sizeof(struct sadb_x_policy);
3192 
3193 	if (x->id.proto == IPPROTO_AH)
3194 		alg_size = count_ah_combs(t);
3195 	else if (x->id.proto == IPPROTO_ESP)
3196 		alg_size = count_esp_combs(t);
3197 
3198 	if ((xfrm_ctx = x->security)) {
3199 		ctx_size = PFKEY_ALIGN8(xfrm_ctx->ctx_len);
3200 		size +=  sizeof(struct sadb_x_sec_ctx) + ctx_size;
3201 	}
3202 
3203 	skb =  alloc_skb(size + alg_size + 16, GFP_ATOMIC);
3204 	if (skb == NULL)
3205 		return -ENOMEM;
3206 
3207 	hdr = skb_put(skb, sizeof(struct sadb_msg));
3208 	hdr->sadb_msg_version = PF_KEY_V2;
3209 	hdr->sadb_msg_type = SADB_ACQUIRE;
3210 	hdr->sadb_msg_satype = pfkey_proto2satype(x->id.proto);
3211 	hdr->sadb_msg_len = size / sizeof(uint64_t);
3212 	hdr->sadb_msg_errno = 0;
3213 	hdr->sadb_msg_reserved = 0;
3214 	hdr->sadb_msg_seq = x->km.seq = get_acqseq();
3215 	hdr->sadb_msg_pid = 0;
3216 
3217 	/* src address */
3218 	addr = skb_put(skb, sizeof(struct sadb_address) + sockaddr_size);
3219 	addr->sadb_address_len =
3220 		(sizeof(struct sadb_address)+sockaddr_size)/
3221 			sizeof(uint64_t);
3222 	addr->sadb_address_exttype = SADB_EXT_ADDRESS_SRC;
3223 	addr->sadb_address_proto = 0;
3224 	addr->sadb_address_reserved = 0;
3225 	addr->sadb_address_prefixlen =
3226 		pfkey_sockaddr_fill_zero_tail(&x->props.saddr, 0,
3227 					      (struct sockaddr *)(addr + 1),
3228 					      x->props.family);
3229 	if (!addr->sadb_address_prefixlen)
3230 		BUG();
3231 
3232 	/* dst address */
3233 	addr = skb_put(skb, sizeof(struct sadb_address) + sockaddr_size);
3234 	addr->sadb_address_len =
3235 		(sizeof(struct sadb_address)+sockaddr_size)/
3236 			sizeof(uint64_t);
3237 	addr->sadb_address_exttype = SADB_EXT_ADDRESS_DST;
3238 	addr->sadb_address_proto = 0;
3239 	addr->sadb_address_reserved = 0;
3240 	addr->sadb_address_prefixlen =
3241 		pfkey_sockaddr_fill_zero_tail(&x->id.daddr, 0,
3242 					      (struct sockaddr *)(addr + 1),
3243 					      x->props.family);
3244 	if (!addr->sadb_address_prefixlen)
3245 		BUG();
3246 
3247 	pol = skb_put(skb, sizeof(struct sadb_x_policy));
3248 	pol->sadb_x_policy_len = sizeof(struct sadb_x_policy)/sizeof(uint64_t);
3249 	pol->sadb_x_policy_exttype = SADB_X_EXT_POLICY;
3250 	pol->sadb_x_policy_type = IPSEC_POLICY_IPSEC;
3251 	pol->sadb_x_policy_dir = XFRM_POLICY_OUT + 1;
3252 	pol->sadb_x_policy_reserved = 0;
3253 	pol->sadb_x_policy_id = xp->index;
3254 	pol->sadb_x_policy_priority = xp->priority;
3255 
3256 	/* Set sadb_comb's. */
3257 	alg_size = 0;
3258 	if (x->id.proto == IPPROTO_AH)
3259 		alg_size = dump_ah_combs(skb, t);
3260 	else if (x->id.proto == IPPROTO_ESP)
3261 		alg_size = dump_esp_combs(skb, t);
3262 
3263 	hdr->sadb_msg_len += alg_size / 8;
3264 
3265 	/* security context */
3266 	if (xfrm_ctx) {
3267 		sec_ctx = skb_put(skb,
3268 				  sizeof(struct sadb_x_sec_ctx) + ctx_size);
3269 		sec_ctx->sadb_x_sec_len =
3270 		  (sizeof(struct sadb_x_sec_ctx) + ctx_size) / sizeof(uint64_t);
3271 		sec_ctx->sadb_x_sec_exttype = SADB_X_EXT_SEC_CTX;
3272 		sec_ctx->sadb_x_ctx_doi = xfrm_ctx->ctx_doi;
3273 		sec_ctx->sadb_x_ctx_alg = xfrm_ctx->ctx_alg;
3274 		sec_ctx->sadb_x_ctx_len = xfrm_ctx->ctx_len;
3275 		memcpy(sec_ctx + 1, xfrm_ctx->ctx_str,
3276 		       xfrm_ctx->ctx_len);
3277 	}
3278 
3279 	return pfkey_broadcast(skb, GFP_ATOMIC, BROADCAST_REGISTERED, NULL,
3280 			       xs_net(x));
3281 }
3282 
3283 static struct xfrm_policy *pfkey_compile_policy(struct sock *sk, int opt,
3284 						u8 *data, int len, int *dir)
3285 {
3286 	struct net *net = sock_net(sk);
3287 	struct xfrm_policy *xp;
3288 	struct sadb_x_policy *pol = (struct sadb_x_policy*)data;
3289 	struct sadb_x_sec_ctx *sec_ctx;
3290 
3291 	switch (sk->sk_family) {
3292 	case AF_INET:
3293 		if (opt != IP_IPSEC_POLICY) {
3294 			*dir = -EOPNOTSUPP;
3295 			return NULL;
3296 		}
3297 		break;
3298 #if IS_ENABLED(CONFIG_IPV6)
3299 	case AF_INET6:
3300 		if (opt != IPV6_IPSEC_POLICY) {
3301 			*dir = -EOPNOTSUPP;
3302 			return NULL;
3303 		}
3304 		break;
3305 #endif
3306 	default:
3307 		*dir = -EINVAL;
3308 		return NULL;
3309 	}
3310 
3311 	*dir = -EINVAL;
3312 
3313 	if (len < sizeof(struct sadb_x_policy) ||
3314 	    pol->sadb_x_policy_len*8 > len ||
3315 	    pol->sadb_x_policy_type > IPSEC_POLICY_BYPASS ||
3316 	    (!pol->sadb_x_policy_dir || pol->sadb_x_policy_dir > IPSEC_DIR_OUTBOUND))
3317 		return NULL;
3318 
3319 	xp = xfrm_policy_alloc(net, GFP_ATOMIC);
3320 	if (xp == NULL) {
3321 		*dir = -ENOBUFS;
3322 		return NULL;
3323 	}
3324 
3325 	xp->action = (pol->sadb_x_policy_type == IPSEC_POLICY_DISCARD ?
3326 		      XFRM_POLICY_BLOCK : XFRM_POLICY_ALLOW);
3327 
3328 	xp->lft.soft_byte_limit = XFRM_INF;
3329 	xp->lft.hard_byte_limit = XFRM_INF;
3330 	xp->lft.soft_packet_limit = XFRM_INF;
3331 	xp->lft.hard_packet_limit = XFRM_INF;
3332 	xp->family = sk->sk_family;
3333 
3334 	xp->xfrm_nr = 0;
3335 	if (pol->sadb_x_policy_type == IPSEC_POLICY_IPSEC &&
3336 	    (*dir = parse_ipsecrequests(xp, pol)) < 0)
3337 		goto out;
3338 
3339 	/* security context too */
3340 	if (len >= (pol->sadb_x_policy_len*8 +
3341 	    sizeof(struct sadb_x_sec_ctx))) {
3342 		char *p = (char *)pol;
3343 		struct xfrm_user_sec_ctx *uctx;
3344 
3345 		p += pol->sadb_x_policy_len*8;
3346 		sec_ctx = (struct sadb_x_sec_ctx *)p;
3347 		if (len < pol->sadb_x_policy_len*8 +
3348 		    sec_ctx->sadb_x_sec_len*8) {
3349 			*dir = -EINVAL;
3350 			goto out;
3351 		}
3352 		if ((*dir = verify_sec_ctx_len(p)))
3353 			goto out;
3354 		uctx = pfkey_sadb2xfrm_user_sec_ctx(sec_ctx, GFP_ATOMIC);
3355 		*dir = security_xfrm_policy_alloc(&xp->security, uctx, GFP_ATOMIC);
3356 		kfree(uctx);
3357 
3358 		if (*dir)
3359 			goto out;
3360 	}
3361 
3362 	*dir = pol->sadb_x_policy_dir-1;
3363 	return xp;
3364 
3365 out:
3366 	xp->walk.dead = 1;
3367 	xfrm_policy_destroy(xp);
3368 	return NULL;
3369 }
3370 
3371 static int pfkey_send_new_mapping(struct xfrm_state *x, xfrm_address_t *ipaddr, __be16 sport)
3372 {
3373 	struct sk_buff *skb;
3374 	struct sadb_msg *hdr;
3375 	struct sadb_sa *sa;
3376 	struct sadb_address *addr;
3377 	struct sadb_x_nat_t_port *n_port;
3378 	int sockaddr_size;
3379 	int size;
3380 	__u8 satype = (x->id.proto == IPPROTO_ESP ? SADB_SATYPE_ESP : 0);
3381 	struct xfrm_encap_tmpl *natt = NULL;
3382 
3383 	sockaddr_size = pfkey_sockaddr_size(x->props.family);
3384 	if (!sockaddr_size)
3385 		return -EINVAL;
3386 
3387 	if (!satype)
3388 		return -EINVAL;
3389 
3390 	if (!x->encap)
3391 		return -EINVAL;
3392 
3393 	natt = x->encap;
3394 
3395 	/* Build an SADB_X_NAT_T_NEW_MAPPING message:
3396 	 *
3397 	 * HDR | SA | ADDRESS_SRC (old addr) | NAT_T_SPORT (old port) |
3398 	 * ADDRESS_DST (new addr) | NAT_T_DPORT (new port)
3399 	 */
3400 
3401 	size = sizeof(struct sadb_msg) +
3402 		sizeof(struct sadb_sa) +
3403 		(sizeof(struct sadb_address) * 2) +
3404 		(sockaddr_size * 2) +
3405 		(sizeof(struct sadb_x_nat_t_port) * 2);
3406 
3407 	skb =  alloc_skb(size + 16, GFP_ATOMIC);
3408 	if (skb == NULL)
3409 		return -ENOMEM;
3410 
3411 	hdr = skb_put(skb, sizeof(struct sadb_msg));
3412 	hdr->sadb_msg_version = PF_KEY_V2;
3413 	hdr->sadb_msg_type = SADB_X_NAT_T_NEW_MAPPING;
3414 	hdr->sadb_msg_satype = satype;
3415 	hdr->sadb_msg_len = size / sizeof(uint64_t);
3416 	hdr->sadb_msg_errno = 0;
3417 	hdr->sadb_msg_reserved = 0;
3418 	hdr->sadb_msg_seq = x->km.seq;
3419 	hdr->sadb_msg_pid = 0;
3420 
3421 	/* SA */
3422 	sa = skb_put(skb, sizeof(struct sadb_sa));
3423 	sa->sadb_sa_len = sizeof(struct sadb_sa)/sizeof(uint64_t);
3424 	sa->sadb_sa_exttype = SADB_EXT_SA;
3425 	sa->sadb_sa_spi = x->id.spi;
3426 	sa->sadb_sa_replay = 0;
3427 	sa->sadb_sa_state = 0;
3428 	sa->sadb_sa_auth = 0;
3429 	sa->sadb_sa_encrypt = 0;
3430 	sa->sadb_sa_flags = 0;
3431 
3432 	/* ADDRESS_SRC (old addr) */
3433 	addr = skb_put(skb, sizeof(struct sadb_address) + sockaddr_size);
3434 	addr->sadb_address_len =
3435 		(sizeof(struct sadb_address)+sockaddr_size)/
3436 			sizeof(uint64_t);
3437 	addr->sadb_address_exttype = SADB_EXT_ADDRESS_SRC;
3438 	addr->sadb_address_proto = 0;
3439 	addr->sadb_address_reserved = 0;
3440 	addr->sadb_address_prefixlen =
3441 		pfkey_sockaddr_fill_zero_tail(&x->props.saddr, 0,
3442 					      (struct sockaddr *)(addr + 1),
3443 					      x->props.family);
3444 	if (!addr->sadb_address_prefixlen)
3445 		BUG();
3446 
3447 	/* NAT_T_SPORT (old port) */
3448 	n_port = skb_put(skb, sizeof(*n_port));
3449 	n_port->sadb_x_nat_t_port_len = sizeof(*n_port)/sizeof(uint64_t);
3450 	n_port->sadb_x_nat_t_port_exttype = SADB_X_EXT_NAT_T_SPORT;
3451 	n_port->sadb_x_nat_t_port_port = natt->encap_sport;
3452 	n_port->sadb_x_nat_t_port_reserved = 0;
3453 
3454 	/* ADDRESS_DST (new addr) */
3455 	addr = skb_put(skb, sizeof(struct sadb_address) + sockaddr_size);
3456 	addr->sadb_address_len =
3457 		(sizeof(struct sadb_address)+sockaddr_size)/
3458 			sizeof(uint64_t);
3459 	addr->sadb_address_exttype = SADB_EXT_ADDRESS_DST;
3460 	addr->sadb_address_proto = 0;
3461 	addr->sadb_address_reserved = 0;
3462 	addr->sadb_address_prefixlen =
3463 		pfkey_sockaddr_fill_zero_tail(ipaddr, 0,
3464 					      (struct sockaddr *)(addr + 1),
3465 					      x->props.family);
3466 	if (!addr->sadb_address_prefixlen)
3467 		BUG();
3468 
3469 	/* NAT_T_DPORT (new port) */
3470 	n_port = skb_put(skb, sizeof(*n_port));
3471 	n_port->sadb_x_nat_t_port_len = sizeof(*n_port)/sizeof(uint64_t);
3472 	n_port->sadb_x_nat_t_port_exttype = SADB_X_EXT_NAT_T_DPORT;
3473 	n_port->sadb_x_nat_t_port_port = sport;
3474 	n_port->sadb_x_nat_t_port_reserved = 0;
3475 
3476 	return pfkey_broadcast(skb, GFP_ATOMIC, BROADCAST_REGISTERED, NULL,
3477 			       xs_net(x));
3478 }
3479 
3480 #ifdef CONFIG_NET_KEY_MIGRATE
3481 static int set_sadb_address(struct sk_buff *skb, int sasize, int type,
3482 			    const struct xfrm_selector *sel)
3483 {
3484 	struct sadb_address *addr;
3485 	addr = skb_put(skb, sizeof(struct sadb_address) + sasize);
3486 	addr->sadb_address_len = (sizeof(struct sadb_address) + sasize)/8;
3487 	addr->sadb_address_exttype = type;
3488 	addr->sadb_address_proto = sel->proto;
3489 	addr->sadb_address_reserved = 0;
3490 
3491 	switch (type) {
3492 	case SADB_EXT_ADDRESS_SRC:
3493 		addr->sadb_address_prefixlen = sel->prefixlen_s;
3494 		pfkey_sockaddr_fill_zero_tail(&sel->saddr, 0,
3495 					      (struct sockaddr *)(addr + 1),
3496 					      sel->family);
3497 		break;
3498 	case SADB_EXT_ADDRESS_DST:
3499 		addr->sadb_address_prefixlen = sel->prefixlen_d;
3500 		pfkey_sockaddr_fill_zero_tail(&sel->daddr, 0,
3501 					      (struct sockaddr *)(addr + 1),
3502 					      sel->family);
3503 		break;
3504 	default:
3505 		return -EINVAL;
3506 	}
3507 
3508 	return 0;
3509 }
3510 
3511 
3512 static int set_sadb_kmaddress(struct sk_buff *skb, const struct xfrm_kmaddress *k)
3513 {
3514 	struct sadb_x_kmaddress *kma;
3515 	u8 *sa;
3516 	int family = k->family;
3517 	int socklen = pfkey_sockaddr_len(family);
3518 	int size_req;
3519 
3520 	size_req = (sizeof(struct sadb_x_kmaddress) +
3521 		    pfkey_sockaddr_pair_size(family));
3522 
3523 	kma = skb_put_zero(skb, size_req);
3524 	kma->sadb_x_kmaddress_len = size_req / 8;
3525 	kma->sadb_x_kmaddress_exttype = SADB_X_EXT_KMADDRESS;
3526 	kma->sadb_x_kmaddress_reserved = k->reserved;
3527 
3528 	sa = (u8 *)(kma + 1);
3529 	if (!pfkey_sockaddr_fill(&k->local, 0, (struct sockaddr *)sa, family) ||
3530 	    !pfkey_sockaddr_fill(&k->remote, 0, (struct sockaddr *)(sa+socklen), family))
3531 		return -EINVAL;
3532 
3533 	return 0;
3534 }
3535 
3536 static int set_ipsecrequest(struct sk_buff *skb,
3537 			    uint8_t proto, uint8_t mode, int level,
3538 			    uint32_t reqid, sa_family_t family,
3539 			    const xfrm_address_t *src, const xfrm_address_t *dst)
3540 {
3541 	struct sadb_x_ipsecrequest *rq;
3542 	u8 *sa;
3543 	int socklen = pfkey_sockaddr_len(family);
3544 	int size_req;
3545 
3546 	size_req = sizeof(struct sadb_x_ipsecrequest) +
3547 		   pfkey_sockaddr_pair_size(family);
3548 
3549 	rq = skb_put_zero(skb, size_req);
3550 	rq->sadb_x_ipsecrequest_len = size_req;
3551 	rq->sadb_x_ipsecrequest_proto = proto;
3552 	rq->sadb_x_ipsecrequest_mode = mode;
3553 	rq->sadb_x_ipsecrequest_level = level;
3554 	rq->sadb_x_ipsecrequest_reqid = reqid;
3555 
3556 	sa = (u8 *) (rq + 1);
3557 	if (!pfkey_sockaddr_fill(src, 0, (struct sockaddr *)sa, family) ||
3558 	    !pfkey_sockaddr_fill(dst, 0, (struct sockaddr *)(sa + socklen), family))
3559 		return -EINVAL;
3560 
3561 	return 0;
3562 }
3563 #endif
3564 
3565 #ifdef CONFIG_NET_KEY_MIGRATE
3566 static int pfkey_send_migrate(const struct xfrm_selector *sel, u8 dir, u8 type,
3567 			      const struct xfrm_migrate *m, int num_bundles,
3568 			      const struct xfrm_kmaddress *k, struct net *net,
3569 			      const struct xfrm_encap_tmpl *encap)
3570 {
3571 	int i;
3572 	int sasize_sel;
3573 	int size = 0;
3574 	int size_pol = 0;
3575 	struct sk_buff *skb;
3576 	struct sadb_msg *hdr;
3577 	struct sadb_x_policy *pol;
3578 	const struct xfrm_migrate *mp;
3579 
3580 	if (type != XFRM_POLICY_TYPE_MAIN)
3581 		return 0;
3582 
3583 	if (num_bundles <= 0 || num_bundles > XFRM_MAX_DEPTH)
3584 		return -EINVAL;
3585 
3586 	if (k != NULL) {
3587 		/* addresses for KM */
3588 		size += PFKEY_ALIGN8(sizeof(struct sadb_x_kmaddress) +
3589 				     pfkey_sockaddr_pair_size(k->family));
3590 	}
3591 
3592 	/* selector */
3593 	sasize_sel = pfkey_sockaddr_size(sel->family);
3594 	if (!sasize_sel)
3595 		return -EINVAL;
3596 	size += (sizeof(struct sadb_address) + sasize_sel) * 2;
3597 
3598 	/* policy info */
3599 	size_pol += sizeof(struct sadb_x_policy);
3600 
3601 	/* ipsecrequests */
3602 	for (i = 0, mp = m; i < num_bundles; i++, mp++) {
3603 		int pair_size;
3604 
3605 		pair_size = pfkey_sockaddr_pair_size(mp->old_family);
3606 		if (!pair_size)
3607 			return -EINVAL;
3608 		size_pol += sizeof(struct sadb_x_ipsecrequest) + pair_size;
3609 
3610 		pair_size = pfkey_sockaddr_pair_size(mp->new_family);
3611 		if (!pair_size)
3612 			return -EINVAL;
3613 		size_pol += sizeof(struct sadb_x_ipsecrequest) + pair_size;
3614 	}
3615 
3616 	size += sizeof(struct sadb_msg) + size_pol;
3617 
3618 	/* alloc buffer */
3619 	skb = alloc_skb(size, GFP_ATOMIC);
3620 	if (skb == NULL)
3621 		return -ENOMEM;
3622 
3623 	hdr = skb_put(skb, sizeof(struct sadb_msg));
3624 	hdr->sadb_msg_version = PF_KEY_V2;
3625 	hdr->sadb_msg_type = SADB_X_MIGRATE;
3626 	hdr->sadb_msg_satype = pfkey_proto2satype(m->proto);
3627 	hdr->sadb_msg_len = size / 8;
3628 	hdr->sadb_msg_errno = 0;
3629 	hdr->sadb_msg_reserved = 0;
3630 	hdr->sadb_msg_seq = 0;
3631 	hdr->sadb_msg_pid = 0;
3632 
3633 	/* Addresses to be used by KM for negotiation, if ext is available */
3634 	if (k != NULL && (set_sadb_kmaddress(skb, k) < 0))
3635 		goto err;
3636 
3637 	/* selector src */
3638 	set_sadb_address(skb, sasize_sel, SADB_EXT_ADDRESS_SRC, sel);
3639 
3640 	/* selector dst */
3641 	set_sadb_address(skb, sasize_sel, SADB_EXT_ADDRESS_DST, sel);
3642 
3643 	/* policy information */
3644 	pol = skb_put(skb, sizeof(struct sadb_x_policy));
3645 	pol->sadb_x_policy_len = size_pol / 8;
3646 	pol->sadb_x_policy_exttype = SADB_X_EXT_POLICY;
3647 	pol->sadb_x_policy_type = IPSEC_POLICY_IPSEC;
3648 	pol->sadb_x_policy_dir = dir + 1;
3649 	pol->sadb_x_policy_reserved = 0;
3650 	pol->sadb_x_policy_id = 0;
3651 	pol->sadb_x_policy_priority = 0;
3652 
3653 	for (i = 0, mp = m; i < num_bundles; i++, mp++) {
3654 		/* old ipsecrequest */
3655 		int mode = pfkey_mode_from_xfrm(mp->mode);
3656 		if (mode < 0)
3657 			goto err;
3658 		if (set_ipsecrequest(skb, mp->proto, mode,
3659 				     (mp->old_reqid ? IPSEC_LEVEL_UNIQUE : IPSEC_LEVEL_REQUIRE),
3660 				     mp->old_reqid, mp->old_family,
3661 				     &mp->old_saddr, &mp->old_daddr) < 0)
3662 			goto err;
3663 
3664 		/* new ipsecrequest */
3665 		if (set_ipsecrequest(skb, mp->proto, mode,
3666 				     (mp->old_reqid ? IPSEC_LEVEL_UNIQUE : IPSEC_LEVEL_REQUIRE),
3667 				     mp->old_reqid, mp->new_family,
3668 				     &mp->new_saddr, &mp->new_daddr) < 0)
3669 			goto err;
3670 	}
3671 
3672 	/* broadcast migrate message to sockets */
3673 	pfkey_broadcast(skb, GFP_ATOMIC, BROADCAST_ALL, NULL, net);
3674 
3675 	return 0;
3676 
3677 err:
3678 	kfree_skb(skb);
3679 	return -EINVAL;
3680 }
3681 #else
3682 static int pfkey_send_migrate(const struct xfrm_selector *sel, u8 dir, u8 type,
3683 			      const struct xfrm_migrate *m, int num_bundles,
3684 			      const struct xfrm_kmaddress *k, struct net *net,
3685 			      const struct xfrm_encap_tmpl *encap)
3686 {
3687 	return -ENOPROTOOPT;
3688 }
3689 #endif
3690 
3691 static int pfkey_sendmsg(struct socket *sock, struct msghdr *msg, size_t len)
3692 {
3693 	struct sock *sk = sock->sk;
3694 	struct sk_buff *skb = NULL;
3695 	struct sadb_msg *hdr = NULL;
3696 	int err;
3697 	struct net *net = sock_net(sk);
3698 
3699 	err = -EOPNOTSUPP;
3700 	if (msg->msg_flags & MSG_OOB)
3701 		goto out;
3702 
3703 	err = -EMSGSIZE;
3704 	if ((unsigned int)len > sk->sk_sndbuf - 32)
3705 		goto out;
3706 
3707 	err = -ENOBUFS;
3708 	skb = alloc_skb(len, GFP_KERNEL);
3709 	if (skb == NULL)
3710 		goto out;
3711 
3712 	err = -EFAULT;
3713 	if (memcpy_from_msg(skb_put(skb,len), msg, len))
3714 		goto out;
3715 
3716 	hdr = pfkey_get_base_msg(skb, &err);
3717 	if (!hdr)
3718 		goto out;
3719 
3720 	mutex_lock(&net->xfrm.xfrm_cfg_mutex);
3721 	err = pfkey_process(sk, skb, hdr);
3722 	mutex_unlock(&net->xfrm.xfrm_cfg_mutex);
3723 
3724 out:
3725 	if (err && hdr && pfkey_error(hdr, err, sk) == 0)
3726 		err = 0;
3727 	kfree_skb(skb);
3728 
3729 	return err ? : len;
3730 }
3731 
3732 static int pfkey_recvmsg(struct socket *sock, struct msghdr *msg, size_t len,
3733 			 int flags)
3734 {
3735 	struct sock *sk = sock->sk;
3736 	struct pfkey_sock *pfk = pfkey_sk(sk);
3737 	struct sk_buff *skb;
3738 	int copied, err;
3739 
3740 	err = -EINVAL;
3741 	if (flags & ~(MSG_PEEK|MSG_DONTWAIT|MSG_TRUNC|MSG_CMSG_COMPAT))
3742 		goto out;
3743 
3744 	skb = skb_recv_datagram(sk, flags, &err);
3745 	if (skb == NULL)
3746 		goto out;
3747 
3748 	copied = skb->len;
3749 	if (copied > len) {
3750 		msg->msg_flags |= MSG_TRUNC;
3751 		copied = len;
3752 	}
3753 
3754 	skb_reset_transport_header(skb);
3755 	err = skb_copy_datagram_msg(skb, 0, msg, copied);
3756 	if (err)
3757 		goto out_free;
3758 
3759 	sock_recv_cmsgs(msg, sk, skb);
3760 
3761 	err = (flags & MSG_TRUNC) ? skb->len : copied;
3762 
3763 	if (pfk->dump.dump != NULL &&
3764 	    3 * atomic_read(&sk->sk_rmem_alloc) <= sk->sk_rcvbuf)
3765 		pfkey_do_dump(pfk);
3766 
3767 out_free:
3768 	skb_free_datagram(sk, skb);
3769 out:
3770 	return err;
3771 }
3772 
3773 static const struct proto_ops pfkey_ops = {
3774 	.family		=	PF_KEY,
3775 	.owner		=	THIS_MODULE,
3776 	/* Operations that make no sense on pfkey sockets. */
3777 	.bind		=	sock_no_bind,
3778 	.connect	=	sock_no_connect,
3779 	.socketpair	=	sock_no_socketpair,
3780 	.accept		=	sock_no_accept,
3781 	.getname	=	sock_no_getname,
3782 	.ioctl		=	sock_no_ioctl,
3783 	.listen		=	sock_no_listen,
3784 	.shutdown	=	sock_no_shutdown,
3785 	.mmap		=	sock_no_mmap,
3786 
3787 	/* Now the operations that really occur. */
3788 	.release	=	pfkey_release,
3789 	.poll		=	datagram_poll,
3790 	.sendmsg	=	pfkey_sendmsg,
3791 	.recvmsg	=	pfkey_recvmsg,
3792 };
3793 
3794 static const struct net_proto_family pfkey_family_ops = {
3795 	.family	=	PF_KEY,
3796 	.create	=	pfkey_create,
3797 	.owner	=	THIS_MODULE,
3798 };
3799 
3800 #ifdef CONFIG_PROC_FS
3801 static int pfkey_seq_show(struct seq_file *f, void *v)
3802 {
3803 	struct sock *s = sk_entry(v);
3804 
3805 	if (v == SEQ_START_TOKEN)
3806 		seq_printf(f ,"sk       RefCnt Rmem   Wmem   User   Inode\n");
3807 	else
3808 		seq_printf(f, "%pK %-6d %-6u %-6u %-6u %-6llu\n",
3809 			       s,
3810 			       refcount_read(&s->sk_refcnt),
3811 			       sk_rmem_alloc_get(s),
3812 			       sk_wmem_alloc_get(s),
3813 			       from_kuid_munged(seq_user_ns(f), sk_uid(s)),
3814 			       sock_i_ino(s)
3815 			       );
3816 	return 0;
3817 }
3818 
3819 static void *pfkey_seq_start(struct seq_file *f, loff_t *ppos)
3820 	__acquires(rcu)
3821 {
3822 	struct net *net = seq_file_net(f);
3823 	struct netns_pfkey *net_pfkey = net_generic(net, pfkey_net_id);
3824 
3825 	rcu_read_lock();
3826 	return seq_hlist_start_head_rcu(&net_pfkey->table, *ppos);
3827 }
3828 
3829 static void *pfkey_seq_next(struct seq_file *f, void *v, loff_t *ppos)
3830 {
3831 	struct net *net = seq_file_net(f);
3832 	struct netns_pfkey *net_pfkey = net_generic(net, pfkey_net_id);
3833 
3834 	return seq_hlist_next_rcu(v, &net_pfkey->table, ppos);
3835 }
3836 
3837 static void pfkey_seq_stop(struct seq_file *f, void *v)
3838 	__releases(rcu)
3839 {
3840 	rcu_read_unlock();
3841 }
3842 
3843 static const struct seq_operations pfkey_seq_ops = {
3844 	.start	= pfkey_seq_start,
3845 	.next	= pfkey_seq_next,
3846 	.stop	= pfkey_seq_stop,
3847 	.show	= pfkey_seq_show,
3848 };
3849 
3850 static int __net_init pfkey_init_proc(struct net *net)
3851 {
3852 	struct proc_dir_entry *e;
3853 
3854 	e = proc_create_net("pfkey", 0, net->proc_net, &pfkey_seq_ops,
3855 			sizeof(struct seq_net_private));
3856 	if (e == NULL)
3857 		return -ENOMEM;
3858 
3859 	return 0;
3860 }
3861 
3862 static void __net_exit pfkey_exit_proc(struct net *net)
3863 {
3864 	remove_proc_entry("pfkey", net->proc_net);
3865 }
3866 #else
3867 static inline int pfkey_init_proc(struct net *net)
3868 {
3869 	return 0;
3870 }
3871 
3872 static inline void pfkey_exit_proc(struct net *net)
3873 {
3874 }
3875 #endif
3876 
3877 static struct xfrm_mgr pfkeyv2_mgr =
3878 {
3879 	.notify		= pfkey_send_notify,
3880 	.acquire	= pfkey_send_acquire,
3881 	.compile_policy	= pfkey_compile_policy,
3882 	.new_mapping	= pfkey_send_new_mapping,
3883 	.notify_policy	= pfkey_send_policy_notify,
3884 	.migrate	= pfkey_send_migrate,
3885 	.is_alive	= pfkey_is_alive,
3886 };
3887 
3888 static int __net_init pfkey_net_init(struct net *net)
3889 {
3890 	struct netns_pfkey *net_pfkey = net_generic(net, pfkey_net_id);
3891 	int rv;
3892 
3893 	INIT_HLIST_HEAD(&net_pfkey->table);
3894 	atomic_set(&net_pfkey->socks_nr, 0);
3895 
3896 	rv = pfkey_init_proc(net);
3897 
3898 	return rv;
3899 }
3900 
3901 static void __net_exit pfkey_net_exit(struct net *net)
3902 {
3903 	struct netns_pfkey *net_pfkey = net_generic(net, pfkey_net_id);
3904 
3905 	pfkey_exit_proc(net);
3906 	WARN_ON(!hlist_empty(&net_pfkey->table));
3907 }
3908 
3909 static struct pernet_operations pfkey_net_ops = {
3910 	.init = pfkey_net_init,
3911 	.exit = pfkey_net_exit,
3912 	.id   = &pfkey_net_id,
3913 	.size = sizeof(struct netns_pfkey),
3914 };
3915 
3916 static void __exit ipsec_pfkey_exit(void)
3917 {
3918 	xfrm_unregister_km(&pfkeyv2_mgr);
3919 	sock_unregister(PF_KEY);
3920 	unregister_pernet_subsys(&pfkey_net_ops);
3921 	proto_unregister(&key_proto);
3922 }
3923 
3924 static int __init ipsec_pfkey_init(void)
3925 {
3926 	int err = proto_register(&key_proto, 0);
3927 
3928 	pr_warn_once("PFKEY is deprecated and scheduled to be removed in 2027, "
3929 	             "please contact the netdev mailing list\n");
3930 	if (err != 0)
3931 		goto out;
3932 
3933 	err = register_pernet_subsys(&pfkey_net_ops);
3934 	if (err != 0)
3935 		goto out_unregister_key_proto;
3936 	err = sock_register(&pfkey_family_ops);
3937 	if (err != 0)
3938 		goto out_unregister_pernet;
3939 	xfrm_register_km(&pfkeyv2_mgr);
3940 out:
3941 	return err;
3942 
3943 out_unregister_pernet:
3944 	unregister_pernet_subsys(&pfkey_net_ops);
3945 out_unregister_key_proto:
3946 	proto_unregister(&key_proto);
3947 	goto out;
3948 }
3949 
3950 module_init(ipsec_pfkey_init);
3951 module_exit(ipsec_pfkey_exit);
3952 MODULE_DESCRIPTION("PF_KEY socket helpers");
3953 MODULE_LICENSE("GPL");
3954 MODULE_ALIAS_NETPROTO(PF_KEY);
3955