xref: /linux/net/key/af_key.c (revision 6ede2b7df92f4f8da1abfa831a038688fcf409ea)
1 /*
2  * net/key/af_key.c	An implementation of PF_KEYv2 sockets.
3  *
4  *		This program is free software; you can redistribute it and/or
5  *		modify it under the terms of the GNU General Public License
6  *		as published by the Free Software Foundation; either version
7  *		2 of the License, or (at your option) any later version.
8  *
9  * Authors:	Maxim Giryaev	<gem@asplinux.ru>
10  *		David S. Miller	<davem@redhat.com>
11  *		Alexey Kuznetsov <kuznet@ms2.inr.ac.ru>
12  *		Kunihiro Ishiguro <kunihiro@ipinfusion.com>
13  *		Kazunori MIYAZAWA / USAGI Project <miyazawa@linux-ipv6.org>
14  *		Derek Atkins <derek@ihtfp.com>
15  */
16 
17 #include <linux/capability.h>
18 #include <linux/module.h>
19 #include <linux/kernel.h>
20 #include <linux/socket.h>
21 #include <linux/pfkeyv2.h>
22 #include <linux/ipsec.h>
23 #include <linux/skbuff.h>
24 #include <linux/rtnetlink.h>
25 #include <linux/in.h>
26 #include <linux/in6.h>
27 #include <linux/proc_fs.h>
28 #include <linux/init.h>
29 #include <linux/slab.h>
30 #include <net/net_namespace.h>
31 #include <net/netns/generic.h>
32 #include <net/xfrm.h>
33 
34 #include <net/sock.h>
35 
36 #define _X2KEY(x) ((x) == XFRM_INF ? 0 : (x))
37 #define _KEY2X(x) ((x) == 0 ? XFRM_INF : (x))
38 
39 static unsigned int pfkey_net_id __read_mostly;
40 struct netns_pfkey {
41 	/* List of all pfkey sockets. */
42 	struct hlist_head table;
43 	atomic_t socks_nr;
44 };
45 static DEFINE_MUTEX(pfkey_mutex);
46 
47 #define DUMMY_MARK 0
48 static const struct xfrm_mark dummy_mark = {0, 0};
49 struct pfkey_sock {
50 	/* struct sock must be the first member of struct pfkey_sock */
51 	struct sock	sk;
52 	int		registered;
53 	int		promisc;
54 
55 	struct {
56 		uint8_t		msg_version;
57 		uint32_t	msg_portid;
58 		int		(*dump)(struct pfkey_sock *sk);
59 		void		(*done)(struct pfkey_sock *sk);
60 		union {
61 			struct xfrm_policy_walk	policy;
62 			struct xfrm_state_walk	state;
63 		} u;
64 		struct sk_buff	*skb;
65 	} dump;
66 	struct mutex dump_lock;
67 };
68 
69 static int parse_sockaddr_pair(struct sockaddr *sa, int ext_len,
70 			       xfrm_address_t *saddr, xfrm_address_t *daddr,
71 			       u16 *family);
72 
73 static inline struct pfkey_sock *pfkey_sk(struct sock *sk)
74 {
75 	return (struct pfkey_sock *)sk;
76 }
77 
78 static int pfkey_can_dump(const struct sock *sk)
79 {
80 	if (3 * atomic_read(&sk->sk_rmem_alloc) <= 2 * sk->sk_rcvbuf)
81 		return 1;
82 	return 0;
83 }
84 
85 static void pfkey_terminate_dump(struct pfkey_sock *pfk)
86 {
87 	if (pfk->dump.dump) {
88 		if (pfk->dump.skb) {
89 			kfree_skb(pfk->dump.skb);
90 			pfk->dump.skb = NULL;
91 		}
92 		pfk->dump.done(pfk);
93 		pfk->dump.dump = NULL;
94 		pfk->dump.done = NULL;
95 	}
96 }
97 
98 static void pfkey_sock_destruct(struct sock *sk)
99 {
100 	struct net *net = sock_net(sk);
101 	struct netns_pfkey *net_pfkey = net_generic(net, pfkey_net_id);
102 
103 	pfkey_terminate_dump(pfkey_sk(sk));
104 	skb_queue_purge(&sk->sk_receive_queue);
105 
106 	if (!sock_flag(sk, SOCK_DEAD)) {
107 		pr_err("Attempt to release alive pfkey socket: %p\n", sk);
108 		return;
109 	}
110 
111 	WARN_ON(atomic_read(&sk->sk_rmem_alloc));
112 	WARN_ON(atomic_read(&sk->sk_wmem_alloc));
113 
114 	atomic_dec(&net_pfkey->socks_nr);
115 }
116 
117 static const struct proto_ops pfkey_ops;
118 
119 static void pfkey_insert(struct sock *sk)
120 {
121 	struct net *net = sock_net(sk);
122 	struct netns_pfkey *net_pfkey = net_generic(net, pfkey_net_id);
123 
124 	mutex_lock(&pfkey_mutex);
125 	sk_add_node_rcu(sk, &net_pfkey->table);
126 	mutex_unlock(&pfkey_mutex);
127 }
128 
129 static void pfkey_remove(struct sock *sk)
130 {
131 	mutex_lock(&pfkey_mutex);
132 	sk_del_node_init_rcu(sk);
133 	mutex_unlock(&pfkey_mutex);
134 }
135 
136 static struct proto key_proto = {
137 	.name	  = "KEY",
138 	.owner	  = THIS_MODULE,
139 	.obj_size = sizeof(struct pfkey_sock),
140 };
141 
142 static int pfkey_create(struct net *net, struct socket *sock, int protocol,
143 			int kern)
144 {
145 	struct netns_pfkey *net_pfkey = net_generic(net, pfkey_net_id);
146 	struct sock *sk;
147 	struct pfkey_sock *pfk;
148 	int err;
149 
150 	if (!ns_capable(net->user_ns, CAP_NET_ADMIN))
151 		return -EPERM;
152 	if (sock->type != SOCK_RAW)
153 		return -ESOCKTNOSUPPORT;
154 	if (protocol != PF_KEY_V2)
155 		return -EPROTONOSUPPORT;
156 
157 	err = -ENOMEM;
158 	sk = sk_alloc(net, PF_KEY, GFP_KERNEL, &key_proto, kern);
159 	if (sk == NULL)
160 		goto out;
161 
162 	pfk = pfkey_sk(sk);
163 	mutex_init(&pfk->dump_lock);
164 
165 	sock->ops = &pfkey_ops;
166 	sock_init_data(sock, sk);
167 
168 	sk->sk_family = PF_KEY;
169 	sk->sk_destruct = pfkey_sock_destruct;
170 
171 	atomic_inc(&net_pfkey->socks_nr);
172 
173 	pfkey_insert(sk);
174 
175 	return 0;
176 out:
177 	return err;
178 }
179 
180 static int pfkey_release(struct socket *sock)
181 {
182 	struct sock *sk = sock->sk;
183 
184 	if (!sk)
185 		return 0;
186 
187 	pfkey_remove(sk);
188 
189 	sock_orphan(sk);
190 	sock->sk = NULL;
191 	skb_queue_purge(&sk->sk_write_queue);
192 
193 	synchronize_rcu();
194 	sock_put(sk);
195 
196 	return 0;
197 }
198 
199 static int pfkey_broadcast_one(struct sk_buff *skb, struct sk_buff **skb2,
200 			       gfp_t allocation, struct sock *sk)
201 {
202 	int err = -ENOBUFS;
203 
204 	sock_hold(sk);
205 	if (*skb2 == NULL) {
206 		if (atomic_read(&skb->users) != 1) {
207 			*skb2 = skb_clone(skb, allocation);
208 		} else {
209 			*skb2 = skb;
210 			atomic_inc(&skb->users);
211 		}
212 	}
213 	if (*skb2 != NULL) {
214 		if (atomic_read(&sk->sk_rmem_alloc) <= sk->sk_rcvbuf) {
215 			skb_set_owner_r(*skb2, sk);
216 			skb_queue_tail(&sk->sk_receive_queue, *skb2);
217 			sk->sk_data_ready(sk);
218 			*skb2 = NULL;
219 			err = 0;
220 		}
221 	}
222 	sock_put(sk);
223 	return err;
224 }
225 
226 /* Send SKB to all pfkey sockets matching selected criteria.  */
227 #define BROADCAST_ALL		0
228 #define BROADCAST_ONE		1
229 #define BROADCAST_REGISTERED	2
230 #define BROADCAST_PROMISC_ONLY	4
231 static int pfkey_broadcast(struct sk_buff *skb,
232 			   int broadcast_flags, struct sock *one_sk,
233 			   struct net *net)
234 {
235 	struct netns_pfkey *net_pfkey = net_generic(net, pfkey_net_id);
236 	struct sock *sk;
237 	struct sk_buff *skb2 = NULL;
238 	int err = -ESRCH;
239 
240 	/* XXX Do we need something like netlink_overrun?  I think
241 	 * XXX PF_KEY socket apps will not mind current behavior.
242 	 */
243 	if (!skb)
244 		return -ENOMEM;
245 
246 	rcu_read_lock();
247 	sk_for_each_rcu(sk, &net_pfkey->table) {
248 		struct pfkey_sock *pfk = pfkey_sk(sk);
249 		int err2;
250 
251 		/* Yes, it means that if you are meant to receive this
252 		 * pfkey message you receive it twice as promiscuous
253 		 * socket.
254 		 */
255 		if (pfk->promisc)
256 			pfkey_broadcast_one(skb, &skb2, GFP_ATOMIC, sk);
257 
258 		/* the exact target will be processed later */
259 		if (sk == one_sk)
260 			continue;
261 		if (broadcast_flags != BROADCAST_ALL) {
262 			if (broadcast_flags & BROADCAST_PROMISC_ONLY)
263 				continue;
264 			if ((broadcast_flags & BROADCAST_REGISTERED) &&
265 			    !pfk->registered)
266 				continue;
267 			if (broadcast_flags & BROADCAST_ONE)
268 				continue;
269 		}
270 
271 		err2 = pfkey_broadcast_one(skb, &skb2, GFP_ATOMIC, sk);
272 
273 		/* Error is cleared after successful sending to at least one
274 		 * registered KM */
275 		if ((broadcast_flags & BROADCAST_REGISTERED) && err)
276 			err = err2;
277 	}
278 	rcu_read_unlock();
279 
280 	if (one_sk != NULL)
281 		err = pfkey_broadcast_one(skb, &skb2, GFP_KERNEL, one_sk);
282 
283 	kfree_skb(skb2);
284 	kfree_skb(skb);
285 	return err;
286 }
287 
288 static int pfkey_do_dump(struct pfkey_sock *pfk)
289 {
290 	struct sadb_msg *hdr;
291 	int rc;
292 
293 	mutex_lock(&pfk->dump_lock);
294 	if (!pfk->dump.dump) {
295 		rc = 0;
296 		goto out;
297 	}
298 
299 	rc = pfk->dump.dump(pfk);
300 	if (rc == -ENOBUFS) {
301 		rc = 0;
302 		goto out;
303 	}
304 
305 	if (pfk->dump.skb) {
306 		if (!pfkey_can_dump(&pfk->sk)) {
307 			rc = 0;
308 			goto out;
309 		}
310 
311 		hdr = (struct sadb_msg *) pfk->dump.skb->data;
312 		hdr->sadb_msg_seq = 0;
313 		hdr->sadb_msg_errno = rc;
314 		pfkey_broadcast(pfk->dump.skb, BROADCAST_ONE,
315 				&pfk->sk, sock_net(&pfk->sk));
316 		pfk->dump.skb = NULL;
317 	}
318 
319 	pfkey_terminate_dump(pfk);
320 
321 out:
322 	mutex_unlock(&pfk->dump_lock);
323 	return rc;
324 }
325 
326 static inline void pfkey_hdr_dup(struct sadb_msg *new,
327 				 const struct sadb_msg *orig)
328 {
329 	*new = *orig;
330 }
331 
332 static int pfkey_error(const struct sadb_msg *orig, int err, struct sock *sk)
333 {
334 	struct sk_buff *skb = alloc_skb(sizeof(struct sadb_msg) + 16, GFP_KERNEL);
335 	struct sadb_msg *hdr;
336 
337 	if (!skb)
338 		return -ENOBUFS;
339 
340 	/* Woe be to the platform trying to support PFKEY yet
341 	 * having normal errnos outside the 1-255 range, inclusive.
342 	 */
343 	err = -err;
344 	if (err == ERESTARTSYS ||
345 	    err == ERESTARTNOHAND ||
346 	    err == ERESTARTNOINTR)
347 		err = EINTR;
348 	if (err >= 512)
349 		err = EINVAL;
350 	BUG_ON(err <= 0 || err >= 256);
351 
352 	hdr = (struct sadb_msg *) skb_put(skb, sizeof(struct sadb_msg));
353 	pfkey_hdr_dup(hdr, orig);
354 	hdr->sadb_msg_errno = (uint8_t) err;
355 	hdr->sadb_msg_len = (sizeof(struct sadb_msg) /
356 			     sizeof(uint64_t));
357 
358 	pfkey_broadcast(skb, BROADCAST_ONE, sk, sock_net(sk));
359 
360 	return 0;
361 }
362 
363 static const u8 sadb_ext_min_len[] = {
364 	[SADB_EXT_RESERVED]		= (u8) 0,
365 	[SADB_EXT_SA]			= (u8) sizeof(struct sadb_sa),
366 	[SADB_EXT_LIFETIME_CURRENT]	= (u8) sizeof(struct sadb_lifetime),
367 	[SADB_EXT_LIFETIME_HARD]	= (u8) sizeof(struct sadb_lifetime),
368 	[SADB_EXT_LIFETIME_SOFT]	= (u8) sizeof(struct sadb_lifetime),
369 	[SADB_EXT_ADDRESS_SRC]		= (u8) sizeof(struct sadb_address),
370 	[SADB_EXT_ADDRESS_DST]		= (u8) sizeof(struct sadb_address),
371 	[SADB_EXT_ADDRESS_PROXY]	= (u8) sizeof(struct sadb_address),
372 	[SADB_EXT_KEY_AUTH]		= (u8) sizeof(struct sadb_key),
373 	[SADB_EXT_KEY_ENCRYPT]		= (u8) sizeof(struct sadb_key),
374 	[SADB_EXT_IDENTITY_SRC]		= (u8) sizeof(struct sadb_ident),
375 	[SADB_EXT_IDENTITY_DST]		= (u8) sizeof(struct sadb_ident),
376 	[SADB_EXT_SENSITIVITY]		= (u8) sizeof(struct sadb_sens),
377 	[SADB_EXT_PROPOSAL]		= (u8) sizeof(struct sadb_prop),
378 	[SADB_EXT_SUPPORTED_AUTH]	= (u8) sizeof(struct sadb_supported),
379 	[SADB_EXT_SUPPORTED_ENCRYPT]	= (u8) sizeof(struct sadb_supported),
380 	[SADB_EXT_SPIRANGE]		= (u8) sizeof(struct sadb_spirange),
381 	[SADB_X_EXT_KMPRIVATE]		= (u8) sizeof(struct sadb_x_kmprivate),
382 	[SADB_X_EXT_POLICY]		= (u8) sizeof(struct sadb_x_policy),
383 	[SADB_X_EXT_SA2]		= (u8) sizeof(struct sadb_x_sa2),
384 	[SADB_X_EXT_NAT_T_TYPE]		= (u8) sizeof(struct sadb_x_nat_t_type),
385 	[SADB_X_EXT_NAT_T_SPORT]	= (u8) sizeof(struct sadb_x_nat_t_port),
386 	[SADB_X_EXT_NAT_T_DPORT]	= (u8) sizeof(struct sadb_x_nat_t_port),
387 	[SADB_X_EXT_NAT_T_OA]		= (u8) sizeof(struct sadb_address),
388 	[SADB_X_EXT_SEC_CTX]		= (u8) sizeof(struct sadb_x_sec_ctx),
389 	[SADB_X_EXT_KMADDRESS]		= (u8) sizeof(struct sadb_x_kmaddress),
390 	[SADB_X_EXT_FILTER]		= (u8) sizeof(struct sadb_x_filter),
391 };
392 
393 /* Verify sadb_address_{len,prefixlen} against sa_family.  */
394 static int verify_address_len(const void *p)
395 {
396 	const struct sadb_address *sp = p;
397 	const struct sockaddr *addr = (const struct sockaddr *)(sp + 1);
398 	const struct sockaddr_in *sin;
399 #if IS_ENABLED(CONFIG_IPV6)
400 	const struct sockaddr_in6 *sin6;
401 #endif
402 	int len;
403 
404 	switch (addr->sa_family) {
405 	case AF_INET:
406 		len = DIV_ROUND_UP(sizeof(*sp) + sizeof(*sin), sizeof(uint64_t));
407 		if (sp->sadb_address_len != len ||
408 		    sp->sadb_address_prefixlen > 32)
409 			return -EINVAL;
410 		break;
411 #if IS_ENABLED(CONFIG_IPV6)
412 	case AF_INET6:
413 		len = DIV_ROUND_UP(sizeof(*sp) + sizeof(*sin6), sizeof(uint64_t));
414 		if (sp->sadb_address_len != len ||
415 		    sp->sadb_address_prefixlen > 128)
416 			return -EINVAL;
417 		break;
418 #endif
419 	default:
420 		/* It is user using kernel to keep track of security
421 		 * associations for another protocol, such as
422 		 * OSPF/RSVP/RIPV2/MIP.  It is user's job to verify
423 		 * lengths.
424 		 *
425 		 * XXX Actually, association/policy database is not yet
426 		 * XXX able to cope with arbitrary sockaddr families.
427 		 * XXX When it can, remove this -EINVAL.  -DaveM
428 		 */
429 		return -EINVAL;
430 	}
431 
432 	return 0;
433 }
434 
435 static inline int pfkey_sec_ctx_len(const struct sadb_x_sec_ctx *sec_ctx)
436 {
437 	return DIV_ROUND_UP(sizeof(struct sadb_x_sec_ctx) +
438 			    sec_ctx->sadb_x_ctx_len,
439 			    sizeof(uint64_t));
440 }
441 
442 static inline int verify_sec_ctx_len(const void *p)
443 {
444 	const struct sadb_x_sec_ctx *sec_ctx = p;
445 	int len = sec_ctx->sadb_x_ctx_len;
446 
447 	if (len > PAGE_SIZE)
448 		return -EINVAL;
449 
450 	len = pfkey_sec_ctx_len(sec_ctx);
451 
452 	if (sec_ctx->sadb_x_sec_len != len)
453 		return -EINVAL;
454 
455 	return 0;
456 }
457 
458 static inline struct xfrm_user_sec_ctx *pfkey_sadb2xfrm_user_sec_ctx(const struct sadb_x_sec_ctx *sec_ctx,
459 								     gfp_t gfp)
460 {
461 	struct xfrm_user_sec_ctx *uctx = NULL;
462 	int ctx_size = sec_ctx->sadb_x_ctx_len;
463 
464 	uctx = kmalloc((sizeof(*uctx)+ctx_size), gfp);
465 
466 	if (!uctx)
467 		return NULL;
468 
469 	uctx->len = pfkey_sec_ctx_len(sec_ctx);
470 	uctx->exttype = sec_ctx->sadb_x_sec_exttype;
471 	uctx->ctx_doi = sec_ctx->sadb_x_ctx_doi;
472 	uctx->ctx_alg = sec_ctx->sadb_x_ctx_alg;
473 	uctx->ctx_len = sec_ctx->sadb_x_ctx_len;
474 	memcpy(uctx + 1, sec_ctx + 1,
475 	       uctx->ctx_len);
476 
477 	return uctx;
478 }
479 
480 static int present_and_same_family(const struct sadb_address *src,
481 				   const struct sadb_address *dst)
482 {
483 	const struct sockaddr *s_addr, *d_addr;
484 
485 	if (!src || !dst)
486 		return 0;
487 
488 	s_addr = (const struct sockaddr *)(src + 1);
489 	d_addr = (const struct sockaddr *)(dst + 1);
490 	if (s_addr->sa_family != d_addr->sa_family)
491 		return 0;
492 	if (s_addr->sa_family != AF_INET
493 #if IS_ENABLED(CONFIG_IPV6)
494 	    && s_addr->sa_family != AF_INET6
495 #endif
496 		)
497 		return 0;
498 
499 	return 1;
500 }
501 
502 static int parse_exthdrs(struct sk_buff *skb, const struct sadb_msg *hdr, void **ext_hdrs)
503 {
504 	const char *p = (char *) hdr;
505 	int len = skb->len;
506 
507 	len -= sizeof(*hdr);
508 	p += sizeof(*hdr);
509 	while (len > 0) {
510 		const struct sadb_ext *ehdr = (const struct sadb_ext *) p;
511 		uint16_t ext_type;
512 		int ext_len;
513 
514 		ext_len  = ehdr->sadb_ext_len;
515 		ext_len *= sizeof(uint64_t);
516 		ext_type = ehdr->sadb_ext_type;
517 		if (ext_len < sizeof(uint64_t) ||
518 		    ext_len > len ||
519 		    ext_type == SADB_EXT_RESERVED)
520 			return -EINVAL;
521 
522 		if (ext_type <= SADB_EXT_MAX) {
523 			int min = (int) sadb_ext_min_len[ext_type];
524 			if (ext_len < min)
525 				return -EINVAL;
526 			if (ext_hdrs[ext_type-1] != NULL)
527 				return -EINVAL;
528 			if (ext_type == SADB_EXT_ADDRESS_SRC ||
529 			    ext_type == SADB_EXT_ADDRESS_DST ||
530 			    ext_type == SADB_EXT_ADDRESS_PROXY ||
531 			    ext_type == SADB_X_EXT_NAT_T_OA) {
532 				if (verify_address_len(p))
533 					return -EINVAL;
534 			}
535 			if (ext_type == SADB_X_EXT_SEC_CTX) {
536 				if (verify_sec_ctx_len(p))
537 					return -EINVAL;
538 			}
539 			ext_hdrs[ext_type-1] = (void *) p;
540 		}
541 		p   += ext_len;
542 		len -= ext_len;
543 	}
544 
545 	return 0;
546 }
547 
548 static uint16_t
549 pfkey_satype2proto(uint8_t satype)
550 {
551 	switch (satype) {
552 	case SADB_SATYPE_UNSPEC:
553 		return IPSEC_PROTO_ANY;
554 	case SADB_SATYPE_AH:
555 		return IPPROTO_AH;
556 	case SADB_SATYPE_ESP:
557 		return IPPROTO_ESP;
558 	case SADB_X_SATYPE_IPCOMP:
559 		return IPPROTO_COMP;
560 	default:
561 		return 0;
562 	}
563 	/* NOTREACHED */
564 }
565 
566 static uint8_t
567 pfkey_proto2satype(uint16_t proto)
568 {
569 	switch (proto) {
570 	case IPPROTO_AH:
571 		return SADB_SATYPE_AH;
572 	case IPPROTO_ESP:
573 		return SADB_SATYPE_ESP;
574 	case IPPROTO_COMP:
575 		return SADB_X_SATYPE_IPCOMP;
576 	default:
577 		return 0;
578 	}
579 	/* NOTREACHED */
580 }
581 
582 /* BTW, this scheme means that there is no way with PFKEY2 sockets to
583  * say specifically 'just raw sockets' as we encode them as 255.
584  */
585 
586 static uint8_t pfkey_proto_to_xfrm(uint8_t proto)
587 {
588 	return proto == IPSEC_PROTO_ANY ? 0 : proto;
589 }
590 
591 static uint8_t pfkey_proto_from_xfrm(uint8_t proto)
592 {
593 	return proto ? proto : IPSEC_PROTO_ANY;
594 }
595 
596 static inline int pfkey_sockaddr_len(sa_family_t family)
597 {
598 	switch (family) {
599 	case AF_INET:
600 		return sizeof(struct sockaddr_in);
601 #if IS_ENABLED(CONFIG_IPV6)
602 	case AF_INET6:
603 		return sizeof(struct sockaddr_in6);
604 #endif
605 	}
606 	return 0;
607 }
608 
609 static
610 int pfkey_sockaddr_extract(const struct sockaddr *sa, xfrm_address_t *xaddr)
611 {
612 	switch (sa->sa_family) {
613 	case AF_INET:
614 		xaddr->a4 =
615 			((struct sockaddr_in *)sa)->sin_addr.s_addr;
616 		return AF_INET;
617 #if IS_ENABLED(CONFIG_IPV6)
618 	case AF_INET6:
619 		memcpy(xaddr->a6,
620 		       &((struct sockaddr_in6 *)sa)->sin6_addr,
621 		       sizeof(struct in6_addr));
622 		return AF_INET6;
623 #endif
624 	}
625 	return 0;
626 }
627 
628 static
629 int pfkey_sadb_addr2xfrm_addr(const struct sadb_address *addr, xfrm_address_t *xaddr)
630 {
631 	return pfkey_sockaddr_extract((struct sockaddr *)(addr + 1),
632 				      xaddr);
633 }
634 
635 static struct  xfrm_state *pfkey_xfrm_state_lookup(struct net *net, const struct sadb_msg *hdr, void * const *ext_hdrs)
636 {
637 	const struct sadb_sa *sa;
638 	const struct sadb_address *addr;
639 	uint16_t proto;
640 	unsigned short family;
641 	xfrm_address_t *xaddr;
642 
643 	sa = ext_hdrs[SADB_EXT_SA - 1];
644 	if (sa == NULL)
645 		return NULL;
646 
647 	proto = pfkey_satype2proto(hdr->sadb_msg_satype);
648 	if (proto == 0)
649 		return NULL;
650 
651 	/* sadb_address_len should be checked by caller */
652 	addr = ext_hdrs[SADB_EXT_ADDRESS_DST - 1];
653 	if (addr == NULL)
654 		return NULL;
655 
656 	family = ((const struct sockaddr *)(addr + 1))->sa_family;
657 	switch (family) {
658 	case AF_INET:
659 		xaddr = (xfrm_address_t *)&((const struct sockaddr_in *)(addr + 1))->sin_addr;
660 		break;
661 #if IS_ENABLED(CONFIG_IPV6)
662 	case AF_INET6:
663 		xaddr = (xfrm_address_t *)&((const struct sockaddr_in6 *)(addr + 1))->sin6_addr;
664 		break;
665 #endif
666 	default:
667 		xaddr = NULL;
668 	}
669 
670 	if (!xaddr)
671 		return NULL;
672 
673 	return xfrm_state_lookup(net, DUMMY_MARK, xaddr, sa->sadb_sa_spi, proto, family);
674 }
675 
676 #define PFKEY_ALIGN8(a) (1 + (((a) - 1) | (8 - 1)))
677 
678 static int
679 pfkey_sockaddr_size(sa_family_t family)
680 {
681 	return PFKEY_ALIGN8(pfkey_sockaddr_len(family));
682 }
683 
684 static inline int pfkey_mode_from_xfrm(int mode)
685 {
686 	switch(mode) {
687 	case XFRM_MODE_TRANSPORT:
688 		return IPSEC_MODE_TRANSPORT;
689 	case XFRM_MODE_TUNNEL:
690 		return IPSEC_MODE_TUNNEL;
691 	case XFRM_MODE_BEET:
692 		return IPSEC_MODE_BEET;
693 	default:
694 		return -1;
695 	}
696 }
697 
698 static inline int pfkey_mode_to_xfrm(int mode)
699 {
700 	switch(mode) {
701 	case IPSEC_MODE_ANY:	/*XXX*/
702 	case IPSEC_MODE_TRANSPORT:
703 		return XFRM_MODE_TRANSPORT;
704 	case IPSEC_MODE_TUNNEL:
705 		return XFRM_MODE_TUNNEL;
706 	case IPSEC_MODE_BEET:
707 		return XFRM_MODE_BEET;
708 	default:
709 		return -1;
710 	}
711 }
712 
713 static unsigned int pfkey_sockaddr_fill(const xfrm_address_t *xaddr, __be16 port,
714 					struct sockaddr *sa,
715 					unsigned short family)
716 {
717 	switch (family) {
718 	case AF_INET:
719 	    {
720 		struct sockaddr_in *sin = (struct sockaddr_in *)sa;
721 		sin->sin_family = AF_INET;
722 		sin->sin_port = port;
723 		sin->sin_addr.s_addr = xaddr->a4;
724 		memset(sin->sin_zero, 0, sizeof(sin->sin_zero));
725 		return 32;
726 	    }
727 #if IS_ENABLED(CONFIG_IPV6)
728 	case AF_INET6:
729 	    {
730 		struct sockaddr_in6 *sin6 = (struct sockaddr_in6 *)sa;
731 		sin6->sin6_family = AF_INET6;
732 		sin6->sin6_port = port;
733 		sin6->sin6_flowinfo = 0;
734 		sin6->sin6_addr = xaddr->in6;
735 		sin6->sin6_scope_id = 0;
736 		return 128;
737 	    }
738 #endif
739 	}
740 	return 0;
741 }
742 
743 static struct sk_buff *__pfkey_xfrm_state2msg(const struct xfrm_state *x,
744 					      int add_keys, int hsc)
745 {
746 	struct sk_buff *skb;
747 	struct sadb_msg *hdr;
748 	struct sadb_sa *sa;
749 	struct sadb_lifetime *lifetime;
750 	struct sadb_address *addr;
751 	struct sadb_key *key;
752 	struct sadb_x_sa2 *sa2;
753 	struct sadb_x_sec_ctx *sec_ctx;
754 	struct xfrm_sec_ctx *xfrm_ctx;
755 	int ctx_size = 0;
756 	int size;
757 	int auth_key_size = 0;
758 	int encrypt_key_size = 0;
759 	int sockaddr_size;
760 	struct xfrm_encap_tmpl *natt = NULL;
761 	int mode;
762 
763 	/* address family check */
764 	sockaddr_size = pfkey_sockaddr_size(x->props.family);
765 	if (!sockaddr_size)
766 		return ERR_PTR(-EINVAL);
767 
768 	/* base, SA, (lifetime (HSC),) address(SD), (address(P),)
769 	   key(AE), (identity(SD),) (sensitivity)> */
770 	size = sizeof(struct sadb_msg) +sizeof(struct sadb_sa) +
771 		sizeof(struct sadb_lifetime) +
772 		((hsc & 1) ? sizeof(struct sadb_lifetime) : 0) +
773 		((hsc & 2) ? sizeof(struct sadb_lifetime) : 0) +
774 			sizeof(struct sadb_address)*2 +
775 				sockaddr_size*2 +
776 					sizeof(struct sadb_x_sa2);
777 
778 	if ((xfrm_ctx = x->security)) {
779 		ctx_size = PFKEY_ALIGN8(xfrm_ctx->ctx_len);
780 		size += sizeof(struct sadb_x_sec_ctx) + ctx_size;
781 	}
782 
783 	/* identity & sensitivity */
784 	if (!xfrm_addr_equal(&x->sel.saddr, &x->props.saddr, x->props.family))
785 		size += sizeof(struct sadb_address) + sockaddr_size;
786 
787 	if (add_keys) {
788 		if (x->aalg && x->aalg->alg_key_len) {
789 			auth_key_size =
790 				PFKEY_ALIGN8((x->aalg->alg_key_len + 7) / 8);
791 			size += sizeof(struct sadb_key) + auth_key_size;
792 		}
793 		if (x->ealg && x->ealg->alg_key_len) {
794 			encrypt_key_size =
795 				PFKEY_ALIGN8((x->ealg->alg_key_len+7) / 8);
796 			size += sizeof(struct sadb_key) + encrypt_key_size;
797 		}
798 	}
799 	if (x->encap)
800 		natt = x->encap;
801 
802 	if (natt && natt->encap_type) {
803 		size += sizeof(struct sadb_x_nat_t_type);
804 		size += sizeof(struct sadb_x_nat_t_port);
805 		size += sizeof(struct sadb_x_nat_t_port);
806 	}
807 
808 	skb =  alloc_skb(size + 16, GFP_ATOMIC);
809 	if (skb == NULL)
810 		return ERR_PTR(-ENOBUFS);
811 
812 	/* call should fill header later */
813 	hdr = (struct sadb_msg *) skb_put(skb, sizeof(struct sadb_msg));
814 	memset(hdr, 0, size);	/* XXX do we need this ? */
815 	hdr->sadb_msg_len = size / sizeof(uint64_t);
816 
817 	/* sa */
818 	sa = (struct sadb_sa *)  skb_put(skb, sizeof(struct sadb_sa));
819 	sa->sadb_sa_len = sizeof(struct sadb_sa)/sizeof(uint64_t);
820 	sa->sadb_sa_exttype = SADB_EXT_SA;
821 	sa->sadb_sa_spi = x->id.spi;
822 	sa->sadb_sa_replay = x->props.replay_window;
823 	switch (x->km.state) {
824 	case XFRM_STATE_VALID:
825 		sa->sadb_sa_state = x->km.dying ?
826 			SADB_SASTATE_DYING : SADB_SASTATE_MATURE;
827 		break;
828 	case XFRM_STATE_ACQ:
829 		sa->sadb_sa_state = SADB_SASTATE_LARVAL;
830 		break;
831 	default:
832 		sa->sadb_sa_state = SADB_SASTATE_DEAD;
833 		break;
834 	}
835 	sa->sadb_sa_auth = 0;
836 	if (x->aalg) {
837 		struct xfrm_algo_desc *a = xfrm_aalg_get_byname(x->aalg->alg_name, 0);
838 		sa->sadb_sa_auth = (a && a->pfkey_supported) ?
839 					a->desc.sadb_alg_id : 0;
840 	}
841 	sa->sadb_sa_encrypt = 0;
842 	BUG_ON(x->ealg && x->calg);
843 	if (x->ealg) {
844 		struct xfrm_algo_desc *a = xfrm_ealg_get_byname(x->ealg->alg_name, 0);
845 		sa->sadb_sa_encrypt = (a && a->pfkey_supported) ?
846 					a->desc.sadb_alg_id : 0;
847 	}
848 	/* KAME compatible: sadb_sa_encrypt is overloaded with calg id */
849 	if (x->calg) {
850 		struct xfrm_algo_desc *a = xfrm_calg_get_byname(x->calg->alg_name, 0);
851 		sa->sadb_sa_encrypt = (a && a->pfkey_supported) ?
852 					a->desc.sadb_alg_id : 0;
853 	}
854 
855 	sa->sadb_sa_flags = 0;
856 	if (x->props.flags & XFRM_STATE_NOECN)
857 		sa->sadb_sa_flags |= SADB_SAFLAGS_NOECN;
858 	if (x->props.flags & XFRM_STATE_DECAP_DSCP)
859 		sa->sadb_sa_flags |= SADB_SAFLAGS_DECAP_DSCP;
860 	if (x->props.flags & XFRM_STATE_NOPMTUDISC)
861 		sa->sadb_sa_flags |= SADB_SAFLAGS_NOPMTUDISC;
862 
863 	/* hard time */
864 	if (hsc & 2) {
865 		lifetime = (struct sadb_lifetime *)  skb_put(skb,
866 							     sizeof(struct sadb_lifetime));
867 		lifetime->sadb_lifetime_len =
868 			sizeof(struct sadb_lifetime)/sizeof(uint64_t);
869 		lifetime->sadb_lifetime_exttype = SADB_EXT_LIFETIME_HARD;
870 		lifetime->sadb_lifetime_allocations =  _X2KEY(x->lft.hard_packet_limit);
871 		lifetime->sadb_lifetime_bytes = _X2KEY(x->lft.hard_byte_limit);
872 		lifetime->sadb_lifetime_addtime = x->lft.hard_add_expires_seconds;
873 		lifetime->sadb_lifetime_usetime = x->lft.hard_use_expires_seconds;
874 	}
875 	/* soft time */
876 	if (hsc & 1) {
877 		lifetime = (struct sadb_lifetime *)  skb_put(skb,
878 							     sizeof(struct sadb_lifetime));
879 		lifetime->sadb_lifetime_len =
880 			sizeof(struct sadb_lifetime)/sizeof(uint64_t);
881 		lifetime->sadb_lifetime_exttype = SADB_EXT_LIFETIME_SOFT;
882 		lifetime->sadb_lifetime_allocations =  _X2KEY(x->lft.soft_packet_limit);
883 		lifetime->sadb_lifetime_bytes = _X2KEY(x->lft.soft_byte_limit);
884 		lifetime->sadb_lifetime_addtime = x->lft.soft_add_expires_seconds;
885 		lifetime->sadb_lifetime_usetime = x->lft.soft_use_expires_seconds;
886 	}
887 	/* current time */
888 	lifetime = (struct sadb_lifetime *)  skb_put(skb,
889 						     sizeof(struct sadb_lifetime));
890 	lifetime->sadb_lifetime_len =
891 		sizeof(struct sadb_lifetime)/sizeof(uint64_t);
892 	lifetime->sadb_lifetime_exttype = SADB_EXT_LIFETIME_CURRENT;
893 	lifetime->sadb_lifetime_allocations = x->curlft.packets;
894 	lifetime->sadb_lifetime_bytes = x->curlft.bytes;
895 	lifetime->sadb_lifetime_addtime = x->curlft.add_time;
896 	lifetime->sadb_lifetime_usetime = x->curlft.use_time;
897 	/* src address */
898 	addr = (struct sadb_address*) skb_put(skb,
899 					      sizeof(struct sadb_address)+sockaddr_size);
900 	addr->sadb_address_len =
901 		(sizeof(struct sadb_address)+sockaddr_size)/
902 			sizeof(uint64_t);
903 	addr->sadb_address_exttype = SADB_EXT_ADDRESS_SRC;
904 	/* "if the ports are non-zero, then the sadb_address_proto field,
905 	   normally zero, MUST be filled in with the transport
906 	   protocol's number." - RFC2367 */
907 	addr->sadb_address_proto = 0;
908 	addr->sadb_address_reserved = 0;
909 
910 	addr->sadb_address_prefixlen =
911 		pfkey_sockaddr_fill(&x->props.saddr, 0,
912 				    (struct sockaddr *) (addr + 1),
913 				    x->props.family);
914 	if (!addr->sadb_address_prefixlen)
915 		BUG();
916 
917 	/* dst address */
918 	addr = (struct sadb_address*) skb_put(skb,
919 					      sizeof(struct sadb_address)+sockaddr_size);
920 	addr->sadb_address_len =
921 		(sizeof(struct sadb_address)+sockaddr_size)/
922 			sizeof(uint64_t);
923 	addr->sadb_address_exttype = SADB_EXT_ADDRESS_DST;
924 	addr->sadb_address_proto = 0;
925 	addr->sadb_address_reserved = 0;
926 
927 	addr->sadb_address_prefixlen =
928 		pfkey_sockaddr_fill(&x->id.daddr, 0,
929 				    (struct sockaddr *) (addr + 1),
930 				    x->props.family);
931 	if (!addr->sadb_address_prefixlen)
932 		BUG();
933 
934 	if (!xfrm_addr_equal(&x->sel.saddr, &x->props.saddr,
935 			     x->props.family)) {
936 		addr = (struct sadb_address*) skb_put(skb,
937 			sizeof(struct sadb_address)+sockaddr_size);
938 		addr->sadb_address_len =
939 			(sizeof(struct sadb_address)+sockaddr_size)/
940 			sizeof(uint64_t);
941 		addr->sadb_address_exttype = SADB_EXT_ADDRESS_PROXY;
942 		addr->sadb_address_proto =
943 			pfkey_proto_from_xfrm(x->sel.proto);
944 		addr->sadb_address_prefixlen = x->sel.prefixlen_s;
945 		addr->sadb_address_reserved = 0;
946 
947 		pfkey_sockaddr_fill(&x->sel.saddr, x->sel.sport,
948 				    (struct sockaddr *) (addr + 1),
949 				    x->props.family);
950 	}
951 
952 	/* auth key */
953 	if (add_keys && auth_key_size) {
954 		key = (struct sadb_key *) skb_put(skb,
955 						  sizeof(struct sadb_key)+auth_key_size);
956 		key->sadb_key_len = (sizeof(struct sadb_key) + auth_key_size) /
957 			sizeof(uint64_t);
958 		key->sadb_key_exttype = SADB_EXT_KEY_AUTH;
959 		key->sadb_key_bits = x->aalg->alg_key_len;
960 		key->sadb_key_reserved = 0;
961 		memcpy(key + 1, x->aalg->alg_key, (x->aalg->alg_key_len+7)/8);
962 	}
963 	/* encrypt key */
964 	if (add_keys && encrypt_key_size) {
965 		key = (struct sadb_key *) skb_put(skb,
966 						  sizeof(struct sadb_key)+encrypt_key_size);
967 		key->sadb_key_len = (sizeof(struct sadb_key) +
968 				     encrypt_key_size) / sizeof(uint64_t);
969 		key->sadb_key_exttype = SADB_EXT_KEY_ENCRYPT;
970 		key->sadb_key_bits = x->ealg->alg_key_len;
971 		key->sadb_key_reserved = 0;
972 		memcpy(key + 1, x->ealg->alg_key,
973 		       (x->ealg->alg_key_len+7)/8);
974 	}
975 
976 	/* sa */
977 	sa2 = (struct sadb_x_sa2 *)  skb_put(skb, sizeof(struct sadb_x_sa2));
978 	sa2->sadb_x_sa2_len = sizeof(struct sadb_x_sa2)/sizeof(uint64_t);
979 	sa2->sadb_x_sa2_exttype = SADB_X_EXT_SA2;
980 	if ((mode = pfkey_mode_from_xfrm(x->props.mode)) < 0) {
981 		kfree_skb(skb);
982 		return ERR_PTR(-EINVAL);
983 	}
984 	sa2->sadb_x_sa2_mode = mode;
985 	sa2->sadb_x_sa2_reserved1 = 0;
986 	sa2->sadb_x_sa2_reserved2 = 0;
987 	sa2->sadb_x_sa2_sequence = 0;
988 	sa2->sadb_x_sa2_reqid = x->props.reqid;
989 
990 	if (natt && natt->encap_type) {
991 		struct sadb_x_nat_t_type *n_type;
992 		struct sadb_x_nat_t_port *n_port;
993 
994 		/* type */
995 		n_type = (struct sadb_x_nat_t_type*) skb_put(skb, sizeof(*n_type));
996 		n_type->sadb_x_nat_t_type_len = sizeof(*n_type)/sizeof(uint64_t);
997 		n_type->sadb_x_nat_t_type_exttype = SADB_X_EXT_NAT_T_TYPE;
998 		n_type->sadb_x_nat_t_type_type = natt->encap_type;
999 		n_type->sadb_x_nat_t_type_reserved[0] = 0;
1000 		n_type->sadb_x_nat_t_type_reserved[1] = 0;
1001 		n_type->sadb_x_nat_t_type_reserved[2] = 0;
1002 
1003 		/* source port */
1004 		n_port = (struct sadb_x_nat_t_port*) skb_put(skb, sizeof (*n_port));
1005 		n_port->sadb_x_nat_t_port_len = sizeof(*n_port)/sizeof(uint64_t);
1006 		n_port->sadb_x_nat_t_port_exttype = SADB_X_EXT_NAT_T_SPORT;
1007 		n_port->sadb_x_nat_t_port_port = natt->encap_sport;
1008 		n_port->sadb_x_nat_t_port_reserved = 0;
1009 
1010 		/* dest port */
1011 		n_port = (struct sadb_x_nat_t_port*) skb_put(skb, sizeof (*n_port));
1012 		n_port->sadb_x_nat_t_port_len = sizeof(*n_port)/sizeof(uint64_t);
1013 		n_port->sadb_x_nat_t_port_exttype = SADB_X_EXT_NAT_T_DPORT;
1014 		n_port->sadb_x_nat_t_port_port = natt->encap_dport;
1015 		n_port->sadb_x_nat_t_port_reserved = 0;
1016 	}
1017 
1018 	/* security context */
1019 	if (xfrm_ctx) {
1020 		sec_ctx = (struct sadb_x_sec_ctx *) skb_put(skb,
1021 				sizeof(struct sadb_x_sec_ctx) + ctx_size);
1022 		sec_ctx->sadb_x_sec_len =
1023 		  (sizeof(struct sadb_x_sec_ctx) + ctx_size) / sizeof(uint64_t);
1024 		sec_ctx->sadb_x_sec_exttype = SADB_X_EXT_SEC_CTX;
1025 		sec_ctx->sadb_x_ctx_doi = xfrm_ctx->ctx_doi;
1026 		sec_ctx->sadb_x_ctx_alg = xfrm_ctx->ctx_alg;
1027 		sec_ctx->sadb_x_ctx_len = xfrm_ctx->ctx_len;
1028 		memcpy(sec_ctx + 1, xfrm_ctx->ctx_str,
1029 		       xfrm_ctx->ctx_len);
1030 	}
1031 
1032 	return skb;
1033 }
1034 
1035 
1036 static inline struct sk_buff *pfkey_xfrm_state2msg(const struct xfrm_state *x)
1037 {
1038 	struct sk_buff *skb;
1039 
1040 	skb = __pfkey_xfrm_state2msg(x, 1, 3);
1041 
1042 	return skb;
1043 }
1044 
1045 static inline struct sk_buff *pfkey_xfrm_state2msg_expire(const struct xfrm_state *x,
1046 							  int hsc)
1047 {
1048 	return __pfkey_xfrm_state2msg(x, 0, hsc);
1049 }
1050 
1051 static struct xfrm_state * pfkey_msg2xfrm_state(struct net *net,
1052 						const struct sadb_msg *hdr,
1053 						void * const *ext_hdrs)
1054 {
1055 	struct xfrm_state *x;
1056 	const struct sadb_lifetime *lifetime;
1057 	const struct sadb_sa *sa;
1058 	const struct sadb_key *key;
1059 	const struct sadb_x_sec_ctx *sec_ctx;
1060 	uint16_t proto;
1061 	int err;
1062 
1063 
1064 	sa = ext_hdrs[SADB_EXT_SA - 1];
1065 	if (!sa ||
1066 	    !present_and_same_family(ext_hdrs[SADB_EXT_ADDRESS_SRC-1],
1067 				     ext_hdrs[SADB_EXT_ADDRESS_DST-1]))
1068 		return ERR_PTR(-EINVAL);
1069 	if (hdr->sadb_msg_satype == SADB_SATYPE_ESP &&
1070 	    !ext_hdrs[SADB_EXT_KEY_ENCRYPT-1])
1071 		return ERR_PTR(-EINVAL);
1072 	if (hdr->sadb_msg_satype == SADB_SATYPE_AH &&
1073 	    !ext_hdrs[SADB_EXT_KEY_AUTH-1])
1074 		return ERR_PTR(-EINVAL);
1075 	if (!!ext_hdrs[SADB_EXT_LIFETIME_HARD-1] !=
1076 	    !!ext_hdrs[SADB_EXT_LIFETIME_SOFT-1])
1077 		return ERR_PTR(-EINVAL);
1078 
1079 	proto = pfkey_satype2proto(hdr->sadb_msg_satype);
1080 	if (proto == 0)
1081 		return ERR_PTR(-EINVAL);
1082 
1083 	/* default error is no buffer space */
1084 	err = -ENOBUFS;
1085 
1086 	/* RFC2367:
1087 
1088    Only SADB_SASTATE_MATURE SAs may be submitted in an SADB_ADD message.
1089    SADB_SASTATE_LARVAL SAs are created by SADB_GETSPI and it is not
1090    sensible to add a new SA in the DYING or SADB_SASTATE_DEAD state.
1091    Therefore, the sadb_sa_state field of all submitted SAs MUST be
1092    SADB_SASTATE_MATURE and the kernel MUST return an error if this is
1093    not true.
1094 
1095 	   However, KAME setkey always uses SADB_SASTATE_LARVAL.
1096 	   Hence, we have to _ignore_ sadb_sa_state, which is also reasonable.
1097 	 */
1098 	if (sa->sadb_sa_auth > SADB_AALG_MAX ||
1099 	    (hdr->sadb_msg_satype == SADB_X_SATYPE_IPCOMP &&
1100 	     sa->sadb_sa_encrypt > SADB_X_CALG_MAX) ||
1101 	    sa->sadb_sa_encrypt > SADB_EALG_MAX)
1102 		return ERR_PTR(-EINVAL);
1103 	key = ext_hdrs[SADB_EXT_KEY_AUTH - 1];
1104 	if (key != NULL &&
1105 	    sa->sadb_sa_auth != SADB_X_AALG_NULL &&
1106 	    ((key->sadb_key_bits+7) / 8 == 0 ||
1107 	     (key->sadb_key_bits+7) / 8 > key->sadb_key_len * sizeof(uint64_t)))
1108 		return ERR_PTR(-EINVAL);
1109 	key = ext_hdrs[SADB_EXT_KEY_ENCRYPT-1];
1110 	if (key != NULL &&
1111 	    sa->sadb_sa_encrypt != SADB_EALG_NULL &&
1112 	    ((key->sadb_key_bits+7) / 8 == 0 ||
1113 	     (key->sadb_key_bits+7) / 8 > key->sadb_key_len * sizeof(uint64_t)))
1114 		return ERR_PTR(-EINVAL);
1115 
1116 	x = xfrm_state_alloc(net);
1117 	if (x == NULL)
1118 		return ERR_PTR(-ENOBUFS);
1119 
1120 	x->id.proto = proto;
1121 	x->id.spi = sa->sadb_sa_spi;
1122 	x->props.replay_window = min_t(unsigned int, sa->sadb_sa_replay,
1123 					(sizeof(x->replay.bitmap) * 8));
1124 	if (sa->sadb_sa_flags & SADB_SAFLAGS_NOECN)
1125 		x->props.flags |= XFRM_STATE_NOECN;
1126 	if (sa->sadb_sa_flags & SADB_SAFLAGS_DECAP_DSCP)
1127 		x->props.flags |= XFRM_STATE_DECAP_DSCP;
1128 	if (sa->sadb_sa_flags & SADB_SAFLAGS_NOPMTUDISC)
1129 		x->props.flags |= XFRM_STATE_NOPMTUDISC;
1130 
1131 	lifetime = ext_hdrs[SADB_EXT_LIFETIME_HARD - 1];
1132 	if (lifetime != NULL) {
1133 		x->lft.hard_packet_limit = _KEY2X(lifetime->sadb_lifetime_allocations);
1134 		x->lft.hard_byte_limit = _KEY2X(lifetime->sadb_lifetime_bytes);
1135 		x->lft.hard_add_expires_seconds = lifetime->sadb_lifetime_addtime;
1136 		x->lft.hard_use_expires_seconds = lifetime->sadb_lifetime_usetime;
1137 	}
1138 	lifetime = ext_hdrs[SADB_EXT_LIFETIME_SOFT - 1];
1139 	if (lifetime != NULL) {
1140 		x->lft.soft_packet_limit = _KEY2X(lifetime->sadb_lifetime_allocations);
1141 		x->lft.soft_byte_limit = _KEY2X(lifetime->sadb_lifetime_bytes);
1142 		x->lft.soft_add_expires_seconds = lifetime->sadb_lifetime_addtime;
1143 		x->lft.soft_use_expires_seconds = lifetime->sadb_lifetime_usetime;
1144 	}
1145 
1146 	sec_ctx = ext_hdrs[SADB_X_EXT_SEC_CTX - 1];
1147 	if (sec_ctx != NULL) {
1148 		struct xfrm_user_sec_ctx *uctx = pfkey_sadb2xfrm_user_sec_ctx(sec_ctx, GFP_KERNEL);
1149 
1150 		if (!uctx)
1151 			goto out;
1152 
1153 		err = security_xfrm_state_alloc(x, uctx);
1154 		kfree(uctx);
1155 
1156 		if (err)
1157 			goto out;
1158 	}
1159 
1160 	err = -ENOBUFS;
1161 	key = ext_hdrs[SADB_EXT_KEY_AUTH - 1];
1162 	if (sa->sadb_sa_auth) {
1163 		int keysize = 0;
1164 		struct xfrm_algo_desc *a = xfrm_aalg_get_byid(sa->sadb_sa_auth);
1165 		if (!a || !a->pfkey_supported) {
1166 			err = -ENOSYS;
1167 			goto out;
1168 		}
1169 		if (key)
1170 			keysize = (key->sadb_key_bits + 7) / 8;
1171 		x->aalg = kmalloc(sizeof(*x->aalg) + keysize, GFP_KERNEL);
1172 		if (!x->aalg) {
1173 			err = -ENOMEM;
1174 			goto out;
1175 		}
1176 		strcpy(x->aalg->alg_name, a->name);
1177 		x->aalg->alg_key_len = 0;
1178 		if (key) {
1179 			x->aalg->alg_key_len = key->sadb_key_bits;
1180 			memcpy(x->aalg->alg_key, key+1, keysize);
1181 		}
1182 		x->aalg->alg_trunc_len = a->uinfo.auth.icv_truncbits;
1183 		x->props.aalgo = sa->sadb_sa_auth;
1184 		/* x->algo.flags = sa->sadb_sa_flags; */
1185 	}
1186 	if (sa->sadb_sa_encrypt) {
1187 		if (hdr->sadb_msg_satype == SADB_X_SATYPE_IPCOMP) {
1188 			struct xfrm_algo_desc *a = xfrm_calg_get_byid(sa->sadb_sa_encrypt);
1189 			if (!a || !a->pfkey_supported) {
1190 				err = -ENOSYS;
1191 				goto out;
1192 			}
1193 			x->calg = kmalloc(sizeof(*x->calg), GFP_KERNEL);
1194 			if (!x->calg) {
1195 				err = -ENOMEM;
1196 				goto out;
1197 			}
1198 			strcpy(x->calg->alg_name, a->name);
1199 			x->props.calgo = sa->sadb_sa_encrypt;
1200 		} else {
1201 			int keysize = 0;
1202 			struct xfrm_algo_desc *a = xfrm_ealg_get_byid(sa->sadb_sa_encrypt);
1203 			if (!a || !a->pfkey_supported) {
1204 				err = -ENOSYS;
1205 				goto out;
1206 			}
1207 			key = (struct sadb_key*) ext_hdrs[SADB_EXT_KEY_ENCRYPT-1];
1208 			if (key)
1209 				keysize = (key->sadb_key_bits + 7) / 8;
1210 			x->ealg = kmalloc(sizeof(*x->ealg) + keysize, GFP_KERNEL);
1211 			if (!x->ealg) {
1212 				err = -ENOMEM;
1213 				goto out;
1214 			}
1215 			strcpy(x->ealg->alg_name, a->name);
1216 			x->ealg->alg_key_len = 0;
1217 			if (key) {
1218 				x->ealg->alg_key_len = key->sadb_key_bits;
1219 				memcpy(x->ealg->alg_key, key+1, keysize);
1220 			}
1221 			x->props.ealgo = sa->sadb_sa_encrypt;
1222 			x->geniv = a->uinfo.encr.geniv;
1223 		}
1224 	}
1225 	/* x->algo.flags = sa->sadb_sa_flags; */
1226 
1227 	x->props.family = pfkey_sadb_addr2xfrm_addr((struct sadb_address *) ext_hdrs[SADB_EXT_ADDRESS_SRC-1],
1228 						    &x->props.saddr);
1229 	pfkey_sadb_addr2xfrm_addr((struct sadb_address *) ext_hdrs[SADB_EXT_ADDRESS_DST-1],
1230 				  &x->id.daddr);
1231 
1232 	if (ext_hdrs[SADB_X_EXT_SA2-1]) {
1233 		const struct sadb_x_sa2 *sa2 = ext_hdrs[SADB_X_EXT_SA2-1];
1234 		int mode = pfkey_mode_to_xfrm(sa2->sadb_x_sa2_mode);
1235 		if (mode < 0) {
1236 			err = -EINVAL;
1237 			goto out;
1238 		}
1239 		x->props.mode = mode;
1240 		x->props.reqid = sa2->sadb_x_sa2_reqid;
1241 	}
1242 
1243 	if (ext_hdrs[SADB_EXT_ADDRESS_PROXY-1]) {
1244 		const struct sadb_address *addr = ext_hdrs[SADB_EXT_ADDRESS_PROXY-1];
1245 
1246 		/* Nobody uses this, but we try. */
1247 		x->sel.family = pfkey_sadb_addr2xfrm_addr(addr, &x->sel.saddr);
1248 		x->sel.prefixlen_s = addr->sadb_address_prefixlen;
1249 	}
1250 
1251 	if (!x->sel.family)
1252 		x->sel.family = x->props.family;
1253 
1254 	if (ext_hdrs[SADB_X_EXT_NAT_T_TYPE-1]) {
1255 		const struct sadb_x_nat_t_type* n_type;
1256 		struct xfrm_encap_tmpl *natt;
1257 
1258 		x->encap = kmalloc(sizeof(*x->encap), GFP_KERNEL);
1259 		if (!x->encap) {
1260 			err = -ENOMEM;
1261 			goto out;
1262 		}
1263 
1264 		natt = x->encap;
1265 		n_type = ext_hdrs[SADB_X_EXT_NAT_T_TYPE-1];
1266 		natt->encap_type = n_type->sadb_x_nat_t_type_type;
1267 
1268 		if (ext_hdrs[SADB_X_EXT_NAT_T_SPORT-1]) {
1269 			const struct sadb_x_nat_t_port *n_port =
1270 				ext_hdrs[SADB_X_EXT_NAT_T_SPORT-1];
1271 			natt->encap_sport = n_port->sadb_x_nat_t_port_port;
1272 		}
1273 		if (ext_hdrs[SADB_X_EXT_NAT_T_DPORT-1]) {
1274 			const struct sadb_x_nat_t_port *n_port =
1275 				ext_hdrs[SADB_X_EXT_NAT_T_DPORT-1];
1276 			natt->encap_dport = n_port->sadb_x_nat_t_port_port;
1277 		}
1278 		memset(&natt->encap_oa, 0, sizeof(natt->encap_oa));
1279 	}
1280 
1281 	err = xfrm_init_state(x);
1282 	if (err)
1283 		goto out;
1284 
1285 	x->km.seq = hdr->sadb_msg_seq;
1286 	return x;
1287 
1288 out:
1289 	x->km.state = XFRM_STATE_DEAD;
1290 	xfrm_state_put(x);
1291 	return ERR_PTR(err);
1292 }
1293 
1294 static int pfkey_reserved(struct sock *sk, struct sk_buff *skb, const struct sadb_msg *hdr, void * const *ext_hdrs)
1295 {
1296 	return -EOPNOTSUPP;
1297 }
1298 
1299 static int pfkey_getspi(struct sock *sk, struct sk_buff *skb, const struct sadb_msg *hdr, void * const *ext_hdrs)
1300 {
1301 	struct net *net = sock_net(sk);
1302 	struct sk_buff *resp_skb;
1303 	struct sadb_x_sa2 *sa2;
1304 	struct sadb_address *saddr, *daddr;
1305 	struct sadb_msg *out_hdr;
1306 	struct sadb_spirange *range;
1307 	struct xfrm_state *x = NULL;
1308 	int mode;
1309 	int err;
1310 	u32 min_spi, max_spi;
1311 	u32 reqid;
1312 	u8 proto;
1313 	unsigned short family;
1314 	xfrm_address_t *xsaddr = NULL, *xdaddr = NULL;
1315 
1316 	if (!present_and_same_family(ext_hdrs[SADB_EXT_ADDRESS_SRC-1],
1317 				     ext_hdrs[SADB_EXT_ADDRESS_DST-1]))
1318 		return -EINVAL;
1319 
1320 	proto = pfkey_satype2proto(hdr->sadb_msg_satype);
1321 	if (proto == 0)
1322 		return -EINVAL;
1323 
1324 	if ((sa2 = ext_hdrs[SADB_X_EXT_SA2-1]) != NULL) {
1325 		mode = pfkey_mode_to_xfrm(sa2->sadb_x_sa2_mode);
1326 		if (mode < 0)
1327 			return -EINVAL;
1328 		reqid = sa2->sadb_x_sa2_reqid;
1329 	} else {
1330 		mode = 0;
1331 		reqid = 0;
1332 	}
1333 
1334 	saddr = ext_hdrs[SADB_EXT_ADDRESS_SRC-1];
1335 	daddr = ext_hdrs[SADB_EXT_ADDRESS_DST-1];
1336 
1337 	family = ((struct sockaddr *)(saddr + 1))->sa_family;
1338 	switch (family) {
1339 	case AF_INET:
1340 		xdaddr = (xfrm_address_t *)&((struct sockaddr_in *)(daddr + 1))->sin_addr.s_addr;
1341 		xsaddr = (xfrm_address_t *)&((struct sockaddr_in *)(saddr + 1))->sin_addr.s_addr;
1342 		break;
1343 #if IS_ENABLED(CONFIG_IPV6)
1344 	case AF_INET6:
1345 		xdaddr = (xfrm_address_t *)&((struct sockaddr_in6 *)(daddr + 1))->sin6_addr;
1346 		xsaddr = (xfrm_address_t *)&((struct sockaddr_in6 *)(saddr + 1))->sin6_addr;
1347 		break;
1348 #endif
1349 	}
1350 
1351 	if (hdr->sadb_msg_seq) {
1352 		x = xfrm_find_acq_byseq(net, DUMMY_MARK, hdr->sadb_msg_seq);
1353 		if (x && !xfrm_addr_equal(&x->id.daddr, xdaddr, family)) {
1354 			xfrm_state_put(x);
1355 			x = NULL;
1356 		}
1357 	}
1358 
1359 	if (!x)
1360 		x = xfrm_find_acq(net, &dummy_mark, mode, reqid, proto, xdaddr, xsaddr, 1, family);
1361 
1362 	if (x == NULL)
1363 		return -ENOENT;
1364 
1365 	min_spi = 0x100;
1366 	max_spi = 0x0fffffff;
1367 
1368 	range = ext_hdrs[SADB_EXT_SPIRANGE-1];
1369 	if (range) {
1370 		min_spi = range->sadb_spirange_min;
1371 		max_spi = range->sadb_spirange_max;
1372 	}
1373 
1374 	err = verify_spi_info(x->id.proto, min_spi, max_spi);
1375 	if (err) {
1376 		xfrm_state_put(x);
1377 		return err;
1378 	}
1379 
1380 	err = xfrm_alloc_spi(x, min_spi, max_spi);
1381 	resp_skb = err ? ERR_PTR(err) : pfkey_xfrm_state2msg(x);
1382 
1383 	if (IS_ERR(resp_skb)) {
1384 		xfrm_state_put(x);
1385 		return  PTR_ERR(resp_skb);
1386 	}
1387 
1388 	out_hdr = (struct sadb_msg *) resp_skb->data;
1389 	out_hdr->sadb_msg_version = hdr->sadb_msg_version;
1390 	out_hdr->sadb_msg_type = SADB_GETSPI;
1391 	out_hdr->sadb_msg_satype = pfkey_proto2satype(proto);
1392 	out_hdr->sadb_msg_errno = 0;
1393 	out_hdr->sadb_msg_reserved = 0;
1394 	out_hdr->sadb_msg_seq = hdr->sadb_msg_seq;
1395 	out_hdr->sadb_msg_pid = hdr->sadb_msg_pid;
1396 
1397 	xfrm_state_put(x);
1398 
1399 	pfkey_broadcast(resp_skb, BROADCAST_ONE, sk, net);
1400 
1401 	return 0;
1402 }
1403 
1404 static int pfkey_acquire(struct sock *sk, struct sk_buff *skb, const struct sadb_msg *hdr, void * const *ext_hdrs)
1405 {
1406 	struct net *net = sock_net(sk);
1407 	struct xfrm_state *x;
1408 
1409 	if (hdr->sadb_msg_len != sizeof(struct sadb_msg)/8)
1410 		return -EOPNOTSUPP;
1411 
1412 	if (hdr->sadb_msg_seq == 0 || hdr->sadb_msg_errno == 0)
1413 		return 0;
1414 
1415 	x = xfrm_find_acq_byseq(net, DUMMY_MARK, hdr->sadb_msg_seq);
1416 	if (x == NULL)
1417 		return 0;
1418 
1419 	spin_lock_bh(&x->lock);
1420 	if (x->km.state == XFRM_STATE_ACQ)
1421 		x->km.state = XFRM_STATE_ERROR;
1422 
1423 	spin_unlock_bh(&x->lock);
1424 	xfrm_state_put(x);
1425 	return 0;
1426 }
1427 
1428 static inline int event2poltype(int event)
1429 {
1430 	switch (event) {
1431 	case XFRM_MSG_DELPOLICY:
1432 		return SADB_X_SPDDELETE;
1433 	case XFRM_MSG_NEWPOLICY:
1434 		return SADB_X_SPDADD;
1435 	case XFRM_MSG_UPDPOLICY:
1436 		return SADB_X_SPDUPDATE;
1437 	case XFRM_MSG_POLEXPIRE:
1438 	//	return SADB_X_SPDEXPIRE;
1439 	default:
1440 		pr_err("pfkey: Unknown policy event %d\n", event);
1441 		break;
1442 	}
1443 
1444 	return 0;
1445 }
1446 
1447 static inline int event2keytype(int event)
1448 {
1449 	switch (event) {
1450 	case XFRM_MSG_DELSA:
1451 		return SADB_DELETE;
1452 	case XFRM_MSG_NEWSA:
1453 		return SADB_ADD;
1454 	case XFRM_MSG_UPDSA:
1455 		return SADB_UPDATE;
1456 	case XFRM_MSG_EXPIRE:
1457 		return SADB_EXPIRE;
1458 	default:
1459 		pr_err("pfkey: Unknown SA event %d\n", event);
1460 		break;
1461 	}
1462 
1463 	return 0;
1464 }
1465 
1466 /* ADD/UPD/DEL */
1467 static int key_notify_sa(struct xfrm_state *x, const struct km_event *c)
1468 {
1469 	struct sk_buff *skb;
1470 	struct sadb_msg *hdr;
1471 
1472 	skb = pfkey_xfrm_state2msg(x);
1473 
1474 	if (IS_ERR(skb))
1475 		return PTR_ERR(skb);
1476 
1477 	hdr = (struct sadb_msg *) skb->data;
1478 	hdr->sadb_msg_version = PF_KEY_V2;
1479 	hdr->sadb_msg_type = event2keytype(c->event);
1480 	hdr->sadb_msg_satype = pfkey_proto2satype(x->id.proto);
1481 	hdr->sadb_msg_errno = 0;
1482 	hdr->sadb_msg_reserved = 0;
1483 	hdr->sadb_msg_seq = c->seq;
1484 	hdr->sadb_msg_pid = c->portid;
1485 
1486 	pfkey_broadcast(skb, BROADCAST_ALL, NULL, xs_net(x));
1487 
1488 	return 0;
1489 }
1490 
1491 static int pfkey_add(struct sock *sk, struct sk_buff *skb, const struct sadb_msg *hdr, void * const *ext_hdrs)
1492 {
1493 	struct net *net = sock_net(sk);
1494 	struct xfrm_state *x;
1495 	int err;
1496 	struct km_event c;
1497 
1498 	x = pfkey_msg2xfrm_state(net, hdr, ext_hdrs);
1499 	if (IS_ERR(x))
1500 		return PTR_ERR(x);
1501 
1502 	xfrm_state_hold(x);
1503 	if (hdr->sadb_msg_type == SADB_ADD)
1504 		err = xfrm_state_add(x);
1505 	else
1506 		err = xfrm_state_update(x);
1507 
1508 	xfrm_audit_state_add(x, err ? 0 : 1, true);
1509 
1510 	if (err < 0) {
1511 		x->km.state = XFRM_STATE_DEAD;
1512 		__xfrm_state_put(x);
1513 		goto out;
1514 	}
1515 
1516 	if (hdr->sadb_msg_type == SADB_ADD)
1517 		c.event = XFRM_MSG_NEWSA;
1518 	else
1519 		c.event = XFRM_MSG_UPDSA;
1520 	c.seq = hdr->sadb_msg_seq;
1521 	c.portid = hdr->sadb_msg_pid;
1522 	km_state_notify(x, &c);
1523 out:
1524 	xfrm_state_put(x);
1525 	return err;
1526 }
1527 
1528 static int pfkey_delete(struct sock *sk, struct sk_buff *skb, const struct sadb_msg *hdr, void * const *ext_hdrs)
1529 {
1530 	struct net *net = sock_net(sk);
1531 	struct xfrm_state *x;
1532 	struct km_event c;
1533 	int err;
1534 
1535 	if (!ext_hdrs[SADB_EXT_SA-1] ||
1536 	    !present_and_same_family(ext_hdrs[SADB_EXT_ADDRESS_SRC-1],
1537 				     ext_hdrs[SADB_EXT_ADDRESS_DST-1]))
1538 		return -EINVAL;
1539 
1540 	x = pfkey_xfrm_state_lookup(net, hdr, ext_hdrs);
1541 	if (x == NULL)
1542 		return -ESRCH;
1543 
1544 	if ((err = security_xfrm_state_delete(x)))
1545 		goto out;
1546 
1547 	if (xfrm_state_kern(x)) {
1548 		err = -EPERM;
1549 		goto out;
1550 	}
1551 
1552 	err = xfrm_state_delete(x);
1553 
1554 	if (err < 0)
1555 		goto out;
1556 
1557 	c.seq = hdr->sadb_msg_seq;
1558 	c.portid = hdr->sadb_msg_pid;
1559 	c.event = XFRM_MSG_DELSA;
1560 	km_state_notify(x, &c);
1561 out:
1562 	xfrm_audit_state_delete(x, err ? 0 : 1, true);
1563 	xfrm_state_put(x);
1564 
1565 	return err;
1566 }
1567 
1568 static int pfkey_get(struct sock *sk, struct sk_buff *skb, const struct sadb_msg *hdr, void * const *ext_hdrs)
1569 {
1570 	struct net *net = sock_net(sk);
1571 	__u8 proto;
1572 	struct sk_buff *out_skb;
1573 	struct sadb_msg *out_hdr;
1574 	struct xfrm_state *x;
1575 
1576 	if (!ext_hdrs[SADB_EXT_SA-1] ||
1577 	    !present_and_same_family(ext_hdrs[SADB_EXT_ADDRESS_SRC-1],
1578 				     ext_hdrs[SADB_EXT_ADDRESS_DST-1]))
1579 		return -EINVAL;
1580 
1581 	x = pfkey_xfrm_state_lookup(net, hdr, ext_hdrs);
1582 	if (x == NULL)
1583 		return -ESRCH;
1584 
1585 	out_skb = pfkey_xfrm_state2msg(x);
1586 	proto = x->id.proto;
1587 	xfrm_state_put(x);
1588 	if (IS_ERR(out_skb))
1589 		return  PTR_ERR(out_skb);
1590 
1591 	out_hdr = (struct sadb_msg *) out_skb->data;
1592 	out_hdr->sadb_msg_version = hdr->sadb_msg_version;
1593 	out_hdr->sadb_msg_type = SADB_GET;
1594 	out_hdr->sadb_msg_satype = pfkey_proto2satype(proto);
1595 	out_hdr->sadb_msg_errno = 0;
1596 	out_hdr->sadb_msg_reserved = 0;
1597 	out_hdr->sadb_msg_seq = hdr->sadb_msg_seq;
1598 	out_hdr->sadb_msg_pid = hdr->sadb_msg_pid;
1599 	pfkey_broadcast(out_skb, BROADCAST_ONE, sk, sock_net(sk));
1600 
1601 	return 0;
1602 }
1603 
1604 static struct sk_buff *compose_sadb_supported(const struct sadb_msg *orig,
1605 					      gfp_t allocation)
1606 {
1607 	struct sk_buff *skb;
1608 	struct sadb_msg *hdr;
1609 	int len, auth_len, enc_len, i;
1610 
1611 	auth_len = xfrm_count_pfkey_auth_supported();
1612 	if (auth_len) {
1613 		auth_len *= sizeof(struct sadb_alg);
1614 		auth_len += sizeof(struct sadb_supported);
1615 	}
1616 
1617 	enc_len = xfrm_count_pfkey_enc_supported();
1618 	if (enc_len) {
1619 		enc_len *= sizeof(struct sadb_alg);
1620 		enc_len += sizeof(struct sadb_supported);
1621 	}
1622 
1623 	len = enc_len + auth_len + sizeof(struct sadb_msg);
1624 
1625 	skb = alloc_skb(len + 16, allocation);
1626 	if (!skb)
1627 		goto out_put_algs;
1628 
1629 	hdr = (struct sadb_msg *) skb_put(skb, sizeof(*hdr));
1630 	pfkey_hdr_dup(hdr, orig);
1631 	hdr->sadb_msg_errno = 0;
1632 	hdr->sadb_msg_len = len / sizeof(uint64_t);
1633 
1634 	if (auth_len) {
1635 		struct sadb_supported *sp;
1636 		struct sadb_alg *ap;
1637 
1638 		sp = (struct sadb_supported *) skb_put(skb, auth_len);
1639 		ap = (struct sadb_alg *) (sp + 1);
1640 
1641 		sp->sadb_supported_len = auth_len / sizeof(uint64_t);
1642 		sp->sadb_supported_exttype = SADB_EXT_SUPPORTED_AUTH;
1643 
1644 		for (i = 0; ; i++) {
1645 			struct xfrm_algo_desc *aalg = xfrm_aalg_get_byidx(i);
1646 			if (!aalg)
1647 				break;
1648 			if (!aalg->pfkey_supported)
1649 				continue;
1650 			if (aalg->available)
1651 				*ap++ = aalg->desc;
1652 		}
1653 	}
1654 
1655 	if (enc_len) {
1656 		struct sadb_supported *sp;
1657 		struct sadb_alg *ap;
1658 
1659 		sp = (struct sadb_supported *) skb_put(skb, enc_len);
1660 		ap = (struct sadb_alg *) (sp + 1);
1661 
1662 		sp->sadb_supported_len = enc_len / sizeof(uint64_t);
1663 		sp->sadb_supported_exttype = SADB_EXT_SUPPORTED_ENCRYPT;
1664 
1665 		for (i = 0; ; i++) {
1666 			struct xfrm_algo_desc *ealg = xfrm_ealg_get_byidx(i);
1667 			if (!ealg)
1668 				break;
1669 			if (!ealg->pfkey_supported)
1670 				continue;
1671 			if (ealg->available)
1672 				*ap++ = ealg->desc;
1673 		}
1674 	}
1675 
1676 out_put_algs:
1677 	return skb;
1678 }
1679 
1680 static int pfkey_register(struct sock *sk, struct sk_buff *skb, const struct sadb_msg *hdr, void * const *ext_hdrs)
1681 {
1682 	struct pfkey_sock *pfk = pfkey_sk(sk);
1683 	struct sk_buff *supp_skb;
1684 
1685 	if (hdr->sadb_msg_satype > SADB_SATYPE_MAX)
1686 		return -EINVAL;
1687 
1688 	if (hdr->sadb_msg_satype != SADB_SATYPE_UNSPEC) {
1689 		if (pfk->registered&(1<<hdr->sadb_msg_satype))
1690 			return -EEXIST;
1691 		pfk->registered |= (1<<hdr->sadb_msg_satype);
1692 	}
1693 
1694 	xfrm_probe_algs();
1695 
1696 	supp_skb = compose_sadb_supported(hdr, GFP_KERNEL);
1697 	if (!supp_skb) {
1698 		if (hdr->sadb_msg_satype != SADB_SATYPE_UNSPEC)
1699 			pfk->registered &= ~(1<<hdr->sadb_msg_satype);
1700 
1701 		return -ENOBUFS;
1702 	}
1703 
1704 	pfkey_broadcast(supp_skb, BROADCAST_REGISTERED, sk, sock_net(sk));
1705 
1706 	return 0;
1707 }
1708 
1709 static int unicast_flush_resp(struct sock *sk, const struct sadb_msg *ihdr)
1710 {
1711 	struct sk_buff *skb;
1712 	struct sadb_msg *hdr;
1713 
1714 	skb = alloc_skb(sizeof(struct sadb_msg) + 16, GFP_ATOMIC);
1715 	if (!skb)
1716 		return -ENOBUFS;
1717 
1718 	hdr = (struct sadb_msg *) skb_put(skb, sizeof(struct sadb_msg));
1719 	memcpy(hdr, ihdr, sizeof(struct sadb_msg));
1720 	hdr->sadb_msg_errno = (uint8_t) 0;
1721 	hdr->sadb_msg_len = (sizeof(struct sadb_msg) / sizeof(uint64_t));
1722 
1723 	return pfkey_broadcast(skb, BROADCAST_ONE, sk, sock_net(sk));
1724 }
1725 
1726 static int key_notify_sa_flush(const struct km_event *c)
1727 {
1728 	struct sk_buff *skb;
1729 	struct sadb_msg *hdr;
1730 
1731 	skb = alloc_skb(sizeof(struct sadb_msg) + 16, GFP_ATOMIC);
1732 	if (!skb)
1733 		return -ENOBUFS;
1734 	hdr = (struct sadb_msg *) skb_put(skb, sizeof(struct sadb_msg));
1735 	hdr->sadb_msg_satype = pfkey_proto2satype(c->data.proto);
1736 	hdr->sadb_msg_type = SADB_FLUSH;
1737 	hdr->sadb_msg_seq = c->seq;
1738 	hdr->sadb_msg_pid = c->portid;
1739 	hdr->sadb_msg_version = PF_KEY_V2;
1740 	hdr->sadb_msg_errno = (uint8_t) 0;
1741 	hdr->sadb_msg_len = (sizeof(struct sadb_msg) / sizeof(uint64_t));
1742 	hdr->sadb_msg_reserved = 0;
1743 
1744 	pfkey_broadcast(skb, BROADCAST_ALL, NULL, c->net);
1745 
1746 	return 0;
1747 }
1748 
1749 static int pfkey_flush(struct sock *sk, struct sk_buff *skb, const struct sadb_msg *hdr, void * const *ext_hdrs)
1750 {
1751 	struct net *net = sock_net(sk);
1752 	unsigned int proto;
1753 	struct km_event c;
1754 	int err, err2;
1755 
1756 	proto = pfkey_satype2proto(hdr->sadb_msg_satype);
1757 	if (proto == 0)
1758 		return -EINVAL;
1759 
1760 	err = xfrm_state_flush(net, proto, true);
1761 	err2 = unicast_flush_resp(sk, hdr);
1762 	if (err || err2) {
1763 		if (err == -ESRCH) /* empty table - go quietly */
1764 			err = 0;
1765 		return err ? err : err2;
1766 	}
1767 
1768 	c.data.proto = proto;
1769 	c.seq = hdr->sadb_msg_seq;
1770 	c.portid = hdr->sadb_msg_pid;
1771 	c.event = XFRM_MSG_FLUSHSA;
1772 	c.net = net;
1773 	km_state_notify(NULL, &c);
1774 
1775 	return 0;
1776 }
1777 
1778 static int dump_sa(struct xfrm_state *x, int count, void *ptr)
1779 {
1780 	struct pfkey_sock *pfk = ptr;
1781 	struct sk_buff *out_skb;
1782 	struct sadb_msg *out_hdr;
1783 
1784 	if (!pfkey_can_dump(&pfk->sk))
1785 		return -ENOBUFS;
1786 
1787 	out_skb = pfkey_xfrm_state2msg(x);
1788 	if (IS_ERR(out_skb))
1789 		return PTR_ERR(out_skb);
1790 
1791 	out_hdr = (struct sadb_msg *) out_skb->data;
1792 	out_hdr->sadb_msg_version = pfk->dump.msg_version;
1793 	out_hdr->sadb_msg_type = SADB_DUMP;
1794 	out_hdr->sadb_msg_satype = pfkey_proto2satype(x->id.proto);
1795 	out_hdr->sadb_msg_errno = 0;
1796 	out_hdr->sadb_msg_reserved = 0;
1797 	out_hdr->sadb_msg_seq = count + 1;
1798 	out_hdr->sadb_msg_pid = pfk->dump.msg_portid;
1799 
1800 	if (pfk->dump.skb)
1801 		pfkey_broadcast(pfk->dump.skb, BROADCAST_ONE,
1802 				&pfk->sk, sock_net(&pfk->sk));
1803 	pfk->dump.skb = out_skb;
1804 
1805 	return 0;
1806 }
1807 
1808 static int pfkey_dump_sa(struct pfkey_sock *pfk)
1809 {
1810 	struct net *net = sock_net(&pfk->sk);
1811 	return xfrm_state_walk(net, &pfk->dump.u.state, dump_sa, (void *) pfk);
1812 }
1813 
1814 static void pfkey_dump_sa_done(struct pfkey_sock *pfk)
1815 {
1816 	struct net *net = sock_net(&pfk->sk);
1817 
1818 	xfrm_state_walk_done(&pfk->dump.u.state, net);
1819 }
1820 
1821 static int pfkey_dump(struct sock *sk, struct sk_buff *skb, const struct sadb_msg *hdr, void * const *ext_hdrs)
1822 {
1823 	u8 proto;
1824 	struct xfrm_address_filter *filter = NULL;
1825 	struct pfkey_sock *pfk = pfkey_sk(sk);
1826 
1827 	mutex_lock(&pfk->dump_lock);
1828 	if (pfk->dump.dump != NULL) {
1829 		mutex_unlock(&pfk->dump_lock);
1830 		return -EBUSY;
1831 	}
1832 
1833 	proto = pfkey_satype2proto(hdr->sadb_msg_satype);
1834 	if (proto == 0) {
1835 		mutex_unlock(&pfk->dump_lock);
1836 		return -EINVAL;
1837 	}
1838 
1839 	if (ext_hdrs[SADB_X_EXT_FILTER - 1]) {
1840 		struct sadb_x_filter *xfilter = ext_hdrs[SADB_X_EXT_FILTER - 1];
1841 
1842 		filter = kmalloc(sizeof(*filter), GFP_KERNEL);
1843 		if (filter == NULL) {
1844 			mutex_unlock(&pfk->dump_lock);
1845 			return -ENOMEM;
1846 		}
1847 
1848 		memcpy(&filter->saddr, &xfilter->sadb_x_filter_saddr,
1849 		       sizeof(xfrm_address_t));
1850 		memcpy(&filter->daddr, &xfilter->sadb_x_filter_daddr,
1851 		       sizeof(xfrm_address_t));
1852 		filter->family = xfilter->sadb_x_filter_family;
1853 		filter->splen = xfilter->sadb_x_filter_splen;
1854 		filter->dplen = xfilter->sadb_x_filter_dplen;
1855 	}
1856 
1857 	pfk->dump.msg_version = hdr->sadb_msg_version;
1858 	pfk->dump.msg_portid = hdr->sadb_msg_pid;
1859 	pfk->dump.dump = pfkey_dump_sa;
1860 	pfk->dump.done = pfkey_dump_sa_done;
1861 	xfrm_state_walk_init(&pfk->dump.u.state, proto, filter);
1862 	mutex_unlock(&pfk->dump_lock);
1863 
1864 	return pfkey_do_dump(pfk);
1865 }
1866 
1867 static int pfkey_promisc(struct sock *sk, struct sk_buff *skb, const struct sadb_msg *hdr, void * const *ext_hdrs)
1868 {
1869 	struct pfkey_sock *pfk = pfkey_sk(sk);
1870 	int satype = hdr->sadb_msg_satype;
1871 	bool reset_errno = false;
1872 
1873 	if (hdr->sadb_msg_len == (sizeof(*hdr) / sizeof(uint64_t))) {
1874 		reset_errno = true;
1875 		if (satype != 0 && satype != 1)
1876 			return -EINVAL;
1877 		pfk->promisc = satype;
1878 	}
1879 	if (reset_errno && skb_cloned(skb))
1880 		skb = skb_copy(skb, GFP_KERNEL);
1881 	else
1882 		skb = skb_clone(skb, GFP_KERNEL);
1883 
1884 	if (reset_errno && skb) {
1885 		struct sadb_msg *new_hdr = (struct sadb_msg *) skb->data;
1886 		new_hdr->sadb_msg_errno = 0;
1887 	}
1888 
1889 	pfkey_broadcast(skb, BROADCAST_ALL, NULL, sock_net(sk));
1890 	return 0;
1891 }
1892 
1893 static int check_reqid(struct xfrm_policy *xp, int dir, int count, void *ptr)
1894 {
1895 	int i;
1896 	u32 reqid = *(u32*)ptr;
1897 
1898 	for (i=0; i<xp->xfrm_nr; i++) {
1899 		if (xp->xfrm_vec[i].reqid == reqid)
1900 			return -EEXIST;
1901 	}
1902 	return 0;
1903 }
1904 
1905 static u32 gen_reqid(struct net *net)
1906 {
1907 	struct xfrm_policy_walk walk;
1908 	u32 start;
1909 	int rc;
1910 	static u32 reqid = IPSEC_MANUAL_REQID_MAX;
1911 
1912 	start = reqid;
1913 	do {
1914 		++reqid;
1915 		if (reqid == 0)
1916 			reqid = IPSEC_MANUAL_REQID_MAX+1;
1917 		xfrm_policy_walk_init(&walk, XFRM_POLICY_TYPE_MAIN);
1918 		rc = xfrm_policy_walk(net, &walk, check_reqid, (void*)&reqid);
1919 		xfrm_policy_walk_done(&walk, net);
1920 		if (rc != -EEXIST)
1921 			return reqid;
1922 	} while (reqid != start);
1923 	return 0;
1924 }
1925 
1926 static int
1927 parse_ipsecrequest(struct xfrm_policy *xp, struct sadb_x_ipsecrequest *rq)
1928 {
1929 	struct net *net = xp_net(xp);
1930 	struct xfrm_tmpl *t = xp->xfrm_vec + xp->xfrm_nr;
1931 	int mode;
1932 
1933 	if (xp->xfrm_nr >= XFRM_MAX_DEPTH)
1934 		return -ELOOP;
1935 
1936 	if (rq->sadb_x_ipsecrequest_mode == 0)
1937 		return -EINVAL;
1938 
1939 	t->id.proto = rq->sadb_x_ipsecrequest_proto; /* XXX check proto */
1940 	if ((mode = pfkey_mode_to_xfrm(rq->sadb_x_ipsecrequest_mode)) < 0)
1941 		return -EINVAL;
1942 	t->mode = mode;
1943 	if (rq->sadb_x_ipsecrequest_level == IPSEC_LEVEL_USE)
1944 		t->optional = 1;
1945 	else if (rq->sadb_x_ipsecrequest_level == IPSEC_LEVEL_UNIQUE) {
1946 		t->reqid = rq->sadb_x_ipsecrequest_reqid;
1947 		if (t->reqid > IPSEC_MANUAL_REQID_MAX)
1948 			t->reqid = 0;
1949 		if (!t->reqid && !(t->reqid = gen_reqid(net)))
1950 			return -ENOBUFS;
1951 	}
1952 
1953 	/* addresses present only in tunnel mode */
1954 	if (t->mode == XFRM_MODE_TUNNEL) {
1955 		int err;
1956 
1957 		err = parse_sockaddr_pair(
1958 			(struct sockaddr *)(rq + 1),
1959 			rq->sadb_x_ipsecrequest_len - sizeof(*rq),
1960 			&t->saddr, &t->id.daddr, &t->encap_family);
1961 		if (err)
1962 			return err;
1963 	} else
1964 		t->encap_family = xp->family;
1965 
1966 	/* No way to set this via kame pfkey */
1967 	t->allalgs = 1;
1968 	xp->xfrm_nr++;
1969 	return 0;
1970 }
1971 
1972 static int
1973 parse_ipsecrequests(struct xfrm_policy *xp, struct sadb_x_policy *pol)
1974 {
1975 	int err;
1976 	int len = pol->sadb_x_policy_len*8 - sizeof(struct sadb_x_policy);
1977 	struct sadb_x_ipsecrequest *rq = (void*)(pol+1);
1978 
1979 	if (pol->sadb_x_policy_len * 8 < sizeof(struct sadb_x_policy))
1980 		return -EINVAL;
1981 
1982 	while (len >= sizeof(*rq)) {
1983 		if (len < rq->sadb_x_ipsecrequest_len ||
1984 		    rq->sadb_x_ipsecrequest_len < sizeof(*rq))
1985 			return -EINVAL;
1986 
1987 		if ((err = parse_ipsecrequest(xp, rq)) < 0)
1988 			return err;
1989 		len -= rq->sadb_x_ipsecrequest_len;
1990 		rq = (void*)((u8*)rq + rq->sadb_x_ipsecrequest_len);
1991 	}
1992 	return 0;
1993 }
1994 
1995 static inline int pfkey_xfrm_policy2sec_ctx_size(const struct xfrm_policy *xp)
1996 {
1997   struct xfrm_sec_ctx *xfrm_ctx = xp->security;
1998 
1999 	if (xfrm_ctx) {
2000 		int len = sizeof(struct sadb_x_sec_ctx);
2001 		len += xfrm_ctx->ctx_len;
2002 		return PFKEY_ALIGN8(len);
2003 	}
2004 	return 0;
2005 }
2006 
2007 static int pfkey_xfrm_policy2msg_size(const struct xfrm_policy *xp)
2008 {
2009 	const struct xfrm_tmpl *t;
2010 	int sockaddr_size = pfkey_sockaddr_size(xp->family);
2011 	int socklen = 0;
2012 	int i;
2013 
2014 	for (i=0; i<xp->xfrm_nr; i++) {
2015 		t = xp->xfrm_vec + i;
2016 		socklen += pfkey_sockaddr_len(t->encap_family);
2017 	}
2018 
2019 	return sizeof(struct sadb_msg) +
2020 		(sizeof(struct sadb_lifetime) * 3) +
2021 		(sizeof(struct sadb_address) * 2) +
2022 		(sockaddr_size * 2) +
2023 		sizeof(struct sadb_x_policy) +
2024 		(xp->xfrm_nr * sizeof(struct sadb_x_ipsecrequest)) +
2025 		(socklen * 2) +
2026 		pfkey_xfrm_policy2sec_ctx_size(xp);
2027 }
2028 
2029 static struct sk_buff * pfkey_xfrm_policy2msg_prep(const struct xfrm_policy *xp)
2030 {
2031 	struct sk_buff *skb;
2032 	int size;
2033 
2034 	size = pfkey_xfrm_policy2msg_size(xp);
2035 
2036 	skb =  alloc_skb(size + 16, GFP_ATOMIC);
2037 	if (skb == NULL)
2038 		return ERR_PTR(-ENOBUFS);
2039 
2040 	return skb;
2041 }
2042 
2043 static int pfkey_xfrm_policy2msg(struct sk_buff *skb, const struct xfrm_policy *xp, int dir)
2044 {
2045 	struct sadb_msg *hdr;
2046 	struct sadb_address *addr;
2047 	struct sadb_lifetime *lifetime;
2048 	struct sadb_x_policy *pol;
2049 	struct sadb_x_sec_ctx *sec_ctx;
2050 	struct xfrm_sec_ctx *xfrm_ctx;
2051 	int i;
2052 	int size;
2053 	int sockaddr_size = pfkey_sockaddr_size(xp->family);
2054 	int socklen = pfkey_sockaddr_len(xp->family);
2055 
2056 	size = pfkey_xfrm_policy2msg_size(xp);
2057 
2058 	/* call should fill header later */
2059 	hdr = (struct sadb_msg *) skb_put(skb, sizeof(struct sadb_msg));
2060 	memset(hdr, 0, size);	/* XXX do we need this ? */
2061 
2062 	/* src address */
2063 	addr = (struct sadb_address*) skb_put(skb,
2064 					      sizeof(struct sadb_address)+sockaddr_size);
2065 	addr->sadb_address_len =
2066 		(sizeof(struct sadb_address)+sockaddr_size)/
2067 			sizeof(uint64_t);
2068 	addr->sadb_address_exttype = SADB_EXT_ADDRESS_SRC;
2069 	addr->sadb_address_proto = pfkey_proto_from_xfrm(xp->selector.proto);
2070 	addr->sadb_address_prefixlen = xp->selector.prefixlen_s;
2071 	addr->sadb_address_reserved = 0;
2072 	if (!pfkey_sockaddr_fill(&xp->selector.saddr,
2073 				 xp->selector.sport,
2074 				 (struct sockaddr *) (addr + 1),
2075 				 xp->family))
2076 		BUG();
2077 
2078 	/* dst address */
2079 	addr = (struct sadb_address*) skb_put(skb,
2080 					      sizeof(struct sadb_address)+sockaddr_size);
2081 	addr->sadb_address_len =
2082 		(sizeof(struct sadb_address)+sockaddr_size)/
2083 			sizeof(uint64_t);
2084 	addr->sadb_address_exttype = SADB_EXT_ADDRESS_DST;
2085 	addr->sadb_address_proto = pfkey_proto_from_xfrm(xp->selector.proto);
2086 	addr->sadb_address_prefixlen = xp->selector.prefixlen_d;
2087 	addr->sadb_address_reserved = 0;
2088 
2089 	pfkey_sockaddr_fill(&xp->selector.daddr, xp->selector.dport,
2090 			    (struct sockaddr *) (addr + 1),
2091 			    xp->family);
2092 
2093 	/* hard time */
2094 	lifetime = (struct sadb_lifetime *)  skb_put(skb,
2095 						     sizeof(struct sadb_lifetime));
2096 	lifetime->sadb_lifetime_len =
2097 		sizeof(struct sadb_lifetime)/sizeof(uint64_t);
2098 	lifetime->sadb_lifetime_exttype = SADB_EXT_LIFETIME_HARD;
2099 	lifetime->sadb_lifetime_allocations =  _X2KEY(xp->lft.hard_packet_limit);
2100 	lifetime->sadb_lifetime_bytes = _X2KEY(xp->lft.hard_byte_limit);
2101 	lifetime->sadb_lifetime_addtime = xp->lft.hard_add_expires_seconds;
2102 	lifetime->sadb_lifetime_usetime = xp->lft.hard_use_expires_seconds;
2103 	/* soft time */
2104 	lifetime = (struct sadb_lifetime *)  skb_put(skb,
2105 						     sizeof(struct sadb_lifetime));
2106 	lifetime->sadb_lifetime_len =
2107 		sizeof(struct sadb_lifetime)/sizeof(uint64_t);
2108 	lifetime->sadb_lifetime_exttype = SADB_EXT_LIFETIME_SOFT;
2109 	lifetime->sadb_lifetime_allocations =  _X2KEY(xp->lft.soft_packet_limit);
2110 	lifetime->sadb_lifetime_bytes = _X2KEY(xp->lft.soft_byte_limit);
2111 	lifetime->sadb_lifetime_addtime = xp->lft.soft_add_expires_seconds;
2112 	lifetime->sadb_lifetime_usetime = xp->lft.soft_use_expires_seconds;
2113 	/* current time */
2114 	lifetime = (struct sadb_lifetime *)  skb_put(skb,
2115 						     sizeof(struct sadb_lifetime));
2116 	lifetime->sadb_lifetime_len =
2117 		sizeof(struct sadb_lifetime)/sizeof(uint64_t);
2118 	lifetime->sadb_lifetime_exttype = SADB_EXT_LIFETIME_CURRENT;
2119 	lifetime->sadb_lifetime_allocations = xp->curlft.packets;
2120 	lifetime->sadb_lifetime_bytes = xp->curlft.bytes;
2121 	lifetime->sadb_lifetime_addtime = xp->curlft.add_time;
2122 	lifetime->sadb_lifetime_usetime = xp->curlft.use_time;
2123 
2124 	pol = (struct sadb_x_policy *)  skb_put(skb, sizeof(struct sadb_x_policy));
2125 	pol->sadb_x_policy_len = sizeof(struct sadb_x_policy)/sizeof(uint64_t);
2126 	pol->sadb_x_policy_exttype = SADB_X_EXT_POLICY;
2127 	pol->sadb_x_policy_type = IPSEC_POLICY_DISCARD;
2128 	if (xp->action == XFRM_POLICY_ALLOW) {
2129 		if (xp->xfrm_nr)
2130 			pol->sadb_x_policy_type = IPSEC_POLICY_IPSEC;
2131 		else
2132 			pol->sadb_x_policy_type = IPSEC_POLICY_NONE;
2133 	}
2134 	pol->sadb_x_policy_dir = dir+1;
2135 	pol->sadb_x_policy_reserved = 0;
2136 	pol->sadb_x_policy_id = xp->index;
2137 	pol->sadb_x_policy_priority = xp->priority;
2138 
2139 	for (i=0; i<xp->xfrm_nr; i++) {
2140 		const struct xfrm_tmpl *t = xp->xfrm_vec + i;
2141 		struct sadb_x_ipsecrequest *rq;
2142 		int req_size;
2143 		int mode;
2144 
2145 		req_size = sizeof(struct sadb_x_ipsecrequest);
2146 		if (t->mode == XFRM_MODE_TUNNEL) {
2147 			socklen = pfkey_sockaddr_len(t->encap_family);
2148 			req_size += socklen * 2;
2149 		} else {
2150 			size -= 2*socklen;
2151 		}
2152 		rq = (void*)skb_put(skb, req_size);
2153 		pol->sadb_x_policy_len += req_size/8;
2154 		memset(rq, 0, sizeof(*rq));
2155 		rq->sadb_x_ipsecrequest_len = req_size;
2156 		rq->sadb_x_ipsecrequest_proto = t->id.proto;
2157 		if ((mode = pfkey_mode_from_xfrm(t->mode)) < 0)
2158 			return -EINVAL;
2159 		rq->sadb_x_ipsecrequest_mode = mode;
2160 		rq->sadb_x_ipsecrequest_level = IPSEC_LEVEL_REQUIRE;
2161 		if (t->reqid)
2162 			rq->sadb_x_ipsecrequest_level = IPSEC_LEVEL_UNIQUE;
2163 		if (t->optional)
2164 			rq->sadb_x_ipsecrequest_level = IPSEC_LEVEL_USE;
2165 		rq->sadb_x_ipsecrequest_reqid = t->reqid;
2166 
2167 		if (t->mode == XFRM_MODE_TUNNEL) {
2168 			u8 *sa = (void *)(rq + 1);
2169 			pfkey_sockaddr_fill(&t->saddr, 0,
2170 					    (struct sockaddr *)sa,
2171 					    t->encap_family);
2172 			pfkey_sockaddr_fill(&t->id.daddr, 0,
2173 					    (struct sockaddr *) (sa + socklen),
2174 					    t->encap_family);
2175 		}
2176 	}
2177 
2178 	/* security context */
2179 	if ((xfrm_ctx = xp->security)) {
2180 		int ctx_size = pfkey_xfrm_policy2sec_ctx_size(xp);
2181 
2182 		sec_ctx = (struct sadb_x_sec_ctx *) skb_put(skb, ctx_size);
2183 		sec_ctx->sadb_x_sec_len = ctx_size / sizeof(uint64_t);
2184 		sec_ctx->sadb_x_sec_exttype = SADB_X_EXT_SEC_CTX;
2185 		sec_ctx->sadb_x_ctx_doi = xfrm_ctx->ctx_doi;
2186 		sec_ctx->sadb_x_ctx_alg = xfrm_ctx->ctx_alg;
2187 		sec_ctx->sadb_x_ctx_len = xfrm_ctx->ctx_len;
2188 		memcpy(sec_ctx + 1, xfrm_ctx->ctx_str,
2189 		       xfrm_ctx->ctx_len);
2190 	}
2191 
2192 	hdr->sadb_msg_len = size / sizeof(uint64_t);
2193 	hdr->sadb_msg_reserved = atomic_read(&xp->refcnt);
2194 
2195 	return 0;
2196 }
2197 
2198 static int key_notify_policy(struct xfrm_policy *xp, int dir, const struct km_event *c)
2199 {
2200 	struct sk_buff *out_skb;
2201 	struct sadb_msg *out_hdr;
2202 	int err;
2203 
2204 	out_skb = pfkey_xfrm_policy2msg_prep(xp);
2205 	if (IS_ERR(out_skb))
2206 		return PTR_ERR(out_skb);
2207 
2208 	err = pfkey_xfrm_policy2msg(out_skb, xp, dir);
2209 	if (err < 0)
2210 		return err;
2211 
2212 	out_hdr = (struct sadb_msg *) out_skb->data;
2213 	out_hdr->sadb_msg_version = PF_KEY_V2;
2214 
2215 	if (c->data.byid && c->event == XFRM_MSG_DELPOLICY)
2216 		out_hdr->sadb_msg_type = SADB_X_SPDDELETE2;
2217 	else
2218 		out_hdr->sadb_msg_type = event2poltype(c->event);
2219 	out_hdr->sadb_msg_errno = 0;
2220 	out_hdr->sadb_msg_seq = c->seq;
2221 	out_hdr->sadb_msg_pid = c->portid;
2222 	pfkey_broadcast(out_skb, BROADCAST_ALL, NULL, xp_net(xp));
2223 	return 0;
2224 
2225 }
2226 
2227 static int pfkey_spdadd(struct sock *sk, struct sk_buff *skb, const struct sadb_msg *hdr, void * const *ext_hdrs)
2228 {
2229 	struct net *net = sock_net(sk);
2230 	int err = 0;
2231 	struct sadb_lifetime *lifetime;
2232 	struct sadb_address *sa;
2233 	struct sadb_x_policy *pol;
2234 	struct xfrm_policy *xp;
2235 	struct km_event c;
2236 	struct sadb_x_sec_ctx *sec_ctx;
2237 
2238 	if (!present_and_same_family(ext_hdrs[SADB_EXT_ADDRESS_SRC-1],
2239 				     ext_hdrs[SADB_EXT_ADDRESS_DST-1]) ||
2240 	    !ext_hdrs[SADB_X_EXT_POLICY-1])
2241 		return -EINVAL;
2242 
2243 	pol = ext_hdrs[SADB_X_EXT_POLICY-1];
2244 	if (pol->sadb_x_policy_type > IPSEC_POLICY_IPSEC)
2245 		return -EINVAL;
2246 	if (!pol->sadb_x_policy_dir || pol->sadb_x_policy_dir >= IPSEC_DIR_MAX)
2247 		return -EINVAL;
2248 
2249 	xp = xfrm_policy_alloc(net, GFP_KERNEL);
2250 	if (xp == NULL)
2251 		return -ENOBUFS;
2252 
2253 	xp->action = (pol->sadb_x_policy_type == IPSEC_POLICY_DISCARD ?
2254 		      XFRM_POLICY_BLOCK : XFRM_POLICY_ALLOW);
2255 	xp->priority = pol->sadb_x_policy_priority;
2256 
2257 	sa = ext_hdrs[SADB_EXT_ADDRESS_SRC-1];
2258 	xp->family = pfkey_sadb_addr2xfrm_addr(sa, &xp->selector.saddr);
2259 	xp->selector.family = xp->family;
2260 	xp->selector.prefixlen_s = sa->sadb_address_prefixlen;
2261 	xp->selector.proto = pfkey_proto_to_xfrm(sa->sadb_address_proto);
2262 	xp->selector.sport = ((struct sockaddr_in *)(sa+1))->sin_port;
2263 	if (xp->selector.sport)
2264 		xp->selector.sport_mask = htons(0xffff);
2265 
2266 	sa = ext_hdrs[SADB_EXT_ADDRESS_DST-1];
2267 	pfkey_sadb_addr2xfrm_addr(sa, &xp->selector.daddr);
2268 	xp->selector.prefixlen_d = sa->sadb_address_prefixlen;
2269 
2270 	/* Amusing, we set this twice.  KAME apps appear to set same value
2271 	 * in both addresses.
2272 	 */
2273 	xp->selector.proto = pfkey_proto_to_xfrm(sa->sadb_address_proto);
2274 
2275 	xp->selector.dport = ((struct sockaddr_in *)(sa+1))->sin_port;
2276 	if (xp->selector.dport)
2277 		xp->selector.dport_mask = htons(0xffff);
2278 
2279 	sec_ctx = ext_hdrs[SADB_X_EXT_SEC_CTX - 1];
2280 	if (sec_ctx != NULL) {
2281 		struct xfrm_user_sec_ctx *uctx = pfkey_sadb2xfrm_user_sec_ctx(sec_ctx, GFP_KERNEL);
2282 
2283 		if (!uctx) {
2284 			err = -ENOBUFS;
2285 			goto out;
2286 		}
2287 
2288 		err = security_xfrm_policy_alloc(&xp->security, uctx, GFP_KERNEL);
2289 		kfree(uctx);
2290 
2291 		if (err)
2292 			goto out;
2293 	}
2294 
2295 	xp->lft.soft_byte_limit = XFRM_INF;
2296 	xp->lft.hard_byte_limit = XFRM_INF;
2297 	xp->lft.soft_packet_limit = XFRM_INF;
2298 	xp->lft.hard_packet_limit = XFRM_INF;
2299 	if ((lifetime = ext_hdrs[SADB_EXT_LIFETIME_HARD-1]) != NULL) {
2300 		xp->lft.hard_packet_limit = _KEY2X(lifetime->sadb_lifetime_allocations);
2301 		xp->lft.hard_byte_limit = _KEY2X(lifetime->sadb_lifetime_bytes);
2302 		xp->lft.hard_add_expires_seconds = lifetime->sadb_lifetime_addtime;
2303 		xp->lft.hard_use_expires_seconds = lifetime->sadb_lifetime_usetime;
2304 	}
2305 	if ((lifetime = ext_hdrs[SADB_EXT_LIFETIME_SOFT-1]) != NULL) {
2306 		xp->lft.soft_packet_limit = _KEY2X(lifetime->sadb_lifetime_allocations);
2307 		xp->lft.soft_byte_limit = _KEY2X(lifetime->sadb_lifetime_bytes);
2308 		xp->lft.soft_add_expires_seconds = lifetime->sadb_lifetime_addtime;
2309 		xp->lft.soft_use_expires_seconds = lifetime->sadb_lifetime_usetime;
2310 	}
2311 	xp->xfrm_nr = 0;
2312 	if (pol->sadb_x_policy_type == IPSEC_POLICY_IPSEC &&
2313 	    (err = parse_ipsecrequests(xp, pol)) < 0)
2314 		goto out;
2315 
2316 	err = xfrm_policy_insert(pol->sadb_x_policy_dir-1, xp,
2317 				 hdr->sadb_msg_type != SADB_X_SPDUPDATE);
2318 
2319 	xfrm_audit_policy_add(xp, err ? 0 : 1, true);
2320 
2321 	if (err)
2322 		goto out;
2323 
2324 	if (hdr->sadb_msg_type == SADB_X_SPDUPDATE)
2325 		c.event = XFRM_MSG_UPDPOLICY;
2326 	else
2327 		c.event = XFRM_MSG_NEWPOLICY;
2328 
2329 	c.seq = hdr->sadb_msg_seq;
2330 	c.portid = hdr->sadb_msg_pid;
2331 
2332 	km_policy_notify(xp, pol->sadb_x_policy_dir-1, &c);
2333 	xfrm_pol_put(xp);
2334 	return 0;
2335 
2336 out:
2337 	xp->walk.dead = 1;
2338 	xfrm_policy_destroy(xp);
2339 	return err;
2340 }
2341 
2342 static int pfkey_spddelete(struct sock *sk, struct sk_buff *skb, const struct sadb_msg *hdr, void * const *ext_hdrs)
2343 {
2344 	struct net *net = sock_net(sk);
2345 	int err;
2346 	struct sadb_address *sa;
2347 	struct sadb_x_policy *pol;
2348 	struct xfrm_policy *xp;
2349 	struct xfrm_selector sel;
2350 	struct km_event c;
2351 	struct sadb_x_sec_ctx *sec_ctx;
2352 	struct xfrm_sec_ctx *pol_ctx = NULL;
2353 
2354 	if (!present_and_same_family(ext_hdrs[SADB_EXT_ADDRESS_SRC-1],
2355 				     ext_hdrs[SADB_EXT_ADDRESS_DST-1]) ||
2356 	    !ext_hdrs[SADB_X_EXT_POLICY-1])
2357 		return -EINVAL;
2358 
2359 	pol = ext_hdrs[SADB_X_EXT_POLICY-1];
2360 	if (!pol->sadb_x_policy_dir || pol->sadb_x_policy_dir >= IPSEC_DIR_MAX)
2361 		return -EINVAL;
2362 
2363 	memset(&sel, 0, sizeof(sel));
2364 
2365 	sa = ext_hdrs[SADB_EXT_ADDRESS_SRC-1];
2366 	sel.family = pfkey_sadb_addr2xfrm_addr(sa, &sel.saddr);
2367 	sel.prefixlen_s = sa->sadb_address_prefixlen;
2368 	sel.proto = pfkey_proto_to_xfrm(sa->sadb_address_proto);
2369 	sel.sport = ((struct sockaddr_in *)(sa+1))->sin_port;
2370 	if (sel.sport)
2371 		sel.sport_mask = htons(0xffff);
2372 
2373 	sa = ext_hdrs[SADB_EXT_ADDRESS_DST-1];
2374 	pfkey_sadb_addr2xfrm_addr(sa, &sel.daddr);
2375 	sel.prefixlen_d = sa->sadb_address_prefixlen;
2376 	sel.proto = pfkey_proto_to_xfrm(sa->sadb_address_proto);
2377 	sel.dport = ((struct sockaddr_in *)(sa+1))->sin_port;
2378 	if (sel.dport)
2379 		sel.dport_mask = htons(0xffff);
2380 
2381 	sec_ctx = ext_hdrs[SADB_X_EXT_SEC_CTX - 1];
2382 	if (sec_ctx != NULL) {
2383 		struct xfrm_user_sec_ctx *uctx = pfkey_sadb2xfrm_user_sec_ctx(sec_ctx, GFP_KERNEL);
2384 
2385 		if (!uctx)
2386 			return -ENOMEM;
2387 
2388 		err = security_xfrm_policy_alloc(&pol_ctx, uctx, GFP_KERNEL);
2389 		kfree(uctx);
2390 		if (err)
2391 			return err;
2392 	}
2393 
2394 	xp = xfrm_policy_bysel_ctx(net, DUMMY_MARK, XFRM_POLICY_TYPE_MAIN,
2395 				   pol->sadb_x_policy_dir - 1, &sel, pol_ctx,
2396 				   1, &err);
2397 	security_xfrm_policy_free(pol_ctx);
2398 	if (xp == NULL)
2399 		return -ENOENT;
2400 
2401 	xfrm_audit_policy_delete(xp, err ? 0 : 1, true);
2402 
2403 	if (err)
2404 		goto out;
2405 
2406 	c.seq = hdr->sadb_msg_seq;
2407 	c.portid = hdr->sadb_msg_pid;
2408 	c.data.byid = 0;
2409 	c.event = XFRM_MSG_DELPOLICY;
2410 	km_policy_notify(xp, pol->sadb_x_policy_dir-1, &c);
2411 
2412 out:
2413 	xfrm_pol_put(xp);
2414 	if (err == 0)
2415 		xfrm_garbage_collect(net);
2416 	return err;
2417 }
2418 
2419 static int key_pol_get_resp(struct sock *sk, struct xfrm_policy *xp, const struct sadb_msg *hdr, int dir)
2420 {
2421 	int err;
2422 	struct sk_buff *out_skb;
2423 	struct sadb_msg *out_hdr;
2424 	err = 0;
2425 
2426 	out_skb = pfkey_xfrm_policy2msg_prep(xp);
2427 	if (IS_ERR(out_skb)) {
2428 		err =  PTR_ERR(out_skb);
2429 		goto out;
2430 	}
2431 	err = pfkey_xfrm_policy2msg(out_skb, xp, dir);
2432 	if (err < 0)
2433 		goto out;
2434 
2435 	out_hdr = (struct sadb_msg *) out_skb->data;
2436 	out_hdr->sadb_msg_version = hdr->sadb_msg_version;
2437 	out_hdr->sadb_msg_type = hdr->sadb_msg_type;
2438 	out_hdr->sadb_msg_satype = 0;
2439 	out_hdr->sadb_msg_errno = 0;
2440 	out_hdr->sadb_msg_seq = hdr->sadb_msg_seq;
2441 	out_hdr->sadb_msg_pid = hdr->sadb_msg_pid;
2442 	pfkey_broadcast(out_skb, BROADCAST_ONE, sk, xp_net(xp));
2443 	err = 0;
2444 
2445 out:
2446 	return err;
2447 }
2448 
2449 static int pfkey_sockaddr_pair_size(sa_family_t family)
2450 {
2451 	return PFKEY_ALIGN8(pfkey_sockaddr_len(family) * 2);
2452 }
2453 
2454 static int parse_sockaddr_pair(struct sockaddr *sa, int ext_len,
2455 			       xfrm_address_t *saddr, xfrm_address_t *daddr,
2456 			       u16 *family)
2457 {
2458 	int af, socklen;
2459 
2460 	if (ext_len < 2 || ext_len < pfkey_sockaddr_pair_size(sa->sa_family))
2461 		return -EINVAL;
2462 
2463 	af = pfkey_sockaddr_extract(sa, saddr);
2464 	if (!af)
2465 		return -EINVAL;
2466 
2467 	socklen = pfkey_sockaddr_len(af);
2468 	if (pfkey_sockaddr_extract((struct sockaddr *) (((u8 *)sa) + socklen),
2469 				   daddr) != af)
2470 		return -EINVAL;
2471 
2472 	*family = af;
2473 	return 0;
2474 }
2475 
2476 #ifdef CONFIG_NET_KEY_MIGRATE
2477 static int ipsecrequests_to_migrate(struct sadb_x_ipsecrequest *rq1, int len,
2478 				    struct xfrm_migrate *m)
2479 {
2480 	int err;
2481 	struct sadb_x_ipsecrequest *rq2;
2482 	int mode;
2483 
2484 	if (len < sizeof(*rq1) ||
2485 	    len < rq1->sadb_x_ipsecrequest_len ||
2486 	    rq1->sadb_x_ipsecrequest_len < sizeof(*rq1))
2487 		return -EINVAL;
2488 
2489 	/* old endoints */
2490 	err = parse_sockaddr_pair((struct sockaddr *)(rq1 + 1),
2491 				  rq1->sadb_x_ipsecrequest_len - sizeof(*rq1),
2492 				  &m->old_saddr, &m->old_daddr,
2493 				  &m->old_family);
2494 	if (err)
2495 		return err;
2496 
2497 	rq2 = (struct sadb_x_ipsecrequest *)((u8 *)rq1 + rq1->sadb_x_ipsecrequest_len);
2498 	len -= rq1->sadb_x_ipsecrequest_len;
2499 
2500 	if (len <= sizeof(*rq2) ||
2501 	    len < rq2->sadb_x_ipsecrequest_len ||
2502 	    rq2->sadb_x_ipsecrequest_len < sizeof(*rq2))
2503 		return -EINVAL;
2504 
2505 	/* new endpoints */
2506 	err = parse_sockaddr_pair((struct sockaddr *)(rq2 + 1),
2507 				  rq2->sadb_x_ipsecrequest_len - sizeof(*rq2),
2508 				  &m->new_saddr, &m->new_daddr,
2509 				  &m->new_family);
2510 	if (err)
2511 		return err;
2512 
2513 	if (rq1->sadb_x_ipsecrequest_proto != rq2->sadb_x_ipsecrequest_proto ||
2514 	    rq1->sadb_x_ipsecrequest_mode != rq2->sadb_x_ipsecrequest_mode ||
2515 	    rq1->sadb_x_ipsecrequest_reqid != rq2->sadb_x_ipsecrequest_reqid)
2516 		return -EINVAL;
2517 
2518 	m->proto = rq1->sadb_x_ipsecrequest_proto;
2519 	if ((mode = pfkey_mode_to_xfrm(rq1->sadb_x_ipsecrequest_mode)) < 0)
2520 		return -EINVAL;
2521 	m->mode = mode;
2522 	m->reqid = rq1->sadb_x_ipsecrequest_reqid;
2523 
2524 	return ((int)(rq1->sadb_x_ipsecrequest_len +
2525 		      rq2->sadb_x_ipsecrequest_len));
2526 }
2527 
2528 static int pfkey_migrate(struct sock *sk, struct sk_buff *skb,
2529 			 const struct sadb_msg *hdr, void * const *ext_hdrs)
2530 {
2531 	int i, len, ret, err = -EINVAL;
2532 	u8 dir;
2533 	struct sadb_address *sa;
2534 	struct sadb_x_kmaddress *kma;
2535 	struct sadb_x_policy *pol;
2536 	struct sadb_x_ipsecrequest *rq;
2537 	struct xfrm_selector sel;
2538 	struct xfrm_migrate m[XFRM_MAX_DEPTH];
2539 	struct xfrm_kmaddress k;
2540 	struct net *net = sock_net(sk);
2541 
2542 	if (!present_and_same_family(ext_hdrs[SADB_EXT_ADDRESS_SRC - 1],
2543 				     ext_hdrs[SADB_EXT_ADDRESS_DST - 1]) ||
2544 	    !ext_hdrs[SADB_X_EXT_POLICY - 1]) {
2545 		err = -EINVAL;
2546 		goto out;
2547 	}
2548 
2549 	kma = ext_hdrs[SADB_X_EXT_KMADDRESS - 1];
2550 	pol = ext_hdrs[SADB_X_EXT_POLICY - 1];
2551 
2552 	if (pol->sadb_x_policy_dir >= IPSEC_DIR_MAX) {
2553 		err = -EINVAL;
2554 		goto out;
2555 	}
2556 
2557 	if (kma) {
2558 		/* convert sadb_x_kmaddress to xfrm_kmaddress */
2559 		k.reserved = kma->sadb_x_kmaddress_reserved;
2560 		ret = parse_sockaddr_pair((struct sockaddr *)(kma + 1),
2561 					  8*(kma->sadb_x_kmaddress_len) - sizeof(*kma),
2562 					  &k.local, &k.remote, &k.family);
2563 		if (ret < 0) {
2564 			err = ret;
2565 			goto out;
2566 		}
2567 	}
2568 
2569 	dir = pol->sadb_x_policy_dir - 1;
2570 	memset(&sel, 0, sizeof(sel));
2571 
2572 	/* set source address info of selector */
2573 	sa = ext_hdrs[SADB_EXT_ADDRESS_SRC - 1];
2574 	sel.family = pfkey_sadb_addr2xfrm_addr(sa, &sel.saddr);
2575 	sel.prefixlen_s = sa->sadb_address_prefixlen;
2576 	sel.proto = pfkey_proto_to_xfrm(sa->sadb_address_proto);
2577 	sel.sport = ((struct sockaddr_in *)(sa + 1))->sin_port;
2578 	if (sel.sport)
2579 		sel.sport_mask = htons(0xffff);
2580 
2581 	/* set destination address info of selector */
2582 	sa = ext_hdrs[SADB_EXT_ADDRESS_DST - 1];
2583 	pfkey_sadb_addr2xfrm_addr(sa, &sel.daddr);
2584 	sel.prefixlen_d = sa->sadb_address_prefixlen;
2585 	sel.proto = pfkey_proto_to_xfrm(sa->sadb_address_proto);
2586 	sel.dport = ((struct sockaddr_in *)(sa + 1))->sin_port;
2587 	if (sel.dport)
2588 		sel.dport_mask = htons(0xffff);
2589 
2590 	rq = (struct sadb_x_ipsecrequest *)(pol + 1);
2591 
2592 	/* extract ipsecrequests */
2593 	i = 0;
2594 	len = pol->sadb_x_policy_len * 8 - sizeof(struct sadb_x_policy);
2595 
2596 	while (len > 0 && i < XFRM_MAX_DEPTH) {
2597 		ret = ipsecrequests_to_migrate(rq, len, &m[i]);
2598 		if (ret < 0) {
2599 			err = ret;
2600 			goto out;
2601 		} else {
2602 			rq = (struct sadb_x_ipsecrequest *)((u8 *)rq + ret);
2603 			len -= ret;
2604 			i++;
2605 		}
2606 	}
2607 
2608 	if (!i || len > 0) {
2609 		err = -EINVAL;
2610 		goto out;
2611 	}
2612 
2613 	return xfrm_migrate(&sel, dir, XFRM_POLICY_TYPE_MAIN, m, i,
2614 			    kma ? &k : NULL, net);
2615 
2616  out:
2617 	return err;
2618 }
2619 #else
2620 static int pfkey_migrate(struct sock *sk, struct sk_buff *skb,
2621 			 const struct sadb_msg *hdr, void * const *ext_hdrs)
2622 {
2623 	return -ENOPROTOOPT;
2624 }
2625 #endif
2626 
2627 
2628 static int pfkey_spdget(struct sock *sk, struct sk_buff *skb, const struct sadb_msg *hdr, void * const *ext_hdrs)
2629 {
2630 	struct net *net = sock_net(sk);
2631 	unsigned int dir;
2632 	int err = 0, delete;
2633 	struct sadb_x_policy *pol;
2634 	struct xfrm_policy *xp;
2635 	struct km_event c;
2636 
2637 	if ((pol = ext_hdrs[SADB_X_EXT_POLICY-1]) == NULL)
2638 		return -EINVAL;
2639 
2640 	dir = xfrm_policy_id2dir(pol->sadb_x_policy_id);
2641 	if (dir >= XFRM_POLICY_MAX)
2642 		return -EINVAL;
2643 
2644 	delete = (hdr->sadb_msg_type == SADB_X_SPDDELETE2);
2645 	xp = xfrm_policy_byid(net, DUMMY_MARK, XFRM_POLICY_TYPE_MAIN,
2646 			      dir, pol->sadb_x_policy_id, delete, &err);
2647 	if (xp == NULL)
2648 		return -ENOENT;
2649 
2650 	if (delete) {
2651 		xfrm_audit_policy_delete(xp, err ? 0 : 1, true);
2652 
2653 		if (err)
2654 			goto out;
2655 		c.seq = hdr->sadb_msg_seq;
2656 		c.portid = hdr->sadb_msg_pid;
2657 		c.data.byid = 1;
2658 		c.event = XFRM_MSG_DELPOLICY;
2659 		km_policy_notify(xp, dir, &c);
2660 	} else {
2661 		err = key_pol_get_resp(sk, xp, hdr, dir);
2662 	}
2663 
2664 out:
2665 	xfrm_pol_put(xp);
2666 	if (delete && err == 0)
2667 		xfrm_garbage_collect(net);
2668 	return err;
2669 }
2670 
2671 static int dump_sp(struct xfrm_policy *xp, int dir, int count, void *ptr)
2672 {
2673 	struct pfkey_sock *pfk = ptr;
2674 	struct sk_buff *out_skb;
2675 	struct sadb_msg *out_hdr;
2676 	int err;
2677 
2678 	if (!pfkey_can_dump(&pfk->sk))
2679 		return -ENOBUFS;
2680 
2681 	out_skb = pfkey_xfrm_policy2msg_prep(xp);
2682 	if (IS_ERR(out_skb))
2683 		return PTR_ERR(out_skb);
2684 
2685 	err = pfkey_xfrm_policy2msg(out_skb, xp, dir);
2686 	if (err < 0)
2687 		return err;
2688 
2689 	out_hdr = (struct sadb_msg *) out_skb->data;
2690 	out_hdr->sadb_msg_version = pfk->dump.msg_version;
2691 	out_hdr->sadb_msg_type = SADB_X_SPDDUMP;
2692 	out_hdr->sadb_msg_satype = SADB_SATYPE_UNSPEC;
2693 	out_hdr->sadb_msg_errno = 0;
2694 	out_hdr->sadb_msg_seq = count + 1;
2695 	out_hdr->sadb_msg_pid = pfk->dump.msg_portid;
2696 
2697 	if (pfk->dump.skb)
2698 		pfkey_broadcast(pfk->dump.skb, BROADCAST_ONE,
2699 				&pfk->sk, sock_net(&pfk->sk));
2700 	pfk->dump.skb = out_skb;
2701 
2702 	return 0;
2703 }
2704 
2705 static int pfkey_dump_sp(struct pfkey_sock *pfk)
2706 {
2707 	struct net *net = sock_net(&pfk->sk);
2708 	return xfrm_policy_walk(net, &pfk->dump.u.policy, dump_sp, (void *) pfk);
2709 }
2710 
2711 static void pfkey_dump_sp_done(struct pfkey_sock *pfk)
2712 {
2713 	struct net *net = sock_net((struct sock *)pfk);
2714 
2715 	xfrm_policy_walk_done(&pfk->dump.u.policy, net);
2716 }
2717 
2718 static int pfkey_spddump(struct sock *sk, struct sk_buff *skb, const struct sadb_msg *hdr, void * const *ext_hdrs)
2719 {
2720 	struct pfkey_sock *pfk = pfkey_sk(sk);
2721 
2722 	mutex_lock(&pfk->dump_lock);
2723 	if (pfk->dump.dump != NULL) {
2724 		mutex_unlock(&pfk->dump_lock);
2725 		return -EBUSY;
2726 	}
2727 
2728 	pfk->dump.msg_version = hdr->sadb_msg_version;
2729 	pfk->dump.msg_portid = hdr->sadb_msg_pid;
2730 	pfk->dump.dump = pfkey_dump_sp;
2731 	pfk->dump.done = pfkey_dump_sp_done;
2732 	xfrm_policy_walk_init(&pfk->dump.u.policy, XFRM_POLICY_TYPE_MAIN);
2733 	mutex_unlock(&pfk->dump_lock);
2734 
2735 	return pfkey_do_dump(pfk);
2736 }
2737 
2738 static int key_notify_policy_flush(const struct km_event *c)
2739 {
2740 	struct sk_buff *skb_out;
2741 	struct sadb_msg *hdr;
2742 
2743 	skb_out = alloc_skb(sizeof(struct sadb_msg) + 16, GFP_ATOMIC);
2744 	if (!skb_out)
2745 		return -ENOBUFS;
2746 	hdr = (struct sadb_msg *) skb_put(skb_out, sizeof(struct sadb_msg));
2747 	hdr->sadb_msg_type = SADB_X_SPDFLUSH;
2748 	hdr->sadb_msg_seq = c->seq;
2749 	hdr->sadb_msg_pid = c->portid;
2750 	hdr->sadb_msg_version = PF_KEY_V2;
2751 	hdr->sadb_msg_errno = (uint8_t) 0;
2752 	hdr->sadb_msg_satype = SADB_SATYPE_UNSPEC;
2753 	hdr->sadb_msg_len = (sizeof(struct sadb_msg) / sizeof(uint64_t));
2754 	hdr->sadb_msg_reserved = 0;
2755 	pfkey_broadcast(skb_out, BROADCAST_ALL, NULL, c->net);
2756 	return 0;
2757 
2758 }
2759 
2760 static int pfkey_spdflush(struct sock *sk, struct sk_buff *skb, const struct sadb_msg *hdr, void * const *ext_hdrs)
2761 {
2762 	struct net *net = sock_net(sk);
2763 	struct km_event c;
2764 	int err, err2;
2765 
2766 	err = xfrm_policy_flush(net, XFRM_POLICY_TYPE_MAIN, true);
2767 	if (!err)
2768 		xfrm_garbage_collect(net);
2769 	err2 = unicast_flush_resp(sk, hdr);
2770 	if (err || err2) {
2771 		if (err == -ESRCH) /* empty table - old silent behavior */
2772 			return 0;
2773 		return err;
2774 	}
2775 
2776 	c.data.type = XFRM_POLICY_TYPE_MAIN;
2777 	c.event = XFRM_MSG_FLUSHPOLICY;
2778 	c.portid = hdr->sadb_msg_pid;
2779 	c.seq = hdr->sadb_msg_seq;
2780 	c.net = net;
2781 	km_policy_notify(NULL, 0, &c);
2782 
2783 	return 0;
2784 }
2785 
2786 typedef int (*pfkey_handler)(struct sock *sk, struct sk_buff *skb,
2787 			     const struct sadb_msg *hdr, void * const *ext_hdrs);
2788 static const pfkey_handler pfkey_funcs[SADB_MAX + 1] = {
2789 	[SADB_RESERVED]		= pfkey_reserved,
2790 	[SADB_GETSPI]		= pfkey_getspi,
2791 	[SADB_UPDATE]		= pfkey_add,
2792 	[SADB_ADD]		= pfkey_add,
2793 	[SADB_DELETE]		= pfkey_delete,
2794 	[SADB_GET]		= pfkey_get,
2795 	[SADB_ACQUIRE]		= pfkey_acquire,
2796 	[SADB_REGISTER]		= pfkey_register,
2797 	[SADB_EXPIRE]		= NULL,
2798 	[SADB_FLUSH]		= pfkey_flush,
2799 	[SADB_DUMP]		= pfkey_dump,
2800 	[SADB_X_PROMISC]	= pfkey_promisc,
2801 	[SADB_X_PCHANGE]	= NULL,
2802 	[SADB_X_SPDUPDATE]	= pfkey_spdadd,
2803 	[SADB_X_SPDADD]		= pfkey_spdadd,
2804 	[SADB_X_SPDDELETE]	= pfkey_spddelete,
2805 	[SADB_X_SPDGET]		= pfkey_spdget,
2806 	[SADB_X_SPDACQUIRE]	= NULL,
2807 	[SADB_X_SPDDUMP]	= pfkey_spddump,
2808 	[SADB_X_SPDFLUSH]	= pfkey_spdflush,
2809 	[SADB_X_SPDSETIDX]	= pfkey_spdadd,
2810 	[SADB_X_SPDDELETE2]	= pfkey_spdget,
2811 	[SADB_X_MIGRATE]	= pfkey_migrate,
2812 };
2813 
2814 static int pfkey_process(struct sock *sk, struct sk_buff *skb, const struct sadb_msg *hdr)
2815 {
2816 	void *ext_hdrs[SADB_EXT_MAX];
2817 	int err;
2818 
2819 	pfkey_broadcast(skb_clone(skb, GFP_KERNEL),
2820 			BROADCAST_PROMISC_ONLY, NULL, sock_net(sk));
2821 
2822 	memset(ext_hdrs, 0, sizeof(ext_hdrs));
2823 	err = parse_exthdrs(skb, hdr, ext_hdrs);
2824 	if (!err) {
2825 		err = -EOPNOTSUPP;
2826 		if (pfkey_funcs[hdr->sadb_msg_type])
2827 			err = pfkey_funcs[hdr->sadb_msg_type](sk, skb, hdr, ext_hdrs);
2828 	}
2829 	return err;
2830 }
2831 
2832 static struct sadb_msg *pfkey_get_base_msg(struct sk_buff *skb, int *errp)
2833 {
2834 	struct sadb_msg *hdr = NULL;
2835 
2836 	if (skb->len < sizeof(*hdr)) {
2837 		*errp = -EMSGSIZE;
2838 	} else {
2839 		hdr = (struct sadb_msg *) skb->data;
2840 		if (hdr->sadb_msg_version != PF_KEY_V2 ||
2841 		    hdr->sadb_msg_reserved != 0 ||
2842 		    (hdr->sadb_msg_type <= SADB_RESERVED ||
2843 		     hdr->sadb_msg_type > SADB_MAX)) {
2844 			hdr = NULL;
2845 			*errp = -EINVAL;
2846 		} else if (hdr->sadb_msg_len != (skb->len /
2847 						 sizeof(uint64_t)) ||
2848 			   hdr->sadb_msg_len < (sizeof(struct sadb_msg) /
2849 						sizeof(uint64_t))) {
2850 			hdr = NULL;
2851 			*errp = -EMSGSIZE;
2852 		} else {
2853 			*errp = 0;
2854 		}
2855 	}
2856 	return hdr;
2857 }
2858 
2859 static inline int aalg_tmpl_set(const struct xfrm_tmpl *t,
2860 				const struct xfrm_algo_desc *d)
2861 {
2862 	unsigned int id = d->desc.sadb_alg_id;
2863 
2864 	if (id >= sizeof(t->aalgos) * 8)
2865 		return 0;
2866 
2867 	return (t->aalgos >> id) & 1;
2868 }
2869 
2870 static inline int ealg_tmpl_set(const struct xfrm_tmpl *t,
2871 				const struct xfrm_algo_desc *d)
2872 {
2873 	unsigned int id = d->desc.sadb_alg_id;
2874 
2875 	if (id >= sizeof(t->ealgos) * 8)
2876 		return 0;
2877 
2878 	return (t->ealgos >> id) & 1;
2879 }
2880 
2881 static int count_ah_combs(const struct xfrm_tmpl *t)
2882 {
2883 	int i, sz = 0;
2884 
2885 	for (i = 0; ; i++) {
2886 		const struct xfrm_algo_desc *aalg = xfrm_aalg_get_byidx(i);
2887 		if (!aalg)
2888 			break;
2889 		if (!aalg->pfkey_supported)
2890 			continue;
2891 		if (aalg_tmpl_set(t, aalg) && aalg->available)
2892 			sz += sizeof(struct sadb_comb);
2893 	}
2894 	return sz + sizeof(struct sadb_prop);
2895 }
2896 
2897 static int count_esp_combs(const struct xfrm_tmpl *t)
2898 {
2899 	int i, k, sz = 0;
2900 
2901 	for (i = 0; ; i++) {
2902 		const struct xfrm_algo_desc *ealg = xfrm_ealg_get_byidx(i);
2903 		if (!ealg)
2904 			break;
2905 
2906 		if (!ealg->pfkey_supported)
2907 			continue;
2908 
2909 		if (!(ealg_tmpl_set(t, ealg) && ealg->available))
2910 			continue;
2911 
2912 		for (k = 1; ; k++) {
2913 			const struct xfrm_algo_desc *aalg = xfrm_aalg_get_byidx(k);
2914 			if (!aalg)
2915 				break;
2916 
2917 			if (!aalg->pfkey_supported)
2918 				continue;
2919 
2920 			if (aalg_tmpl_set(t, aalg) && aalg->available)
2921 				sz += sizeof(struct sadb_comb);
2922 		}
2923 	}
2924 	return sz + sizeof(struct sadb_prop);
2925 }
2926 
2927 static void dump_ah_combs(struct sk_buff *skb, const struct xfrm_tmpl *t)
2928 {
2929 	struct sadb_prop *p;
2930 	int i;
2931 
2932 	p = (struct sadb_prop*)skb_put(skb, sizeof(struct sadb_prop));
2933 	p->sadb_prop_len = sizeof(struct sadb_prop)/8;
2934 	p->sadb_prop_exttype = SADB_EXT_PROPOSAL;
2935 	p->sadb_prop_replay = 32;
2936 	memset(p->sadb_prop_reserved, 0, sizeof(p->sadb_prop_reserved));
2937 
2938 	for (i = 0; ; i++) {
2939 		const struct xfrm_algo_desc *aalg = xfrm_aalg_get_byidx(i);
2940 		if (!aalg)
2941 			break;
2942 
2943 		if (!aalg->pfkey_supported)
2944 			continue;
2945 
2946 		if (aalg_tmpl_set(t, aalg) && aalg->available) {
2947 			struct sadb_comb *c;
2948 			c = (struct sadb_comb*)skb_put(skb, sizeof(struct sadb_comb));
2949 			memset(c, 0, sizeof(*c));
2950 			p->sadb_prop_len += sizeof(struct sadb_comb)/8;
2951 			c->sadb_comb_auth = aalg->desc.sadb_alg_id;
2952 			c->sadb_comb_auth_minbits = aalg->desc.sadb_alg_minbits;
2953 			c->sadb_comb_auth_maxbits = aalg->desc.sadb_alg_maxbits;
2954 			c->sadb_comb_hard_addtime = 24*60*60;
2955 			c->sadb_comb_soft_addtime = 20*60*60;
2956 			c->sadb_comb_hard_usetime = 8*60*60;
2957 			c->sadb_comb_soft_usetime = 7*60*60;
2958 		}
2959 	}
2960 }
2961 
2962 static void dump_esp_combs(struct sk_buff *skb, const struct xfrm_tmpl *t)
2963 {
2964 	struct sadb_prop *p;
2965 	int i, k;
2966 
2967 	p = (struct sadb_prop*)skb_put(skb, sizeof(struct sadb_prop));
2968 	p->sadb_prop_len = sizeof(struct sadb_prop)/8;
2969 	p->sadb_prop_exttype = SADB_EXT_PROPOSAL;
2970 	p->sadb_prop_replay = 32;
2971 	memset(p->sadb_prop_reserved, 0, sizeof(p->sadb_prop_reserved));
2972 
2973 	for (i=0; ; i++) {
2974 		const struct xfrm_algo_desc *ealg = xfrm_ealg_get_byidx(i);
2975 		if (!ealg)
2976 			break;
2977 
2978 		if (!ealg->pfkey_supported)
2979 			continue;
2980 
2981 		if (!(ealg_tmpl_set(t, ealg) && ealg->available))
2982 			continue;
2983 
2984 		for (k = 1; ; k++) {
2985 			struct sadb_comb *c;
2986 			const struct xfrm_algo_desc *aalg = xfrm_aalg_get_byidx(k);
2987 			if (!aalg)
2988 				break;
2989 			if (!aalg->pfkey_supported)
2990 				continue;
2991 			if (!(aalg_tmpl_set(t, aalg) && aalg->available))
2992 				continue;
2993 			c = (struct sadb_comb*)skb_put(skb, sizeof(struct sadb_comb));
2994 			memset(c, 0, sizeof(*c));
2995 			p->sadb_prop_len += sizeof(struct sadb_comb)/8;
2996 			c->sadb_comb_auth = aalg->desc.sadb_alg_id;
2997 			c->sadb_comb_auth_minbits = aalg->desc.sadb_alg_minbits;
2998 			c->sadb_comb_auth_maxbits = aalg->desc.sadb_alg_maxbits;
2999 			c->sadb_comb_encrypt = ealg->desc.sadb_alg_id;
3000 			c->sadb_comb_encrypt_minbits = ealg->desc.sadb_alg_minbits;
3001 			c->sadb_comb_encrypt_maxbits = ealg->desc.sadb_alg_maxbits;
3002 			c->sadb_comb_hard_addtime = 24*60*60;
3003 			c->sadb_comb_soft_addtime = 20*60*60;
3004 			c->sadb_comb_hard_usetime = 8*60*60;
3005 			c->sadb_comb_soft_usetime = 7*60*60;
3006 		}
3007 	}
3008 }
3009 
3010 static int key_notify_policy_expire(struct xfrm_policy *xp, const struct km_event *c)
3011 {
3012 	return 0;
3013 }
3014 
3015 static int key_notify_sa_expire(struct xfrm_state *x, const struct km_event *c)
3016 {
3017 	struct sk_buff *out_skb;
3018 	struct sadb_msg *out_hdr;
3019 	int hard;
3020 	int hsc;
3021 
3022 	hard = c->data.hard;
3023 	if (hard)
3024 		hsc = 2;
3025 	else
3026 		hsc = 1;
3027 
3028 	out_skb = pfkey_xfrm_state2msg_expire(x, hsc);
3029 	if (IS_ERR(out_skb))
3030 		return PTR_ERR(out_skb);
3031 
3032 	out_hdr = (struct sadb_msg *) out_skb->data;
3033 	out_hdr->sadb_msg_version = PF_KEY_V2;
3034 	out_hdr->sadb_msg_type = SADB_EXPIRE;
3035 	out_hdr->sadb_msg_satype = pfkey_proto2satype(x->id.proto);
3036 	out_hdr->sadb_msg_errno = 0;
3037 	out_hdr->sadb_msg_reserved = 0;
3038 	out_hdr->sadb_msg_seq = 0;
3039 	out_hdr->sadb_msg_pid = 0;
3040 
3041 	pfkey_broadcast(out_skb, BROADCAST_REGISTERED, NULL, xs_net(x));
3042 	return 0;
3043 }
3044 
3045 static int pfkey_send_notify(struct xfrm_state *x, const struct km_event *c)
3046 {
3047 	struct net *net = x ? xs_net(x) : c->net;
3048 	struct netns_pfkey *net_pfkey = net_generic(net, pfkey_net_id);
3049 
3050 	if (atomic_read(&net_pfkey->socks_nr) == 0)
3051 		return 0;
3052 
3053 	switch (c->event) {
3054 	case XFRM_MSG_EXPIRE:
3055 		return key_notify_sa_expire(x, c);
3056 	case XFRM_MSG_DELSA:
3057 	case XFRM_MSG_NEWSA:
3058 	case XFRM_MSG_UPDSA:
3059 		return key_notify_sa(x, c);
3060 	case XFRM_MSG_FLUSHSA:
3061 		return key_notify_sa_flush(c);
3062 	case XFRM_MSG_NEWAE: /* not yet supported */
3063 		break;
3064 	default:
3065 		pr_err("pfkey: Unknown SA event %d\n", c->event);
3066 		break;
3067 	}
3068 
3069 	return 0;
3070 }
3071 
3072 static int pfkey_send_policy_notify(struct xfrm_policy *xp, int dir, const struct km_event *c)
3073 {
3074 	if (xp && xp->type != XFRM_POLICY_TYPE_MAIN)
3075 		return 0;
3076 
3077 	switch (c->event) {
3078 	case XFRM_MSG_POLEXPIRE:
3079 		return key_notify_policy_expire(xp, c);
3080 	case XFRM_MSG_DELPOLICY:
3081 	case XFRM_MSG_NEWPOLICY:
3082 	case XFRM_MSG_UPDPOLICY:
3083 		return key_notify_policy(xp, dir, c);
3084 	case XFRM_MSG_FLUSHPOLICY:
3085 		if (c->data.type != XFRM_POLICY_TYPE_MAIN)
3086 			break;
3087 		return key_notify_policy_flush(c);
3088 	default:
3089 		pr_err("pfkey: Unknown policy event %d\n", c->event);
3090 		break;
3091 	}
3092 
3093 	return 0;
3094 }
3095 
3096 static u32 get_acqseq(void)
3097 {
3098 	u32 res;
3099 	static atomic_t acqseq;
3100 
3101 	do {
3102 		res = atomic_inc_return(&acqseq);
3103 	} while (!res);
3104 	return res;
3105 }
3106 
3107 static bool pfkey_is_alive(const struct km_event *c)
3108 {
3109 	struct netns_pfkey *net_pfkey = net_generic(c->net, pfkey_net_id);
3110 	struct sock *sk;
3111 	bool is_alive = false;
3112 
3113 	rcu_read_lock();
3114 	sk_for_each_rcu(sk, &net_pfkey->table) {
3115 		if (pfkey_sk(sk)->registered) {
3116 			is_alive = true;
3117 			break;
3118 		}
3119 	}
3120 	rcu_read_unlock();
3121 
3122 	return is_alive;
3123 }
3124 
3125 static int pfkey_send_acquire(struct xfrm_state *x, struct xfrm_tmpl *t, struct xfrm_policy *xp)
3126 {
3127 	struct sk_buff *skb;
3128 	struct sadb_msg *hdr;
3129 	struct sadb_address *addr;
3130 	struct sadb_x_policy *pol;
3131 	int sockaddr_size;
3132 	int size;
3133 	struct sadb_x_sec_ctx *sec_ctx;
3134 	struct xfrm_sec_ctx *xfrm_ctx;
3135 	int ctx_size = 0;
3136 
3137 	sockaddr_size = pfkey_sockaddr_size(x->props.family);
3138 	if (!sockaddr_size)
3139 		return -EINVAL;
3140 
3141 	size = sizeof(struct sadb_msg) +
3142 		(sizeof(struct sadb_address) * 2) +
3143 		(sockaddr_size * 2) +
3144 		sizeof(struct sadb_x_policy);
3145 
3146 	if (x->id.proto == IPPROTO_AH)
3147 		size += count_ah_combs(t);
3148 	else if (x->id.proto == IPPROTO_ESP)
3149 		size += count_esp_combs(t);
3150 
3151 	if ((xfrm_ctx = x->security)) {
3152 		ctx_size = PFKEY_ALIGN8(xfrm_ctx->ctx_len);
3153 		size +=  sizeof(struct sadb_x_sec_ctx) + ctx_size;
3154 	}
3155 
3156 	skb =  alloc_skb(size + 16, GFP_ATOMIC);
3157 	if (skb == NULL)
3158 		return -ENOMEM;
3159 
3160 	hdr = (struct sadb_msg *) skb_put(skb, sizeof(struct sadb_msg));
3161 	hdr->sadb_msg_version = PF_KEY_V2;
3162 	hdr->sadb_msg_type = SADB_ACQUIRE;
3163 	hdr->sadb_msg_satype = pfkey_proto2satype(x->id.proto);
3164 	hdr->sadb_msg_len = size / sizeof(uint64_t);
3165 	hdr->sadb_msg_errno = 0;
3166 	hdr->sadb_msg_reserved = 0;
3167 	hdr->sadb_msg_seq = x->km.seq = get_acqseq();
3168 	hdr->sadb_msg_pid = 0;
3169 
3170 	/* src address */
3171 	addr = (struct sadb_address*) skb_put(skb,
3172 					      sizeof(struct sadb_address)+sockaddr_size);
3173 	addr->sadb_address_len =
3174 		(sizeof(struct sadb_address)+sockaddr_size)/
3175 			sizeof(uint64_t);
3176 	addr->sadb_address_exttype = SADB_EXT_ADDRESS_SRC;
3177 	addr->sadb_address_proto = 0;
3178 	addr->sadb_address_reserved = 0;
3179 	addr->sadb_address_prefixlen =
3180 		pfkey_sockaddr_fill(&x->props.saddr, 0,
3181 				    (struct sockaddr *) (addr + 1),
3182 				    x->props.family);
3183 	if (!addr->sadb_address_prefixlen)
3184 		BUG();
3185 
3186 	/* dst address */
3187 	addr = (struct sadb_address*) skb_put(skb,
3188 					      sizeof(struct sadb_address)+sockaddr_size);
3189 	addr->sadb_address_len =
3190 		(sizeof(struct sadb_address)+sockaddr_size)/
3191 			sizeof(uint64_t);
3192 	addr->sadb_address_exttype = SADB_EXT_ADDRESS_DST;
3193 	addr->sadb_address_proto = 0;
3194 	addr->sadb_address_reserved = 0;
3195 	addr->sadb_address_prefixlen =
3196 		pfkey_sockaddr_fill(&x->id.daddr, 0,
3197 				    (struct sockaddr *) (addr + 1),
3198 				    x->props.family);
3199 	if (!addr->sadb_address_prefixlen)
3200 		BUG();
3201 
3202 	pol = (struct sadb_x_policy *)  skb_put(skb, sizeof(struct sadb_x_policy));
3203 	pol->sadb_x_policy_len = sizeof(struct sadb_x_policy)/sizeof(uint64_t);
3204 	pol->sadb_x_policy_exttype = SADB_X_EXT_POLICY;
3205 	pol->sadb_x_policy_type = IPSEC_POLICY_IPSEC;
3206 	pol->sadb_x_policy_dir = XFRM_POLICY_OUT + 1;
3207 	pol->sadb_x_policy_reserved = 0;
3208 	pol->sadb_x_policy_id = xp->index;
3209 	pol->sadb_x_policy_priority = xp->priority;
3210 
3211 	/* Set sadb_comb's. */
3212 	if (x->id.proto == IPPROTO_AH)
3213 		dump_ah_combs(skb, t);
3214 	else if (x->id.proto == IPPROTO_ESP)
3215 		dump_esp_combs(skb, t);
3216 
3217 	/* security context */
3218 	if (xfrm_ctx) {
3219 		sec_ctx = (struct sadb_x_sec_ctx *) skb_put(skb,
3220 				sizeof(struct sadb_x_sec_ctx) + ctx_size);
3221 		sec_ctx->sadb_x_sec_len =
3222 		  (sizeof(struct sadb_x_sec_ctx) + ctx_size) / sizeof(uint64_t);
3223 		sec_ctx->sadb_x_sec_exttype = SADB_X_EXT_SEC_CTX;
3224 		sec_ctx->sadb_x_ctx_doi = xfrm_ctx->ctx_doi;
3225 		sec_ctx->sadb_x_ctx_alg = xfrm_ctx->ctx_alg;
3226 		sec_ctx->sadb_x_ctx_len = xfrm_ctx->ctx_len;
3227 		memcpy(sec_ctx + 1, xfrm_ctx->ctx_str,
3228 		       xfrm_ctx->ctx_len);
3229 	}
3230 
3231 	return pfkey_broadcast(skb, BROADCAST_REGISTERED, NULL, xs_net(x));
3232 }
3233 
3234 static struct xfrm_policy *pfkey_compile_policy(struct sock *sk, int opt,
3235 						u8 *data, int len, int *dir)
3236 {
3237 	struct net *net = sock_net(sk);
3238 	struct xfrm_policy *xp;
3239 	struct sadb_x_policy *pol = (struct sadb_x_policy*)data;
3240 	struct sadb_x_sec_ctx *sec_ctx;
3241 
3242 	switch (sk->sk_family) {
3243 	case AF_INET:
3244 		if (opt != IP_IPSEC_POLICY) {
3245 			*dir = -EOPNOTSUPP;
3246 			return NULL;
3247 		}
3248 		break;
3249 #if IS_ENABLED(CONFIG_IPV6)
3250 	case AF_INET6:
3251 		if (opt != IPV6_IPSEC_POLICY) {
3252 			*dir = -EOPNOTSUPP;
3253 			return NULL;
3254 		}
3255 		break;
3256 #endif
3257 	default:
3258 		*dir = -EINVAL;
3259 		return NULL;
3260 	}
3261 
3262 	*dir = -EINVAL;
3263 
3264 	if (len < sizeof(struct sadb_x_policy) ||
3265 	    pol->sadb_x_policy_len*8 > len ||
3266 	    pol->sadb_x_policy_type > IPSEC_POLICY_BYPASS ||
3267 	    (!pol->sadb_x_policy_dir || pol->sadb_x_policy_dir > IPSEC_DIR_OUTBOUND))
3268 		return NULL;
3269 
3270 	xp = xfrm_policy_alloc(net, GFP_ATOMIC);
3271 	if (xp == NULL) {
3272 		*dir = -ENOBUFS;
3273 		return NULL;
3274 	}
3275 
3276 	xp->action = (pol->sadb_x_policy_type == IPSEC_POLICY_DISCARD ?
3277 		      XFRM_POLICY_BLOCK : XFRM_POLICY_ALLOW);
3278 
3279 	xp->lft.soft_byte_limit = XFRM_INF;
3280 	xp->lft.hard_byte_limit = XFRM_INF;
3281 	xp->lft.soft_packet_limit = XFRM_INF;
3282 	xp->lft.hard_packet_limit = XFRM_INF;
3283 	xp->family = sk->sk_family;
3284 
3285 	xp->xfrm_nr = 0;
3286 	if (pol->sadb_x_policy_type == IPSEC_POLICY_IPSEC &&
3287 	    (*dir = parse_ipsecrequests(xp, pol)) < 0)
3288 		goto out;
3289 
3290 	/* security context too */
3291 	if (len >= (pol->sadb_x_policy_len*8 +
3292 	    sizeof(struct sadb_x_sec_ctx))) {
3293 		char *p = (char *)pol;
3294 		struct xfrm_user_sec_ctx *uctx;
3295 
3296 		p += pol->sadb_x_policy_len*8;
3297 		sec_ctx = (struct sadb_x_sec_ctx *)p;
3298 		if (len < pol->sadb_x_policy_len*8 +
3299 		    sec_ctx->sadb_x_sec_len*8) {
3300 			*dir = -EINVAL;
3301 			goto out;
3302 		}
3303 		if ((*dir = verify_sec_ctx_len(p)))
3304 			goto out;
3305 		uctx = pfkey_sadb2xfrm_user_sec_ctx(sec_ctx, GFP_ATOMIC);
3306 		*dir = security_xfrm_policy_alloc(&xp->security, uctx, GFP_ATOMIC);
3307 		kfree(uctx);
3308 
3309 		if (*dir)
3310 			goto out;
3311 	}
3312 
3313 	*dir = pol->sadb_x_policy_dir-1;
3314 	return xp;
3315 
3316 out:
3317 	xp->walk.dead = 1;
3318 	xfrm_policy_destroy(xp);
3319 	return NULL;
3320 }
3321 
3322 static int pfkey_send_new_mapping(struct xfrm_state *x, xfrm_address_t *ipaddr, __be16 sport)
3323 {
3324 	struct sk_buff *skb;
3325 	struct sadb_msg *hdr;
3326 	struct sadb_sa *sa;
3327 	struct sadb_address *addr;
3328 	struct sadb_x_nat_t_port *n_port;
3329 	int sockaddr_size;
3330 	int size;
3331 	__u8 satype = (x->id.proto == IPPROTO_ESP ? SADB_SATYPE_ESP : 0);
3332 	struct xfrm_encap_tmpl *natt = NULL;
3333 
3334 	sockaddr_size = pfkey_sockaddr_size(x->props.family);
3335 	if (!sockaddr_size)
3336 		return -EINVAL;
3337 
3338 	if (!satype)
3339 		return -EINVAL;
3340 
3341 	if (!x->encap)
3342 		return -EINVAL;
3343 
3344 	natt = x->encap;
3345 
3346 	/* Build an SADB_X_NAT_T_NEW_MAPPING message:
3347 	 *
3348 	 * HDR | SA | ADDRESS_SRC (old addr) | NAT_T_SPORT (old port) |
3349 	 * ADDRESS_DST (new addr) | NAT_T_DPORT (new port)
3350 	 */
3351 
3352 	size = sizeof(struct sadb_msg) +
3353 		sizeof(struct sadb_sa) +
3354 		(sizeof(struct sadb_address) * 2) +
3355 		(sockaddr_size * 2) +
3356 		(sizeof(struct sadb_x_nat_t_port) * 2);
3357 
3358 	skb =  alloc_skb(size + 16, GFP_ATOMIC);
3359 	if (skb == NULL)
3360 		return -ENOMEM;
3361 
3362 	hdr = (struct sadb_msg *) skb_put(skb, sizeof(struct sadb_msg));
3363 	hdr->sadb_msg_version = PF_KEY_V2;
3364 	hdr->sadb_msg_type = SADB_X_NAT_T_NEW_MAPPING;
3365 	hdr->sadb_msg_satype = satype;
3366 	hdr->sadb_msg_len = size / sizeof(uint64_t);
3367 	hdr->sadb_msg_errno = 0;
3368 	hdr->sadb_msg_reserved = 0;
3369 	hdr->sadb_msg_seq = x->km.seq = get_acqseq();
3370 	hdr->sadb_msg_pid = 0;
3371 
3372 	/* SA */
3373 	sa = (struct sadb_sa *) skb_put(skb, sizeof(struct sadb_sa));
3374 	sa->sadb_sa_len = sizeof(struct sadb_sa)/sizeof(uint64_t);
3375 	sa->sadb_sa_exttype = SADB_EXT_SA;
3376 	sa->sadb_sa_spi = x->id.spi;
3377 	sa->sadb_sa_replay = 0;
3378 	sa->sadb_sa_state = 0;
3379 	sa->sadb_sa_auth = 0;
3380 	sa->sadb_sa_encrypt = 0;
3381 	sa->sadb_sa_flags = 0;
3382 
3383 	/* ADDRESS_SRC (old addr) */
3384 	addr = (struct sadb_address*)
3385 		skb_put(skb, sizeof(struct sadb_address)+sockaddr_size);
3386 	addr->sadb_address_len =
3387 		(sizeof(struct sadb_address)+sockaddr_size)/
3388 			sizeof(uint64_t);
3389 	addr->sadb_address_exttype = SADB_EXT_ADDRESS_SRC;
3390 	addr->sadb_address_proto = 0;
3391 	addr->sadb_address_reserved = 0;
3392 	addr->sadb_address_prefixlen =
3393 		pfkey_sockaddr_fill(&x->props.saddr, 0,
3394 				    (struct sockaddr *) (addr + 1),
3395 				    x->props.family);
3396 	if (!addr->sadb_address_prefixlen)
3397 		BUG();
3398 
3399 	/* NAT_T_SPORT (old port) */
3400 	n_port = (struct sadb_x_nat_t_port*) skb_put(skb, sizeof (*n_port));
3401 	n_port->sadb_x_nat_t_port_len = sizeof(*n_port)/sizeof(uint64_t);
3402 	n_port->sadb_x_nat_t_port_exttype = SADB_X_EXT_NAT_T_SPORT;
3403 	n_port->sadb_x_nat_t_port_port = natt->encap_sport;
3404 	n_port->sadb_x_nat_t_port_reserved = 0;
3405 
3406 	/* ADDRESS_DST (new addr) */
3407 	addr = (struct sadb_address*)
3408 		skb_put(skb, sizeof(struct sadb_address)+sockaddr_size);
3409 	addr->sadb_address_len =
3410 		(sizeof(struct sadb_address)+sockaddr_size)/
3411 			sizeof(uint64_t);
3412 	addr->sadb_address_exttype = SADB_EXT_ADDRESS_DST;
3413 	addr->sadb_address_proto = 0;
3414 	addr->sadb_address_reserved = 0;
3415 	addr->sadb_address_prefixlen =
3416 		pfkey_sockaddr_fill(ipaddr, 0,
3417 				    (struct sockaddr *) (addr + 1),
3418 				    x->props.family);
3419 	if (!addr->sadb_address_prefixlen)
3420 		BUG();
3421 
3422 	/* NAT_T_DPORT (new port) */
3423 	n_port = (struct sadb_x_nat_t_port*) skb_put(skb, sizeof (*n_port));
3424 	n_port->sadb_x_nat_t_port_len = sizeof(*n_port)/sizeof(uint64_t);
3425 	n_port->sadb_x_nat_t_port_exttype = SADB_X_EXT_NAT_T_DPORT;
3426 	n_port->sadb_x_nat_t_port_port = sport;
3427 	n_port->sadb_x_nat_t_port_reserved = 0;
3428 
3429 	return pfkey_broadcast(skb, BROADCAST_REGISTERED, NULL, xs_net(x));
3430 }
3431 
3432 #ifdef CONFIG_NET_KEY_MIGRATE
3433 static int set_sadb_address(struct sk_buff *skb, int sasize, int type,
3434 			    const struct xfrm_selector *sel)
3435 {
3436 	struct sadb_address *addr;
3437 	addr = (struct sadb_address *)skb_put(skb, sizeof(struct sadb_address) + sasize);
3438 	addr->sadb_address_len = (sizeof(struct sadb_address) + sasize)/8;
3439 	addr->sadb_address_exttype = type;
3440 	addr->sadb_address_proto = sel->proto;
3441 	addr->sadb_address_reserved = 0;
3442 
3443 	switch (type) {
3444 	case SADB_EXT_ADDRESS_SRC:
3445 		addr->sadb_address_prefixlen = sel->prefixlen_s;
3446 		pfkey_sockaddr_fill(&sel->saddr, 0,
3447 				    (struct sockaddr *)(addr + 1),
3448 				    sel->family);
3449 		break;
3450 	case SADB_EXT_ADDRESS_DST:
3451 		addr->sadb_address_prefixlen = sel->prefixlen_d;
3452 		pfkey_sockaddr_fill(&sel->daddr, 0,
3453 				    (struct sockaddr *)(addr + 1),
3454 				    sel->family);
3455 		break;
3456 	default:
3457 		return -EINVAL;
3458 	}
3459 
3460 	return 0;
3461 }
3462 
3463 
3464 static int set_sadb_kmaddress(struct sk_buff *skb, const struct xfrm_kmaddress *k)
3465 {
3466 	struct sadb_x_kmaddress *kma;
3467 	u8 *sa;
3468 	int family = k->family;
3469 	int socklen = pfkey_sockaddr_len(family);
3470 	int size_req;
3471 
3472 	size_req = (sizeof(struct sadb_x_kmaddress) +
3473 		    pfkey_sockaddr_pair_size(family));
3474 
3475 	kma = (struct sadb_x_kmaddress *)skb_put(skb, size_req);
3476 	memset(kma, 0, size_req);
3477 	kma->sadb_x_kmaddress_len = size_req / 8;
3478 	kma->sadb_x_kmaddress_exttype = SADB_X_EXT_KMADDRESS;
3479 	kma->sadb_x_kmaddress_reserved = k->reserved;
3480 
3481 	sa = (u8 *)(kma + 1);
3482 	if (!pfkey_sockaddr_fill(&k->local, 0, (struct sockaddr *)sa, family) ||
3483 	    !pfkey_sockaddr_fill(&k->remote, 0, (struct sockaddr *)(sa+socklen), family))
3484 		return -EINVAL;
3485 
3486 	return 0;
3487 }
3488 
3489 static int set_ipsecrequest(struct sk_buff *skb,
3490 			    uint8_t proto, uint8_t mode, int level,
3491 			    uint32_t reqid, uint8_t family,
3492 			    const xfrm_address_t *src, const xfrm_address_t *dst)
3493 {
3494 	struct sadb_x_ipsecrequest *rq;
3495 	u8 *sa;
3496 	int socklen = pfkey_sockaddr_len(family);
3497 	int size_req;
3498 
3499 	size_req = sizeof(struct sadb_x_ipsecrequest) +
3500 		   pfkey_sockaddr_pair_size(family);
3501 
3502 	rq = (struct sadb_x_ipsecrequest *)skb_put(skb, size_req);
3503 	memset(rq, 0, size_req);
3504 	rq->sadb_x_ipsecrequest_len = size_req;
3505 	rq->sadb_x_ipsecrequest_proto = proto;
3506 	rq->sadb_x_ipsecrequest_mode = mode;
3507 	rq->sadb_x_ipsecrequest_level = level;
3508 	rq->sadb_x_ipsecrequest_reqid = reqid;
3509 
3510 	sa = (u8 *) (rq + 1);
3511 	if (!pfkey_sockaddr_fill(src, 0, (struct sockaddr *)sa, family) ||
3512 	    !pfkey_sockaddr_fill(dst, 0, (struct sockaddr *)(sa + socklen), family))
3513 		return -EINVAL;
3514 
3515 	return 0;
3516 }
3517 #endif
3518 
3519 #ifdef CONFIG_NET_KEY_MIGRATE
3520 static int pfkey_send_migrate(const struct xfrm_selector *sel, u8 dir, u8 type,
3521 			      const struct xfrm_migrate *m, int num_bundles,
3522 			      const struct xfrm_kmaddress *k)
3523 {
3524 	int i;
3525 	int sasize_sel;
3526 	int size = 0;
3527 	int size_pol = 0;
3528 	struct sk_buff *skb;
3529 	struct sadb_msg *hdr;
3530 	struct sadb_x_policy *pol;
3531 	const struct xfrm_migrate *mp;
3532 
3533 	if (type != XFRM_POLICY_TYPE_MAIN)
3534 		return 0;
3535 
3536 	if (num_bundles <= 0 || num_bundles > XFRM_MAX_DEPTH)
3537 		return -EINVAL;
3538 
3539 	if (k != NULL) {
3540 		/* addresses for KM */
3541 		size += PFKEY_ALIGN8(sizeof(struct sadb_x_kmaddress) +
3542 				     pfkey_sockaddr_pair_size(k->family));
3543 	}
3544 
3545 	/* selector */
3546 	sasize_sel = pfkey_sockaddr_size(sel->family);
3547 	if (!sasize_sel)
3548 		return -EINVAL;
3549 	size += (sizeof(struct sadb_address) + sasize_sel) * 2;
3550 
3551 	/* policy info */
3552 	size_pol += sizeof(struct sadb_x_policy);
3553 
3554 	/* ipsecrequests */
3555 	for (i = 0, mp = m; i < num_bundles; i++, mp++) {
3556 		/* old locator pair */
3557 		size_pol += sizeof(struct sadb_x_ipsecrequest) +
3558 			    pfkey_sockaddr_pair_size(mp->old_family);
3559 		/* new locator pair */
3560 		size_pol += sizeof(struct sadb_x_ipsecrequest) +
3561 			    pfkey_sockaddr_pair_size(mp->new_family);
3562 	}
3563 
3564 	size += sizeof(struct sadb_msg) + size_pol;
3565 
3566 	/* alloc buffer */
3567 	skb = alloc_skb(size, GFP_ATOMIC);
3568 	if (skb == NULL)
3569 		return -ENOMEM;
3570 
3571 	hdr = (struct sadb_msg *)skb_put(skb, sizeof(struct sadb_msg));
3572 	hdr->sadb_msg_version = PF_KEY_V2;
3573 	hdr->sadb_msg_type = SADB_X_MIGRATE;
3574 	hdr->sadb_msg_satype = pfkey_proto2satype(m->proto);
3575 	hdr->sadb_msg_len = size / 8;
3576 	hdr->sadb_msg_errno = 0;
3577 	hdr->sadb_msg_reserved = 0;
3578 	hdr->sadb_msg_seq = 0;
3579 	hdr->sadb_msg_pid = 0;
3580 
3581 	/* Addresses to be used by KM for negotiation, if ext is available */
3582 	if (k != NULL && (set_sadb_kmaddress(skb, k) < 0))
3583 		goto err;
3584 
3585 	/* selector src */
3586 	set_sadb_address(skb, sasize_sel, SADB_EXT_ADDRESS_SRC, sel);
3587 
3588 	/* selector dst */
3589 	set_sadb_address(skb, sasize_sel, SADB_EXT_ADDRESS_DST, sel);
3590 
3591 	/* policy information */
3592 	pol = (struct sadb_x_policy *)skb_put(skb, sizeof(struct sadb_x_policy));
3593 	pol->sadb_x_policy_len = size_pol / 8;
3594 	pol->sadb_x_policy_exttype = SADB_X_EXT_POLICY;
3595 	pol->sadb_x_policy_type = IPSEC_POLICY_IPSEC;
3596 	pol->sadb_x_policy_dir = dir + 1;
3597 	pol->sadb_x_policy_reserved = 0;
3598 	pol->sadb_x_policy_id = 0;
3599 	pol->sadb_x_policy_priority = 0;
3600 
3601 	for (i = 0, mp = m; i < num_bundles; i++, mp++) {
3602 		/* old ipsecrequest */
3603 		int mode = pfkey_mode_from_xfrm(mp->mode);
3604 		if (mode < 0)
3605 			goto err;
3606 		if (set_ipsecrequest(skb, mp->proto, mode,
3607 				     (mp->reqid ?  IPSEC_LEVEL_UNIQUE : IPSEC_LEVEL_REQUIRE),
3608 				     mp->reqid, mp->old_family,
3609 				     &mp->old_saddr, &mp->old_daddr) < 0)
3610 			goto err;
3611 
3612 		/* new ipsecrequest */
3613 		if (set_ipsecrequest(skb, mp->proto, mode,
3614 				     (mp->reqid ? IPSEC_LEVEL_UNIQUE : IPSEC_LEVEL_REQUIRE),
3615 				     mp->reqid, mp->new_family,
3616 				     &mp->new_saddr, &mp->new_daddr) < 0)
3617 			goto err;
3618 	}
3619 
3620 	/* broadcast migrate message to sockets */
3621 	pfkey_broadcast(skb, BROADCAST_ALL, NULL, &init_net);
3622 
3623 	return 0;
3624 
3625 err:
3626 	kfree_skb(skb);
3627 	return -EINVAL;
3628 }
3629 #else
3630 static int pfkey_send_migrate(const struct xfrm_selector *sel, u8 dir, u8 type,
3631 			      const struct xfrm_migrate *m, int num_bundles,
3632 			      const struct xfrm_kmaddress *k)
3633 {
3634 	return -ENOPROTOOPT;
3635 }
3636 #endif
3637 
3638 static int pfkey_sendmsg(struct socket *sock, struct msghdr *msg, size_t len)
3639 {
3640 	struct sock *sk = sock->sk;
3641 	struct sk_buff *skb = NULL;
3642 	struct sadb_msg *hdr = NULL;
3643 	int err;
3644 	struct net *net = sock_net(sk);
3645 
3646 	err = -EOPNOTSUPP;
3647 	if (msg->msg_flags & MSG_OOB)
3648 		goto out;
3649 
3650 	err = -EMSGSIZE;
3651 	if ((unsigned int)len > sk->sk_sndbuf - 32)
3652 		goto out;
3653 
3654 	err = -ENOBUFS;
3655 	skb = alloc_skb(len, GFP_KERNEL);
3656 	if (skb == NULL)
3657 		goto out;
3658 
3659 	err = -EFAULT;
3660 	if (memcpy_from_msg(skb_put(skb,len), msg, len))
3661 		goto out;
3662 
3663 	hdr = pfkey_get_base_msg(skb, &err);
3664 	if (!hdr)
3665 		goto out;
3666 
3667 	mutex_lock(&net->xfrm.xfrm_cfg_mutex);
3668 	err = pfkey_process(sk, skb, hdr);
3669 	mutex_unlock(&net->xfrm.xfrm_cfg_mutex);
3670 
3671 out:
3672 	if (err && hdr && pfkey_error(hdr, err, sk) == 0)
3673 		err = 0;
3674 	kfree_skb(skb);
3675 
3676 	return err ? : len;
3677 }
3678 
3679 static int pfkey_recvmsg(struct socket *sock, struct msghdr *msg, size_t len,
3680 			 int flags)
3681 {
3682 	struct sock *sk = sock->sk;
3683 	struct pfkey_sock *pfk = pfkey_sk(sk);
3684 	struct sk_buff *skb;
3685 	int copied, err;
3686 
3687 	err = -EINVAL;
3688 	if (flags & ~(MSG_PEEK|MSG_DONTWAIT|MSG_TRUNC|MSG_CMSG_COMPAT))
3689 		goto out;
3690 
3691 	skb = skb_recv_datagram(sk, flags, flags & MSG_DONTWAIT, &err);
3692 	if (skb == NULL)
3693 		goto out;
3694 
3695 	copied = skb->len;
3696 	if (copied > len) {
3697 		msg->msg_flags |= MSG_TRUNC;
3698 		copied = len;
3699 	}
3700 
3701 	skb_reset_transport_header(skb);
3702 	err = skb_copy_datagram_msg(skb, 0, msg, copied);
3703 	if (err)
3704 		goto out_free;
3705 
3706 	sock_recv_ts_and_drops(msg, sk, skb);
3707 
3708 	err = (flags & MSG_TRUNC) ? skb->len : copied;
3709 
3710 	if (pfk->dump.dump != NULL &&
3711 	    3 * atomic_read(&sk->sk_rmem_alloc) <= sk->sk_rcvbuf)
3712 		pfkey_do_dump(pfk);
3713 
3714 out_free:
3715 	skb_free_datagram(sk, skb);
3716 out:
3717 	return err;
3718 }
3719 
3720 static const struct proto_ops pfkey_ops = {
3721 	.family		=	PF_KEY,
3722 	.owner		=	THIS_MODULE,
3723 	/* Operations that make no sense on pfkey sockets. */
3724 	.bind		=	sock_no_bind,
3725 	.connect	=	sock_no_connect,
3726 	.socketpair	=	sock_no_socketpair,
3727 	.accept		=	sock_no_accept,
3728 	.getname	=	sock_no_getname,
3729 	.ioctl		=	sock_no_ioctl,
3730 	.listen		=	sock_no_listen,
3731 	.shutdown	=	sock_no_shutdown,
3732 	.setsockopt	=	sock_no_setsockopt,
3733 	.getsockopt	=	sock_no_getsockopt,
3734 	.mmap		=	sock_no_mmap,
3735 	.sendpage	=	sock_no_sendpage,
3736 
3737 	/* Now the operations that really occur. */
3738 	.release	=	pfkey_release,
3739 	.poll		=	datagram_poll,
3740 	.sendmsg	=	pfkey_sendmsg,
3741 	.recvmsg	=	pfkey_recvmsg,
3742 };
3743 
3744 static const struct net_proto_family pfkey_family_ops = {
3745 	.family	=	PF_KEY,
3746 	.create	=	pfkey_create,
3747 	.owner	=	THIS_MODULE,
3748 };
3749 
3750 #ifdef CONFIG_PROC_FS
3751 static int pfkey_seq_show(struct seq_file *f, void *v)
3752 {
3753 	struct sock *s = sk_entry(v);
3754 
3755 	if (v == SEQ_START_TOKEN)
3756 		seq_printf(f ,"sk       RefCnt Rmem   Wmem   User   Inode\n");
3757 	else
3758 		seq_printf(f, "%pK %-6d %-6u %-6u %-6u %-6lu\n",
3759 			       s,
3760 			       atomic_read(&s->sk_refcnt),
3761 			       sk_rmem_alloc_get(s),
3762 			       sk_wmem_alloc_get(s),
3763 			       from_kuid_munged(seq_user_ns(f), sock_i_uid(s)),
3764 			       sock_i_ino(s)
3765 			       );
3766 	return 0;
3767 }
3768 
3769 static void *pfkey_seq_start(struct seq_file *f, loff_t *ppos)
3770 	__acquires(rcu)
3771 {
3772 	struct net *net = seq_file_net(f);
3773 	struct netns_pfkey *net_pfkey = net_generic(net, pfkey_net_id);
3774 
3775 	rcu_read_lock();
3776 	return seq_hlist_start_head_rcu(&net_pfkey->table, *ppos);
3777 }
3778 
3779 static void *pfkey_seq_next(struct seq_file *f, void *v, loff_t *ppos)
3780 {
3781 	struct net *net = seq_file_net(f);
3782 	struct netns_pfkey *net_pfkey = net_generic(net, pfkey_net_id);
3783 
3784 	return seq_hlist_next_rcu(v, &net_pfkey->table, ppos);
3785 }
3786 
3787 static void pfkey_seq_stop(struct seq_file *f, void *v)
3788 	__releases(rcu)
3789 {
3790 	rcu_read_unlock();
3791 }
3792 
3793 static const struct seq_operations pfkey_seq_ops = {
3794 	.start	= pfkey_seq_start,
3795 	.next	= pfkey_seq_next,
3796 	.stop	= pfkey_seq_stop,
3797 	.show	= pfkey_seq_show,
3798 };
3799 
3800 static int pfkey_seq_open(struct inode *inode, struct file *file)
3801 {
3802 	return seq_open_net(inode, file, &pfkey_seq_ops,
3803 			    sizeof(struct seq_net_private));
3804 }
3805 
3806 static const struct file_operations pfkey_proc_ops = {
3807 	.open	 = pfkey_seq_open,
3808 	.read	 = seq_read,
3809 	.llseek	 = seq_lseek,
3810 	.release = seq_release_net,
3811 };
3812 
3813 static int __net_init pfkey_init_proc(struct net *net)
3814 {
3815 	struct proc_dir_entry *e;
3816 
3817 	e = proc_create("pfkey", 0, net->proc_net, &pfkey_proc_ops);
3818 	if (e == NULL)
3819 		return -ENOMEM;
3820 
3821 	return 0;
3822 }
3823 
3824 static void __net_exit pfkey_exit_proc(struct net *net)
3825 {
3826 	remove_proc_entry("pfkey", net->proc_net);
3827 }
3828 #else
3829 static inline int pfkey_init_proc(struct net *net)
3830 {
3831 	return 0;
3832 }
3833 
3834 static inline void pfkey_exit_proc(struct net *net)
3835 {
3836 }
3837 #endif
3838 
3839 static struct xfrm_mgr pfkeyv2_mgr =
3840 {
3841 	.notify		= pfkey_send_notify,
3842 	.acquire	= pfkey_send_acquire,
3843 	.compile_policy	= pfkey_compile_policy,
3844 	.new_mapping	= pfkey_send_new_mapping,
3845 	.notify_policy	= pfkey_send_policy_notify,
3846 	.migrate	= pfkey_send_migrate,
3847 	.is_alive	= pfkey_is_alive,
3848 };
3849 
3850 static int __net_init pfkey_net_init(struct net *net)
3851 {
3852 	struct netns_pfkey *net_pfkey = net_generic(net, pfkey_net_id);
3853 	int rv;
3854 
3855 	INIT_HLIST_HEAD(&net_pfkey->table);
3856 	atomic_set(&net_pfkey->socks_nr, 0);
3857 
3858 	rv = pfkey_init_proc(net);
3859 
3860 	return rv;
3861 }
3862 
3863 static void __net_exit pfkey_net_exit(struct net *net)
3864 {
3865 	struct netns_pfkey *net_pfkey = net_generic(net, pfkey_net_id);
3866 
3867 	pfkey_exit_proc(net);
3868 	BUG_ON(!hlist_empty(&net_pfkey->table));
3869 }
3870 
3871 static struct pernet_operations pfkey_net_ops = {
3872 	.init = pfkey_net_init,
3873 	.exit = pfkey_net_exit,
3874 	.id   = &pfkey_net_id,
3875 	.size = sizeof(struct netns_pfkey),
3876 };
3877 
3878 static void __exit ipsec_pfkey_exit(void)
3879 {
3880 	xfrm_unregister_km(&pfkeyv2_mgr);
3881 	sock_unregister(PF_KEY);
3882 	unregister_pernet_subsys(&pfkey_net_ops);
3883 	proto_unregister(&key_proto);
3884 }
3885 
3886 static int __init ipsec_pfkey_init(void)
3887 {
3888 	int err = proto_register(&key_proto, 0);
3889 
3890 	if (err != 0)
3891 		goto out;
3892 
3893 	err = register_pernet_subsys(&pfkey_net_ops);
3894 	if (err != 0)
3895 		goto out_unregister_key_proto;
3896 	err = sock_register(&pfkey_family_ops);
3897 	if (err != 0)
3898 		goto out_unregister_pernet;
3899 	err = xfrm_register_km(&pfkeyv2_mgr);
3900 	if (err != 0)
3901 		goto out_sock_unregister;
3902 out:
3903 	return err;
3904 
3905 out_sock_unregister:
3906 	sock_unregister(PF_KEY);
3907 out_unregister_pernet:
3908 	unregister_pernet_subsys(&pfkey_net_ops);
3909 out_unregister_key_proto:
3910 	proto_unregister(&key_proto);
3911 	goto out;
3912 }
3913 
3914 module_init(ipsec_pfkey_init);
3915 module_exit(ipsec_pfkey_exit);
3916 MODULE_LICENSE("GPL");
3917 MODULE_ALIAS_NETPROTO(PF_KEY);
3918