1 // SPDX-License-Identifier: GPL-2.0-or-later
2 /*
3 * INET An implementation of the TCP/IP protocol suite for the LINUX
4 * operating system. INET is implemented using the BSD Socket
5 * interface as the means of communication with the user level.
6 *
7 * Routing netlink socket interface: protocol independent part.
8 *
9 * Authors: Alexey Kuznetsov, <kuznet@ms2.inr.ac.ru>
10 *
11 * Fixes:
12 * Vitaly E. Lavrov RTA_OK arithmetic was wrong.
13 */
14
15 #include <linux/bitops.h>
16 #include <linux/errno.h>
17 #include <linux/module.h>
18 #include <linux/types.h>
19 #include <linux/socket.h>
20 #include <linux/kernel.h>
21 #include <linux/timer.h>
22 #include <linux/string.h>
23 #include <linux/sockios.h>
24 #include <linux/net.h>
25 #include <linux/fcntl.h>
26 #include <linux/mm.h>
27 #include <linux/slab.h>
28 #include <linux/interrupt.h>
29 #include <linux/capability.h>
30 #include <linux/skbuff.h>
31 #include <linux/init.h>
32 #include <linux/security.h>
33 #include <linux/mutex.h>
34 #include <linux/if_addr.h>
35 #include <linux/if_bridge.h>
36 #include <linux/if_vlan.h>
37 #include <linux/pci.h>
38 #include <linux/etherdevice.h>
39 #include <linux/bpf.h>
40
41 #include <linux/uaccess.h>
42
43 #include <linux/inet.h>
44 #include <linux/netdevice.h>
45 #include <net/ip.h>
46 #include <net/protocol.h>
47 #include <net/arp.h>
48 #include <net/route.h>
49 #include <net/udp.h>
50 #include <net/tcp.h>
51 #include <net/sock.h>
52 #include <net/pkt_sched.h>
53 #include <net/fib_rules.h>
54 #include <net/rtnetlink.h>
55 #include <net/net_namespace.h>
56 #include <net/devlink.h>
57 #if IS_ENABLED(CONFIG_IPV6)
58 #include <net/addrconf.h>
59 #endif
60 #include <linux/dpll.h>
61
62 #include "dev.h"
63
/* Largest ->maxtype and ->slave_maxtype values that rtnl_link_register()
 * accepts from a struct rtnl_link_ops.
 */
#define RTNL_MAX_TYPE 50
#define RTNL_SLAVE_MAX_TYPE 44
66
/* One handler entry stored in rtnl_msg_handlers[protocol][msgindex]. */
struct rtnl_link {
	/* callbacks supplied to rtnl_register_internal() */
	rtnl_doit_func doit;
	rtnl_dumpit_func dumpit;
	/* module passed as owner at registration */
	struct module *owner;
	/* OR of the flags passed at registration */
	unsigned int flags;
	/* lets the entry be released with kfree_rcu() */
	struct rcu_head rcu;
};
74
/* The mutex behind rtnl_lock(), rtnl_trylock(), __rtnl_unlock() and friends. */
static DEFINE_MUTEX(rtnl_mutex);
76
/* Acquire rtnl_mutex with mutex_lock(). */
void rtnl_lock(void)
{
	mutex_lock(&rtnl_mutex);
}
EXPORT_SYMBOL(rtnl_lock);
82
rtnl_lock_killable(void)83 int rtnl_lock_killable(void)
84 {
85 return mutex_lock_killable(&rtnl_mutex);
86 }
87
/* Singly linked (via ->next) list of skbs queued by rtnl_kfree_skbs();
 * __rtnl_unlock() detaches it and frees the skbs after dropping rtnl_mutex.
 */
static struct sk_buff *defer_kfree_skb_list;
rtnl_kfree_skbs(struct sk_buff * head,struct sk_buff * tail)89 void rtnl_kfree_skbs(struct sk_buff *head, struct sk_buff *tail)
90 {
91 if (head && tail) {
92 tail->next = defer_kfree_skb_list;
93 defer_kfree_skb_list = head;
94 }
95 }
96 EXPORT_SYMBOL(rtnl_kfree_skbs);
97
__rtnl_unlock(void)98 void __rtnl_unlock(void)
99 {
100 struct sk_buff *head = defer_kfree_skb_list;
101
102 defer_kfree_skb_list = NULL;
103
104 /* Ensure that we didn't actually add any TODO item when __rtnl_unlock()
105 * is used. In some places, e.g. in cfg80211, we have code that will do
106 * something like
107 * rtnl_lock()
108 * wiphy_lock()
109 * ...
110 * rtnl_unlock()
111 *
112 * and because netdev_run_todo() acquires the RTNL for items on the list
113 * we could cause a situation such as this:
114 * Thread 1 Thread 2
115 * rtnl_lock()
116 * unregister_netdevice()
117 * __rtnl_unlock()
118 * rtnl_lock()
119 * wiphy_lock()
120 * rtnl_unlock()
121 * netdev_run_todo()
122 * __rtnl_unlock()
123 *
124 * // list not empty now
125 * // because of thread 2
126 * rtnl_lock()
127 * while (!list_empty(...))
128 * rtnl_lock()
129 * wiphy_lock()
130 * **** DEADLOCK ****
131 *
132 * However, usage of __rtnl_unlock() is rare, and so we can ensure that
133 * it's not used in cases where something is added to do the list.
134 */
135 WARN_ON(!list_empty(&net_todo_list));
136
137 mutex_unlock(&rtnl_mutex);
138
139 while (head) {
140 struct sk_buff *next = head->next;
141
142 kfree_skb(head);
143 cond_resched();
144 head = next;
145 }
146 }
147
/* Release the RTNL by delegating to netdev_run_todo(), which performs the
 * actual unlock.
 */
void rtnl_unlock(void)
{
	/* This fellow will unlock it for us. */
	netdev_run_todo();
}
EXPORT_SYMBOL(rtnl_unlock);
154
rtnl_trylock(void)155 int rtnl_trylock(void)
156 {
157 return mutex_trylock(&rtnl_mutex);
158 }
159 EXPORT_SYMBOL(rtnl_trylock);
160
rtnl_is_locked(void)161 int rtnl_is_locked(void)
162 {
163 return mutex_is_locked(&rtnl_mutex);
164 }
165 EXPORT_SYMBOL(rtnl_is_locked);
166
refcount_dec_and_rtnl_lock(refcount_t * r)167 bool refcount_dec_and_rtnl_lock(refcount_t *r)
168 {
169 return refcount_dec_and_mutex_lock(r, &rtnl_mutex);
170 }
171 EXPORT_SYMBOL(refcount_dec_and_rtnl_lock);
172
173 #ifdef CONFIG_PROVE_LOCKING
lockdep_rtnl_is_held(void)174 bool lockdep_rtnl_is_held(void)
175 {
176 return lockdep_is_held(&rtnl_mutex);
177 }
178 EXPORT_SYMBOL(lockdep_rtnl_is_held);
179 #endif /* #ifdef CONFIG_PROVE_LOCKING */
180
181 #ifdef CONFIG_DEBUG_NET_SMALL_RTNL
/* Take @net's own rtnl_mutex; ASSERT_RTNL() checks the RTNL first. */
void __rtnl_net_lock(struct net *net)
{
	ASSERT_RTNL();

	mutex_lock(&net->rtnl_mutex);
}
EXPORT_SYMBOL(__rtnl_net_lock);
189
/* Release @net's own rtnl_mutex; ASSERT_RTNL() checks the RTNL first. */
void __rtnl_net_unlock(struct net *net)
{
	ASSERT_RTNL();

	mutex_unlock(&net->rtnl_mutex);
}
EXPORT_SYMBOL(__rtnl_net_unlock);
197
/* Take the global RTNL first, then @net's rtnl_mutex. */
void rtnl_net_lock(struct net *net)
{
	rtnl_lock();
	__rtnl_net_lock(net);
}
EXPORT_SYMBOL(rtnl_net_lock);
204
/* Undo rtnl_net_lock(): drop @net's rtnl_mutex, then the global RTNL. */
void rtnl_net_unlock(struct net *net)
{
	__rtnl_net_unlock(net);
	rtnl_unlock();
}
EXPORT_SYMBOL(rtnl_net_unlock);
211
/* Try to take the global RTNL without blocking; on success also take @net's
 * rtnl_mutex. Returns rtnl_trylock()'s result.
 */
int rtnl_net_trylock(struct net *net)
{
	int acquired = rtnl_trylock();

	if (!acquired)
		return acquired;

	__rtnl_net_lock(net);
	return acquired;
}
EXPORT_SYMBOL(rtnl_net_trylock);
222
/* Killable variant of rtnl_net_lock(): @net's rtnl_mutex is taken only when
 * rtnl_lock_killable() succeeded. Returns rtnl_lock_killable()'s result.
 */
int rtnl_net_lock_killable(struct net *net)
{
	int err = rtnl_lock_killable();

	if (err)
		return err;

	__rtnl_net_lock(net);
	return 0;
}
232
rtnl_net_cmp_locks(const struct net * net_a,const struct net * net_b)233 static int rtnl_net_cmp_locks(const struct net *net_a, const struct net *net_b)
234 {
235 if (net_eq(net_a, net_b))
236 return 0;
237
238 /* always init_net first */
239 if (net_eq(net_a, &init_net))
240 return -1;
241
242 if (net_eq(net_b, &init_net))
243 return 1;
244
245 /* otherwise lock in ascending order */
246 return net_a < net_b ? -1 : 1;
247 }
248
rtnl_net_lock_cmp_fn(const struct lockdep_map * a,const struct lockdep_map * b)249 int rtnl_net_lock_cmp_fn(const struct lockdep_map *a, const struct lockdep_map *b)
250 {
251 const struct net *net_a, *net_b;
252
253 net_a = container_of(a, struct net, rtnl_mutex.dep_map);
254 net_b = container_of(b, struct net, rtnl_mutex.dep_map);
255
256 return rtnl_net_cmp_locks(net_a, net_b);
257 }
258
rtnl_net_is_locked(struct net * net)259 bool rtnl_net_is_locked(struct net *net)
260 {
261 return rtnl_is_locked() && mutex_is_locked(&net->rtnl_mutex);
262 }
263 EXPORT_SYMBOL(rtnl_net_is_locked);
264
lockdep_rtnl_net_is_held(struct net * net)265 bool lockdep_rtnl_net_is_held(struct net *net)
266 {
267 return lockdep_rtnl_is_held() && lockdep_is_held(&net->rtnl_mutex);
268 }
269 EXPORT_SYMBOL(lockdep_rtnl_net_is_held);
270 #else
/* Variant used when CONFIG_DEBUG_NET_SMALL_RTNL is off: always reports -1,
 * so rtnl_nets_add() never swaps or de-duplicates entries.
 */
static int rtnl_net_cmp_locks(const struct net *net_a, const struct net *net_b)
{
	/* No need to swap */
	return -1;
}
276 #endif
277
/* Small set of netns that rtnl_nets_lock()/rtnl_nets_unlock() handle together. */
struct rtnl_nets {
	/* ->newlink() needs to freeze 3 netns at most;
	 * 2 for the new device, 1 for its peer.
	 */
	struct net *net[3];
	/* number of valid entries in net[] */
	unsigned char len;
};
285
/* Reset @rtnl_nets to the empty set by zeroing the whole structure. */
static void rtnl_nets_init(struct rtnl_nets *rtnl_nets)
{
	memset(rtnl_nets, 0, sizeof(*rtnl_nets));
}
290
rtnl_nets_destroy(struct rtnl_nets * rtnl_nets)291 static void rtnl_nets_destroy(struct rtnl_nets *rtnl_nets)
292 {
293 int i;
294
295 for (i = 0; i < rtnl_nets->len; i++) {
296 put_net(rtnl_nets->net[i]);
297 rtnl_nets->net[i] = NULL;
298 }
299
300 rtnl_nets->len = 0;
301 }
302
303 /**
304 * rtnl_nets_add - Add netns to be locked before ->newlink().
305 *
306 * @rtnl_nets: rtnl_nets pointer passed to ->get_peer_net().
307 * @net: netns pointer with an extra refcnt held.
308 *
309 * The extra refcnt is released in rtnl_nets_destroy().
310 */
rtnl_nets_add(struct rtnl_nets * rtnl_nets,struct net * net)311 static void rtnl_nets_add(struct rtnl_nets *rtnl_nets, struct net *net)
312 {
313 int i;
314
315 DEBUG_NET_WARN_ON_ONCE(rtnl_nets->len == ARRAY_SIZE(rtnl_nets->net));
316
317 for (i = 0; i < rtnl_nets->len; i++) {
318 switch (rtnl_net_cmp_locks(rtnl_nets->net[i], net)) {
319 case 0:
320 put_net(net);
321 return;
322 case 1:
323 swap(rtnl_nets->net[i], net);
324 }
325 }
326
327 rtnl_nets->net[i] = net;
328 rtnl_nets->len++;
329 }
330
rtnl_nets_lock(struct rtnl_nets * rtnl_nets)331 static void rtnl_nets_lock(struct rtnl_nets *rtnl_nets)
332 {
333 int i;
334
335 rtnl_lock();
336
337 for (i = 0; i < rtnl_nets->len; i++)
338 __rtnl_net_lock(rtnl_nets->net[i]);
339 }
340
rtnl_nets_unlock(struct rtnl_nets * rtnl_nets)341 static void rtnl_nets_unlock(struct rtnl_nets *rtnl_nets)
342 {
343 int i;
344
345 for (i = 0; i < rtnl_nets->len; i++)
346 __rtnl_net_unlock(rtnl_nets->net[i]);
347
348 rtnl_unlock();
349 }
350
/* Per-protocol-family handler tables. Each non-NULL slot points to an array
 * of RTM_NR_MSGTYPES rtnl_link pointers indexed by rtm_msgindex().
 */
static struct rtnl_link __rcu *__rcu *rtnl_msg_handlers[RTNL_FAMILY_MAX + 1];
352
rtm_msgindex(int msgtype)353 static inline int rtm_msgindex(int msgtype)
354 {
355 int msgindex = msgtype - RTM_BASE;
356
357 /*
358 * msgindex < 0 implies someone tried to register a netlink
359 * control code. msgindex >= RTM_NR_MSGTYPES may indicate that
360 * the message type has not been added to linux/rtnetlink.h
361 */
362 BUG_ON(msgindex < 0 || msgindex >= RTM_NR_MSGTYPES);
363
364 return msgindex;
365 }
366
rtnl_get_link(int protocol,int msgtype)367 static struct rtnl_link *rtnl_get_link(int protocol, int msgtype)
368 {
369 struct rtnl_link __rcu **tab;
370
371 if (protocol >= ARRAY_SIZE(rtnl_msg_handlers))
372 protocol = PF_UNSPEC;
373
374 tab = rcu_dereference_rtnl(rtnl_msg_handlers[protocol]);
375 if (!tab)
376 tab = rcu_dereference_rtnl(rtnl_msg_handlers[PF_UNSPEC]);
377
378 return rcu_dereference_rtnl(tab[msgtype]);
379 }
380
/* Install or extend the handler entry for @protocol:@msgtype.
 *
 * The family table is allocated on first use. An existing entry is never
 * modified in place: a copy is updated, published with rcu_assign_pointer()
 * and the old entry is released with kfree_rcu().
 *
 * Returns 0 on success or -ENOBUFS when an allocation fails.
 */
static int rtnl_register_internal(struct module *owner,
				  int protocol, int msgtype,
				  rtnl_doit_func doit, rtnl_dumpit_func dumpit,
				  unsigned int flags)
{
	struct rtnl_link __rcu **tab;
	struct rtnl_link *prev, *entry;
	int err = -ENOBUFS;
	int msgindex;

	BUG_ON(protocol < 0 || protocol > RTNL_FAMILY_MAX);
	msgindex = rtm_msgindex(msgtype);

	rtnl_lock();

	tab = rtnl_dereference(rtnl_msg_handlers[protocol]);
	if (!tab) {
		tab = kcalloc(RTM_NR_MSGTYPES, sizeof(void *), GFP_KERNEL);
		if (!tab)
			goto out_unlock;

		/* ensures we see the 0 stores */
		rcu_assign_pointer(rtnl_msg_handlers[protocol], tab);
	}

	/* Start from a copy of the current entry, or from a zeroed one. */
	prev = rtnl_dereference(tab[msgindex]);
	if (prev)
		entry = kmemdup(prev, sizeof(*prev), GFP_KERNEL);
	else
		entry = kzalloc(sizeof(*entry), GFP_KERNEL);
	if (!entry)
		goto out_unlock;

	WARN_ON(entry->owner && entry->owner != owner);
	entry->owner = owner;

	/* A callback that is already set may only be re-registered as itself. */
	WARN_ON(doit && entry->doit && entry->doit != doit);
	if (doit)
		entry->doit = doit;

	WARN_ON(dumpit && entry->dumpit && entry->dumpit != dumpit);
	if (dumpit)
		entry->dumpit = dumpit;

	WARN_ON(rtnl_msgtype_kind(msgtype) != RTNL_KIND_DEL &&
		(flags & RTNL_FLAG_BULK_DEL_SUPPORTED));
	entry->flags |= flags;

	/* publish protocol:msgtype */
	rcu_assign_pointer(tab[msgindex], entry);
	err = 0;
	if (prev)
		kfree_rcu(prev, rcu);

out_unlock:
	rtnl_unlock();
	return err;
}
439
440 /**
441 * rtnl_unregister - Unregister a rtnetlink message type
442 * @protocol: Protocol family or PF_UNSPEC
443 * @msgtype: rtnetlink message type
444 *
445 * Returns 0 on success or a negative error code.
446 */
rtnl_unregister(int protocol,int msgtype)447 static int rtnl_unregister(int protocol, int msgtype)
448 {
449 struct rtnl_link __rcu **tab;
450 struct rtnl_link *link;
451 int msgindex;
452
453 BUG_ON(protocol < 0 || protocol > RTNL_FAMILY_MAX);
454 msgindex = rtm_msgindex(msgtype);
455
456 rtnl_lock();
457 tab = rtnl_dereference(rtnl_msg_handlers[protocol]);
458 if (!tab) {
459 rtnl_unlock();
460 return -ENOENT;
461 }
462
463 link = rcu_replace_pointer_rtnl(tab[msgindex], NULL);
464 rtnl_unlock();
465
466 kfree_rcu(link, rcu);
467
468 return 0;
469 }
470
471 /**
472 * rtnl_unregister_all - Unregister all rtnetlink message type of a protocol
473 * @protocol : Protocol family or PF_UNSPEC
474 *
475 * Identical to calling rtnl_unregster() for all registered message types
476 * of a certain protocol family.
477 */
rtnl_unregister_all(int protocol)478 void rtnl_unregister_all(int protocol)
479 {
480 struct rtnl_link __rcu **tab;
481 struct rtnl_link *link;
482 int msgindex;
483
484 BUG_ON(protocol < 0 || protocol > RTNL_FAMILY_MAX);
485
486 rtnl_lock();
487 tab = rcu_replace_pointer_rtnl(rtnl_msg_handlers[protocol], NULL);
488 if (!tab) {
489 rtnl_unlock();
490 return;
491 }
492 for (msgindex = 0; msgindex < RTM_NR_MSGTYPES; msgindex++) {
493 link = rcu_replace_pointer_rtnl(tab[msgindex], NULL);
494 kfree_rcu(link, rcu);
495 }
496 rtnl_unlock();
497
498 synchronize_net();
499
500 kfree(tab);
501 }
502 EXPORT_SYMBOL_GPL(rtnl_unregister_all);
503
504 /**
505 * __rtnl_register_many - Register rtnetlink message types
506 * @handlers: Array of struct rtnl_msg_handlers
507 * @n: The length of @handlers
508 *
509 * Registers the specified function pointers (at least one of them has
510 * to be non-NULL) to be called whenever a request message for the
511 * specified protocol family and message type is received.
512 *
513 * The special protocol family PF_UNSPEC may be used to define fallback
514 * function pointers for the case when no entry for the specific protocol
515 * family exists.
516 *
517 * When one element of @handlers fails to register,
518 * 1) built-in: panics.
519 * 2) modules : the previous successful registrations are unwinded
520 * and an error is returned.
521 *
522 * Use rtnl_register_many().
523 */
__rtnl_register_many(const struct rtnl_msg_handler * handlers,int n)524 int __rtnl_register_many(const struct rtnl_msg_handler *handlers, int n)
525 {
526 const struct rtnl_msg_handler *handler;
527 int i, err;
528
529 for (i = 0, handler = handlers; i < n; i++, handler++) {
530 err = rtnl_register_internal(handler->owner, handler->protocol,
531 handler->msgtype, handler->doit,
532 handler->dumpit, handler->flags);
533 if (err) {
534 if (!handler->owner)
535 panic("Unable to register rtnetlink message "
536 "handlers, %pS\n", handlers);
537
538 __rtnl_unregister_many(handlers, i);
539 break;
540 }
541 }
542
543 return err;
544 }
545 EXPORT_SYMBOL_GPL(__rtnl_register_many);
546
__rtnl_unregister_many(const struct rtnl_msg_handler * handlers,int n)547 void __rtnl_unregister_many(const struct rtnl_msg_handler *handlers, int n)
548 {
549 const struct rtnl_msg_handler *handler;
550 int i;
551
552 for (i = n - 1, handler = handlers + n - 1; i >= 0; i--, handler--)
553 rtnl_unregister(handler->protocol, handler->msgtype);
554 }
555 EXPORT_SYMBOL_GPL(__rtnl_unregister_many);
556
/* Registered rtnl_link_ops. Writers hold link_ops_mutex; rtnl_link_ops_get()
 * walks the list under rcu_read_lock().
 */
static DEFINE_MUTEX(link_ops_mutex);
static LIST_HEAD(link_ops);
559
rtnl_link_ops_get(const char * kind,int * srcu_index)560 static struct rtnl_link_ops *rtnl_link_ops_get(const char *kind, int *srcu_index)
561 {
562 struct rtnl_link_ops *ops;
563
564 rcu_read_lock();
565
566 list_for_each_entry_rcu(ops, &link_ops, list) {
567 if (!strcmp(ops->kind, kind)) {
568 *srcu_index = srcu_read_lock(&ops->srcu);
569 goto unlock;
570 }
571 }
572
573 ops = NULL;
574 unlock:
575 rcu_read_unlock();
576
577 return ops;
578 }
579
/* End the SRCU read-side section on @ops->srcu that rtnl_link_ops_get()
 * started; @srcu_index is the index it handed back.
 */
static void rtnl_link_ops_put(struct rtnl_link_ops *ops, int srcu_index)
{
	srcu_read_unlock(&ops->srcu, srcu_index);
}
584
585 /**
586 * rtnl_link_register - Register rtnl_link_ops with rtnetlink.
587 * @ops: struct rtnl_link_ops * to register
588 *
589 * Returns 0 on success or a negative error code.
590 */
rtnl_link_register(struct rtnl_link_ops * ops)591 int rtnl_link_register(struct rtnl_link_ops *ops)
592 {
593 struct rtnl_link_ops *tmp;
594 int err;
595
596 /* Sanity-check max sizes to avoid stack buffer overflow. */
597 if (WARN_ON(ops->maxtype > RTNL_MAX_TYPE ||
598 ops->slave_maxtype > RTNL_SLAVE_MAX_TYPE))
599 return -EINVAL;
600
601 /* The check for alloc/setup is here because if ops
602 * does not have that filled up, it is not possible
603 * to use the ops for creating device. So do not
604 * fill up dellink as well. That disables rtnl_dellink.
605 */
606 if ((ops->alloc || ops->setup) && !ops->dellink)
607 ops->dellink = unregister_netdevice_queue;
608
609 err = init_srcu_struct(&ops->srcu);
610 if (err)
611 return err;
612
613 mutex_lock(&link_ops_mutex);
614
615 list_for_each_entry(tmp, &link_ops, list) {
616 if (!strcmp(ops->kind, tmp->kind)) {
617 err = -EEXIST;
618 goto unlock;
619 }
620 }
621
622 list_add_tail_rcu(&ops->list, &link_ops);
623 unlock:
624 mutex_unlock(&link_ops_mutex);
625
626 return err;
627 }
628 EXPORT_SYMBOL_GPL(rtnl_link_register);
629
__rtnl_kill_links(struct net * net,struct rtnl_link_ops * ops)630 static void __rtnl_kill_links(struct net *net, struct rtnl_link_ops *ops)
631 {
632 struct net_device *dev;
633 LIST_HEAD(list_kill);
634
635 for_each_netdev(net, dev) {
636 if (dev->rtnl_link_ops == ops)
637 ops->dellink(dev, &list_kill);
638 }
639 unregister_netdevice_many(&list_kill);
640 }
641
642 /* Return with the rtnl_lock held when there are no network
643 * devices unregistering in any network namespace.
644 */
rtnl_lock_unregistering_all(void)645 static void rtnl_lock_unregistering_all(void)
646 {
647 DEFINE_WAIT_FUNC(wait, woken_wake_function);
648
649 add_wait_queue(&netdev_unregistering_wq, &wait);
650 for (;;) {
651 rtnl_lock();
652 /* We held write locked pernet_ops_rwsem, and parallel
653 * setup_net() and cleanup_net() are not possible.
654 */
655 if (!atomic_read(&dev_unreg_count))
656 break;
657 __rtnl_unlock();
658
659 wait_woken(&wait, TASK_UNINTERRUPTIBLE, MAX_SCHEDULE_TIMEOUT);
660 }
661 remove_wait_queue(&netdev_unregistering_wq, &wait);
662 }
663
/**
 * rtnl_link_unregister - Unregister rtnl_link_ops from rtnetlink.
 * @ops: struct rtnl_link_ops * to unregister
 *
 * Removes @ops from the link_ops list, waits for SRCU readers of @ops->srcu,
 * and then deletes every device using @ops in every network namespace.
 */
void rtnl_link_unregister(struct rtnl_link_ops *ops)
{
	struct net *net;

	/* Unpublish first so rtnl_link_ops_get() can no longer find @ops. */
	mutex_lock(&link_ops_mutex);
	list_del_rcu(&ops->list);
	mutex_unlock(&link_ops_mutex);

	/* Wait for readers that entered ops->srcu via rtnl_link_ops_get(). */
	synchronize_srcu(&ops->srcu);
	cleanup_srcu_struct(&ops->srcu);

	/* Close the race with setup_net() and cleanup_net() */
	down_write(&pernet_ops_rwsem);
	rtnl_lock_unregistering_all();

	for_each_net(net)
		__rtnl_kill_links(net, ops);

	rtnl_unlock();
	up_write(&pernet_ops_rwsem);
}
EXPORT_SYMBOL_GPL(rtnl_link_unregister);
690
rtnl_link_get_slave_info_data_size(const struct net_device * dev)691 static size_t rtnl_link_get_slave_info_data_size(const struct net_device *dev)
692 {
693 struct net_device *master_dev;
694 const struct rtnl_link_ops *ops;
695 size_t size = 0;
696
697 rcu_read_lock();
698
699 master_dev = netdev_master_upper_dev_get_rcu((struct net_device *)dev);
700 if (!master_dev)
701 goto out;
702
703 ops = master_dev->rtnl_link_ops;
704 if (!ops || !ops->get_slave_size)
705 goto out;
706 /* IFLA_INFO_SLAVE_DATA + nested data */
707 size = nla_total_size(sizeof(struct nlattr)) +
708 ops->get_slave_size(master_dev, dev);
709
710 out:
711 rcu_read_unlock();
712 return size;
713 }
714
rtnl_link_get_size(const struct net_device * dev)715 static size_t rtnl_link_get_size(const struct net_device *dev)
716 {
717 const struct rtnl_link_ops *ops = dev->rtnl_link_ops;
718 size_t size;
719
720 if (!ops)
721 return 0;
722
723 size = nla_total_size(sizeof(struct nlattr)) + /* IFLA_LINKINFO */
724 nla_total_size(strlen(ops->kind) + 1); /* IFLA_INFO_KIND */
725
726 if (ops->get_size)
727 /* IFLA_INFO_DATA + nested data */
728 size += nla_total_size(sizeof(struct nlattr)) +
729 ops->get_size(dev);
730
731 if (ops->get_xstats_size)
732 /* IFLA_INFO_XSTATS */
733 size += nla_total_size(ops->get_xstats_size(dev));
734
735 size += rtnl_link_get_slave_info_data_size(dev);
736
737 return size;
738 }
739
/* Registered struct rtnl_af_ops. Updated under the RTNL by
 * rtnl_af_register()/rtnl_af_unregister(); readers walk it under
 * rcu_read_lock().
 */
static LIST_HEAD(rtnl_af_ops);
741
rtnl_af_lookup(const int family,int * srcu_index)742 static struct rtnl_af_ops *rtnl_af_lookup(const int family, int *srcu_index)
743 {
744 struct rtnl_af_ops *ops;
745
746 ASSERT_RTNL();
747
748 rcu_read_lock();
749
750 list_for_each_entry_rcu(ops, &rtnl_af_ops, list) {
751 if (ops->family == family) {
752 *srcu_index = srcu_read_lock(&ops->srcu);
753 goto unlock;
754 }
755 }
756
757 ops = NULL;
758 unlock:
759 rcu_read_unlock();
760
761 return ops;
762 }
763
/* End the SRCU read-side section on @ops->srcu that rtnl_af_lookup() started;
 * @srcu_index is the index it handed back.
 */
static void rtnl_af_put(struct rtnl_af_ops *ops, int srcu_index)
{
	srcu_read_unlock(&ops->srcu, srcu_index);
}
768
769 /**
770 * rtnl_af_register - Register rtnl_af_ops with rtnetlink.
771 * @ops: struct rtnl_af_ops * to register
772 *
773 * Return: 0 on success or a negative error code.
774 */
rtnl_af_register(struct rtnl_af_ops * ops)775 int rtnl_af_register(struct rtnl_af_ops *ops)
776 {
777 int err = init_srcu_struct(&ops->srcu);
778
779 if (err)
780 return err;
781
782 rtnl_lock();
783 list_add_tail_rcu(&ops->list, &rtnl_af_ops);
784 rtnl_unlock();
785
786 return 0;
787 }
788 EXPORT_SYMBOL_GPL(rtnl_af_register);
789
/**
 * rtnl_af_unregister - Unregister rtnl_af_ops from rtnetlink.
 * @ops: struct rtnl_af_ops * to unregister
 *
 * Removes @ops from the rtnl_af_ops list under the RTNL, then waits for both
 * RCU and SRCU readers before tearing down @ops->srcu.
 */
void rtnl_af_unregister(struct rtnl_af_ops *ops)
{
	rtnl_lock();
	list_del_rcu(&ops->list);
	rtnl_unlock();

	/* list walkers run under rcu_read_lock() */
	synchronize_rcu();
	/* rtnl_af_lookup() users hold ops->srcu until rtnl_af_put() */
	synchronize_srcu(&ops->srcu);
	cleanup_srcu_struct(&ops->srcu);
}
EXPORT_SYMBOL_GPL(rtnl_af_unregister);
805
rtnl_link_get_af_size(const struct net_device * dev,u32 ext_filter_mask)806 static size_t rtnl_link_get_af_size(const struct net_device *dev,
807 u32 ext_filter_mask)
808 {
809 struct rtnl_af_ops *af_ops;
810 size_t size;
811
812 /* IFLA_AF_SPEC */
813 size = nla_total_size(sizeof(struct nlattr));
814
815 rcu_read_lock();
816 list_for_each_entry_rcu(af_ops, &rtnl_af_ops, list) {
817 if (af_ops->get_link_af_size) {
818 /* AF_* + nested data */
819 size += nla_total_size(sizeof(struct nlattr)) +
820 af_ops->get_link_af_size(dev, ext_filter_mask);
821 }
822 }
823 rcu_read_unlock();
824
825 return size;
826 }
827
rtnl_have_link_slave_info(const struct net_device * dev)828 static bool rtnl_have_link_slave_info(const struct net_device *dev)
829 {
830 struct net_device *master_dev;
831 bool ret = false;
832
833 rcu_read_lock();
834
835 master_dev = netdev_master_upper_dev_get_rcu((struct net_device *)dev);
836 if (master_dev && master_dev->rtnl_link_ops)
837 ret = true;
838 rcu_read_unlock();
839 return ret;
840 }
841
rtnl_link_slave_info_fill(struct sk_buff * skb,const struct net_device * dev)842 static int rtnl_link_slave_info_fill(struct sk_buff *skb,
843 const struct net_device *dev)
844 {
845 struct net_device *master_dev;
846 const struct rtnl_link_ops *ops;
847 struct nlattr *slave_data;
848 int err;
849
850 master_dev = netdev_master_upper_dev_get((struct net_device *) dev);
851 if (!master_dev)
852 return 0;
853 ops = master_dev->rtnl_link_ops;
854 if (!ops)
855 return 0;
856 if (nla_put_string(skb, IFLA_INFO_SLAVE_KIND, ops->kind) < 0)
857 return -EMSGSIZE;
858 if (ops->fill_slave_info) {
859 slave_data = nla_nest_start_noflag(skb, IFLA_INFO_SLAVE_DATA);
860 if (!slave_data)
861 return -EMSGSIZE;
862 err = ops->fill_slave_info(skb, master_dev, dev);
863 if (err < 0)
864 goto err_cancel_slave_data;
865 nla_nest_end(skb, slave_data);
866 }
867 return 0;
868
869 err_cancel_slave_data:
870 nla_nest_cancel(skb, slave_data);
871 return err;
872 }
873
rtnl_link_info_fill(struct sk_buff * skb,const struct net_device * dev)874 static int rtnl_link_info_fill(struct sk_buff *skb,
875 const struct net_device *dev)
876 {
877 const struct rtnl_link_ops *ops = dev->rtnl_link_ops;
878 struct nlattr *data;
879 int err;
880
881 if (!ops)
882 return 0;
883 if (nla_put_string(skb, IFLA_INFO_KIND, ops->kind) < 0)
884 return -EMSGSIZE;
885 if (ops->fill_xstats) {
886 err = ops->fill_xstats(skb, dev);
887 if (err < 0)
888 return err;
889 }
890 if (ops->fill_info) {
891 data = nla_nest_start_noflag(skb, IFLA_INFO_DATA);
892 if (data == NULL)
893 return -EMSGSIZE;
894 err = ops->fill_info(skb, dev);
895 if (err < 0)
896 goto err_cancel_data;
897 nla_nest_end(skb, data);
898 }
899 return 0;
900
901 err_cancel_data:
902 nla_nest_cancel(skb, data);
903 return err;
904 }
905
rtnl_link_fill(struct sk_buff * skb,const struct net_device * dev)906 static int rtnl_link_fill(struct sk_buff *skb, const struct net_device *dev)
907 {
908 struct nlattr *linkinfo;
909 int err = -EMSGSIZE;
910
911 linkinfo = nla_nest_start_noflag(skb, IFLA_LINKINFO);
912 if (linkinfo == NULL)
913 goto out;
914
915 err = rtnl_link_info_fill(skb, dev);
916 if (err < 0)
917 goto err_cancel_link;
918
919 err = rtnl_link_slave_info_fill(skb, dev);
920 if (err < 0)
921 goto err_cancel_link;
922
923 nla_nest_end(skb, linkinfo);
924 return 0;
925
926 err_cancel_link:
927 nla_nest_cancel(skb, linkinfo);
928 out:
929 return err;
930 }
931
/* Pass @skb to nlmsg_notify() on @net's rtnetlink socket with GFP_KERNEL
 * and return its result.
 */
int rtnetlink_send(struct sk_buff *skb, struct net *net, u32 pid, unsigned int group, int echo)
{
	return nlmsg_notify(net->rtnl, skb, pid, group, echo, GFP_KERNEL);
}
938
/* Pass @skb to nlmsg_unicast() for @pid on @net's rtnetlink socket and
 * return its result.
 */
int rtnl_unicast(struct sk_buff *skb, struct net *net, u32 pid)
{
	return nlmsg_unicast(net->rtnl, skb, pid);
}
EXPORT_SYMBOL(rtnl_unicast);
946
/* Pass @skb to nlmsg_notify() on @net's rtnetlink socket; the report argument
 * is derived from @nlh with nlmsg_report(). The result is discarded.
 */
void rtnl_notify(struct sk_buff *skb, struct net *net, u32 pid, u32 group,
		 const struct nlmsghdr *nlh, gfp_t flags)
{
	nlmsg_notify(net->rtnl, skb, pid, group, nlmsg_report(nlh), flags);
}
EXPORT_SYMBOL(rtnl_notify);
955
rtnl_set_sk_err(struct net * net,u32 group,int error)956 void rtnl_set_sk_err(struct net *net, u32 group, int error)
957 {
958 struct sock *rtnl = net->rtnl;
959
960 netlink_set_err(rtnl, 0, group, error);
961 }
962 EXPORT_SYMBOL(rtnl_set_sk_err);
963
/* Dump the non-zero entries of @metrics as an RTA_METRICS nest.
 *
 * metrics[i] is emitted as attribute type i + 1. The congestion-control entry
 * is written as the algorithm name and the features entry is masked with
 * RTAX_FEATURE_MASK; both are skipped when nothing is left to report.
 *
 * Returns 0 when nothing was emitted, the value of nla_nest_end() otherwise,
 * -ENOBUFS when the nest cannot be started, or -EMSGSIZE when an attribute
 * does not fit (the nest is cancelled).
 */
int rtnetlink_put_metrics(struct sk_buff *skb, u32 *metrics)
{
	struct nlattr *mx;
	int emitted = 0;
	int i;

	/* nothing is dumped for dst_default_metrics, so just skip the loop */
	if (metrics == dst_default_metrics.metrics)
		return 0;

	mx = nla_nest_start_noflag(skb, RTA_METRICS);
	if (!mx)
		return -ENOBUFS;

	for (i = 0; i < RTAX_MAX; i++) {
		const int type = i + 1;

		if (!metrics[i])
			continue;

		if (type == RTAX_CC_ALGO) {
			char tmp[TCP_CA_NAME_MAX], *name;

			name = tcp_ca_get_name_by_key(metrics[i], tmp);
			if (!name)
				continue;
			if (nla_put_string(skb, type, name))
				goto nla_put_failure;
		} else if (type == RTAX_FEATURES) {
			u32 user_features = metrics[i] & RTAX_FEATURE_MASK;

			if (!user_features)
				continue;
			BUILD_BUG_ON(RTAX_FEATURE_MASK & DST_FEATURE_MASK);
			if (nla_put_u32(skb, type, user_features))
				goto nla_put_failure;
		} else {
			if (nla_put_u32(skb, type, metrics[i]))
				goto nla_put_failure;
		}

		emitted++;
	}

	if (!emitted) {
		/* do not leave an empty nest behind */
		nla_nest_cancel(skb, mx);
		return 0;
	}

	return nla_nest_end(skb, mx);

nla_put_failure:
	nla_nest_cancel(skb, mx);
	return -EMSGSIZE;
}
EXPORT_SYMBOL(rtnetlink_put_metrics);
1015
rtnl_put_cacheinfo(struct sk_buff * skb,struct dst_entry * dst,u32 id,long expires,u32 error)1016 int rtnl_put_cacheinfo(struct sk_buff *skb, struct dst_entry *dst, u32 id,
1017 long expires, u32 error)
1018 {
1019 struct rta_cacheinfo ci = {
1020 .rta_error = error,
1021 .rta_id = id,
1022 };
1023
1024 if (dst) {
1025 ci.rta_lastuse = jiffies_delta_to_clock_t(jiffies - dst->lastuse);
1026 ci.rta_used = dst->__use;
1027 ci.rta_clntref = rcuref_read(&dst->__rcuref);
1028 }
1029 if (expires) {
1030 unsigned long clock;
1031
1032 clock = jiffies_to_clock_t(abs(expires));
1033 clock = min_t(unsigned long, clock, INT_MAX);
1034 ci.rta_expires = (expires > 0) ? clock : -clock;
1035 }
1036 return nla_put(skb, RTA_CACHEINFO, sizeof(ci), &ci);
1037 }
1038 EXPORT_SYMBOL_GPL(rtnl_put_cacheinfo);
1039
netdev_set_operstate(struct net_device * dev,int newstate)1040 void netdev_set_operstate(struct net_device *dev, int newstate)
1041 {
1042 unsigned int old = READ_ONCE(dev->operstate);
1043
1044 do {
1045 if (old == newstate)
1046 return;
1047 } while (!try_cmpxchg(&dev->operstate, &old, newstate));
1048
1049 netdev_state_change(dev);
1050 }
1051 EXPORT_SYMBOL(netdev_set_operstate);
1052
set_operstate(struct net_device * dev,unsigned char transition)1053 static void set_operstate(struct net_device *dev, unsigned char transition)
1054 {
1055 unsigned char operstate = READ_ONCE(dev->operstate);
1056
1057 switch (transition) {
1058 case IF_OPER_UP:
1059 if ((operstate == IF_OPER_DORMANT ||
1060 operstate == IF_OPER_TESTING ||
1061 operstate == IF_OPER_UNKNOWN) &&
1062 !netif_dormant(dev) && !netif_testing(dev))
1063 operstate = IF_OPER_UP;
1064 break;
1065
1066 case IF_OPER_TESTING:
1067 if (netif_oper_up(dev))
1068 operstate = IF_OPER_TESTING;
1069 break;
1070
1071 case IF_OPER_DORMANT:
1072 if (netif_oper_up(dev))
1073 operstate = IF_OPER_DORMANT;
1074 break;
1075 }
1076
1077 netdev_set_operstate(dev, operstate);
1078 }
1079
rtnl_dev_get_flags(const struct net_device * dev)1080 static unsigned int rtnl_dev_get_flags(const struct net_device *dev)
1081 {
1082 return (dev->flags & ~(IFF_PROMISC | IFF_ALLMULTI)) |
1083 (dev->gflags & (IFF_PROMISC | IFF_ALLMULTI));
1084 }
1085
rtnl_dev_combine_flags(const struct net_device * dev,const struct ifinfomsg * ifm)1086 static unsigned int rtnl_dev_combine_flags(const struct net_device *dev,
1087 const struct ifinfomsg *ifm)
1088 {
1089 unsigned int flags = ifm->ifi_flags;
1090
1091 /* bugwards compatibility: ifi_change == 0 is treated as ~0 */
1092 if (ifm->ifi_change)
1093 flags = (flags & ifm->ifi_change) |
1094 (rtnl_dev_get_flags(dev) & ~ifm->ifi_change);
1095
1096 return flags;
1097 }
1098
/* Copy every counter from the rtnl_link_stats64 structure @b into the
 * rtnl_link_stats structure @a, field by field.
 */
static void copy_rtnl_link_stats(struct rtnl_link_stats *a,
				 const struct rtnl_link_stats64 *b)
{
	/* basic packet/byte/error/drop counters */
	a->rx_packets = b->rx_packets;
	a->tx_packets = b->tx_packets;
	a->rx_bytes = b->rx_bytes;
	a->tx_bytes = b->tx_bytes;
	a->rx_errors = b->rx_errors;
	a->tx_errors = b->tx_errors;
	a->rx_dropped = b->rx_dropped;
	a->tx_dropped = b->tx_dropped;

	a->multicast = b->multicast;
	a->collisions = b->collisions;

	/* receive error breakdown */
	a->rx_length_errors = b->rx_length_errors;
	a->rx_over_errors = b->rx_over_errors;
	a->rx_crc_errors = b->rx_crc_errors;
	a->rx_frame_errors = b->rx_frame_errors;
	a->rx_fifo_errors = b->rx_fifo_errors;
	a->rx_missed_errors = b->rx_missed_errors;

	/* transmit error breakdown */
	a->tx_aborted_errors = b->tx_aborted_errors;
	a->tx_carrier_errors = b->tx_carrier_errors;
	a->tx_fifo_errors = b->tx_fifo_errors;
	a->tx_heartbeat_errors = b->tx_heartbeat_errors;
	a->tx_window_errors = b->tx_window_errors;

	a->rx_compressed = b->rx_compressed;
	a->tx_compressed = b->tx_compressed;

	a->rx_nohandler = b->rx_nohandler;
}
1132
1133 /* All VF info */
rtnl_vfinfo_size(const struct net_device * dev,u32 ext_filter_mask)1134 static inline int rtnl_vfinfo_size(const struct net_device *dev,
1135 u32 ext_filter_mask)
1136 {
1137 if (dev->dev.parent && (ext_filter_mask & RTEXT_FILTER_VF)) {
1138 int num_vfs = dev_num_vf(dev->dev.parent);
1139 size_t size = nla_total_size(0);
1140 size += num_vfs *
1141 (nla_total_size(0) +
1142 nla_total_size(sizeof(struct ifla_vf_mac)) +
1143 nla_total_size(sizeof(struct ifla_vf_broadcast)) +
1144 nla_total_size(sizeof(struct ifla_vf_vlan)) +
1145 nla_total_size(0) + /* nest IFLA_VF_VLAN_LIST */
1146 nla_total_size(MAX_VLAN_LIST_LEN *
1147 sizeof(struct ifla_vf_vlan_info)) +
1148 nla_total_size(sizeof(struct ifla_vf_spoofchk)) +
1149 nla_total_size(sizeof(struct ifla_vf_tx_rate)) +
1150 nla_total_size(sizeof(struct ifla_vf_rate)) +
1151 nla_total_size(sizeof(struct ifla_vf_link_state)) +
1152 nla_total_size(sizeof(struct ifla_vf_rss_query_en)) +
1153 nla_total_size(sizeof(struct ifla_vf_trust)));
1154 if (~ext_filter_mask & RTEXT_FILTER_SKIP_STATS) {
1155 size += num_vfs *
1156 (nla_total_size(0) + /* nest IFLA_VF_STATS */
1157 /* IFLA_VF_STATS_RX_PACKETS */
1158 nla_total_size_64bit(sizeof(__u64)) +
1159 /* IFLA_VF_STATS_TX_PACKETS */
1160 nla_total_size_64bit(sizeof(__u64)) +
1161 /* IFLA_VF_STATS_RX_BYTES */
1162 nla_total_size_64bit(sizeof(__u64)) +
1163 /* IFLA_VF_STATS_TX_BYTES */
1164 nla_total_size_64bit(sizeof(__u64)) +
1165 /* IFLA_VF_STATS_BROADCAST */
1166 nla_total_size_64bit(sizeof(__u64)) +
1167 /* IFLA_VF_STATS_MULTICAST */
1168 nla_total_size_64bit(sizeof(__u64)) +
1169 /* IFLA_VF_STATS_RX_DROPPED */
1170 nla_total_size_64bit(sizeof(__u64)) +
1171 /* IFLA_VF_STATS_TX_DROPPED */
1172 nla_total_size_64bit(sizeof(__u64)));
1173 }
1174 return size;
1175 } else
1176 return 0;
1177 }
1178
rtnl_port_size(const struct net_device * dev,u32 ext_filter_mask)1179 static size_t rtnl_port_size(const struct net_device *dev,
1180 u32 ext_filter_mask)
1181 {
1182 size_t port_size = nla_total_size(4) /* PORT_VF */
1183 + nla_total_size(PORT_PROFILE_MAX) /* PORT_PROFILE */
1184 + nla_total_size(PORT_UUID_MAX) /* PORT_INSTANCE_UUID */
1185 + nla_total_size(PORT_UUID_MAX) /* PORT_HOST_UUID */
1186 + nla_total_size(1) /* PROT_VDP_REQUEST */
1187 + nla_total_size(2); /* PORT_VDP_RESPONSE */
1188 size_t vf_ports_size = nla_total_size(sizeof(struct nlattr));
1189 size_t vf_port_size = nla_total_size(sizeof(struct nlattr))
1190 + port_size;
1191 size_t port_self_size = nla_total_size(sizeof(struct nlattr))
1192 + port_size;
1193
1194 if (!dev->netdev_ops->ndo_get_vf_port || !dev->dev.parent ||
1195 !(ext_filter_mask & RTEXT_FILTER_VF))
1196 return 0;
1197 if (dev_num_vf(dev->dev.parent))
1198 return port_self_size + vf_ports_size +
1199 vf_port_size * dev_num_vf(dev->dev.parent);
1200 else
1201 return port_self_size;
1202 }
1203
rtnl_xdp_size(void)1204 static size_t rtnl_xdp_size(void)
1205 {
1206 size_t xdp_size = nla_total_size(0) + /* nest IFLA_XDP */
1207 nla_total_size(1) + /* XDP_ATTACHED */
1208 nla_total_size(4) + /* XDP_PROG_ID (or 1st mode) */
1209 nla_total_size(4); /* XDP_<mode>_PROG_ID */
1210
1211 return xdp_size;
1212 }
1213
rtnl_prop_list_size(const struct net_device * dev)1214 static size_t rtnl_prop_list_size(const struct net_device *dev)
1215 {
1216 struct netdev_name_node *name_node;
1217 unsigned int cnt = 0;
1218
1219 rcu_read_lock();
1220 list_for_each_entry_rcu(name_node, &dev->name_node->list, list)
1221 cnt++;
1222 rcu_read_unlock();
1223
1224 if (!cnt)
1225 return 0;
1226
1227 return nla_total_size(0) + cnt * nla_total_size(ALTIFNAMSIZ);
1228 }
1229
rtnl_proto_down_size(const struct net_device * dev)1230 static size_t rtnl_proto_down_size(const struct net_device *dev)
1231 {
1232 size_t size = nla_total_size(1);
1233
1234 /* Assume dev->proto_down_reason is not zero. */
1235 size += nla_total_size(0) + nla_total_size(4);
1236
1237 return size;
1238 }
1239
rtnl_devlink_port_size(const struct net_device * dev)1240 static size_t rtnl_devlink_port_size(const struct net_device *dev)
1241 {
1242 size_t size = nla_total_size(0); /* nest IFLA_DEVLINK_PORT */
1243
1244 if (dev->devlink_port)
1245 size += devlink_nl_port_handle_size(dev->devlink_port);
1246
1247 return size;
1248 }
1249
rtnl_dpll_pin_size(const struct net_device * dev)1250 static size_t rtnl_dpll_pin_size(const struct net_device *dev)
1251 {
1252 size_t size = nla_total_size(0); /* nest IFLA_DPLL_PIN */
1253
1254 size += dpll_netdev_pin_handle_size(dev);
1255
1256 return size;
1257 }
1258
if_nlmsg_size(const struct net_device * dev,u32 ext_filter_mask)1259 static noinline size_t if_nlmsg_size(const struct net_device *dev,
1260 u32 ext_filter_mask)
1261 {
1262 return NLMSG_ALIGN(sizeof(struct ifinfomsg))
1263 + nla_total_size(IFNAMSIZ) /* IFLA_IFNAME */
1264 + nla_total_size(IFALIASZ) /* IFLA_IFALIAS */
1265 + nla_total_size(IFNAMSIZ) /* IFLA_QDISC */
1266 + nla_total_size_64bit(sizeof(struct rtnl_link_ifmap))
1267 + nla_total_size(sizeof(struct rtnl_link_stats))
1268 + nla_total_size_64bit(sizeof(struct rtnl_link_stats64))
1269 + nla_total_size(MAX_ADDR_LEN) /* IFLA_ADDRESS */
1270 + nla_total_size(MAX_ADDR_LEN) /* IFLA_BROADCAST */
1271 + nla_total_size(4) /* IFLA_TXQLEN */
1272 + nla_total_size(4) /* IFLA_WEIGHT */
1273 + nla_total_size(4) /* IFLA_MTU */
1274 + nla_total_size(4) /* IFLA_LINK */
1275 + nla_total_size(4) /* IFLA_MASTER */
1276 + nla_total_size(1) /* IFLA_CARRIER */
1277 + nla_total_size(4) /* IFLA_PROMISCUITY */
1278 + nla_total_size(4) /* IFLA_ALLMULTI */
1279 + nla_total_size(4) /* IFLA_NUM_TX_QUEUES */
1280 + nla_total_size(4) /* IFLA_NUM_RX_QUEUES */
1281 + nla_total_size(4) /* IFLA_GSO_MAX_SEGS */
1282 + nla_total_size(4) /* IFLA_GSO_MAX_SIZE */
1283 + nla_total_size(4) /* IFLA_GRO_MAX_SIZE */
1284 + nla_total_size(4) /* IFLA_GSO_IPV4_MAX_SIZE */
1285 + nla_total_size(4) /* IFLA_GRO_IPV4_MAX_SIZE */
1286 + nla_total_size(4) /* IFLA_TSO_MAX_SIZE */
1287 + nla_total_size(4) /* IFLA_TSO_MAX_SEGS */
1288 + nla_total_size(1) /* IFLA_OPERSTATE */
1289 + nla_total_size(1) /* IFLA_LINKMODE */
1290 + nla_total_size(4) /* IFLA_CARRIER_CHANGES */
1291 + nla_total_size(4) /* IFLA_LINK_NETNSID */
1292 + nla_total_size(4) /* IFLA_GROUP */
1293 + nla_total_size(ext_filter_mask
1294 & RTEXT_FILTER_VF ? 4 : 0) /* IFLA_NUM_VF */
1295 + rtnl_vfinfo_size(dev, ext_filter_mask) /* IFLA_VFINFO_LIST */
1296 + rtnl_port_size(dev, ext_filter_mask) /* IFLA_VF_PORTS + IFLA_PORT_SELF */
1297 + rtnl_link_get_size(dev) /* IFLA_LINKINFO */
1298 + rtnl_link_get_af_size(dev, ext_filter_mask) /* IFLA_AF_SPEC */
1299 + nla_total_size(MAX_PHYS_ITEM_ID_LEN) /* IFLA_PHYS_PORT_ID */
1300 + nla_total_size(MAX_PHYS_ITEM_ID_LEN) /* IFLA_PHYS_SWITCH_ID */
1301 + nla_total_size(IFNAMSIZ) /* IFLA_PHYS_PORT_NAME */
1302 + rtnl_xdp_size() /* IFLA_XDP */
1303 + nla_total_size(4) /* IFLA_EVENT */
1304 + nla_total_size(4) /* IFLA_NEW_NETNSID */
1305 + nla_total_size(4) /* IFLA_NEW_IFINDEX */
1306 + rtnl_proto_down_size(dev) /* proto down */
1307 + nla_total_size(4) /* IFLA_TARGET_NETNSID */
1308 + nla_total_size(4) /* IFLA_CARRIER_UP_COUNT */
1309 + nla_total_size(4) /* IFLA_CARRIER_DOWN_COUNT */
1310 + nla_total_size(4) /* IFLA_MIN_MTU */
1311 + nla_total_size(4) /* IFLA_MAX_MTU */
1312 + rtnl_prop_list_size(dev)
1313 + nla_total_size(MAX_ADDR_LEN) /* IFLA_PERM_ADDRESS */
1314 + rtnl_devlink_port_size(dev)
1315 + rtnl_dpll_pin_size(dev)
1316 + nla_total_size(8) /* IFLA_MAX_PACING_OFFLOAD_HORIZON */
1317 + 0;
1318 }
1319
rtnl_vf_ports_fill(struct sk_buff * skb,struct net_device * dev)1320 static int rtnl_vf_ports_fill(struct sk_buff *skb, struct net_device *dev)
1321 {
1322 struct nlattr *vf_ports;
1323 struct nlattr *vf_port;
1324 int vf;
1325 int err;
1326
1327 vf_ports = nla_nest_start_noflag(skb, IFLA_VF_PORTS);
1328 if (!vf_ports)
1329 return -EMSGSIZE;
1330
1331 for (vf = 0; vf < dev_num_vf(dev->dev.parent); vf++) {
1332 vf_port = nla_nest_start_noflag(skb, IFLA_VF_PORT);
1333 if (!vf_port)
1334 goto nla_put_failure;
1335 if (nla_put_u32(skb, IFLA_PORT_VF, vf))
1336 goto nla_put_failure;
1337 err = dev->netdev_ops->ndo_get_vf_port(dev, vf, skb);
1338 if (err == -EMSGSIZE)
1339 goto nla_put_failure;
1340 if (err) {
1341 nla_nest_cancel(skb, vf_port);
1342 continue;
1343 }
1344 nla_nest_end(skb, vf_port);
1345 }
1346
1347 nla_nest_end(skb, vf_ports);
1348
1349 return 0;
1350
1351 nla_put_failure:
1352 nla_nest_cancel(skb, vf_ports);
1353 return -EMSGSIZE;
1354 }
1355
rtnl_port_self_fill(struct sk_buff * skb,struct net_device * dev)1356 static int rtnl_port_self_fill(struct sk_buff *skb, struct net_device *dev)
1357 {
1358 struct nlattr *port_self;
1359 int err;
1360
1361 port_self = nla_nest_start_noflag(skb, IFLA_PORT_SELF);
1362 if (!port_self)
1363 return -EMSGSIZE;
1364
1365 err = dev->netdev_ops->ndo_get_vf_port(dev, PORT_SELF_VF, skb);
1366 if (err) {
1367 nla_nest_cancel(skb, port_self);
1368 return (err == -EMSGSIZE) ? err : 0;
1369 }
1370
1371 nla_nest_end(skb, port_self);
1372
1373 return 0;
1374 }
1375
/*
 * Emit port information: IFLA_PORT_SELF always, and IFLA_VF_PORTS when the
 * parent device reports at least one VF.
 *
 * Nothing is emitted (and 0 is returned) unless the driver implements
 * ndo_get_vf_port, the device has a parent and RTEXT_FILTER_VF is set.
 */
static int rtnl_port_fill(struct sk_buff *skb, struct net_device *dev,
			  u32 ext_filter_mask)
{
	int err;

	if (!dev->netdev_ops->ndo_get_vf_port)
		return 0;
	if (!dev->dev.parent)
		return 0;
	if (!(ext_filter_mask & RTEXT_FILTER_VF))
		return 0;

	err = rtnl_port_self_fill(skb, dev);
	if (err)
		return err;

	if (!dev_num_vf(dev->dev.parent))
		return 0;

	return rtnl_vf_ports_fill(skb, dev);
}
1397
rtnl_phys_port_id_fill(struct sk_buff * skb,struct net_device * dev)1398 static int rtnl_phys_port_id_fill(struct sk_buff *skb, struct net_device *dev)
1399 {
1400 int err;
1401 struct netdev_phys_item_id ppid;
1402
1403 err = dev_get_phys_port_id(dev, &ppid);
1404 if (err) {
1405 if (err == -EOPNOTSUPP)
1406 return 0;
1407 return err;
1408 }
1409
1410 if (nla_put(skb, IFLA_PHYS_PORT_ID, ppid.id_len, ppid.id))
1411 return -EMSGSIZE;
1412
1413 return 0;
1414 }
1415
rtnl_phys_port_name_fill(struct sk_buff * skb,struct net_device * dev)1416 static int rtnl_phys_port_name_fill(struct sk_buff *skb, struct net_device *dev)
1417 {
1418 char name[IFNAMSIZ];
1419 int err;
1420
1421 err = dev_get_phys_port_name(dev, name, sizeof(name));
1422 if (err) {
1423 if (err == -EOPNOTSUPP)
1424 return 0;
1425 return err;
1426 }
1427
1428 if (nla_put_string(skb, IFLA_PHYS_PORT_NAME, name))
1429 return -EMSGSIZE;
1430
1431 return 0;
1432 }
1433
rtnl_phys_switch_id_fill(struct sk_buff * skb,struct net_device * dev)1434 static int rtnl_phys_switch_id_fill(struct sk_buff *skb, struct net_device *dev)
1435 {
1436 struct netdev_phys_item_id ppid = { };
1437 int err;
1438
1439 err = dev_get_port_parent_id(dev, &ppid, false);
1440 if (err) {
1441 if (err == -EOPNOTSUPP)
1442 return 0;
1443 return err;
1444 }
1445
1446 if (nla_put(skb, IFLA_PHYS_SWITCH_ID, ppid.id_len, ppid.id))
1447 return -EMSGSIZE;
1448
1449 return 0;
1450 }
1451
rtnl_fill_stats(struct sk_buff * skb,struct net_device * dev)1452 static noinline_for_stack int rtnl_fill_stats(struct sk_buff *skb,
1453 struct net_device *dev)
1454 {
1455 struct rtnl_link_stats64 *sp;
1456 struct nlattr *attr;
1457
1458 attr = nla_reserve_64bit(skb, IFLA_STATS64,
1459 sizeof(struct rtnl_link_stats64), IFLA_PAD);
1460 if (!attr)
1461 return -EMSGSIZE;
1462
1463 sp = nla_data(attr);
1464 dev_get_stats(dev, sp);
1465
1466 attr = nla_reserve(skb, IFLA_STATS,
1467 sizeof(struct rtnl_link_stats));
1468 if (!attr)
1469 return -EMSGSIZE;
1470
1471 copy_rtnl_link_stats(nla_data(attr), sp);
1472
1473 return 0;
1474 }
1475
rtnl_fill_vfinfo(struct sk_buff * skb,struct net_device * dev,int vfs_num,u32 ext_filter_mask)1476 static noinline_for_stack int rtnl_fill_vfinfo(struct sk_buff *skb,
1477 struct net_device *dev,
1478 int vfs_num,
1479 u32 ext_filter_mask)
1480 {
1481 struct ifla_vf_rss_query_en vf_rss_query_en;
1482 struct nlattr *vf, *vfstats, *vfvlanlist;
1483 struct ifla_vf_link_state vf_linkstate;
1484 struct ifla_vf_vlan_info vf_vlan_info;
1485 struct ifla_vf_spoofchk vf_spoofchk;
1486 struct ifla_vf_tx_rate vf_tx_rate;
1487 struct ifla_vf_stats vf_stats;
1488 struct ifla_vf_trust vf_trust;
1489 struct ifla_vf_vlan vf_vlan;
1490 struct ifla_vf_rate vf_rate;
1491 struct ifla_vf_mac vf_mac;
1492 struct ifla_vf_broadcast vf_broadcast;
1493 struct ifla_vf_info ivi;
1494 struct ifla_vf_guid node_guid;
1495 struct ifla_vf_guid port_guid;
1496
1497 memset(&ivi, 0, sizeof(ivi));
1498
1499 /* Not all SR-IOV capable drivers support the
1500 * spoofcheck and "RSS query enable" query. Preset to
1501 * -1 so the user space tool can detect that the driver
1502 * didn't report anything.
1503 */
1504 ivi.spoofchk = -1;
1505 ivi.rss_query_en = -1;
1506 ivi.trusted = -1;
1507 /* The default value for VF link state is "auto"
1508 * IFLA_VF_LINK_STATE_AUTO which equals zero
1509 */
1510 ivi.linkstate = 0;
1511 /* VLAN Protocol by default is 802.1Q */
1512 ivi.vlan_proto = htons(ETH_P_8021Q);
1513 if (dev->netdev_ops->ndo_get_vf_config(dev, vfs_num, &ivi))
1514 return 0;
1515
1516 memset(&vf_vlan_info, 0, sizeof(vf_vlan_info));
1517 memset(&node_guid, 0, sizeof(node_guid));
1518 memset(&port_guid, 0, sizeof(port_guid));
1519
1520 vf_mac.vf =
1521 vf_vlan.vf =
1522 vf_vlan_info.vf =
1523 vf_rate.vf =
1524 vf_tx_rate.vf =
1525 vf_spoofchk.vf =
1526 vf_linkstate.vf =
1527 vf_rss_query_en.vf =
1528 vf_trust.vf =
1529 node_guid.vf =
1530 port_guid.vf = ivi.vf;
1531
1532 memcpy(vf_mac.mac, ivi.mac, sizeof(ivi.mac));
1533 memcpy(vf_broadcast.broadcast, dev->broadcast, dev->addr_len);
1534 vf_vlan.vlan = ivi.vlan;
1535 vf_vlan.qos = ivi.qos;
1536 vf_vlan_info.vlan = ivi.vlan;
1537 vf_vlan_info.qos = ivi.qos;
1538 vf_vlan_info.vlan_proto = ivi.vlan_proto;
1539 vf_tx_rate.rate = ivi.max_tx_rate;
1540 vf_rate.min_tx_rate = ivi.min_tx_rate;
1541 vf_rate.max_tx_rate = ivi.max_tx_rate;
1542 vf_spoofchk.setting = ivi.spoofchk;
1543 vf_linkstate.link_state = ivi.linkstate;
1544 vf_rss_query_en.setting = ivi.rss_query_en;
1545 vf_trust.setting = ivi.trusted;
1546 vf = nla_nest_start_noflag(skb, IFLA_VF_INFO);
1547 if (!vf)
1548 return -EMSGSIZE;
1549 if (nla_put(skb, IFLA_VF_MAC, sizeof(vf_mac), &vf_mac) ||
1550 nla_put(skb, IFLA_VF_BROADCAST, sizeof(vf_broadcast), &vf_broadcast) ||
1551 nla_put(skb, IFLA_VF_VLAN, sizeof(vf_vlan), &vf_vlan) ||
1552 nla_put(skb, IFLA_VF_RATE, sizeof(vf_rate),
1553 &vf_rate) ||
1554 nla_put(skb, IFLA_VF_TX_RATE, sizeof(vf_tx_rate),
1555 &vf_tx_rate) ||
1556 nla_put(skb, IFLA_VF_SPOOFCHK, sizeof(vf_spoofchk),
1557 &vf_spoofchk) ||
1558 nla_put(skb, IFLA_VF_LINK_STATE, sizeof(vf_linkstate),
1559 &vf_linkstate) ||
1560 nla_put(skb, IFLA_VF_RSS_QUERY_EN,
1561 sizeof(vf_rss_query_en),
1562 &vf_rss_query_en) ||
1563 nla_put(skb, IFLA_VF_TRUST,
1564 sizeof(vf_trust), &vf_trust))
1565 goto nla_put_vf_failure;
1566
1567 if (dev->netdev_ops->ndo_get_vf_guid &&
1568 !dev->netdev_ops->ndo_get_vf_guid(dev, vfs_num, &node_guid,
1569 &port_guid)) {
1570 if (nla_put(skb, IFLA_VF_IB_NODE_GUID, sizeof(node_guid),
1571 &node_guid) ||
1572 nla_put(skb, IFLA_VF_IB_PORT_GUID, sizeof(port_guid),
1573 &port_guid))
1574 goto nla_put_vf_failure;
1575 }
1576 vfvlanlist = nla_nest_start_noflag(skb, IFLA_VF_VLAN_LIST);
1577 if (!vfvlanlist)
1578 goto nla_put_vf_failure;
1579 if (nla_put(skb, IFLA_VF_VLAN_INFO, sizeof(vf_vlan_info),
1580 &vf_vlan_info)) {
1581 nla_nest_cancel(skb, vfvlanlist);
1582 goto nla_put_vf_failure;
1583 }
1584 nla_nest_end(skb, vfvlanlist);
1585 if (~ext_filter_mask & RTEXT_FILTER_SKIP_STATS) {
1586 memset(&vf_stats, 0, sizeof(vf_stats));
1587 if (dev->netdev_ops->ndo_get_vf_stats)
1588 dev->netdev_ops->ndo_get_vf_stats(dev, vfs_num,
1589 &vf_stats);
1590 vfstats = nla_nest_start_noflag(skb, IFLA_VF_STATS);
1591 if (!vfstats)
1592 goto nla_put_vf_failure;
1593 if (nla_put_u64_64bit(skb, IFLA_VF_STATS_RX_PACKETS,
1594 vf_stats.rx_packets, IFLA_VF_STATS_PAD) ||
1595 nla_put_u64_64bit(skb, IFLA_VF_STATS_TX_PACKETS,
1596 vf_stats.tx_packets, IFLA_VF_STATS_PAD) ||
1597 nla_put_u64_64bit(skb, IFLA_VF_STATS_RX_BYTES,
1598 vf_stats.rx_bytes, IFLA_VF_STATS_PAD) ||
1599 nla_put_u64_64bit(skb, IFLA_VF_STATS_TX_BYTES,
1600 vf_stats.tx_bytes, IFLA_VF_STATS_PAD) ||
1601 nla_put_u64_64bit(skb, IFLA_VF_STATS_BROADCAST,
1602 vf_stats.broadcast, IFLA_VF_STATS_PAD) ||
1603 nla_put_u64_64bit(skb, IFLA_VF_STATS_MULTICAST,
1604 vf_stats.multicast, IFLA_VF_STATS_PAD) ||
1605 nla_put_u64_64bit(skb, IFLA_VF_STATS_RX_DROPPED,
1606 vf_stats.rx_dropped, IFLA_VF_STATS_PAD) ||
1607 nla_put_u64_64bit(skb, IFLA_VF_STATS_TX_DROPPED,
1608 vf_stats.tx_dropped, IFLA_VF_STATS_PAD)) {
1609 nla_nest_cancel(skb, vfstats);
1610 goto nla_put_vf_failure;
1611 }
1612 nla_nest_end(skb, vfstats);
1613 }
1614 nla_nest_end(skb, vf);
1615 return 0;
1616
1617 nla_put_vf_failure:
1618 nla_nest_cancel(skb, vf);
1619 return -EMSGSIZE;
1620 }
1621
rtnl_fill_vf(struct sk_buff * skb,struct net_device * dev,u32 ext_filter_mask)1622 static noinline_for_stack int rtnl_fill_vf(struct sk_buff *skb,
1623 struct net_device *dev,
1624 u32 ext_filter_mask)
1625 {
1626 struct nlattr *vfinfo;
1627 int i, num_vfs;
1628
1629 if (!dev->dev.parent || ((ext_filter_mask & RTEXT_FILTER_VF) == 0))
1630 return 0;
1631
1632 num_vfs = dev_num_vf(dev->dev.parent);
1633 if (nla_put_u32(skb, IFLA_NUM_VF, num_vfs))
1634 return -EMSGSIZE;
1635
1636 if (!dev->netdev_ops->ndo_get_vf_config)
1637 return 0;
1638
1639 vfinfo = nla_nest_start_noflag(skb, IFLA_VFINFO_LIST);
1640 if (!vfinfo)
1641 return -EMSGSIZE;
1642
1643 for (i = 0; i < num_vfs; i++) {
1644 if (rtnl_fill_vfinfo(skb, dev, i, ext_filter_mask)) {
1645 nla_nest_cancel(skb, vfinfo);
1646 return -EMSGSIZE;
1647 }
1648 }
1649
1650 nla_nest_end(skb, vfinfo);
1651 return 0;
1652 }
1653
rtnl_fill_link_ifmap(struct sk_buff * skb,const struct net_device * dev)1654 static int rtnl_fill_link_ifmap(struct sk_buff *skb,
1655 const struct net_device *dev)
1656 {
1657 struct rtnl_link_ifmap map;
1658
1659 memset(&map, 0, sizeof(map));
1660 map.mem_start = READ_ONCE(dev->mem_start);
1661 map.mem_end = READ_ONCE(dev->mem_end);
1662 map.base_addr = READ_ONCE(dev->base_addr);
1663 map.irq = READ_ONCE(dev->irq);
1664 map.dma = READ_ONCE(dev->dma);
1665 map.port = READ_ONCE(dev->if_port);
1666
1667 if (nla_put_64bit(skb, IFLA_MAP, sizeof(map), &map, IFLA_PAD))
1668 return -EMSGSIZE;
1669
1670 return 0;
1671 }
1672
rtnl_xdp_prog_skb(struct net_device * dev)1673 static u32 rtnl_xdp_prog_skb(struct net_device *dev)
1674 {
1675 const struct bpf_prog *generic_xdp_prog;
1676 u32 res = 0;
1677
1678 rcu_read_lock();
1679 generic_xdp_prog = rcu_dereference(dev->xdp_prog);
1680 if (generic_xdp_prog)
1681 res = generic_xdp_prog->aux->id;
1682 rcu_read_unlock();
1683
1684 return res;
1685 }
1686
rtnl_xdp_prog_drv(struct net_device * dev)1687 static u32 rtnl_xdp_prog_drv(struct net_device *dev)
1688 {
1689 return dev_xdp_prog_id(dev, XDP_MODE_DRV);
1690 }
1691
rtnl_xdp_prog_hw(struct net_device * dev)1692 static u32 rtnl_xdp_prog_hw(struct net_device *dev)
1693 {
1694 return dev_xdp_prog_id(dev, XDP_MODE_HW);
1695 }
1696
/*
 * Report one XDP attachment point.
 *
 * @get_prog_id is asked for the program id; a zero id means nothing is
 * attached there and nothing is emitted. Otherwise the id is stored in
 * *@prog_id and emitted as attribute @attr, and *@mode is updated: it
 * becomes @tgt_mode if it was still XDP_ATTACHED_NONE, else
 * XDP_ATTACHED_MULTI.
 *
 * Returns 0 on success or the error from nla_put_u32().
 */
static int rtnl_xdp_report_one(struct sk_buff *skb, struct net_device *dev,
			       u32 *prog_id, u8 *mode, u8 tgt_mode, u32 attr,
			       u32 (*get_prog_id)(struct net_device *dev))
{
	u32 id = get_prog_id(dev);
	int err;

	if (!id)
		return 0;

	*prog_id = id;
	err = nla_put_u32(skb, attr, id);
	if (err)
		return err;

	*mode = (*mode == XDP_ATTACHED_NONE) ? tgt_mode : XDP_ATTACHED_MULTI;

	return 0;
}
1720
rtnl_xdp_fill(struct sk_buff * skb,struct net_device * dev)1721 static int rtnl_xdp_fill(struct sk_buff *skb, struct net_device *dev)
1722 {
1723 struct nlattr *xdp;
1724 u32 prog_id;
1725 int err;
1726 u8 mode;
1727
1728 xdp = nla_nest_start_noflag(skb, IFLA_XDP);
1729 if (!xdp)
1730 return -EMSGSIZE;
1731
1732 prog_id = 0;
1733 mode = XDP_ATTACHED_NONE;
1734 err = rtnl_xdp_report_one(skb, dev, &prog_id, &mode, XDP_ATTACHED_SKB,
1735 IFLA_XDP_SKB_PROG_ID, rtnl_xdp_prog_skb);
1736 if (err)
1737 goto err_cancel;
1738 err = rtnl_xdp_report_one(skb, dev, &prog_id, &mode, XDP_ATTACHED_DRV,
1739 IFLA_XDP_DRV_PROG_ID, rtnl_xdp_prog_drv);
1740 if (err)
1741 goto err_cancel;
1742 err = rtnl_xdp_report_one(skb, dev, &prog_id, &mode, XDP_ATTACHED_HW,
1743 IFLA_XDP_HW_PROG_ID, rtnl_xdp_prog_hw);
1744 if (err)
1745 goto err_cancel;
1746
1747 err = nla_put_u8(skb, IFLA_XDP_ATTACHED, mode);
1748 if (err)
1749 goto err_cancel;
1750
1751 if (prog_id && mode != XDP_ATTACHED_MULTI) {
1752 err = nla_put_u32(skb, IFLA_XDP_PROG_ID, prog_id);
1753 if (err)
1754 goto err_cancel;
1755 }
1756
1757 nla_nest_end(skb, xdp);
1758 return 0;
1759
1760 err_cancel:
1761 nla_nest_cancel(skb, xdp);
1762 return err;
1763 }
1764
rtnl_get_event(unsigned long event)1765 static u32 rtnl_get_event(unsigned long event)
1766 {
1767 u32 rtnl_event_type = IFLA_EVENT_NONE;
1768
1769 switch (event) {
1770 case NETDEV_REBOOT:
1771 rtnl_event_type = IFLA_EVENT_REBOOT;
1772 break;
1773 case NETDEV_FEAT_CHANGE:
1774 rtnl_event_type = IFLA_EVENT_FEATURES;
1775 break;
1776 case NETDEV_BONDING_FAILOVER:
1777 rtnl_event_type = IFLA_EVENT_BONDING_FAILOVER;
1778 break;
1779 case NETDEV_NOTIFY_PEERS:
1780 rtnl_event_type = IFLA_EVENT_NOTIFY_PEERS;
1781 break;
1782 case NETDEV_RESEND_IGMP:
1783 rtnl_event_type = IFLA_EVENT_IGMP_RESEND;
1784 break;
1785 case NETDEV_CHANGEINFODATA:
1786 rtnl_event_type = IFLA_EVENT_BONDING_OPTIONS;
1787 break;
1788 default:
1789 break;
1790 }
1791
1792 return rtnl_event_type;
1793 }
1794
put_master_ifindex(struct sk_buff * skb,struct net_device * dev)1795 static int put_master_ifindex(struct sk_buff *skb, struct net_device *dev)
1796 {
1797 const struct net_device *upper_dev;
1798 int ret = 0;
1799
1800 rcu_read_lock();
1801
1802 upper_dev = netdev_master_upper_dev_get_rcu(dev);
1803 if (upper_dev)
1804 ret = nla_put_u32(skb, IFLA_MASTER,
1805 READ_ONCE(upper_dev->ifindex));
1806
1807 rcu_read_unlock();
1808 return ret;
1809 }
1810
/*
 * Emit IFLA_LINK when @force is set or when the value returned by
 * dev_get_iflink() differs from the device's own ifindex; otherwise emit
 * nothing and return 0.
 */
static int nla_put_iflink(struct sk_buff *skb, const struct net_device *dev,
			  bool force)
{
	int iflink = dev_get_iflink(dev);

	if (!force && READ_ONCE(dev->ifindex) == iflink)
		return 0;

	return nla_put_u32(skb, IFLA_LINK, iflink);
}
1821
nla_put_ifalias(struct sk_buff * skb,struct net_device * dev)1822 static noinline_for_stack int nla_put_ifalias(struct sk_buff *skb,
1823 struct net_device *dev)
1824 {
1825 char buf[IFALIASZ];
1826 int ret;
1827
1828 ret = dev_get_alias(dev, buf, sizeof(buf));
1829 return ret > 0 ? nla_put_string(skb, IFLA_IFALIAS, buf) : 0;
1830 }
1831
/*
 * Emit IFLA_LINK_NETNSID (when applicable) followed by IFLA_LINK.
 *
 * If the link ops provide get_link_net() and the returned namespace
 * differs from the device's own, the id of that namespace as seen from
 * @src_net is emitted and IFLA_LINK is forced. Otherwise IFLA_LINK follows
 * the normal nla_put_iflink() rule.
 */
static int rtnl_fill_link_netnsid(struct sk_buff *skb,
				  const struct net_device *dev,
				  struct net *src_net, gfp_t gfp)
{
	const struct rtnl_link_ops *ops = dev->rtnl_link_ops;
	struct net *link_net;
	int nsid;

	if (!ops || !ops->get_link_net)
		return nla_put_iflink(skb, dev, false);

	link_net = ops->get_link_net(dev);
	if (net_eq(dev_net(dev), link_net))
		return nla_put_iflink(skb, dev, false);

	nsid = peernet2id_alloc(src_net, link_net, gfp);
	if (nla_put_s32(skb, IFLA_LINK_NETNSID, nsid))
		return -EMSGSIZE;

	return nla_put_iflink(skb, dev, true);
}
1853
/*
 * Emit the IFLA_AF_SPEC nest with one sub-nest per registered address
 * family that implements fill_link_af().
 *
 * The sub-nest type is the family number. A family that returns -ENODATA
 * has its (empty) sub-nest removed and is skipped; any other negative
 * return aborts with -EMSGSIZE, leaving cleanup of the partially written
 * message to the caller.
 *
 * The af_ops list is walked with list_for_each_entry_rcu().
 */
static int rtnl_fill_link_af(struct sk_buff *skb,
			     const struct net_device *dev,
			     u32 ext_filter_mask)
{
	const struct rtnl_af_ops *af_ops;
	struct nlattr *af_spec;

	af_spec = nla_nest_start_noflag(skb, IFLA_AF_SPEC);
	if (!af_spec)
		return -EMSGSIZE;

	list_for_each_entry_rcu(af_ops, &rtnl_af_ops, list) {
		struct nlattr *af;
		int err;

		if (!af_ops->fill_link_af)
			continue;

		af = nla_nest_start_noflag(skb, af_ops->family);
		if (!af)
			return -EMSGSIZE;

		err = af_ops->fill_link_af(skb, dev, ext_filter_mask);
		/*
		 * Caller may return ENODATA to indicate that there
		 * was no data to be dumped. This is not an error, it
		 * means we should trim the attribute header and
		 * continue. The nest must not be ended after it has
		 * been cancelled: its header is no longer part of the
		 * message.
		 */
		if (err == -ENODATA) {
			nla_nest_cancel(skb, af);
			continue;
		}
		if (err < 0)
			return -EMSGSIZE;

		nla_nest_end(skb, af);
	}

	nla_nest_end(skb, af_spec);
	return 0;
}
1894
rtnl_fill_alt_ifnames(struct sk_buff * skb,const struct net_device * dev)1895 static int rtnl_fill_alt_ifnames(struct sk_buff *skb,
1896 const struct net_device *dev)
1897 {
1898 struct netdev_name_node *name_node;
1899 int count = 0;
1900
1901 list_for_each_entry_rcu(name_node, &dev->name_node->list, list) {
1902 if (nla_put_string(skb, IFLA_ALT_IFNAME, name_node->name))
1903 return -EMSGSIZE;
1904 count++;
1905 }
1906 return count;
1907 }
1908
1909 /* RCU protected. */
rtnl_fill_prop_list(struct sk_buff * skb,const struct net_device * dev)1910 static int rtnl_fill_prop_list(struct sk_buff *skb,
1911 const struct net_device *dev)
1912 {
1913 struct nlattr *prop_list;
1914 int ret;
1915
1916 prop_list = nla_nest_start(skb, IFLA_PROP_LIST);
1917 if (!prop_list)
1918 return -EMSGSIZE;
1919
1920 ret = rtnl_fill_alt_ifnames(skb, dev);
1921 if (ret <= 0)
1922 goto nest_cancel;
1923
1924 nla_nest_end(skb, prop_list);
1925 return 0;
1926
1927 nest_cancel:
1928 nla_nest_cancel(skb, prop_list);
1929 return ret;
1930 }
1931
rtnl_fill_proto_down(struct sk_buff * skb,const struct net_device * dev)1932 static int rtnl_fill_proto_down(struct sk_buff *skb,
1933 const struct net_device *dev)
1934 {
1935 struct nlattr *pr;
1936 u32 preason;
1937
1938 if (nla_put_u8(skb, IFLA_PROTO_DOWN, READ_ONCE(dev->proto_down)))
1939 goto nla_put_failure;
1940
1941 preason = READ_ONCE(dev->proto_down_reason);
1942 if (!preason)
1943 return 0;
1944
1945 pr = nla_nest_start(skb, IFLA_PROTO_DOWN_REASON);
1946 if (!pr)
1947 return -EMSGSIZE;
1948
1949 if (nla_put_u32(skb, IFLA_PROTO_DOWN_REASON_VALUE, preason)) {
1950 nla_nest_cancel(skb, pr);
1951 goto nla_put_failure;
1952 }
1953
1954 nla_nest_end(skb, pr);
1955 return 0;
1956
1957 nla_put_failure:
1958 return -EMSGSIZE;
1959 }
1960
rtnl_fill_devlink_port(struct sk_buff * skb,const struct net_device * dev)1961 static int rtnl_fill_devlink_port(struct sk_buff *skb,
1962 const struct net_device *dev)
1963 {
1964 struct nlattr *devlink_port_nest;
1965 int ret;
1966
1967 devlink_port_nest = nla_nest_start(skb, IFLA_DEVLINK_PORT);
1968 if (!devlink_port_nest)
1969 return -EMSGSIZE;
1970
1971 if (dev->devlink_port) {
1972 ret = devlink_nl_port_handle_fill(skb, dev->devlink_port);
1973 if (ret < 0)
1974 goto nest_cancel;
1975 }
1976
1977 nla_nest_end(skb, devlink_port_nest);
1978 return 0;
1979
1980 nest_cancel:
1981 nla_nest_cancel(skb, devlink_port_nest);
1982 return ret;
1983 }
1984
rtnl_fill_dpll_pin(struct sk_buff * skb,const struct net_device * dev)1985 static int rtnl_fill_dpll_pin(struct sk_buff *skb,
1986 const struct net_device *dev)
1987 {
1988 struct nlattr *dpll_pin_nest;
1989 int ret;
1990
1991 dpll_pin_nest = nla_nest_start(skb, IFLA_DPLL_PIN);
1992 if (!dpll_pin_nest)
1993 return -EMSGSIZE;
1994
1995 ret = dpll_netdev_add_pin_handle(skb, dev);
1996 if (ret < 0)
1997 goto nest_cancel;
1998
1999 nla_nest_end(skb, dpll_pin_nest);
2000 return 0;
2001
2002 nest_cancel:
2003 nla_nest_cancel(skb, dpll_pin_nest);
2004 return ret;
2005 }
2006
/*
 * Build one complete link message of type @type for @dev in @skb.
 *
 * The ifinfomsg header is filled from the device and @change, then the
 * attributes are appended in a fixed order. Optional attributes:
 *   - IFLA_TARGET_NETNSID only when @tgt_netnsid >= 0
 *   - IFLA_EVENT only when @event is not IFLA_EVENT_NONE
 *   - IFLA_NEW_NETNSID only when @new_nsid is non-NULL
 *   - IFLA_NEW_IFINDEX only when @new_ifindex is non-zero
 *
 * Must be called with RTNL held (ASSERT_RTNL). The link-netnsid, qdisc,
 * AF_SPEC, ifmap and property-list attributes are filled inside an RCU
 * read-side section; the netnsid lookup there always uses GFP_ATOMIC.
 *
 * Returns 0 on success. On any failure the message is cancelled and
 * -EMSGSIZE is returned.
 */
static int rtnl_fill_ifinfo(struct sk_buff *skb,
			    struct net_device *dev, struct net *src_net,
			    int type, u32 pid, u32 seq, u32 change,
			    unsigned int flags, u32 ext_filter_mask,
			    u32 event, int *new_nsid, int new_ifindex,
			    int tgt_netnsid, gfp_t gfp)
{
	char devname[IFNAMSIZ];
	struct ifinfomsg *ifm;
	struct nlmsghdr *nlh;
	struct Qdisc *qdisc;

	ASSERT_RTNL();
	nlh = nlmsg_put(skb, pid, seq, type, sizeof(*ifm), flags);
	if (!nlh)
		return -EMSGSIZE;

	/* Fixed header. */
	ifm = nlmsg_data(nlh);
	ifm->ifi_family = AF_UNSPEC;
	ifm->__ifi_pad = 0;
	ifm->ifi_type = READ_ONCE(dev->type);
	ifm->ifi_index = READ_ONCE(dev->ifindex);
	ifm->ifi_flags = dev_get_flags(dev);
	ifm->ifi_change = change;

	if (tgt_netnsid >= 0 &&
	    nla_put_s32(skb, IFLA_TARGET_NETNSID, tgt_netnsid))
		goto cancel;

	netdev_copy_name(dev, devname);
	if (nla_put_string(skb, IFLA_IFNAME, devname))
		goto cancel;

	/* Scalar device parameters. */
	if (nla_put_u32(skb, IFLA_TXQLEN, READ_ONCE(dev->tx_queue_len)) ||
	    nla_put_u8(skb, IFLA_OPERSTATE,
		       netif_running(dev) ? READ_ONCE(dev->operstate) :
					    IF_OPER_DOWN) ||
	    nla_put_u8(skb, IFLA_LINKMODE, READ_ONCE(dev->link_mode)) ||
	    nla_put_u32(skb, IFLA_MTU, READ_ONCE(dev->mtu)) ||
	    nla_put_u32(skb, IFLA_MIN_MTU, READ_ONCE(dev->min_mtu)) ||
	    nla_put_u32(skb, IFLA_MAX_MTU, READ_ONCE(dev->max_mtu)) ||
	    nla_put_u32(skb, IFLA_GROUP, READ_ONCE(dev->group)) ||
	    nla_put_u32(skb, IFLA_PROMISCUITY, READ_ONCE(dev->promiscuity)) ||
	    nla_put_u32(skb, IFLA_ALLMULTI, READ_ONCE(dev->allmulti)) ||
	    nla_put_u32(skb, IFLA_NUM_TX_QUEUES,
			READ_ONCE(dev->num_tx_queues)) ||
	    nla_put_u32(skb, IFLA_GSO_MAX_SEGS,
			READ_ONCE(dev->gso_max_segs)) ||
	    nla_put_u32(skb, IFLA_GSO_MAX_SIZE,
			READ_ONCE(dev->gso_max_size)) ||
	    nla_put_u32(skb, IFLA_GRO_MAX_SIZE,
			READ_ONCE(dev->gro_max_size)) ||
	    nla_put_u32(skb, IFLA_GSO_IPV4_MAX_SIZE,
			READ_ONCE(dev->gso_ipv4_max_size)) ||
	    nla_put_u32(skb, IFLA_GRO_IPV4_MAX_SIZE,
			READ_ONCE(dev->gro_ipv4_max_size)) ||
	    nla_put_u32(skb, IFLA_TSO_MAX_SIZE,
			READ_ONCE(dev->tso_max_size)) ||
	    nla_put_u32(skb, IFLA_TSO_MAX_SEGS,
			READ_ONCE(dev->tso_max_segs)) ||
	    nla_put_uint(skb, IFLA_MAX_PACING_OFFLOAD_HORIZON,
			 READ_ONCE(dev->max_pacing_offload_horizon)))
		goto cancel;

#ifdef CONFIG_RPS
	if (nla_put_u32(skb, IFLA_NUM_RX_QUEUES,
			READ_ONCE(dev->num_rx_queues)))
		goto cancel;
#endif

	/* Master, carrier state, alias and carrier transition counters. */
	if (put_master_ifindex(skb, dev) ||
	    nla_put_u8(skb, IFLA_CARRIER, netif_carrier_ok(dev)) ||
	    nla_put_ifalias(skb, dev) ||
	    nla_put_u32(skb, IFLA_CARRIER_CHANGES,
			atomic_read(&dev->carrier_up_count) +
			atomic_read(&dev->carrier_down_count)) ||
	    nla_put_u32(skb, IFLA_CARRIER_UP_COUNT,
			atomic_read(&dev->carrier_up_count)) ||
	    nla_put_u32(skb, IFLA_CARRIER_DOWN_COUNT,
			atomic_read(&dev->carrier_down_count)))
		goto cancel;

	if (rtnl_fill_proto_down(skb, dev))
		goto cancel;

	if (event != IFLA_EVENT_NONE &&
	    nla_put_u32(skb, IFLA_EVENT, event))
		goto cancel;

	/* Hardware and broadcast addresses, only for devices that have one. */
	if (dev->addr_len &&
	    (nla_put(skb, IFLA_ADDRESS, dev->addr_len, dev->dev_addr) ||
	     nla_put(skb, IFLA_BROADCAST, dev->addr_len, dev->broadcast)))
		goto cancel;

	if (rtnl_phys_port_id_fill(skb, dev) ||
	    rtnl_phys_port_name_fill(skb, dev) ||
	    rtnl_phys_switch_id_fill(skb, dev))
		goto cancel;

	if (rtnl_fill_stats(skb, dev) ||
	    rtnl_fill_vf(skb, dev, ext_filter_mask) ||
	    rtnl_port_fill(skb, dev, ext_filter_mask) ||
	    rtnl_xdp_fill(skb, dev))
		goto cancel;

	if ((dev->rtnl_link_ops || rtnl_have_link_slave_info(dev)) &&
	    rtnl_link_fill(skb, dev) < 0)
		goto cancel;

	if (new_nsid &&
	    nla_put_s32(skb, IFLA_NEW_NETNSID, *new_nsid) < 0)
		goto cancel;
	if (new_ifindex &&
	    nla_put_s32(skb, IFLA_NEW_IFINDEX, new_ifindex) < 0)
		goto cancel;

	/* The permanent address is reported only when it is not all zeroes. */
	if (memchr_inv(dev->perm_addr, '\0', dev->addr_len) &&
	    nla_put(skb, IFLA_PERM_ADDRESS, dev->addr_len, dev->perm_addr))
		goto cancel;

	/* Attributes that are read under RCU. */
	rcu_read_lock();
	if (rtnl_fill_link_netnsid(skb, dev, src_net, GFP_ATOMIC))
		goto unlock_cancel;

	qdisc = rcu_dereference(dev->qdisc);
	if (qdisc && nla_put_string(skb, IFLA_QDISC, qdisc->ops->id))
		goto unlock_cancel;

	if (rtnl_fill_link_af(skb, dev, ext_filter_mask) ||
	    rtnl_fill_link_ifmap(skb, dev) ||
	    rtnl_fill_prop_list(skb, dev))
		goto unlock_cancel;
	rcu_read_unlock();

	/* Parent device name and the name of the bus it sits on. */
	if (dev->dev.parent &&
	    nla_put_string(skb, IFLA_PARENT_DEV_NAME,
			   dev_name(dev->dev.parent)))
		goto cancel;

	if (dev->dev.parent && dev->dev.parent->bus &&
	    nla_put_string(skb, IFLA_PARENT_DEV_BUS_NAME,
			   dev->dev.parent->bus->name))
		goto cancel;

	if (rtnl_fill_devlink_port(skb, dev) ||
	    rtnl_fill_dpll_pin(skb, dev))
		goto cancel;

	nlmsg_end(skb, nlh);
	return 0;

unlock_cancel:
	rcu_read_unlock();
cancel:
	nlmsg_cancel(skb, nlh);
	return -EMSGSIZE;
}
2174
2175 static const struct nla_policy ifla_policy[IFLA_MAX+1] = {
2176 [IFLA_UNSPEC] = { .strict_start_type = IFLA_DPLL_PIN },
2177 [IFLA_IFNAME] = { .type = NLA_STRING, .len = IFNAMSIZ-1 },
2178 [IFLA_ADDRESS] = { .type = NLA_BINARY, .len = MAX_ADDR_LEN },
2179 [IFLA_BROADCAST] = { .type = NLA_BINARY, .len = MAX_ADDR_LEN },
2180 [IFLA_MAP] = { .len = sizeof(struct rtnl_link_ifmap) },
2181 [IFLA_MTU] = { .type = NLA_U32 },
2182 [IFLA_LINK] = { .type = NLA_U32 },
2183 [IFLA_MASTER] = { .type = NLA_U32 },
2184 [IFLA_CARRIER] = { .type = NLA_U8 },
2185 [IFLA_TXQLEN] = { .type = NLA_U32 },
2186 [IFLA_WEIGHT] = { .type = NLA_U32 },
2187 [IFLA_OPERSTATE] = { .type = NLA_U8 },
2188 [IFLA_LINKMODE] = { .type = NLA_U8 },
2189 [IFLA_LINKINFO] = { .type = NLA_NESTED },
2190 [IFLA_NET_NS_PID] = { .type = NLA_U32 },
2191 [IFLA_NET_NS_FD] = { .type = NLA_U32 },
2192 /* IFLA_IFALIAS is a string, but policy is set to NLA_BINARY to
2193 * allow 0-length string (needed to remove an alias).
2194 */
2195 [IFLA_IFALIAS] = { .type = NLA_BINARY, .len = IFALIASZ - 1 },
2196 [IFLA_VFINFO_LIST] = {. type = NLA_NESTED },
2197 [IFLA_VF_PORTS] = { .type = NLA_NESTED },
2198 [IFLA_PORT_SELF] = { .type = NLA_NESTED },
2199 [IFLA_AF_SPEC] = { .type = NLA_NESTED },
2200 [IFLA_EXT_MASK] = { .type = NLA_U32 },
2201 [IFLA_PROMISCUITY] = { .type = NLA_U32 },
2202 [IFLA_NUM_TX_QUEUES] = { .type = NLA_U32 },
2203 [IFLA_NUM_RX_QUEUES] = { .type = NLA_U32 },
2204 [IFLA_GSO_MAX_SEGS] = { .type = NLA_U32 },
2205 [IFLA_GSO_MAX_SIZE] = NLA_POLICY_MIN(NLA_U32, MAX_TCP_HEADER + 1),
2206 [IFLA_PHYS_PORT_ID] = { .type = NLA_BINARY, .len = MAX_PHYS_ITEM_ID_LEN },
2207 [IFLA_CARRIER_CHANGES] = { .type = NLA_U32 }, /* ignored */
2208 [IFLA_PHYS_SWITCH_ID] = { .type = NLA_BINARY, .len = MAX_PHYS_ITEM_ID_LEN },
2209 [IFLA_LINK_NETNSID] = { .type = NLA_S32 },
2210 [IFLA_PROTO_DOWN] = { .type = NLA_U8 },
2211 [IFLA_XDP] = { .type = NLA_NESTED },
2212 [IFLA_EVENT] = { .type = NLA_U32 },
2213 [IFLA_GROUP] = { .type = NLA_U32 },
2214 [IFLA_TARGET_NETNSID] = { .type = NLA_S32 },
2215 [IFLA_CARRIER_UP_COUNT] = { .type = NLA_U32 },
2216 [IFLA_CARRIER_DOWN_COUNT] = { .type = NLA_U32 },
2217 [IFLA_MIN_MTU] = { .type = NLA_U32 },
2218 [IFLA_MAX_MTU] = { .type = NLA_U32 },
2219 [IFLA_PROP_LIST] = { .type = NLA_NESTED },
2220 [IFLA_ALT_IFNAME] = { .type = NLA_STRING,
2221 .len = ALTIFNAMSIZ - 1 },
2222 [IFLA_PERM_ADDRESS] = { .type = NLA_REJECT },
2223 [IFLA_PROTO_DOWN_REASON] = { .type = NLA_NESTED },
2224 [IFLA_NEW_IFINDEX] = NLA_POLICY_MIN(NLA_S32, 1),
2225 [IFLA_PARENT_DEV_NAME] = { .type = NLA_NUL_STRING },
2226 [IFLA_GRO_MAX_SIZE] = { .type = NLA_U32 },
2227 [IFLA_TSO_MAX_SIZE] = { .type = NLA_REJECT },
2228 [IFLA_TSO_MAX_SEGS] = { .type = NLA_REJECT },
2229 [IFLA_ALLMULTI] = { .type = NLA_REJECT },
2230 [IFLA_GSO_IPV4_MAX_SIZE] = NLA_POLICY_MIN(NLA_U32, MAX_TCP_HEADER + 1),
2231 [IFLA_GRO_IPV4_MAX_SIZE] = { .type = NLA_U32 },
2232 };
2233
2234 static const struct nla_policy ifla_info_policy[IFLA_INFO_MAX+1] = {
2235 [IFLA_INFO_KIND] = { .type = NLA_STRING },
2236 [IFLA_INFO_DATA] = { .type = NLA_NESTED },
2237 [IFLA_INFO_SLAVE_KIND] = { .type = NLA_STRING },
2238 [IFLA_INFO_SLAVE_DATA] = { .type = NLA_NESTED },
2239 };
2240
2241 static const struct nla_policy ifla_vf_policy[IFLA_VF_MAX+1] = {
2242 [IFLA_VF_MAC] = { .len = sizeof(struct ifla_vf_mac) },
2243 [IFLA_VF_BROADCAST] = { .type = NLA_REJECT },
2244 [IFLA_VF_VLAN] = { .len = sizeof(struct ifla_vf_vlan) },
2245 [IFLA_VF_VLAN_LIST] = { .type = NLA_NESTED },
2246 [IFLA_VF_TX_RATE] = { .len = sizeof(struct ifla_vf_tx_rate) },
2247 [IFLA_VF_SPOOFCHK] = { .len = sizeof(struct ifla_vf_spoofchk) },
2248 [IFLA_VF_RATE] = { .len = sizeof(struct ifla_vf_rate) },
2249 [IFLA_VF_LINK_STATE] = { .len = sizeof(struct ifla_vf_link_state) },
2250 [IFLA_VF_RSS_QUERY_EN] = { .len = sizeof(struct ifla_vf_rss_query_en) },
2251 [IFLA_VF_STATS] = { .type = NLA_NESTED },
2252 [IFLA_VF_TRUST] = { .len = sizeof(struct ifla_vf_trust) },
2253 [IFLA_VF_IB_NODE_GUID] = { .len = sizeof(struct ifla_vf_guid) },
2254 [IFLA_VF_IB_PORT_GUID] = { .len = sizeof(struct ifla_vf_guid) },
2255 };
2256
2257 static const struct nla_policy ifla_port_policy[IFLA_PORT_MAX+1] = {
2258 [IFLA_PORT_VF] = { .type = NLA_U32 },
2259 [IFLA_PORT_PROFILE] = { .type = NLA_STRING,
2260 .len = PORT_PROFILE_MAX },
2261 [IFLA_PORT_INSTANCE_UUID] = { .type = NLA_BINARY,
2262 .len = PORT_UUID_MAX },
2263 [IFLA_PORT_HOST_UUID] = { .type = NLA_STRING,
2264 .len = PORT_UUID_MAX },
2265 [IFLA_PORT_REQUEST] = { .type = NLA_U8, },
2266 [IFLA_PORT_RESPONSE] = { .type = NLA_U16, },
2267
2268 /* Unused, but we need to keep it here since user space could
2269 * fill it. It's also broken with regard to NLA_BINARY use in
2270 * combination with structs.
2271 */
2272 [IFLA_PORT_VSI_TYPE] = { .type = NLA_BINARY,
2273 .len = sizeof(struct ifla_port_vsi) },
2274 };
2275
2276 static const struct nla_policy ifla_xdp_policy[IFLA_XDP_MAX + 1] = {
2277 [IFLA_XDP_UNSPEC] = { .strict_start_type = IFLA_XDP_EXPECTED_FD },
2278 [IFLA_XDP_FD] = { .type = NLA_S32 },
2279 [IFLA_XDP_EXPECTED_FD] = { .type = NLA_S32 },
2280 [IFLA_XDP_ATTACHED] = { .type = NLA_U8 },
2281 [IFLA_XDP_FLAGS] = { .type = NLA_U32 },
2282 [IFLA_XDP_PROG_ID] = { .type = NLA_U32 },
2283 };
2284
linkinfo_to_kind_ops(const struct nlattr * nla,int * ops_srcu_index)2285 static struct rtnl_link_ops *linkinfo_to_kind_ops(const struct nlattr *nla,
2286 int *ops_srcu_index)
2287 {
2288 struct nlattr *linfo[IFLA_INFO_MAX + 1];
2289 struct rtnl_link_ops *ops = NULL;
2290
2291 if (nla_parse_nested_deprecated(linfo, IFLA_INFO_MAX, nla, ifla_info_policy, NULL) < 0)
2292 return NULL;
2293
2294 if (linfo[IFLA_INFO_KIND]) {
2295 char kind[MODULE_NAME_LEN];
2296
2297 nla_strscpy(kind, linfo[IFLA_INFO_KIND], sizeof(kind));
2298 ops = rtnl_link_ops_get(kind, ops_srcu_index);
2299 }
2300
2301 return ops;
2302 }
2303
link_master_filtered(struct net_device * dev,int master_idx)2304 static bool link_master_filtered(struct net_device *dev, int master_idx)
2305 {
2306 struct net_device *master;
2307
2308 if (!master_idx)
2309 return false;
2310
2311 master = netdev_master_upper_dev_get(dev);
2312
2313 /* 0 is already used to denote IFLA_MASTER wasn't passed, therefore need
2314 * another invalid value for ifindex to denote "no master".
2315 */
2316 if (master_idx == -1)
2317 return !!master;
2318
2319 if (!master || master->ifindex != master_idx)
2320 return true;
2321
2322 return false;
2323 }
2324
link_kind_filtered(const struct net_device * dev,const struct rtnl_link_ops * kind_ops)2325 static bool link_kind_filtered(const struct net_device *dev,
2326 const struct rtnl_link_ops *kind_ops)
2327 {
2328 if (kind_ops && dev->rtnl_link_ops != kind_ops)
2329 return true;
2330
2331 return false;
2332 }
2333
link_dump_filtered(struct net_device * dev,int master_idx,const struct rtnl_link_ops * kind_ops)2334 static bool link_dump_filtered(struct net_device *dev,
2335 int master_idx,
2336 const struct rtnl_link_ops *kind_ops)
2337 {
2338 if (link_master_filtered(dev, master_idx) ||
2339 link_kind_filtered(dev, kind_ops))
2340 return true;
2341
2342 return false;
2343 }
2344
2345 /**
2346 * rtnl_get_net_ns_capable - Get netns if sufficiently privileged.
2347 * @sk: netlink socket
2348 * @netnsid: network namespace identifier
2349 *
2350 * Returns the network namespace identified by netnsid on success or an error
2351 * pointer on failure.
2352 */
rtnl_get_net_ns_capable(struct sock * sk,int netnsid)2353 struct net *rtnl_get_net_ns_capable(struct sock *sk, int netnsid)
2354 {
2355 struct net *net;
2356
2357 net = get_net_ns_by_id(sock_net(sk), netnsid);
2358 if (!net)
2359 return ERR_PTR(-EINVAL);
2360
2361 /* For now, the caller is required to have CAP_NET_ADMIN in
2362 * the user namespace owning the target net ns.
2363 */
2364 if (!sk_ns_capable(sk, net->user_ns, CAP_NET_ADMIN)) {
2365 put_net(net);
2366 return ERR_PTR(-EACCES);
2367 }
2368 return net;
2369 }
2370 EXPORT_SYMBOL_GPL(rtnl_get_net_ns_capable);
2371
/*
 * Validate a link dump request and parse its attributes into @tb.
 *
 * Without @strict_check the message is parsed leniently, guessing the
 * header type from the payload length.  With @strict_check the header must
 * be a full struct ifinfomsg whose fields are all zero, and the attributes
 * are parsed with the strict variant of the parser.
 *
 * Returns the parser's result, or -EINVAL (with an extack message) when the
 * strict header checks fail.
 */
static int rtnl_valid_dump_ifinfo_req(const struct nlmsghdr *nlh,
				      bool strict_check, struct nlattr **tb,
				      struct netlink_ext_ack *extack)
{
	const struct ifinfomsg *hdr;

	if (!strict_check) {
		int hdrlen = sizeof(struct ifinfomsg);

		/* Compatibility hack for the kernel<->userspace interface.
		 * The proper header is ifinfomsg, matching rtnl_getlink.
		 * Before Linux v3.9, however, this code assumed rtgenmsg,
		 * and iproute2 < v3.9.0 sent exactly that.  Such an old
		 * iproute2 is detectable: even with IFLA_EXT_MASK included
		 * its message is shorter than struct ifinfomsg.
		 */
		if (nlmsg_len(nlh) < sizeof(struct ifinfomsg))
			hdrlen = sizeof(struct rtgenmsg);

		return nlmsg_parse_deprecated(nlh, hdrlen, tb, IFLA_MAX,
					      ifla_policy, extack);
	}

	if (nlh->nlmsg_len < nlmsg_msg_size(sizeof(*hdr))) {
		NL_SET_ERR_MSG(extack, "Invalid header for link dump");
		return -EINVAL;
	}

	hdr = nlmsg_data(nlh);

	if (hdr->__ifi_pad || hdr->ifi_type || hdr->ifi_flags ||
	    hdr->ifi_change) {
		NL_SET_ERR_MSG(extack, "Invalid values in header for link dump request");
		return -EINVAL;
	}

	if (hdr->ifi_index) {
		NL_SET_ERR_MSG(extack, "Filter by device index not supported for link dumps");
		return -EINVAL;
	}

	return nlmsg_parse_deprecated_strict(nlh, sizeof(*hdr), tb, IFLA_MAX,
					     ifla_policy, extack);
}
2415
rtnl_dump_ifinfo(struct sk_buff * skb,struct netlink_callback * cb)2416 static int rtnl_dump_ifinfo(struct sk_buff *skb, struct netlink_callback *cb)
2417 {
2418 struct netlink_ext_ack *extack = cb->extack;
2419 struct rtnl_link_ops *kind_ops = NULL;
2420 const struct nlmsghdr *nlh = cb->nlh;
2421 struct net *net = sock_net(skb->sk);
2422 unsigned int flags = NLM_F_MULTI;
2423 struct nlattr *tb[IFLA_MAX+1];
2424 struct {
2425 unsigned long ifindex;
2426 } *ctx = (void *)cb->ctx;
2427 struct net *tgt_net = net;
2428 u32 ext_filter_mask = 0;
2429 struct net_device *dev;
2430 int ops_srcu_index;
2431 int master_idx = 0;
2432 int netnsid = -1;
2433 int err, i;
2434
2435 err = rtnl_valid_dump_ifinfo_req(nlh, cb->strict_check, tb, extack);
2436 if (err < 0) {
2437 if (cb->strict_check)
2438 return err;
2439
2440 goto walk_entries;
2441 }
2442
2443 for (i = 0; i <= IFLA_MAX; ++i) {
2444 if (!tb[i])
2445 continue;
2446
2447 /* new attributes should only be added with strict checking */
2448 switch (i) {
2449 case IFLA_TARGET_NETNSID:
2450 netnsid = nla_get_s32(tb[i]);
2451 tgt_net = rtnl_get_net_ns_capable(skb->sk, netnsid);
2452 if (IS_ERR(tgt_net)) {
2453 NL_SET_ERR_MSG(extack, "Invalid target network namespace id");
2454 err = PTR_ERR(tgt_net);
2455 netnsid = -1;
2456 goto out;
2457 }
2458 break;
2459 case IFLA_EXT_MASK:
2460 ext_filter_mask = nla_get_u32(tb[i]);
2461 break;
2462 case IFLA_MASTER:
2463 master_idx = nla_get_u32(tb[i]);
2464 break;
2465 case IFLA_LINKINFO:
2466 kind_ops = linkinfo_to_kind_ops(tb[i], &ops_srcu_index);
2467 break;
2468 default:
2469 if (cb->strict_check) {
2470 NL_SET_ERR_MSG(extack, "Unsupported attribute in link dump request");
2471 err = -EINVAL;
2472 goto out;
2473 }
2474 }
2475 }
2476
2477 if (master_idx || kind_ops)
2478 flags |= NLM_F_DUMP_FILTERED;
2479
2480 walk_entries:
2481 err = 0;
2482 for_each_netdev_dump(tgt_net, dev, ctx->ifindex) {
2483 if (link_dump_filtered(dev, master_idx, kind_ops))
2484 continue;
2485 err = rtnl_fill_ifinfo(skb, dev, net, RTM_NEWLINK,
2486 NETLINK_CB(cb->skb).portid,
2487 nlh->nlmsg_seq, 0, flags,
2488 ext_filter_mask, 0, NULL, 0,
2489 netnsid, GFP_KERNEL);
2490 if (err < 0)
2491 break;
2492 }
2493
2494
2495 cb->seq = tgt_net->dev_base_seq;
2496 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
2497
2498 out:
2499
2500 if (kind_ops)
2501 rtnl_link_ops_put(kind_ops, ops_srcu_index);
2502 if (netnsid >= 0)
2503 put_net(tgt_net);
2504
2505 return err;
2506 }
2507
rtnl_nla_parse_ifinfomsg(struct nlattr ** tb,const struct nlattr * nla_peer,struct netlink_ext_ack * exterr)2508 int rtnl_nla_parse_ifinfomsg(struct nlattr **tb, const struct nlattr *nla_peer,
2509 struct netlink_ext_ack *exterr)
2510 {
2511 const struct ifinfomsg *ifmp;
2512 const struct nlattr *attrs;
2513 size_t len;
2514
2515 ifmp = nla_data(nla_peer);
2516 attrs = nla_data(nla_peer) + sizeof(struct ifinfomsg);
2517 len = nla_len(nla_peer) - sizeof(struct ifinfomsg);
2518
2519 if (ifmp->ifi_index < 0) {
2520 NL_SET_ERR_MSG_ATTR(exterr, nla_peer,
2521 "ifindex can't be negative");
2522 return -EINVAL;
2523 }
2524
2525 return nla_parse_deprecated(tb, IFLA_MAX, attrs, len, ifla_policy,
2526 exterr);
2527 }
2528 EXPORT_SYMBOL(rtnl_nla_parse_ifinfomsg);
2529
rtnl_link_get_net_ifla(struct nlattr * tb[])2530 static struct net *rtnl_link_get_net_ifla(struct nlattr *tb[])
2531 {
2532 struct net *net = NULL;
2533
2534 /* Examine the link attributes and figure out which
2535 * network namespace we are talking about.
2536 */
2537 if (tb[IFLA_NET_NS_PID])
2538 net = get_net_ns_by_pid(nla_get_u32(tb[IFLA_NET_NS_PID]));
2539 else if (tb[IFLA_NET_NS_FD])
2540 net = get_net_ns_by_fd(nla_get_u32(tb[IFLA_NET_NS_FD]));
2541
2542 return net;
2543 }
2544
/*
 * Resolve the namespace requested through IFLA_NET_NS_PID/IFLA_NET_NS_FD;
 * when rtnl_link_get_net_ifla() yields NULL, fall back to get_net() on
 * @src_net.
 */
struct net *rtnl_link_get_net(struct net *src_net, struct nlattr *tb[])
{
	struct net *requested = rtnl_link_get_net_ifla(tb);

	return requested ? requested : get_net(src_net);
}
EXPORT_SYMBOL(rtnl_link_get_net);
2555
2556 /* Figure out which network namespace we are talking about by
2557 * examining the link attributes in the following order:
2558 *
2559 * 1. IFLA_NET_NS_PID
2560 * 2. IFLA_NET_NS_FD
2561 * 3. IFLA_TARGET_NETNSID
2562 */
rtnl_link_get_net_by_nlattr(struct net * src_net,struct nlattr * tb[])2563 static struct net *rtnl_link_get_net_by_nlattr(struct net *src_net,
2564 struct nlattr *tb[])
2565 {
2566 struct net *net;
2567
2568 if (tb[IFLA_NET_NS_PID] || tb[IFLA_NET_NS_FD])
2569 return rtnl_link_get_net(src_net, tb);
2570
2571 if (!tb[IFLA_TARGET_NETNSID])
2572 return get_net(src_net);
2573
2574 net = get_net_ns_by_id(src_net, nla_get_u32(tb[IFLA_TARGET_NETNSID]));
2575 if (!net)
2576 return ERR_PTR(-EINVAL);
2577
2578 return net;
2579 }
2580
rtnl_link_get_net_capable(const struct sk_buff * skb,struct net * src_net,struct nlattr * tb[],int cap)2581 static struct net *rtnl_link_get_net_capable(const struct sk_buff *skb,
2582 struct net *src_net,
2583 struct nlattr *tb[], int cap)
2584 {
2585 struct net *net;
2586
2587 net = rtnl_link_get_net_by_nlattr(src_net, tb);
2588 if (IS_ERR(net))
2589 return net;
2590
2591 if (!netlink_ns_capable(skb, net->user_ns, cap)) {
2592 put_net(net);
2593 return ERR_PTR(-EPERM);
2594 }
2595
2596 return net;
2597 }
2598
2599 /* Verify that rtnetlink requests do not pass additional properties
2600 * potentially referring to different network namespaces.
2601 */
rtnl_ensure_unique_netns(struct nlattr * tb[],struct netlink_ext_ack * extack,bool netns_id_only)2602 static int rtnl_ensure_unique_netns(struct nlattr *tb[],
2603 struct netlink_ext_ack *extack,
2604 bool netns_id_only)
2605 {
2606
2607 if (netns_id_only) {
2608 if (!tb[IFLA_NET_NS_PID] && !tb[IFLA_NET_NS_FD])
2609 return 0;
2610
2611 NL_SET_ERR_MSG(extack, "specified netns attribute not supported");
2612 return -EOPNOTSUPP;
2613 }
2614
2615 if (tb[IFLA_TARGET_NETNSID] && (tb[IFLA_NET_NS_PID] || tb[IFLA_NET_NS_FD]))
2616 goto invalid_attr;
2617
2618 if (tb[IFLA_NET_NS_PID] && (tb[IFLA_TARGET_NETNSID] || tb[IFLA_NET_NS_FD]))
2619 goto invalid_attr;
2620
2621 if (tb[IFLA_NET_NS_FD] && (tb[IFLA_TARGET_NETNSID] || tb[IFLA_NET_NS_PID]))
2622 goto invalid_attr;
2623
2624 return 0;
2625
2626 invalid_attr:
2627 NL_SET_ERR_MSG(extack, "multiple netns identifying attributes specified");
2628 return -EINVAL;
2629 }
2630
rtnl_set_vf_rate(struct net_device * dev,int vf,int min_tx_rate,int max_tx_rate)2631 static int rtnl_set_vf_rate(struct net_device *dev, int vf, int min_tx_rate,
2632 int max_tx_rate)
2633 {
2634 const struct net_device_ops *ops = dev->netdev_ops;
2635
2636 if (!ops->ndo_set_vf_rate)
2637 return -EOPNOTSUPP;
2638 if (max_tx_rate && max_tx_rate < min_tx_rate)
2639 return -EINVAL;
2640
2641 return ops->ndo_set_vf_rate(dev, vf, min_tx_rate, max_tx_rate);
2642 }
2643
validate_linkmsg(struct net_device * dev,struct nlattr * tb[],struct netlink_ext_ack * extack)2644 static int validate_linkmsg(struct net_device *dev, struct nlattr *tb[],
2645 struct netlink_ext_ack *extack)
2646 {
2647 if (tb[IFLA_ADDRESS] &&
2648 nla_len(tb[IFLA_ADDRESS]) < dev->addr_len)
2649 return -EINVAL;
2650
2651 if (tb[IFLA_BROADCAST] &&
2652 nla_len(tb[IFLA_BROADCAST]) < dev->addr_len)
2653 return -EINVAL;
2654
2655 if (tb[IFLA_GSO_MAX_SIZE] &&
2656 nla_get_u32(tb[IFLA_GSO_MAX_SIZE]) > dev->tso_max_size) {
2657 NL_SET_ERR_MSG(extack, "too big gso_max_size");
2658 return -EINVAL;
2659 }
2660
2661 if (tb[IFLA_GSO_MAX_SEGS] &&
2662 (nla_get_u32(tb[IFLA_GSO_MAX_SEGS]) > GSO_MAX_SEGS ||
2663 nla_get_u32(tb[IFLA_GSO_MAX_SEGS]) > dev->tso_max_segs)) {
2664 NL_SET_ERR_MSG(extack, "too big gso_max_segs");
2665 return -EINVAL;
2666 }
2667
2668 if (tb[IFLA_GRO_MAX_SIZE] &&
2669 nla_get_u32(tb[IFLA_GRO_MAX_SIZE]) > GRO_MAX_SIZE) {
2670 NL_SET_ERR_MSG(extack, "too big gro_max_size");
2671 return -EINVAL;
2672 }
2673
2674 if (tb[IFLA_GSO_IPV4_MAX_SIZE] &&
2675 nla_get_u32(tb[IFLA_GSO_IPV4_MAX_SIZE]) > dev->tso_max_size) {
2676 NL_SET_ERR_MSG(extack, "too big gso_ipv4_max_size");
2677 return -EINVAL;
2678 }
2679
2680 if (tb[IFLA_GRO_IPV4_MAX_SIZE] &&
2681 nla_get_u32(tb[IFLA_GRO_IPV4_MAX_SIZE]) > GRO_MAX_SIZE) {
2682 NL_SET_ERR_MSG(extack, "too big gro_ipv4_max_size");
2683 return -EINVAL;
2684 }
2685
2686 if (tb[IFLA_AF_SPEC]) {
2687 struct nlattr *af;
2688 int rem, err;
2689
2690 nla_for_each_nested(af, tb[IFLA_AF_SPEC], rem) {
2691 struct rtnl_af_ops *af_ops;
2692 int af_ops_srcu_index;
2693
2694 af_ops = rtnl_af_lookup(nla_type(af), &af_ops_srcu_index);
2695 if (!af_ops)
2696 return -EAFNOSUPPORT;
2697
2698 if (!af_ops->set_link_af)
2699 err = -EOPNOTSUPP;
2700 else if (af_ops->validate_link_af)
2701 err = af_ops->validate_link_af(dev, af, extack);
2702 else
2703 err = 0;
2704
2705 rtnl_af_put(af_ops, af_ops_srcu_index);
2706
2707 if (err < 0)
2708 return err;
2709 }
2710 }
2711
2712 return 0;
2713 }
2714
handle_infiniband_guid(struct net_device * dev,struct ifla_vf_guid * ivt,int guid_type)2715 static int handle_infiniband_guid(struct net_device *dev, struct ifla_vf_guid *ivt,
2716 int guid_type)
2717 {
2718 const struct net_device_ops *ops = dev->netdev_ops;
2719
2720 return ops->ndo_set_vf_guid(dev, ivt->vf, ivt->guid, guid_type);
2721 }
2722
handle_vf_guid(struct net_device * dev,struct ifla_vf_guid * ivt,int guid_type)2723 static int handle_vf_guid(struct net_device *dev, struct ifla_vf_guid *ivt, int guid_type)
2724 {
2725 if (dev->type != ARPHRD_INFINIBAND)
2726 return -EOPNOTSUPP;
2727
2728 return handle_infiniband_guid(dev, ivt, guid_type);
2729 }
2730
do_setvfinfo(struct net_device * dev,struct nlattr ** tb)2731 static int do_setvfinfo(struct net_device *dev, struct nlattr **tb)
2732 {
2733 const struct net_device_ops *ops = dev->netdev_ops;
2734 int err = -EINVAL;
2735
2736 if (tb[IFLA_VF_MAC]) {
2737 struct ifla_vf_mac *ivm = nla_data(tb[IFLA_VF_MAC]);
2738
2739 if (ivm->vf >= INT_MAX)
2740 return -EINVAL;
2741 err = -EOPNOTSUPP;
2742 if (ops->ndo_set_vf_mac)
2743 err = ops->ndo_set_vf_mac(dev, ivm->vf,
2744 ivm->mac);
2745 if (err < 0)
2746 return err;
2747 }
2748
2749 if (tb[IFLA_VF_VLAN]) {
2750 struct ifla_vf_vlan *ivv = nla_data(tb[IFLA_VF_VLAN]);
2751
2752 if (ivv->vf >= INT_MAX)
2753 return -EINVAL;
2754 err = -EOPNOTSUPP;
2755 if (ops->ndo_set_vf_vlan)
2756 err = ops->ndo_set_vf_vlan(dev, ivv->vf, ivv->vlan,
2757 ivv->qos,
2758 htons(ETH_P_8021Q));
2759 if (err < 0)
2760 return err;
2761 }
2762
2763 if (tb[IFLA_VF_VLAN_LIST]) {
2764 struct ifla_vf_vlan_info *ivvl[MAX_VLAN_LIST_LEN];
2765 struct nlattr *attr;
2766 int rem, len = 0;
2767
2768 err = -EOPNOTSUPP;
2769 if (!ops->ndo_set_vf_vlan)
2770 return err;
2771
2772 nla_for_each_nested(attr, tb[IFLA_VF_VLAN_LIST], rem) {
2773 if (nla_type(attr) != IFLA_VF_VLAN_INFO ||
2774 nla_len(attr) < sizeof(struct ifla_vf_vlan_info)) {
2775 return -EINVAL;
2776 }
2777 if (len >= MAX_VLAN_LIST_LEN)
2778 return -EOPNOTSUPP;
2779 ivvl[len] = nla_data(attr);
2780
2781 len++;
2782 }
2783 if (len == 0)
2784 return -EINVAL;
2785
2786 if (ivvl[0]->vf >= INT_MAX)
2787 return -EINVAL;
2788 err = ops->ndo_set_vf_vlan(dev, ivvl[0]->vf, ivvl[0]->vlan,
2789 ivvl[0]->qos, ivvl[0]->vlan_proto);
2790 if (err < 0)
2791 return err;
2792 }
2793
2794 if (tb[IFLA_VF_TX_RATE]) {
2795 struct ifla_vf_tx_rate *ivt = nla_data(tb[IFLA_VF_TX_RATE]);
2796 struct ifla_vf_info ivf;
2797
2798 if (ivt->vf >= INT_MAX)
2799 return -EINVAL;
2800 err = -EOPNOTSUPP;
2801 if (ops->ndo_get_vf_config)
2802 err = ops->ndo_get_vf_config(dev, ivt->vf, &ivf);
2803 if (err < 0)
2804 return err;
2805
2806 err = rtnl_set_vf_rate(dev, ivt->vf,
2807 ivf.min_tx_rate, ivt->rate);
2808 if (err < 0)
2809 return err;
2810 }
2811
2812 if (tb[IFLA_VF_RATE]) {
2813 struct ifla_vf_rate *ivt = nla_data(tb[IFLA_VF_RATE]);
2814
2815 if (ivt->vf >= INT_MAX)
2816 return -EINVAL;
2817
2818 err = rtnl_set_vf_rate(dev, ivt->vf,
2819 ivt->min_tx_rate, ivt->max_tx_rate);
2820 if (err < 0)
2821 return err;
2822 }
2823
2824 if (tb[IFLA_VF_SPOOFCHK]) {
2825 struct ifla_vf_spoofchk *ivs = nla_data(tb[IFLA_VF_SPOOFCHK]);
2826
2827 if (ivs->vf >= INT_MAX)
2828 return -EINVAL;
2829 err = -EOPNOTSUPP;
2830 if (ops->ndo_set_vf_spoofchk)
2831 err = ops->ndo_set_vf_spoofchk(dev, ivs->vf,
2832 ivs->setting);
2833 if (err < 0)
2834 return err;
2835 }
2836
2837 if (tb[IFLA_VF_LINK_STATE]) {
2838 struct ifla_vf_link_state *ivl = nla_data(tb[IFLA_VF_LINK_STATE]);
2839
2840 if (ivl->vf >= INT_MAX)
2841 return -EINVAL;
2842 err = -EOPNOTSUPP;
2843 if (ops->ndo_set_vf_link_state)
2844 err = ops->ndo_set_vf_link_state(dev, ivl->vf,
2845 ivl->link_state);
2846 if (err < 0)
2847 return err;
2848 }
2849
2850 if (tb[IFLA_VF_RSS_QUERY_EN]) {
2851 struct ifla_vf_rss_query_en *ivrssq_en;
2852
2853 err = -EOPNOTSUPP;
2854 ivrssq_en = nla_data(tb[IFLA_VF_RSS_QUERY_EN]);
2855 if (ivrssq_en->vf >= INT_MAX)
2856 return -EINVAL;
2857 if (ops->ndo_set_vf_rss_query_en)
2858 err = ops->ndo_set_vf_rss_query_en(dev, ivrssq_en->vf,
2859 ivrssq_en->setting);
2860 if (err < 0)
2861 return err;
2862 }
2863
2864 if (tb[IFLA_VF_TRUST]) {
2865 struct ifla_vf_trust *ivt = nla_data(tb[IFLA_VF_TRUST]);
2866
2867 if (ivt->vf >= INT_MAX)
2868 return -EINVAL;
2869 err = -EOPNOTSUPP;
2870 if (ops->ndo_set_vf_trust)
2871 err = ops->ndo_set_vf_trust(dev, ivt->vf, ivt->setting);
2872 if (err < 0)
2873 return err;
2874 }
2875
2876 if (tb[IFLA_VF_IB_NODE_GUID]) {
2877 struct ifla_vf_guid *ivt = nla_data(tb[IFLA_VF_IB_NODE_GUID]);
2878
2879 if (ivt->vf >= INT_MAX)
2880 return -EINVAL;
2881 if (!ops->ndo_set_vf_guid)
2882 return -EOPNOTSUPP;
2883 return handle_vf_guid(dev, ivt, IFLA_VF_IB_NODE_GUID);
2884 }
2885
2886 if (tb[IFLA_VF_IB_PORT_GUID]) {
2887 struct ifla_vf_guid *ivt = nla_data(tb[IFLA_VF_IB_PORT_GUID]);
2888
2889 if (ivt->vf >= INT_MAX)
2890 return -EINVAL;
2891 if (!ops->ndo_set_vf_guid)
2892 return -EOPNOTSUPP;
2893
2894 return handle_vf_guid(dev, ivt, IFLA_VF_IB_PORT_GUID);
2895 }
2896
2897 return err;
2898 }
2899
do_set_master(struct net_device * dev,int ifindex,struct netlink_ext_ack * extack)2900 static int do_set_master(struct net_device *dev, int ifindex,
2901 struct netlink_ext_ack *extack)
2902 {
2903 struct net_device *upper_dev = netdev_master_upper_dev_get(dev);
2904 const struct net_device_ops *ops;
2905 int err;
2906
2907 if (upper_dev) {
2908 if (upper_dev->ifindex == ifindex)
2909 return 0;
2910 ops = upper_dev->netdev_ops;
2911 if (ops->ndo_del_slave) {
2912 err = ops->ndo_del_slave(upper_dev, dev);
2913 if (err)
2914 return err;
2915 } else {
2916 return -EOPNOTSUPP;
2917 }
2918 }
2919
2920 if (ifindex) {
2921 upper_dev = __dev_get_by_index(dev_net(dev), ifindex);
2922 if (!upper_dev)
2923 return -EINVAL;
2924 ops = upper_dev->netdev_ops;
2925 if (ops->ndo_add_slave) {
2926 err = ops->ndo_add_slave(upper_dev, dev, extack);
2927 if (err)
2928 return err;
2929 } else {
2930 return -EOPNOTSUPP;
2931 }
2932 }
2933 return 0;
2934 }
2935
2936 static const struct nla_policy ifla_proto_down_reason_policy[IFLA_PROTO_DOWN_REASON_VALUE + 1] = {
2937 [IFLA_PROTO_DOWN_REASON_MASK] = { .type = NLA_U32 },
2938 [IFLA_PROTO_DOWN_REASON_VALUE] = { .type = NLA_U32 },
2939 };
2940
do_set_proto_down(struct net_device * dev,struct nlattr * nl_proto_down,struct nlattr * nl_proto_down_reason,struct netlink_ext_ack * extack)2941 static int do_set_proto_down(struct net_device *dev,
2942 struct nlattr *nl_proto_down,
2943 struct nlattr *nl_proto_down_reason,
2944 struct netlink_ext_ack *extack)
2945 {
2946 struct nlattr *pdreason[IFLA_PROTO_DOWN_REASON_MAX + 1];
2947 unsigned long mask = 0;
2948 u32 value;
2949 bool proto_down;
2950 int err;
2951
2952 if (!dev->change_proto_down) {
2953 NL_SET_ERR_MSG(extack, "Protodown not supported by device");
2954 return -EOPNOTSUPP;
2955 }
2956
2957 if (nl_proto_down_reason) {
2958 err = nla_parse_nested_deprecated(pdreason,
2959 IFLA_PROTO_DOWN_REASON_MAX,
2960 nl_proto_down_reason,
2961 ifla_proto_down_reason_policy,
2962 NULL);
2963 if (err < 0)
2964 return err;
2965
2966 if (!pdreason[IFLA_PROTO_DOWN_REASON_VALUE]) {
2967 NL_SET_ERR_MSG(extack, "Invalid protodown reason value");
2968 return -EINVAL;
2969 }
2970
2971 value = nla_get_u32(pdreason[IFLA_PROTO_DOWN_REASON_VALUE]);
2972
2973 if (pdreason[IFLA_PROTO_DOWN_REASON_MASK])
2974 mask = nla_get_u32(pdreason[IFLA_PROTO_DOWN_REASON_MASK]);
2975
2976 dev_change_proto_down_reason(dev, mask, value);
2977 }
2978
2979 if (nl_proto_down) {
2980 proto_down = nla_get_u8(nl_proto_down);
2981
2982 /* Don't turn off protodown if there are active reasons */
2983 if (!proto_down && dev->proto_down_reason) {
2984 NL_SET_ERR_MSG(extack, "Cannot clear protodown, active reasons");
2985 return -EBUSY;
2986 }
2987 err = dev_change_proto_down(dev,
2988 proto_down);
2989 if (err)
2990 return err;
2991 }
2992
2993 return 0;
2994 }
2995
2996 #define DO_SETLINK_MODIFIED 0x01
2997 /* notify flag means notify + modified. */
2998 #define DO_SETLINK_NOTIFY 0x03
do_setlink(const struct sk_buff * skb,struct net_device * dev,struct net * tgt_net,struct ifinfomsg * ifm,struct netlink_ext_ack * extack,struct nlattr ** tb,int status)2999 static int do_setlink(const struct sk_buff *skb, struct net_device *dev,
3000 struct net *tgt_net, struct ifinfomsg *ifm,
3001 struct netlink_ext_ack *extack,
3002 struct nlattr **tb, int status)
3003 {
3004 const struct net_device_ops *ops = dev->netdev_ops;
3005 char ifname[IFNAMSIZ];
3006 int err;
3007
3008 err = validate_linkmsg(dev, tb, extack);
3009 if (err < 0)
3010 goto errout;
3011
3012 if (tb[IFLA_IFNAME])
3013 nla_strscpy(ifname, tb[IFLA_IFNAME], IFNAMSIZ);
3014 else
3015 ifname[0] = '\0';
3016
3017 if (!net_eq(tgt_net, dev_net(dev))) {
3018 const char *pat = ifname[0] ? ifname : NULL;
3019 int new_ifindex;
3020
3021 new_ifindex = nla_get_s32_default(tb[IFLA_NEW_IFINDEX], 0);
3022
3023 err = __dev_change_net_namespace(dev, tgt_net, pat, new_ifindex);
3024 if (err)
3025 goto errout;
3026
3027 status |= DO_SETLINK_MODIFIED;
3028 }
3029
3030 if (tb[IFLA_MAP]) {
3031 struct rtnl_link_ifmap *u_map;
3032 struct ifmap k_map;
3033
3034 if (!ops->ndo_set_config) {
3035 err = -EOPNOTSUPP;
3036 goto errout;
3037 }
3038
3039 if (!netif_device_present(dev)) {
3040 err = -ENODEV;
3041 goto errout;
3042 }
3043
3044 u_map = nla_data(tb[IFLA_MAP]);
3045 k_map.mem_start = (unsigned long) u_map->mem_start;
3046 k_map.mem_end = (unsigned long) u_map->mem_end;
3047 k_map.base_addr = (unsigned short) u_map->base_addr;
3048 k_map.irq = (unsigned char) u_map->irq;
3049 k_map.dma = (unsigned char) u_map->dma;
3050 k_map.port = (unsigned char) u_map->port;
3051
3052 err = ops->ndo_set_config(dev, &k_map);
3053 if (err < 0)
3054 goto errout;
3055
3056 status |= DO_SETLINK_NOTIFY;
3057 }
3058
3059 if (tb[IFLA_ADDRESS]) {
3060 struct sockaddr *sa;
3061 int len;
3062
3063 len = sizeof(sa_family_t) + max_t(size_t, dev->addr_len,
3064 sizeof(*sa));
3065 sa = kmalloc(len, GFP_KERNEL);
3066 if (!sa) {
3067 err = -ENOMEM;
3068 goto errout;
3069 }
3070 sa->sa_family = dev->type;
3071 memcpy(sa->sa_data, nla_data(tb[IFLA_ADDRESS]),
3072 dev->addr_len);
3073 err = dev_set_mac_address_user(dev, sa, extack);
3074 kfree(sa);
3075 if (err)
3076 goto errout;
3077 status |= DO_SETLINK_MODIFIED;
3078 }
3079
3080 if (tb[IFLA_MTU]) {
3081 err = dev_set_mtu_ext(dev, nla_get_u32(tb[IFLA_MTU]), extack);
3082 if (err < 0)
3083 goto errout;
3084 status |= DO_SETLINK_MODIFIED;
3085 }
3086
3087 if (tb[IFLA_GROUP]) {
3088 dev_set_group(dev, nla_get_u32(tb[IFLA_GROUP]));
3089 status |= DO_SETLINK_NOTIFY;
3090 }
3091
3092 /*
3093 * Interface selected by interface index but interface
3094 * name provided implies that a name change has been
3095 * requested.
3096 */
3097 if (ifm->ifi_index > 0 && ifname[0]) {
3098 err = dev_change_name(dev, ifname);
3099 if (err < 0)
3100 goto errout;
3101 status |= DO_SETLINK_MODIFIED;
3102 }
3103
3104 if (tb[IFLA_IFALIAS]) {
3105 err = dev_set_alias(dev, nla_data(tb[IFLA_IFALIAS]),
3106 nla_len(tb[IFLA_IFALIAS]));
3107 if (err < 0)
3108 goto errout;
3109 status |= DO_SETLINK_NOTIFY;
3110 }
3111
3112 if (tb[IFLA_BROADCAST]) {
3113 nla_memcpy(dev->broadcast, tb[IFLA_BROADCAST], dev->addr_len);
3114 call_netdevice_notifiers(NETDEV_CHANGEADDR, dev);
3115 }
3116
3117 if (ifm->ifi_flags || ifm->ifi_change) {
3118 err = dev_change_flags(dev, rtnl_dev_combine_flags(dev, ifm),
3119 extack);
3120 if (err < 0)
3121 goto errout;
3122 }
3123
3124 if (tb[IFLA_MASTER]) {
3125 err = do_set_master(dev, nla_get_u32(tb[IFLA_MASTER]), extack);
3126 if (err)
3127 goto errout;
3128 status |= DO_SETLINK_MODIFIED;
3129 }
3130
3131 if (tb[IFLA_CARRIER]) {
3132 err = dev_change_carrier(dev, nla_get_u8(tb[IFLA_CARRIER]));
3133 if (err)
3134 goto errout;
3135 status |= DO_SETLINK_MODIFIED;
3136 }
3137
3138 if (tb[IFLA_TXQLEN]) {
3139 unsigned int value = nla_get_u32(tb[IFLA_TXQLEN]);
3140
3141 err = dev_change_tx_queue_len(dev, value);
3142 if (err)
3143 goto errout;
3144 status |= DO_SETLINK_MODIFIED;
3145 }
3146
3147 if (tb[IFLA_GSO_MAX_SIZE]) {
3148 u32 max_size = nla_get_u32(tb[IFLA_GSO_MAX_SIZE]);
3149
3150 if (dev->gso_max_size ^ max_size) {
3151 netif_set_gso_max_size(dev, max_size);
3152 status |= DO_SETLINK_MODIFIED;
3153 }
3154 }
3155
3156 if (tb[IFLA_GSO_MAX_SEGS]) {
3157 u32 max_segs = nla_get_u32(tb[IFLA_GSO_MAX_SEGS]);
3158
3159 if (dev->gso_max_segs ^ max_segs) {
3160 netif_set_gso_max_segs(dev, max_segs);
3161 status |= DO_SETLINK_MODIFIED;
3162 }
3163 }
3164
3165 if (tb[IFLA_GRO_MAX_SIZE]) {
3166 u32 gro_max_size = nla_get_u32(tb[IFLA_GRO_MAX_SIZE]);
3167
3168 if (dev->gro_max_size ^ gro_max_size) {
3169 netif_set_gro_max_size(dev, gro_max_size);
3170 status |= DO_SETLINK_MODIFIED;
3171 }
3172 }
3173
3174 if (tb[IFLA_GSO_IPV4_MAX_SIZE]) {
3175 u32 max_size = nla_get_u32(tb[IFLA_GSO_IPV4_MAX_SIZE]);
3176
3177 if (dev->gso_ipv4_max_size ^ max_size) {
3178 netif_set_gso_ipv4_max_size(dev, max_size);
3179 status |= DO_SETLINK_MODIFIED;
3180 }
3181 }
3182
3183 if (tb[IFLA_GRO_IPV4_MAX_SIZE]) {
3184 u32 gro_max_size = nla_get_u32(tb[IFLA_GRO_IPV4_MAX_SIZE]);
3185
3186 if (dev->gro_ipv4_max_size ^ gro_max_size) {
3187 netif_set_gro_ipv4_max_size(dev, gro_max_size);
3188 status |= DO_SETLINK_MODIFIED;
3189 }
3190 }
3191
3192 if (tb[IFLA_OPERSTATE])
3193 set_operstate(dev, nla_get_u8(tb[IFLA_OPERSTATE]));
3194
3195 if (tb[IFLA_LINKMODE]) {
3196 unsigned char value = nla_get_u8(tb[IFLA_LINKMODE]);
3197
3198 if (dev->link_mode ^ value)
3199 status |= DO_SETLINK_NOTIFY;
3200 WRITE_ONCE(dev->link_mode, value);
3201 }
3202
3203 if (tb[IFLA_VFINFO_LIST]) {
3204 struct nlattr *vfinfo[IFLA_VF_MAX + 1];
3205 struct nlattr *attr;
3206 int rem;
3207
3208 nla_for_each_nested(attr, tb[IFLA_VFINFO_LIST], rem) {
3209 if (nla_type(attr) != IFLA_VF_INFO ||
3210 nla_len(attr) < NLA_HDRLEN) {
3211 err = -EINVAL;
3212 goto errout;
3213 }
3214 err = nla_parse_nested_deprecated(vfinfo, IFLA_VF_MAX,
3215 attr,
3216 ifla_vf_policy,
3217 NULL);
3218 if (err < 0)
3219 goto errout;
3220 err = do_setvfinfo(dev, vfinfo);
3221 if (err < 0)
3222 goto errout;
3223 status |= DO_SETLINK_NOTIFY;
3224 }
3225 }
3226 err = 0;
3227
3228 if (tb[IFLA_VF_PORTS]) {
3229 struct nlattr *port[IFLA_PORT_MAX+1];
3230 struct nlattr *attr;
3231 int vf;
3232 int rem;
3233
3234 err = -EOPNOTSUPP;
3235 if (!ops->ndo_set_vf_port)
3236 goto errout;
3237
3238 nla_for_each_nested(attr, tb[IFLA_VF_PORTS], rem) {
3239 if (nla_type(attr) != IFLA_VF_PORT ||
3240 nla_len(attr) < NLA_HDRLEN) {
3241 err = -EINVAL;
3242 goto errout;
3243 }
3244 err = nla_parse_nested_deprecated(port, IFLA_PORT_MAX,
3245 attr,
3246 ifla_port_policy,
3247 NULL);
3248 if (err < 0)
3249 goto errout;
3250 if (!port[IFLA_PORT_VF]) {
3251 err = -EOPNOTSUPP;
3252 goto errout;
3253 }
3254 vf = nla_get_u32(port[IFLA_PORT_VF]);
3255 err = ops->ndo_set_vf_port(dev, vf, port);
3256 if (err < 0)
3257 goto errout;
3258 status |= DO_SETLINK_NOTIFY;
3259 }
3260 }
3261 err = 0;
3262
3263 if (tb[IFLA_PORT_SELF]) {
3264 struct nlattr *port[IFLA_PORT_MAX+1];
3265
3266 err = nla_parse_nested_deprecated(port, IFLA_PORT_MAX,
3267 tb[IFLA_PORT_SELF],
3268 ifla_port_policy, NULL);
3269 if (err < 0)
3270 goto errout;
3271
3272 err = -EOPNOTSUPP;
3273 if (ops->ndo_set_vf_port)
3274 err = ops->ndo_set_vf_port(dev, PORT_SELF_VF, port);
3275 if (err < 0)
3276 goto errout;
3277 status |= DO_SETLINK_NOTIFY;
3278 }
3279
3280 if (tb[IFLA_AF_SPEC]) {
3281 struct nlattr *af;
3282 int rem;
3283
3284 nla_for_each_nested(af, tb[IFLA_AF_SPEC], rem) {
3285 struct rtnl_af_ops *af_ops;
3286 int af_ops_srcu_index;
3287
3288 af_ops = rtnl_af_lookup(nla_type(af), &af_ops_srcu_index);
3289 if (!af_ops) {
3290 err = -EAFNOSUPPORT;
3291 goto errout;
3292 }
3293
3294 err = af_ops->set_link_af(dev, af, extack);
3295 rtnl_af_put(af_ops, af_ops_srcu_index);
3296
3297 if (err < 0)
3298 goto errout;
3299
3300 status |= DO_SETLINK_NOTIFY;
3301 }
3302 }
3303 err = 0;
3304
3305 if (tb[IFLA_PROTO_DOWN] || tb[IFLA_PROTO_DOWN_REASON]) {
3306 err = do_set_proto_down(dev, tb[IFLA_PROTO_DOWN],
3307 tb[IFLA_PROTO_DOWN_REASON], extack);
3308 if (err)
3309 goto errout;
3310 status |= DO_SETLINK_NOTIFY;
3311 }
3312
3313 if (tb[IFLA_XDP]) {
3314 struct nlattr *xdp[IFLA_XDP_MAX + 1];
3315 u32 xdp_flags = 0;
3316
3317 err = nla_parse_nested_deprecated(xdp, IFLA_XDP_MAX,
3318 tb[IFLA_XDP],
3319 ifla_xdp_policy, NULL);
3320 if (err < 0)
3321 goto errout;
3322
3323 if (xdp[IFLA_XDP_ATTACHED] || xdp[IFLA_XDP_PROG_ID]) {
3324 err = -EINVAL;
3325 goto errout;
3326 }
3327
3328 if (xdp[IFLA_XDP_FLAGS]) {
3329 xdp_flags = nla_get_u32(xdp[IFLA_XDP_FLAGS]);
3330 if (xdp_flags & ~XDP_FLAGS_MASK) {
3331 err = -EINVAL;
3332 goto errout;
3333 }
3334 if (hweight32(xdp_flags & XDP_FLAGS_MODES) > 1) {
3335 err = -EINVAL;
3336 goto errout;
3337 }
3338 }
3339
3340 if (xdp[IFLA_XDP_FD]) {
3341 int expected_fd = -1;
3342
3343 if (xdp_flags & XDP_FLAGS_REPLACE) {
3344 if (!xdp[IFLA_XDP_EXPECTED_FD]) {
3345 err = -EINVAL;
3346 goto errout;
3347 }
3348 expected_fd =
3349 nla_get_s32(xdp[IFLA_XDP_EXPECTED_FD]);
3350 }
3351
3352 err = dev_change_xdp_fd(dev, extack,
3353 nla_get_s32(xdp[IFLA_XDP_FD]),
3354 expected_fd,
3355 xdp_flags);
3356 if (err)
3357 goto errout;
3358 status |= DO_SETLINK_NOTIFY;
3359 }
3360 }
3361
3362 errout:
3363 if (status & DO_SETLINK_MODIFIED) {
3364 if ((status & DO_SETLINK_NOTIFY) == DO_SETLINK_NOTIFY)
3365 netdev_state_change(dev);
3366
3367 if (err < 0)
3368 net_warn_ratelimited("A link change request failed with some changes committed already. Interface %s may have been left with an inconsistent configuration, please check.\n",
3369 dev->name);
3370 }
3371
3372 return err;
3373 }
3374
rtnl_dev_get(struct net * net,struct nlattr * tb[])3375 static struct net_device *rtnl_dev_get(struct net *net,
3376 struct nlattr *tb[])
3377 {
3378 char ifname[ALTIFNAMSIZ];
3379
3380 if (tb[IFLA_IFNAME])
3381 nla_strscpy(ifname, tb[IFLA_IFNAME], IFNAMSIZ);
3382 else if (tb[IFLA_ALT_IFNAME])
3383 nla_strscpy(ifname, tb[IFLA_ALT_IFNAME], ALTIFNAMSIZ);
3384 else
3385 return NULL;
3386
3387 return __dev_get_by_name(net, ifname);
3388 }
3389
rtnl_setlink(struct sk_buff * skb,struct nlmsghdr * nlh,struct netlink_ext_ack * extack)3390 static int rtnl_setlink(struct sk_buff *skb, struct nlmsghdr *nlh,
3391 struct netlink_ext_ack *extack)
3392 {
3393 struct ifinfomsg *ifm = nlmsg_data(nlh);
3394 struct net *net = sock_net(skb->sk);
3395 struct nlattr *tb[IFLA_MAX+1];
3396 struct net_device *dev = NULL;
3397 struct rtnl_nets rtnl_nets;
3398 struct net *tgt_net;
3399 int err;
3400
3401 err = nlmsg_parse_deprecated(nlh, sizeof(*ifm), tb, IFLA_MAX,
3402 ifla_policy, extack);
3403 if (err < 0)
3404 goto errout;
3405
3406 err = rtnl_ensure_unique_netns(tb, extack, false);
3407 if (err < 0)
3408 goto errout;
3409
3410 tgt_net = rtnl_link_get_net_capable(skb, net, tb, CAP_NET_ADMIN);
3411 if (IS_ERR(tgt_net)) {
3412 err = PTR_ERR(tgt_net);
3413 goto errout;
3414 }
3415
3416 rtnl_nets_init(&rtnl_nets);
3417 rtnl_nets_add(&rtnl_nets, get_net(net));
3418 rtnl_nets_add(&rtnl_nets, tgt_net);
3419
3420 rtnl_nets_lock(&rtnl_nets);
3421
3422 if (ifm->ifi_index > 0)
3423 dev = __dev_get_by_index(net, ifm->ifi_index);
3424 else if (tb[IFLA_IFNAME] || tb[IFLA_ALT_IFNAME])
3425 dev = rtnl_dev_get(net, tb);
3426 else
3427 err = -EINVAL;
3428
3429 if (dev)
3430 err = do_setlink(skb, dev, tgt_net, ifm, extack, tb, 0);
3431 else if (!err)
3432 err = -ENODEV;
3433
3434 rtnl_nets_unlock(&rtnl_nets);
3435 rtnl_nets_destroy(&rtnl_nets);
3436 errout:
3437 return err;
3438 }
3439
rtnl_group_dellink(const struct net * net,int group)3440 static int rtnl_group_dellink(const struct net *net, int group)
3441 {
3442 struct net_device *dev, *aux;
3443 LIST_HEAD(list_kill);
3444 bool found = false;
3445
3446 if (!group)
3447 return -EPERM;
3448
3449 for_each_netdev(net, dev) {
3450 if (dev->group == group) {
3451 const struct rtnl_link_ops *ops;
3452
3453 found = true;
3454 ops = dev->rtnl_link_ops;
3455 if (!ops || !ops->dellink)
3456 return -EOPNOTSUPP;
3457 }
3458 }
3459
3460 if (!found)
3461 return -ENODEV;
3462
3463 for_each_netdev_safe(net, dev, aux) {
3464 if (dev->group == group) {
3465 const struct rtnl_link_ops *ops;
3466
3467 ops = dev->rtnl_link_ops;
3468 ops->dellink(dev, &list_kill);
3469 }
3470 }
3471 unregister_netdevice_many(&list_kill);
3472
3473 return 0;
3474 }
3475
/*
 * Delete a single device through its rtnl_link_ops.
 *
 * @dev:    device to remove
 * @portid: passed through to unregister_netdevice_many_notify()
 * @nlh:    passed through to unregister_netdevice_many_notify()
 *
 * Returns -EOPNOTSUPP when the device has no rtnl_link_ops or the ops have
 * no dellink callback, 0 otherwise.
 */
int rtnl_delete_link(struct net_device *dev, u32 portid, const struct nlmsghdr *nlh)
{
	const struct rtnl_link_ops *link_ops = dev->rtnl_link_ops;
	LIST_HEAD(list_kill);

	if (!link_ops)
		return -EOPNOTSUPP;
	if (!link_ops->dellink)
		return -EOPNOTSUPP;

	link_ops->dellink(dev, &list_kill);
	unregister_netdevice_many_notify(&list_kill, portid, nlh);

	return 0;
}
EXPORT_SYMBOL_GPL(rtnl_delete_link);
3491
rtnl_dellink(struct sk_buff * skb,struct nlmsghdr * nlh,struct netlink_ext_ack * extack)3492 static int rtnl_dellink(struct sk_buff *skb, struct nlmsghdr *nlh,
3493 struct netlink_ext_ack *extack)
3494 {
3495 struct ifinfomsg *ifm = nlmsg_data(nlh);
3496 struct net *net = sock_net(skb->sk);
3497 u32 portid = NETLINK_CB(skb).portid;
3498 struct nlattr *tb[IFLA_MAX+1];
3499 struct net_device *dev = NULL;
3500 struct net *tgt_net = net;
3501 int netnsid = -1;
3502 int err;
3503
3504 err = nlmsg_parse_deprecated(nlh, sizeof(*ifm), tb, IFLA_MAX,
3505 ifla_policy, extack);
3506 if (err < 0)
3507 return err;
3508
3509 err = rtnl_ensure_unique_netns(tb, extack, true);
3510 if (err < 0)
3511 return err;
3512
3513 if (tb[IFLA_TARGET_NETNSID]) {
3514 netnsid = nla_get_s32(tb[IFLA_TARGET_NETNSID]);
3515 tgt_net = rtnl_get_net_ns_capable(NETLINK_CB(skb).sk, netnsid);
3516 if (IS_ERR(tgt_net))
3517 return PTR_ERR(tgt_net);
3518 }
3519
3520 rtnl_net_lock(tgt_net);
3521
3522 if (ifm->ifi_index > 0)
3523 dev = __dev_get_by_index(tgt_net, ifm->ifi_index);
3524 else if (tb[IFLA_IFNAME] || tb[IFLA_ALT_IFNAME])
3525 dev = rtnl_dev_get(tgt_net, tb);
3526
3527 if (dev)
3528 err = rtnl_delete_link(dev, portid, nlh);
3529 else if (ifm->ifi_index > 0 || tb[IFLA_IFNAME] || tb[IFLA_ALT_IFNAME])
3530 err = -ENODEV;
3531 else if (tb[IFLA_GROUP])
3532 err = rtnl_group_dellink(tgt_net, nla_get_u32(tb[IFLA_GROUP]));
3533 else
3534 err = -EINVAL;
3535
3536 rtnl_net_unlock(tgt_net);
3537
3538 if (netnsid >= 0)
3539 put_net(tgt_net);
3540
3541 return err;
3542 }
3543
/*
 * Apply the flags requested in @ifm (if any) to @dev and send the flag
 * notification.
 *
 * @ifm may be NULL, in which case no flag change is attempted.  If the
 * device is not yet in RTNL_LINK_INITIALIZED state it is moved to that
 * state and the notification reports all flags (~0U) as changed;
 * otherwise only the bits that differ from the flags on entry are
 * reported.
 *
 * Returns a negative errno from __dev_change_flags(), or 0.
 */
int rtnl_configure_link(struct net_device *dev, const struct ifinfomsg *ifm,
			u32 portid, const struct nlmsghdr *nlh)
{
	unsigned int old_flags = dev->flags;
	unsigned int changed;

	if (ifm && (ifm->ifi_flags || ifm->ifi_change)) {
		int err;

		err = __dev_change_flags(dev, rtnl_dev_combine_flags(dev, ifm),
					 NULL);
		if (err < 0)
			return err;
	}

	if (dev->rtnl_link_state == RTNL_LINK_INITIALIZED) {
		changed = old_flags ^ dev->flags;
	} else {
		/* First configuration: mark initialized, report everything. */
		dev->rtnl_link_state = RTNL_LINK_INITIALIZED;
		changed = ~0U;
	}
	__dev_notify_flags(dev, old_flags, changed, portid, nlh);

	return 0;
}
EXPORT_SYMBOL(rtnl_configure_link);
3567
rtnl_create_link(struct net * net,const char * ifname,unsigned char name_assign_type,const struct rtnl_link_ops * ops,struct nlattr * tb[],struct netlink_ext_ack * extack)3568 struct net_device *rtnl_create_link(struct net *net, const char *ifname,
3569 unsigned char name_assign_type,
3570 const struct rtnl_link_ops *ops,
3571 struct nlattr *tb[],
3572 struct netlink_ext_ack *extack)
3573 {
3574 struct net_device *dev;
3575 unsigned int num_tx_queues = 1;
3576 unsigned int num_rx_queues = 1;
3577 int err;
3578
3579 if (tb[IFLA_NUM_TX_QUEUES])
3580 num_tx_queues = nla_get_u32(tb[IFLA_NUM_TX_QUEUES]);
3581 else if (ops->get_num_tx_queues)
3582 num_tx_queues = ops->get_num_tx_queues();
3583
3584 if (tb[IFLA_NUM_RX_QUEUES])
3585 num_rx_queues = nla_get_u32(tb[IFLA_NUM_RX_QUEUES]);
3586 else if (ops->get_num_rx_queues)
3587 num_rx_queues = ops->get_num_rx_queues();
3588
3589 if (num_tx_queues < 1 || num_tx_queues > 4096) {
3590 NL_SET_ERR_MSG(extack, "Invalid number of transmit queues");
3591 return ERR_PTR(-EINVAL);
3592 }
3593
3594 if (num_rx_queues < 1 || num_rx_queues > 4096) {
3595 NL_SET_ERR_MSG(extack, "Invalid number of receive queues");
3596 return ERR_PTR(-EINVAL);
3597 }
3598
3599 if (ops->alloc) {
3600 dev = ops->alloc(tb, ifname, name_assign_type,
3601 num_tx_queues, num_rx_queues);
3602 if (IS_ERR(dev))
3603 return dev;
3604 } else {
3605 dev = alloc_netdev_mqs(ops->priv_size, ifname,
3606 name_assign_type, ops->setup,
3607 num_tx_queues, num_rx_queues);
3608 }
3609
3610 if (!dev)
3611 return ERR_PTR(-ENOMEM);
3612
3613 err = validate_linkmsg(dev, tb, extack);
3614 if (err < 0) {
3615 free_netdev(dev);
3616 return ERR_PTR(err);
3617 }
3618
3619 dev_net_set(dev, net);
3620 dev->rtnl_link_ops = ops;
3621 dev->rtnl_link_state = RTNL_LINK_INITIALIZING;
3622
3623 if (tb[IFLA_MTU]) {
3624 u32 mtu = nla_get_u32(tb[IFLA_MTU]);
3625
3626 err = dev_validate_mtu(dev, mtu, extack);
3627 if (err) {
3628 free_netdev(dev);
3629 return ERR_PTR(err);
3630 }
3631 dev->mtu = mtu;
3632 }
3633 if (tb[IFLA_ADDRESS]) {
3634 __dev_addr_set(dev, nla_data(tb[IFLA_ADDRESS]),
3635 nla_len(tb[IFLA_ADDRESS]));
3636 dev->addr_assign_type = NET_ADDR_SET;
3637 }
3638 if (tb[IFLA_BROADCAST])
3639 memcpy(dev->broadcast, nla_data(tb[IFLA_BROADCAST]),
3640 nla_len(tb[IFLA_BROADCAST]));
3641 if (tb[IFLA_TXQLEN])
3642 dev->tx_queue_len = nla_get_u32(tb[IFLA_TXQLEN]);
3643 if (tb[IFLA_OPERSTATE])
3644 set_operstate(dev, nla_get_u8(tb[IFLA_OPERSTATE]));
3645 if (tb[IFLA_LINKMODE])
3646 dev->link_mode = nla_get_u8(tb[IFLA_LINKMODE]);
3647 if (tb[IFLA_GROUP])
3648 dev_set_group(dev, nla_get_u32(tb[IFLA_GROUP]));
3649 if (tb[IFLA_GSO_MAX_SIZE])
3650 netif_set_gso_max_size(dev, nla_get_u32(tb[IFLA_GSO_MAX_SIZE]));
3651 if (tb[IFLA_GSO_MAX_SEGS])
3652 netif_set_gso_max_segs(dev, nla_get_u32(tb[IFLA_GSO_MAX_SEGS]));
3653 if (tb[IFLA_GRO_MAX_SIZE])
3654 netif_set_gro_max_size(dev, nla_get_u32(tb[IFLA_GRO_MAX_SIZE]));
3655 if (tb[IFLA_GSO_IPV4_MAX_SIZE])
3656 netif_set_gso_ipv4_max_size(dev, nla_get_u32(tb[IFLA_GSO_IPV4_MAX_SIZE]));
3657 if (tb[IFLA_GRO_IPV4_MAX_SIZE])
3658 netif_set_gro_ipv4_max_size(dev, nla_get_u32(tb[IFLA_GRO_IPV4_MAX_SIZE]));
3659
3660 return dev;
3661 }
3662 EXPORT_SYMBOL(rtnl_create_link);
3663
/*
 * Attribute tables used while handling a new-link request, bundled in one
 * structure.  rtnl_newlink() allocates it with kmalloc() and frees it
 * before returning.
 */
struct rtnl_newlink_tbs {
	/* Top-level attributes, parsed against ifla_policy. */
	struct nlattr *tb[IFLA_MAX + 1];
	/* Contents of IFLA_LINKINFO, parsed against ifla_info_policy. */
	struct nlattr *linkinfo[IFLA_INFO_MAX + 1];
	/*
	 * Contents of IFLA_INFO_DATA, parsed with the link ops' own policy.
	 * Ops whose maxtype exceeds RTNL_MAX_TYPE are rejected by
	 * rtnl_newlink() so the parse cannot overrun this array.
	 */
	struct nlattr *attr[RTNL_MAX_TYPE + 1];
	/*
	 * Contents of IFLA_INFO_SLAVE_DATA, parsed with the master's slave
	 * policy.  rtnl_changelink() rejects a slave_maxtype above
	 * RTNL_SLAVE_MAX_TYPE for the same reason.
	 */
	struct nlattr *slave_attr[RTNL_SLAVE_MAX_TYPE + 1];
};
3670
rtnl_changelink(const struct sk_buff * skb,struct nlmsghdr * nlh,const struct rtnl_link_ops * ops,struct net_device * dev,struct net * tgt_net,struct rtnl_newlink_tbs * tbs,struct nlattr ** data,struct netlink_ext_ack * extack)3671 static int rtnl_changelink(const struct sk_buff *skb, struct nlmsghdr *nlh,
3672 const struct rtnl_link_ops *ops,
3673 struct net_device *dev, struct net *tgt_net,
3674 struct rtnl_newlink_tbs *tbs,
3675 struct nlattr **data,
3676 struct netlink_ext_ack *extack)
3677 {
3678 struct nlattr ** const linkinfo = tbs->linkinfo;
3679 struct nlattr ** const tb = tbs->tb;
3680 int status = 0;
3681 int err;
3682
3683 if (nlh->nlmsg_flags & NLM_F_EXCL)
3684 return -EEXIST;
3685
3686 if (nlh->nlmsg_flags & NLM_F_REPLACE)
3687 return -EOPNOTSUPP;
3688
3689 if (linkinfo[IFLA_INFO_DATA]) {
3690 if (!ops || ops != dev->rtnl_link_ops || !ops->changelink)
3691 return -EOPNOTSUPP;
3692
3693 err = ops->changelink(dev, tb, data, extack);
3694 if (err < 0)
3695 return err;
3696
3697 status |= DO_SETLINK_NOTIFY;
3698 }
3699
3700 if (linkinfo[IFLA_INFO_SLAVE_DATA]) {
3701 const struct rtnl_link_ops *m_ops = NULL;
3702 struct nlattr **slave_data = NULL;
3703 struct net_device *master_dev;
3704
3705 master_dev = netdev_master_upper_dev_get(dev);
3706 if (master_dev)
3707 m_ops = master_dev->rtnl_link_ops;
3708
3709 if (!m_ops || !m_ops->slave_changelink)
3710 return -EOPNOTSUPP;
3711
3712 if (m_ops->slave_maxtype > RTNL_SLAVE_MAX_TYPE)
3713 return -EINVAL;
3714
3715 if (m_ops->slave_maxtype) {
3716 err = nla_parse_nested_deprecated(tbs->slave_attr,
3717 m_ops->slave_maxtype,
3718 linkinfo[IFLA_INFO_SLAVE_DATA],
3719 m_ops->slave_policy, extack);
3720 if (err < 0)
3721 return err;
3722
3723 slave_data = tbs->slave_attr;
3724 }
3725
3726 err = m_ops->slave_changelink(master_dev, dev, tb, slave_data, extack);
3727 if (err < 0)
3728 return err;
3729
3730 status |= DO_SETLINK_NOTIFY;
3731 }
3732
3733 return do_setlink(skb, dev, tgt_net, nlmsg_data(nlh), extack, tb, status);
3734 }
3735
rtnl_group_changelink(const struct sk_buff * skb,struct net * net,struct net * tgt_net,int group,struct ifinfomsg * ifm,struct netlink_ext_ack * extack,struct nlattr ** tb)3736 static int rtnl_group_changelink(const struct sk_buff *skb,
3737 struct net *net, struct net *tgt_net,
3738 int group, struct ifinfomsg *ifm,
3739 struct netlink_ext_ack *extack,
3740 struct nlattr **tb)
3741 {
3742 struct net_device *dev, *aux;
3743 int err;
3744
3745 for_each_netdev_safe(net, dev, aux) {
3746 if (dev->group == group) {
3747 err = do_setlink(skb, dev, tgt_net, ifm, extack, tb, 0);
3748 if (err < 0)
3749 return err;
3750 }
3751 }
3752
3753 return 0;
3754 }
3755
rtnl_newlink_create(struct sk_buff * skb,struct ifinfomsg * ifm,const struct rtnl_link_ops * ops,struct net * tgt_net,struct net * link_net,struct net * peer_net,const struct nlmsghdr * nlh,struct nlattr ** tb,struct nlattr ** data,struct netlink_ext_ack * extack)3756 static int rtnl_newlink_create(struct sk_buff *skb, struct ifinfomsg *ifm,
3757 const struct rtnl_link_ops *ops,
3758 struct net *tgt_net, struct net *link_net,
3759 struct net *peer_net,
3760 const struct nlmsghdr *nlh,
3761 struct nlattr **tb, struct nlattr **data,
3762 struct netlink_ext_ack *extack)
3763 {
3764 unsigned char name_assign_type = NET_NAME_USER;
3765 struct net *net = sock_net(skb->sk);
3766 u32 portid = NETLINK_CB(skb).portid;
3767 struct net_device *dev;
3768 char ifname[IFNAMSIZ];
3769 int err;
3770
3771 if (!ops->alloc && !ops->setup)
3772 return -EOPNOTSUPP;
3773
3774 if (tb[IFLA_IFNAME]) {
3775 nla_strscpy(ifname, tb[IFLA_IFNAME], IFNAMSIZ);
3776 } else {
3777 snprintf(ifname, IFNAMSIZ, "%s%%d", ops->kind);
3778 name_assign_type = NET_NAME_ENUM;
3779 }
3780
3781 dev = rtnl_create_link(link_net ? : tgt_net, ifname,
3782 name_assign_type, ops, tb, extack);
3783 if (IS_ERR(dev)) {
3784 err = PTR_ERR(dev);
3785 goto out;
3786 }
3787
3788 dev->ifindex = ifm->ifi_index;
3789
3790 if (link_net)
3791 net = link_net;
3792 if (peer_net)
3793 net = peer_net;
3794
3795 if (ops->newlink)
3796 err = ops->newlink(net, dev, tb, data, extack);
3797 else
3798 err = register_netdevice(dev);
3799 if (err < 0) {
3800 free_netdev(dev);
3801 goto out;
3802 }
3803
3804 err = rtnl_configure_link(dev, ifm, portid, nlh);
3805 if (err < 0)
3806 goto out_unregister;
3807 if (link_net) {
3808 err = dev_change_net_namespace(dev, tgt_net, ifname);
3809 if (err < 0)
3810 goto out_unregister;
3811 }
3812 if (tb[IFLA_MASTER]) {
3813 err = do_set_master(dev, nla_get_u32(tb[IFLA_MASTER]), extack);
3814 if (err)
3815 goto out_unregister;
3816 }
3817 out:
3818 return err;
3819 out_unregister:
3820 if (ops->newlink) {
3821 LIST_HEAD(list_kill);
3822
3823 ops->dellink(dev, &list_kill);
3824 unregister_netdevice_many(&list_kill);
3825 } else {
3826 unregister_netdevice(dev);
3827 }
3828 goto out;
3829 }
3830
rtnl_get_peer_net(const struct rtnl_link_ops * ops,struct nlattr * tbp[],struct nlattr * data[],struct netlink_ext_ack * extack)3831 static struct net *rtnl_get_peer_net(const struct rtnl_link_ops *ops,
3832 struct nlattr *tbp[],
3833 struct nlattr *data[],
3834 struct netlink_ext_ack *extack)
3835 {
3836 struct nlattr *tb[IFLA_MAX + 1];
3837 int err;
3838
3839 if (!data || !data[ops->peer_type])
3840 return rtnl_link_get_net_ifla(tbp);
3841
3842 err = rtnl_nla_parse_ifinfomsg(tb, data[ops->peer_type], extack);
3843 if (err < 0)
3844 return ERR_PTR(err);
3845
3846 if (ops->validate) {
3847 err = ops->validate(tb, NULL, extack);
3848 if (err < 0)
3849 return ERR_PTR(err);
3850 }
3851
3852 return rtnl_link_get_net_ifla(tb);
3853 }
3854
__rtnl_newlink(struct sk_buff * skb,struct nlmsghdr * nlh,const struct rtnl_link_ops * ops,struct net * tgt_net,struct net * link_net,struct net * peer_net,struct rtnl_newlink_tbs * tbs,struct nlattr ** data,struct netlink_ext_ack * extack)3855 static int __rtnl_newlink(struct sk_buff *skb, struct nlmsghdr *nlh,
3856 const struct rtnl_link_ops *ops,
3857 struct net *tgt_net, struct net *link_net,
3858 struct net *peer_net,
3859 struct rtnl_newlink_tbs *tbs,
3860 struct nlattr **data,
3861 struct netlink_ext_ack *extack)
3862 {
3863 struct nlattr ** const tb = tbs->tb;
3864 struct net *net = sock_net(skb->sk);
3865 struct net_device *dev;
3866 struct ifinfomsg *ifm;
3867 bool link_specified;
3868
3869 ifm = nlmsg_data(nlh);
3870 if (ifm->ifi_index > 0) {
3871 link_specified = true;
3872 dev = __dev_get_by_index(net, ifm->ifi_index);
3873 } else if (ifm->ifi_index < 0) {
3874 NL_SET_ERR_MSG(extack, "ifindex can't be negative");
3875 return -EINVAL;
3876 } else if (tb[IFLA_IFNAME] || tb[IFLA_ALT_IFNAME]) {
3877 link_specified = true;
3878 dev = rtnl_dev_get(net, tb);
3879 } else {
3880 link_specified = false;
3881 dev = NULL;
3882 }
3883
3884 if (dev)
3885 return rtnl_changelink(skb, nlh, ops, dev, tgt_net, tbs, data, extack);
3886
3887 if (!(nlh->nlmsg_flags & NLM_F_CREATE)) {
3888 /* No dev found and NLM_F_CREATE not set. Requested dev does not exist,
3889 * or it's for a group
3890 */
3891 if (link_specified || !tb[IFLA_GROUP])
3892 return -ENODEV;
3893
3894 return rtnl_group_changelink(skb, net, tgt_net,
3895 nla_get_u32(tb[IFLA_GROUP]),
3896 ifm, extack, tb);
3897 }
3898
3899 if (tb[IFLA_MAP] || tb[IFLA_PROTINFO])
3900 return -EOPNOTSUPP;
3901
3902 if (!ops) {
3903 NL_SET_ERR_MSG(extack, "Unknown device type");
3904 return -EOPNOTSUPP;
3905 }
3906
3907 return rtnl_newlink_create(skb, ifm, ops, tgt_net, link_net, peer_net, nlh,
3908 tb, data, extack);
3909 }
3910
/*
 * Entry point for a new-link request: parse the message, resolve the link
 * ops and every network namespace involved, then run __rtnl_newlink() with
 * those namespaces locked.
 *
 * Resources are acquired in the order tbs -> ops -> namespaces and are
 * released in reverse through the free / put_ops / put_net labels.
 *
 * Returns 0 or a negative errno.
 */
static int rtnl_newlink(struct sk_buff *skb, struct nlmsghdr *nlh,
			struct netlink_ext_ack *extack)
{
	struct net *tgt_net, *link_net = NULL, *peer_net = NULL;
	struct nlattr **tb, **linkinfo, **data = NULL;
	struct rtnl_link_ops *ops = NULL;
	struct rtnl_newlink_tbs *tbs;
	struct rtnl_nets rtnl_nets;
	int ops_srcu_index;
	int ret;

	/* The attribute tables are heap-allocated rather than on the stack. */
	tbs = kmalloc(sizeof(*tbs), GFP_KERNEL);
	if (!tbs)
		return -ENOMEM;

	tb = tbs->tb;
	ret = nlmsg_parse_deprecated(nlh, sizeof(struct ifinfomsg), tb,
				     IFLA_MAX, ifla_policy, extack);
	if (ret < 0)
		goto free;

	ret = rtnl_ensure_unique_netns(tb, extack, false);
	if (ret < 0)
		goto free;

	linkinfo = tbs->linkinfo;
	if (tb[IFLA_LINKINFO]) {
		ret = nla_parse_nested_deprecated(linkinfo, IFLA_INFO_MAX,
						  tb[IFLA_LINKINFO],
						  ifla_info_policy, NULL);
		if (ret < 0)
			goto free;
	} else {
		/*
		 * tbs came from kmalloc() and is not zeroed; clear the table
		 * so the linkinfo[] checks below see NULL entries.
		 */
		memset(linkinfo, 0, sizeof(tbs->linkinfo));
	}

	if (linkinfo[IFLA_INFO_KIND]) {
		char kind[MODULE_NAME_LEN];

		nla_strscpy(kind, linkinfo[IFLA_INFO_KIND], sizeof(kind));
		ops = rtnl_link_ops_get(kind, &ops_srcu_index);
#ifdef CONFIG_MODULES
		/* Unknown kind: try loading "rtnl-link-<kind>" and look again. */
		if (!ops) {
			request_module("rtnl-link-%s", kind);
			ops = rtnl_link_ops_get(kind, &ops_srcu_index);
		}
#endif
	}

	/*
	 * Initialised before the ops checks below because the peer
	 * namespace, if any, is added from inside that block.
	 */
	rtnl_nets_init(&rtnl_nets);

	if (ops) {
		/* tbs->attr only has RTNL_MAX_TYPE + 1 slots. */
		if (ops->maxtype > RTNL_MAX_TYPE) {
			ret = -EINVAL;
			goto put_ops;
		}

		if (ops->maxtype && linkinfo[IFLA_INFO_DATA]) {
			ret = nla_parse_nested_deprecated(tbs->attr, ops->maxtype,
							  linkinfo[IFLA_INFO_DATA],
							  ops->policy, extack);
			if (ret < 0)
				goto put_ops;

			data = tbs->attr;
		}

		if (ops->validate) {
			ret = ops->validate(tb, data, extack);
			if (ret < 0)
				goto put_ops;
		}

		if (ops->peer_type) {
			peer_net = rtnl_get_peer_net(ops, tb, data, extack);
			if (IS_ERR(peer_net)) {
				ret = PTR_ERR(peer_net);
				goto put_ops;
			}
			if (peer_net)
				rtnl_nets_add(&rtnl_nets, peer_net);
		}
	}

	tgt_net = rtnl_link_get_net_capable(skb, sock_net(skb->sk), tb, CAP_NET_ADMIN);
	if (IS_ERR(tgt_net)) {
		ret = PTR_ERR(tgt_net);
		goto put_net;
	}

	rtnl_nets_add(&rtnl_nets, tgt_net);

	if (tb[IFLA_LINK_NETNSID]) {
		int id = nla_get_s32(tb[IFLA_LINK_NETNSID]);

		link_net = get_net_ns_by_id(tgt_net, id);
		if (!link_net) {
			NL_SET_ERR_MSG(extack, "Unknown network namespace id");
			ret = -EINVAL;
			goto put_net;
		}

		/*
		 * link_net is added to the set before the capability check,
		 * so the -EPERM path still reaches rtnl_nets_destroy() with
		 * it included.
		 */
		rtnl_nets_add(&rtnl_nets, link_net);

		if (!netlink_ns_capable(skb, link_net->user_ns, CAP_NET_ADMIN)) {
			ret = -EPERM;
			goto put_net;
		}
	}

	rtnl_nets_lock(&rtnl_nets);
	ret = __rtnl_newlink(skb, nlh, ops, tgt_net, link_net, peer_net, tbs, data, extack);
	rtnl_nets_unlock(&rtnl_nets);

put_net:
	rtnl_nets_destroy(&rtnl_nets);
put_ops:
	if (ops)
		rtnl_link_ops_put(ops, ops_srcu_index);
free:
	kfree(tbs);
	return ret;
}
4034
rtnl_valid_getlink_req(struct sk_buff * skb,const struct nlmsghdr * nlh,struct nlattr ** tb,struct netlink_ext_ack * extack)4035 static int rtnl_valid_getlink_req(struct sk_buff *skb,
4036 const struct nlmsghdr *nlh,
4037 struct nlattr **tb,
4038 struct netlink_ext_ack *extack)
4039 {
4040 struct ifinfomsg *ifm;
4041 int i, err;
4042
4043 if (nlh->nlmsg_len < nlmsg_msg_size(sizeof(*ifm))) {
4044 NL_SET_ERR_MSG(extack, "Invalid header for get link");
4045 return -EINVAL;
4046 }
4047
4048 if (!netlink_strict_get_check(skb))
4049 return nlmsg_parse_deprecated(nlh, sizeof(*ifm), tb, IFLA_MAX,
4050 ifla_policy, extack);
4051
4052 ifm = nlmsg_data(nlh);
4053 if (ifm->__ifi_pad || ifm->ifi_type || ifm->ifi_flags ||
4054 ifm->ifi_change) {
4055 NL_SET_ERR_MSG(extack, "Invalid values in header for get link request");
4056 return -EINVAL;
4057 }
4058
4059 err = nlmsg_parse_deprecated_strict(nlh, sizeof(*ifm), tb, IFLA_MAX,
4060 ifla_policy, extack);
4061 if (err)
4062 return err;
4063
4064 for (i = 0; i <= IFLA_MAX; i++) {
4065 if (!tb[i])
4066 continue;
4067
4068 switch (i) {
4069 case IFLA_IFNAME:
4070 case IFLA_ALT_IFNAME:
4071 case IFLA_EXT_MASK:
4072 case IFLA_TARGET_NETNSID:
4073 break;
4074 default:
4075 NL_SET_ERR_MSG(extack, "Unsupported attribute in get link request");
4076 return -EINVAL;
4077 }
4078 }
4079
4080 return 0;
4081 }
4082
rtnl_getlink(struct sk_buff * skb,struct nlmsghdr * nlh,struct netlink_ext_ack * extack)4083 static int rtnl_getlink(struct sk_buff *skb, struct nlmsghdr *nlh,
4084 struct netlink_ext_ack *extack)
4085 {
4086 struct net *net = sock_net(skb->sk);
4087 struct net *tgt_net = net;
4088 struct ifinfomsg *ifm;
4089 struct nlattr *tb[IFLA_MAX+1];
4090 struct net_device *dev = NULL;
4091 struct sk_buff *nskb;
4092 int netnsid = -1;
4093 int err;
4094 u32 ext_filter_mask = 0;
4095
4096 err = rtnl_valid_getlink_req(skb, nlh, tb, extack);
4097 if (err < 0)
4098 return err;
4099
4100 err = rtnl_ensure_unique_netns(tb, extack, true);
4101 if (err < 0)
4102 return err;
4103
4104 if (tb[IFLA_TARGET_NETNSID]) {
4105 netnsid = nla_get_s32(tb[IFLA_TARGET_NETNSID]);
4106 tgt_net = rtnl_get_net_ns_capable(NETLINK_CB(skb).sk, netnsid);
4107 if (IS_ERR(tgt_net))
4108 return PTR_ERR(tgt_net);
4109 }
4110
4111 if (tb[IFLA_EXT_MASK])
4112 ext_filter_mask = nla_get_u32(tb[IFLA_EXT_MASK]);
4113
4114 err = -EINVAL;
4115 ifm = nlmsg_data(nlh);
4116 if (ifm->ifi_index > 0)
4117 dev = __dev_get_by_index(tgt_net, ifm->ifi_index);
4118 else if (tb[IFLA_IFNAME] || tb[IFLA_ALT_IFNAME])
4119 dev = rtnl_dev_get(tgt_net, tb);
4120 else
4121 goto out;
4122
4123 err = -ENODEV;
4124 if (dev == NULL)
4125 goto out;
4126
4127 err = -ENOBUFS;
4128 nskb = nlmsg_new_large(if_nlmsg_size(dev, ext_filter_mask));
4129 if (nskb == NULL)
4130 goto out;
4131
4132 /* Synchronize the carrier state so we don't report a state
4133 * that we're not actually going to honour immediately; if
4134 * the driver just did a carrier off->on transition, we can
4135 * only TX if link watch work has run, but without this we'd
4136 * already report carrier on, even if it doesn't work yet.
4137 */
4138 linkwatch_sync_dev(dev);
4139
4140 err = rtnl_fill_ifinfo(nskb, dev, net,
4141 RTM_NEWLINK, NETLINK_CB(skb).portid,
4142 nlh->nlmsg_seq, 0, 0, ext_filter_mask,
4143 0, NULL, 0, netnsid, GFP_KERNEL);
4144 if (err < 0) {
4145 /* -EMSGSIZE implies BUG in if_nlmsg_size */
4146 WARN_ON(err == -EMSGSIZE);
4147 kfree_skb(nskb);
4148 } else
4149 err = rtnl_unicast(nskb, net, NETLINK_CB(skb).portid);
4150 out:
4151 if (netnsid >= 0)
4152 put_net(tgt_net);
4153
4154 return err;
4155 }
4156
/*
 * Add or remove one alternative interface name on @dev.
 *
 * @cmd:     RTM_NEWLINKPROP to add, RTM_DELLINKPROP to remove
 * @attr:    attribute carrying the name; validated against ifla_policy
 * @changed: set to true when the operation succeeds, untouched otherwise
 *
 * For additions, the request is refused with -EINVAL if the device's
 * property list size plus one more maximum-size name attribute would
 * reach U16_MAX.
 *
 * Returns 0 or a negative errno.
 */
static int rtnl_alt_ifname(int cmd, struct net_device *dev, struct nlattr *attr,
			   bool *changed, struct netlink_ext_ack *extack)
{
	char *name;
	int err;

	err = nla_validate(attr, attr->nla_len, IFLA_MAX, ifla_policy, extack);
	if (err)
		return err;

	if (cmd == RTM_NEWLINKPROP) {
		size_t size = rtnl_prop_list_size(dev);

		size += nla_total_size(ALTIFNAMSIZ);
		if (size >= U16_MAX) {
			NL_SET_ERR_MSG(extack,
				       "effective property list too long");
			return -EINVAL;
		}
	}

	name = nla_strdup(attr, GFP_KERNEL_ACCOUNT);
	if (!name)
		return -ENOMEM;

	switch (cmd) {
	case RTM_NEWLINKPROP:
		err = netdev_name_node_alt_create(dev, name);
		/*
		 * On success the pointer is cleared so the kfree() below
		 * leaves the string alone.
		 * NOTE(review): presumably the name node now owns it; confirm.
		 */
		if (!err)
			name = NULL;
		break;
	case RTM_DELLINKPROP:
		err = netdev_name_node_alt_destroy(dev, name);
		break;
	default:
		WARN_ON_ONCE(1);
		err = -EINVAL;
		break;
	}

	kfree(name);
	if (!err)
		*changed = true;

	return err;
}
4198
rtnl_linkprop(int cmd,struct sk_buff * skb,struct nlmsghdr * nlh,struct netlink_ext_ack * extack)4199 static int rtnl_linkprop(int cmd, struct sk_buff *skb, struct nlmsghdr *nlh,
4200 struct netlink_ext_ack *extack)
4201 {
4202 struct net *net = sock_net(skb->sk);
4203 struct nlattr *tb[IFLA_MAX + 1];
4204 struct net_device *dev;
4205 struct ifinfomsg *ifm;
4206 bool changed = false;
4207 struct nlattr *attr;
4208 int err, rem;
4209
4210 err = nlmsg_parse(nlh, sizeof(*ifm), tb, IFLA_MAX, ifla_policy, extack);
4211 if (err)
4212 return err;
4213
4214 err = rtnl_ensure_unique_netns(tb, extack, true);
4215 if (err)
4216 return err;
4217
4218 ifm = nlmsg_data(nlh);
4219 if (ifm->ifi_index > 0)
4220 dev = __dev_get_by_index(net, ifm->ifi_index);
4221 else if (tb[IFLA_IFNAME] || tb[IFLA_ALT_IFNAME])
4222 dev = rtnl_dev_get(net, tb);
4223 else
4224 return -EINVAL;
4225
4226 if (!dev)
4227 return -ENODEV;
4228
4229 if (!tb[IFLA_PROP_LIST])
4230 return 0;
4231
4232 nla_for_each_nested(attr, tb[IFLA_PROP_LIST], rem) {
4233 switch (nla_type(attr)) {
4234 case IFLA_ALT_IFNAME:
4235 err = rtnl_alt_ifname(cmd, dev, attr, &changed, extack);
4236 if (err)
4237 return err;
4238 break;
4239 }
4240 }
4241
4242 if (changed)
4243 netdev_state_change(dev);
4244 return 0;
4245 }
4246
/* Add link properties: rtnl_linkprop() with cmd RTM_NEWLINKPROP. */
static int rtnl_newlinkprop(struct sk_buff *skb, struct nlmsghdr *nlh,
			    struct netlink_ext_ack *extack)
{
	return rtnl_linkprop(RTM_NEWLINKPROP, skb, nlh, extack);
}
4252
rtnl_dellinkprop(struct sk_buff * skb,struct nlmsghdr * nlh,struct netlink_ext_ack * extack)4253 static int rtnl_dellinkprop(struct sk_buff *skb, struct nlmsghdr *nlh,
4254 struct netlink_ext_ack *extack)
4255 {
4256 return rtnl_linkprop(RTM_DELLINKPROP, skb, nlh, extack);
4257 }
4258
rtnl_calcit(struct sk_buff * skb,struct nlmsghdr * nlh)4259 static noinline_for_stack u32 rtnl_calcit(struct sk_buff *skb,
4260 struct nlmsghdr *nlh)
4261 {
4262 struct net *net = sock_net(skb->sk);
4263 size_t min_ifinfo_dump_size = 0;
4264 u32 ext_filter_mask = 0;
4265 struct net_device *dev;
4266 struct nlattr *nla;
4267 int hdrlen, rem;
4268
4269 /* Same kernel<->userspace interface hack as in rtnl_dump_ifinfo. */
4270 hdrlen = nlmsg_len(nlh) < sizeof(struct ifinfomsg) ?
4271 sizeof(struct rtgenmsg) : sizeof(struct ifinfomsg);
4272
4273 if (nlh->nlmsg_len < nlmsg_msg_size(hdrlen))
4274 return NLMSG_GOODSIZE;
4275
4276 nla_for_each_attr_type(nla, IFLA_EXT_MASK,
4277 nlmsg_attrdata(nlh, hdrlen),
4278 nlmsg_attrlen(nlh, hdrlen), rem) {
4279 if (nla_len(nla) == sizeof(u32))
4280 ext_filter_mask = nla_get_u32(nla);
4281 }
4282
4283 if (!ext_filter_mask)
4284 return NLMSG_GOODSIZE;
4285 /*
4286 * traverse the list of net devices and compute the minimum
4287 * buffer size based upon the filter mask.
4288 */
4289 rcu_read_lock();
4290 for_each_netdev_rcu(net, dev) {
4291 min_ifinfo_dump_size = max(min_ifinfo_dump_size,
4292 if_nlmsg_size(dev, ext_filter_mask));
4293 }
4294 rcu_read_unlock();
4295
4296 return nlmsg_total_size(min_ifinfo_dump_size);
4297 }
4298
rtnl_dump_all(struct sk_buff * skb,struct netlink_callback * cb)4299 static int rtnl_dump_all(struct sk_buff *skb, struct netlink_callback *cb)
4300 {
4301 int idx;
4302 int s_idx = cb->family;
4303 int type = cb->nlh->nlmsg_type - RTM_BASE;
4304 int ret = 0;
4305
4306 if (s_idx == 0)
4307 s_idx = 1;
4308
4309 for (idx = 1; idx <= RTNL_FAMILY_MAX; idx++) {
4310 struct rtnl_link __rcu **tab;
4311 struct rtnl_link *link;
4312 rtnl_dumpit_func dumpit;
4313
4314 if (idx < s_idx || idx == PF_PACKET)
4315 continue;
4316
4317 if (type < 0 || type >= RTM_NR_MSGTYPES)
4318 continue;
4319
4320 tab = rcu_dereference_rtnl(rtnl_msg_handlers[idx]);
4321 if (!tab)
4322 continue;
4323
4324 link = rcu_dereference_rtnl(tab[type]);
4325 if (!link)
4326 continue;
4327
4328 dumpit = link->dumpit;
4329 if (!dumpit)
4330 continue;
4331
4332 if (idx > s_idx) {
4333 memset(&cb->args[0], 0, sizeof(cb->args));
4334 cb->prev_seq = 0;
4335 cb->seq = 0;
4336 }
4337 ret = dumpit(skb, cb);
4338 if (ret)
4339 break;
4340 }
4341 cb->family = idx;
4342
4343 return skb->len ? : ret;
4344 }
4345
/*
 * Allocate and fill a link-info netlink message for @dev.
 *
 * The sequence number is taken from @nlh when nlmsg_report() says the
 * requester wants a report; otherwise @portid is forced to 0.
 *
 * Returns the filled skb, or NULL on failure, in which case the error
 * (-ENOBUFS for an allocation failure, else the rtnl_fill_ifinfo() result)
 * is passed to rtnl_set_sk_err() for RTNLGRP_LINK.
 */
struct sk_buff *rtmsg_ifinfo_build_skb(int type, struct net_device *dev,
				       unsigned int change,
				       u32 event, gfp_t flags, int *new_nsid,
				       int new_ifindex, u32 portid,
				       const struct nlmsghdr *nlh)
{
	struct net *net = dev_net(dev);
	struct sk_buff *skb;
	u32 seq = 0;
	int err;

	skb = nlmsg_new(if_nlmsg_size(dev, 0), flags);
	if (!skb) {
		err = -ENOBUFS;
		goto report;
	}

	if (nlmsg_report(nlh))
		seq = nlmsg_seq(nlh);
	else
		portid = 0;

	err = rtnl_fill_ifinfo(skb, dev, dev_net(dev),
			       type, portid, seq, change, 0, 0, event,
			       new_nsid, new_ifindex, -1, flags);
	if (err >= 0)
		return skb;

	/* -EMSGSIZE implies BUG in if_nlmsg_size() */
	WARN_ON(err == -EMSGSIZE);
	kfree_skb(skb);
report:
	rtnl_set_sk_err(net, RTNLGRP_LINK, err);
	return NULL;
}
4380
/* Hand a prepared link message to rtnl_notify() for RTNLGRP_LINK in @dev's netns. */
void rtmsg_ifinfo_send(struct sk_buff *skb, struct net_device *dev, gfp_t flags,
		       u32 portid, const struct nlmsghdr *nlh)
{
	rtnl_notify(skb, dev_net(dev), portid, RTNLGRP_LINK, nlh, flags);
}
4388
/*
 * Build and send a link message for @dev carrying @event.
 * Nothing is done unless the device is in the NETREG_REGISTERED state,
 * and nothing is sent if building the message fails.
 */
static void rtmsg_ifinfo_event(int type, struct net_device *dev,
			       unsigned int change, u32 event,
			       gfp_t flags, int *new_nsid, int new_ifindex,
			       u32 portid, const struct nlmsghdr *nlh)
{
	struct sk_buff *msg;

	if (dev->reg_state != NETREG_REGISTERED)
		return;

	msg = rtmsg_ifinfo_build_skb(type, dev, change, event, flags, new_nsid,
				     new_ifindex, portid, nlh);
	if (!msg)
		return;

	rtmsg_ifinfo_send(msg, dev, flags, portid, nlh);
}
4404
/*
 * Send a link message for @dev with the event derived from
 * rtnl_get_event(0), and with no new-netns id or new ifindex.
 */
void rtmsg_ifinfo(int type, struct net_device *dev, unsigned int change,
		  gfp_t flags, u32 portid, const struct nlmsghdr *nlh)
{
	u32 event = rtnl_get_event(0);

	rtmsg_ifinfo_event(type, dev, change, event, flags,
			   NULL, 0, portid, nlh);
}
4411
/*
 * Send a link message for @dev that also carries @new_nsid and
 * @new_ifindex; sent with portid 0 and without a request header.
 */
void rtmsg_ifinfo_newnet(int type, struct net_device *dev, unsigned int change,
			 gfp_t flags, int *new_nsid, int new_ifindex)
{
	u32 event = rtnl_get_event(0);

	rtmsg_ifinfo_event(type, dev, change, event, flags,
			   new_nsid, new_ifindex, 0, NULL);
}
4418
/*
 * Append one AF_BRIDGE neighbour message describing @addr on @dev to @skb.
 *
 * NDA_LLADDR is always emitted (dev->addr_len bytes); NDA_VLAN only when
 * @vid is non-zero.  Returns 0 on success or -EMSGSIZE if the message does
 * not fit, in which case the partially built message is cancelled.
 */
static int nlmsg_populate_fdb_fill(struct sk_buff *skb,
				   struct net_device *dev,
				   u8 *addr, u16 vid, u32 pid, u32 seq,
				   int type, unsigned int flags,
				   int nlflags, u16 ndm_state)
{
	struct nlmsghdr *nlh;
	struct ndmsg *hdr;

	nlh = nlmsg_put(skb, pid, seq, type, sizeof(*hdr), nlflags);
	if (!nlh)
		return -EMSGSIZE;

	hdr = nlmsg_data(nlh);
	hdr->ndm_family	 = AF_BRIDGE;
	hdr->ndm_pad1	 = 0;
	hdr->ndm_pad2	 = 0;
	hdr->ndm_ifindex = dev->ifindex;
	hdr->ndm_state	 = ndm_state;
	hdr->ndm_flags	 = flags;
	hdr->ndm_type	 = 0;

	if (nla_put(skb, NDA_LLADDR, dev->addr_len, addr))
		goto cancel;

	if (vid && nla_put(skb, NDA_VLAN, sizeof(u16), &vid))
		goto cancel;

	nlmsg_end(skb, nlh);
	return 0;

cancel:
	nlmsg_cancel(skb, nlh);
	return -EMSGSIZE;
}
4454
rtnl_fdb_nlmsg_size(const struct net_device * dev)4455 static inline size_t rtnl_fdb_nlmsg_size(const struct net_device *dev)
4456 {
4457 return NLMSG_ALIGN(sizeof(struct ndmsg)) +
4458 nla_total_size(dev->addr_len) + /* NDA_LLADDR */
4459 nla_total_size(sizeof(u16)) + /* NDA_VLAN */
4460 0;
4461 }
4462
/*
 * Notify RTNLGRP_NEIGH listeners about an FDB entry change on @dev.
 *
 * The message is built with GFP_ATOMIC and flagged NTF_SELF.  On failure
 * the error (-ENOBUFS for allocation, else the fill result) is passed to
 * rtnl_set_sk_err() for the group instead.
 */
static void rtnl_fdb_notify(struct net_device *dev, u8 *addr, u16 vid, int type,
			    u16 ndm_state)
{
	struct net *net = dev_net(dev);
	struct sk_buff *skb;
	int err;

	skb = nlmsg_new(rtnl_fdb_nlmsg_size(dev), GFP_ATOMIC);
	if (!skb) {
		err = -ENOBUFS;
		goto report;
	}

	err = nlmsg_populate_fdb_fill(skb, dev, addr, vid,
				      0, 0, type, NTF_SELF, 0, ndm_state);
	if (err >= 0) {
		rtnl_notify(skb, net, 0, RTNLGRP_NEIGH, NULL, GFP_ATOMIC);
		return;
	}

	kfree_skb(skb);
report:
	rtnl_set_sk_err(net, RTNLGRP_NEIGH, err);
}
4486
4487 /*
4488 * ndo_dflt_fdb_add - default netdevice operation to add an FDB entry
4489 */
ndo_dflt_fdb_add(struct ndmsg * ndm,struct nlattr * tb[],struct net_device * dev,const unsigned char * addr,u16 vid,u16 flags)4490 int ndo_dflt_fdb_add(struct ndmsg *ndm,
4491 struct nlattr *tb[],
4492 struct net_device *dev,
4493 const unsigned char *addr, u16 vid,
4494 u16 flags)
4495 {
4496 int err = -EINVAL;
4497
4498 /* If aging addresses are supported device will need to
4499 * implement its own handler for this.
4500 */
4501 if (ndm->ndm_state && !(ndm->ndm_state & NUD_PERMANENT)) {
4502 netdev_info(dev, "default FDB implementation only supports local addresses\n");
4503 return err;
4504 }
4505
4506 if (tb[NDA_FLAGS_EXT]) {
4507 netdev_info(dev, "invalid flags given to default FDB implementation\n");
4508 return err;
4509 }
4510
4511 if (vid) {
4512 netdev_info(dev, "vlans aren't supported yet for dev_uc|mc_add()\n");
4513 return err;
4514 }
4515
4516 if (is_unicast_ether_addr(addr) || is_link_local_ether_addr(addr))
4517 err = dev_uc_add_excl(dev, addr);
4518 else if (is_multicast_ether_addr(addr))
4519 err = dev_mc_add_excl(dev, addr);
4520
4521 /* Only return duplicate errors if NLM_F_EXCL is set */
4522 if (err == -EEXIST && !(flags & NLM_F_EXCL))
4523 err = 0;
4524
4525 return err;
4526 }
4527 EXPORT_SYMBOL(ndo_dflt_fdb_add);
4528
/*
 * Extract a VLAN id from an optional NDA_VLAN attribute.
 *
 * A missing attribute yields *@p_vid = 0.  A present attribute must be
 * exactly u16-sized and hold a value that is non-zero and below
 * VLAN_VID_MASK; otherwise -EINVAL is returned with an extack message and
 * *@p_vid is left untouched.
 */
static int fdb_vid_parse(struct nlattr *vlan_attr, u16 *p_vid,
			 struct netlink_ext_ack *extack)
{
	u16 vid;

	if (!vlan_attr) {
		*p_vid = 0;
		return 0;
	}

	if (nla_len(vlan_attr) != sizeof(u16)) {
		NL_SET_ERR_MSG(extack, "invalid vlan attribute size");
		return -EINVAL;
	}

	vid = nla_get_u16(vlan_attr);
	if (!vid || vid >= VLAN_VID_MASK) {
		NL_SET_ERR_MSG(extack, "invalid vlan id");
		return -EINVAL;
	}

	*p_vid = vid;
	return 0;
}
4550
rtnl_fdb_add(struct sk_buff * skb,struct nlmsghdr * nlh,struct netlink_ext_ack * extack)4551 static int rtnl_fdb_add(struct sk_buff *skb, struct nlmsghdr *nlh,
4552 struct netlink_ext_ack *extack)
4553 {
4554 struct net *net = sock_net(skb->sk);
4555 struct ndmsg *ndm;
4556 struct nlattr *tb[NDA_MAX+1];
4557 struct net_device *dev;
4558 u8 *addr;
4559 u16 vid;
4560 int err;
4561
4562 err = nlmsg_parse_deprecated(nlh, sizeof(*ndm), tb, NDA_MAX, NULL,
4563 extack);
4564 if (err < 0)
4565 return err;
4566
4567 ndm = nlmsg_data(nlh);
4568 if (ndm->ndm_ifindex == 0) {
4569 NL_SET_ERR_MSG(extack, "invalid ifindex");
4570 return -EINVAL;
4571 }
4572
4573 dev = __dev_get_by_index(net, ndm->ndm_ifindex);
4574 if (dev == NULL) {
4575 NL_SET_ERR_MSG(extack, "unknown ifindex");
4576 return -ENODEV;
4577 }
4578
4579 if (!tb[NDA_LLADDR] || nla_len(tb[NDA_LLADDR]) != ETH_ALEN) {
4580 NL_SET_ERR_MSG(extack, "invalid address");
4581 return -EINVAL;
4582 }
4583
4584 if (dev->type != ARPHRD_ETHER) {
4585 NL_SET_ERR_MSG(extack, "FDB add only supported for Ethernet devices");
4586 return -EINVAL;
4587 }
4588
4589 addr = nla_data(tb[NDA_LLADDR]);
4590
4591 err = fdb_vid_parse(tb[NDA_VLAN], &vid, extack);
4592 if (err)
4593 return err;
4594
4595 err = -EOPNOTSUPP;
4596
4597 /* Support fdb on master device the net/bridge default case */
4598 if ((!ndm->ndm_flags || ndm->ndm_flags & NTF_MASTER) &&
4599 netif_is_bridge_port(dev)) {
4600 struct net_device *br_dev = netdev_master_upper_dev_get(dev);
4601 const struct net_device_ops *ops = br_dev->netdev_ops;
4602 bool notified = false;
4603
4604 err = ops->ndo_fdb_add(ndm, tb, dev, addr, vid,
4605 nlh->nlmsg_flags, ¬ified, extack);
4606 if (err)
4607 goto out;
4608 else
4609 ndm->ndm_flags &= ~NTF_MASTER;
4610 }
4611
4612 /* Embedded bridge, macvlan, and any other device support */
4613 if ((ndm->ndm_flags & NTF_SELF)) {
4614 bool notified = false;
4615
4616 if (dev->netdev_ops->ndo_fdb_add)
4617 err = dev->netdev_ops->ndo_fdb_add(ndm, tb, dev, addr,
4618 vid,
4619 nlh->nlmsg_flags,
4620 ¬ified, extack);
4621 else
4622 err = ndo_dflt_fdb_add(ndm, tb, dev, addr, vid,
4623 nlh->nlmsg_flags);
4624
4625 if (!err && !notified) {
4626 rtnl_fdb_notify(dev, addr, vid, RTM_NEWNEIGH,
4627 ndm->ndm_state);
4628 ndm->ndm_flags &= ~NTF_SELF;
4629 }
4630 }
4631 out:
4632 return err;
4633 }
4634
4635 /*
4636 * ndo_dflt_fdb_del - default netdevice operation to delete an FDB entry
4637 */
ndo_dflt_fdb_del(struct ndmsg * ndm,struct nlattr * tb[],struct net_device * dev,const unsigned char * addr,u16 vid)4638 int ndo_dflt_fdb_del(struct ndmsg *ndm,
4639 struct nlattr *tb[],
4640 struct net_device *dev,
4641 const unsigned char *addr, u16 vid)
4642 {
4643 int err = -EINVAL;
4644
4645 /* If aging addresses are supported device will need to
4646 * implement its own handler for this.
4647 */
4648 if (!(ndm->ndm_state & NUD_PERMANENT)) {
4649 netdev_info(dev, "default FDB implementation only supports local addresses\n");
4650 return err;
4651 }
4652
4653 if (is_unicast_ether_addr(addr) || is_link_local_ether_addr(addr))
4654 err = dev_uc_del(dev, addr);
4655 else if (is_multicast_ether_addr(addr))
4656 err = dev_mc_del(dev, addr);
4657
4658 return err;
4659 }
4660 EXPORT_SYMBOL(ndo_dflt_fdb_del);
4661
rtnl_fdb_del(struct sk_buff * skb,struct nlmsghdr * nlh,struct netlink_ext_ack * extack)4662 static int rtnl_fdb_del(struct sk_buff *skb, struct nlmsghdr *nlh,
4663 struct netlink_ext_ack *extack)
4664 {
4665 bool del_bulk = !!(nlh->nlmsg_flags & NLM_F_BULK);
4666 struct net *net = sock_net(skb->sk);
4667 const struct net_device_ops *ops;
4668 struct ndmsg *ndm;
4669 struct nlattr *tb[NDA_MAX+1];
4670 struct net_device *dev;
4671 __u8 *addr = NULL;
4672 int err;
4673 u16 vid;
4674
4675 if (!netlink_capable(skb, CAP_NET_ADMIN))
4676 return -EPERM;
4677
4678 if (!del_bulk) {
4679 err = nlmsg_parse_deprecated(nlh, sizeof(*ndm), tb, NDA_MAX,
4680 NULL, extack);
4681 } else {
4682 /* For bulk delete, the drivers will parse the message with
4683 * policy.
4684 */
4685 err = nlmsg_parse(nlh, sizeof(*ndm), tb, NDA_MAX, NULL, extack);
4686 }
4687 if (err < 0)
4688 return err;
4689
4690 ndm = nlmsg_data(nlh);
4691 if (ndm->ndm_ifindex == 0) {
4692 NL_SET_ERR_MSG(extack, "invalid ifindex");
4693 return -EINVAL;
4694 }
4695
4696 dev = __dev_get_by_index(net, ndm->ndm_ifindex);
4697 if (dev == NULL) {
4698 NL_SET_ERR_MSG(extack, "unknown ifindex");
4699 return -ENODEV;
4700 }
4701
4702 if (!del_bulk) {
4703 if (!tb[NDA_LLADDR] || nla_len(tb[NDA_LLADDR]) != ETH_ALEN) {
4704 NL_SET_ERR_MSG(extack, "invalid address");
4705 return -EINVAL;
4706 }
4707 addr = nla_data(tb[NDA_LLADDR]);
4708
4709 err = fdb_vid_parse(tb[NDA_VLAN], &vid, extack);
4710 if (err)
4711 return err;
4712 }
4713
4714 if (dev->type != ARPHRD_ETHER) {
4715 NL_SET_ERR_MSG(extack, "FDB delete only supported for Ethernet devices");
4716 return -EINVAL;
4717 }
4718
4719 err = -EOPNOTSUPP;
4720
4721 /* Support fdb on master device the net/bridge default case */
4722 if ((!ndm->ndm_flags || ndm->ndm_flags & NTF_MASTER) &&
4723 netif_is_bridge_port(dev)) {
4724 struct net_device *br_dev = netdev_master_upper_dev_get(dev);
4725 bool notified = false;
4726
4727 ops = br_dev->netdev_ops;
4728 if (!del_bulk) {
4729 if (ops->ndo_fdb_del)
4730 err = ops->ndo_fdb_del(ndm, tb, dev, addr, vid,
4731 ¬ified, extack);
4732 } else {
4733 if (ops->ndo_fdb_del_bulk)
4734 err = ops->ndo_fdb_del_bulk(nlh, dev, extack);
4735 }
4736
4737 if (err)
4738 goto out;
4739 else
4740 ndm->ndm_flags &= ~NTF_MASTER;
4741 }
4742
4743 /* Embedded bridge, macvlan, and any other device support */
4744 if (ndm->ndm_flags & NTF_SELF) {
4745 bool notified = false;
4746
4747 ops = dev->netdev_ops;
4748 if (!del_bulk) {
4749 if (ops->ndo_fdb_del)
4750 err = ops->ndo_fdb_del(ndm, tb, dev, addr, vid,
4751 ¬ified, extack);
4752 else
4753 err = ndo_dflt_fdb_del(ndm, tb, dev, addr, vid);
4754 } else {
4755 /* in case err was cleared by NTF_MASTER call */
4756 err = -EOPNOTSUPP;
4757 if (ops->ndo_fdb_del_bulk)
4758 err = ops->ndo_fdb_del_bulk(nlh, dev, extack);
4759 }
4760
4761 if (!err) {
4762 if (!del_bulk && !notified)
4763 rtnl_fdb_notify(dev, addr, vid, RTM_DELNEIGH,
4764 ndm->ndm_state);
4765 ndm->ndm_flags &= ~NTF_SELF;
4766 }
4767 }
4768 out:
4769 return err;
4770 }
4771
nlmsg_populate_fdb(struct sk_buff * skb,struct netlink_callback * cb,struct net_device * dev,int * idx,struct netdev_hw_addr_list * list)4772 static int nlmsg_populate_fdb(struct sk_buff *skb,
4773 struct netlink_callback *cb,
4774 struct net_device *dev,
4775 int *idx,
4776 struct netdev_hw_addr_list *list)
4777 {
4778 struct ndo_fdb_dump_context *ctx = (void *)cb->ctx;
4779 struct netdev_hw_addr *ha;
4780 u32 portid, seq;
4781 int err;
4782
4783 portid = NETLINK_CB(cb->skb).portid;
4784 seq = cb->nlh->nlmsg_seq;
4785
4786 list_for_each_entry(ha, &list->list, list) {
4787 if (*idx < ctx->fdb_idx)
4788 goto skip;
4789
4790 err = nlmsg_populate_fdb_fill(skb, dev, ha->addr, 0,
4791 portid, seq,
4792 RTM_NEWNEIGH, NTF_SELF,
4793 NLM_F_MULTI, NUD_PERMANENT);
4794 if (err < 0)
4795 return err;
4796 skip:
4797 *idx += 1;
4798 }
4799 return 0;
4800 }
4801
4802 /**
4803 * ndo_dflt_fdb_dump - default netdevice operation to dump an FDB table.
4804 * @skb: socket buffer to store message in
4805 * @cb: netlink callback
4806 * @dev: netdevice
4807 * @filter_dev: ignored
4808 * @idx: the number of FDB table entries dumped is added to *@idx
4809 *
4810 * Default netdevice operation to dump the existing unicast address list.
4811 * Returns number of addresses from list put in skb.
4812 */
ndo_dflt_fdb_dump(struct sk_buff * skb,struct netlink_callback * cb,struct net_device * dev,struct net_device * filter_dev,int * idx)4813 int ndo_dflt_fdb_dump(struct sk_buff *skb,
4814 struct netlink_callback *cb,
4815 struct net_device *dev,
4816 struct net_device *filter_dev,
4817 int *idx)
4818 {
4819 int err;
4820
4821 if (dev->type != ARPHRD_ETHER)
4822 return -EINVAL;
4823
4824 netif_addr_lock_bh(dev);
4825 err = nlmsg_populate_fdb(skb, cb, dev, idx, &dev->uc);
4826 if (err)
4827 goto out;
4828 err = nlmsg_populate_fdb(skb, cb, dev, idx, &dev->mc);
4829 out:
4830 netif_addr_unlock_bh(dev);
4831 return err;
4832 }
4833 EXPORT_SYMBOL(ndo_dflt_fdb_dump);
4834
valid_fdb_dump_strict(const struct nlmsghdr * nlh,int * br_idx,int * brport_idx,struct netlink_ext_ack * extack)4835 static int valid_fdb_dump_strict(const struct nlmsghdr *nlh,
4836 int *br_idx, int *brport_idx,
4837 struct netlink_ext_ack *extack)
4838 {
4839 struct nlattr *tb[NDA_MAX + 1];
4840 struct ndmsg *ndm;
4841 int err, i;
4842
4843 if (nlh->nlmsg_len < nlmsg_msg_size(sizeof(*ndm))) {
4844 NL_SET_ERR_MSG(extack, "Invalid header for fdb dump request");
4845 return -EINVAL;
4846 }
4847
4848 ndm = nlmsg_data(nlh);
4849 if (ndm->ndm_pad1 || ndm->ndm_pad2 || ndm->ndm_state ||
4850 ndm->ndm_flags || ndm->ndm_type) {
4851 NL_SET_ERR_MSG(extack, "Invalid values in header for fdb dump request");
4852 return -EINVAL;
4853 }
4854
4855 err = nlmsg_parse_deprecated_strict(nlh, sizeof(struct ndmsg), tb,
4856 NDA_MAX, NULL, extack);
4857 if (err < 0)
4858 return err;
4859
4860 *brport_idx = ndm->ndm_ifindex;
4861 for (i = 0; i <= NDA_MAX; ++i) {
4862 if (!tb[i])
4863 continue;
4864
4865 switch (i) {
4866 case NDA_IFINDEX:
4867 if (nla_len(tb[i]) != sizeof(u32)) {
4868 NL_SET_ERR_MSG(extack, "Invalid IFINDEX attribute in fdb dump request");
4869 return -EINVAL;
4870 }
4871 *brport_idx = nla_get_u32(tb[NDA_IFINDEX]);
4872 break;
4873 case NDA_MASTER:
4874 if (nla_len(tb[i]) != sizeof(u32)) {
4875 NL_SET_ERR_MSG(extack, "Invalid MASTER attribute in fdb dump request");
4876 return -EINVAL;
4877 }
4878 *br_idx = nla_get_u32(tb[NDA_MASTER]);
4879 break;
4880 default:
4881 NL_SET_ERR_MSG(extack, "Unsupported attribute in fdb dump request");
4882 return -EINVAL;
4883 }
4884 }
4885
4886 return 0;
4887 }
4888
valid_fdb_dump_legacy(const struct nlmsghdr * nlh,int * br_idx,int * brport_idx,struct netlink_ext_ack * extack)4889 static int valid_fdb_dump_legacy(const struct nlmsghdr *nlh,
4890 int *br_idx, int *brport_idx,
4891 struct netlink_ext_ack *extack)
4892 {
4893 struct nlattr *tb[IFLA_MAX+1];
4894 int err;
4895
4896 /* A hack to preserve kernel<->userspace interface.
4897 * Before Linux v4.12 this code accepted ndmsg since iproute2 v3.3.0.
4898 * However, ndmsg is shorter than ifinfomsg thus nlmsg_parse() bails.
4899 * So, check for ndmsg with an optional u32 attribute (not used here).
4900 * Fortunately these sizes don't conflict with the size of ifinfomsg
4901 * with an optional attribute.
4902 */
4903 if (nlmsg_len(nlh) != sizeof(struct ndmsg) &&
4904 (nlmsg_len(nlh) != sizeof(struct ndmsg) +
4905 nla_attr_size(sizeof(u32)))) {
4906 struct ifinfomsg *ifm;
4907
4908 err = nlmsg_parse_deprecated(nlh, sizeof(struct ifinfomsg),
4909 tb, IFLA_MAX, ifla_policy,
4910 extack);
4911 if (err < 0) {
4912 return -EINVAL;
4913 } else if (err == 0) {
4914 if (tb[IFLA_MASTER])
4915 *br_idx = nla_get_u32(tb[IFLA_MASTER]);
4916 }
4917
4918 ifm = nlmsg_data(nlh);
4919 *brport_idx = ifm->ifi_index;
4920 }
4921 return 0;
4922 }
4923
rtnl_fdb_dump(struct sk_buff * skb,struct netlink_callback * cb)4924 static int rtnl_fdb_dump(struct sk_buff *skb, struct netlink_callback *cb)
4925 {
4926 const struct net_device_ops *ops = NULL, *cops = NULL;
4927 struct ndo_fdb_dump_context *ctx = (void *)cb->ctx;
4928 struct net_device *dev, *br_dev = NULL;
4929 struct net *net = sock_net(skb->sk);
4930 int brport_idx = 0;
4931 int br_idx = 0;
4932 int fidx = 0;
4933 int err;
4934
4935 NL_ASSERT_CTX_FITS(struct ndo_fdb_dump_context);
4936
4937 if (cb->strict_check)
4938 err = valid_fdb_dump_strict(cb->nlh, &br_idx, &brport_idx,
4939 cb->extack);
4940 else
4941 err = valid_fdb_dump_legacy(cb->nlh, &br_idx, &brport_idx,
4942 cb->extack);
4943 if (err < 0)
4944 return err;
4945
4946 if (br_idx) {
4947 br_dev = __dev_get_by_index(net, br_idx);
4948 if (!br_dev)
4949 return -ENODEV;
4950
4951 ops = br_dev->netdev_ops;
4952 }
4953
4954 for_each_netdev_dump(net, dev, ctx->ifindex) {
4955 if (brport_idx && (dev->ifindex != brport_idx))
4956 continue;
4957
4958 if (!br_idx) { /* user did not specify a specific bridge */
4959 if (netif_is_bridge_port(dev)) {
4960 br_dev = netdev_master_upper_dev_get(dev);
4961 cops = br_dev->netdev_ops;
4962 }
4963 } else {
4964 if (dev != br_dev &&
4965 !netif_is_bridge_port(dev))
4966 continue;
4967
4968 if (br_dev != netdev_master_upper_dev_get(dev) &&
4969 !netif_is_bridge_master(dev))
4970 continue;
4971 cops = ops;
4972 }
4973
4974 if (netif_is_bridge_port(dev)) {
4975 if (cops && cops->ndo_fdb_dump) {
4976 err = cops->ndo_fdb_dump(skb, cb, br_dev, dev,
4977 &fidx);
4978 if (err == -EMSGSIZE)
4979 break;
4980 }
4981 }
4982
4983 if (dev->netdev_ops->ndo_fdb_dump)
4984 err = dev->netdev_ops->ndo_fdb_dump(skb, cb, dev, NULL,
4985 &fidx);
4986 else
4987 err = ndo_dflt_fdb_dump(skb, cb, dev, NULL, &fidx);
4988 if (err == -EMSGSIZE)
4989 break;
4990
4991 cops = NULL;
4992
4993 /* reset fdb offset to 0 for rest of the interfaces */
4994 ctx->fdb_idx = 0;
4995 fidx = 0;
4996 }
4997
4998 ctx->fdb_idx = fidx;
4999
5000 return skb->len;
5001 }
5002
/*
 * Validate an FDB get request and extract its parameters.
 *
 * The ndmsg header must be complete, with padding, state and type zeroed
 * and no flags other than NTF_MASTER / NTF_SELF.  Accepted attributes are
 * NDA_MASTER, NDA_LLADDR (ETH_ALEN bytes), NDA_VLAN and NDA_VNI; NDA_VNI
 * is allowed through but not interpreted here.  Parsed attributes are
 * left in @tb for the caller.
 *
 * Returns 0 or a negative errno with an extack message.
 */
static int valid_fdb_get_strict(const struct nlmsghdr *nlh,
				struct nlattr **tb, u8 *ndm_flags,
				int *br_idx, int *brport_idx, u8 **addr,
				u16 *vid, struct netlink_ext_ack *extack)
{
	struct ndmsg *ndm;
	int type;
	int err;

	if (nlh->nlmsg_len < nlmsg_msg_size(sizeof(*ndm))) {
		NL_SET_ERR_MSG(extack, "Invalid header for fdb get request");
		return -EINVAL;
	}

	ndm = nlmsg_data(nlh);
	if (ndm->ndm_pad1 || ndm->ndm_pad2 || ndm->ndm_state ||
	    ndm->ndm_type) {
		NL_SET_ERR_MSG(extack, "Invalid values in header for fdb get request");
		return -EINVAL;
	}

	if (ndm->ndm_flags & ~(NTF_MASTER | NTF_SELF)) {
		NL_SET_ERR_MSG(extack, "Invalid flags in header for fdb get request");
		return -EINVAL;
	}

	err = nlmsg_parse_deprecated_strict(nlh, sizeof(struct ndmsg), tb,
					    NDA_MAX, nda_policy, extack);
	if (err < 0)
		return err;

	*ndm_flags = ndm->ndm_flags;
	*brport_idx = ndm->ndm_ifindex;

	/* Attributes are checked in ascending type order. */
	for (type = 0; type <= NDA_MAX; ++type) {
		struct nlattr *attr = tb[type];

		if (!attr)
			continue;

		if (type == NDA_MASTER) {
			*br_idx = nla_get_u32(attr);
		} else if (type == NDA_LLADDR) {
			if (nla_len(attr) != ETH_ALEN) {
				NL_SET_ERR_MSG(extack, "Invalid address in fdb get request");
				return -EINVAL;
			}
			*addr = nla_data(attr);
		} else if (type == NDA_VLAN) {
			err = fdb_vid_parse(attr, vid, extack);
			if (err)
				return err;
		} else if (type != NDA_VNI) {
			NL_SET_ERR_MSG(extack, "Unsupported attribute in fdb get request");
			return -EINVAL;
		}
	}

	return 0;
}
5065
rtnl_fdb_get(struct sk_buff * in_skb,struct nlmsghdr * nlh,struct netlink_ext_ack * extack)5066 static int rtnl_fdb_get(struct sk_buff *in_skb, struct nlmsghdr *nlh,
5067 struct netlink_ext_ack *extack)
5068 {
5069 struct net_device *dev = NULL, *br_dev = NULL;
5070 const struct net_device_ops *ops = NULL;
5071 struct net *net = sock_net(in_skb->sk);
5072 struct nlattr *tb[NDA_MAX + 1];
5073 struct sk_buff *skb;
5074 int brport_idx = 0;
5075 u8 ndm_flags = 0;
5076 int br_idx = 0;
5077 u8 *addr = NULL;
5078 u16 vid = 0;
5079 int err;
5080
5081 err = valid_fdb_get_strict(nlh, tb, &ndm_flags, &br_idx,
5082 &brport_idx, &addr, &vid, extack);
5083 if (err < 0)
5084 return err;
5085
5086 if (!addr) {
5087 NL_SET_ERR_MSG(extack, "Missing lookup address for fdb get request");
5088 return -EINVAL;
5089 }
5090
5091 if (brport_idx) {
5092 dev = __dev_get_by_index(net, brport_idx);
5093 if (!dev) {
5094 NL_SET_ERR_MSG(extack, "Unknown device ifindex");
5095 return -ENODEV;
5096 }
5097 }
5098
5099 if (br_idx) {
5100 if (dev) {
5101 NL_SET_ERR_MSG(extack, "Master and device are mutually exclusive");
5102 return -EINVAL;
5103 }
5104
5105 br_dev = __dev_get_by_index(net, br_idx);
5106 if (!br_dev) {
5107 NL_SET_ERR_MSG(extack, "Invalid master ifindex");
5108 return -EINVAL;
5109 }
5110 ops = br_dev->netdev_ops;
5111 }
5112
5113 if (dev) {
5114 if (!ndm_flags || (ndm_flags & NTF_MASTER)) {
5115 if (!netif_is_bridge_port(dev)) {
5116 NL_SET_ERR_MSG(extack, "Device is not a bridge port");
5117 return -EINVAL;
5118 }
5119 br_dev = netdev_master_upper_dev_get(dev);
5120 if (!br_dev) {
5121 NL_SET_ERR_MSG(extack, "Master of device not found");
5122 return -EINVAL;
5123 }
5124 ops = br_dev->netdev_ops;
5125 } else {
5126 if (!(ndm_flags & NTF_SELF)) {
5127 NL_SET_ERR_MSG(extack, "Missing NTF_SELF");
5128 return -EINVAL;
5129 }
5130 ops = dev->netdev_ops;
5131 }
5132 }
5133
5134 if (!br_dev && !dev) {
5135 NL_SET_ERR_MSG(extack, "No device specified");
5136 return -ENODEV;
5137 }
5138
5139 if (!ops || !ops->ndo_fdb_get) {
5140 NL_SET_ERR_MSG(extack, "Fdb get operation not supported by device");
5141 return -EOPNOTSUPP;
5142 }
5143
5144 skb = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
5145 if (!skb)
5146 return -ENOBUFS;
5147
5148 if (br_dev)
5149 dev = br_dev;
5150 err = ops->ndo_fdb_get(skb, tb, dev, addr, vid,
5151 NETLINK_CB(in_skb).portid,
5152 nlh->nlmsg_seq, extack);
5153 if (err)
5154 goto out;
5155
5156 return rtnl_unicast(skb, net, NETLINK_CB(in_skb).portid);
5157 out:
5158 kfree_skb(skb);
5159 return err;
5160 }
5161
/*
 * Emit @attrnum as a u8 boolean reflecting whether @flag is set in @flags,
 * but only if @flag is selected by @mask.  Returns the nla_put_u8() result,
 * or 0 when the flag is not selected.
 */
static int brport_nla_put_flag(struct sk_buff *skb, u32 flags, u32 mask,
			       unsigned int attrnum, unsigned int flag)
{
	if (!(mask & flag))
		return 0;

	return nla_put_u8(skb, attrnum, !!(flags & flag));
}
5169
/*
 * Build a default AF_BRIDGE RTM_NEWLINK message for @dev.
 *
 * The message carries the basic link attributes, an IFLA_AF_SPEC nest
 * (BRIDGE_FLAGS_SELF, @mode unless it is BRIDGE_MODE_UNDEF, plus whatever
 * the optional @vlan_fill callback adds) and an IFLA_PROTINFO nest with
 * one boolean per bridge-port flag selected by @mask.
 *
 * Returns 0 on success.  On failure the message is cancelled and the
 * @vlan_fill error is returned if that was the cause, else -EMSGSIZE.
 */
int ndo_dflt_bridge_getlink(struct sk_buff *skb, u32 pid, u32 seq,
			    struct net_device *dev, u16 mode,
			    u32 flags, u32 mask, int nlflags,
			    u32 filter_mask,
			    int (*vlan_fill)(struct sk_buff *skb,
					     struct net_device *dev,
					     u32 filter_mask))
{
	/* Port flags reported in IFLA_PROTINFO, in emission order. */
	static const struct {
		unsigned int attr;
		unsigned int flag;
	} brport_flags[] = {
		{ IFLA_BRPORT_MODE,		BR_HAIRPIN_MODE },
		{ IFLA_BRPORT_GUARD,		BR_BPDU_GUARD },
		{ IFLA_BRPORT_FAST_LEAVE,	BR_MULTICAST_FAST_LEAVE },
		{ IFLA_BRPORT_PROTECT,		BR_ROOT_BLOCK },
		{ IFLA_BRPORT_LEARNING,		BR_LEARNING },
		{ IFLA_BRPORT_LEARNING_SYNC,	BR_LEARNING_SYNC },
		{ IFLA_BRPORT_UNICAST_FLOOD,	BR_FLOOD },
		{ IFLA_BRPORT_PROXYARP,		BR_PROXYARP },
		{ IFLA_BRPORT_MCAST_FLOOD,	BR_MCAST_FLOOD },
		{ IFLA_BRPORT_BCAST_FLOOD,	BR_BCAST_FLOOD },
	};
	u8 operstate = netif_running(dev) ? dev->operstate : IF_OPER_DOWN;
	struct net_device *br_dev = netdev_master_upper_dev_get(dev);
	struct nlattr *br_afspec;
	struct nlattr *protinfo;
	struct ifinfomsg *ifm;
	struct nlmsghdr *nlh;
	unsigned int i;
	int err = 0;

	nlh = nlmsg_put(skb, pid, seq, RTM_NEWLINK, sizeof(*ifm), nlflags);
	if (!nlh)
		return -EMSGSIZE;

	ifm = nlmsg_data(nlh);
	ifm->ifi_family = AF_BRIDGE;
	ifm->__ifi_pad = 0;
	ifm->ifi_type = dev->type;
	ifm->ifi_index = dev->ifindex;
	ifm->ifi_flags = dev_get_flags(dev);
	ifm->ifi_change = 0;

	if (nla_put_string(skb, IFLA_IFNAME, dev->name) ||
	    nla_put_u32(skb, IFLA_MTU, dev->mtu) ||
	    nla_put_u8(skb, IFLA_OPERSTATE, operstate))
		goto nla_put_failure;

	if (br_dev && nla_put_u32(skb, IFLA_MASTER, br_dev->ifindex))
		goto nla_put_failure;

	if (dev->addr_len &&
	    nla_put(skb, IFLA_ADDRESS, dev->addr_len, dev->dev_addr))
		goto nla_put_failure;

	if (dev->ifindex != dev_get_iflink(dev) &&
	    nla_put_u32(skb, IFLA_LINK, dev_get_iflink(dev)))
		goto nla_put_failure;

	br_afspec = nla_nest_start_noflag(skb, IFLA_AF_SPEC);
	if (!br_afspec)
		goto nla_put_failure;

	if (nla_put_u16(skb, IFLA_BRIDGE_FLAGS, BRIDGE_FLAGS_SELF))
		goto cancel_afspec;

	if (mode != BRIDGE_MODE_UNDEF &&
	    nla_put_u16(skb, IFLA_BRIDGE_MODE, mode))
		goto cancel_afspec;

	if (vlan_fill) {
		err = vlan_fill(skb, dev, filter_mask);
		if (err)
			goto cancel_afspec;
	}
	nla_nest_end(skb, br_afspec);

	protinfo = nla_nest_start(skb, IFLA_PROTINFO);
	if (!protinfo)
		goto nla_put_failure;

	for (i = 0; i < ARRAY_SIZE(brport_flags); i++) {
		if (brport_nla_put_flag(skb, flags, mask,
					brport_flags[i].attr,
					brport_flags[i].flag)) {
			nla_nest_cancel(skb, protinfo);
			goto nla_put_failure;
		}
	}
	nla_nest_end(skb, protinfo);

	nlmsg_end(skb, nlh);
	return 0;

cancel_afspec:
	nla_nest_cancel(skb, br_afspec);
nla_put_failure:
	nlmsg_cancel(skb, nlh);
	return err ? err : -EMSGSIZE;
}
EXPORT_SYMBOL_GPL(ndo_dflt_bridge_getlink);
5272
/*
 * Validate a bridge link dump request and extract IFLA_EXT_MASK.
 *
 * With @strict_check the ifinfomsg header must be complete with every
 * field other than ifi_family zeroed, parsing is strict, and any attribute
 * other than IFLA_EXT_MASK is rejected.  Without it, other attributes are
 * silently ignored.
 *
 * Returns 0 or a negative errno.
 */
static int valid_bridge_getlink_req(const struct nlmsghdr *nlh,
				    bool strict_check, u32 *filter_mask,
				    struct netlink_ext_ack *extack)
{
	struct nlattr *tb[IFLA_MAX+1];
	int type;
	int err;

	if (strict_check) {
		struct ifinfomsg *ifm;

		if (nlh->nlmsg_len < nlmsg_msg_size(sizeof(*ifm))) {
			NL_SET_ERR_MSG(extack, "Invalid header for bridge link dump");
			return -EINVAL;
		}

		ifm = nlmsg_data(nlh);
		if (ifm->__ifi_pad || ifm->ifi_type || ifm->ifi_flags ||
		    ifm->ifi_change || ifm->ifi_index) {
			NL_SET_ERR_MSG(extack, "Invalid values in header for bridge link dump request");
			return -EINVAL;
		}

		err = nlmsg_parse_deprecated_strict(nlh,
						    sizeof(struct ifinfomsg),
						    tb, IFLA_MAX, ifla_policy,
						    extack);
	} else {
		err = nlmsg_parse_deprecated(nlh, sizeof(struct ifinfomsg),
					     tb, IFLA_MAX, ifla_policy,
					     extack);
	}
	if (err < 0)
		return err;

	/* new attributes should only be added with strict checking */
	for (type = 0; type <= IFLA_MAX; ++type) {
		if (!tb[type])
			continue;

		if (type == IFLA_EXT_MASK) {
			*filter_mask = nla_get_u32(tb[type]);
			continue;
		}

		if (strict_check) {
			NL_SET_ERR_MSG(extack, "Unsupported attribute in bridge link dump request");
			return -EINVAL;
		}
	}

	return 0;
}
5326
rtnl_bridge_getlink(struct sk_buff * skb,struct netlink_callback * cb)5327 static int rtnl_bridge_getlink(struct sk_buff *skb, struct netlink_callback *cb)
5328 {
5329 const struct nlmsghdr *nlh = cb->nlh;
5330 struct net *net = sock_net(skb->sk);
5331 struct net_device *dev;
5332 int idx = 0;
5333 u32 portid = NETLINK_CB(cb->skb).portid;
5334 u32 seq = nlh->nlmsg_seq;
5335 u32 filter_mask = 0;
5336 int err;
5337
5338 err = valid_bridge_getlink_req(nlh, cb->strict_check, &filter_mask,
5339 cb->extack);
5340 if (err < 0 && cb->strict_check)
5341 return err;
5342
5343 rcu_read_lock();
5344 for_each_netdev_rcu(net, dev) {
5345 const struct net_device_ops *ops = dev->netdev_ops;
5346 struct net_device *br_dev = netdev_master_upper_dev_get(dev);
5347
5348 if (br_dev && br_dev->netdev_ops->ndo_bridge_getlink) {
5349 if (idx >= cb->args[0]) {
5350 err = br_dev->netdev_ops->ndo_bridge_getlink(
5351 skb, portid, seq, dev,
5352 filter_mask, NLM_F_MULTI);
5353 if (err < 0 && err != -EOPNOTSUPP) {
5354 if (likely(skb->len))
5355 break;
5356
5357 goto out_err;
5358 }
5359 }
5360 idx++;
5361 }
5362
5363 if (ops->ndo_bridge_getlink) {
5364 if (idx >= cb->args[0]) {
5365 err = ops->ndo_bridge_getlink(skb, portid,
5366 seq, dev,
5367 filter_mask,
5368 NLM_F_MULTI);
5369 if (err < 0 && err != -EOPNOTSUPP) {
5370 if (likely(skb->len))
5371 break;
5372
5373 goto out_err;
5374 }
5375 }
5376 idx++;
5377 }
5378 }
5379 err = skb->len;
5380 out_err:
5381 rcu_read_unlock();
5382 cb->args[0] = idx;
5383
5384 return err;
5385 }
5386
bridge_nlmsg_size(void)5387 static inline size_t bridge_nlmsg_size(void)
5388 {
5389 return NLMSG_ALIGN(sizeof(struct ifinfomsg))
5390 + nla_total_size(IFNAMSIZ) /* IFLA_IFNAME */
5391 + nla_total_size(MAX_ADDR_LEN) /* IFLA_ADDRESS */
5392 + nla_total_size(sizeof(u32)) /* IFLA_MASTER */
5393 + nla_total_size(sizeof(u32)) /* IFLA_MTU */
5394 + nla_total_size(sizeof(u32)) /* IFLA_LINK */
5395 + nla_total_size(sizeof(u32)) /* IFLA_OPERSTATE */
5396 + nla_total_size(sizeof(u8)) /* IFLA_PROTINFO */
5397 + nla_total_size(sizeof(struct nlattr)) /* IFLA_AF_SPEC */
5398 + nla_total_size(sizeof(u16)) /* IFLA_BRIDGE_FLAGS */
5399 + nla_total_size(sizeof(u16)); /* IFLA_BRIDGE_MODE */
5400 }
5401
rtnl_bridge_notify(struct net_device * dev)5402 static int rtnl_bridge_notify(struct net_device *dev)
5403 {
5404 struct net *net = dev_net(dev);
5405 struct sk_buff *skb;
5406 int err = -EOPNOTSUPP;
5407
5408 if (!dev->netdev_ops->ndo_bridge_getlink)
5409 return 0;
5410
5411 skb = nlmsg_new(bridge_nlmsg_size(), GFP_ATOMIC);
5412 if (!skb) {
5413 err = -ENOMEM;
5414 goto errout;
5415 }
5416
5417 err = dev->netdev_ops->ndo_bridge_getlink(skb, 0, 0, dev, 0, 0);
5418 if (err < 0)
5419 goto errout;
5420
5421 /* Notification info is only filled for bridge ports, not the bridge
5422 * device itself. Therefore, a zero notification length is valid and
5423 * should not result in an error.
5424 */
5425 if (!skb->len)
5426 goto errout;
5427
5428 rtnl_notify(skb, net, 0, RTNLGRP_LINK, NULL, GFP_ATOMIC);
5429 return 0;
5430 errout:
5431 WARN_ON(err == -EMSGSIZE);
5432 kfree_skb(skb);
5433 if (err)
5434 rtnl_set_sk_err(net, RTNLGRP_LINK, err);
5435 return err;
5436 }
5437
/*
 * Handle a bridge "set link" request.
 *
 * The request must carry a struct ifinfomsg with ifi_family == AF_BRIDGE
 * and an ifi_index naming an existing device.  The first
 * IFLA_BRIDGE_FLAGS found inside IFLA_AF_SPEC selects the target:
 *   - no flags, or BRIDGE_FLAGS_MASTER: the master device's
 *     ndo_bridge_setlink() is called;
 *   - BRIDGE_FLAGS_SELF: the device's own ndo_bridge_setlink() is called
 *     and, on success, a notification is generated.
 * Each flag is cleared once its target succeeded, and the remaining flags
 * are written back into the request's IFLA_BRIDGE_FLAGS attribute.
 *
 * Returns 0 on success or a negative errno (-EINVAL for a short message or
 * attribute, -EPFNOSUPPORT for a wrong family, -ENODEV for an unknown
 * ifindex, -EOPNOTSUPP when the needed callback is missing, or whatever
 * the callback / rtnl_bridge_notify() returned).
 */
static int rtnl_bridge_setlink(struct sk_buff *skb, struct nlmsghdr *nlh,
			       struct netlink_ext_ack *extack)
{
	struct net *net = sock_net(skb->sk);
	struct ifinfomsg *ifm;
	struct net_device *dev;
	struct nlattr *br_spec, *attr, *br_flags_attr = NULL;
	int rem, err = -EOPNOTSUPP;
	u16 flags = 0;

	if (nlmsg_len(nlh) < sizeof(*ifm))
		return -EINVAL;

	ifm = nlmsg_data(nlh);
	if (ifm->ifi_family != AF_BRIDGE)
		return -EPFNOSUPPORT;

	dev = __dev_get_by_index(net, ifm->ifi_index);
	if (!dev) {
		NL_SET_ERR_MSG(extack, "unknown ifindex");
		return -ENODEV;
	}

	br_spec = nlmsg_find_attr(nlh, sizeof(struct ifinfomsg), IFLA_AF_SPEC);
	if (br_spec) {
		nla_for_each_nested(attr, br_spec, rem) {
			/* Only the first IFLA_BRIDGE_FLAGS is honoured. */
			if (nla_type(attr) == IFLA_BRIDGE_FLAGS && !br_flags_attr) {
				if (nla_len(attr) < sizeof(flags))
					return -EINVAL;

				br_flags_attr = attr;
				flags = nla_get_u16(attr);
			}

			/* IFLA_BRIDGE_MODE is only length-checked here. */
			if (nla_type(attr) == IFLA_BRIDGE_MODE) {
				if (nla_len(attr) < sizeof(u16))
					return -EINVAL;
			}
		}
	}

	/* No flags at all is treated like BRIDGE_FLAGS_MASTER. */
	if (!flags || (flags & BRIDGE_FLAGS_MASTER)) {
		struct net_device *br_dev = netdev_master_upper_dev_get(dev);

		if (!br_dev || !br_dev->netdev_ops->ndo_bridge_setlink) {
			err = -EOPNOTSUPP;
			goto out;
		}

		err = br_dev->netdev_ops->ndo_bridge_setlink(dev, nlh, flags,
							     extack);
		if (err)
			goto out;

		flags &= ~BRIDGE_FLAGS_MASTER;
	}

	if ((flags & BRIDGE_FLAGS_SELF)) {
		if (!dev->netdev_ops->ndo_bridge_setlink)
			err = -EOPNOTSUPP;
		else
			err = dev->netdev_ops->ndo_bridge_setlink(dev, nlh,
								  flags,
								  extack);
		if (!err) {
			flags &= ~BRIDGE_FLAGS_SELF;

			/* Generate event to notify upper layer of bridge
			 * change
			 */
			err = rtnl_bridge_notify(dev);
		}
	}

	/* Write the not-yet-handled flags back into the request message. */
	if (br_flags_attr)
		memcpy(nla_data(br_flags_attr), &flags, sizeof(flags));
out:
	return err;
}
5517
/*
 * Handle a bridge "delete link" request.
 *
 * Mirrors rtnl_bridge_setlink(): the request must carry a struct ifinfomsg
 * with ifi_family == AF_BRIDGE and a valid ifi_index.  The first
 * IFLA_BRIDGE_FLAGS inside IFLA_AF_SPEC selects whether the master's
 * ndo_bridge_dellink() (no flags or BRIDGE_FLAGS_MASTER) and/or the
 * device's own ndo_bridge_dellink() (BRIDGE_FLAGS_SELF) is called.  Flags
 * are cleared as their target succeeds and the remainder is written back
 * into the request's attribute.
 *
 * Returns 0 on success or a negative errno.
 */
static int rtnl_bridge_dellink(struct sk_buff *skb, struct nlmsghdr *nlh,
			       struct netlink_ext_ack *extack)
{
	struct net *net = sock_net(skb->sk);
	struct ifinfomsg *ifm;
	struct net_device *dev;
	struct nlattr *br_spec, *attr = NULL;
	int rem, err = -EOPNOTSUPP;
	u16 flags = 0;
	bool have_flags = false;

	if (nlmsg_len(nlh) < sizeof(*ifm))
		return -EINVAL;

	ifm = nlmsg_data(nlh);
	if (ifm->ifi_family != AF_BRIDGE)
		return -EPFNOSUPPORT;

	dev = __dev_get_by_index(net, ifm->ifi_index);
	if (!dev) {
		NL_SET_ERR_MSG(extack, "unknown ifindex");
		return -ENODEV;
	}

	br_spec = nlmsg_find_attr(nlh, sizeof(struct ifinfomsg), IFLA_AF_SPEC);
	if (br_spec) {
		/* Stop at the first IFLA_BRIDGE_FLAGS; @attr is reused for
		 * the write-back at the end of the function.
		 */
		nla_for_each_nested_type(attr, IFLA_BRIDGE_FLAGS, br_spec,
					 rem) {
			if (nla_len(attr) < sizeof(flags))
				return -EINVAL;

			have_flags = true;
			flags = nla_get_u16(attr);
			break;
		}
	}

	/* No flags at all is treated like BRIDGE_FLAGS_MASTER. */
	if (!flags || (flags & BRIDGE_FLAGS_MASTER)) {
		struct net_device *br_dev = netdev_master_upper_dev_get(dev);

		if (!br_dev || !br_dev->netdev_ops->ndo_bridge_dellink) {
			err = -EOPNOTSUPP;
			goto out;
		}

		err = br_dev->netdev_ops->ndo_bridge_dellink(dev, nlh, flags);
		if (err)
			goto out;

		flags &= ~BRIDGE_FLAGS_MASTER;
	}

	if ((flags & BRIDGE_FLAGS_SELF)) {
		if (!dev->netdev_ops->ndo_bridge_dellink)
			err = -EOPNOTSUPP;
		else
			err = dev->netdev_ops->ndo_bridge_dellink(dev, nlh,
								  flags);

		if (!err) {
			flags &= ~BRIDGE_FLAGS_SELF;

			/* Generate event to notify upper layer of bridge
			 * change
			 */
			err = rtnl_bridge_notify(dev);
		}
	}

	/* have_flags is only set right before the break above, so @attr is
	 * the matched IFLA_BRIDGE_FLAGS attribute here.
	 */
	if (have_flags)
		memcpy(nla_data(attr), &flags, sizeof(flags));
out:
	return err;
}
5592
/*
 * Should stats attribute @attrid be processed?
 *
 * It must be selected in @mask, and @idxattr must either be 0 or name this
 * very attribute.
 */
static bool stats_attr_valid(unsigned int mask, int attrid, int idxattr)
{
	if (!(mask & IFLA_STATS_FILTER_BIT(attrid)))
		return false;

	return idxattr == 0 || idxattr == attrid;
}
5598
5599 static bool
rtnl_offload_xstats_have_ndo(const struct net_device * dev,int attr_id)5600 rtnl_offload_xstats_have_ndo(const struct net_device *dev, int attr_id)
5601 {
5602 return dev->netdev_ops &&
5603 dev->netdev_ops->ndo_has_offload_stats &&
5604 dev->netdev_ops->ndo_get_offload_stats &&
5605 dev->netdev_ops->ndo_has_offload_stats(dev, attr_id);
5606 }
5607
5608 static unsigned int
rtnl_offload_xstats_get_size_ndo(const struct net_device * dev,int attr_id)5609 rtnl_offload_xstats_get_size_ndo(const struct net_device *dev, int attr_id)
5610 {
5611 return rtnl_offload_xstats_have_ndo(dev, attr_id) ?
5612 sizeof(struct rtnl_link_stats64) : 0;
5613 }
5614
5615 static int
rtnl_offload_xstats_fill_ndo(struct net_device * dev,int attr_id,struct sk_buff * skb)5616 rtnl_offload_xstats_fill_ndo(struct net_device *dev, int attr_id,
5617 struct sk_buff *skb)
5618 {
5619 unsigned int size = rtnl_offload_xstats_get_size_ndo(dev, attr_id);
5620 struct nlattr *attr = NULL;
5621 void *attr_data;
5622 int err;
5623
5624 if (!size)
5625 return -ENODATA;
5626
5627 attr = nla_reserve_64bit(skb, attr_id, size,
5628 IFLA_OFFLOAD_XSTATS_UNSPEC);
5629 if (!attr)
5630 return -EMSGSIZE;
5631
5632 attr_data = nla_data(attr);
5633 memset(attr_data, 0, size);
5634
5635 err = dev->netdev_ops->ndo_get_offload_stats(attr_id, dev, attr_data);
5636 if (err)
5637 return err;
5638
5639 return 0;
5640 }
5641
5642 static unsigned int
rtnl_offload_xstats_get_size_stats(const struct net_device * dev,enum netdev_offload_xstats_type type)5643 rtnl_offload_xstats_get_size_stats(const struct net_device *dev,
5644 enum netdev_offload_xstats_type type)
5645 {
5646 bool enabled = netdev_offload_xstats_enabled(dev, type);
5647
5648 return enabled ? sizeof(struct rtnl_hw_stats64) : 0;
5649 }
5650
/*
 * Request/usage state of one offload xstats type, filled in by
 * rtnl_offload_xstats_get_stats() and emitted as a pair of u8 attributes
 * by rtnl_offload_xstats_fill_hw_s_info_one().
 */
struct rtnl_offload_xstats_request_used {
	/* Result of netdev_offload_xstats_enabled() for the type. */
	bool request;
	/* "used" value reported by netdev_offload_xstats_get(); false when
	 * the type is not enabled.
	 */
	bool used;
};
5655
5656 static int
rtnl_offload_xstats_get_stats(struct net_device * dev,enum netdev_offload_xstats_type type,struct rtnl_offload_xstats_request_used * ru,struct rtnl_hw_stats64 * stats,struct netlink_ext_ack * extack)5657 rtnl_offload_xstats_get_stats(struct net_device *dev,
5658 enum netdev_offload_xstats_type type,
5659 struct rtnl_offload_xstats_request_used *ru,
5660 struct rtnl_hw_stats64 *stats,
5661 struct netlink_ext_ack *extack)
5662 {
5663 bool request;
5664 bool used;
5665 int err;
5666
5667 request = netdev_offload_xstats_enabled(dev, type);
5668 if (!request) {
5669 used = false;
5670 goto out;
5671 }
5672
5673 err = netdev_offload_xstats_get(dev, type, stats, &used, extack);
5674 if (err)
5675 return err;
5676
5677 out:
5678 if (ru) {
5679 ru->request = request;
5680 ru->used = used;
5681 }
5682 return 0;
5683 }
5684
5685 static int
rtnl_offload_xstats_fill_hw_s_info_one(struct sk_buff * skb,int attr_id,struct rtnl_offload_xstats_request_used * ru)5686 rtnl_offload_xstats_fill_hw_s_info_one(struct sk_buff *skb, int attr_id,
5687 struct rtnl_offload_xstats_request_used *ru)
5688 {
5689 struct nlattr *nest;
5690
5691 nest = nla_nest_start(skb, attr_id);
5692 if (!nest)
5693 return -EMSGSIZE;
5694
5695 if (nla_put_u8(skb, IFLA_OFFLOAD_XSTATS_HW_S_INFO_REQUEST, ru->request))
5696 goto nla_put_failure;
5697
5698 if (nla_put_u8(skb, IFLA_OFFLOAD_XSTATS_HW_S_INFO_USED, ru->used))
5699 goto nla_put_failure;
5700
5701 nla_nest_end(skb, nest);
5702 return 0;
5703
5704 nla_put_failure:
5705 nla_nest_cancel(skb, nest);
5706 return -EMSGSIZE;
5707 }
5708
5709 static int
rtnl_offload_xstats_fill_hw_s_info(struct sk_buff * skb,struct net_device * dev,struct netlink_ext_ack * extack)5710 rtnl_offload_xstats_fill_hw_s_info(struct sk_buff *skb, struct net_device *dev,
5711 struct netlink_ext_ack *extack)
5712 {
5713 enum netdev_offload_xstats_type t_l3 = NETDEV_OFFLOAD_XSTATS_TYPE_L3;
5714 struct rtnl_offload_xstats_request_used ru_l3;
5715 struct nlattr *nest;
5716 int err;
5717
5718 err = rtnl_offload_xstats_get_stats(dev, t_l3, &ru_l3, NULL, extack);
5719 if (err)
5720 return err;
5721
5722 nest = nla_nest_start(skb, IFLA_OFFLOAD_XSTATS_HW_S_INFO);
5723 if (!nest)
5724 return -EMSGSIZE;
5725
5726 if (rtnl_offload_xstats_fill_hw_s_info_one(skb,
5727 IFLA_OFFLOAD_XSTATS_L3_STATS,
5728 &ru_l3))
5729 goto nla_put_failure;
5730
5731 nla_nest_end(skb, nest);
5732 return 0;
5733
5734 nla_put_failure:
5735 nla_nest_cancel(skb, nest);
5736 return -EMSGSIZE;
5737 }
5738
/*
 * Fill the contents of the IFLA_STATS_LINK_OFFLOAD_XSTATS nest for @dev.
 *
 * Three sub-attributes are handled in order: CPU_HIT, HW_S_INFO and
 * L3_STATS.  Each one is attempted only if its bit is set in
 * @off_filter_mask and *@prividx is not past its attribute id.  When a
 * sub-attribute fails, *@prividx is left at that attribute's id and the
 * error is returned; on overall success *@prividx is reset to 0.
 *
 * Returns 0 if at least one sub-attribute was written, -ENODATA if none
 * was, or another negative errno on failure.
 */
static int rtnl_offload_xstats_fill(struct sk_buff *skb, struct net_device *dev,
				    int *prividx, u32 off_filter_mask,
				    struct netlink_ext_ack *extack)
{
	enum netdev_offload_xstats_type t_l3 = NETDEV_OFFLOAD_XSTATS_TYPE_L3;
	int attr_id_hw_s_info = IFLA_OFFLOAD_XSTATS_HW_S_INFO;
	int attr_id_l3_stats = IFLA_OFFLOAD_XSTATS_L3_STATS;
	int attr_id_cpu_hit = IFLA_OFFLOAD_XSTATS_CPU_HIT;
	bool have_data = false;
	int err;

	if (*prividx <= attr_id_cpu_hit &&
	    (off_filter_mask &
	     IFLA_STATS_FILTER_BIT(attr_id_cpu_hit))) {
		err = rtnl_offload_xstats_fill_ndo(dev, attr_id_cpu_hit, skb);
		if (!err) {
			have_data = true;
		} else if (err != -ENODATA) {
			/* -ENODATA just means the device has no such stats. */
			*prividx = attr_id_cpu_hit;
			return err;
		}
	}

	if (*prividx <= attr_id_hw_s_info &&
	    (off_filter_mask & IFLA_STATS_FILTER_BIT(attr_id_hw_s_info))) {
		/* Mark the position first so an early return leaves it set. */
		*prividx = attr_id_hw_s_info;

		err = rtnl_offload_xstats_fill_hw_s_info(skb, dev, extack);
		if (err)
			return err;

		have_data = true;
		*prividx = 0;
	}

	if (*prividx <= attr_id_l3_stats &&
	    (off_filter_mask & IFLA_STATS_FILTER_BIT(attr_id_l3_stats))) {
		unsigned int size_l3;
		struct nlattr *attr;

		*prividx = attr_id_l3_stats;

		/* A zero size means L3 stats are not enabled on @dev. */
		size_l3 = rtnl_offload_xstats_get_size_stats(dev, t_l3);
		if (!size_l3)
			goto skip_l3_stats;
		attr = nla_reserve_64bit(skb, attr_id_l3_stats, size_l3,
					 IFLA_OFFLOAD_XSTATS_UNSPEC);
		if (!attr)
			return -EMSGSIZE;

		/* The stats are written straight into the reserved payload. */
		err = rtnl_offload_xstats_get_stats(dev, t_l3, NULL,
						    nla_data(attr), extack);
		if (err)
			return err;

		have_data = true;
skip_l3_stats:
		*prividx = 0;
	}

	if (!have_data)
		return -ENODATA;

	*prividx = 0;
	return 0;
}
5805
5806 static unsigned int
rtnl_offload_xstats_get_size_hw_s_info_one(const struct net_device * dev,enum netdev_offload_xstats_type type)5807 rtnl_offload_xstats_get_size_hw_s_info_one(const struct net_device *dev,
5808 enum netdev_offload_xstats_type type)
5809 {
5810 return nla_total_size(0) +
5811 /* IFLA_OFFLOAD_XSTATS_HW_S_INFO_REQUEST */
5812 nla_total_size(sizeof(u8)) +
5813 /* IFLA_OFFLOAD_XSTATS_HW_S_INFO_USED */
5814 nla_total_size(sizeof(u8)) +
5815 0;
5816 }
5817
5818 static unsigned int
rtnl_offload_xstats_get_size_hw_s_info(const struct net_device * dev)5819 rtnl_offload_xstats_get_size_hw_s_info(const struct net_device *dev)
5820 {
5821 enum netdev_offload_xstats_type t_l3 = NETDEV_OFFLOAD_XSTATS_TYPE_L3;
5822
5823 return nla_total_size(0) +
5824 /* IFLA_OFFLOAD_XSTATS_L3_STATS */
5825 rtnl_offload_xstats_get_size_hw_s_info_one(dev, t_l3) +
5826 0;
5827 }
5828
/*
 * Space needed for the IFLA_STATS_LINK_OFFLOAD_XSTATS nest of @dev, given
 * which sub-attributes are selected in @off_filter_mask.  Returns 0 when
 * nothing is selected.
 */
static int rtnl_offload_xstats_get_size(const struct net_device *dev,
					u32 off_filter_mask)
{
	int total = 0;
	int payload;

	if (off_filter_mask &
	    IFLA_STATS_FILTER_BIT(IFLA_OFFLOAD_XSTATS_CPU_HIT)) {
		payload = rtnl_offload_xstats_get_size_ndo(dev,
						IFLA_OFFLOAD_XSTATS_CPU_HIT);
		total += nla_total_size_64bit(payload);
	}

	if (off_filter_mask &
	    IFLA_STATS_FILTER_BIT(IFLA_OFFLOAD_XSTATS_HW_S_INFO))
		total += rtnl_offload_xstats_get_size_hw_s_info(dev);

	if (off_filter_mask &
	    IFLA_STATS_FILTER_BIT(IFLA_OFFLOAD_XSTATS_L3_STATS)) {
		payload = rtnl_offload_xstats_get_size_stats(dev,
						NETDEV_OFFLOAD_XSTATS_TYPE_L3);
		total += nla_total_size_64bit(payload);
	}

	/* Only account for the enclosing nest when something goes in it. */
	if (!total)
		return 0;

	return total + nla_total_size(0);
}
5858
/*
 * Attribute selection used when sizing and filling stats messages.
 * rtnl_stats_get_parse() sets mask[0] from the request header and defaults
 * every other entry to all-ones before applying user-supplied filters.
 */
struct rtnl_stats_dump_filters {
	/* mask[0] filters outer attributes. Then individual nests have their
	 * filtering mask at the index of the nested attribute.
	 */
	u32 mask[IFLA_STATS_MAX + 1];
};
5865
/*
 * Append one stats message of @type for @dev to @skb.
 *
 * @filters selects which top-level attributes (mask[0]) and which
 * offload xstats sub-attributes are emitted.  *@idxattr and *@prividx are
 * in/out cursors: *@idxattr is set to the attribute being filled and
 * cleared once it is complete, and *@prividx is handed to the per-attribute
 * fill callbacks.
 *
 * On failure the message is cancelled, except for NLM_F_MULTI messages
 * where *@prividx moved during this call: those are finalized with the
 * attributes written so far.
 *
 * Must be called with RTNL held.  Returns 0 on success or a negative errno.
 */
static int rtnl_fill_statsinfo(struct sk_buff *skb, struct net_device *dev,
			       int type, u32 pid, u32 seq, u32 change,
			       unsigned int flags,
			       const struct rtnl_stats_dump_filters *filters,
			       int *idxattr, int *prividx,
			       struct netlink_ext_ack *extack)
{
	unsigned int filter_mask = filters->mask[0];
	struct if_stats_msg *ifsm;
	struct nlmsghdr *nlh;
	struct nlattr *attr;
	/* Snapshot used in the error path to detect whether any progress
	 * was made during this call.
	 */
	int s_prividx = *prividx;
	int err;

	ASSERT_RTNL();

	nlh = nlmsg_put(skb, pid, seq, type, sizeof(*ifsm), flags);
	if (!nlh)
		return -EMSGSIZE;

	ifsm = nlmsg_data(nlh);
	ifsm->family = PF_UNSPEC;
	ifsm->pad1 = 0;
	ifsm->pad2 = 0;
	ifsm->ifindex = dev->ifindex;
	ifsm->filter_mask = filter_mask;

	/* Generic 64-bit link counters. */
	if (stats_attr_valid(filter_mask, IFLA_STATS_LINK_64, *idxattr)) {
		struct rtnl_link_stats64 *sp;

		attr = nla_reserve_64bit(skb, IFLA_STATS_LINK_64,
					 sizeof(struct rtnl_link_stats64),
					 IFLA_STATS_UNSPEC);
		if (!attr) {
			err = -EMSGSIZE;
			goto nla_put_failure;
		}

		sp = nla_data(attr);
		dev_get_stats(dev, sp);
	}

	/* Extended stats provided by the device's own link type. */
	if (stats_attr_valid(filter_mask, IFLA_STATS_LINK_XSTATS, *idxattr)) {
		const struct rtnl_link_ops *ops = dev->rtnl_link_ops;

		if (ops && ops->fill_linkxstats) {
			*idxattr = IFLA_STATS_LINK_XSTATS;
			attr = nla_nest_start_noflag(skb,
						     IFLA_STATS_LINK_XSTATS);
			if (!attr) {
				err = -EMSGSIZE;
				goto nla_put_failure;
			}

			err = ops->fill_linkxstats(skb, dev, prividx, *idxattr);
			/* The nest is closed even on error so that a partial
			 * message can still be finalized below.
			 */
			nla_nest_end(skb, attr);
			if (err)
				goto nla_put_failure;
			*idxattr = 0;
		}
	}

	/* Extended stats provided by the master's link type for this port. */
	if (stats_attr_valid(filter_mask, IFLA_STATS_LINK_XSTATS_SLAVE,
			     *idxattr)) {
		const struct rtnl_link_ops *ops = NULL;
		const struct net_device *master;

		master = netdev_master_upper_dev_get(dev);
		if (master)
			ops = master->rtnl_link_ops;
		if (ops && ops->fill_linkxstats) {
			*idxattr = IFLA_STATS_LINK_XSTATS_SLAVE;
			attr = nla_nest_start_noflag(skb,
						     IFLA_STATS_LINK_XSTATS_SLAVE);
			if (!attr) {
				err = -EMSGSIZE;
				goto nla_put_failure;
			}

			err = ops->fill_linkxstats(skb, dev, prividx, *idxattr);
			nla_nest_end(skb, attr);
			if (err)
				goto nla_put_failure;
			*idxattr = 0;
		}
	}

	/* Offload xstats, filtered by the per-nest mask. */
	if (stats_attr_valid(filter_mask, IFLA_STATS_LINK_OFFLOAD_XSTATS,
			     *idxattr)) {
		u32 off_filter_mask;

		off_filter_mask = filters->mask[IFLA_STATS_LINK_OFFLOAD_XSTATS];
		*idxattr = IFLA_STATS_LINK_OFFLOAD_XSTATS;
		attr = nla_nest_start_noflag(skb,
					     IFLA_STATS_LINK_OFFLOAD_XSTATS);
		if (!attr) {
			err = -EMSGSIZE;
			goto nla_put_failure;
		}

		err = rtnl_offload_xstats_fill(skb, dev, prividx,
					       off_filter_mask, extack);
		/* -ENODATA: nothing was written, so drop the empty nest. */
		if (err == -ENODATA)
			nla_nest_cancel(skb, attr);
		else
			nla_nest_end(skb, attr);

		if (err && err != -ENODATA)
			goto nla_put_failure;
		*idxattr = 0;
	}

	/* Per-address-family stats, one nested attribute per family. */
	if (stats_attr_valid(filter_mask, IFLA_STATS_AF_SPEC, *idxattr)) {
		struct rtnl_af_ops *af_ops;

		*idxattr = IFLA_STATS_AF_SPEC;
		attr = nla_nest_start_noflag(skb, IFLA_STATS_AF_SPEC);
		if (!attr) {
			err = -EMSGSIZE;
			goto nla_put_failure;
		}

		rcu_read_lock();
		list_for_each_entry_rcu(af_ops, &rtnl_af_ops, list) {
			if (af_ops->fill_stats_af) {
				struct nlattr *af;

				af = nla_nest_start_noflag(skb,
							   af_ops->family);
				if (!af) {
					rcu_read_unlock();
					err = -EMSGSIZE;
					goto nla_put_failure;
				}
				err = af_ops->fill_stats_af(skb, dev);

				if (err == -ENODATA) {
					nla_nest_cancel(skb, af);
				} else if (err < 0) {
					rcu_read_unlock();
					goto nla_put_failure;
				}

				/* NOTE(review): this is also reached right
				 * after nla_nest_cancel() above - confirm
				 * that ending a cancelled nest is harmless.
				 */
				nla_nest_end(skb, af);
			}
		}
		rcu_read_unlock();

		nla_nest_end(skb, attr);

		*idxattr = 0;
	}

	nlmsg_end(skb, nlh);

	return 0;

nla_put_failure:
	/* not a multi message or no progress mean a real error */
	if (!(flags & NLM_F_MULTI) || s_prividx == *prividx)
		nlmsg_cancel(skb, nlh);
	else
		nlmsg_end(skb, nlh);

	return err;
}
6032
if_nlmsg_stats_size(const struct net_device * dev,const struct rtnl_stats_dump_filters * filters)6033 static size_t if_nlmsg_stats_size(const struct net_device *dev,
6034 const struct rtnl_stats_dump_filters *filters)
6035 {
6036 size_t size = NLMSG_ALIGN(sizeof(struct if_stats_msg));
6037 unsigned int filter_mask = filters->mask[0];
6038
6039 if (stats_attr_valid(filter_mask, IFLA_STATS_LINK_64, 0))
6040 size += nla_total_size_64bit(sizeof(struct rtnl_link_stats64));
6041
6042 if (stats_attr_valid(filter_mask, IFLA_STATS_LINK_XSTATS, 0)) {
6043 const struct rtnl_link_ops *ops = dev->rtnl_link_ops;
6044 int attr = IFLA_STATS_LINK_XSTATS;
6045
6046 if (ops && ops->get_linkxstats_size) {
6047 size += nla_total_size(ops->get_linkxstats_size(dev,
6048 attr));
6049 /* for IFLA_STATS_LINK_XSTATS */
6050 size += nla_total_size(0);
6051 }
6052 }
6053
6054 if (stats_attr_valid(filter_mask, IFLA_STATS_LINK_XSTATS_SLAVE, 0)) {
6055 struct net_device *_dev = (struct net_device *)dev;
6056 const struct rtnl_link_ops *ops = NULL;
6057 const struct net_device *master;
6058
6059 /* netdev_master_upper_dev_get can't take const */
6060 master = netdev_master_upper_dev_get(_dev);
6061 if (master)
6062 ops = master->rtnl_link_ops;
6063 if (ops && ops->get_linkxstats_size) {
6064 int attr = IFLA_STATS_LINK_XSTATS_SLAVE;
6065
6066 size += nla_total_size(ops->get_linkxstats_size(dev,
6067 attr));
6068 /* for IFLA_STATS_LINK_XSTATS_SLAVE */
6069 size += nla_total_size(0);
6070 }
6071 }
6072
6073 if (stats_attr_valid(filter_mask, IFLA_STATS_LINK_OFFLOAD_XSTATS, 0)) {
6074 u32 off_filter_mask;
6075
6076 off_filter_mask = filters->mask[IFLA_STATS_LINK_OFFLOAD_XSTATS];
6077 size += rtnl_offload_xstats_get_size(dev, off_filter_mask);
6078 }
6079
6080 if (stats_attr_valid(filter_mask, IFLA_STATS_AF_SPEC, 0)) {
6081 struct rtnl_af_ops *af_ops;
6082
6083 /* for IFLA_STATS_AF_SPEC */
6084 size += nla_total_size(0);
6085
6086 rcu_read_lock();
6087 list_for_each_entry_rcu(af_ops, &rtnl_af_ops, list) {
6088 if (af_ops->get_stats_af_size) {
6089 size += nla_total_size(
6090 af_ops->get_stats_af_size(dev));
6091
6092 /* for AF_* */
6093 size += nla_total_size(0);
6094 }
6095 }
6096 rcu_read_unlock();
6097 }
6098
6099 return size;
6100 }
6101
/* Bitmask with the low __IFLA_OFFLOAD_XSTATS_MAX bits set; used below as
 * the set of bits a user may pass in the offload xstats filter.
 */
#define RTNL_STATS_OFFLOAD_XSTATS_VALID ((1 << __IFLA_OFFLOAD_XSTATS_MAX) - 1)

/* Policy for the attributes nested inside IFLA_STATS_GET_FILTERS: only a
 * u32 mask for IFLA_STATS_LINK_OFFLOAD_XSTATS is described.
 */
static const struct nla_policy
rtnl_stats_get_policy_filters[IFLA_STATS_MAX + 1] = {
	[IFLA_STATS_LINK_OFFLOAD_XSTATS] =
		    NLA_POLICY_MASK(NLA_U32, RTNL_STATS_OFFLOAD_XSTATS_VALID),
};

/* Top-level policy used by rtnl_stats_get_parse() for stats get/dump. */
static const struct nla_policy
rtnl_stats_get_policy[IFLA_STATS_GETSET_MAX + 1] = {
	[IFLA_STATS_GET_FILTERS] =
		    NLA_POLICY_NESTED(rtnl_stats_get_policy_filters),
};

/* Top-level policy used by rtnl_stats_set(): the L3 stats toggle is a u8
 * limited to 0 or 1.
 */
static const struct nla_policy
ifla_stats_set_policy[IFLA_STATS_GETSET_MAX + 1] = {
	[IFLA_STATS_SET_OFFLOAD_XSTATS_L3_STATS] = NLA_POLICY_MAX(NLA_U8, 1),
};
6120
rtnl_stats_get_parse_filters(struct nlattr * ifla_filters,struct rtnl_stats_dump_filters * filters,struct netlink_ext_ack * extack)6121 static int rtnl_stats_get_parse_filters(struct nlattr *ifla_filters,
6122 struct rtnl_stats_dump_filters *filters,
6123 struct netlink_ext_ack *extack)
6124 {
6125 struct nlattr *tb[IFLA_STATS_MAX + 1];
6126 int err;
6127 int at;
6128
6129 err = nla_parse_nested(tb, IFLA_STATS_MAX, ifla_filters,
6130 rtnl_stats_get_policy_filters, extack);
6131 if (err < 0)
6132 return err;
6133
6134 for (at = 1; at <= IFLA_STATS_MAX; at++) {
6135 if (tb[at]) {
6136 if (!(filters->mask[0] & IFLA_STATS_FILTER_BIT(at))) {
6137 NL_SET_ERR_MSG(extack, "Filtered attribute not enabled in filter_mask");
6138 return -EINVAL;
6139 }
6140 filters->mask[at] = nla_get_u32(tb[at]);
6141 }
6142 }
6143
6144 return 0;
6145 }
6146
/*
 * Initialize @filters from a stats get/dump request.
 *
 * mask[0] is taken from @filter_mask and every per-nest mask starts out as
 * all-ones; an IFLA_STATS_GET_FILTERS attribute, when present, then
 * narrows the per-nest masks.
 *
 * Returns 0 on success or a negative errno.
 */
static int rtnl_stats_get_parse(const struct nlmsghdr *nlh,
				u32 filter_mask,
				struct rtnl_stats_dump_filters *filters,
				struct netlink_ext_ack *extack)
{
	struct nlattr *attrs[IFLA_STATS_GETSET_MAX + 1];
	int slot;
	int ret;

	filters->mask[0] = filter_mask;
	for (slot = 1; slot < ARRAY_SIZE(filters->mask); slot++)
		filters->mask[slot] = -1U;

	ret = nlmsg_parse(nlh, sizeof(struct if_stats_msg), attrs,
			  IFLA_STATS_GETSET_MAX, rtnl_stats_get_policy, extack);
	if (ret < 0)
		return ret;

	if (!attrs[IFLA_STATS_GET_FILTERS])
		return 0;

	return rtnl_stats_get_parse_filters(attrs[IFLA_STATS_GET_FILTERS],
					    filters, extack);
}
6174
rtnl_valid_stats_req(const struct nlmsghdr * nlh,bool strict_check,bool is_dump,struct netlink_ext_ack * extack)6175 static int rtnl_valid_stats_req(const struct nlmsghdr *nlh, bool strict_check,
6176 bool is_dump, struct netlink_ext_ack *extack)
6177 {
6178 struct if_stats_msg *ifsm;
6179
6180 if (nlh->nlmsg_len < nlmsg_msg_size(sizeof(*ifsm))) {
6181 NL_SET_ERR_MSG(extack, "Invalid header for stats dump");
6182 return -EINVAL;
6183 }
6184
6185 if (!strict_check)
6186 return 0;
6187
6188 ifsm = nlmsg_data(nlh);
6189
6190 /* only requests using strict checks can pass data to influence
6191 * the dump. The legacy exception is filter_mask.
6192 */
6193 if (ifsm->pad1 || ifsm->pad2 || (is_dump && ifsm->ifindex)) {
6194 NL_SET_ERR_MSG(extack, "Invalid values in header for stats dump request");
6195 return -EINVAL;
6196 }
6197 if (ifsm->filter_mask >= IFLA_STATS_FILTER_BIT(IFLA_STATS_MAX + 1)) {
6198 NL_SET_ERR_MSG(extack, "Invalid stats requested through filter mask");
6199 return -EINVAL;
6200 }
6201
6202 return 0;
6203 }
6204
rtnl_stats_get(struct sk_buff * skb,struct nlmsghdr * nlh,struct netlink_ext_ack * extack)6205 static int rtnl_stats_get(struct sk_buff *skb, struct nlmsghdr *nlh,
6206 struct netlink_ext_ack *extack)
6207 {
6208 struct rtnl_stats_dump_filters filters;
6209 struct net *net = sock_net(skb->sk);
6210 struct net_device *dev = NULL;
6211 int idxattr = 0, prividx = 0;
6212 struct if_stats_msg *ifsm;
6213 struct sk_buff *nskb;
6214 int err;
6215
6216 err = rtnl_valid_stats_req(nlh, netlink_strict_get_check(skb),
6217 false, extack);
6218 if (err)
6219 return err;
6220
6221 ifsm = nlmsg_data(nlh);
6222 if (ifsm->ifindex > 0)
6223 dev = __dev_get_by_index(net, ifsm->ifindex);
6224 else
6225 return -EINVAL;
6226
6227 if (!dev)
6228 return -ENODEV;
6229
6230 if (!ifsm->filter_mask) {
6231 NL_SET_ERR_MSG(extack, "Filter mask must be set for stats get");
6232 return -EINVAL;
6233 }
6234
6235 err = rtnl_stats_get_parse(nlh, ifsm->filter_mask, &filters, extack);
6236 if (err)
6237 return err;
6238
6239 nskb = nlmsg_new(if_nlmsg_stats_size(dev, &filters), GFP_KERNEL);
6240 if (!nskb)
6241 return -ENOBUFS;
6242
6243 err = rtnl_fill_statsinfo(nskb, dev, RTM_NEWSTATS,
6244 NETLINK_CB(skb).portid, nlh->nlmsg_seq, 0,
6245 0, &filters, &idxattr, &prividx, extack);
6246 if (err < 0) {
6247 /* -EMSGSIZE implies BUG in if_nlmsg_stats_size */
6248 WARN_ON(err == -EMSGSIZE);
6249 kfree_skb(nskb);
6250 } else {
6251 err = rtnl_unicast(nskb, net, NETLINK_CB(skb).portid);
6252 }
6253
6254 return err;
6255 }
6256
rtnl_stats_dump(struct sk_buff * skb,struct netlink_callback * cb)6257 static int rtnl_stats_dump(struct sk_buff *skb, struct netlink_callback *cb)
6258 {
6259 struct netlink_ext_ack *extack = cb->extack;
6260 struct rtnl_stats_dump_filters filters;
6261 struct net *net = sock_net(skb->sk);
6262 unsigned int flags = NLM_F_MULTI;
6263 struct if_stats_msg *ifsm;
6264 struct {
6265 unsigned long ifindex;
6266 int idxattr;
6267 int prividx;
6268 } *ctx = (void *)cb->ctx;
6269 struct net_device *dev;
6270 int err;
6271
6272 cb->seq = net->dev_base_seq;
6273
6274 err = rtnl_valid_stats_req(cb->nlh, cb->strict_check, true, extack);
6275 if (err)
6276 return err;
6277
6278 ifsm = nlmsg_data(cb->nlh);
6279 if (!ifsm->filter_mask) {
6280 NL_SET_ERR_MSG(extack, "Filter mask must be set for stats dump");
6281 return -EINVAL;
6282 }
6283
6284 err = rtnl_stats_get_parse(cb->nlh, ifsm->filter_mask, &filters,
6285 extack);
6286 if (err)
6287 return err;
6288
6289 for_each_netdev_dump(net, dev, ctx->ifindex) {
6290 err = rtnl_fill_statsinfo(skb, dev, RTM_NEWSTATS,
6291 NETLINK_CB(cb->skb).portid,
6292 cb->nlh->nlmsg_seq, 0,
6293 flags, &filters,
6294 &ctx->idxattr, &ctx->prividx,
6295 extack);
6296 /* If we ran out of room on the first message,
6297 * we're in trouble.
6298 */
6299 WARN_ON((err == -EMSGSIZE) && (skb->len == 0));
6300
6301 if (err < 0)
6302 break;
6303 ctx->prividx = 0;
6304 ctx->idxattr = 0;
6305 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
6306 }
6307
6308 return err;
6309 }
6310
rtnl_offload_xstats_notify(struct net_device * dev)6311 void rtnl_offload_xstats_notify(struct net_device *dev)
6312 {
6313 struct rtnl_stats_dump_filters response_filters = {};
6314 struct net *net = dev_net(dev);
6315 int idxattr = 0, prividx = 0;
6316 struct sk_buff *skb;
6317 int err = -ENOBUFS;
6318
6319 ASSERT_RTNL();
6320
6321 response_filters.mask[0] |=
6322 IFLA_STATS_FILTER_BIT(IFLA_STATS_LINK_OFFLOAD_XSTATS);
6323 response_filters.mask[IFLA_STATS_LINK_OFFLOAD_XSTATS] |=
6324 IFLA_STATS_FILTER_BIT(IFLA_OFFLOAD_XSTATS_HW_S_INFO);
6325
6326 skb = nlmsg_new(if_nlmsg_stats_size(dev, &response_filters),
6327 GFP_KERNEL);
6328 if (!skb)
6329 goto errout;
6330
6331 err = rtnl_fill_statsinfo(skb, dev, RTM_NEWSTATS, 0, 0, 0, 0,
6332 &response_filters, &idxattr, &prividx, NULL);
6333 if (err < 0) {
6334 kfree_skb(skb);
6335 goto errout;
6336 }
6337
6338 rtnl_notify(skb, net, 0, RTNLGRP_STATS, NULL, GFP_KERNEL);
6339 return;
6340
6341 errout:
6342 rtnl_set_sk_err(net, RTNLGRP_STATS, err);
6343 }
6344 EXPORT_SYMBOL(rtnl_offload_xstats_notify);
6345
rtnl_stats_set(struct sk_buff * skb,struct nlmsghdr * nlh,struct netlink_ext_ack * extack)6346 static int rtnl_stats_set(struct sk_buff *skb, struct nlmsghdr *nlh,
6347 struct netlink_ext_ack *extack)
6348 {
6349 enum netdev_offload_xstats_type t_l3 = NETDEV_OFFLOAD_XSTATS_TYPE_L3;
6350 struct rtnl_stats_dump_filters response_filters = {};
6351 struct nlattr *tb[IFLA_STATS_GETSET_MAX + 1];
6352 struct net *net = sock_net(skb->sk);
6353 struct net_device *dev = NULL;
6354 struct if_stats_msg *ifsm;
6355 bool notify = false;
6356 int err;
6357
6358 err = rtnl_valid_stats_req(nlh, netlink_strict_get_check(skb),
6359 false, extack);
6360 if (err)
6361 return err;
6362
6363 ifsm = nlmsg_data(nlh);
6364 if (ifsm->family != AF_UNSPEC) {
6365 NL_SET_ERR_MSG(extack, "Address family should be AF_UNSPEC");
6366 return -EINVAL;
6367 }
6368
6369 if (ifsm->ifindex > 0)
6370 dev = __dev_get_by_index(net, ifsm->ifindex);
6371 else
6372 return -EINVAL;
6373
6374 if (!dev)
6375 return -ENODEV;
6376
6377 if (ifsm->filter_mask) {
6378 NL_SET_ERR_MSG(extack, "Filter mask must be 0 for stats set");
6379 return -EINVAL;
6380 }
6381
6382 err = nlmsg_parse(nlh, sizeof(*ifsm), tb, IFLA_STATS_GETSET_MAX,
6383 ifla_stats_set_policy, extack);
6384 if (err < 0)
6385 return err;
6386
6387 if (tb[IFLA_STATS_SET_OFFLOAD_XSTATS_L3_STATS]) {
6388 u8 req = nla_get_u8(tb[IFLA_STATS_SET_OFFLOAD_XSTATS_L3_STATS]);
6389
6390 if (req)
6391 err = netdev_offload_xstats_enable(dev, t_l3, extack);
6392 else
6393 err = netdev_offload_xstats_disable(dev, t_l3);
6394
6395 if (!err)
6396 notify = true;
6397 else if (err != -EALREADY)
6398 return err;
6399
6400 response_filters.mask[0] |=
6401 IFLA_STATS_FILTER_BIT(IFLA_STATS_LINK_OFFLOAD_XSTATS);
6402 response_filters.mask[IFLA_STATS_LINK_OFFLOAD_XSTATS] |=
6403 IFLA_STATS_FILTER_BIT(IFLA_OFFLOAD_XSTATS_HW_S_INFO);
6404 }
6405
6406 if (notify)
6407 rtnl_offload_xstats_notify(dev);
6408
6409 return 0;
6410 }
6411
rtnl_mdb_valid_dump_req(const struct nlmsghdr * nlh,struct netlink_ext_ack * extack)6412 static int rtnl_mdb_valid_dump_req(const struct nlmsghdr *nlh,
6413 struct netlink_ext_ack *extack)
6414 {
6415 struct br_port_msg *bpm;
6416
6417 if (nlh->nlmsg_len < nlmsg_msg_size(sizeof(*bpm))) {
6418 NL_SET_ERR_MSG(extack, "Invalid header for mdb dump request");
6419 return -EINVAL;
6420 }
6421
6422 bpm = nlmsg_data(nlh);
6423 if (bpm->ifindex) {
6424 NL_SET_ERR_MSG(extack, "Filtering by device index is not supported for mdb dump request");
6425 return -EINVAL;
6426 }
6427 if (nlmsg_attrlen(nlh, sizeof(*bpm))) {
6428 NL_SET_ERR_MSG(extack, "Invalid data after header in mdb dump request");
6429 return -EINVAL;
6430 }
6431
6432 return 0;
6433 }
6434
/* Per-dump state that rtnl_mdb_dump() overlays on netlink_callback::ctx. */
struct rtnl_mdb_dump_ctx {
	long idx;	/* device position at which the next dump pass resumes */
};
6438
rtnl_mdb_dump(struct sk_buff * skb,struct netlink_callback * cb)6439 static int rtnl_mdb_dump(struct sk_buff *skb, struct netlink_callback *cb)
6440 {
6441 struct rtnl_mdb_dump_ctx *ctx = (void *)cb->ctx;
6442 struct net *net = sock_net(skb->sk);
6443 struct net_device *dev;
6444 int idx, s_idx;
6445 int err;
6446
6447 NL_ASSERT_CTX_FITS(struct rtnl_mdb_dump_ctx);
6448
6449 if (cb->strict_check) {
6450 err = rtnl_mdb_valid_dump_req(cb->nlh, cb->extack);
6451 if (err)
6452 return err;
6453 }
6454
6455 s_idx = ctx->idx;
6456 idx = 0;
6457
6458 for_each_netdev(net, dev) {
6459 if (idx < s_idx)
6460 goto skip;
6461 if (!dev->netdev_ops->ndo_mdb_dump)
6462 goto skip;
6463
6464 err = dev->netdev_ops->ndo_mdb_dump(dev, skb, cb);
6465 if (err == -EMSGSIZE)
6466 goto out;
6467 /* Moving on to next device, reset markers and sequence
6468 * counters since they are all maintained per-device.
6469 */
6470 memset(cb->ctx, 0, sizeof(cb->ctx));
6471 cb->prev_seq = 0;
6472 cb->seq = 0;
6473 skip:
6474 idx++;
6475 }
6476
6477 out:
6478 ctx->idx = idx;
6479 return skb->len;
6480 }
6481
rtnl_validate_mdb_entry_get(const struct nlattr * attr,struct netlink_ext_ack * extack)6482 static int rtnl_validate_mdb_entry_get(const struct nlattr *attr,
6483 struct netlink_ext_ack *extack)
6484 {
6485 struct br_mdb_entry *entry = nla_data(attr);
6486
6487 if (nla_len(attr) != sizeof(struct br_mdb_entry)) {
6488 NL_SET_ERR_MSG_ATTR(extack, attr, "Invalid attribute length");
6489 return -EINVAL;
6490 }
6491
6492 if (entry->ifindex) {
6493 NL_SET_ERR_MSG(extack, "Entry ifindex cannot be specified");
6494 return -EINVAL;
6495 }
6496
6497 if (entry->state) {
6498 NL_SET_ERR_MSG(extack, "Entry state cannot be specified");
6499 return -EINVAL;
6500 }
6501
6502 if (entry->flags) {
6503 NL_SET_ERR_MSG(extack, "Entry flags cannot be specified");
6504 return -EINVAL;
6505 }
6506
6507 if (entry->vid >= VLAN_VID_MASK) {
6508 NL_SET_ERR_MSG(extack, "Invalid entry VLAN id");
6509 return -EINVAL;
6510 }
6511
6512 if (entry->addr.proto != htons(ETH_P_IP) &&
6513 entry->addr.proto != htons(ETH_P_IPV6) &&
6514 entry->addr.proto != 0) {
6515 NL_SET_ERR_MSG(extack, "Unknown entry protocol");
6516 return -EINVAL;
6517 }
6518
6519 return 0;
6520 }
6521
/* Attribute policy used by rtnl_mdb_get() when parsing RTM_GETMDB requests.
 * MDBA_GET_ENTRY is a binary attribute checked by
 * rtnl_validate_mdb_entry_get(); MDBA_GET_ENTRY_ATTRS is a nested attribute.
 */
static const struct nla_policy mdba_get_policy[MDBA_GET_ENTRY_MAX + 1] = {
	[MDBA_GET_ENTRY] = NLA_POLICY_VALIDATE_FN(NLA_BINARY,
						  rtnl_validate_mdb_entry_get,
						  sizeof(struct br_mdb_entry)),
	[MDBA_GET_ENTRY_ATTRS] = { .type = NLA_NESTED },
};
6528
rtnl_mdb_get(struct sk_buff * in_skb,struct nlmsghdr * nlh,struct netlink_ext_ack * extack)6529 static int rtnl_mdb_get(struct sk_buff *in_skb, struct nlmsghdr *nlh,
6530 struct netlink_ext_ack *extack)
6531 {
6532 struct nlattr *tb[MDBA_GET_ENTRY_MAX + 1];
6533 struct net *net = sock_net(in_skb->sk);
6534 struct br_port_msg *bpm;
6535 struct net_device *dev;
6536 int err;
6537
6538 err = nlmsg_parse(nlh, sizeof(struct br_port_msg), tb,
6539 MDBA_GET_ENTRY_MAX, mdba_get_policy, extack);
6540 if (err)
6541 return err;
6542
6543 bpm = nlmsg_data(nlh);
6544 if (!bpm->ifindex) {
6545 NL_SET_ERR_MSG(extack, "Invalid ifindex");
6546 return -EINVAL;
6547 }
6548
6549 dev = __dev_get_by_index(net, bpm->ifindex);
6550 if (!dev) {
6551 NL_SET_ERR_MSG(extack, "Device doesn't exist");
6552 return -ENODEV;
6553 }
6554
6555 if (NL_REQ_ATTR_CHECK(extack, NULL, tb, MDBA_GET_ENTRY)) {
6556 NL_SET_ERR_MSG(extack, "Missing MDBA_GET_ENTRY attribute");
6557 return -EINVAL;
6558 }
6559
6560 if (!dev->netdev_ops->ndo_mdb_get) {
6561 NL_SET_ERR_MSG(extack, "Device does not support MDB operations");
6562 return -EOPNOTSUPP;
6563 }
6564
6565 return dev->netdev_ops->ndo_mdb_get(dev, tb, NETLINK_CB(in_skb).portid,
6566 nlh->nlmsg_seq, extack);
6567 }
6568
rtnl_validate_mdb_entry(const struct nlattr * attr,struct netlink_ext_ack * extack)6569 static int rtnl_validate_mdb_entry(const struct nlattr *attr,
6570 struct netlink_ext_ack *extack)
6571 {
6572 struct br_mdb_entry *entry = nla_data(attr);
6573
6574 if (nla_len(attr) != sizeof(struct br_mdb_entry)) {
6575 NL_SET_ERR_MSG_ATTR(extack, attr, "Invalid attribute length");
6576 return -EINVAL;
6577 }
6578
6579 if (entry->ifindex == 0) {
6580 NL_SET_ERR_MSG(extack, "Zero entry ifindex is not allowed");
6581 return -EINVAL;
6582 }
6583
6584 if (entry->addr.proto == htons(ETH_P_IP)) {
6585 if (!ipv4_is_multicast(entry->addr.u.ip4) &&
6586 !ipv4_is_zeronet(entry->addr.u.ip4)) {
6587 NL_SET_ERR_MSG(extack, "IPv4 entry group address is not multicast or 0.0.0.0");
6588 return -EINVAL;
6589 }
6590 if (ipv4_is_local_multicast(entry->addr.u.ip4)) {
6591 NL_SET_ERR_MSG(extack, "IPv4 entry group address is local multicast");
6592 return -EINVAL;
6593 }
6594 #if IS_ENABLED(CONFIG_IPV6)
6595 } else if (entry->addr.proto == htons(ETH_P_IPV6)) {
6596 if (ipv6_addr_is_ll_all_nodes(&entry->addr.u.ip6)) {
6597 NL_SET_ERR_MSG(extack, "IPv6 entry group address is link-local all nodes");
6598 return -EINVAL;
6599 }
6600 #endif
6601 } else if (entry->addr.proto == 0) {
6602 /* L2 mdb */
6603 if (!is_multicast_ether_addr(entry->addr.u.mac_addr)) {
6604 NL_SET_ERR_MSG(extack, "L2 entry group is not multicast");
6605 return -EINVAL;
6606 }
6607 } else {
6608 NL_SET_ERR_MSG(extack, "Unknown entry protocol");
6609 return -EINVAL;
6610 }
6611
6612 if (entry->state != MDB_PERMANENT && entry->state != MDB_TEMPORARY) {
6613 NL_SET_ERR_MSG(extack, "Unknown entry state");
6614 return -EINVAL;
6615 }
6616 if (entry->vid >= VLAN_VID_MASK) {
6617 NL_SET_ERR_MSG(extack, "Invalid entry VLAN id");
6618 return -EINVAL;
6619 }
6620
6621 return 0;
6622 }
6623
/* Attribute policy used by rtnl_mdb_add() and by the non-bulk path of
 * rtnl_mdb_del().  MDBA_SET_ENTRY is a binary attribute checked by
 * rtnl_validate_mdb_entry(); MDBA_SET_ENTRY_ATTRS is a nested attribute.
 * The UNSPEC slot only carries strict_start_type, set to the first type
 * after MDBA_SET_ENTRY_ATTRS.
 */
static const struct nla_policy mdba_policy[MDBA_SET_ENTRY_MAX + 1] = {
	[MDBA_SET_ENTRY_UNSPEC] = { .strict_start_type = MDBA_SET_ENTRY_ATTRS + 1 },
	[MDBA_SET_ENTRY] = NLA_POLICY_VALIDATE_FN(NLA_BINARY,
						  rtnl_validate_mdb_entry,
						  sizeof(struct br_mdb_entry)),
	[MDBA_SET_ENTRY_ATTRS] = { .type = NLA_NESTED },
};
6631
rtnl_mdb_add(struct sk_buff * skb,struct nlmsghdr * nlh,struct netlink_ext_ack * extack)6632 static int rtnl_mdb_add(struct sk_buff *skb, struct nlmsghdr *nlh,
6633 struct netlink_ext_ack *extack)
6634 {
6635 struct nlattr *tb[MDBA_SET_ENTRY_MAX + 1];
6636 struct net *net = sock_net(skb->sk);
6637 struct br_port_msg *bpm;
6638 struct net_device *dev;
6639 int err;
6640
6641 err = nlmsg_parse_deprecated(nlh, sizeof(*bpm), tb,
6642 MDBA_SET_ENTRY_MAX, mdba_policy, extack);
6643 if (err)
6644 return err;
6645
6646 bpm = nlmsg_data(nlh);
6647 if (!bpm->ifindex) {
6648 NL_SET_ERR_MSG(extack, "Invalid ifindex");
6649 return -EINVAL;
6650 }
6651
6652 dev = __dev_get_by_index(net, bpm->ifindex);
6653 if (!dev) {
6654 NL_SET_ERR_MSG(extack, "Device doesn't exist");
6655 return -ENODEV;
6656 }
6657
6658 if (NL_REQ_ATTR_CHECK(extack, NULL, tb, MDBA_SET_ENTRY)) {
6659 NL_SET_ERR_MSG(extack, "Missing MDBA_SET_ENTRY attribute");
6660 return -EINVAL;
6661 }
6662
6663 if (!dev->netdev_ops->ndo_mdb_add) {
6664 NL_SET_ERR_MSG(extack, "Device does not support MDB operations");
6665 return -EOPNOTSUPP;
6666 }
6667
6668 return dev->netdev_ops->ndo_mdb_add(dev, tb, nlh->nlmsg_flags, extack);
6669 }
6670
rtnl_validate_mdb_entry_del_bulk(const struct nlattr * attr,struct netlink_ext_ack * extack)6671 static int rtnl_validate_mdb_entry_del_bulk(const struct nlattr *attr,
6672 struct netlink_ext_ack *extack)
6673 {
6674 struct br_mdb_entry *entry = nla_data(attr);
6675 struct br_mdb_entry zero_entry = {};
6676
6677 if (nla_len(attr) != sizeof(struct br_mdb_entry)) {
6678 NL_SET_ERR_MSG_ATTR(extack, attr, "Invalid attribute length");
6679 return -EINVAL;
6680 }
6681
6682 if (entry->state != MDB_PERMANENT && entry->state != MDB_TEMPORARY) {
6683 NL_SET_ERR_MSG(extack, "Unknown entry state");
6684 return -EINVAL;
6685 }
6686
6687 if (entry->flags) {
6688 NL_SET_ERR_MSG(extack, "Entry flags cannot be set");
6689 return -EINVAL;
6690 }
6691
6692 if (entry->vid >= VLAN_N_VID - 1) {
6693 NL_SET_ERR_MSG(extack, "Invalid entry VLAN id");
6694 return -EINVAL;
6695 }
6696
6697 if (memcmp(&entry->addr, &zero_entry.addr, sizeof(entry->addr))) {
6698 NL_SET_ERR_MSG(extack, "Entry address cannot be set");
6699 return -EINVAL;
6700 }
6701
6702 return 0;
6703 }
6704
/* Attribute policy used by rtnl_mdb_del() when NLM_F_BULK is set.
 * MDBA_SET_ENTRY is a binary attribute checked by
 * rtnl_validate_mdb_entry_del_bulk(); MDBA_SET_ENTRY_ATTRS is a nested
 * attribute.
 */
static const struct nla_policy mdba_del_bulk_policy[MDBA_SET_ENTRY_MAX + 1] = {
	[MDBA_SET_ENTRY] = NLA_POLICY_VALIDATE_FN(NLA_BINARY,
						  rtnl_validate_mdb_entry_del_bulk,
						  sizeof(struct br_mdb_entry)),
	[MDBA_SET_ENTRY_ATTRS] = { .type = NLA_NESTED },
};
6711
rtnl_mdb_del(struct sk_buff * skb,struct nlmsghdr * nlh,struct netlink_ext_ack * extack)6712 static int rtnl_mdb_del(struct sk_buff *skb, struct nlmsghdr *nlh,
6713 struct netlink_ext_ack *extack)
6714 {
6715 bool del_bulk = !!(nlh->nlmsg_flags & NLM_F_BULK);
6716 struct nlattr *tb[MDBA_SET_ENTRY_MAX + 1];
6717 struct net *net = sock_net(skb->sk);
6718 struct br_port_msg *bpm;
6719 struct net_device *dev;
6720 int err;
6721
6722 if (!del_bulk)
6723 err = nlmsg_parse_deprecated(nlh, sizeof(*bpm), tb,
6724 MDBA_SET_ENTRY_MAX, mdba_policy,
6725 extack);
6726 else
6727 err = nlmsg_parse(nlh, sizeof(*bpm), tb, MDBA_SET_ENTRY_MAX,
6728 mdba_del_bulk_policy, extack);
6729 if (err)
6730 return err;
6731
6732 bpm = nlmsg_data(nlh);
6733 if (!bpm->ifindex) {
6734 NL_SET_ERR_MSG(extack, "Invalid ifindex");
6735 return -EINVAL;
6736 }
6737
6738 dev = __dev_get_by_index(net, bpm->ifindex);
6739 if (!dev) {
6740 NL_SET_ERR_MSG(extack, "Device doesn't exist");
6741 return -ENODEV;
6742 }
6743
6744 if (NL_REQ_ATTR_CHECK(extack, NULL, tb, MDBA_SET_ENTRY)) {
6745 NL_SET_ERR_MSG(extack, "Missing MDBA_SET_ENTRY attribute");
6746 return -EINVAL;
6747 }
6748
6749 if (del_bulk) {
6750 if (!dev->netdev_ops->ndo_mdb_del_bulk) {
6751 NL_SET_ERR_MSG(extack, "Device does not support MDB bulk deletion");
6752 return -EOPNOTSUPP;
6753 }
6754 return dev->netdev_ops->ndo_mdb_del_bulk(dev, tb, extack);
6755 }
6756
6757 if (!dev->netdev_ops->ndo_mdb_del) {
6758 NL_SET_ERR_MSG(extack, "Device does not support MDB operations");
6759 return -EOPNOTSUPP;
6760 }
6761
6762 return dev->netdev_ops->ndo_mdb_del(dev, tb, extack);
6763 }
6764
6765 /* Process one rtnetlink message. */
6766
/* Dump trampoline installed by rtnetlink_dump_start().
 *
 * The real dump handler is carried in cb->data.  It is invoked with the rtnl
 * lock held unless cb->flags has RTNL_FLAG_DUMP_UNLOCKED set.  For handlers
 * flagged RTNL_FLAG_DUMP_SPLIT_NLM_DONE the return value is rewritten so
 * that a handler returning 0 still reports skb->len for this call; cb->data
 * is cleared so that the next call returns 0 without invoking the handler.
 */
static int rtnl_dumpit(struct sk_buff *skb, struct netlink_callback *cb)
{
	const bool needs_lock = !(cb->flags & RTNL_FLAG_DUMP_UNLOCKED);
	rtnl_dumpit_func dumpit = cb->data;
	int err;

	/* The previous iteration has already finished; avoid calling
	 * ->dumpit() again, as it may not expect to be called after it has
	 * reached the end.
	 */
	if (!dumpit)
		return 0;

	if (needs_lock)
		rtnl_lock();
	err = dumpit(skb, cb);
	if (needs_lock)
		rtnl_unlock();

	/* Old dump handlers used to send NLM_DONE in a separate recvmsg().
	 * Some applications which parse netlink manually depend on this.
	 */
	if (cb->flags & RTNL_FLAG_DUMP_SPLIT_NLM_DONE) {
		/* Real errors propagate; -EMSGSIZE is not treated as one. */
		if (err < 0 && err != -EMSGSIZE)
			return err;
		/* Handler is done: remember that for the next call. */
		if (!err)
			cb->data = NULL;

		return skb->len;
	}
	return err;
}
6798
rtnetlink_dump_start(struct sock * ssk,struct sk_buff * skb,const struct nlmsghdr * nlh,struct netlink_dump_control * control)6799 static int rtnetlink_dump_start(struct sock *ssk, struct sk_buff *skb,
6800 const struct nlmsghdr *nlh,
6801 struct netlink_dump_control *control)
6802 {
6803 if (control->flags & RTNL_FLAG_DUMP_SPLIT_NLM_DONE ||
6804 !(control->flags & RTNL_FLAG_DUMP_UNLOCKED)) {
6805 WARN_ON(control->data);
6806 control->data = control->dump;
6807 control->dump = rtnl_dumpit;
6808 }
6809
6810 return netlink_dump_start(ssk, skb, nlh, control);
6811 }
6812
/* Dispatch a single rtnetlink message to its registered handler.
 *
 * @skb:    buffer the message arrived in
 * @nlh:    header of the message to process
 * @extack: extended ack used to report error details
 *
 * Message types above RTM_MAX are rejected with -EOPNOTSUPP; a payload
 * shorter than struct rtgenmsg is accepted and ignored (returns 0).  Any
 * kind other than RTNL_KIND_GET requires CAP_NET_ADMIN (-EPERM otherwise).
 *
 * GET requests with NLM_F_DUMP are started as netlink dumps through the
 * handler's ->dumpit.  Everything else goes to ->doit, which runs either
 * without the rtnl lock (RTNL_FLAG_DOIT_UNLOCKED) or under rtnl_lock().
 * In both cases the handler registered for the message's family is
 * preferred, with PF_UNSPEC as the fallback.
 *
 * Returns the handler's result, -EOPNOTSUPP when no suitable handler exists
 * or bulk delete is unsupported, or -EPROTONOSUPPORT when a reference on the
 * owning module cannot be taken.
 */
static int rtnetlink_rcv_msg(struct sk_buff *skb, struct nlmsghdr *nlh,
			     struct netlink_ext_ack *extack)
{
	struct net *net = sock_net(skb->sk);
	struct rtnl_link *link;
	enum rtnl_kinds kind;
	struct module *owner;
	int err = -EOPNOTSUPP;
	rtnl_doit_func doit;
	unsigned int flags;
	int family;
	int type;

	type = nlh->nlmsg_type;
	if (type > RTM_MAX)
		return -EOPNOTSUPP;

	/* From here on 'type' is relative to RTM_BASE. */
	type -= RTM_BASE;

	/* All the messages must have at least 1 byte length */
	if (nlmsg_len(nlh) < sizeof(struct rtgenmsg))
		return 0;

	family = ((struct rtgenmsg *)nlmsg_data(nlh))->rtgen_family;
	kind = rtnl_msgtype_kind(type);

	if (kind != RTNL_KIND_GET && !netlink_net_capable(skb, CAP_NET_ADMIN))
		return -EPERM;

	/* The handler entry is looked up and read under RCU. */
	rcu_read_lock();
	if (kind == RTNL_KIND_GET && (nlh->nlmsg_flags & NLM_F_DUMP)) {
		struct sock *rtnl;
		rtnl_dumpit_func dumpit;
		u32 min_dump_alloc = 0;

		/* Prefer the family-specific dump handler, else PF_UNSPEC. */
		link = rtnl_get_link(family, type);
		if (!link || !link->dumpit) {
			family = PF_UNSPEC;
			link = rtnl_get_link(family, type);
			if (!link || !link->dumpit)
				goto err_unlock;
		}
		/* Copy what is needed out of 'link' before leaving RCU. */
		owner = link->owner;
		dumpit = link->dumpit;
		flags = link->flags;

		if (type == RTM_GETLINK - RTM_BASE)
			min_dump_alloc = rtnl_calcit(skb, nlh);

		err = 0;
		/* need to do this before rcu_read_unlock() */
		if (!try_module_get(owner))
			err = -EPROTONOSUPPORT;

		rcu_read_unlock();

		rtnl = net->rtnl;
		if (err == 0) {
			struct netlink_dump_control c = {
				.dump		= dumpit,
				.min_dump_alloc	= min_dump_alloc,
				.module		= owner,
				.flags		= flags,
			};
			err = rtnetlink_dump_start(rtnl, skb, nlh, &c);
			/* netlink_dump_start() will keep a reference on
			 * module if dump is still in progress.
			 */
			module_put(owner);
		}
		return err;
	}

	/* Non-dump request: prefer the family-specific doit, else PF_UNSPEC.
	 * 'family' is updated on fallback so that the second lookup under
	 * rtnl_lock() below resolves the same entry.
	 */
	link = rtnl_get_link(family, type);
	if (!link || !link->doit) {
		family = PF_UNSPEC;
		link = rtnl_get_link(PF_UNSPEC, type);
		if (!link || !link->doit)
			goto out_unlock;
	}

	owner = link->owner;
	if (!try_module_get(owner)) {
		err = -EPROTONOSUPPORT;
		goto out_unlock;
	}

	flags = link->flags;
	if (kind == RTNL_KIND_DEL && (nlh->nlmsg_flags & NLM_F_BULK) &&
	    !(flags & RTNL_FLAG_BULK_DEL_SUPPORTED)) {
		NL_SET_ERR_MSG(extack, "Bulk delete is not supported");
		module_put(owner);
		goto err_unlock;
	}

	if (flags & RTNL_FLAG_DOIT_UNLOCKED) {
		/* Handler runs without rtnl_lock(); grab the function
		 * pointer while still inside the RCU section.
		 */
		doit = link->doit;
		rcu_read_unlock();
		if (doit)
			err = doit(skb, nlh, extack);
		module_put(owner);
		return err;
	}
	rcu_read_unlock();

	/* 'link' was obtained under RCU, which has now been left; look the
	 * handler up again once the rtnl lock is held.
	 */
	rtnl_lock();
	link = rtnl_get_link(family, type);
	if (link && link->doit)
		err = link->doit(skb, nlh, extack);
	rtnl_unlock();

	module_put(owner);

	return err;

	/* Leave RCU and return whatever 'err' currently holds. */
out_unlock:
	rcu_read_unlock();
	return err;

	/* Leave RCU and report -EOPNOTSUPP regardless of 'err'. */
err_unlock:
	rcu_read_unlock();
	return -EOPNOTSUPP;
}
6936
rtnetlink_rcv(struct sk_buff * skb)6937 static void rtnetlink_rcv(struct sk_buff *skb)
6938 {
6939 netlink_rcv_skb(skb, &rtnetlink_rcv_msg);
6940 }
6941
rtnetlink_bind(struct net * net,int group)6942 static int rtnetlink_bind(struct net *net, int group)
6943 {
6944 switch (group) {
6945 case RTNLGRP_IPV4_MROUTE_R:
6946 case RTNLGRP_IPV6_MROUTE_R:
6947 if (!ns_capable(net->user_ns, CAP_NET_ADMIN))
6948 return -EPERM;
6949 break;
6950 }
6951 return 0;
6952 }
6953
rtnetlink_event(struct notifier_block * this,unsigned long event,void * ptr)6954 static int rtnetlink_event(struct notifier_block *this, unsigned long event, void *ptr)
6955 {
6956 struct net_device *dev = netdev_notifier_info_to_dev(ptr);
6957
6958 switch (event) {
6959 case NETDEV_REBOOT:
6960 case NETDEV_CHANGEMTU:
6961 case NETDEV_CHANGEADDR:
6962 case NETDEV_CHANGENAME:
6963 case NETDEV_FEAT_CHANGE:
6964 case NETDEV_BONDING_FAILOVER:
6965 case NETDEV_POST_TYPE_CHANGE:
6966 case NETDEV_NOTIFY_PEERS:
6967 case NETDEV_CHANGEUPPER:
6968 case NETDEV_RESEND_IGMP:
6969 case NETDEV_CHANGEINFODATA:
6970 case NETDEV_CHANGELOWERSTATE:
6971 case NETDEV_CHANGE_TX_QUEUE_LEN:
6972 rtmsg_ifinfo_event(RTM_NEWLINK, dev, 0, rtnl_get_event(event),
6973 GFP_KERNEL, NULL, 0, 0, NULL);
6974 break;
6975 default:
6976 break;
6977 }
6978 return NOTIFY_DONE;
6979 }
6980
/* Notifier block registered by rtnetlink_init(); routes netdevice events to
 * rtnetlink_event().
 */
static struct notifier_block rtnetlink_dev_notifier = {
	.notifier_call	= rtnetlink_event,
};
6984
6985
rtnetlink_net_init(struct net * net)6986 static int __net_init rtnetlink_net_init(struct net *net)
6987 {
6988 struct sock *sk;
6989 struct netlink_kernel_cfg cfg = {
6990 .groups = RTNLGRP_MAX,
6991 .input = rtnetlink_rcv,
6992 .flags = NL_CFG_F_NONROOT_RECV,
6993 .bind = rtnetlink_bind,
6994 };
6995
6996 sk = netlink_kernel_create(net, NETLINK_ROUTE, &cfg);
6997 if (!sk)
6998 return -ENOMEM;
6999 net->rtnl = sk;
7000 return 0;
7001 }
7002
rtnetlink_net_exit(struct net * net)7003 static void __net_exit rtnetlink_net_exit(struct net *net)
7004 {
7005 netlink_kernel_release(net->rtnl);
7006 net->rtnl = NULL;
7007 }
7008
/* Per-network-namespace hooks, registered by rtnetlink_init(): create the
 * rtnetlink socket on namespace init and release it on namespace exit.
 */
static struct pernet_operations rtnetlink_net_ops = {
	.init = rtnetlink_net_init,
	.exit = rtnetlink_net_exit,
};
7013
/* Message handlers registered by rtnetlink_init() via rtnl_register_many().
 *
 * Each entry ties a message type to its ->doit and/or ->dumpit callbacks
 * plus optional RTNL_FLAG_* flags.  Entries that do not set .protocol leave
 * it zero-initialised (presumably PF_UNSPEC, which rtnetlink_rcv_msg() uses
 * as the fallback family); the remaining entries are registered for
 * PF_BRIDGE.
 */
static const struct rtnl_msg_handler rtnetlink_rtnl_msg_handlers[] __initconst = {
	/* Link, address/route/netconf dump and statistics messages. */
	{.msgtype = RTM_NEWLINK, .doit = rtnl_newlink,
	 .flags = RTNL_FLAG_DOIT_PERNET},
	{.msgtype = RTM_DELLINK, .doit = rtnl_dellink,
	 .flags = RTNL_FLAG_DOIT_PERNET_WIP},
	{.msgtype = RTM_GETLINK, .doit = rtnl_getlink,
	 .dumpit = rtnl_dump_ifinfo, .flags = RTNL_FLAG_DUMP_SPLIT_NLM_DONE},
	{.msgtype = RTM_SETLINK, .doit = rtnl_setlink,
	 .flags = RTNL_FLAG_DOIT_PERNET_WIP},
	{.msgtype = RTM_GETADDR, .dumpit = rtnl_dump_all},
	{.msgtype = RTM_GETROUTE, .dumpit = rtnl_dump_all},
	{.msgtype = RTM_GETNETCONF, .dumpit = rtnl_dump_all},
	{.msgtype = RTM_GETSTATS, .doit = rtnl_stats_get,
	 .dumpit = rtnl_stats_dump},
	{.msgtype = RTM_SETSTATS, .doit = rtnl_stats_set},
	{.msgtype = RTM_NEWLINKPROP, .doit = rtnl_newlinkprop},
	{.msgtype = RTM_DELLINKPROP, .doit = rtnl_dellinkprop},
	/* PF_BRIDGE: link, FDB (NEIGH) and MDB messages. */
	{.protocol = PF_BRIDGE, .msgtype = RTM_GETLINK,
	 .dumpit = rtnl_bridge_getlink},
	{.protocol = PF_BRIDGE, .msgtype = RTM_DELLINK,
	 .doit = rtnl_bridge_dellink},
	{.protocol = PF_BRIDGE, .msgtype = RTM_SETLINK,
	 .doit = rtnl_bridge_setlink},
	{.protocol = PF_BRIDGE, .msgtype = RTM_NEWNEIGH, .doit = rtnl_fdb_add},
	{.protocol = PF_BRIDGE, .msgtype = RTM_DELNEIGH, .doit = rtnl_fdb_del,
	 .flags = RTNL_FLAG_BULK_DEL_SUPPORTED},
	{.protocol = PF_BRIDGE, .msgtype = RTM_GETNEIGH, .doit = rtnl_fdb_get,
	 .dumpit = rtnl_fdb_dump},
	{.protocol = PF_BRIDGE, .msgtype = RTM_NEWMDB, .doit = rtnl_mdb_add},
	{.protocol = PF_BRIDGE, .msgtype = RTM_DELMDB, .doit = rtnl_mdb_del,
	 .flags = RTNL_FLAG_BULK_DEL_SUPPORTED},
	{.protocol = PF_BRIDGE, .msgtype = RTM_GETMDB, .doit = rtnl_mdb_get,
	 .dumpit = rtnl_mdb_dump},
};
7048
rtnetlink_init(void)7049 void __init rtnetlink_init(void)
7050 {
7051 if (register_pernet_subsys(&rtnetlink_net_ops))
7052 panic("rtnetlink_init: cannot initialize rtnetlink\n");
7053
7054 register_netdevice_notifier(&rtnetlink_dev_notifier);
7055
7056 rtnl_register_many(rtnetlink_rtnl_msg_handlers);
7057 }
7058