1 // SPDX-License-Identifier: GPL-2.0-or-later
2 /*
3 * INET An implementation of the TCP/IP protocol suite for the LINUX
4 * operating system. INET is implemented using the BSD Socket
5 * interface as the means of communication with the user level.
6 *
7 * Routing netlink socket interface: protocol independent part.
8 *
9 * Authors: Alexey Kuznetsov, <kuznet@ms2.inr.ac.ru>
10 *
11 * Fixes:
12 * Vitaly E. Lavrov RTA_OK arithmetic was wrong.
13 */
14
15 #include <linux/bitops.h>
16 #include <linux/errno.h>
17 #include <linux/module.h>
18 #include <linux/types.h>
19 #include <linux/socket.h>
20 #include <linux/kernel.h>
21 #include <linux/timer.h>
22 #include <linux/string.h>
23 #include <linux/sockios.h>
24 #include <linux/net.h>
25 #include <linux/fcntl.h>
26 #include <linux/mm.h>
27 #include <linux/slab.h>
28 #include <linux/interrupt.h>
29 #include <linux/capability.h>
30 #include <linux/skbuff.h>
31 #include <linux/init.h>
32 #include <linux/security.h>
33 #include <linux/mutex.h>
34 #include <linux/if_addr.h>
35 #include <linux/if_bridge.h>
36 #include <linux/if_vlan.h>
37 #include <linux/pci.h>
38 #include <linux/etherdevice.h>
39 #include <linux/bpf.h>
40
41 #include <linux/uaccess.h>
42
43 #include <linux/inet.h>
44 #include <linux/netdevice.h>
45 #include <net/ip.h>
46 #include <net/protocol.h>
47 #include <net/arp.h>
48 #include <net/route.h>
49 #include <net/udp.h>
50 #include <net/tcp.h>
51 #include <net/sock.h>
52 #include <net/pkt_sched.h>
53 #include <net/fib_rules.h>
54 #include <net/rtnetlink.h>
55 #include <net/net_namespace.h>
56 #include <net/devlink.h>
57 #if IS_ENABLED(CONFIG_IPV6)
58 #include <net/addrconf.h>
59 #endif
60 #include <linux/dpll.h>
61
62 #include "dev.h"
63
/* Upper bounds on rtnl_link_ops->maxtype and ->slave_maxtype; they are
 * enforced by rtnl_link_register() to avoid stack buffer overflow.
 */
#define RTNL_MAX_TYPE		50
#define RTNL_SLAVE_MAX_TYPE	44

/* One registered handler entry for a (protocol family, message type) pair. */
struct rtnl_link {
	rtnl_doit_func		doit;	/* called for each request message */
	rtnl_dumpit_func	dumpit;	/* called for each dump request */
	struct module		*owner;	/* module that registered the entry, or NULL */
	unsigned int		flags;	/* accumulated rtnl_link_flags */
	struct rcu_head		rcu;	/* lets the entry be released with kfree_rcu() */
};
74
75 static DEFINE_MUTEX(rtnl_mutex);
76
rtnl_lock(void)77 void rtnl_lock(void)
78 {
79 mutex_lock(&rtnl_mutex);
80 }
81 EXPORT_SYMBOL(rtnl_lock);
82
rtnl_lock_killable(void)83 int rtnl_lock_killable(void)
84 {
85 return mutex_lock_killable(&rtnl_mutex);
86 }
87 EXPORT_SYMBOL(rtnl_lock_killable);
88
89 static struct sk_buff *defer_kfree_skb_list;
rtnl_kfree_skbs(struct sk_buff * head,struct sk_buff * tail)90 void rtnl_kfree_skbs(struct sk_buff *head, struct sk_buff *tail)
91 {
92 if (head && tail) {
93 tail->next = defer_kfree_skb_list;
94 defer_kfree_skb_list = head;
95 }
96 }
97 EXPORT_SYMBOL(rtnl_kfree_skbs);
98
__rtnl_unlock(void)99 void __rtnl_unlock(void)
100 {
101 struct sk_buff *head = defer_kfree_skb_list;
102
103 defer_kfree_skb_list = NULL;
104
105 /* Ensure that we didn't actually add any TODO item when __rtnl_unlock()
106 * is used. In some places, e.g. in cfg80211, we have code that will do
107 * something like
108 * rtnl_lock()
109 * wiphy_lock()
110 * ...
111 * rtnl_unlock()
112 *
113 * and because netdev_run_todo() acquires the RTNL for items on the list
114 * we could cause a situation such as this:
115 * Thread 1 Thread 2
116 * rtnl_lock()
117 * unregister_netdevice()
118 * __rtnl_unlock()
119 * rtnl_lock()
120 * wiphy_lock()
121 * rtnl_unlock()
122 * netdev_run_todo()
123 * __rtnl_unlock()
124 *
125 * // list not empty now
126 * // because of thread 2
127 * rtnl_lock()
128 * while (!list_empty(...))
129 * rtnl_lock()
130 * wiphy_lock()
131 * **** DEADLOCK ****
132 *
133 * However, usage of __rtnl_unlock() is rare, and so we can ensure that
134 * it's not used in cases where something is added to do the list.
135 */
136 WARN_ON(!list_empty(&net_todo_list));
137
138 mutex_unlock(&rtnl_mutex);
139
140 while (head) {
141 struct sk_buff *next = head->next;
142
143 kfree_skb(head);
144 cond_resched();
145 head = next;
146 }
147 }
148
/* Release the RTNL. The mutex is not dropped here directly:
 * netdev_run_todo() does the unlocking on our behalf.
 */
void rtnl_unlock(void)
{
	netdev_run_todo();
}
EXPORT_SYMBOL(rtnl_unlock);
155
rtnl_trylock(void)156 int rtnl_trylock(void)
157 {
158 return mutex_trylock(&rtnl_mutex);
159 }
160 EXPORT_SYMBOL(rtnl_trylock);
161
rtnl_is_locked(void)162 int rtnl_is_locked(void)
163 {
164 return mutex_is_locked(&rtnl_mutex);
165 }
166 EXPORT_SYMBOL(rtnl_is_locked);
167
refcount_dec_and_rtnl_lock(refcount_t * r)168 bool refcount_dec_and_rtnl_lock(refcount_t *r)
169 {
170 return refcount_dec_and_mutex_lock(r, &rtnl_mutex);
171 }
172 EXPORT_SYMBOL(refcount_dec_and_rtnl_lock);
173
#ifdef CONFIG_PROVE_LOCKING
/* Lockdep query for the RTNL mutex; only built with CONFIG_PROVE_LOCKING. */
bool lockdep_rtnl_is_held(void)
{
	bool held = lockdep_is_held(&rtnl_mutex);

	return held;
}
EXPORT_SYMBOL(lockdep_rtnl_is_held);
#endif /* #ifdef CONFIG_PROVE_LOCKING */
181
182 static struct rtnl_link __rcu *__rcu *rtnl_msg_handlers[RTNL_FAMILY_MAX + 1];
183
rtm_msgindex(int msgtype)184 static inline int rtm_msgindex(int msgtype)
185 {
186 int msgindex = msgtype - RTM_BASE;
187
188 /*
189 * msgindex < 0 implies someone tried to register a netlink
190 * control code. msgindex >= RTM_NR_MSGTYPES may indicate that
191 * the message type has not been added to linux/rtnetlink.h
192 */
193 BUG_ON(msgindex < 0 || msgindex >= RTM_NR_MSGTYPES);
194
195 return msgindex;
196 }
197
rtnl_get_link(int protocol,int msgtype)198 static struct rtnl_link *rtnl_get_link(int protocol, int msgtype)
199 {
200 struct rtnl_link __rcu **tab;
201
202 if (protocol >= ARRAY_SIZE(rtnl_msg_handlers))
203 protocol = PF_UNSPEC;
204
205 tab = rcu_dereference_rtnl(rtnl_msg_handlers[protocol]);
206 if (!tab)
207 tab = rcu_dereference_rtnl(rtnl_msg_handlers[PF_UNSPEC]);
208
209 return rcu_dereference_rtnl(tab[msgtype]);
210 }
211
/* Install or update the handler entry for (@protocol, @msgtype).
 *
 * The family table is allocated on first use. An existing entry is never
 * modified in place: a copy is updated, published with rcu_assign_pointer()
 * and the old entry is released with kfree_rcu().
 *
 * Returns 0 on success or -ENOBUFS if an allocation fails.
 */
static int rtnl_register_internal(struct module *owner,
				  int protocol, int msgtype,
				  rtnl_doit_func doit, rtnl_dumpit_func dumpit,
				  unsigned int flags)
{
	struct rtnl_link __rcu **tab;
	struct rtnl_link *prev, *entry;
	int err = -ENOBUFS;
	int idx;

	BUG_ON(protocol < 0 || protocol > RTNL_FAMILY_MAX);
	idx = rtm_msgindex(msgtype);

	rtnl_lock();
	tab = rtnl_dereference(rtnl_msg_handlers[protocol]);
	if (!tab) {
		tab = kcalloc(RTM_NR_MSGTYPES, sizeof(void *), GFP_KERNEL);
		if (!tab)
			goto unlock;

		/* ensures we see the 0 stores */
		rcu_assign_pointer(rtnl_msg_handlers[protocol], tab);
	}

	/* Start from a copy of the current entry, or from a zeroed one. */
	prev = rtnl_dereference(tab[idx]);
	entry = prev ? kmemdup(prev, sizeof(*prev), GFP_KERNEL)
		     : kzalloc(sizeof(*entry), GFP_KERNEL);
	if (!entry)
		goto unlock;

	WARN_ON(entry->owner && entry->owner != owner);
	entry->owner = owner;

	/* A callback that is already set is only expected to be re-registered
	 * with the same function.
	 */
	WARN_ON(doit && entry->doit && entry->doit != doit);
	if (doit)
		entry->doit = doit;
	WARN_ON(dumpit && entry->dumpit && entry->dumpit != dumpit);
	if (dumpit)
		entry->dumpit = dumpit;

	WARN_ON(rtnl_msgtype_kind(msgtype) != RTNL_KIND_DEL &&
		(flags & RTNL_FLAG_BULK_DEL_SUPPORTED));
	entry->flags |= flags;

	/* publish protocol:msgtype */
	rcu_assign_pointer(tab[idx], entry);
	err = 0;
	if (prev)
		kfree_rcu(prev, rcu);
unlock:
	rtnl_unlock();
	return err;
}
270
271 /**
272 * rtnl_register_module - Register a rtnetlink message type
273 *
274 * @owner: module registering the hook (THIS_MODULE)
275 * @protocol: Protocol family or PF_UNSPEC
276 * @msgtype: rtnetlink message type
277 * @doit: Function pointer called for each request message
278 * @dumpit: Function pointer called for each dump request (NLM_F_DUMP) message
279 * @flags: rtnl_link_flags to modify behaviour of doit/dumpit functions
280 *
281 * Like rtnl_register, but for use by removable modules.
282 */
rtnl_register_module(struct module * owner,int protocol,int msgtype,rtnl_doit_func doit,rtnl_dumpit_func dumpit,unsigned int flags)283 int rtnl_register_module(struct module *owner,
284 int protocol, int msgtype,
285 rtnl_doit_func doit, rtnl_dumpit_func dumpit,
286 unsigned int flags)
287 {
288 return rtnl_register_internal(owner, protocol, msgtype,
289 doit, dumpit, flags);
290 }
291 EXPORT_SYMBOL_GPL(rtnl_register_module);
292
293 /**
294 * rtnl_register - Register a rtnetlink message type
295 * @protocol: Protocol family or PF_UNSPEC
296 * @msgtype: rtnetlink message type
297 * @doit: Function pointer called for each request message
298 * @dumpit: Function pointer called for each dump request (NLM_F_DUMP) message
299 * @flags: rtnl_link_flags to modify behaviour of doit/dumpit functions
300 *
301 * Registers the specified function pointers (at least one of them has
302 * to be non-NULL) to be called whenever a request message for the
303 * specified protocol family and message type is received.
304 *
305 * The special protocol family PF_UNSPEC may be used to define fallback
306 * function pointers for the case when no entry for the specific protocol
307 * family exists.
308 */
rtnl_register(int protocol,int msgtype,rtnl_doit_func doit,rtnl_dumpit_func dumpit,unsigned int flags)309 void rtnl_register(int protocol, int msgtype,
310 rtnl_doit_func doit, rtnl_dumpit_func dumpit,
311 unsigned int flags)
312 {
313 int err;
314
315 err = rtnl_register_internal(NULL, protocol, msgtype, doit, dumpit,
316 flags);
317 if (err)
318 pr_err("Unable to register rtnetlink message handler, "
319 "protocol = %d, message type = %d\n", protocol, msgtype);
320 }
321
322 /**
323 * rtnl_unregister - Unregister a rtnetlink message type
324 * @protocol: Protocol family or PF_UNSPEC
325 * @msgtype: rtnetlink message type
326 *
327 * Returns 0 on success or a negative error code.
328 */
rtnl_unregister(int protocol,int msgtype)329 int rtnl_unregister(int protocol, int msgtype)
330 {
331 struct rtnl_link __rcu **tab;
332 struct rtnl_link *link;
333 int msgindex;
334
335 BUG_ON(protocol < 0 || protocol > RTNL_FAMILY_MAX);
336 msgindex = rtm_msgindex(msgtype);
337
338 rtnl_lock();
339 tab = rtnl_dereference(rtnl_msg_handlers[protocol]);
340 if (!tab) {
341 rtnl_unlock();
342 return -ENOENT;
343 }
344
345 link = rcu_replace_pointer_rtnl(tab[msgindex], NULL);
346 rtnl_unlock();
347
348 kfree_rcu(link, rcu);
349
350 return 0;
351 }
352 EXPORT_SYMBOL_GPL(rtnl_unregister);
353
354 /**
355 * rtnl_unregister_all - Unregister all rtnetlink message type of a protocol
356 * @protocol : Protocol family or PF_UNSPEC
357 *
358 * Identical to calling rtnl_unregster() for all registered message types
359 * of a certain protocol family.
360 */
rtnl_unregister_all(int protocol)361 void rtnl_unregister_all(int protocol)
362 {
363 struct rtnl_link __rcu **tab;
364 struct rtnl_link *link;
365 int msgindex;
366
367 BUG_ON(protocol < 0 || protocol > RTNL_FAMILY_MAX);
368
369 rtnl_lock();
370 tab = rcu_replace_pointer_rtnl(rtnl_msg_handlers[protocol], NULL);
371 if (!tab) {
372 rtnl_unlock();
373 return;
374 }
375 for (msgindex = 0; msgindex < RTM_NR_MSGTYPES; msgindex++) {
376 link = rcu_replace_pointer_rtnl(tab[msgindex], NULL);
377 kfree_rcu(link, rcu);
378 }
379 rtnl_unlock();
380
381 synchronize_net();
382
383 kfree(tab);
384 }
385 EXPORT_SYMBOL_GPL(rtnl_unregister_all);
386
__rtnl_register_many(const struct rtnl_msg_handler * handlers,int n)387 int __rtnl_register_many(const struct rtnl_msg_handler *handlers, int n)
388 {
389 const struct rtnl_msg_handler *handler;
390 int i, err;
391
392 for (i = 0, handler = handlers; i < n; i++, handler++) {
393 err = rtnl_register_internal(handler->owner, handler->protocol,
394 handler->msgtype, handler->doit,
395 handler->dumpit, handler->flags);
396 if (err) {
397 __rtnl_unregister_many(handlers, i);
398 break;
399 }
400 }
401
402 return err;
403 }
404 EXPORT_SYMBOL_GPL(__rtnl_register_many);
405
__rtnl_unregister_many(const struct rtnl_msg_handler * handlers,int n)406 void __rtnl_unregister_many(const struct rtnl_msg_handler *handlers, int n)
407 {
408 const struct rtnl_msg_handler *handler;
409 int i;
410
411 for (i = n - 1, handler = handlers + n - 1; i >= 0; i--, handler--)
412 rtnl_unregister(handler->protocol, handler->msgtype);
413 }
414 EXPORT_SYMBOL_GPL(__rtnl_unregister_many);
415
416 static LIST_HEAD(link_ops);
417
rtnl_link_ops_get(const char * kind)418 static const struct rtnl_link_ops *rtnl_link_ops_get(const char *kind)
419 {
420 const struct rtnl_link_ops *ops;
421
422 list_for_each_entry(ops, &link_ops, list) {
423 if (!strcmp(ops->kind, kind))
424 return ops;
425 }
426 return NULL;
427 }
428
429 /**
430 * __rtnl_link_register - Register rtnl_link_ops with rtnetlink.
431 * @ops: struct rtnl_link_ops * to register
432 *
433 * The caller must hold the rtnl_mutex. This function should be used
434 * by drivers that create devices during module initialization. It
435 * must be called before registering the devices.
436 *
437 * Returns 0 on success or a negative error code.
438 */
__rtnl_link_register(struct rtnl_link_ops * ops)439 int __rtnl_link_register(struct rtnl_link_ops *ops)
440 {
441 if (rtnl_link_ops_get(ops->kind))
442 return -EEXIST;
443
444 /* The check for alloc/setup is here because if ops
445 * does not have that filled up, it is not possible
446 * to use the ops for creating device. So do not
447 * fill up dellink as well. That disables rtnl_dellink.
448 */
449 if ((ops->alloc || ops->setup) && !ops->dellink)
450 ops->dellink = unregister_netdevice_queue;
451
452 list_add_tail(&ops->list, &link_ops);
453 return 0;
454 }
455 EXPORT_SYMBOL_GPL(__rtnl_link_register);
456
457 /**
458 * rtnl_link_register - Register rtnl_link_ops with rtnetlink.
459 * @ops: struct rtnl_link_ops * to register
460 *
461 * Returns 0 on success or a negative error code.
462 */
rtnl_link_register(struct rtnl_link_ops * ops)463 int rtnl_link_register(struct rtnl_link_ops *ops)
464 {
465 int err;
466
467 /* Sanity-check max sizes to avoid stack buffer overflow. */
468 if (WARN_ON(ops->maxtype > RTNL_MAX_TYPE ||
469 ops->slave_maxtype > RTNL_SLAVE_MAX_TYPE))
470 return -EINVAL;
471
472 rtnl_lock();
473 err = __rtnl_link_register(ops);
474 rtnl_unlock();
475 return err;
476 }
477 EXPORT_SYMBOL_GPL(rtnl_link_register);
478
__rtnl_kill_links(struct net * net,struct rtnl_link_ops * ops)479 static void __rtnl_kill_links(struct net *net, struct rtnl_link_ops *ops)
480 {
481 struct net_device *dev;
482 LIST_HEAD(list_kill);
483
484 for_each_netdev(net, dev) {
485 if (dev->rtnl_link_ops == ops)
486 ops->dellink(dev, &list_kill);
487 }
488 unregister_netdevice_many(&list_kill);
489 }
490
491 /**
492 * __rtnl_link_unregister - Unregister rtnl_link_ops from rtnetlink.
493 * @ops: struct rtnl_link_ops * to unregister
494 *
495 * The caller must hold the rtnl_mutex and guarantee net_namespace_list
496 * integrity (hold pernet_ops_rwsem for writing to close the race
497 * with setup_net() and cleanup_net()).
498 */
__rtnl_link_unregister(struct rtnl_link_ops * ops)499 void __rtnl_link_unregister(struct rtnl_link_ops *ops)
500 {
501 struct net *net;
502
503 for_each_net(net) {
504 __rtnl_kill_links(net, ops);
505 }
506 list_del(&ops->list);
507 }
508 EXPORT_SYMBOL_GPL(__rtnl_link_unregister);
509
510 /* Return with the rtnl_lock held when there are no network
511 * devices unregistering in any network namespace.
512 */
rtnl_lock_unregistering_all(void)513 static void rtnl_lock_unregistering_all(void)
514 {
515 DEFINE_WAIT_FUNC(wait, woken_wake_function);
516
517 add_wait_queue(&netdev_unregistering_wq, &wait);
518 for (;;) {
519 rtnl_lock();
520 /* We held write locked pernet_ops_rwsem, and parallel
521 * setup_net() and cleanup_net() are not possible.
522 */
523 if (!atomic_read(&dev_unreg_count))
524 break;
525 __rtnl_unlock();
526
527 wait_woken(&wait, TASK_UNINTERRUPTIBLE, MAX_SCHEDULE_TIMEOUT);
528 }
529 remove_wait_queue(&netdev_unregistering_wq, &wait);
530 }
531
532 /**
533 * rtnl_link_unregister - Unregister rtnl_link_ops from rtnetlink.
534 * @ops: struct rtnl_link_ops * to unregister
535 */
rtnl_link_unregister(struct rtnl_link_ops * ops)536 void rtnl_link_unregister(struct rtnl_link_ops *ops)
537 {
538 /* Close the race with setup_net() and cleanup_net() */
539 down_write(&pernet_ops_rwsem);
540 rtnl_lock_unregistering_all();
541 __rtnl_link_unregister(ops);
542 rtnl_unlock();
543 up_write(&pernet_ops_rwsem);
544 }
545 EXPORT_SYMBOL_GPL(rtnl_link_unregister);
546
rtnl_link_get_slave_info_data_size(const struct net_device * dev)547 static size_t rtnl_link_get_slave_info_data_size(const struct net_device *dev)
548 {
549 struct net_device *master_dev;
550 const struct rtnl_link_ops *ops;
551 size_t size = 0;
552
553 rcu_read_lock();
554
555 master_dev = netdev_master_upper_dev_get_rcu((struct net_device *)dev);
556 if (!master_dev)
557 goto out;
558
559 ops = master_dev->rtnl_link_ops;
560 if (!ops || !ops->get_slave_size)
561 goto out;
562 /* IFLA_INFO_SLAVE_DATA + nested data */
563 size = nla_total_size(sizeof(struct nlattr)) +
564 ops->get_slave_size(master_dev, dev);
565
566 out:
567 rcu_read_unlock();
568 return size;
569 }
570
rtnl_link_get_size(const struct net_device * dev)571 static size_t rtnl_link_get_size(const struct net_device *dev)
572 {
573 const struct rtnl_link_ops *ops = dev->rtnl_link_ops;
574 size_t size;
575
576 if (!ops)
577 return 0;
578
579 size = nla_total_size(sizeof(struct nlattr)) + /* IFLA_LINKINFO */
580 nla_total_size(strlen(ops->kind) + 1); /* IFLA_INFO_KIND */
581
582 if (ops->get_size)
583 /* IFLA_INFO_DATA + nested data */
584 size += nla_total_size(sizeof(struct nlattr)) +
585 ops->get_size(dev);
586
587 if (ops->get_xstats_size)
588 /* IFLA_INFO_XSTATS */
589 size += nla_total_size(ops->get_xstats_size(dev));
590
591 size += rtnl_link_get_slave_info_data_size(dev);
592
593 return size;
594 }
595
596 static LIST_HEAD(rtnl_af_ops);
597
rtnl_af_lookup(const int family)598 static const struct rtnl_af_ops *rtnl_af_lookup(const int family)
599 {
600 const struct rtnl_af_ops *ops;
601
602 ASSERT_RTNL();
603
604 list_for_each_entry(ops, &rtnl_af_ops, list) {
605 if (ops->family == family)
606 return ops;
607 }
608
609 return NULL;
610 }
611
612 /**
613 * rtnl_af_register - Register rtnl_af_ops with rtnetlink.
614 * @ops: struct rtnl_af_ops * to register
615 *
616 * Returns 0 on success or a negative error code.
617 */
rtnl_af_register(struct rtnl_af_ops * ops)618 void rtnl_af_register(struct rtnl_af_ops *ops)
619 {
620 rtnl_lock();
621 list_add_tail_rcu(&ops->list, &rtnl_af_ops);
622 rtnl_unlock();
623 }
624 EXPORT_SYMBOL_GPL(rtnl_af_register);
625
626 /**
627 * rtnl_af_unregister - Unregister rtnl_af_ops from rtnetlink.
628 * @ops: struct rtnl_af_ops * to unregister
629 */
rtnl_af_unregister(struct rtnl_af_ops * ops)630 void rtnl_af_unregister(struct rtnl_af_ops *ops)
631 {
632 rtnl_lock();
633 list_del_rcu(&ops->list);
634 rtnl_unlock();
635
636 synchronize_rcu();
637 }
638 EXPORT_SYMBOL_GPL(rtnl_af_unregister);
639
rtnl_link_get_af_size(const struct net_device * dev,u32 ext_filter_mask)640 static size_t rtnl_link_get_af_size(const struct net_device *dev,
641 u32 ext_filter_mask)
642 {
643 struct rtnl_af_ops *af_ops;
644 size_t size;
645
646 /* IFLA_AF_SPEC */
647 size = nla_total_size(sizeof(struct nlattr));
648
649 rcu_read_lock();
650 list_for_each_entry_rcu(af_ops, &rtnl_af_ops, list) {
651 if (af_ops->get_link_af_size) {
652 /* AF_* + nested data */
653 size += nla_total_size(sizeof(struct nlattr)) +
654 af_ops->get_link_af_size(dev, ext_filter_mask);
655 }
656 }
657 rcu_read_unlock();
658
659 return size;
660 }
661
rtnl_have_link_slave_info(const struct net_device * dev)662 static bool rtnl_have_link_slave_info(const struct net_device *dev)
663 {
664 struct net_device *master_dev;
665 bool ret = false;
666
667 rcu_read_lock();
668
669 master_dev = netdev_master_upper_dev_get_rcu((struct net_device *)dev);
670 if (master_dev && master_dev->rtnl_link_ops)
671 ret = true;
672 rcu_read_unlock();
673 return ret;
674 }
675
rtnl_link_slave_info_fill(struct sk_buff * skb,const struct net_device * dev)676 static int rtnl_link_slave_info_fill(struct sk_buff *skb,
677 const struct net_device *dev)
678 {
679 struct net_device *master_dev;
680 const struct rtnl_link_ops *ops;
681 struct nlattr *slave_data;
682 int err;
683
684 master_dev = netdev_master_upper_dev_get((struct net_device *) dev);
685 if (!master_dev)
686 return 0;
687 ops = master_dev->rtnl_link_ops;
688 if (!ops)
689 return 0;
690 if (nla_put_string(skb, IFLA_INFO_SLAVE_KIND, ops->kind) < 0)
691 return -EMSGSIZE;
692 if (ops->fill_slave_info) {
693 slave_data = nla_nest_start_noflag(skb, IFLA_INFO_SLAVE_DATA);
694 if (!slave_data)
695 return -EMSGSIZE;
696 err = ops->fill_slave_info(skb, master_dev, dev);
697 if (err < 0)
698 goto err_cancel_slave_data;
699 nla_nest_end(skb, slave_data);
700 }
701 return 0;
702
703 err_cancel_slave_data:
704 nla_nest_cancel(skb, slave_data);
705 return err;
706 }
707
rtnl_link_info_fill(struct sk_buff * skb,const struct net_device * dev)708 static int rtnl_link_info_fill(struct sk_buff *skb,
709 const struct net_device *dev)
710 {
711 const struct rtnl_link_ops *ops = dev->rtnl_link_ops;
712 struct nlattr *data;
713 int err;
714
715 if (!ops)
716 return 0;
717 if (nla_put_string(skb, IFLA_INFO_KIND, ops->kind) < 0)
718 return -EMSGSIZE;
719 if (ops->fill_xstats) {
720 err = ops->fill_xstats(skb, dev);
721 if (err < 0)
722 return err;
723 }
724 if (ops->fill_info) {
725 data = nla_nest_start_noflag(skb, IFLA_INFO_DATA);
726 if (data == NULL)
727 return -EMSGSIZE;
728 err = ops->fill_info(skb, dev);
729 if (err < 0)
730 goto err_cancel_data;
731 nla_nest_end(skb, data);
732 }
733 return 0;
734
735 err_cancel_data:
736 nla_nest_cancel(skb, data);
737 return err;
738 }
739
rtnl_link_fill(struct sk_buff * skb,const struct net_device * dev)740 static int rtnl_link_fill(struct sk_buff *skb, const struct net_device *dev)
741 {
742 struct nlattr *linkinfo;
743 int err = -EMSGSIZE;
744
745 linkinfo = nla_nest_start_noflag(skb, IFLA_LINKINFO);
746 if (linkinfo == NULL)
747 goto out;
748
749 err = rtnl_link_info_fill(skb, dev);
750 if (err < 0)
751 goto err_cancel_link;
752
753 err = rtnl_link_slave_info_fill(skb, dev);
754 if (err < 0)
755 goto err_cancel_link;
756
757 nla_nest_end(skb, linkinfo);
758 return 0;
759
760 err_cancel_link:
761 nla_nest_cancel(skb, linkinfo);
762 out:
763 return err;
764 }
765
/* Pass @skb to nlmsg_notify() on the rtnetlink socket of @net, using
 * GFP_KERNEL; the helper's return value is passed back.
 */
int rtnetlink_send(struct sk_buff *skb, struct net *net, u32 pid, unsigned int group, int echo)
{
	return nlmsg_notify(net->rtnl, skb, pid, group, echo, GFP_KERNEL);
}
772
/* Pass @skb to nlmsg_unicast() for @pid on the rtnetlink socket of @net;
 * the helper's return value is passed back.
 */
int rtnl_unicast(struct sk_buff *skb, struct net *net, u32 pid)
{
	return nlmsg_unicast(net->rtnl, skb, pid);
}
EXPORT_SYMBOL(rtnl_unicast);
780
/* Pass @skb to nlmsg_notify() for @group on the rtnetlink socket of @net.
 * The report argument is taken from nlmsg_report(@nlh). The result of
 * nlmsg_notify() is not propagated.
 */
void rtnl_notify(struct sk_buff *skb, struct net *net, u32 pid, u32 group,
		 const struct nlmsghdr *nlh, gfp_t flags)
{
	int report = nlmsg_report(nlh);

	nlmsg_notify(net->rtnl, skb, pid, group, report, flags);
}
EXPORT_SYMBOL(rtnl_notify);
789
rtnl_set_sk_err(struct net * net,u32 group,int error)790 void rtnl_set_sk_err(struct net *net, u32 group, int error)
791 {
792 struct sock *rtnl = net->rtnl;
793
794 netlink_set_err(rtnl, 0, group, error);
795 }
796 EXPORT_SYMBOL(rtnl_set_sk_err);
797
/* Dump the non-zero entries of @metrics into an RTA_METRICS nest.
 *
 * metrics[i] is emitted as attribute type i + 1. RTAX_CC_ALGO is emitted as
 * the name string looked up from its key, RTAX_FEATURES is masked with
 * RTAX_FEATURE_MASK first, and everything else is emitted as a plain u32.
 *
 * Returns 0 if nothing was emitted (default metrics, or no valid entry, in
 * which case the nest is cancelled), the result of nla_nest_end() on
 * success, -ENOBUFS if the nest cannot be started, or -EMSGSIZE if an
 * attribute does not fit.
 */
int rtnetlink_put_metrics(struct sk_buff *skb, u32 *metrics)
{
	struct nlattr *nest;
	int emitted = 0;
	int i;

	/* nothing is dumped for dst_default_metrics, so just skip the loop */
	if (metrics == dst_default_metrics.metrics)
		return 0;

	nest = nla_nest_start_noflag(skb, RTA_METRICS);
	if (!nest)
		return -ENOBUFS;

	for (i = 0; i < RTAX_MAX; i++) {
		u32 val = metrics[i];
		int type = i + 1;

		if (!val)
			continue;

		switch (type) {
		case RTAX_CC_ALGO: {
			char tmp[TCP_CA_NAME_MAX], *name;

			name = tcp_ca_get_name_by_key(val, tmp);
			/* Entries whose key has no name are skipped. */
			if (!name)
				continue;
			if (nla_put_string(skb, type, name))
				goto nla_put_failure;
			break;
		}
		case RTAX_FEATURES: {
			u32 user_features = val & RTAX_FEATURE_MASK;

			if (!user_features)
				continue;
			BUILD_BUG_ON(RTAX_FEATURE_MASK & DST_FEATURE_MASK);
			if (nla_put_u32(skb, type, user_features))
				goto nla_put_failure;
			break;
		}
		default:
			if (nla_put_u32(skb, type, val))
				goto nla_put_failure;
			break;
		}

		emitted++;
	}

	if (!emitted) {
		nla_nest_cancel(skb, nest);
		return 0;
	}

	return nla_nest_end(skb, nest);

nla_put_failure:
	nla_nest_cancel(skb, nest);
	return -EMSGSIZE;
}
EXPORT_SYMBOL(rtnetlink_put_metrics);
849
rtnl_put_cacheinfo(struct sk_buff * skb,struct dst_entry * dst,u32 id,long expires,u32 error)850 int rtnl_put_cacheinfo(struct sk_buff *skb, struct dst_entry *dst, u32 id,
851 long expires, u32 error)
852 {
853 struct rta_cacheinfo ci = {
854 .rta_error = error,
855 .rta_id = id,
856 };
857
858 if (dst) {
859 ci.rta_lastuse = jiffies_delta_to_clock_t(jiffies - dst->lastuse);
860 ci.rta_used = dst->__use;
861 ci.rta_clntref = rcuref_read(&dst->__rcuref);
862 }
863 if (expires) {
864 unsigned long clock;
865
866 clock = jiffies_to_clock_t(abs(expires));
867 clock = min_t(unsigned long, clock, INT_MAX);
868 ci.rta_expires = (expires > 0) ? clock : -clock;
869 }
870 return nla_put(skb, RTA_CACHEINFO, sizeof(ci), &ci);
871 }
872 EXPORT_SYMBOL_GPL(rtnl_put_cacheinfo);
873
netdev_set_operstate(struct net_device * dev,int newstate)874 void netdev_set_operstate(struct net_device *dev, int newstate)
875 {
876 unsigned int old = READ_ONCE(dev->operstate);
877
878 do {
879 if (old == newstate)
880 return;
881 } while (!try_cmpxchg(&dev->operstate, &old, newstate));
882
883 netdev_state_change(dev);
884 }
885 EXPORT_SYMBOL(netdev_set_operstate);
886
set_operstate(struct net_device * dev,unsigned char transition)887 static void set_operstate(struct net_device *dev, unsigned char transition)
888 {
889 unsigned char operstate = READ_ONCE(dev->operstate);
890
891 switch (transition) {
892 case IF_OPER_UP:
893 if ((operstate == IF_OPER_DORMANT ||
894 operstate == IF_OPER_TESTING ||
895 operstate == IF_OPER_UNKNOWN) &&
896 !netif_dormant(dev) && !netif_testing(dev))
897 operstate = IF_OPER_UP;
898 break;
899
900 case IF_OPER_TESTING:
901 if (netif_oper_up(dev))
902 operstate = IF_OPER_TESTING;
903 break;
904
905 case IF_OPER_DORMANT:
906 if (netif_oper_up(dev))
907 operstate = IF_OPER_DORMANT;
908 break;
909 }
910
911 netdev_set_operstate(dev, operstate);
912 }
913
rtnl_dev_get_flags(const struct net_device * dev)914 static unsigned int rtnl_dev_get_flags(const struct net_device *dev)
915 {
916 return (dev->flags & ~(IFF_PROMISC | IFF_ALLMULTI)) |
917 (dev->gflags & (IFF_PROMISC | IFF_ALLMULTI));
918 }
919
rtnl_dev_combine_flags(const struct net_device * dev,const struct ifinfomsg * ifm)920 static unsigned int rtnl_dev_combine_flags(const struct net_device *dev,
921 const struct ifinfomsg *ifm)
922 {
923 unsigned int flags = ifm->ifi_flags;
924
925 /* bugwards compatibility: ifi_change == 0 is treated as ~0 */
926 if (ifm->ifi_change)
927 flags = (flags & ifm->ifi_change) |
928 (rtnl_dev_get_flags(dev) & ~ifm->ifi_change);
929
930 return flags;
931 }
932
copy_rtnl_link_stats(struct rtnl_link_stats * a,const struct rtnl_link_stats64 * b)933 static void copy_rtnl_link_stats(struct rtnl_link_stats *a,
934 const struct rtnl_link_stats64 *b)
935 {
936 a->rx_packets = b->rx_packets;
937 a->tx_packets = b->tx_packets;
938 a->rx_bytes = b->rx_bytes;
939 a->tx_bytes = b->tx_bytes;
940 a->rx_errors = b->rx_errors;
941 a->tx_errors = b->tx_errors;
942 a->rx_dropped = b->rx_dropped;
943 a->tx_dropped = b->tx_dropped;
944
945 a->multicast = b->multicast;
946 a->collisions = b->collisions;
947
948 a->rx_length_errors = b->rx_length_errors;
949 a->rx_over_errors = b->rx_over_errors;
950 a->rx_crc_errors = b->rx_crc_errors;
951 a->rx_frame_errors = b->rx_frame_errors;
952 a->rx_fifo_errors = b->rx_fifo_errors;
953 a->rx_missed_errors = b->rx_missed_errors;
954
955 a->tx_aborted_errors = b->tx_aborted_errors;
956 a->tx_carrier_errors = b->tx_carrier_errors;
957 a->tx_fifo_errors = b->tx_fifo_errors;
958 a->tx_heartbeat_errors = b->tx_heartbeat_errors;
959 a->tx_window_errors = b->tx_window_errors;
960
961 a->rx_compressed = b->rx_compressed;
962 a->tx_compressed = b->tx_compressed;
963
964 a->rx_nohandler = b->rx_nohandler;
965 }
966
967 /* All VF info */
rtnl_vfinfo_size(const struct net_device * dev,u32 ext_filter_mask)968 static inline int rtnl_vfinfo_size(const struct net_device *dev,
969 u32 ext_filter_mask)
970 {
971 if (dev->dev.parent && (ext_filter_mask & RTEXT_FILTER_VF)) {
972 int num_vfs = dev_num_vf(dev->dev.parent);
973 size_t size = nla_total_size(0);
974 size += num_vfs *
975 (nla_total_size(0) +
976 nla_total_size(sizeof(struct ifla_vf_mac)) +
977 nla_total_size(sizeof(struct ifla_vf_broadcast)) +
978 nla_total_size(sizeof(struct ifla_vf_vlan)) +
979 nla_total_size(0) + /* nest IFLA_VF_VLAN_LIST */
980 nla_total_size(MAX_VLAN_LIST_LEN *
981 sizeof(struct ifla_vf_vlan_info)) +
982 nla_total_size(sizeof(struct ifla_vf_spoofchk)) +
983 nla_total_size(sizeof(struct ifla_vf_tx_rate)) +
984 nla_total_size(sizeof(struct ifla_vf_rate)) +
985 nla_total_size(sizeof(struct ifla_vf_link_state)) +
986 nla_total_size(sizeof(struct ifla_vf_rss_query_en)) +
987 nla_total_size(sizeof(struct ifla_vf_trust)));
988 if (~ext_filter_mask & RTEXT_FILTER_SKIP_STATS) {
989 size += num_vfs *
990 (nla_total_size(0) + /* nest IFLA_VF_STATS */
991 /* IFLA_VF_STATS_RX_PACKETS */
992 nla_total_size_64bit(sizeof(__u64)) +
993 /* IFLA_VF_STATS_TX_PACKETS */
994 nla_total_size_64bit(sizeof(__u64)) +
995 /* IFLA_VF_STATS_RX_BYTES */
996 nla_total_size_64bit(sizeof(__u64)) +
997 /* IFLA_VF_STATS_TX_BYTES */
998 nla_total_size_64bit(sizeof(__u64)) +
999 /* IFLA_VF_STATS_BROADCAST */
1000 nla_total_size_64bit(sizeof(__u64)) +
1001 /* IFLA_VF_STATS_MULTICAST */
1002 nla_total_size_64bit(sizeof(__u64)) +
1003 /* IFLA_VF_STATS_RX_DROPPED */
1004 nla_total_size_64bit(sizeof(__u64)) +
1005 /* IFLA_VF_STATS_TX_DROPPED */
1006 nla_total_size_64bit(sizeof(__u64)));
1007 }
1008 if (dev->netdev_ops->ndo_get_vf_guid)
1009 size += num_vfs * 2 *
1010 nla_total_size(sizeof(struct ifla_vf_guid));
1011 return size;
1012 } else
1013 return 0;
1014 }
1015
rtnl_port_size(const struct net_device * dev,u32 ext_filter_mask)1016 static size_t rtnl_port_size(const struct net_device *dev,
1017 u32 ext_filter_mask)
1018 {
1019 size_t port_size = nla_total_size(4) /* PORT_VF */
1020 + nla_total_size(PORT_PROFILE_MAX) /* PORT_PROFILE */
1021 + nla_total_size(PORT_UUID_MAX) /* PORT_INSTANCE_UUID */
1022 + nla_total_size(PORT_UUID_MAX) /* PORT_HOST_UUID */
1023 + nla_total_size(1) /* PROT_VDP_REQUEST */
1024 + nla_total_size(2); /* PORT_VDP_RESPONSE */
1025 size_t vf_ports_size = nla_total_size(sizeof(struct nlattr));
1026 size_t vf_port_size = nla_total_size(sizeof(struct nlattr))
1027 + port_size;
1028 size_t port_self_size = nla_total_size(sizeof(struct nlattr))
1029 + port_size;
1030
1031 if (!dev->netdev_ops->ndo_get_vf_port || !dev->dev.parent ||
1032 !(ext_filter_mask & RTEXT_FILTER_VF))
1033 return 0;
1034 if (dev_num_vf(dev->dev.parent))
1035 return port_self_size + vf_ports_size +
1036 vf_port_size * dev_num_vf(dev->dev.parent);
1037 else
1038 return port_self_size;
1039 }
1040
rtnl_xdp_size(void)1041 static size_t rtnl_xdp_size(void)
1042 {
1043 size_t xdp_size = nla_total_size(0) + /* nest IFLA_XDP */
1044 nla_total_size(1) + /* XDP_ATTACHED */
1045 nla_total_size(4) + /* XDP_PROG_ID (or 1st mode) */
1046 nla_total_size(4); /* XDP_<mode>_PROG_ID */
1047
1048 return xdp_size;
1049 }
1050
rtnl_prop_list_size(const struct net_device * dev)1051 static size_t rtnl_prop_list_size(const struct net_device *dev)
1052 {
1053 struct netdev_name_node *name_node;
1054 unsigned int cnt = 0;
1055
1056 rcu_read_lock();
1057 list_for_each_entry_rcu(name_node, &dev->name_node->list, list)
1058 cnt++;
1059 rcu_read_unlock();
1060
1061 if (!cnt)
1062 return 0;
1063
1064 return nla_total_size(0) + cnt * nla_total_size(ALTIFNAMSIZ);
1065 }
1066
rtnl_proto_down_size(const struct net_device * dev)1067 static size_t rtnl_proto_down_size(const struct net_device *dev)
1068 {
1069 size_t size = nla_total_size(1);
1070
1071 /* Assume dev->proto_down_reason is not zero. */
1072 size += nla_total_size(0) + nla_total_size(4);
1073
1074 return size;
1075 }
1076
rtnl_devlink_port_size(const struct net_device * dev)1077 static size_t rtnl_devlink_port_size(const struct net_device *dev)
1078 {
1079 size_t size = nla_total_size(0); /* nest IFLA_DEVLINK_PORT */
1080
1081 if (dev->devlink_port)
1082 size += devlink_nl_port_handle_size(dev->devlink_port);
1083
1084 return size;
1085 }
1086
rtnl_dpll_pin_size(const struct net_device * dev)1087 static size_t rtnl_dpll_pin_size(const struct net_device *dev)
1088 {
1089 size_t size = nla_total_size(0); /* nest IFLA_DPLL_PIN */
1090
1091 size += dpll_netdev_pin_handle_size(dev);
1092
1093 return size;
1094 }
1095
if_nlmsg_size(const struct net_device * dev,u32 ext_filter_mask)1096 static noinline size_t if_nlmsg_size(const struct net_device *dev,
1097 u32 ext_filter_mask)
1098 {
1099 return NLMSG_ALIGN(sizeof(struct ifinfomsg))
1100 + nla_total_size(IFNAMSIZ) /* IFLA_IFNAME */
1101 + nla_total_size(IFALIASZ) /* IFLA_IFALIAS */
1102 + nla_total_size(IFNAMSIZ) /* IFLA_QDISC */
1103 + nla_total_size_64bit(sizeof(struct rtnl_link_ifmap))
1104 + nla_total_size(sizeof(struct rtnl_link_stats))
1105 + nla_total_size_64bit(sizeof(struct rtnl_link_stats64))
1106 + nla_total_size(MAX_ADDR_LEN) /* IFLA_ADDRESS */
1107 + nla_total_size(MAX_ADDR_LEN) /* IFLA_BROADCAST */
1108 + nla_total_size(4) /* IFLA_TXQLEN */
1109 + nla_total_size(4) /* IFLA_WEIGHT */
1110 + nla_total_size(4) /* IFLA_MTU */
1111 + nla_total_size(4) /* IFLA_LINK */
1112 + nla_total_size(4) /* IFLA_MASTER */
1113 + nla_total_size(1) /* IFLA_CARRIER */
1114 + nla_total_size(4) /* IFLA_PROMISCUITY */
1115 + nla_total_size(4) /* IFLA_ALLMULTI */
1116 + nla_total_size(4) /* IFLA_NUM_TX_QUEUES */
1117 + nla_total_size(4) /* IFLA_NUM_RX_QUEUES */
1118 + nla_total_size(4) /* IFLA_GSO_MAX_SEGS */
1119 + nla_total_size(4) /* IFLA_GSO_MAX_SIZE */
1120 + nla_total_size(4) /* IFLA_GRO_MAX_SIZE */
1121 + nla_total_size(4) /* IFLA_GSO_IPV4_MAX_SIZE */
1122 + nla_total_size(4) /* IFLA_GRO_IPV4_MAX_SIZE */
1123 + nla_total_size(4) /* IFLA_TSO_MAX_SIZE */
1124 + nla_total_size(4) /* IFLA_TSO_MAX_SEGS */
1125 + nla_total_size(1) /* IFLA_OPERSTATE */
1126 + nla_total_size(1) /* IFLA_LINKMODE */
1127 + nla_total_size(4) /* IFLA_CARRIER_CHANGES */
1128 + nla_total_size(4) /* IFLA_LINK_NETNSID */
1129 + nla_total_size(4) /* IFLA_GROUP */
1130 + nla_total_size(ext_filter_mask
1131 & RTEXT_FILTER_VF ? 4 : 0) /* IFLA_NUM_VF */
1132 + rtnl_vfinfo_size(dev, ext_filter_mask) /* IFLA_VFINFO_LIST */
1133 + rtnl_port_size(dev, ext_filter_mask) /* IFLA_VF_PORTS + IFLA_PORT_SELF */
1134 + rtnl_link_get_size(dev) /* IFLA_LINKINFO */
1135 + rtnl_link_get_af_size(dev, ext_filter_mask) /* IFLA_AF_SPEC */
1136 + nla_total_size(MAX_PHYS_ITEM_ID_LEN) /* IFLA_PHYS_PORT_ID */
1137 + nla_total_size(MAX_PHYS_ITEM_ID_LEN) /* IFLA_PHYS_SWITCH_ID */
1138 + nla_total_size(IFNAMSIZ) /* IFLA_PHYS_PORT_NAME */
1139 + rtnl_xdp_size() /* IFLA_XDP */
1140 + nla_total_size(4) /* IFLA_EVENT */
1141 + nla_total_size(4) /* IFLA_NEW_NETNSID */
1142 + nla_total_size(4) /* IFLA_NEW_IFINDEX */
1143 + rtnl_proto_down_size(dev) /* proto down */
1144 + nla_total_size(4) /* IFLA_TARGET_NETNSID */
1145 + nla_total_size(4) /* IFLA_CARRIER_UP_COUNT */
1146 + nla_total_size(4) /* IFLA_CARRIER_DOWN_COUNT */
1147 + nla_total_size(4) /* IFLA_MIN_MTU */
1148 + nla_total_size(4) /* IFLA_MAX_MTU */
1149 + rtnl_prop_list_size(dev)
1150 + nla_total_size(MAX_ADDR_LEN) /* IFLA_PERM_ADDRESS */
1151 + rtnl_devlink_port_size(dev)
1152 + rtnl_dpll_pin_size(dev)
1153 + 0;
1154 }
1155
rtnl_vf_ports_fill(struct sk_buff * skb,struct net_device * dev)1156 static int rtnl_vf_ports_fill(struct sk_buff *skb, struct net_device *dev)
1157 {
1158 struct nlattr *vf_ports;
1159 struct nlattr *vf_port;
1160 int vf;
1161 int err;
1162
1163 vf_ports = nla_nest_start_noflag(skb, IFLA_VF_PORTS);
1164 if (!vf_ports)
1165 return -EMSGSIZE;
1166
1167 for (vf = 0; vf < dev_num_vf(dev->dev.parent); vf++) {
1168 vf_port = nla_nest_start_noflag(skb, IFLA_VF_PORT);
1169 if (!vf_port)
1170 goto nla_put_failure;
1171 if (nla_put_u32(skb, IFLA_PORT_VF, vf))
1172 goto nla_put_failure;
1173 err = dev->netdev_ops->ndo_get_vf_port(dev, vf, skb);
1174 if (err == -EMSGSIZE)
1175 goto nla_put_failure;
1176 if (err) {
1177 nla_nest_cancel(skb, vf_port);
1178 continue;
1179 }
1180 nla_nest_end(skb, vf_port);
1181 }
1182
1183 nla_nest_end(skb, vf_ports);
1184
1185 return 0;
1186
1187 nla_put_failure:
1188 nla_nest_cancel(skb, vf_ports);
1189 return -EMSGSIZE;
1190 }
1191
rtnl_port_self_fill(struct sk_buff * skb,struct net_device * dev)1192 static int rtnl_port_self_fill(struct sk_buff *skb, struct net_device *dev)
1193 {
1194 struct nlattr *port_self;
1195 int err;
1196
1197 port_self = nla_nest_start_noflag(skb, IFLA_PORT_SELF);
1198 if (!port_self)
1199 return -EMSGSIZE;
1200
1201 err = dev->netdev_ops->ndo_get_vf_port(dev, PORT_SELF_VF, skb);
1202 if (err) {
1203 nla_nest_cancel(skb, port_self);
1204 return (err == -EMSGSIZE) ? err : 0;
1205 }
1206
1207 nla_nest_end(skb, port_self);
1208
1209 return 0;
1210 }
1211
/*
 * Emit the port attributes of @dev: IFLA_PORT_SELF, followed by
 * IFLA_VF_PORTS when the parent device reports at least one VF.
 *
 * Nothing is emitted (and 0 is returned) unless the driver implements
 * ndo_get_vf_port, the device has a parent and RTEXT_FILTER_VF is set in
 * @ext_filter_mask. Otherwise returns the first helper error, or 0.
 */
static int rtnl_port_fill(struct sk_buff *skb, struct net_device *dev,
			  u32 ext_filter_mask)
{
	int rc;

	if (!dev->netdev_ops->ndo_get_vf_port || !dev->dev.parent ||
	    !(ext_filter_mask & RTEXT_FILTER_VF))
		return 0;

	rc = rtnl_port_self_fill(skb, dev);
	if (rc)
		return rc;

	if (!dev_num_vf(dev->dev.parent))
		return 0;

	return rtnl_vf_ports_fill(skb, dev);
}
1233
rtnl_phys_port_id_fill(struct sk_buff * skb,struct net_device * dev)1234 static int rtnl_phys_port_id_fill(struct sk_buff *skb, struct net_device *dev)
1235 {
1236 int err;
1237 struct netdev_phys_item_id ppid;
1238
1239 err = dev_get_phys_port_id(dev, &ppid);
1240 if (err) {
1241 if (err == -EOPNOTSUPP)
1242 return 0;
1243 return err;
1244 }
1245
1246 if (nla_put(skb, IFLA_PHYS_PORT_ID, ppid.id_len, ppid.id))
1247 return -EMSGSIZE;
1248
1249 return 0;
1250 }
1251
rtnl_phys_port_name_fill(struct sk_buff * skb,struct net_device * dev)1252 static int rtnl_phys_port_name_fill(struct sk_buff *skb, struct net_device *dev)
1253 {
1254 char name[IFNAMSIZ];
1255 int err;
1256
1257 err = dev_get_phys_port_name(dev, name, sizeof(name));
1258 if (err) {
1259 if (err == -EOPNOTSUPP)
1260 return 0;
1261 return err;
1262 }
1263
1264 if (nla_put_string(skb, IFLA_PHYS_PORT_NAME, name))
1265 return -EMSGSIZE;
1266
1267 return 0;
1268 }
1269
rtnl_phys_switch_id_fill(struct sk_buff * skb,struct net_device * dev)1270 static int rtnl_phys_switch_id_fill(struct sk_buff *skb, struct net_device *dev)
1271 {
1272 struct netdev_phys_item_id ppid = { };
1273 int err;
1274
1275 err = dev_get_port_parent_id(dev, &ppid, false);
1276 if (err) {
1277 if (err == -EOPNOTSUPP)
1278 return 0;
1279 return err;
1280 }
1281
1282 if (nla_put(skb, IFLA_PHYS_SWITCH_ID, ppid.id_len, ppid.id))
1283 return -EMSGSIZE;
1284
1285 return 0;
1286 }
1287
rtnl_fill_stats(struct sk_buff * skb,struct net_device * dev)1288 static noinline_for_stack int rtnl_fill_stats(struct sk_buff *skb,
1289 struct net_device *dev)
1290 {
1291 struct rtnl_link_stats64 *sp;
1292 struct nlattr *attr;
1293
1294 attr = nla_reserve_64bit(skb, IFLA_STATS64,
1295 sizeof(struct rtnl_link_stats64), IFLA_PAD);
1296 if (!attr)
1297 return -EMSGSIZE;
1298
1299 sp = nla_data(attr);
1300 dev_get_stats(dev, sp);
1301
1302 attr = nla_reserve(skb, IFLA_STATS,
1303 sizeof(struct rtnl_link_stats));
1304 if (!attr)
1305 return -EMSGSIZE;
1306
1307 copy_rtnl_link_stats(nla_data(attr), sp);
1308
1309 return 0;
1310 }
1311
rtnl_fill_vfinfo(struct sk_buff * skb,struct net_device * dev,int vfs_num,u32 ext_filter_mask)1312 static noinline_for_stack int rtnl_fill_vfinfo(struct sk_buff *skb,
1313 struct net_device *dev,
1314 int vfs_num,
1315 u32 ext_filter_mask)
1316 {
1317 struct ifla_vf_rss_query_en vf_rss_query_en;
1318 struct nlattr *vf, *vfstats, *vfvlanlist;
1319 struct ifla_vf_link_state vf_linkstate;
1320 struct ifla_vf_vlan_info vf_vlan_info;
1321 struct ifla_vf_spoofchk vf_spoofchk;
1322 struct ifla_vf_tx_rate vf_tx_rate;
1323 struct ifla_vf_stats vf_stats;
1324 struct ifla_vf_trust vf_trust;
1325 struct ifla_vf_vlan vf_vlan;
1326 struct ifla_vf_rate vf_rate;
1327 struct ifla_vf_mac vf_mac;
1328 struct ifla_vf_broadcast vf_broadcast;
1329 struct ifla_vf_info ivi;
1330 struct ifla_vf_guid node_guid;
1331 struct ifla_vf_guid port_guid;
1332
1333 memset(&ivi, 0, sizeof(ivi));
1334
1335 /* Not all SR-IOV capable drivers support the
1336 * spoofcheck and "RSS query enable" query. Preset to
1337 * -1 so the user space tool can detect that the driver
1338 * didn't report anything.
1339 */
1340 ivi.spoofchk = -1;
1341 ivi.rss_query_en = -1;
1342 ivi.trusted = -1;
1343 /* The default value for VF link state is "auto"
1344 * IFLA_VF_LINK_STATE_AUTO which equals zero
1345 */
1346 ivi.linkstate = 0;
1347 /* VLAN Protocol by default is 802.1Q */
1348 ivi.vlan_proto = htons(ETH_P_8021Q);
1349 if (dev->netdev_ops->ndo_get_vf_config(dev, vfs_num, &ivi))
1350 return 0;
1351
1352 memset(&vf_vlan_info, 0, sizeof(vf_vlan_info));
1353 memset(&node_guid, 0, sizeof(node_guid));
1354 memset(&port_guid, 0, sizeof(port_guid));
1355
1356 vf_mac.vf =
1357 vf_vlan.vf =
1358 vf_vlan_info.vf =
1359 vf_rate.vf =
1360 vf_tx_rate.vf =
1361 vf_spoofchk.vf =
1362 vf_linkstate.vf =
1363 vf_rss_query_en.vf =
1364 vf_trust.vf =
1365 node_guid.vf =
1366 port_guid.vf = ivi.vf;
1367
1368 memcpy(vf_mac.mac, ivi.mac, sizeof(ivi.mac));
1369 memcpy(vf_broadcast.broadcast, dev->broadcast, dev->addr_len);
1370 vf_vlan.vlan = ivi.vlan;
1371 vf_vlan.qos = ivi.qos;
1372 vf_vlan_info.vlan = ivi.vlan;
1373 vf_vlan_info.qos = ivi.qos;
1374 vf_vlan_info.vlan_proto = ivi.vlan_proto;
1375 vf_tx_rate.rate = ivi.max_tx_rate;
1376 vf_rate.min_tx_rate = ivi.min_tx_rate;
1377 vf_rate.max_tx_rate = ivi.max_tx_rate;
1378 vf_spoofchk.setting = ivi.spoofchk;
1379 vf_linkstate.link_state = ivi.linkstate;
1380 vf_rss_query_en.setting = ivi.rss_query_en;
1381 vf_trust.setting = ivi.trusted;
1382 vf = nla_nest_start_noflag(skb, IFLA_VF_INFO);
1383 if (!vf)
1384 return -EMSGSIZE;
1385 if (nla_put(skb, IFLA_VF_MAC, sizeof(vf_mac), &vf_mac) ||
1386 nla_put(skb, IFLA_VF_BROADCAST, sizeof(vf_broadcast), &vf_broadcast) ||
1387 nla_put(skb, IFLA_VF_VLAN, sizeof(vf_vlan), &vf_vlan) ||
1388 nla_put(skb, IFLA_VF_RATE, sizeof(vf_rate),
1389 &vf_rate) ||
1390 nla_put(skb, IFLA_VF_TX_RATE, sizeof(vf_tx_rate),
1391 &vf_tx_rate) ||
1392 nla_put(skb, IFLA_VF_SPOOFCHK, sizeof(vf_spoofchk),
1393 &vf_spoofchk) ||
1394 nla_put(skb, IFLA_VF_LINK_STATE, sizeof(vf_linkstate),
1395 &vf_linkstate) ||
1396 nla_put(skb, IFLA_VF_RSS_QUERY_EN,
1397 sizeof(vf_rss_query_en),
1398 &vf_rss_query_en) ||
1399 nla_put(skb, IFLA_VF_TRUST,
1400 sizeof(vf_trust), &vf_trust))
1401 goto nla_put_vf_failure;
1402
1403 if (dev->netdev_ops->ndo_get_vf_guid &&
1404 !dev->netdev_ops->ndo_get_vf_guid(dev, vfs_num, &node_guid,
1405 &port_guid)) {
1406 if (nla_put(skb, IFLA_VF_IB_NODE_GUID, sizeof(node_guid),
1407 &node_guid) ||
1408 nla_put(skb, IFLA_VF_IB_PORT_GUID, sizeof(port_guid),
1409 &port_guid))
1410 goto nla_put_vf_failure;
1411 }
1412 vfvlanlist = nla_nest_start_noflag(skb, IFLA_VF_VLAN_LIST);
1413 if (!vfvlanlist)
1414 goto nla_put_vf_failure;
1415 if (nla_put(skb, IFLA_VF_VLAN_INFO, sizeof(vf_vlan_info),
1416 &vf_vlan_info)) {
1417 nla_nest_cancel(skb, vfvlanlist);
1418 goto nla_put_vf_failure;
1419 }
1420 nla_nest_end(skb, vfvlanlist);
1421 if (~ext_filter_mask & RTEXT_FILTER_SKIP_STATS) {
1422 memset(&vf_stats, 0, sizeof(vf_stats));
1423 if (dev->netdev_ops->ndo_get_vf_stats)
1424 dev->netdev_ops->ndo_get_vf_stats(dev, vfs_num,
1425 &vf_stats);
1426 vfstats = nla_nest_start_noflag(skb, IFLA_VF_STATS);
1427 if (!vfstats)
1428 goto nla_put_vf_failure;
1429 if (nla_put_u64_64bit(skb, IFLA_VF_STATS_RX_PACKETS,
1430 vf_stats.rx_packets, IFLA_VF_STATS_PAD) ||
1431 nla_put_u64_64bit(skb, IFLA_VF_STATS_TX_PACKETS,
1432 vf_stats.tx_packets, IFLA_VF_STATS_PAD) ||
1433 nla_put_u64_64bit(skb, IFLA_VF_STATS_RX_BYTES,
1434 vf_stats.rx_bytes, IFLA_VF_STATS_PAD) ||
1435 nla_put_u64_64bit(skb, IFLA_VF_STATS_TX_BYTES,
1436 vf_stats.tx_bytes, IFLA_VF_STATS_PAD) ||
1437 nla_put_u64_64bit(skb, IFLA_VF_STATS_BROADCAST,
1438 vf_stats.broadcast, IFLA_VF_STATS_PAD) ||
1439 nla_put_u64_64bit(skb, IFLA_VF_STATS_MULTICAST,
1440 vf_stats.multicast, IFLA_VF_STATS_PAD) ||
1441 nla_put_u64_64bit(skb, IFLA_VF_STATS_RX_DROPPED,
1442 vf_stats.rx_dropped, IFLA_VF_STATS_PAD) ||
1443 nla_put_u64_64bit(skb, IFLA_VF_STATS_TX_DROPPED,
1444 vf_stats.tx_dropped, IFLA_VF_STATS_PAD)) {
1445 nla_nest_cancel(skb, vfstats);
1446 goto nla_put_vf_failure;
1447 }
1448 nla_nest_end(skb, vfstats);
1449 }
1450 nla_nest_end(skb, vf);
1451 return 0;
1452
1453 nla_put_vf_failure:
1454 nla_nest_cancel(skb, vf);
1455 return -EMSGSIZE;
1456 }
1457
rtnl_fill_vf(struct sk_buff * skb,struct net_device * dev,u32 ext_filter_mask)1458 static noinline_for_stack int rtnl_fill_vf(struct sk_buff *skb,
1459 struct net_device *dev,
1460 u32 ext_filter_mask)
1461 {
1462 struct nlattr *vfinfo;
1463 int i, num_vfs;
1464
1465 if (!dev->dev.parent || ((ext_filter_mask & RTEXT_FILTER_VF) == 0))
1466 return 0;
1467
1468 num_vfs = dev_num_vf(dev->dev.parent);
1469 if (nla_put_u32(skb, IFLA_NUM_VF, num_vfs))
1470 return -EMSGSIZE;
1471
1472 if (!dev->netdev_ops->ndo_get_vf_config)
1473 return 0;
1474
1475 vfinfo = nla_nest_start_noflag(skb, IFLA_VFINFO_LIST);
1476 if (!vfinfo)
1477 return -EMSGSIZE;
1478
1479 for (i = 0; i < num_vfs; i++) {
1480 if (rtnl_fill_vfinfo(skb, dev, i, ext_filter_mask)) {
1481 nla_nest_cancel(skb, vfinfo);
1482 return -EMSGSIZE;
1483 }
1484 }
1485
1486 nla_nest_end(skb, vfinfo);
1487 return 0;
1488 }
1489
rtnl_fill_link_ifmap(struct sk_buff * skb,const struct net_device * dev)1490 static int rtnl_fill_link_ifmap(struct sk_buff *skb,
1491 const struct net_device *dev)
1492 {
1493 struct rtnl_link_ifmap map;
1494
1495 memset(&map, 0, sizeof(map));
1496 map.mem_start = READ_ONCE(dev->mem_start);
1497 map.mem_end = READ_ONCE(dev->mem_end);
1498 map.base_addr = READ_ONCE(dev->base_addr);
1499 map.irq = READ_ONCE(dev->irq);
1500 map.dma = READ_ONCE(dev->dma);
1501 map.port = READ_ONCE(dev->if_port);
1502
1503 if (nla_put_64bit(skb, IFLA_MAP, sizeof(map), &map, IFLA_PAD))
1504 return -EMSGSIZE;
1505
1506 return 0;
1507 }
1508
rtnl_xdp_prog_skb(struct net_device * dev)1509 static u32 rtnl_xdp_prog_skb(struct net_device *dev)
1510 {
1511 const struct bpf_prog *generic_xdp_prog;
1512 u32 res = 0;
1513
1514 rcu_read_lock();
1515 generic_xdp_prog = rcu_dereference(dev->xdp_prog);
1516 if (generic_xdp_prog)
1517 res = generic_xdp_prog->aux->id;
1518 rcu_read_unlock();
1519
1520 return res;
1521 }
1522
rtnl_xdp_prog_drv(struct net_device * dev)1523 static u32 rtnl_xdp_prog_drv(struct net_device *dev)
1524 {
1525 return dev_xdp_prog_id(dev, XDP_MODE_DRV);
1526 }
1527
rtnl_xdp_prog_hw(struct net_device * dev)1528 static u32 rtnl_xdp_prog_hw(struct net_device *dev)
1529 {
1530 return dev_xdp_prog_id(dev, XDP_MODE_HW);
1531 }
1532
/*
 * Report the XDP program of one attachment mode.
 *
 * @get_prog_id is asked for the program id of @dev. If it is 0, nothing is
 * emitted and *@prog_id / *@mode are left alone. Otherwise the id is
 * stored in *@prog_id and put as a u32 attribute of type @attr, and *@mode
 * becomes @tgt_mode if no mode had been recorded yet, or
 * XDP_ATTACHED_MULTI if one had.
 *
 * Returns 0 on success or the nla_put_u32() error; in the error case
 * *@prog_id has already been updated but *@mode has not.
 */
static int rtnl_xdp_report_one(struct sk_buff *skb, struct net_device *dev,
			       u32 *prog_id, u8 *mode, u8 tgt_mode, u32 attr,
			       u32 (*get_prog_id)(struct net_device *dev))
{
	u32 id = get_prog_id(dev);
	int rc;

	if (!id)
		return 0;

	*prog_id = id;
	rc = nla_put_u32(skb, attr, id);
	if (rc)
		return rc;

	*mode = (*mode == XDP_ATTACHED_NONE) ? tgt_mode : XDP_ATTACHED_MULTI;

	return 0;
}
1556
rtnl_xdp_fill(struct sk_buff * skb,struct net_device * dev)1557 static int rtnl_xdp_fill(struct sk_buff *skb, struct net_device *dev)
1558 {
1559 struct nlattr *xdp;
1560 u32 prog_id;
1561 int err;
1562 u8 mode;
1563
1564 xdp = nla_nest_start_noflag(skb, IFLA_XDP);
1565 if (!xdp)
1566 return -EMSGSIZE;
1567
1568 prog_id = 0;
1569 mode = XDP_ATTACHED_NONE;
1570 err = rtnl_xdp_report_one(skb, dev, &prog_id, &mode, XDP_ATTACHED_SKB,
1571 IFLA_XDP_SKB_PROG_ID, rtnl_xdp_prog_skb);
1572 if (err)
1573 goto err_cancel;
1574 err = rtnl_xdp_report_one(skb, dev, &prog_id, &mode, XDP_ATTACHED_DRV,
1575 IFLA_XDP_DRV_PROG_ID, rtnl_xdp_prog_drv);
1576 if (err)
1577 goto err_cancel;
1578 err = rtnl_xdp_report_one(skb, dev, &prog_id, &mode, XDP_ATTACHED_HW,
1579 IFLA_XDP_HW_PROG_ID, rtnl_xdp_prog_hw);
1580 if (err)
1581 goto err_cancel;
1582
1583 err = nla_put_u8(skb, IFLA_XDP_ATTACHED, mode);
1584 if (err)
1585 goto err_cancel;
1586
1587 if (prog_id && mode != XDP_ATTACHED_MULTI) {
1588 err = nla_put_u32(skb, IFLA_XDP_PROG_ID, prog_id);
1589 if (err)
1590 goto err_cancel;
1591 }
1592
1593 nla_nest_end(skb, xdp);
1594 return 0;
1595
1596 err_cancel:
1597 nla_nest_cancel(skb, xdp);
1598 return err;
1599 }
1600
rtnl_get_event(unsigned long event)1601 static u32 rtnl_get_event(unsigned long event)
1602 {
1603 u32 rtnl_event_type = IFLA_EVENT_NONE;
1604
1605 switch (event) {
1606 case NETDEV_REBOOT:
1607 rtnl_event_type = IFLA_EVENT_REBOOT;
1608 break;
1609 case NETDEV_FEAT_CHANGE:
1610 rtnl_event_type = IFLA_EVENT_FEATURES;
1611 break;
1612 case NETDEV_BONDING_FAILOVER:
1613 rtnl_event_type = IFLA_EVENT_BONDING_FAILOVER;
1614 break;
1615 case NETDEV_NOTIFY_PEERS:
1616 rtnl_event_type = IFLA_EVENT_NOTIFY_PEERS;
1617 break;
1618 case NETDEV_RESEND_IGMP:
1619 rtnl_event_type = IFLA_EVENT_IGMP_RESEND;
1620 break;
1621 case NETDEV_CHANGEINFODATA:
1622 rtnl_event_type = IFLA_EVENT_BONDING_OPTIONS;
1623 break;
1624 default:
1625 break;
1626 }
1627
1628 return rtnl_event_type;
1629 }
1630
put_master_ifindex(struct sk_buff * skb,struct net_device * dev)1631 static int put_master_ifindex(struct sk_buff *skb, struct net_device *dev)
1632 {
1633 const struct net_device *upper_dev;
1634 int ret = 0;
1635
1636 rcu_read_lock();
1637
1638 upper_dev = netdev_master_upper_dev_get_rcu(dev);
1639 if (upper_dev)
1640 ret = nla_put_u32(skb, IFLA_MASTER,
1641 READ_ONCE(upper_dev->ifindex));
1642
1643 rcu_read_unlock();
1644 return ret;
1645 }
1646
/*
 * Emit IFLA_LINK with the value of dev_get_iflink(@dev).
 *
 * The attribute is skipped when it equals the device's own ifindex,
 * unless @force is true. Returns 0 when skipped, otherwise the result of
 * nla_put_u32().
 */
static int nla_put_iflink(struct sk_buff *skb, const struct net_device *dev,
			  bool force)
{
	int link_ifindex = dev_get_iflink(dev);

	if (!force && READ_ONCE(dev->ifindex) == link_ifindex)
		return 0;

	return nla_put_u32(skb, IFLA_LINK, link_ifindex);
}
1657
nla_put_ifalias(struct sk_buff * skb,struct net_device * dev)1658 static noinline_for_stack int nla_put_ifalias(struct sk_buff *skb,
1659 struct net_device *dev)
1660 {
1661 char buf[IFALIASZ];
1662 int ret;
1663
1664 ret = dev_get_alias(dev, buf, sizeof(buf));
1665 return ret > 0 ? nla_put_string(skb, IFLA_IFALIAS, buf) : 0;
1666 }
1667
/*
 * Emit IFLA_LINK_NETNSID (when applicable) followed by IFLA_LINK.
 *
 * If the link ops provide get_link_net() and the namespace it returns
 * differs from dev_net(@dev), the id obtained from peernet2id_alloc() for
 * that namespace relative to @src_net is emitted and IFLA_LINK is forced.
 * Otherwise IFLA_LINK is left to nla_put_iflink()'s own decision.
 *
 * Returns -EMSGSIZE if the netnsid cannot be put, otherwise the result of
 * nla_put_iflink().
 */
static int rtnl_fill_link_netnsid(struct sk_buff *skb,
				  const struct net_device *dev,
				  struct net *src_net, gfp_t gfp)
{
	struct net *link_net;
	int nsid;

	if (!dev->rtnl_link_ops || !dev->rtnl_link_ops->get_link_net)
		return nla_put_iflink(skb, dev, false);

	link_net = dev->rtnl_link_ops->get_link_net(dev);
	if (net_eq(dev_net(dev), link_net))
		return nla_put_iflink(skb, dev, false);

	nsid = peernet2id_alloc(src_net, link_net, gfp);
	if (nla_put_s32(skb, IFLA_LINK_NETNSID, nsid))
		return -EMSGSIZE;

	return nla_put_iflink(skb, dev, true);
}
1689
/*
 * Emit the IFLA_AF_SPEC nest: one sub-nest per entry on rtnl_af_ops that
 * provides a fill_link_af() callback, typed with that entry's family.
 *
 * The list is walked with list_for_each_entry_rcu(); this function takes
 * no lock itself.
 *
 * Returns 0 on success or -EMSGSIZE on failure. On failure the open nests
 * are not cancelled here.
 */
static int rtnl_fill_link_af(struct sk_buff *skb,
			     const struct net_device *dev,
			     u32 ext_filter_mask)
{
	const struct rtnl_af_ops *af_ops;
	struct nlattr *af_spec;

	af_spec = nla_nest_start_noflag(skb, IFLA_AF_SPEC);
	if (!af_spec)
		return -EMSGSIZE;

	list_for_each_entry_rcu(af_ops, &rtnl_af_ops, list) {
		struct nlattr *af;
		int err;

		if (!af_ops->fill_link_af)
			continue;

		af = nla_nest_start_noflag(skb, af_ops->family);
		if (!af)
			return -EMSGSIZE;

		err = af_ops->fill_link_af(skb, dev, ext_filter_mask);
		/*
		 * The callback may return -ENODATA to indicate that there
		 * was no data to be dumped. This is not an error, it
		 * means we should trim the attribute header and
		 * continue. The nest must not be ended after it has been
		 * cancelled, so move straight on to the next family.
		 */
		if (err == -ENODATA) {
			nla_nest_cancel(skb, af);
			continue;
		}
		/* Any other negative result is reported as -EMSGSIZE. */
		if (err < 0)
			return -EMSGSIZE;

		nla_nest_end(skb, af);
	}

	nla_nest_end(skb, af_spec);
	return 0;
}
1730
rtnl_fill_alt_ifnames(struct sk_buff * skb,const struct net_device * dev)1731 static int rtnl_fill_alt_ifnames(struct sk_buff *skb,
1732 const struct net_device *dev)
1733 {
1734 struct netdev_name_node *name_node;
1735 int count = 0;
1736
1737 list_for_each_entry_rcu(name_node, &dev->name_node->list, list) {
1738 if (nla_put_string(skb, IFLA_ALT_IFNAME, name_node->name))
1739 return -EMSGSIZE;
1740 count++;
1741 }
1742 return count;
1743 }
1744
1745 /* RCU protected. */
rtnl_fill_prop_list(struct sk_buff * skb,const struct net_device * dev)1746 static int rtnl_fill_prop_list(struct sk_buff *skb,
1747 const struct net_device *dev)
1748 {
1749 struct nlattr *prop_list;
1750 int ret;
1751
1752 prop_list = nla_nest_start(skb, IFLA_PROP_LIST);
1753 if (!prop_list)
1754 return -EMSGSIZE;
1755
1756 ret = rtnl_fill_alt_ifnames(skb, dev);
1757 if (ret <= 0)
1758 goto nest_cancel;
1759
1760 nla_nest_end(skb, prop_list);
1761 return 0;
1762
1763 nest_cancel:
1764 nla_nest_cancel(skb, prop_list);
1765 return ret;
1766 }
1767
rtnl_fill_proto_down(struct sk_buff * skb,const struct net_device * dev)1768 static int rtnl_fill_proto_down(struct sk_buff *skb,
1769 const struct net_device *dev)
1770 {
1771 struct nlattr *pr;
1772 u32 preason;
1773
1774 if (nla_put_u8(skb, IFLA_PROTO_DOWN, READ_ONCE(dev->proto_down)))
1775 goto nla_put_failure;
1776
1777 preason = READ_ONCE(dev->proto_down_reason);
1778 if (!preason)
1779 return 0;
1780
1781 pr = nla_nest_start(skb, IFLA_PROTO_DOWN_REASON);
1782 if (!pr)
1783 return -EMSGSIZE;
1784
1785 if (nla_put_u32(skb, IFLA_PROTO_DOWN_REASON_VALUE, preason)) {
1786 nla_nest_cancel(skb, pr);
1787 goto nla_put_failure;
1788 }
1789
1790 nla_nest_end(skb, pr);
1791 return 0;
1792
1793 nla_put_failure:
1794 return -EMSGSIZE;
1795 }
1796
rtnl_fill_devlink_port(struct sk_buff * skb,const struct net_device * dev)1797 static int rtnl_fill_devlink_port(struct sk_buff *skb,
1798 const struct net_device *dev)
1799 {
1800 struct nlattr *devlink_port_nest;
1801 int ret;
1802
1803 devlink_port_nest = nla_nest_start(skb, IFLA_DEVLINK_PORT);
1804 if (!devlink_port_nest)
1805 return -EMSGSIZE;
1806
1807 if (dev->devlink_port) {
1808 ret = devlink_nl_port_handle_fill(skb, dev->devlink_port);
1809 if (ret < 0)
1810 goto nest_cancel;
1811 }
1812
1813 nla_nest_end(skb, devlink_port_nest);
1814 return 0;
1815
1816 nest_cancel:
1817 nla_nest_cancel(skb, devlink_port_nest);
1818 return ret;
1819 }
1820
rtnl_fill_dpll_pin(struct sk_buff * skb,const struct net_device * dev)1821 static int rtnl_fill_dpll_pin(struct sk_buff *skb,
1822 const struct net_device *dev)
1823 {
1824 struct nlattr *dpll_pin_nest;
1825 int ret;
1826
1827 dpll_pin_nest = nla_nest_start(skb, IFLA_DPLL_PIN);
1828 if (!dpll_pin_nest)
1829 return -EMSGSIZE;
1830
1831 ret = dpll_netdev_add_pin_handle(skb, dev);
1832 if (ret < 0)
1833 goto nest_cancel;
1834
1835 nla_nest_end(skb, dpll_pin_nest);
1836 return 0;
1837
1838 nest_cancel:
1839 nla_nest_cancel(skb, dpll_pin_nest);
1840 return ret;
1841 }
1842
/*
 * Build one complete link message for @dev in @skb.
 *
 * @skb:             buffer the message is appended to
 * @dev:             device being described
 * @src_net:         namespace passed to rtnl_fill_link_netnsid()
 * @type:            netlink message type for the header
 * @pid, @seq:       netlink header port id and sequence number
 * @change:          value stored in ifi_change
 * @flags:           netlink header flags
 * @ext_filter_mask: RTEXT_FILTER_* bits forwarded to the VF, port and
 *                   AF_SPEC helpers
 * @event:           IFLA_EVENT_* value; IFLA_EVENT is omitted for
 *                   IFLA_EVENT_NONE
 * @new_nsid:        if non-NULL, *new_nsid is emitted as IFLA_NEW_NETNSID
 * @new_ifindex:     if non-zero, emitted as IFLA_NEW_IFINDEX
 * @tgt_netnsid:     if >= 0, emitted as IFLA_TARGET_NETNSID
 * @gfp:             allocation flags (NOTE(review): not referenced in this
 *                   body; rtnl_fill_link_netnsid() is called with
 *                   GFP_ATOMIC)
 *
 * Returns 0 on success. On any failure the partially built message is
 * removed with nlmsg_cancel() and -EMSGSIZE is returned, regardless of the
 * error code the failing helper produced.
 */
static int rtnl_fill_ifinfo(struct sk_buff *skb,
			    struct net_device *dev, struct net *src_net,
			    int type, u32 pid, u32 seq, u32 change,
			    unsigned int flags, u32 ext_filter_mask,
			    u32 event, int *new_nsid, int new_ifindex,
			    int tgt_netnsid, gfp_t gfp)
{
	char devname[IFNAMSIZ];
	struct ifinfomsg *ifm;
	struct nlmsghdr *nlh;
	struct Qdisc *qdisc;

	ASSERT_RTNL();
	nlh = nlmsg_put(skb, pid, seq, type, sizeof(*ifm), flags);
	if (nlh == NULL)
		return -EMSGSIZE;

	/* Fixed header. */
	ifm = nlmsg_data(nlh);
	ifm->ifi_family = AF_UNSPEC;
	ifm->__ifi_pad = 0;
	ifm->ifi_type = READ_ONCE(dev->type);
	ifm->ifi_index = READ_ONCE(dev->ifindex);
	ifm->ifi_flags = dev_get_flags(dev);
	ifm->ifi_change = change;

	if (tgt_netnsid >= 0 && nla_put_s32(skb, IFLA_TARGET_NETNSID, tgt_netnsid))
		goto nla_put_failure;

	/* The name is copied to a local buffer before being put. */
	netdev_copy_name(dev, devname);
	if (nla_put_string(skb, IFLA_IFNAME, devname))
		goto nla_put_failure;

	/* Scalar device properties. */
	if (nla_put_u32(skb, IFLA_TXQLEN, READ_ONCE(dev->tx_queue_len)) ||
	    /* A device that is not running is always reported as down. */
	    nla_put_u8(skb, IFLA_OPERSTATE,
		       netif_running(dev) ? READ_ONCE(dev->operstate) :
					    IF_OPER_DOWN) ||
	    nla_put_u8(skb, IFLA_LINKMODE, READ_ONCE(dev->link_mode)) ||
	    nla_put_u32(skb, IFLA_MTU, READ_ONCE(dev->mtu)) ||
	    nla_put_u32(skb, IFLA_MIN_MTU, READ_ONCE(dev->min_mtu)) ||
	    nla_put_u32(skb, IFLA_MAX_MTU, READ_ONCE(dev->max_mtu)) ||
	    nla_put_u32(skb, IFLA_GROUP, READ_ONCE(dev->group)) ||
	    nla_put_u32(skb, IFLA_PROMISCUITY, READ_ONCE(dev->promiscuity)) ||
	    nla_put_u32(skb, IFLA_ALLMULTI, READ_ONCE(dev->allmulti)) ||
	    nla_put_u32(skb, IFLA_NUM_TX_QUEUES,
			READ_ONCE(dev->num_tx_queues)) ||
	    nla_put_u32(skb, IFLA_GSO_MAX_SEGS,
			READ_ONCE(dev->gso_max_segs)) ||
	    nla_put_u32(skb, IFLA_GSO_MAX_SIZE,
			READ_ONCE(dev->gso_max_size)) ||
	    nla_put_u32(skb, IFLA_GRO_MAX_SIZE,
			READ_ONCE(dev->gro_max_size)) ||
	    nla_put_u32(skb, IFLA_GSO_IPV4_MAX_SIZE,
			READ_ONCE(dev->gso_ipv4_max_size)) ||
	    nla_put_u32(skb, IFLA_GRO_IPV4_MAX_SIZE,
			READ_ONCE(dev->gro_ipv4_max_size)) ||
	    nla_put_u32(skb, IFLA_TSO_MAX_SIZE,
			READ_ONCE(dev->tso_max_size)) ||
	    nla_put_u32(skb, IFLA_TSO_MAX_SEGS,
			READ_ONCE(dev->tso_max_segs)) ||
#ifdef CONFIG_RPS
	    nla_put_u32(skb, IFLA_NUM_RX_QUEUES,
			READ_ONCE(dev->num_rx_queues)) ||
#endif
	    put_master_ifindex(skb, dev) ||
	    nla_put_u8(skb, IFLA_CARRIER, netif_carrier_ok(dev)) ||
	    nla_put_ifalias(skb, dev) ||
	    /* IFLA_CARRIER_CHANGES is the sum of the up and down counters. */
	    nla_put_u32(skb, IFLA_CARRIER_CHANGES,
			atomic_read(&dev->carrier_up_count) +
			atomic_read(&dev->carrier_down_count)) ||
	    nla_put_u32(skb, IFLA_CARRIER_UP_COUNT,
			atomic_read(&dev->carrier_up_count)) ||
	    nla_put_u32(skb, IFLA_CARRIER_DOWN_COUNT,
			atomic_read(&dev->carrier_down_count)))
		goto nla_put_failure;

	if (rtnl_fill_proto_down(skb, dev))
		goto nla_put_failure;

	if (event != IFLA_EVENT_NONE) {
		if (nla_put_u32(skb, IFLA_EVENT, event))
			goto nla_put_failure;
	}

	/* Hardware and broadcast addresses only exist for addr_len != 0. */
	if (dev->addr_len) {
		if (nla_put(skb, IFLA_ADDRESS, dev->addr_len, dev->dev_addr) ||
		    nla_put(skb, IFLA_BROADCAST, dev->addr_len, dev->broadcast))
			goto nla_put_failure;
	}

	if (rtnl_phys_port_id_fill(skb, dev))
		goto nla_put_failure;

	if (rtnl_phys_port_name_fill(skb, dev))
		goto nla_put_failure;

	if (rtnl_phys_switch_id_fill(skb, dev))
		goto nla_put_failure;

	if (rtnl_fill_stats(skb, dev))
		goto nla_put_failure;

	if (rtnl_fill_vf(skb, dev, ext_filter_mask))
		goto nla_put_failure;

	if (rtnl_port_fill(skb, dev, ext_filter_mask))
		goto nla_put_failure;

	if (rtnl_xdp_fill(skb, dev))
		goto nla_put_failure;

	if (dev->rtnl_link_ops || rtnl_have_link_slave_info(dev)) {
		if (rtnl_link_fill(skb, dev) < 0)
			goto nla_put_failure;
	}

	if (new_nsid &&
	    nla_put_s32(skb, IFLA_NEW_NETNSID, *new_nsid) < 0)
		goto nla_put_failure;
	if (new_ifindex &&
	    nla_put_s32(skb, IFLA_NEW_IFINDEX, new_ifindex) < 0)
		goto nla_put_failure;

	/* The permanent address is reported only if it is not all zeroes. */
	if (memchr_inv(dev->perm_addr, '\0', dev->addr_len) &&
	    nla_put(skb, IFLA_PERM_ADDRESS, dev->addr_len, dev->perm_addr))
		goto nla_put_failure;

	/*
	 * The helpers below run inside one RCU read-side section; failures
	 * here must leave through nla_put_failure_rcu to drop it.
	 */
	rcu_read_lock();
	if (rtnl_fill_link_netnsid(skb, dev, src_net, GFP_ATOMIC))
		goto nla_put_failure_rcu;
	qdisc = rcu_dereference(dev->qdisc);
	if (qdisc && nla_put_string(skb, IFLA_QDISC, qdisc->ops->id))
		goto nla_put_failure_rcu;
	if (rtnl_fill_link_af(skb, dev, ext_filter_mask))
		goto nla_put_failure_rcu;
	if (rtnl_fill_link_ifmap(skb, dev))
		goto nla_put_failure_rcu;
	if (rtnl_fill_prop_list(skb, dev))
		goto nla_put_failure_rcu;
	rcu_read_unlock();

	/* Parent device name and bus name, when a parent (and bus) exists. */
	if (dev->dev.parent &&
	    nla_put_string(skb, IFLA_PARENT_DEV_NAME,
			   dev_name(dev->dev.parent)))
		goto nla_put_failure;

	if (dev->dev.parent && dev->dev.parent->bus &&
	    nla_put_string(skb, IFLA_PARENT_DEV_BUS_NAME,
			   dev->dev.parent->bus->name))
		goto nla_put_failure;

	if (rtnl_fill_devlink_port(skb, dev))
		goto nla_put_failure;

	if (rtnl_fill_dpll_pin(skb, dev))
		goto nla_put_failure;

	nlmsg_end(skb, nlh);
	return 0;

nla_put_failure_rcu:
	rcu_read_unlock();
nla_put_failure:
	/* Drop everything added since nlmsg_put(), header included. */
	nlmsg_cancel(skb, nlh);
	return -EMSGSIZE;
}
2008
/*
 * Netlink attribute policy for the top-level IFLA_* attributes, indexed by
 * attribute type. Entries marked NLA_REJECT are not accepted as input;
 * attribute types without an entry here are left zero-initialised.
 */
static const struct nla_policy ifla_policy[IFLA_MAX+1] = {
	[IFLA_IFNAME]		= { .type = NLA_STRING, .len = IFNAMSIZ-1 },
	[IFLA_ADDRESS]		= { .type = NLA_BINARY, .len = MAX_ADDR_LEN },
	[IFLA_BROADCAST]	= { .type = NLA_BINARY, .len = MAX_ADDR_LEN },
	[IFLA_MAP]		= { .len = sizeof(struct rtnl_link_ifmap) },
	[IFLA_MTU]		= { .type = NLA_U32 },
	[IFLA_LINK]		= { .type = NLA_U32 },
	[IFLA_MASTER]		= { .type = NLA_U32 },
	[IFLA_CARRIER]		= { .type = NLA_U8 },
	[IFLA_TXQLEN]		= { .type = NLA_U32 },
	[IFLA_WEIGHT]		= { .type = NLA_U32 },
	[IFLA_OPERSTATE]	= { .type = NLA_U8 },
	[IFLA_LINKMODE]		= { .type = NLA_U8 },
	[IFLA_LINKINFO]		= { .type = NLA_NESTED },
	[IFLA_NET_NS_PID]	= { .type = NLA_U32 },
	[IFLA_NET_NS_FD]	= { .type = NLA_U32 },
	/* IFLA_IFALIAS is a string, but policy is set to NLA_BINARY to
	 * allow 0-length string (needed to remove an alias).
	 */
	[IFLA_IFALIAS]	        = { .type = NLA_BINARY, .len = IFALIASZ - 1 },
	[IFLA_VFINFO_LIST]	= {. type = NLA_NESTED },
	[IFLA_VF_PORTS]		= { .type = NLA_NESTED },
	[IFLA_PORT_SELF]	= { .type = NLA_NESTED },
	[IFLA_AF_SPEC]		= { .type = NLA_NESTED },
	[IFLA_EXT_MASK]		= { .type = NLA_U32 },
	[IFLA_PROMISCUITY]	= { .type = NLA_U32 },
	[IFLA_NUM_TX_QUEUES]	= { .type = NLA_U32 },
	[IFLA_NUM_RX_QUEUES]	= { .type = NLA_U32 },
	[IFLA_GSO_MAX_SEGS]	= { .type = NLA_U32 },
	/* Values no larger than MAX_TCP_HEADER are refused. */
	[IFLA_GSO_MAX_SIZE]	= NLA_POLICY_MIN(NLA_U32, MAX_TCP_HEADER + 1),
	[IFLA_PHYS_PORT_ID]	= { .type = NLA_BINARY, .len = MAX_PHYS_ITEM_ID_LEN },
	[IFLA_CARRIER_CHANGES]	= { .type = NLA_U32 },  /* ignored */
	[IFLA_PHYS_SWITCH_ID]	= { .type = NLA_BINARY, .len = MAX_PHYS_ITEM_ID_LEN },
	[IFLA_LINK_NETNSID]	= { .type = NLA_S32 },
	[IFLA_PROTO_DOWN]	= { .type = NLA_U8 },
	[IFLA_XDP]		= { .type = NLA_NESTED },
	[IFLA_EVENT]		= { .type = NLA_U32 },
	[IFLA_GROUP]		= { .type = NLA_U32 },
	[IFLA_TARGET_NETNSID]	= { .type = NLA_S32 },
	[IFLA_CARRIER_UP_COUNT]	= { .type = NLA_U32 },
	[IFLA_CARRIER_DOWN_COUNT] = { .type = NLA_U32 },
	[IFLA_MIN_MTU]		= { .type = NLA_U32 },
	[IFLA_MAX_MTU]		= { .type = NLA_U32 },
	[IFLA_PROP_LIST]	= { .type = NLA_NESTED },
	[IFLA_ALT_IFNAME]	= { .type = NLA_STRING,
				    .len = ALTIFNAMSIZ - 1 },
	[IFLA_PERM_ADDRESS]	= { .type = NLA_REJECT },
	[IFLA_PROTO_DOWN_REASON] = { .type = NLA_NESTED },
	/* Interface indexes below 1 are refused. */
	[IFLA_NEW_IFINDEX]	= NLA_POLICY_MIN(NLA_S32, 1),
	[IFLA_PARENT_DEV_NAME]	= { .type = NLA_NUL_STRING },
	[IFLA_GRO_MAX_SIZE]	= { .type = NLA_U32 },
	[IFLA_TSO_MAX_SIZE]	= { .type = NLA_REJECT },
	[IFLA_TSO_MAX_SEGS]	= { .type = NLA_REJECT },
	[IFLA_ALLMULTI]		= { .type = NLA_REJECT },
	/* Values no larger than MAX_TCP_HEADER are refused. */
	[IFLA_GSO_IPV4_MAX_SIZE]	= NLA_POLICY_MIN(NLA_U32, MAX_TCP_HEADER + 1),
	[IFLA_GRO_IPV4_MAX_SIZE]	= { .type = NLA_U32 },
};
2066
/*
 * Policy for the attributes nested inside IFLA_LINKINFO. Used by
 * linkinfo_to_kind_ops() to extract the link kind name.
 */
static const struct nla_policy ifla_info_policy[IFLA_INFO_MAX+1] = {
	[IFLA_INFO_KIND]	= { .type = NLA_STRING },
	[IFLA_INFO_DATA]	= { .type = NLA_NESTED },
	[IFLA_INFO_SLAVE_KIND]	= { .type = NLA_STRING },
	[IFLA_INFO_SLAVE_DATA]	= { .type = NLA_NESTED },
};
2073
/*
 * Policy for the attributes nested inside one IFLA_VF_INFO entry of
 * IFLA_VFINFO_LIST. Most entries only set .len to the size of the
 * fixed struct that do_setvfinfo() later reads from the payload.
 */
static const struct nla_policy ifla_vf_policy[IFLA_VF_MAX+1] = {
	[IFLA_VF_MAC]		= { .len = sizeof(struct ifla_vf_mac) },
	[IFLA_VF_BROADCAST]	= { .type = NLA_REJECT },
	[IFLA_VF_VLAN]		= { .len = sizeof(struct ifla_vf_vlan) },
	[IFLA_VF_VLAN_LIST]     = { .type = NLA_NESTED },
	[IFLA_VF_TX_RATE]	= { .len = sizeof(struct ifla_vf_tx_rate) },
	[IFLA_VF_SPOOFCHK]	= { .len = sizeof(struct ifla_vf_spoofchk) },
	[IFLA_VF_RATE]		= { .len = sizeof(struct ifla_vf_rate) },
	[IFLA_VF_LINK_STATE]	= { .len = sizeof(struct ifla_vf_link_state) },
	[IFLA_VF_RSS_QUERY_EN]	= { .len = sizeof(struct ifla_vf_rss_query_en) },
	[IFLA_VF_STATS]		= { .type = NLA_NESTED },
	[IFLA_VF_TRUST]		= { .len = sizeof(struct ifla_vf_trust) },
	[IFLA_VF_IB_NODE_GUID]	= { .len = sizeof(struct ifla_vf_guid) },
	[IFLA_VF_IB_PORT_GUID]	= { .len = sizeof(struct ifla_vf_guid) },
};
2089
/*
 * Policy for the IFLA_PORT_* attributes. do_setlink() applies it both to
 * each IFLA_VF_PORT entry of IFLA_VF_PORTS and to IFLA_PORT_SELF.
 */
static const struct nla_policy ifla_port_policy[IFLA_PORT_MAX+1] = {
	[IFLA_PORT_VF]		= { .type = NLA_U32 },
	[IFLA_PORT_PROFILE]	= { .type = NLA_STRING,
				    .len = PORT_PROFILE_MAX },
	[IFLA_PORT_INSTANCE_UUID] = { .type = NLA_BINARY,
				      .len = PORT_UUID_MAX },
	[IFLA_PORT_HOST_UUID]	= { .type = NLA_STRING,
				    .len = PORT_UUID_MAX },
	[IFLA_PORT_REQUEST]	= { .type = NLA_U8, },
	[IFLA_PORT_RESPONSE]	= { .type = NLA_U16, },

	/* Unused, but we need to keep it here since user space could
	 * fill it. It's also broken with regard to NLA_BINARY use in
	 * combination with structs.
	 */
	[IFLA_PORT_VSI_TYPE]	= { .type = NLA_BINARY,
				    .len = sizeof(struct ifla_port_vsi) },
};
2108
/*
 * Policy for the attributes nested inside IFLA_XDP, applied by
 * do_setlink(). The IFLA_XDP_UNSPEC slot carries strict_start_type, so
 * strict validation starts at IFLA_XDP_EXPECTED_FD.
 */
static const struct nla_policy ifla_xdp_policy[IFLA_XDP_MAX + 1] = {
	[IFLA_XDP_UNSPEC]	= { .strict_start_type = IFLA_XDP_EXPECTED_FD },
	[IFLA_XDP_FD]		= { .type = NLA_S32 },
	[IFLA_XDP_EXPECTED_FD]	= { .type = NLA_S32 },
	[IFLA_XDP_ATTACHED]	= { .type = NLA_U8 },
	[IFLA_XDP_FLAGS]	= { .type = NLA_U32 },
	[IFLA_XDP_PROG_ID]	= { .type = NLA_U32 },
};
2117
linkinfo_to_kind_ops(const struct nlattr * nla)2118 static const struct rtnl_link_ops *linkinfo_to_kind_ops(const struct nlattr *nla)
2119 {
2120 const struct rtnl_link_ops *ops = NULL;
2121 struct nlattr *linfo[IFLA_INFO_MAX + 1];
2122
2123 if (nla_parse_nested_deprecated(linfo, IFLA_INFO_MAX, nla, ifla_info_policy, NULL) < 0)
2124 return NULL;
2125
2126 if (linfo[IFLA_INFO_KIND]) {
2127 char kind[MODULE_NAME_LEN];
2128
2129 nla_strscpy(kind, linfo[IFLA_INFO_KIND], sizeof(kind));
2130 ops = rtnl_link_ops_get(kind);
2131 }
2132
2133 return ops;
2134 }
2135
link_master_filtered(struct net_device * dev,int master_idx)2136 static bool link_master_filtered(struct net_device *dev, int master_idx)
2137 {
2138 struct net_device *master;
2139
2140 if (!master_idx)
2141 return false;
2142
2143 master = netdev_master_upper_dev_get(dev);
2144
2145 /* 0 is already used to denote IFLA_MASTER wasn't passed, therefore need
2146 * another invalid value for ifindex to denote "no master".
2147 */
2148 if (master_idx == -1)
2149 return !!master;
2150
2151 if (!master || master->ifindex != master_idx)
2152 return true;
2153
2154 return false;
2155 }
2156
link_kind_filtered(const struct net_device * dev,const struct rtnl_link_ops * kind_ops)2157 static bool link_kind_filtered(const struct net_device *dev,
2158 const struct rtnl_link_ops *kind_ops)
2159 {
2160 if (kind_ops && dev->rtnl_link_ops != kind_ops)
2161 return true;
2162
2163 return false;
2164 }
2165
link_dump_filtered(struct net_device * dev,int master_idx,const struct rtnl_link_ops * kind_ops)2166 static bool link_dump_filtered(struct net_device *dev,
2167 int master_idx,
2168 const struct rtnl_link_ops *kind_ops)
2169 {
2170 if (link_master_filtered(dev, master_idx) ||
2171 link_kind_filtered(dev, kind_ops))
2172 return true;
2173
2174 return false;
2175 }
2176
2177 /**
2178 * rtnl_get_net_ns_capable - Get netns if sufficiently privileged.
2179 * @sk: netlink socket
2180 * @netnsid: network namespace identifier
2181 *
2182 * Returns the network namespace identified by netnsid on success or an error
2183 * pointer on failure.
2184 */
rtnl_get_net_ns_capable(struct sock * sk,int netnsid)2185 struct net *rtnl_get_net_ns_capable(struct sock *sk, int netnsid)
2186 {
2187 struct net *net;
2188
2189 net = get_net_ns_by_id(sock_net(sk), netnsid);
2190 if (!net)
2191 return ERR_PTR(-EINVAL);
2192
2193 /* For now, the caller is required to have CAP_NET_ADMIN in
2194 * the user namespace owning the target net ns.
2195 */
2196 if (!sk_ns_capable(sk, net->user_ns, CAP_NET_ADMIN)) {
2197 put_net(net);
2198 return ERR_PTR(-EACCES);
2199 }
2200 return net;
2201 }
2202 EXPORT_SYMBOL_GPL(rtnl_get_net_ns_capable);
2203
/*
 * Validate an RTM_GETLINK dump request and parse its attributes into @tb.
 *
 * Without @strict_check the message is parsed leniently, with the header
 * length guessed from the message size. With @strict_check the header
 * must be a full ifinfomsg whose fields are all zero, and attributes are
 * parsed with the strict helper.
 *
 * Returns the parser's result, or -EINVAL (with @extack set) for a bad
 * header in strict mode.
 */
static int rtnl_valid_dump_ifinfo_req(const struct nlmsghdr *nlh,
				      bool strict_check, struct nlattr **tb,
				      struct netlink_ext_ack *extack)
{
	struct ifinfomsg *ifm;
	int hdrlen;

	if (!strict_check) {
		/* A hack to preserve kernel<->userspace interface.
		 * The correct header is ifinfomsg. It is consistent with
		 * rtnl_getlink. However, before Linux v3.9 the code here
		 * assumed rtgenmsg and that's what iproute2 < v3.9.0 used.
		 * We can detect the old iproute2. Even including the
		 * IFLA_EXT_MASK attribute, its netlink message is shorter
		 * than struct ifinfomsg.
		 */
		if (nlmsg_len(nlh) < sizeof(struct ifinfomsg))
			hdrlen = sizeof(struct rtgenmsg);
		else
			hdrlen = sizeof(struct ifinfomsg);

		return nlmsg_parse_deprecated(nlh, hdrlen, tb, IFLA_MAX,
					      ifla_policy, extack);
	}

	if (nlh->nlmsg_len < nlmsg_msg_size(sizeof(*ifm))) {
		NL_SET_ERR_MSG(extack, "Invalid header for link dump");
		return -EINVAL;
	}

	ifm = nlmsg_data(nlh);

	if (ifm->__ifi_pad || ifm->ifi_type || ifm->ifi_flags ||
	    ifm->ifi_change) {
		NL_SET_ERR_MSG(extack, "Invalid values in header for link dump request");
		return -EINVAL;
	}

	if (ifm->ifi_index) {
		NL_SET_ERR_MSG(extack, "Filter by device index not supported for link dumps");
		return -EINVAL;
	}

	return nlmsg_parse_deprecated_strict(nlh, sizeof(*ifm), tb,
					     IFLA_MAX, ifla_policy,
					     extack);
}
2247
rtnl_dump_ifinfo(struct sk_buff * skb,struct netlink_callback * cb)2248 static int rtnl_dump_ifinfo(struct sk_buff *skb, struct netlink_callback *cb)
2249 {
2250 const struct rtnl_link_ops *kind_ops = NULL;
2251 struct netlink_ext_ack *extack = cb->extack;
2252 const struct nlmsghdr *nlh = cb->nlh;
2253 struct net *net = sock_net(skb->sk);
2254 unsigned int flags = NLM_F_MULTI;
2255 struct nlattr *tb[IFLA_MAX+1];
2256 struct {
2257 unsigned long ifindex;
2258 } *ctx = (void *)cb->ctx;
2259 struct net *tgt_net = net;
2260 u32 ext_filter_mask = 0;
2261 struct net_device *dev;
2262 int master_idx = 0;
2263 int netnsid = -1;
2264 int err, i;
2265
2266 err = rtnl_valid_dump_ifinfo_req(nlh, cb->strict_check, tb, extack);
2267 if (err < 0) {
2268 if (cb->strict_check)
2269 return err;
2270
2271 goto walk_entries;
2272 }
2273
2274 for (i = 0; i <= IFLA_MAX; ++i) {
2275 if (!tb[i])
2276 continue;
2277
2278 /* new attributes should only be added with strict checking */
2279 switch (i) {
2280 case IFLA_TARGET_NETNSID:
2281 netnsid = nla_get_s32(tb[i]);
2282 tgt_net = rtnl_get_net_ns_capable(skb->sk, netnsid);
2283 if (IS_ERR(tgt_net)) {
2284 NL_SET_ERR_MSG(extack, "Invalid target network namespace id");
2285 return PTR_ERR(tgt_net);
2286 }
2287 break;
2288 case IFLA_EXT_MASK:
2289 ext_filter_mask = nla_get_u32(tb[i]);
2290 break;
2291 case IFLA_MASTER:
2292 master_idx = nla_get_u32(tb[i]);
2293 break;
2294 case IFLA_LINKINFO:
2295 kind_ops = linkinfo_to_kind_ops(tb[i]);
2296 break;
2297 default:
2298 if (cb->strict_check) {
2299 NL_SET_ERR_MSG(extack, "Unsupported attribute in link dump request");
2300 return -EINVAL;
2301 }
2302 }
2303 }
2304
2305 if (master_idx || kind_ops)
2306 flags |= NLM_F_DUMP_FILTERED;
2307
2308 walk_entries:
2309 err = 0;
2310 for_each_netdev_dump(tgt_net, dev, ctx->ifindex) {
2311 if (link_dump_filtered(dev, master_idx, kind_ops))
2312 continue;
2313 err = rtnl_fill_ifinfo(skb, dev, net, RTM_NEWLINK,
2314 NETLINK_CB(cb->skb).portid,
2315 nlh->nlmsg_seq, 0, flags,
2316 ext_filter_mask, 0, NULL, 0,
2317 netnsid, GFP_KERNEL);
2318 if (err < 0)
2319 break;
2320 }
2321 cb->seq = tgt_net->dev_base_seq;
2322 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
2323 if (netnsid >= 0)
2324 put_net(tgt_net);
2325
2326 return err;
2327 }
2328
rtnl_nla_parse_ifinfomsg(struct nlattr ** tb,const struct nlattr * nla_peer,struct netlink_ext_ack * exterr)2329 int rtnl_nla_parse_ifinfomsg(struct nlattr **tb, const struct nlattr *nla_peer,
2330 struct netlink_ext_ack *exterr)
2331 {
2332 const struct ifinfomsg *ifmp;
2333 const struct nlattr *attrs;
2334 size_t len;
2335
2336 ifmp = nla_data(nla_peer);
2337 attrs = nla_data(nla_peer) + sizeof(struct ifinfomsg);
2338 len = nla_len(nla_peer) - sizeof(struct ifinfomsg);
2339
2340 if (ifmp->ifi_index < 0) {
2341 NL_SET_ERR_MSG_ATTR(exterr, nla_peer,
2342 "ifindex can't be negative");
2343 return -EINVAL;
2344 }
2345
2346 return nla_parse_deprecated(tb, IFLA_MAX, attrs, len, ifla_policy,
2347 exterr);
2348 }
2349 EXPORT_SYMBOL(rtnl_nla_parse_ifinfomsg);
2350
rtnl_link_get_net(struct net * src_net,struct nlattr * tb[])2351 struct net *rtnl_link_get_net(struct net *src_net, struct nlattr *tb[])
2352 {
2353 struct net *net;
2354 /* Examine the link attributes and figure out which
2355 * network namespace we are talking about.
2356 */
2357 if (tb[IFLA_NET_NS_PID])
2358 net = get_net_ns_by_pid(nla_get_u32(tb[IFLA_NET_NS_PID]));
2359 else if (tb[IFLA_NET_NS_FD])
2360 net = get_net_ns_by_fd(nla_get_u32(tb[IFLA_NET_NS_FD]));
2361 else
2362 net = get_net(src_net);
2363 return net;
2364 }
2365 EXPORT_SYMBOL(rtnl_link_get_net);
2366
2367 /* Figure out which network namespace we are talking about by
2368 * examining the link attributes in the following order:
2369 *
2370 * 1. IFLA_NET_NS_PID
2371 * 2. IFLA_NET_NS_FD
2372 * 3. IFLA_TARGET_NETNSID
2373 */
rtnl_link_get_net_by_nlattr(struct net * src_net,struct nlattr * tb[])2374 static struct net *rtnl_link_get_net_by_nlattr(struct net *src_net,
2375 struct nlattr *tb[])
2376 {
2377 struct net *net;
2378
2379 if (tb[IFLA_NET_NS_PID] || tb[IFLA_NET_NS_FD])
2380 return rtnl_link_get_net(src_net, tb);
2381
2382 if (!tb[IFLA_TARGET_NETNSID])
2383 return get_net(src_net);
2384
2385 net = get_net_ns_by_id(src_net, nla_get_u32(tb[IFLA_TARGET_NETNSID]));
2386 if (!net)
2387 return ERR_PTR(-EINVAL);
2388
2389 return net;
2390 }
2391
rtnl_link_get_net_capable(const struct sk_buff * skb,struct net * src_net,struct nlattr * tb[],int cap)2392 static struct net *rtnl_link_get_net_capable(const struct sk_buff *skb,
2393 struct net *src_net,
2394 struct nlattr *tb[], int cap)
2395 {
2396 struct net *net;
2397
2398 net = rtnl_link_get_net_by_nlattr(src_net, tb);
2399 if (IS_ERR(net))
2400 return net;
2401
2402 if (!netlink_ns_capable(skb, net->user_ns, cap)) {
2403 put_net(net);
2404 return ERR_PTR(-EPERM);
2405 }
2406
2407 return net;
2408 }
2409
2410 /* Verify that rtnetlink requests do not pass additional properties
2411 * potentially referring to different network namespaces.
2412 */
rtnl_ensure_unique_netns(struct nlattr * tb[],struct netlink_ext_ack * extack,bool netns_id_only)2413 static int rtnl_ensure_unique_netns(struct nlattr *tb[],
2414 struct netlink_ext_ack *extack,
2415 bool netns_id_only)
2416 {
2417
2418 if (netns_id_only) {
2419 if (!tb[IFLA_NET_NS_PID] && !tb[IFLA_NET_NS_FD])
2420 return 0;
2421
2422 NL_SET_ERR_MSG(extack, "specified netns attribute not supported");
2423 return -EOPNOTSUPP;
2424 }
2425
2426 if (tb[IFLA_TARGET_NETNSID] && (tb[IFLA_NET_NS_PID] || tb[IFLA_NET_NS_FD]))
2427 goto invalid_attr;
2428
2429 if (tb[IFLA_NET_NS_PID] && (tb[IFLA_TARGET_NETNSID] || tb[IFLA_NET_NS_FD]))
2430 goto invalid_attr;
2431
2432 if (tb[IFLA_NET_NS_FD] && (tb[IFLA_TARGET_NETNSID] || tb[IFLA_NET_NS_PID]))
2433 goto invalid_attr;
2434
2435 return 0;
2436
2437 invalid_attr:
2438 NL_SET_ERR_MSG(extack, "multiple netns identifying attributes specified");
2439 return -EINVAL;
2440 }
2441
rtnl_set_vf_rate(struct net_device * dev,int vf,int min_tx_rate,int max_tx_rate)2442 static int rtnl_set_vf_rate(struct net_device *dev, int vf, int min_tx_rate,
2443 int max_tx_rate)
2444 {
2445 const struct net_device_ops *ops = dev->netdev_ops;
2446
2447 if (!ops->ndo_set_vf_rate)
2448 return -EOPNOTSUPP;
2449 if (max_tx_rate && max_tx_rate < min_tx_rate)
2450 return -EINVAL;
2451
2452 return ops->ndo_set_vf_rate(dev, vf, min_tx_rate, max_tx_rate);
2453 }
2454
validate_linkmsg(struct net_device * dev,struct nlattr * tb[],struct netlink_ext_ack * extack)2455 static int validate_linkmsg(struct net_device *dev, struct nlattr *tb[],
2456 struct netlink_ext_ack *extack)
2457 {
2458 if (tb[IFLA_ADDRESS] &&
2459 nla_len(tb[IFLA_ADDRESS]) < dev->addr_len)
2460 return -EINVAL;
2461
2462 if (tb[IFLA_BROADCAST] &&
2463 nla_len(tb[IFLA_BROADCAST]) < dev->addr_len)
2464 return -EINVAL;
2465
2466 if (tb[IFLA_GSO_MAX_SIZE] &&
2467 nla_get_u32(tb[IFLA_GSO_MAX_SIZE]) > dev->tso_max_size) {
2468 NL_SET_ERR_MSG(extack, "too big gso_max_size");
2469 return -EINVAL;
2470 }
2471
2472 if (tb[IFLA_GSO_MAX_SEGS] &&
2473 (nla_get_u32(tb[IFLA_GSO_MAX_SEGS]) > GSO_MAX_SEGS ||
2474 nla_get_u32(tb[IFLA_GSO_MAX_SEGS]) > dev->tso_max_segs)) {
2475 NL_SET_ERR_MSG(extack, "too big gso_max_segs");
2476 return -EINVAL;
2477 }
2478
2479 if (tb[IFLA_GRO_MAX_SIZE] &&
2480 nla_get_u32(tb[IFLA_GRO_MAX_SIZE]) > GRO_MAX_SIZE) {
2481 NL_SET_ERR_MSG(extack, "too big gro_max_size");
2482 return -EINVAL;
2483 }
2484
2485 if (tb[IFLA_GSO_IPV4_MAX_SIZE] &&
2486 nla_get_u32(tb[IFLA_GSO_IPV4_MAX_SIZE]) > dev->tso_max_size) {
2487 NL_SET_ERR_MSG(extack, "too big gso_ipv4_max_size");
2488 return -EINVAL;
2489 }
2490
2491 if (tb[IFLA_GRO_IPV4_MAX_SIZE] &&
2492 nla_get_u32(tb[IFLA_GRO_IPV4_MAX_SIZE]) > GRO_MAX_SIZE) {
2493 NL_SET_ERR_MSG(extack, "too big gro_ipv4_max_size");
2494 return -EINVAL;
2495 }
2496
2497 if (tb[IFLA_AF_SPEC]) {
2498 struct nlattr *af;
2499 int rem, err;
2500
2501 nla_for_each_nested(af, tb[IFLA_AF_SPEC], rem) {
2502 const struct rtnl_af_ops *af_ops;
2503
2504 af_ops = rtnl_af_lookup(nla_type(af));
2505 if (!af_ops)
2506 return -EAFNOSUPPORT;
2507
2508 if (!af_ops->set_link_af)
2509 return -EOPNOTSUPP;
2510
2511 if (af_ops->validate_link_af) {
2512 err = af_ops->validate_link_af(dev, af, extack);
2513 if (err < 0)
2514 return err;
2515 }
2516 }
2517 }
2518
2519 return 0;
2520 }
2521
handle_infiniband_guid(struct net_device * dev,struct ifla_vf_guid * ivt,int guid_type)2522 static int handle_infiniband_guid(struct net_device *dev, struct ifla_vf_guid *ivt,
2523 int guid_type)
2524 {
2525 const struct net_device_ops *ops = dev->netdev_ops;
2526
2527 return ops->ndo_set_vf_guid(dev, ivt->vf, ivt->guid, guid_type);
2528 }
2529
handle_vf_guid(struct net_device * dev,struct ifla_vf_guid * ivt,int guid_type)2530 static int handle_vf_guid(struct net_device *dev, struct ifla_vf_guid *ivt, int guid_type)
2531 {
2532 if (dev->type != ARPHRD_INFINIBAND)
2533 return -EOPNOTSUPP;
2534
2535 return handle_infiniband_guid(dev, ivt, guid_type);
2536 }
2537
do_setvfinfo(struct net_device * dev,struct nlattr ** tb)2538 static int do_setvfinfo(struct net_device *dev, struct nlattr **tb)
2539 {
2540 const struct net_device_ops *ops = dev->netdev_ops;
2541 int err = -EINVAL;
2542
2543 if (tb[IFLA_VF_MAC]) {
2544 struct ifla_vf_mac *ivm = nla_data(tb[IFLA_VF_MAC]);
2545
2546 if (ivm->vf >= INT_MAX)
2547 return -EINVAL;
2548 err = -EOPNOTSUPP;
2549 if (ops->ndo_set_vf_mac)
2550 err = ops->ndo_set_vf_mac(dev, ivm->vf,
2551 ivm->mac);
2552 if (err < 0)
2553 return err;
2554 }
2555
2556 if (tb[IFLA_VF_VLAN]) {
2557 struct ifla_vf_vlan *ivv = nla_data(tb[IFLA_VF_VLAN]);
2558
2559 if (ivv->vf >= INT_MAX)
2560 return -EINVAL;
2561 err = -EOPNOTSUPP;
2562 if (ops->ndo_set_vf_vlan)
2563 err = ops->ndo_set_vf_vlan(dev, ivv->vf, ivv->vlan,
2564 ivv->qos,
2565 htons(ETH_P_8021Q));
2566 if (err < 0)
2567 return err;
2568 }
2569
2570 if (tb[IFLA_VF_VLAN_LIST]) {
2571 struct ifla_vf_vlan_info *ivvl[MAX_VLAN_LIST_LEN];
2572 struct nlattr *attr;
2573 int rem, len = 0;
2574
2575 err = -EOPNOTSUPP;
2576 if (!ops->ndo_set_vf_vlan)
2577 return err;
2578
2579 nla_for_each_nested(attr, tb[IFLA_VF_VLAN_LIST], rem) {
2580 if (nla_type(attr) != IFLA_VF_VLAN_INFO ||
2581 nla_len(attr) < sizeof(struct ifla_vf_vlan_info)) {
2582 return -EINVAL;
2583 }
2584 if (len >= MAX_VLAN_LIST_LEN)
2585 return -EOPNOTSUPP;
2586 ivvl[len] = nla_data(attr);
2587
2588 len++;
2589 }
2590 if (len == 0)
2591 return -EINVAL;
2592
2593 if (ivvl[0]->vf >= INT_MAX)
2594 return -EINVAL;
2595 err = ops->ndo_set_vf_vlan(dev, ivvl[0]->vf, ivvl[0]->vlan,
2596 ivvl[0]->qos, ivvl[0]->vlan_proto);
2597 if (err < 0)
2598 return err;
2599 }
2600
2601 if (tb[IFLA_VF_TX_RATE]) {
2602 struct ifla_vf_tx_rate *ivt = nla_data(tb[IFLA_VF_TX_RATE]);
2603 struct ifla_vf_info ivf;
2604
2605 if (ivt->vf >= INT_MAX)
2606 return -EINVAL;
2607 err = -EOPNOTSUPP;
2608 if (ops->ndo_get_vf_config)
2609 err = ops->ndo_get_vf_config(dev, ivt->vf, &ivf);
2610 if (err < 0)
2611 return err;
2612
2613 err = rtnl_set_vf_rate(dev, ivt->vf,
2614 ivf.min_tx_rate, ivt->rate);
2615 if (err < 0)
2616 return err;
2617 }
2618
2619 if (tb[IFLA_VF_RATE]) {
2620 struct ifla_vf_rate *ivt = nla_data(tb[IFLA_VF_RATE]);
2621
2622 if (ivt->vf >= INT_MAX)
2623 return -EINVAL;
2624
2625 err = rtnl_set_vf_rate(dev, ivt->vf,
2626 ivt->min_tx_rate, ivt->max_tx_rate);
2627 if (err < 0)
2628 return err;
2629 }
2630
2631 if (tb[IFLA_VF_SPOOFCHK]) {
2632 struct ifla_vf_spoofchk *ivs = nla_data(tb[IFLA_VF_SPOOFCHK]);
2633
2634 if (ivs->vf >= INT_MAX)
2635 return -EINVAL;
2636 err = -EOPNOTSUPP;
2637 if (ops->ndo_set_vf_spoofchk)
2638 err = ops->ndo_set_vf_spoofchk(dev, ivs->vf,
2639 ivs->setting);
2640 if (err < 0)
2641 return err;
2642 }
2643
2644 if (tb[IFLA_VF_LINK_STATE]) {
2645 struct ifla_vf_link_state *ivl = nla_data(tb[IFLA_VF_LINK_STATE]);
2646
2647 if (ivl->vf >= INT_MAX)
2648 return -EINVAL;
2649 err = -EOPNOTSUPP;
2650 if (ops->ndo_set_vf_link_state)
2651 err = ops->ndo_set_vf_link_state(dev, ivl->vf,
2652 ivl->link_state);
2653 if (err < 0)
2654 return err;
2655 }
2656
2657 if (tb[IFLA_VF_RSS_QUERY_EN]) {
2658 struct ifla_vf_rss_query_en *ivrssq_en;
2659
2660 err = -EOPNOTSUPP;
2661 ivrssq_en = nla_data(tb[IFLA_VF_RSS_QUERY_EN]);
2662 if (ivrssq_en->vf >= INT_MAX)
2663 return -EINVAL;
2664 if (ops->ndo_set_vf_rss_query_en)
2665 err = ops->ndo_set_vf_rss_query_en(dev, ivrssq_en->vf,
2666 ivrssq_en->setting);
2667 if (err < 0)
2668 return err;
2669 }
2670
2671 if (tb[IFLA_VF_TRUST]) {
2672 struct ifla_vf_trust *ivt = nla_data(tb[IFLA_VF_TRUST]);
2673
2674 if (ivt->vf >= INT_MAX)
2675 return -EINVAL;
2676 err = -EOPNOTSUPP;
2677 if (ops->ndo_set_vf_trust)
2678 err = ops->ndo_set_vf_trust(dev, ivt->vf, ivt->setting);
2679 if (err < 0)
2680 return err;
2681 }
2682
2683 if (tb[IFLA_VF_IB_NODE_GUID]) {
2684 struct ifla_vf_guid *ivt = nla_data(tb[IFLA_VF_IB_NODE_GUID]);
2685
2686 if (ivt->vf >= INT_MAX)
2687 return -EINVAL;
2688 if (!ops->ndo_set_vf_guid)
2689 return -EOPNOTSUPP;
2690 return handle_vf_guid(dev, ivt, IFLA_VF_IB_NODE_GUID);
2691 }
2692
2693 if (tb[IFLA_VF_IB_PORT_GUID]) {
2694 struct ifla_vf_guid *ivt = nla_data(tb[IFLA_VF_IB_PORT_GUID]);
2695
2696 if (ivt->vf >= INT_MAX)
2697 return -EINVAL;
2698 if (!ops->ndo_set_vf_guid)
2699 return -EOPNOTSUPP;
2700
2701 return handle_vf_guid(dev, ivt, IFLA_VF_IB_PORT_GUID);
2702 }
2703
2704 return err;
2705 }
2706
do_set_master(struct net_device * dev,int ifindex,struct netlink_ext_ack * extack)2707 static int do_set_master(struct net_device *dev, int ifindex,
2708 struct netlink_ext_ack *extack)
2709 {
2710 struct net_device *upper_dev = netdev_master_upper_dev_get(dev);
2711 const struct net_device_ops *ops;
2712 int err;
2713
2714 if (upper_dev) {
2715 if (upper_dev->ifindex == ifindex)
2716 return 0;
2717 ops = upper_dev->netdev_ops;
2718 if (ops->ndo_del_slave) {
2719 err = ops->ndo_del_slave(upper_dev, dev);
2720 if (err)
2721 return err;
2722 } else {
2723 return -EOPNOTSUPP;
2724 }
2725 }
2726
2727 if (ifindex) {
2728 upper_dev = __dev_get_by_index(dev_net(dev), ifindex);
2729 if (!upper_dev)
2730 return -EINVAL;
2731 ops = upper_dev->netdev_ops;
2732 if (ops->ndo_add_slave) {
2733 err = ops->ndo_add_slave(upper_dev, dev, extack);
2734 if (err)
2735 return err;
2736 } else {
2737 return -EOPNOTSUPP;
2738 }
2739 }
2740 return 0;
2741 }
2742
/*
 * Policy for the attributes nested inside IFLA_PROTO_DOWN_REASON, applied
 * by do_set_proto_down(). Both the mask and the value are 32-bit.
 */
static const struct nla_policy ifla_proto_down_reason_policy[IFLA_PROTO_DOWN_REASON_VALUE + 1] = {
	[IFLA_PROTO_DOWN_REASON_MASK]	= { .type = NLA_U32 },
	[IFLA_PROTO_DOWN_REASON_VALUE]	= { .type = NLA_U32 },
};
2747
do_set_proto_down(struct net_device * dev,struct nlattr * nl_proto_down,struct nlattr * nl_proto_down_reason,struct netlink_ext_ack * extack)2748 static int do_set_proto_down(struct net_device *dev,
2749 struct nlattr *nl_proto_down,
2750 struct nlattr *nl_proto_down_reason,
2751 struct netlink_ext_ack *extack)
2752 {
2753 struct nlattr *pdreason[IFLA_PROTO_DOWN_REASON_MAX + 1];
2754 unsigned long mask = 0;
2755 u32 value;
2756 bool proto_down;
2757 int err;
2758
2759 if (!dev->change_proto_down) {
2760 NL_SET_ERR_MSG(extack, "Protodown not supported by device");
2761 return -EOPNOTSUPP;
2762 }
2763
2764 if (nl_proto_down_reason) {
2765 err = nla_parse_nested_deprecated(pdreason,
2766 IFLA_PROTO_DOWN_REASON_MAX,
2767 nl_proto_down_reason,
2768 ifla_proto_down_reason_policy,
2769 NULL);
2770 if (err < 0)
2771 return err;
2772
2773 if (!pdreason[IFLA_PROTO_DOWN_REASON_VALUE]) {
2774 NL_SET_ERR_MSG(extack, "Invalid protodown reason value");
2775 return -EINVAL;
2776 }
2777
2778 value = nla_get_u32(pdreason[IFLA_PROTO_DOWN_REASON_VALUE]);
2779
2780 if (pdreason[IFLA_PROTO_DOWN_REASON_MASK])
2781 mask = nla_get_u32(pdreason[IFLA_PROTO_DOWN_REASON_MASK]);
2782
2783 dev_change_proto_down_reason(dev, mask, value);
2784 }
2785
2786 if (nl_proto_down) {
2787 proto_down = nla_get_u8(nl_proto_down);
2788
2789 /* Don't turn off protodown if there are active reasons */
2790 if (!proto_down && dev->proto_down_reason) {
2791 NL_SET_ERR_MSG(extack, "Cannot clear protodown, active reasons");
2792 return -EBUSY;
2793 }
2794 err = dev_change_proto_down(dev,
2795 proto_down);
2796 if (err)
2797 return err;
2798 }
2799
2800 return 0;
2801 }
2802
/*
 * Bits accumulated in do_setlink()'s status word. MODIFIED records that
 * something on the device has already been changed; NOTIFY additionally
 * requests a netdev_state_change() notification at the end.
 */
#define DO_SETLINK_MODIFIED	0x01
/* notify flag means notify + modified. */
#define DO_SETLINK_NOTIFY	0x03
/*
 * do_setlink - apply the attributes of a link change request to a device
 * @skb: request buffer, used for the namespace capability check
 * @dev: device being modified
 * @ifm: request header (ifi_index, ifi_flags and ifi_change are read)
 * @extack: extended ack for error reporting
 * @tb: parsed IFLA_* attributes
 * @status: initial DO_SETLINK_* bits; more are OR-ed in as changes land
 *
 * Attributes are applied one after another in the fixed order below and
 * the function bails out to errout on the first failure. Changes that
 * were already applied are not rolled back; when that happens a
 * rate-limited warning naming the interface is logged.
 *
 * Returns err: 0 when every requested change succeeded, otherwise the
 * error from the step that failed.
 */
static int do_setlink(const struct sk_buff *skb,
		      struct net_device *dev, struct ifinfomsg *ifm,
		      struct netlink_ext_ack *extack,
		      struct nlattr **tb, int status)
{
	const struct net_device_ops *ops = dev->netdev_ops;
	char ifname[IFNAMSIZ];
	int err;

	/* An empty ifname means "no name supplied". */
	if (tb[IFLA_IFNAME])
		nla_strscpy(ifname, tb[IFLA_IFNAME], IFNAMSIZ);
	else
		ifname[0] = '\0';

	/* Move the device to another namespace first, optionally with a
	 * new name pattern and a new ifindex.
	 */
	if (tb[IFLA_NET_NS_PID] || tb[IFLA_NET_NS_FD] || tb[IFLA_TARGET_NETNSID]) {
		const char *pat = ifname[0] ? ifname : NULL;
		struct net *net;
		int new_ifindex;

		net = rtnl_link_get_net_capable(skb, dev_net(dev),
						tb, CAP_NET_ADMIN);
		if (IS_ERR(net)) {
			err = PTR_ERR(net);
			goto errout;
		}

		if (tb[IFLA_NEW_IFINDEX])
			new_ifindex = nla_get_s32(tb[IFLA_NEW_IFINDEX]);
		else
			new_ifindex = 0;

		err = __dev_change_net_namespace(dev, net, pat, new_ifindex);
		/* The reference is dropped whether or not the move worked. */
		put_net(net);
		if (err)
			goto errout;
		status |= DO_SETLINK_MODIFIED;
	}

	if (tb[IFLA_MAP]) {
		struct rtnl_link_ifmap *u_map;
		struct ifmap k_map;

		if (!ops->ndo_set_config) {
			err = -EOPNOTSUPP;
			goto errout;
		}

		if (!netif_device_present(dev)) {
			err = -ENODEV;
			goto errout;
		}

		/* Convert the netlink layout into the struct ifmap the
		 * driver hook takes, narrowing each field with a cast.
		 */
		u_map = nla_data(tb[IFLA_MAP]);
		k_map.mem_start = (unsigned long) u_map->mem_start;
		k_map.mem_end = (unsigned long) u_map->mem_end;
		k_map.base_addr = (unsigned short) u_map->base_addr;
		k_map.irq = (unsigned char) u_map->irq;
		k_map.dma = (unsigned char) u_map->dma;
		k_map.port = (unsigned char) u_map->port;

		err = ops->ndo_set_config(dev, &k_map);
		if (err < 0)
			goto errout;

		status |= DO_SETLINK_NOTIFY;
	}

	if (tb[IFLA_ADDRESS]) {
		struct sockaddr *sa;
		int len;

		/* Room for the family plus the larger of the device address
		 * length and a whole struct sockaddr.
		 */
		len = sizeof(sa_family_t) + max_t(size_t, dev->addr_len,
						  sizeof(*sa));
		sa = kmalloc(len, GFP_KERNEL);
		if (!sa) {
			err = -ENOMEM;
			goto errout;
		}
		sa->sa_family = dev->type;
		memcpy(sa->sa_data, nla_data(tb[IFLA_ADDRESS]),
		       dev->addr_len);
		err = dev_set_mac_address_user(dev, sa, extack);
		kfree(sa);
		if (err)
			goto errout;
		status |= DO_SETLINK_MODIFIED;
	}

	if (tb[IFLA_MTU]) {
		err = dev_set_mtu_ext(dev, nla_get_u32(tb[IFLA_MTU]), extack);
		if (err < 0)
			goto errout;
		status |= DO_SETLINK_MODIFIED;
	}

	if (tb[IFLA_GROUP]) {
		dev_set_group(dev, nla_get_u32(tb[IFLA_GROUP]));
		status |= DO_SETLINK_NOTIFY;
	}

	/*
	 * Interface selected by interface index but interface
	 * name provided implies that a name change has been
	 * requested.
	 */
	if (ifm->ifi_index > 0 && ifname[0]) {
		err = dev_change_name(dev, ifname);
		if (err < 0)
			goto errout;
		status |= DO_SETLINK_MODIFIED;
	}

	if (tb[IFLA_IFALIAS]) {
		err = dev_set_alias(dev, nla_data(tb[IFLA_IFALIAS]),
				    nla_len(tb[IFLA_IFALIAS]));
		if (err < 0)
			goto errout;
		status |= DO_SETLINK_NOTIFY;
	}

	/* The broadcast address is written directly and announced with a
	 * NETDEV_CHANGEADDR notifier; status is left untouched here.
	 */
	if (tb[IFLA_BROADCAST]) {
		nla_memcpy(dev->broadcast, tb[IFLA_BROADCAST], dev->addr_len);
		call_netdevice_notifiers(NETDEV_CHANGEADDR, dev);
	}

	if (ifm->ifi_flags || ifm->ifi_change) {
		err = dev_change_flags(dev, rtnl_dev_combine_flags(dev, ifm),
				       extack);
		if (err < 0)
			goto errout;
	}

	if (tb[IFLA_MASTER]) {
		err = do_set_master(dev, nla_get_u32(tb[IFLA_MASTER]), extack);
		if (err)
			goto errout;
		status |= DO_SETLINK_MODIFIED;
	}

	if (tb[IFLA_CARRIER]) {
		err = dev_change_carrier(dev, nla_get_u8(tb[IFLA_CARRIER]));
		if (err)
			goto errout;
		status |= DO_SETLINK_MODIFIED;
	}

	if (tb[IFLA_TXQLEN]) {
		unsigned int value = nla_get_u32(tb[IFLA_TXQLEN]);

		err = dev_change_tx_queue_len(dev, value);
		if (err)
			goto errout;
		status |= DO_SETLINK_MODIFIED;
	}

	/* For the GSO/GRO limits below, the XOR is non-zero exactly when
	 * the requested value differs from the current one, so unchanged
	 * values neither call the setter nor mark the device modified.
	 */
	if (tb[IFLA_GSO_MAX_SIZE]) {
		u32 max_size = nla_get_u32(tb[IFLA_GSO_MAX_SIZE]);

		if (dev->gso_max_size ^ max_size) {
			netif_set_gso_max_size(dev, max_size);
			status |= DO_SETLINK_MODIFIED;
		}
	}

	if (tb[IFLA_GSO_MAX_SEGS]) {
		u32 max_segs = nla_get_u32(tb[IFLA_GSO_MAX_SEGS]);

		if (dev->gso_max_segs ^ max_segs) {
			netif_set_gso_max_segs(dev, max_segs);
			status |= DO_SETLINK_MODIFIED;
		}
	}

	if (tb[IFLA_GRO_MAX_SIZE]) {
		u32 gro_max_size = nla_get_u32(tb[IFLA_GRO_MAX_SIZE]);

		if (dev->gro_max_size ^ gro_max_size) {
			netif_set_gro_max_size(dev, gro_max_size);
			status |= DO_SETLINK_MODIFIED;
		}
	}

	if (tb[IFLA_GSO_IPV4_MAX_SIZE]) {
		u32 max_size = nla_get_u32(tb[IFLA_GSO_IPV4_MAX_SIZE]);

		if (dev->gso_ipv4_max_size ^ max_size) {
			netif_set_gso_ipv4_max_size(dev, max_size);
			status |= DO_SETLINK_MODIFIED;
		}
	}

	if (tb[IFLA_GRO_IPV4_MAX_SIZE]) {
		u32 gro_max_size = nla_get_u32(tb[IFLA_GRO_IPV4_MAX_SIZE]);

		if (dev->gro_ipv4_max_size ^ gro_max_size) {
			netif_set_gro_ipv4_max_size(dev, gro_max_size);
			status |= DO_SETLINK_MODIFIED;
		}
	}

	if (tb[IFLA_OPERSTATE])
		set_operstate(dev, nla_get_u8(tb[IFLA_OPERSTATE]));

	if (tb[IFLA_LINKMODE]) {
		unsigned char value = nla_get_u8(tb[IFLA_LINKMODE]);

		/* Notify only on an actual change; the store is unconditional. */
		if (dev->link_mode ^ value)
			status |= DO_SETLINK_NOTIFY;
		WRITE_ONCE(dev->link_mode, value);
	}

	/* Each IFLA_VF_INFO entry is parsed and applied on its own. */
	if (tb[IFLA_VFINFO_LIST]) {
		struct nlattr *vfinfo[IFLA_VF_MAX + 1];
		struct nlattr *attr;
		int rem;

		nla_for_each_nested(attr, tb[IFLA_VFINFO_LIST], rem) {
			if (nla_type(attr) != IFLA_VF_INFO ||
			    nla_len(attr) < NLA_HDRLEN) {
				err = -EINVAL;
				goto errout;
			}
			err = nla_parse_nested_deprecated(vfinfo, IFLA_VF_MAX,
							  attr,
							  ifla_vf_policy,
							  NULL);
			if (err < 0)
				goto errout;
			err = do_setvfinfo(dev, vfinfo);
			if (err < 0)
				goto errout;
			status |= DO_SETLINK_NOTIFY;
		}
	}
	/* Reset err so a leftover value from above is not returned. */
	err = 0;

	if (tb[IFLA_VF_PORTS]) {
		struct nlattr *port[IFLA_PORT_MAX+1];
		struct nlattr *attr;
		int vf;
		int rem;

		err = -EOPNOTSUPP;
		if (!ops->ndo_set_vf_port)
			goto errout;

		nla_for_each_nested(attr, tb[IFLA_VF_PORTS], rem) {
			if (nla_type(attr) != IFLA_VF_PORT ||
			    nla_len(attr) < NLA_HDRLEN) {
				err = -EINVAL;
				goto errout;
			}
			err = nla_parse_nested_deprecated(port, IFLA_PORT_MAX,
							  attr,
							  ifla_port_policy,
							  NULL);
			if (err < 0)
				goto errout;
			/* Every port entry must say which VF it targets. */
			if (!port[IFLA_PORT_VF]) {
				err = -EOPNOTSUPP;
				goto errout;
			}
			vf = nla_get_u32(port[IFLA_PORT_VF]);
			err = ops->ndo_set_vf_port(dev, vf, port);
			if (err < 0)
				goto errout;
			status |= DO_SETLINK_NOTIFY;
		}
	}
	err = 0;

	/* Same driver hook as IFLA_VF_PORTS, addressed to PORT_SELF_VF. */
	if (tb[IFLA_PORT_SELF]) {
		struct nlattr *port[IFLA_PORT_MAX+1];

		err = nla_parse_nested_deprecated(port, IFLA_PORT_MAX,
						  tb[IFLA_PORT_SELF],
						  ifla_port_policy, NULL);
		if (err < 0)
			goto errout;

		err = -EOPNOTSUPP;
		if (ops->ndo_set_vf_port)
			err = ops->ndo_set_vf_port(dev, PORT_SELF_VF, port);
		if (err < 0)
			goto errout;
		status |= DO_SETLINK_NOTIFY;
	}

	if (tb[IFLA_AF_SPEC]) {
		struct nlattr *af;
		int rem;

		nla_for_each_nested(af, tb[IFLA_AF_SPEC], rem) {
			const struct rtnl_af_ops *af_ops;

			/* A missing family is treated as a kernel bug here;
			 * validate_linkmsg() rejects unknown families and
			 * is presumably run by callers beforehand.
			 */
			BUG_ON(!(af_ops = rtnl_af_lookup(nla_type(af))));

			err = af_ops->set_link_af(dev, af, extack);
			if (err < 0)
				goto errout;

			status |= DO_SETLINK_NOTIFY;
		}
	}
	err = 0;

	if (tb[IFLA_PROTO_DOWN] || tb[IFLA_PROTO_DOWN_REASON]) {
		err = do_set_proto_down(dev, tb[IFLA_PROTO_DOWN],
					tb[IFLA_PROTO_DOWN_REASON], extack);
		if (err)
			goto errout;
		status |= DO_SETLINK_NOTIFY;
	}

	if (tb[IFLA_XDP]) {
		struct nlattr *xdp[IFLA_XDP_MAX + 1];
		u32 xdp_flags = 0;

		err = nla_parse_nested_deprecated(xdp, IFLA_XDP_MAX,
						  tb[IFLA_XDP],
						  ifla_xdp_policy, NULL);
		if (err < 0)
			goto errout;

		/* These two attributes are not accepted in a set request. */
		if (xdp[IFLA_XDP_ATTACHED] || xdp[IFLA_XDP_PROG_ID]) {
			err = -EINVAL;
			goto errout;
		}

		if (xdp[IFLA_XDP_FLAGS]) {
			xdp_flags = nla_get_u32(xdp[IFLA_XDP_FLAGS]);
			if (xdp_flags & ~XDP_FLAGS_MASK) {
				err = -EINVAL;
				goto errout;
			}
			/* At most one mode bit may be set. */
			if (hweight32(xdp_flags & XDP_FLAGS_MODES) > 1) {
				err = -EINVAL;
				goto errout;
			}
		}

		if (xdp[IFLA_XDP_FD]) {
			int expected_fd = -1;

			/* XDP_FLAGS_REPLACE requires the expected fd. */
			if (xdp_flags & XDP_FLAGS_REPLACE) {
				if (!xdp[IFLA_XDP_EXPECTED_FD]) {
					err = -EINVAL;
					goto errout;
				}
				expected_fd =
					nla_get_s32(xdp[IFLA_XDP_EXPECTED_FD]);
			}

			err = dev_change_xdp_fd(dev, extack,
						nla_get_s32(xdp[IFLA_XDP_FD]),
						expected_fd,
						xdp_flags);
			if (err)
				goto errout;
			status |= DO_SETLINK_NOTIFY;
		}
	}

errout:
	/* Reached on success as well as on failure. */
	if (status & DO_SETLINK_MODIFIED) {
		if ((status & DO_SETLINK_NOTIFY) == DO_SETLINK_NOTIFY)
			netdev_state_change(dev);

		if (err < 0)
			net_warn_ratelimited("A link change request failed with some changes committed already. Interface %s may have been left with an inconsistent configuration, please check.\n",
					     dev->name);
	}

	return err;
}
3181
rtnl_dev_get(struct net * net,struct nlattr * tb[])3182 static struct net_device *rtnl_dev_get(struct net *net,
3183 struct nlattr *tb[])
3184 {
3185 char ifname[ALTIFNAMSIZ];
3186
3187 if (tb[IFLA_IFNAME])
3188 nla_strscpy(ifname, tb[IFLA_IFNAME], IFNAMSIZ);
3189 else if (tb[IFLA_ALT_IFNAME])
3190 nla_strscpy(ifname, tb[IFLA_ALT_IFNAME], ALTIFNAMSIZ);
3191 else
3192 return NULL;
3193
3194 return __dev_get_by_name(net, ifname);
3195 }
3196
rtnl_setlink(struct sk_buff * skb,struct nlmsghdr * nlh,struct netlink_ext_ack * extack)3197 static int rtnl_setlink(struct sk_buff *skb, struct nlmsghdr *nlh,
3198 struct netlink_ext_ack *extack)
3199 {
3200 struct net *net = sock_net(skb->sk);
3201 struct ifinfomsg *ifm;
3202 struct net_device *dev;
3203 int err;
3204 struct nlattr *tb[IFLA_MAX+1];
3205
3206 err = nlmsg_parse_deprecated(nlh, sizeof(*ifm), tb, IFLA_MAX,
3207 ifla_policy, extack);
3208 if (err < 0)
3209 goto errout;
3210
3211 err = rtnl_ensure_unique_netns(tb, extack, false);
3212 if (err < 0)
3213 goto errout;
3214
3215 err = -EINVAL;
3216 ifm = nlmsg_data(nlh);
3217 if (ifm->ifi_index > 0)
3218 dev = __dev_get_by_index(net, ifm->ifi_index);
3219 else if (tb[IFLA_IFNAME] || tb[IFLA_ALT_IFNAME])
3220 dev = rtnl_dev_get(net, tb);
3221 else
3222 goto errout;
3223
3224 if (dev == NULL) {
3225 err = -ENODEV;
3226 goto errout;
3227 }
3228
3229 err = validate_linkmsg(dev, tb, extack);
3230 if (err < 0)
3231 goto errout;
3232
3233 err = do_setlink(skb, dev, ifm, extack, tb, 0);
3234 errout:
3235 return err;
3236 }
3237
rtnl_group_dellink(const struct net * net,int group)3238 static int rtnl_group_dellink(const struct net *net, int group)
3239 {
3240 struct net_device *dev, *aux;
3241 LIST_HEAD(list_kill);
3242 bool found = false;
3243
3244 if (!group)
3245 return -EPERM;
3246
3247 for_each_netdev(net, dev) {
3248 if (dev->group == group) {
3249 const struct rtnl_link_ops *ops;
3250
3251 found = true;
3252 ops = dev->rtnl_link_ops;
3253 if (!ops || !ops->dellink)
3254 return -EOPNOTSUPP;
3255 }
3256 }
3257
3258 if (!found)
3259 return -ENODEV;
3260
3261 for_each_netdev_safe(net, dev, aux) {
3262 if (dev->group == group) {
3263 const struct rtnl_link_ops *ops;
3264
3265 ops = dev->rtnl_link_ops;
3266 ops->dellink(dev, &list_kill);
3267 }
3268 }
3269 unregister_netdevice_many(&list_kill);
3270
3271 return 0;
3272 }
3273
/*
 * Delete @dev through its rtnl_link_ops->dellink operation and unregister
 * whatever that operation queued, passing @portid and @nlh on to
 * unregister_netdevice_many_notify().
 *
 * Returns 0 on success or -EOPNOTSUPP when the device has no link ops or
 * no dellink operation.
 */
int rtnl_delete_link(struct net_device *dev, u32 portid, const struct nlmsghdr *nlh)
{
	const struct rtnl_link_ops *ops = dev->rtnl_link_ops;
	LIST_HEAD(doomed);

	if (ops && ops->dellink) {
		ops->dellink(dev, &doomed);
		unregister_netdevice_many_notify(&doomed, portid, nlh);
		return 0;
	}

	return -EOPNOTSUPP;
}
EXPORT_SYMBOL_GPL(rtnl_delete_link);
3289
rtnl_dellink(struct sk_buff * skb,struct nlmsghdr * nlh,struct netlink_ext_ack * extack)3290 static int rtnl_dellink(struct sk_buff *skb, struct nlmsghdr *nlh,
3291 struct netlink_ext_ack *extack)
3292 {
3293 struct net *net = sock_net(skb->sk);
3294 u32 portid = NETLINK_CB(skb).portid;
3295 struct net *tgt_net = net;
3296 struct net_device *dev = NULL;
3297 struct ifinfomsg *ifm;
3298 struct nlattr *tb[IFLA_MAX+1];
3299 int err;
3300 int netnsid = -1;
3301
3302 err = nlmsg_parse_deprecated(nlh, sizeof(*ifm), tb, IFLA_MAX,
3303 ifla_policy, extack);
3304 if (err < 0)
3305 return err;
3306
3307 err = rtnl_ensure_unique_netns(tb, extack, true);
3308 if (err < 0)
3309 return err;
3310
3311 if (tb[IFLA_TARGET_NETNSID]) {
3312 netnsid = nla_get_s32(tb[IFLA_TARGET_NETNSID]);
3313 tgt_net = rtnl_get_net_ns_capable(NETLINK_CB(skb).sk, netnsid);
3314 if (IS_ERR(tgt_net))
3315 return PTR_ERR(tgt_net);
3316 }
3317
3318 err = -EINVAL;
3319 ifm = nlmsg_data(nlh);
3320 if (ifm->ifi_index > 0)
3321 dev = __dev_get_by_index(tgt_net, ifm->ifi_index);
3322 else if (tb[IFLA_IFNAME] || tb[IFLA_ALT_IFNAME])
3323 dev = rtnl_dev_get(tgt_net, tb);
3324 else if (tb[IFLA_GROUP])
3325 err = rtnl_group_dellink(tgt_net, nla_get_u32(tb[IFLA_GROUP]));
3326 else
3327 goto out;
3328
3329 if (!dev) {
3330 if (tb[IFLA_IFNAME] || tb[IFLA_ALT_IFNAME] || ifm->ifi_index > 0)
3331 err = -ENODEV;
3332
3333 goto out;
3334 }
3335
3336 err = rtnl_delete_link(dev, portid, nlh);
3337
3338 out:
3339 if (netnsid >= 0)
3340 put_net(tgt_net);
3341
3342 return err;
3343 }
3344
/*
 * Apply the flags requested in @ifm (if any) to @dev and notify about the
 * resulting flag change.
 *
 * A device whose rtnl_link_state is not yet RTNL_LINK_INITIALIZED is marked
 * initialized here and the notification reports every flag bit as changed
 * (~0U); otherwise only the bits that actually differ are reported.
 *
 * Returns 0 on success or the negative error from __dev_change_flags().
 */
int rtnl_configure_link(struct net_device *dev, const struct ifinfomsg *ifm,
			u32 portid, const struct nlmsghdr *nlh)
{
	unsigned int old_flags = dev->flags;
	unsigned int changes;

	if (ifm && (ifm->ifi_flags || ifm->ifi_change)) {
		int err = __dev_change_flags(dev,
					     rtnl_dev_combine_flags(dev, ifm),
					     NULL);

		if (err < 0)
			return err;
	}

	if (dev->rtnl_link_state == RTNL_LINK_INITIALIZED) {
		changes = old_flags ^ dev->flags;
	} else {
		dev->rtnl_link_state = RTNL_LINK_INITIALIZED;
		changes = ~0U;
	}

	__dev_notify_flags(dev, old_flags, changes, portid, nlh);

	return 0;
}
EXPORT_SYMBOL(rtnl_configure_link);
3368
rtnl_create_link(struct net * net,const char * ifname,unsigned char name_assign_type,const struct rtnl_link_ops * ops,struct nlattr * tb[],struct netlink_ext_ack * extack)3369 struct net_device *rtnl_create_link(struct net *net, const char *ifname,
3370 unsigned char name_assign_type,
3371 const struct rtnl_link_ops *ops,
3372 struct nlattr *tb[],
3373 struct netlink_ext_ack *extack)
3374 {
3375 struct net_device *dev;
3376 unsigned int num_tx_queues = 1;
3377 unsigned int num_rx_queues = 1;
3378 int err;
3379
3380 if (tb[IFLA_NUM_TX_QUEUES])
3381 num_tx_queues = nla_get_u32(tb[IFLA_NUM_TX_QUEUES]);
3382 else if (ops->get_num_tx_queues)
3383 num_tx_queues = ops->get_num_tx_queues();
3384
3385 if (tb[IFLA_NUM_RX_QUEUES])
3386 num_rx_queues = nla_get_u32(tb[IFLA_NUM_RX_QUEUES]);
3387 else if (ops->get_num_rx_queues)
3388 num_rx_queues = ops->get_num_rx_queues();
3389
3390 if (num_tx_queues < 1 || num_tx_queues > 4096) {
3391 NL_SET_ERR_MSG(extack, "Invalid number of transmit queues");
3392 return ERR_PTR(-EINVAL);
3393 }
3394
3395 if (num_rx_queues < 1 || num_rx_queues > 4096) {
3396 NL_SET_ERR_MSG(extack, "Invalid number of receive queues");
3397 return ERR_PTR(-EINVAL);
3398 }
3399
3400 if (ops->alloc) {
3401 dev = ops->alloc(tb, ifname, name_assign_type,
3402 num_tx_queues, num_rx_queues);
3403 if (IS_ERR(dev))
3404 return dev;
3405 } else {
3406 dev = alloc_netdev_mqs(ops->priv_size, ifname,
3407 name_assign_type, ops->setup,
3408 num_tx_queues, num_rx_queues);
3409 }
3410
3411 if (!dev)
3412 return ERR_PTR(-ENOMEM);
3413
3414 err = validate_linkmsg(dev, tb, extack);
3415 if (err < 0) {
3416 free_netdev(dev);
3417 return ERR_PTR(err);
3418 }
3419
3420 dev_net_set(dev, net);
3421 dev->rtnl_link_ops = ops;
3422 dev->rtnl_link_state = RTNL_LINK_INITIALIZING;
3423
3424 if (tb[IFLA_MTU]) {
3425 u32 mtu = nla_get_u32(tb[IFLA_MTU]);
3426
3427 err = dev_validate_mtu(dev, mtu, extack);
3428 if (err) {
3429 free_netdev(dev);
3430 return ERR_PTR(err);
3431 }
3432 dev->mtu = mtu;
3433 }
3434 if (tb[IFLA_ADDRESS]) {
3435 __dev_addr_set(dev, nla_data(tb[IFLA_ADDRESS]),
3436 nla_len(tb[IFLA_ADDRESS]));
3437 dev->addr_assign_type = NET_ADDR_SET;
3438 }
3439 if (tb[IFLA_BROADCAST])
3440 memcpy(dev->broadcast, nla_data(tb[IFLA_BROADCAST]),
3441 nla_len(tb[IFLA_BROADCAST]));
3442 if (tb[IFLA_TXQLEN])
3443 dev->tx_queue_len = nla_get_u32(tb[IFLA_TXQLEN]);
3444 if (tb[IFLA_OPERSTATE])
3445 set_operstate(dev, nla_get_u8(tb[IFLA_OPERSTATE]));
3446 if (tb[IFLA_LINKMODE])
3447 dev->link_mode = nla_get_u8(tb[IFLA_LINKMODE]);
3448 if (tb[IFLA_GROUP])
3449 dev_set_group(dev, nla_get_u32(tb[IFLA_GROUP]));
3450 if (tb[IFLA_GSO_MAX_SIZE])
3451 netif_set_gso_max_size(dev, nla_get_u32(tb[IFLA_GSO_MAX_SIZE]));
3452 if (tb[IFLA_GSO_MAX_SEGS])
3453 netif_set_gso_max_segs(dev, nla_get_u32(tb[IFLA_GSO_MAX_SEGS]));
3454 if (tb[IFLA_GRO_MAX_SIZE])
3455 netif_set_gro_max_size(dev, nla_get_u32(tb[IFLA_GRO_MAX_SIZE]));
3456 if (tb[IFLA_GSO_IPV4_MAX_SIZE])
3457 netif_set_gso_ipv4_max_size(dev, nla_get_u32(tb[IFLA_GSO_IPV4_MAX_SIZE]));
3458 if (tb[IFLA_GRO_IPV4_MAX_SIZE])
3459 netif_set_gro_ipv4_max_size(dev, nla_get_u32(tb[IFLA_GRO_IPV4_MAX_SIZE]));
3460
3461 return dev;
3462 }
3463 EXPORT_SYMBOL(rtnl_create_link);
3464
rtnl_group_changelink(const struct sk_buff * skb,struct net * net,int group,struct ifinfomsg * ifm,struct netlink_ext_ack * extack,struct nlattr ** tb)3465 static int rtnl_group_changelink(const struct sk_buff *skb,
3466 struct net *net, int group,
3467 struct ifinfomsg *ifm,
3468 struct netlink_ext_ack *extack,
3469 struct nlattr **tb)
3470 {
3471 struct net_device *dev, *aux;
3472 int err;
3473
3474 for_each_netdev_safe(net, dev, aux) {
3475 if (dev->group == group) {
3476 err = validate_linkmsg(dev, tb, extack);
3477 if (err < 0)
3478 return err;
3479 err = do_setlink(skb, dev, ifm, extack, tb, 0);
3480 if (err < 0)
3481 return err;
3482 }
3483 }
3484
3485 return 0;
3486 }
3487
/*
 * Create, register and configure a new link of kind @ops.
 *
 * @skb:    request skb (source of the requesting socket, portid and
 *          capability checks)
 * @ifm:    ifinfomsg header of the request; supplies the requested ifindex
 *          and flags
 * @ops:    link ops of the kind being created
 * @nlh:    request header, forwarded to rtnl_configure_link()
 * @tb:     parsed top-level IFLA_* attributes
 * @data:   parsed IFLA_INFO_DATA attributes, or NULL
 * @extack: extended ack for error reporting
 *
 * Returns 0 on success or a negative errno. The namespace references taken
 * here (dest_net, and link_net when IFLA_LINK_NETNSID is given) are dropped
 * on every path that goes through the "out" label.
 */
static int rtnl_newlink_create(struct sk_buff *skb, struct ifinfomsg *ifm,
			       const struct rtnl_link_ops *ops,
			       const struct nlmsghdr *nlh,
			       struct nlattr **tb, struct nlattr **data,
			       struct netlink_ext_ack *extack)
{
	unsigned char name_assign_type = NET_NAME_USER;
	struct net *net = sock_net(skb->sk);
	u32 portid = NETLINK_CB(skb).portid;
	struct net *dest_net, *link_net;
	struct net_device *dev;
	char ifname[IFNAMSIZ];
	int err;

	/* Without an alloc or setup callback there is no way to build a device. */
	if (!ops->alloc && !ops->setup)
		return -EOPNOTSUPP;

	if (tb[IFLA_IFNAME]) {
		nla_strscpy(ifname, tb[IFLA_IFNAME], IFNAMSIZ);
	} else {
		/* No name given: build the "<kind>%d" template (note the escaped %). */
		snprintf(ifname, IFNAMSIZ, "%s%%d", ops->kind);
		name_assign_type = NET_NAME_ENUM;
	}

	dest_net = rtnl_link_get_net_capable(skb, net, tb, CAP_NET_ADMIN);
	if (IS_ERR(dest_net))
		return PTR_ERR(dest_net);

	if (tb[IFLA_LINK_NETNSID]) {
		int id = nla_get_s32(tb[IFLA_LINK_NETNSID]);

		link_net = get_net_ns_by_id(dest_net, id);
		if (!link_net) {
			NL_SET_ERR_MSG(extack, "Unknown network namespace id");
			err =  -EINVAL;
			goto out;
		}
		/* The requester must hold CAP_NET_ADMIN in the link namespace too. */
		err = -EPERM;
		if (!netlink_ns_capable(skb, link_net->user_ns, CAP_NET_ADMIN))
			goto out;
	} else {
		link_net = NULL;
	}

	/* The device is created in link_net when given, else directly in dest_net. */
	dev = rtnl_create_link(link_net ? : dest_net, ifname,
			       name_assign_type, ops, tb, extack);
	if (IS_ERR(dev)) {
		err = PTR_ERR(dev);
		goto out;
	}

	dev->ifindex = ifm->ifi_index;

	if (ops->newlink)
		err = ops->newlink(link_net ? : net, dev, tb, data, extack);
	else
		err = register_netdevice(dev);
	if (err < 0) {
		/* This failure path only frees the device; it does not unregister. */
		free_netdev(dev);
		goto out;
	}

	err = rtnl_configure_link(dev, ifm, portid, nlh);
	if (err < 0)
		goto out_unregister;
	if (link_net) {
		/* Created in link_net above; now move it to its destination. */
		err = dev_change_net_namespace(dev, dest_net, ifname);
		if (err < 0)
			goto out_unregister;
	}
	if (tb[IFLA_MASTER]) {
		err = do_set_master(dev, nla_get_u32(tb[IFLA_MASTER]), extack);
		if (err)
			goto out_unregister;
	}
out:
	if (link_net)
		put_net(link_net);
	put_net(dest_net);
	return err;
out_unregister:
	/*
	 * Undo a completed newlink/registration: use the kind's dellink when
	 * the device was set up via ops->newlink, a plain unregister otherwise,
	 * then fall back to "out" to drop the namespace references.
	 */
	if (ops->newlink) {
		LIST_HEAD(list_kill);

		ops->dellink(dev, &list_kill);
		unregister_netdevice_many(&list_kill);
	} else {
		unregister_netdevice(dev);
	}
	goto out;
}
3579
/*
 * Attribute tables used while handling RTM_NEWLINK. rtnl_newlink()
 * allocates one instance with kmalloc() and passes it to __rtnl_newlink().
 */
struct rtnl_newlink_tbs {
	/* Top-level IFLA_* attributes of the message. */
	struct nlattr *tb[IFLA_MAX + 1];
	/* Kind-specific IFLA_INFO_DATA attributes; kinds may use up to RTNL_MAX_TYPE. */
	struct nlattr *attr[RTNL_MAX_TYPE + 1];
	/* IFLA_INFO_SLAVE_DATA attributes; bounded by RTNL_SLAVE_MAX_TYPE. */
	struct nlattr *slave_attr[RTNL_SLAVE_MAX_TYPE + 1];
};
3585
/*
 * Core of the RTM_NEWLINK handler.
 *
 * @skb:    request skb
 * @nlh:    request header
 * @tbs:    caller-provided attribute tables (top-level, kind data, slave data)
 * @extack: extended ack for error reporting
 *
 * Depending on the request this either:
 *  - modifies an existing device (found by positive ifindex or by name)
 *    through the kind's changelink, the master's slave_changelink and
 *    do_setlink();
 *  - modifies all devices of a group (no device named, NLM_F_CREATE clear,
 *    IFLA_GROUP present); or
 *  - creates a new device through rtnl_newlink_create() when NLM_F_CREATE
 *    is set.
 *
 * Returns 0 on success or a negative errno.
 */
static int __rtnl_newlink(struct sk_buff *skb, struct nlmsghdr *nlh,
			  struct rtnl_newlink_tbs *tbs,
			  struct netlink_ext_ack *extack)
{
	struct nlattr *linkinfo[IFLA_INFO_MAX + 1];
	struct nlattr ** const tb = tbs->tb;
	const struct rtnl_link_ops *m_ops;
	struct net_device *master_dev;
	struct net *net = sock_net(skb->sk);
	const struct rtnl_link_ops *ops;
	struct nlattr **slave_data;
	char kind[MODULE_NAME_LEN];
	struct net_device *dev;
	struct ifinfomsg *ifm;
	struct nlattr **data;
	bool link_specified;
	int err;

	/*
	 * Re-entry point after a link-kind module has been loaded below; the
	 * whole message is parsed and looked up again from here.
	 */
#ifdef CONFIG_MODULES
replay:
#endif
	err = nlmsg_parse_deprecated(nlh, sizeof(*ifm), tb, IFLA_MAX,
				     ifla_policy, extack);
	if (err < 0)
		return err;

	err = rtnl_ensure_unique_netns(tb, extack, false);
	if (err < 0)
		return err;

	/* Resolve the target: positive ifindex first, then a name attribute. */
	ifm = nlmsg_data(nlh);
	if (ifm->ifi_index > 0) {
		link_specified = true;
		dev = __dev_get_by_index(net, ifm->ifi_index);
	} else if (ifm->ifi_index < 0) {
		NL_SET_ERR_MSG(extack, "ifindex can't be negative");
		return -EINVAL;
	} else if (tb[IFLA_IFNAME] || tb[IFLA_ALT_IFNAME]) {
		link_specified = true;
		dev = rtnl_dev_get(net, tb);
	} else {
		link_specified = false;
		dev = NULL;
	}

	/* For an existing device, pick up the link ops of its master (if any). */
	master_dev = NULL;
	m_ops = NULL;
	if (dev) {
		master_dev = netdev_master_upper_dev_get(dev);
		if (master_dev)
			m_ops = master_dev->rtnl_link_ops;
	}

	if (tb[IFLA_LINKINFO]) {
		err = nla_parse_nested_deprecated(linkinfo, IFLA_INFO_MAX,
						  tb[IFLA_LINKINFO],
						  ifla_info_policy, NULL);
		if (err < 0)
			return err;
	} else
		memset(linkinfo, 0, sizeof(linkinfo));

	if (linkinfo[IFLA_INFO_KIND]) {
		nla_strscpy(kind, linkinfo[IFLA_INFO_KIND], sizeof(kind));
		ops = rtnl_link_ops_get(kind);
	} else {
		kind[0] = '\0';
		ops = NULL;
	}

	/* Parse and validate kind-specific data against the kind's own policy. */
	data = NULL;
	if (ops) {
		/* tbs->attr only has room for RTNL_MAX_TYPE + 1 entries. */
		if (ops->maxtype > RTNL_MAX_TYPE)
			return -EINVAL;

		if (ops->maxtype && linkinfo[IFLA_INFO_DATA]) {
			err = nla_parse_nested_deprecated(tbs->attr, ops->maxtype,
							  linkinfo[IFLA_INFO_DATA],
							  ops->policy, extack);
			if (err < 0)
				return err;
			data = tbs->attr;
		}
		if (ops->validate) {
			err = ops->validate(tb, data, extack);
			if (err < 0)
				return err;
		}
	}

	/* Same for slave data, using the master's slave policy. */
	slave_data = NULL;
	if (m_ops) {
		/* tbs->slave_attr only has room for RTNL_SLAVE_MAX_TYPE + 1 entries. */
		if (m_ops->slave_maxtype > RTNL_SLAVE_MAX_TYPE)
			return -EINVAL;

		if (m_ops->slave_maxtype &&
		    linkinfo[IFLA_INFO_SLAVE_DATA]) {
			err = nla_parse_nested_deprecated(tbs->slave_attr,
							  m_ops->slave_maxtype,
							  linkinfo[IFLA_INFO_SLAVE_DATA],
							  m_ops->slave_policy,
							  extack);
			if (err < 0)
				return err;
			slave_data = tbs->slave_attr;
		}
	}

	/* The device already exists: this is a modification request. */
	if (dev) {
		int status = 0;

		if (nlh->nlmsg_flags & NLM_F_EXCL)
			return -EEXIST;
		if (nlh->nlmsg_flags & NLM_F_REPLACE)
			return -EOPNOTSUPP;

		err = validate_linkmsg(dev, tb, extack);
		if (err < 0)
			return err;

		if (linkinfo[IFLA_INFO_DATA]) {
			/* Kind data is only accepted for the device's own kind. */
			if (!ops || ops != dev->rtnl_link_ops ||
			    !ops->changelink)
				return -EOPNOTSUPP;

			err = ops->changelink(dev, tb, data, extack);
			if (err < 0)
				return err;
			status |= DO_SETLINK_NOTIFY;
		}

		if (linkinfo[IFLA_INFO_SLAVE_DATA]) {
			if (!m_ops || !m_ops->slave_changelink)
				return -EOPNOTSUPP;

			err = m_ops->slave_changelink(master_dev, dev, tb,
						      slave_data, extack);
			if (err < 0)
				return err;
			status |= DO_SETLINK_NOTIFY;
		}

		/* status carries the notify request from the changes made above. */
		return do_setlink(skb, dev, ifm, extack, tb, status);
	}

	if (!(nlh->nlmsg_flags & NLM_F_CREATE)) {
		/* No dev found and NLM_F_CREATE not set. Requested dev does not exist,
		 * or it's for a group
		*/
		if (link_specified)
			return -ENODEV;
		if (tb[IFLA_GROUP])
			return rtnl_group_changelink(skb, net,
						nla_get_u32(tb[IFLA_GROUP]),
						ifm, extack, tb);
		return -ENODEV;
	}

	/* From here on this is a creation request. */
	if (tb[IFLA_MAP] || tb[IFLA_PROTINFO])
		return -EOPNOTSUPP;

	if (!ops) {
#ifdef CONFIG_MODULES
		if (kind[0]) {
			/*
			 * Unknown kind: release RTNL around the module load request,
			 * retake it, and start over if the kind is now registered.
			 */
			__rtnl_unlock();
			request_module("rtnl-link-%s", kind);
			rtnl_lock();
			ops = rtnl_link_ops_get(kind);
			if (ops)
				goto replay;
		}
#endif
		NL_SET_ERR_MSG(extack, "Unknown device type");
		return -EOPNOTSUPP;
	}

	return rtnl_newlink_create(skb, ifm, ops, nlh, tb, data, extack);
}
3764
rtnl_newlink(struct sk_buff * skb,struct nlmsghdr * nlh,struct netlink_ext_ack * extack)3765 static int rtnl_newlink(struct sk_buff *skb, struct nlmsghdr *nlh,
3766 struct netlink_ext_ack *extack)
3767 {
3768 struct rtnl_newlink_tbs *tbs;
3769 int ret;
3770
3771 tbs = kmalloc(sizeof(*tbs), GFP_KERNEL);
3772 if (!tbs)
3773 return -ENOMEM;
3774
3775 ret = __rtnl_newlink(skb, nlh, tbs, extack);
3776 kfree(tbs);
3777 return ret;
3778 }
3779
rtnl_valid_getlink_req(struct sk_buff * skb,const struct nlmsghdr * nlh,struct nlattr ** tb,struct netlink_ext_ack * extack)3780 static int rtnl_valid_getlink_req(struct sk_buff *skb,
3781 const struct nlmsghdr *nlh,
3782 struct nlattr **tb,
3783 struct netlink_ext_ack *extack)
3784 {
3785 struct ifinfomsg *ifm;
3786 int i, err;
3787
3788 if (nlh->nlmsg_len < nlmsg_msg_size(sizeof(*ifm))) {
3789 NL_SET_ERR_MSG(extack, "Invalid header for get link");
3790 return -EINVAL;
3791 }
3792
3793 if (!netlink_strict_get_check(skb))
3794 return nlmsg_parse_deprecated(nlh, sizeof(*ifm), tb, IFLA_MAX,
3795 ifla_policy, extack);
3796
3797 ifm = nlmsg_data(nlh);
3798 if (ifm->__ifi_pad || ifm->ifi_type || ifm->ifi_flags ||
3799 ifm->ifi_change) {
3800 NL_SET_ERR_MSG(extack, "Invalid values in header for get link request");
3801 return -EINVAL;
3802 }
3803
3804 err = nlmsg_parse_deprecated_strict(nlh, sizeof(*ifm), tb, IFLA_MAX,
3805 ifla_policy, extack);
3806 if (err)
3807 return err;
3808
3809 for (i = 0; i <= IFLA_MAX; i++) {
3810 if (!tb[i])
3811 continue;
3812
3813 switch (i) {
3814 case IFLA_IFNAME:
3815 case IFLA_ALT_IFNAME:
3816 case IFLA_EXT_MASK:
3817 case IFLA_TARGET_NETNSID:
3818 break;
3819 default:
3820 NL_SET_ERR_MSG(extack, "Unsupported attribute in get link request");
3821 return -EINVAL;
3822 }
3823 }
3824
3825 return 0;
3826 }
3827
rtnl_getlink(struct sk_buff * skb,struct nlmsghdr * nlh,struct netlink_ext_ack * extack)3828 static int rtnl_getlink(struct sk_buff *skb, struct nlmsghdr *nlh,
3829 struct netlink_ext_ack *extack)
3830 {
3831 struct net *net = sock_net(skb->sk);
3832 struct net *tgt_net = net;
3833 struct ifinfomsg *ifm;
3834 struct nlattr *tb[IFLA_MAX+1];
3835 struct net_device *dev = NULL;
3836 struct sk_buff *nskb;
3837 int netnsid = -1;
3838 int err;
3839 u32 ext_filter_mask = 0;
3840
3841 err = rtnl_valid_getlink_req(skb, nlh, tb, extack);
3842 if (err < 0)
3843 return err;
3844
3845 err = rtnl_ensure_unique_netns(tb, extack, true);
3846 if (err < 0)
3847 return err;
3848
3849 if (tb[IFLA_TARGET_NETNSID]) {
3850 netnsid = nla_get_s32(tb[IFLA_TARGET_NETNSID]);
3851 tgt_net = rtnl_get_net_ns_capable(NETLINK_CB(skb).sk, netnsid);
3852 if (IS_ERR(tgt_net))
3853 return PTR_ERR(tgt_net);
3854 }
3855
3856 if (tb[IFLA_EXT_MASK])
3857 ext_filter_mask = nla_get_u32(tb[IFLA_EXT_MASK]);
3858
3859 err = -EINVAL;
3860 ifm = nlmsg_data(nlh);
3861 if (ifm->ifi_index > 0)
3862 dev = __dev_get_by_index(tgt_net, ifm->ifi_index);
3863 else if (tb[IFLA_IFNAME] || tb[IFLA_ALT_IFNAME])
3864 dev = rtnl_dev_get(tgt_net, tb);
3865 else
3866 goto out;
3867
3868 err = -ENODEV;
3869 if (dev == NULL)
3870 goto out;
3871
3872 err = -ENOBUFS;
3873 nskb = nlmsg_new_large(if_nlmsg_size(dev, ext_filter_mask));
3874 if (nskb == NULL)
3875 goto out;
3876
3877 /* Synchronize the carrier state so we don't report a state
3878 * that we're not actually going to honour immediately; if
3879 * the driver just did a carrier off->on transition, we can
3880 * only TX if link watch work has run, but without this we'd
3881 * already report carrier on, even if it doesn't work yet.
3882 */
3883 linkwatch_sync_dev(dev);
3884
3885 err = rtnl_fill_ifinfo(nskb, dev, net,
3886 RTM_NEWLINK, NETLINK_CB(skb).portid,
3887 nlh->nlmsg_seq, 0, 0, ext_filter_mask,
3888 0, NULL, 0, netnsid, GFP_KERNEL);
3889 if (err < 0) {
3890 /* -EMSGSIZE implies BUG in if_nlmsg_size */
3891 WARN_ON(err == -EMSGSIZE);
3892 kfree_skb(nskb);
3893 } else
3894 err = rtnl_unicast(nskb, net, NETLINK_CB(skb).portid);
3895 out:
3896 if (netnsid >= 0)
3897 put_net(tgt_net);
3898
3899 return err;
3900 }
3901
/*
 * Add (RTM_NEWLINKPROP) or remove (RTM_DELLINKPROP) one alternative
 * interface name on @dev, taken from @attr.
 *
 * *@changed is set to true on success and left untouched otherwise.
 *
 * Returns 0 on success or a negative errno; any other @cmd triggers a
 * one-time warning and -EINVAL.
 */
static int rtnl_alt_ifname(int cmd, struct net_device *dev, struct nlattr *attr,
			   bool *changed, struct netlink_ext_ack *extack)
{
	char *name;
	int err;

	err = nla_validate(attr, attr->nla_len, IFLA_MAX, ifla_policy, extack);
	if (err)
		return err;

	if (cmd == RTM_NEWLINKPROP) {
		/* Refuse additions that would push the property list to U16_MAX. */
		size_t size = rtnl_prop_list_size(dev);

		size += nla_total_size(ALTIFNAMSIZ);
		if (size >= U16_MAX) {
			NL_SET_ERR_MSG(extack,
				       "effective property list too long");
			return -EINVAL;
		}
	}

	name = nla_strdup(attr, GFP_KERNEL_ACCOUNT);
	if (!name)
		return -ENOMEM;

	switch (cmd) {
	case RTM_NEWLINKPROP:
		err = netdev_name_node_alt_create(dev, name);
		/*
		 * On success the string must not be freed here (presumably it
		 * is now owned by the name node - confirm against the helper).
		 */
		if (!err)
			name = NULL;
		break;
	case RTM_DELLINKPROP:
		err = netdev_name_node_alt_destroy(dev, name);
		break;
	default:
		WARN_ON_ONCE(1);
		err = -EINVAL;
		break;
	}

	kfree(name);
	if (!err)
		*changed = true;

	return err;
}
3943
rtnl_linkprop(int cmd,struct sk_buff * skb,struct nlmsghdr * nlh,struct netlink_ext_ack * extack)3944 static int rtnl_linkprop(int cmd, struct sk_buff *skb, struct nlmsghdr *nlh,
3945 struct netlink_ext_ack *extack)
3946 {
3947 struct net *net = sock_net(skb->sk);
3948 struct nlattr *tb[IFLA_MAX + 1];
3949 struct net_device *dev;
3950 struct ifinfomsg *ifm;
3951 bool changed = false;
3952 struct nlattr *attr;
3953 int err, rem;
3954
3955 err = nlmsg_parse(nlh, sizeof(*ifm), tb, IFLA_MAX, ifla_policy, extack);
3956 if (err)
3957 return err;
3958
3959 err = rtnl_ensure_unique_netns(tb, extack, true);
3960 if (err)
3961 return err;
3962
3963 ifm = nlmsg_data(nlh);
3964 if (ifm->ifi_index > 0)
3965 dev = __dev_get_by_index(net, ifm->ifi_index);
3966 else if (tb[IFLA_IFNAME] || tb[IFLA_ALT_IFNAME])
3967 dev = rtnl_dev_get(net, tb);
3968 else
3969 return -EINVAL;
3970
3971 if (!dev)
3972 return -ENODEV;
3973
3974 if (!tb[IFLA_PROP_LIST])
3975 return 0;
3976
3977 nla_for_each_nested(attr, tb[IFLA_PROP_LIST], rem) {
3978 switch (nla_type(attr)) {
3979 case IFLA_ALT_IFNAME:
3980 err = rtnl_alt_ifname(cmd, dev, attr, &changed, extack);
3981 if (err)
3982 return err;
3983 break;
3984 }
3985 }
3986
3987 if (changed)
3988 netdev_state_change(dev);
3989 return 0;
3990 }
3991
rtnl_newlinkprop(struct sk_buff * skb,struct nlmsghdr * nlh,struct netlink_ext_ack * extack)3992 static int rtnl_newlinkprop(struct sk_buff *skb, struct nlmsghdr *nlh,
3993 struct netlink_ext_ack *extack)
3994 {
3995 return rtnl_linkprop(RTM_NEWLINKPROP, skb, nlh, extack);
3996 }
3997
rtnl_dellinkprop(struct sk_buff * skb,struct nlmsghdr * nlh,struct netlink_ext_ack * extack)3998 static int rtnl_dellinkprop(struct sk_buff *skb, struct nlmsghdr *nlh,
3999 struct netlink_ext_ack *extack)
4000 {
4001 return rtnl_linkprop(RTM_DELLINKPROP, skb, nlh, extack);
4002 }
4003
rtnl_calcit(struct sk_buff * skb,struct nlmsghdr * nlh)4004 static noinline_for_stack u32 rtnl_calcit(struct sk_buff *skb,
4005 struct nlmsghdr *nlh)
4006 {
4007 struct net *net = sock_net(skb->sk);
4008 size_t min_ifinfo_dump_size = 0;
4009 u32 ext_filter_mask = 0;
4010 struct net_device *dev;
4011 struct nlattr *nla;
4012 int hdrlen, rem;
4013
4014 /* Same kernel<->userspace interface hack as in rtnl_dump_ifinfo. */
4015 hdrlen = nlmsg_len(nlh) < sizeof(struct ifinfomsg) ?
4016 sizeof(struct rtgenmsg) : sizeof(struct ifinfomsg);
4017
4018 if (nlh->nlmsg_len < nlmsg_msg_size(hdrlen))
4019 return NLMSG_GOODSIZE;
4020
4021 nla_for_each_attr_type(nla, IFLA_EXT_MASK,
4022 nlmsg_attrdata(nlh, hdrlen),
4023 nlmsg_attrlen(nlh, hdrlen), rem) {
4024 if (nla_len(nla) == sizeof(u32))
4025 ext_filter_mask = nla_get_u32(nla);
4026 }
4027
4028 if (!ext_filter_mask)
4029 return NLMSG_GOODSIZE;
4030 /*
4031 * traverse the list of net devices and compute the minimum
4032 * buffer size based upon the filter mask.
4033 */
4034 rcu_read_lock();
4035 for_each_netdev_rcu(net, dev) {
4036 min_ifinfo_dump_size = max(min_ifinfo_dump_size,
4037 if_nlmsg_size(dev, ext_filter_mask));
4038 }
4039 rcu_read_unlock();
4040
4041 return nlmsg_total_size(min_ifinfo_dump_size);
4042 }
4043
rtnl_dump_all(struct sk_buff * skb,struct netlink_callback * cb)4044 static int rtnl_dump_all(struct sk_buff *skb, struct netlink_callback *cb)
4045 {
4046 int idx;
4047 int s_idx = cb->family;
4048 int type = cb->nlh->nlmsg_type - RTM_BASE;
4049 int ret = 0;
4050
4051 if (s_idx == 0)
4052 s_idx = 1;
4053
4054 for (idx = 1; idx <= RTNL_FAMILY_MAX; idx++) {
4055 struct rtnl_link __rcu **tab;
4056 struct rtnl_link *link;
4057 rtnl_dumpit_func dumpit;
4058
4059 if (idx < s_idx || idx == PF_PACKET)
4060 continue;
4061
4062 if (type < 0 || type >= RTM_NR_MSGTYPES)
4063 continue;
4064
4065 tab = rcu_dereference_rtnl(rtnl_msg_handlers[idx]);
4066 if (!tab)
4067 continue;
4068
4069 link = rcu_dereference_rtnl(tab[type]);
4070 if (!link)
4071 continue;
4072
4073 dumpit = link->dumpit;
4074 if (!dumpit)
4075 continue;
4076
4077 if (idx > s_idx) {
4078 memset(&cb->args[0], 0, sizeof(cb->args));
4079 cb->prev_seq = 0;
4080 cb->seq = 0;
4081 }
4082 ret = dumpit(skb, cb);
4083 if (ret)
4084 break;
4085 }
4086 cb->family = idx;
4087
4088 return skb->len ? : ret;
4089 }
4090
/*
 * Build a link notification message of @type for @dev.
 *
 * The sequence number is taken from @nlh only when nlmsg_report() says so;
 * otherwise the sequence stays 0 and the portid is cleared.
 *
 * Returns the filled skb, or NULL on failure, in which case the error is
 * recorded on the RTNLGRP_LINK listeners via rtnl_set_sk_err().
 */
struct sk_buff *rtmsg_ifinfo_build_skb(int type, struct net_device *dev,
				       unsigned int change,
				       u32 event, gfp_t flags, int *new_nsid,
				       int new_ifindex, u32 portid,
				       const struct nlmsghdr *nlh)
{
	struct net *net = dev_net(dev);
	struct sk_buff *skb;
	u32 seq = 0;
	int err;

	skb = nlmsg_new(if_nlmsg_size(dev, 0), flags);
	if (!skb) {
		rtnl_set_sk_err(net, RTNLGRP_LINK, -ENOBUFS);
		return NULL;
	}

	if (nlmsg_report(nlh))
		seq = nlmsg_seq(nlh);
	else
		portid = 0;

	err = rtnl_fill_ifinfo(skb, dev, dev_net(dev),
			       type, portid, seq, change, 0, 0, event,
			       new_nsid, new_ifindex, -1, flags);
	if (err >= 0)
		return skb;

	/* -EMSGSIZE implies BUG in if_nlmsg_size() */
	WARN_ON(err == -EMSGSIZE);
	kfree_skb(skb);
	rtnl_set_sk_err(net, RTNLGRP_LINK, err);

	return NULL;
}
4125
/*
 * Send a prepared link notification @skb to the RTNLGRP_LINK group of the
 * namespace @dev belongs to.
 */
void rtmsg_ifinfo_send(struct sk_buff *skb, struct net_device *dev, gfp_t flags,
		       u32 portid, const struct nlmsghdr *nlh)
{
	rtnl_notify(skb, dev_net(dev), portid, RTNLGRP_LINK, nlh, flags);
}
4133
/*
 * Build and send a link notification for @dev carrying @event.
 *
 * Nothing is sent unless the device is in the NETREG_REGISTERED state, and
 * nothing is sent when building the message fails.
 */
static void rtmsg_ifinfo_event(int type, struct net_device *dev,
			       unsigned int change, u32 event,
			       gfp_t flags, int *new_nsid, int new_ifindex,
			       u32 portid, const struct nlmsghdr *nlh)
{
	struct sk_buff *msg;

	if (dev->reg_state == NETREG_REGISTERED) {
		msg = rtmsg_ifinfo_build_skb(type, dev, change, event, flags,
					     new_nsid, new_ifindex, portid,
					     nlh);
		if (msg)
			rtmsg_ifinfo_send(msg, dev, flags, portid, nlh);
	}
}
4149
/*
 * Send a link notification for @dev with the event value that
 * rtnl_get_event(0) yields and without namespace-move information.
 */
void rtmsg_ifinfo(int type, struct net_device *dev, unsigned int change,
		  gfp_t flags, u32 portid, const struct nlmsghdr *nlh)
{
	u32 event = rtnl_get_event(0);

	rtmsg_ifinfo_event(type, dev, change, event, flags,
			   NULL, 0, portid, nlh);
}
4156
/*
 * Send a link notification for @dev that also carries @new_nsid and
 * @new_ifindex. No portid or request header is associated with it.
 */
void rtmsg_ifinfo_newnet(int type, struct net_device *dev, unsigned int change,
			 gfp_t flags, int *new_nsid, int new_ifindex)
{
	u32 event = rtnl_get_event(0);

	rtmsg_ifinfo_event(type, dev, change, event, flags,
			   new_nsid, new_ifindex, 0, NULL);
}
4163
/*
 * Append one AF_BRIDGE neighbour (FDB) message for @addr on @dev to @skb.
 *
 * The message carries NDA_LLADDR (dev->addr_len bytes of @addr) and, when
 * @vid is non-zero, NDA_VLAN.
 *
 * Returns 0 on success or -EMSGSIZE when the skb has no room, in which
 * case the partially built message is cancelled.
 */
static int nlmsg_populate_fdb_fill(struct sk_buff *skb,
				   struct net_device *dev,
				   u8 *addr, u16 vid, u32 pid, u32 seq,
				   int type, unsigned int flags,
				   int nlflags, u16 ndm_state)
{
	struct nlmsghdr *nlh;
	struct ndmsg *ndm;

	nlh = nlmsg_put(skb, pid, seq, type, sizeof(*ndm), nlflags);
	if (!nlh)
		return -EMSGSIZE;

	ndm = nlmsg_data(nlh);
	ndm->ndm_family  = AF_BRIDGE;
	ndm->ndm_pad1    = 0;
	ndm->ndm_pad2    = 0;
	ndm->ndm_flags   = flags;
	ndm->ndm_type    = 0;
	ndm->ndm_ifindex = dev->ifindex;
	ndm->ndm_state   = ndm_state;

	if (nla_put(skb, NDA_LLADDR, dev->addr_len, addr) ||
	    (vid && nla_put(skb, NDA_VLAN, sizeof(u16), &vid))) {
		nlmsg_cancel(skb, nlh);
		return -EMSGSIZE;
	}

	nlmsg_end(skb, nlh);

	return 0;
}
4199
rtnl_fdb_nlmsg_size(const struct net_device * dev)4200 static inline size_t rtnl_fdb_nlmsg_size(const struct net_device *dev)
4201 {
4202 return NLMSG_ALIGN(sizeof(struct ndmsg)) +
4203 nla_total_size(dev->addr_len) + /* NDA_LLADDR */
4204 nla_total_size(sizeof(u16)) + /* NDA_VLAN */
4205 0;
4206 }
4207
/*
 * Build an NTF_SELF FDB message of kind @type for (@addr, @vid) on @dev and
 * send it to the RTNLGRP_NEIGH group.
 *
 * If the skb cannot be allocated (-ENOBUFS) or filled, the error is recorded
 * on the group through rtnl_set_sk_err() instead of being returned.
 */
static void rtnl_fdb_notify(struct net_device *dev, u8 *addr, u16 vid, int type,
			    u16 ndm_state)
{
	struct net *net = dev_net(dev);
	struct sk_buff *msg;
	int rc;

	msg = nlmsg_new(rtnl_fdb_nlmsg_size(dev), GFP_ATOMIC);
	if (!msg) {
		rc = -ENOBUFS;
		goto report;
	}

	rc = nlmsg_populate_fdb_fill(msg, dev, addr, vid, 0, 0, type,
				     NTF_SELF, 0, ndm_state);
	if (rc < 0) {
		kfree_skb(msg);
		goto report;
	}

	rtnl_notify(msg, net, 0, RTNLGRP_NEIGH, NULL, GFP_ATOMIC);
	return;

report:
	rtnl_set_sk_err(net, RTNLGRP_NEIGH, rc);
}
4231
4232 /*
4233 * ndo_dflt_fdb_add - default netdevice operation to add an FDB entry
4234 */
ndo_dflt_fdb_add(struct ndmsg * ndm,struct nlattr * tb[],struct net_device * dev,const unsigned char * addr,u16 vid,u16 flags)4235 int ndo_dflt_fdb_add(struct ndmsg *ndm,
4236 struct nlattr *tb[],
4237 struct net_device *dev,
4238 const unsigned char *addr, u16 vid,
4239 u16 flags)
4240 {
4241 int err = -EINVAL;
4242
4243 /* If aging addresses are supported device will need to
4244 * implement its own handler for this.
4245 */
4246 if (ndm->ndm_state && !(ndm->ndm_state & NUD_PERMANENT)) {
4247 netdev_info(dev, "default FDB implementation only supports local addresses\n");
4248 return err;
4249 }
4250
4251 if (tb[NDA_FLAGS_EXT]) {
4252 netdev_info(dev, "invalid flags given to default FDB implementation\n");
4253 return err;
4254 }
4255
4256 if (vid) {
4257 netdev_info(dev, "vlans aren't supported yet for dev_uc|mc_add()\n");
4258 return err;
4259 }
4260
4261 if (is_unicast_ether_addr(addr) || is_link_local_ether_addr(addr))
4262 err = dev_uc_add_excl(dev, addr);
4263 else if (is_multicast_ether_addr(addr))
4264 err = dev_mc_add_excl(dev, addr);
4265
4266 /* Only return duplicate errors if NLM_F_EXCL is set */
4267 if (err == -EEXIST && !(flags & NLM_F_EXCL))
4268 err = 0;
4269
4270 return err;
4271 }
4272 EXPORT_SYMBOL(ndo_dflt_fdb_add);
4273
/*
 * Extract a VLAN id from the optional attribute @vlan_attr into *@p_vid.
 *
 * A missing attribute yields vid 0. A present attribute must be exactly
 * sizeof(u16) long and hold a value that is non-zero and below
 * VLAN_VID_MASK; otherwise -EINVAL is returned with a message in @extack
 * and *@p_vid is left untouched.
 */
static int fdb_vid_parse(struct nlattr *vlan_attr, u16 *p_vid,
			 struct netlink_ext_ack *extack)
{
	u16 parsed;

	if (!vlan_attr) {
		*p_vid = 0;
		return 0;
	}

	if (nla_len(vlan_attr) != sizeof(u16)) {
		NL_SET_ERR_MSG(extack, "invalid vlan attribute size");
		return -EINVAL;
	}

	parsed = nla_get_u16(vlan_attr);
	if (parsed == 0 || parsed >= VLAN_VID_MASK) {
		NL_SET_ERR_MSG(extack, "invalid vlan id");
		return -EINVAL;
	}

	*p_vid = parsed;
	return 0;
}
4295
rtnl_fdb_add(struct sk_buff * skb,struct nlmsghdr * nlh,struct netlink_ext_ack * extack)4296 static int rtnl_fdb_add(struct sk_buff *skb, struct nlmsghdr *nlh,
4297 struct netlink_ext_ack *extack)
4298 {
4299 struct net *net = sock_net(skb->sk);
4300 struct ndmsg *ndm;
4301 struct nlattr *tb[NDA_MAX+1];
4302 struct net_device *dev;
4303 u8 *addr;
4304 u16 vid;
4305 int err;
4306
4307 err = nlmsg_parse_deprecated(nlh, sizeof(*ndm), tb, NDA_MAX, NULL,
4308 extack);
4309 if (err < 0)
4310 return err;
4311
4312 ndm = nlmsg_data(nlh);
4313 if (ndm->ndm_ifindex == 0) {
4314 NL_SET_ERR_MSG(extack, "invalid ifindex");
4315 return -EINVAL;
4316 }
4317
4318 dev = __dev_get_by_index(net, ndm->ndm_ifindex);
4319 if (dev == NULL) {
4320 NL_SET_ERR_MSG(extack, "unknown ifindex");
4321 return -ENODEV;
4322 }
4323
4324 if (!tb[NDA_LLADDR] || nla_len(tb[NDA_LLADDR]) != ETH_ALEN) {
4325 NL_SET_ERR_MSG(extack, "invalid address");
4326 return -EINVAL;
4327 }
4328
4329 if (dev->type != ARPHRD_ETHER) {
4330 NL_SET_ERR_MSG(extack, "FDB add only supported for Ethernet devices");
4331 return -EINVAL;
4332 }
4333
4334 addr = nla_data(tb[NDA_LLADDR]);
4335
4336 err = fdb_vid_parse(tb[NDA_VLAN], &vid, extack);
4337 if (err)
4338 return err;
4339
4340 err = -EOPNOTSUPP;
4341
4342 /* Support fdb on master device the net/bridge default case */
4343 if ((!ndm->ndm_flags || ndm->ndm_flags & NTF_MASTER) &&
4344 netif_is_bridge_port(dev)) {
4345 struct net_device *br_dev = netdev_master_upper_dev_get(dev);
4346 const struct net_device_ops *ops = br_dev->netdev_ops;
4347
4348 err = ops->ndo_fdb_add(ndm, tb, dev, addr, vid,
4349 nlh->nlmsg_flags, extack);
4350 if (err)
4351 goto out;
4352 else
4353 ndm->ndm_flags &= ~NTF_MASTER;
4354 }
4355
4356 /* Embedded bridge, macvlan, and any other device support */
4357 if ((ndm->ndm_flags & NTF_SELF)) {
4358 if (dev->netdev_ops->ndo_fdb_add)
4359 err = dev->netdev_ops->ndo_fdb_add(ndm, tb, dev, addr,
4360 vid,
4361 nlh->nlmsg_flags,
4362 extack);
4363 else
4364 err = ndo_dflt_fdb_add(ndm, tb, dev, addr, vid,
4365 nlh->nlmsg_flags);
4366
4367 if (!err) {
4368 rtnl_fdb_notify(dev, addr, vid, RTM_NEWNEIGH,
4369 ndm->ndm_state);
4370 ndm->ndm_flags &= ~NTF_SELF;
4371 }
4372 }
4373 out:
4374 return err;
4375 }
4376
4377 /*
4378 * ndo_dflt_fdb_del - default netdevice operation to delete an FDB entry
4379 */
ndo_dflt_fdb_del(struct ndmsg * ndm,struct nlattr * tb[],struct net_device * dev,const unsigned char * addr,u16 vid)4380 int ndo_dflt_fdb_del(struct ndmsg *ndm,
4381 struct nlattr *tb[],
4382 struct net_device *dev,
4383 const unsigned char *addr, u16 vid)
4384 {
4385 int err = -EINVAL;
4386
4387 /* If aging addresses are supported device will need to
4388 * implement its own handler for this.
4389 */
4390 if (!(ndm->ndm_state & NUD_PERMANENT)) {
4391 netdev_info(dev, "default FDB implementation only supports local addresses\n");
4392 return err;
4393 }
4394
4395 if (is_unicast_ether_addr(addr) || is_link_local_ether_addr(addr))
4396 err = dev_uc_del(dev, addr);
4397 else if (is_multicast_ether_addr(addr))
4398 err = dev_mc_del(dev, addr);
4399
4400 return err;
4401 }
4402 EXPORT_SYMBOL(ndo_dflt_fdb_del);
4403
rtnl_fdb_del(struct sk_buff * skb,struct nlmsghdr * nlh,struct netlink_ext_ack * extack)4404 static int rtnl_fdb_del(struct sk_buff *skb, struct nlmsghdr *nlh,
4405 struct netlink_ext_ack *extack)
4406 {
4407 bool del_bulk = !!(nlh->nlmsg_flags & NLM_F_BULK);
4408 struct net *net = sock_net(skb->sk);
4409 const struct net_device_ops *ops;
4410 struct ndmsg *ndm;
4411 struct nlattr *tb[NDA_MAX+1];
4412 struct net_device *dev;
4413 __u8 *addr = NULL;
4414 int err;
4415 u16 vid;
4416
4417 if (!netlink_capable(skb, CAP_NET_ADMIN))
4418 return -EPERM;
4419
4420 if (!del_bulk) {
4421 err = nlmsg_parse_deprecated(nlh, sizeof(*ndm), tb, NDA_MAX,
4422 NULL, extack);
4423 } else {
4424 /* For bulk delete, the drivers will parse the message with
4425 * policy.
4426 */
4427 err = nlmsg_parse(nlh, sizeof(*ndm), tb, NDA_MAX, NULL, extack);
4428 }
4429 if (err < 0)
4430 return err;
4431
4432 ndm = nlmsg_data(nlh);
4433 if (ndm->ndm_ifindex == 0) {
4434 NL_SET_ERR_MSG(extack, "invalid ifindex");
4435 return -EINVAL;
4436 }
4437
4438 dev = __dev_get_by_index(net, ndm->ndm_ifindex);
4439 if (dev == NULL) {
4440 NL_SET_ERR_MSG(extack, "unknown ifindex");
4441 return -ENODEV;
4442 }
4443
4444 if (!del_bulk) {
4445 if (!tb[NDA_LLADDR] || nla_len(tb[NDA_LLADDR]) != ETH_ALEN) {
4446 NL_SET_ERR_MSG(extack, "invalid address");
4447 return -EINVAL;
4448 }
4449 addr = nla_data(tb[NDA_LLADDR]);
4450
4451 err = fdb_vid_parse(tb[NDA_VLAN], &vid, extack);
4452 if (err)
4453 return err;
4454 }
4455
4456 if (dev->type != ARPHRD_ETHER) {
4457 NL_SET_ERR_MSG(extack, "FDB delete only supported for Ethernet devices");
4458 return -EINVAL;
4459 }
4460
4461 err = -EOPNOTSUPP;
4462
4463 /* Support fdb on master device the net/bridge default case */
4464 if ((!ndm->ndm_flags || ndm->ndm_flags & NTF_MASTER) &&
4465 netif_is_bridge_port(dev)) {
4466 struct net_device *br_dev = netdev_master_upper_dev_get(dev);
4467
4468 ops = br_dev->netdev_ops;
4469 if (!del_bulk) {
4470 if (ops->ndo_fdb_del)
4471 err = ops->ndo_fdb_del(ndm, tb, dev, addr, vid, extack);
4472 } else {
4473 if (ops->ndo_fdb_del_bulk)
4474 err = ops->ndo_fdb_del_bulk(nlh, dev, extack);
4475 }
4476
4477 if (err)
4478 goto out;
4479 else
4480 ndm->ndm_flags &= ~NTF_MASTER;
4481 }
4482
4483 /* Embedded bridge, macvlan, and any other device support */
4484 if (ndm->ndm_flags & NTF_SELF) {
4485 ops = dev->netdev_ops;
4486 if (!del_bulk) {
4487 if (ops->ndo_fdb_del)
4488 err = ops->ndo_fdb_del(ndm, tb, dev, addr, vid, extack);
4489 else
4490 err = ndo_dflt_fdb_del(ndm, tb, dev, addr, vid);
4491 } else {
4492 /* in case err was cleared by NTF_MASTER call */
4493 err = -EOPNOTSUPP;
4494 if (ops->ndo_fdb_del_bulk)
4495 err = ops->ndo_fdb_del_bulk(nlh, dev, extack);
4496 }
4497
4498 if (!err) {
4499 if (!del_bulk)
4500 rtnl_fdb_notify(dev, addr, vid, RTM_DELNEIGH,
4501 ndm->ndm_state);
4502 ndm->ndm_flags &= ~NTF_SELF;
4503 }
4504 }
4505 out:
4506 return err;
4507 }
4508
nlmsg_populate_fdb(struct sk_buff * skb,struct netlink_callback * cb,struct net_device * dev,int * idx,struct netdev_hw_addr_list * list)4509 static int nlmsg_populate_fdb(struct sk_buff *skb,
4510 struct netlink_callback *cb,
4511 struct net_device *dev,
4512 int *idx,
4513 struct netdev_hw_addr_list *list)
4514 {
4515 struct netdev_hw_addr *ha;
4516 int err;
4517 u32 portid, seq;
4518
4519 portid = NETLINK_CB(cb->skb).portid;
4520 seq = cb->nlh->nlmsg_seq;
4521
4522 list_for_each_entry(ha, &list->list, list) {
4523 if (*idx < cb->args[2])
4524 goto skip;
4525
4526 err = nlmsg_populate_fdb_fill(skb, dev, ha->addr, 0,
4527 portid, seq,
4528 RTM_NEWNEIGH, NTF_SELF,
4529 NLM_F_MULTI, NUD_PERMANENT);
4530 if (err < 0)
4531 return err;
4532 skip:
4533 *idx += 1;
4534 }
4535 return 0;
4536 }
4537
4538 /**
4539 * ndo_dflt_fdb_dump - default netdevice operation to dump an FDB table.
4540 * @skb: socket buffer to store message in
4541 * @cb: netlink callback
4542 * @dev: netdevice
4543 * @filter_dev: ignored
4544 * @idx: the number of FDB table entries dumped is added to *@idx
4545 *
4546 * Default netdevice operation to dump the existing unicast address list.
4547 * Returns number of addresses from list put in skb.
4548 */
ndo_dflt_fdb_dump(struct sk_buff * skb,struct netlink_callback * cb,struct net_device * dev,struct net_device * filter_dev,int * idx)4549 int ndo_dflt_fdb_dump(struct sk_buff *skb,
4550 struct netlink_callback *cb,
4551 struct net_device *dev,
4552 struct net_device *filter_dev,
4553 int *idx)
4554 {
4555 int err;
4556
4557 if (dev->type != ARPHRD_ETHER)
4558 return -EINVAL;
4559
4560 netif_addr_lock_bh(dev);
4561 err = nlmsg_populate_fdb(skb, cb, dev, idx, &dev->uc);
4562 if (err)
4563 goto out;
4564 err = nlmsg_populate_fdb(skb, cb, dev, idx, &dev->mc);
4565 out:
4566 netif_addr_unlock_bh(dev);
4567 return err;
4568 }
4569 EXPORT_SYMBOL(ndo_dflt_fdb_dump);
4570
valid_fdb_dump_strict(const struct nlmsghdr * nlh,int * br_idx,int * brport_idx,struct netlink_ext_ack * extack)4571 static int valid_fdb_dump_strict(const struct nlmsghdr *nlh,
4572 int *br_idx, int *brport_idx,
4573 struct netlink_ext_ack *extack)
4574 {
4575 struct nlattr *tb[NDA_MAX + 1];
4576 struct ndmsg *ndm;
4577 int err, i;
4578
4579 if (nlh->nlmsg_len < nlmsg_msg_size(sizeof(*ndm))) {
4580 NL_SET_ERR_MSG(extack, "Invalid header for fdb dump request");
4581 return -EINVAL;
4582 }
4583
4584 ndm = nlmsg_data(nlh);
4585 if (ndm->ndm_pad1 || ndm->ndm_pad2 || ndm->ndm_state ||
4586 ndm->ndm_flags || ndm->ndm_type) {
4587 NL_SET_ERR_MSG(extack, "Invalid values in header for fdb dump request");
4588 return -EINVAL;
4589 }
4590
4591 err = nlmsg_parse_deprecated_strict(nlh, sizeof(struct ndmsg), tb,
4592 NDA_MAX, NULL, extack);
4593 if (err < 0)
4594 return err;
4595
4596 *brport_idx = ndm->ndm_ifindex;
4597 for (i = 0; i <= NDA_MAX; ++i) {
4598 if (!tb[i])
4599 continue;
4600
4601 switch (i) {
4602 case NDA_IFINDEX:
4603 if (nla_len(tb[i]) != sizeof(u32)) {
4604 NL_SET_ERR_MSG(extack, "Invalid IFINDEX attribute in fdb dump request");
4605 return -EINVAL;
4606 }
4607 *brport_idx = nla_get_u32(tb[NDA_IFINDEX]);
4608 break;
4609 case NDA_MASTER:
4610 if (nla_len(tb[i]) != sizeof(u32)) {
4611 NL_SET_ERR_MSG(extack, "Invalid MASTER attribute in fdb dump request");
4612 return -EINVAL;
4613 }
4614 *br_idx = nla_get_u32(tb[NDA_MASTER]);
4615 break;
4616 default:
4617 NL_SET_ERR_MSG(extack, "Unsupported attribute in fdb dump request");
4618 return -EINVAL;
4619 }
4620 }
4621
4622 return 0;
4623 }
4624
valid_fdb_dump_legacy(const struct nlmsghdr * nlh,int * br_idx,int * brport_idx,struct netlink_ext_ack * extack)4625 static int valid_fdb_dump_legacy(const struct nlmsghdr *nlh,
4626 int *br_idx, int *brport_idx,
4627 struct netlink_ext_ack *extack)
4628 {
4629 struct nlattr *tb[IFLA_MAX+1];
4630 int err;
4631
4632 /* A hack to preserve kernel<->userspace interface.
4633 * Before Linux v4.12 this code accepted ndmsg since iproute2 v3.3.0.
4634 * However, ndmsg is shorter than ifinfomsg thus nlmsg_parse() bails.
4635 * So, check for ndmsg with an optional u32 attribute (not used here).
4636 * Fortunately these sizes don't conflict with the size of ifinfomsg
4637 * with an optional attribute.
4638 */
4639 if (nlmsg_len(nlh) != sizeof(struct ndmsg) &&
4640 (nlmsg_len(nlh) != sizeof(struct ndmsg) +
4641 nla_attr_size(sizeof(u32)))) {
4642 struct ifinfomsg *ifm;
4643
4644 err = nlmsg_parse_deprecated(nlh, sizeof(struct ifinfomsg),
4645 tb, IFLA_MAX, ifla_policy,
4646 extack);
4647 if (err < 0) {
4648 return -EINVAL;
4649 } else if (err == 0) {
4650 if (tb[IFLA_MASTER])
4651 *br_idx = nla_get_u32(tb[IFLA_MASTER]);
4652 }
4653
4654 ifm = nlmsg_data(nlh);
4655 *brport_idx = ifm->ifi_index;
4656 }
4657 return 0;
4658 }
4659
rtnl_fdb_dump(struct sk_buff * skb,struct netlink_callback * cb)4660 static int rtnl_fdb_dump(struct sk_buff *skb, struct netlink_callback *cb)
4661 {
4662 struct net_device *dev;
4663 struct net_device *br_dev = NULL;
4664 const struct net_device_ops *ops = NULL;
4665 const struct net_device_ops *cops = NULL;
4666 struct net *net = sock_net(skb->sk);
4667 struct hlist_head *head;
4668 int brport_idx = 0;
4669 int br_idx = 0;
4670 int h, s_h;
4671 int idx = 0, s_idx;
4672 int err = 0;
4673 int fidx = 0;
4674
4675 if (cb->strict_check)
4676 err = valid_fdb_dump_strict(cb->nlh, &br_idx, &brport_idx,
4677 cb->extack);
4678 else
4679 err = valid_fdb_dump_legacy(cb->nlh, &br_idx, &brport_idx,
4680 cb->extack);
4681 if (err < 0)
4682 return err;
4683
4684 if (br_idx) {
4685 br_dev = __dev_get_by_index(net, br_idx);
4686 if (!br_dev)
4687 return -ENODEV;
4688
4689 ops = br_dev->netdev_ops;
4690 }
4691
4692 s_h = cb->args[0];
4693 s_idx = cb->args[1];
4694
4695 for (h = s_h; h < NETDEV_HASHENTRIES; h++, s_idx = 0) {
4696 idx = 0;
4697 head = &net->dev_index_head[h];
4698 hlist_for_each_entry(dev, head, index_hlist) {
4699
4700 if (brport_idx && (dev->ifindex != brport_idx))
4701 continue;
4702
4703 if (!br_idx) { /* user did not specify a specific bridge */
4704 if (netif_is_bridge_port(dev)) {
4705 br_dev = netdev_master_upper_dev_get(dev);
4706 cops = br_dev->netdev_ops;
4707 }
4708 } else {
4709 if (dev != br_dev &&
4710 !netif_is_bridge_port(dev))
4711 continue;
4712
4713 if (br_dev != netdev_master_upper_dev_get(dev) &&
4714 !netif_is_bridge_master(dev))
4715 continue;
4716 cops = ops;
4717 }
4718
4719 if (idx < s_idx)
4720 goto cont;
4721
4722 if (netif_is_bridge_port(dev)) {
4723 if (cops && cops->ndo_fdb_dump) {
4724 err = cops->ndo_fdb_dump(skb, cb,
4725 br_dev, dev,
4726 &fidx);
4727 if (err == -EMSGSIZE)
4728 goto out;
4729 }
4730 }
4731
4732 if (dev->netdev_ops->ndo_fdb_dump)
4733 err = dev->netdev_ops->ndo_fdb_dump(skb, cb,
4734 dev, NULL,
4735 &fidx);
4736 else
4737 err = ndo_dflt_fdb_dump(skb, cb, dev, NULL,
4738 &fidx);
4739 if (err == -EMSGSIZE)
4740 goto out;
4741
4742 cops = NULL;
4743
4744 /* reset fdb offset to 0 for rest of the interfaces */
4745 cb->args[2] = 0;
4746 fidx = 0;
4747 cont:
4748 idx++;
4749 }
4750 }
4751
4752 out:
4753 cb->args[0] = h;
4754 cb->args[1] = idx;
4755 cb->args[2] = fidx;
4756
4757 return skb->len;
4758 }
4759
/*
 * Validate an FDB get request and extract its parameters.
 *
 * The message must hold a full ndmsg header with zero pad, state and type
 * fields and no flags other than NTF_MASTER / NTF_SELF. Attributes are
 * parsed into @tb against nda_policy. On success *@ndm_flags and
 * *@brport_idx come from the header, *@br_idx from NDA_MASTER, *@addr from
 * an ETH_ALEN-sized NDA_LLADDR and *@vid from NDA_VLAN. NDA_VNI is
 * accepted without being interpreted here; any other attribute is rejected.
 *
 * Returns 0 on success or a negative error with a message in @extack.
 */
static int valid_fdb_get_strict(const struct nlmsghdr *nlh,
				struct nlattr **tb, u8 *ndm_flags,
				int *br_idx, int *brport_idx, u8 **addr,
				u16 *vid, struct netlink_ext_ack *extack)
{
	struct ndmsg *ndm;
	int err, i;

	if (nlh->nlmsg_len < nlmsg_msg_size(sizeof(*ndm))) {
		NL_SET_ERR_MSG(extack, "Invalid header for fdb get request");
		return -EINVAL;
	}

	ndm = nlmsg_data(nlh);
	if (ndm->ndm_pad1 || ndm->ndm_pad2 || ndm->ndm_state ||
	    ndm->ndm_type) {
		NL_SET_ERR_MSG(extack, "Invalid values in header for fdb get request");
		return -EINVAL;
	}

	if (ndm->ndm_flags & ~(NTF_MASTER | NTF_SELF)) {
		NL_SET_ERR_MSG(extack, "Invalid flags in header for fdb get request");
		return -EINVAL;
	}

	err = nlmsg_parse_deprecated_strict(nlh, sizeof(struct ndmsg), tb,
					    NDA_MAX, nda_policy, extack);
	if (err < 0)
		return err;

	*ndm_flags = ndm->ndm_flags;
	*brport_idx = ndm->ndm_ifindex;

	for (i = 0; i <= NDA_MAX; ++i) {
		struct nlattr *attr = tb[i];

		if (!attr)
			continue;

		switch (i) {
		case NDA_VNI:
			/* accepted; not interpreted by this function */
			break;
		case NDA_MASTER:
			*br_idx = nla_get_u32(attr);
			break;
		case NDA_VLAN:
			err = fdb_vid_parse(attr, vid, extack);
			if (err)
				return err;
			break;
		case NDA_LLADDR:
			if (nla_len(attr) != ETH_ALEN) {
				NL_SET_ERR_MSG(extack, "Invalid address in fdb get request");
				return -EINVAL;
			}
			*addr = nla_data(attr);
			break;
		default:
			NL_SET_ERR_MSG(extack, "Unsupported attribute in fdb get request");
			return -EINVAL;
		}
	}

	return 0;
}
4822
rtnl_fdb_get(struct sk_buff * in_skb,struct nlmsghdr * nlh,struct netlink_ext_ack * extack)4823 static int rtnl_fdb_get(struct sk_buff *in_skb, struct nlmsghdr *nlh,
4824 struct netlink_ext_ack *extack)
4825 {
4826 struct net_device *dev = NULL, *br_dev = NULL;
4827 const struct net_device_ops *ops = NULL;
4828 struct net *net = sock_net(in_skb->sk);
4829 struct nlattr *tb[NDA_MAX + 1];
4830 struct sk_buff *skb;
4831 int brport_idx = 0;
4832 u8 ndm_flags = 0;
4833 int br_idx = 0;
4834 u8 *addr = NULL;
4835 u16 vid = 0;
4836 int err;
4837
4838 err = valid_fdb_get_strict(nlh, tb, &ndm_flags, &br_idx,
4839 &brport_idx, &addr, &vid, extack);
4840 if (err < 0)
4841 return err;
4842
4843 if (!addr) {
4844 NL_SET_ERR_MSG(extack, "Missing lookup address for fdb get request");
4845 return -EINVAL;
4846 }
4847
4848 if (brport_idx) {
4849 dev = __dev_get_by_index(net, brport_idx);
4850 if (!dev) {
4851 NL_SET_ERR_MSG(extack, "Unknown device ifindex");
4852 return -ENODEV;
4853 }
4854 }
4855
4856 if (br_idx) {
4857 if (dev) {
4858 NL_SET_ERR_MSG(extack, "Master and device are mutually exclusive");
4859 return -EINVAL;
4860 }
4861
4862 br_dev = __dev_get_by_index(net, br_idx);
4863 if (!br_dev) {
4864 NL_SET_ERR_MSG(extack, "Invalid master ifindex");
4865 return -EINVAL;
4866 }
4867 ops = br_dev->netdev_ops;
4868 }
4869
4870 if (dev) {
4871 if (!ndm_flags || (ndm_flags & NTF_MASTER)) {
4872 if (!netif_is_bridge_port(dev)) {
4873 NL_SET_ERR_MSG(extack, "Device is not a bridge port");
4874 return -EINVAL;
4875 }
4876 br_dev = netdev_master_upper_dev_get(dev);
4877 if (!br_dev) {
4878 NL_SET_ERR_MSG(extack, "Master of device not found");
4879 return -EINVAL;
4880 }
4881 ops = br_dev->netdev_ops;
4882 } else {
4883 if (!(ndm_flags & NTF_SELF)) {
4884 NL_SET_ERR_MSG(extack, "Missing NTF_SELF");
4885 return -EINVAL;
4886 }
4887 ops = dev->netdev_ops;
4888 }
4889 }
4890
4891 if (!br_dev && !dev) {
4892 NL_SET_ERR_MSG(extack, "No device specified");
4893 return -ENODEV;
4894 }
4895
4896 if (!ops || !ops->ndo_fdb_get) {
4897 NL_SET_ERR_MSG(extack, "Fdb get operation not supported by device");
4898 return -EOPNOTSUPP;
4899 }
4900
4901 skb = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
4902 if (!skb)
4903 return -ENOBUFS;
4904
4905 if (br_dev)
4906 dev = br_dev;
4907 err = ops->ndo_fdb_get(skb, tb, dev, addr, vid,
4908 NETLINK_CB(in_skb).portid,
4909 nlh->nlmsg_seq, extack);
4910 if (err)
4911 goto out;
4912
4913 return rtnl_unicast(skb, net, NETLINK_CB(in_skb).portid);
4914 out:
4915 kfree_skb(skb);
4916 return err;
4917 }
4918
/*
 * Emit attribute @attrnum as a u8 boolean telling whether @flag is set in
 * @flags, but only when @flag is selected by @mask. Returns 0 when nothing
 * had to be written, otherwise the result of nla_put_u8().
 */
static int brport_nla_put_flag(struct sk_buff *skb, u32 flags, u32 mask,
			       unsigned int attrnum, unsigned int flag)
{
	if (!(mask & flag))
		return 0;

	return nla_put_u8(skb, attrnum, !!(flags & flag));
}
4926
/*
 * Default helper that fills an AF_BRIDGE RTM_NEWLINK message for @dev.
 *
 * The message carries the link attributes (name, MTU, operstate, and when
 * applicable master, hardware address and link), an IFLA_AF_SPEC nest with
 * BRIDGE_FLAGS_SELF, the bridge @mode unless it is BRIDGE_MODE_UNDEF and
 * whatever the optional @vlan_fill callback adds, and an IFLA_PROTINFO nest
 * with one u8 per port flag selected by @mask.
 *
 * Returns 0 on success. On failure the message is cancelled and the error
 * from @vlan_fill, or -EMSGSIZE for any other failure, is returned.
 */
int ndo_dflt_bridge_getlink(struct sk_buff *skb, u32 pid, u32 seq,
			    struct net_device *dev, u16 mode,
			    u32 flags, u32 mask, int nlflags,
			    u32 filter_mask,
			    int (*vlan_fill)(struct sk_buff *skb,
					     struct net_device *dev,
					     u32 filter_mask))
{
	/* Port flag -> attribute mapping, emitted in this order. */
	static const struct {
		unsigned int attrnum;
		unsigned int flag;
	} brport_attrs[] = {
		{ IFLA_BRPORT_MODE,		BR_HAIRPIN_MODE },
		{ IFLA_BRPORT_GUARD,		BR_BPDU_GUARD },
		{ IFLA_BRPORT_FAST_LEAVE,	BR_MULTICAST_FAST_LEAVE },
		{ IFLA_BRPORT_PROTECT,		BR_ROOT_BLOCK },
		{ IFLA_BRPORT_LEARNING,		BR_LEARNING },
		{ IFLA_BRPORT_LEARNING_SYNC,	BR_LEARNING_SYNC },
		{ IFLA_BRPORT_UNICAST_FLOOD,	BR_FLOOD },
		{ IFLA_BRPORT_PROXYARP,		BR_PROXYARP },
		{ IFLA_BRPORT_MCAST_FLOOD,	BR_MCAST_FLOOD },
		{ IFLA_BRPORT_BCAST_FLOOD,	BR_BCAST_FLOOD },
	};
	u8 operstate = netif_running(dev) ? dev->operstate : IF_OPER_DOWN;
	struct net_device *br_dev = netdev_master_upper_dev_get(dev);
	struct nlattr *br_afspec;
	struct nlattr *protinfo;
	struct ifinfomsg *ifm;
	struct nlmsghdr *nlh;
	unsigned int i;
	int err = 0;

	nlh = nlmsg_put(skb, pid, seq, RTM_NEWLINK, sizeof(*ifm), nlflags);
	if (!nlh)
		return -EMSGSIZE;

	ifm = nlmsg_data(nlh);
	ifm->ifi_family = AF_BRIDGE;
	ifm->__ifi_pad = 0;
	ifm->ifi_type = dev->type;
	ifm->ifi_index = dev->ifindex;
	ifm->ifi_flags = dev_get_flags(dev);
	ifm->ifi_change = 0;

	if (nla_put_string(skb, IFLA_IFNAME, dev->name))
		goto nla_put_failure;
	if (nla_put_u32(skb, IFLA_MTU, dev->mtu))
		goto nla_put_failure;
	if (nla_put_u8(skb, IFLA_OPERSTATE, operstate))
		goto nla_put_failure;
	if (br_dev && nla_put_u32(skb, IFLA_MASTER, br_dev->ifindex))
		goto nla_put_failure;
	if (dev->addr_len &&
	    nla_put(skb, IFLA_ADDRESS, dev->addr_len, dev->dev_addr))
		goto nla_put_failure;
	if (dev->ifindex != dev_get_iflink(dev) &&
	    nla_put_u32(skb, IFLA_LINK, dev_get_iflink(dev)))
		goto nla_put_failure;

	br_afspec = nla_nest_start_noflag(skb, IFLA_AF_SPEC);
	if (!br_afspec)
		goto nla_put_failure;

	if (nla_put_u16(skb, IFLA_BRIDGE_FLAGS, BRIDGE_FLAGS_SELF))
		goto afspec_failure;

	if (mode != BRIDGE_MODE_UNDEF &&
	    nla_put_u16(skb, IFLA_BRIDGE_MODE, mode))
		goto afspec_failure;

	if (vlan_fill) {
		/* The callback's own error code is what gets returned. */
		err = vlan_fill(skb, dev, filter_mask);
		if (err)
			goto afspec_failure;
	}
	nla_nest_end(skb, br_afspec);

	protinfo = nla_nest_start(skb, IFLA_PROTINFO);
	if (!protinfo)
		goto nla_put_failure;

	for (i = 0; i < ARRAY_SIZE(brport_attrs); i++) {
		if (brport_nla_put_flag(skb, flags, mask,
					brport_attrs[i].attrnum,
					brport_attrs[i].flag)) {
			nla_nest_cancel(skb, protinfo);
			goto nla_put_failure;
		}
	}

	nla_nest_end(skb, protinfo);

	nlmsg_end(skb, nlh);
	return 0;

afspec_failure:
	nla_nest_cancel(skb, br_afspec);
nla_put_failure:
	nlmsg_cancel(skb, nlh);
	return err ? err : -EMSGSIZE;
}
EXPORT_SYMBOL_GPL(ndo_dflt_bridge_getlink);
5029
/*
 * Validate a bridge link dump request and extract its filter mask.
 *
 * With @strict_check the message must hold a full ifinfomsg header whose
 * pad, type, flags, change and index fields are zero, the attributes are
 * parsed strictly, and any attribute other than IFLA_EXT_MASK is rejected.
 * Without it the attributes are parsed leniently and unknown ones are
 * ignored. *@filter_mask is set from IFLA_EXT_MASK when present.
 */
static int valid_bridge_getlink_req(const struct nlmsghdr *nlh,
				    bool strict_check, u32 *filter_mask,
				    struct netlink_ext_ack *extack)
{
	struct nlattr *tb[IFLA_MAX+1];
	int err, i;

	if (!strict_check) {
		err = nlmsg_parse_deprecated(nlh, sizeof(struct ifinfomsg),
					     tb, IFLA_MAX, ifla_policy,
					     extack);
	} else {
		struct ifinfomsg *ifm;

		if (nlh->nlmsg_len < nlmsg_msg_size(sizeof(*ifm))) {
			NL_SET_ERR_MSG(extack, "Invalid header for bridge link dump");
			return -EINVAL;
		}

		ifm = nlmsg_data(nlh);
		if (ifm->__ifi_pad || ifm->ifi_type || ifm->ifi_flags ||
		    ifm->ifi_change || ifm->ifi_index) {
			NL_SET_ERR_MSG(extack, "Invalid values in header for bridge link dump request");
			return -EINVAL;
		}

		err = nlmsg_parse_deprecated_strict(nlh,
						    sizeof(struct ifinfomsg),
						    tb, IFLA_MAX, ifla_policy,
						    extack);
	}
	if (err < 0)
		return err;

	/* new attributes should only be added with strict checking */
	for (i = 0; i <= IFLA_MAX; ++i) {
		if (!tb[i])
			continue;

		if (i == IFLA_EXT_MASK) {
			*filter_mask = nla_get_u32(tb[i]);
			continue;
		}

		if (strict_check) {
			NL_SET_ERR_MSG(extack, "Unsupported attribute in bridge link dump request");
			return -EINVAL;
		}
	}

	return 0;
}
5083
rtnl_bridge_getlink(struct sk_buff * skb,struct netlink_callback * cb)5084 static int rtnl_bridge_getlink(struct sk_buff *skb, struct netlink_callback *cb)
5085 {
5086 const struct nlmsghdr *nlh = cb->nlh;
5087 struct net *net = sock_net(skb->sk);
5088 struct net_device *dev;
5089 int idx = 0;
5090 u32 portid = NETLINK_CB(cb->skb).portid;
5091 u32 seq = nlh->nlmsg_seq;
5092 u32 filter_mask = 0;
5093 int err;
5094
5095 err = valid_bridge_getlink_req(nlh, cb->strict_check, &filter_mask,
5096 cb->extack);
5097 if (err < 0 && cb->strict_check)
5098 return err;
5099
5100 rcu_read_lock();
5101 for_each_netdev_rcu(net, dev) {
5102 const struct net_device_ops *ops = dev->netdev_ops;
5103 struct net_device *br_dev = netdev_master_upper_dev_get(dev);
5104
5105 if (br_dev && br_dev->netdev_ops->ndo_bridge_getlink) {
5106 if (idx >= cb->args[0]) {
5107 err = br_dev->netdev_ops->ndo_bridge_getlink(
5108 skb, portid, seq, dev,
5109 filter_mask, NLM_F_MULTI);
5110 if (err < 0 && err != -EOPNOTSUPP) {
5111 if (likely(skb->len))
5112 break;
5113
5114 goto out_err;
5115 }
5116 }
5117 idx++;
5118 }
5119
5120 if (ops->ndo_bridge_getlink) {
5121 if (idx >= cb->args[0]) {
5122 err = ops->ndo_bridge_getlink(skb, portid,
5123 seq, dev,
5124 filter_mask,
5125 NLM_F_MULTI);
5126 if (err < 0 && err != -EOPNOTSUPP) {
5127 if (likely(skb->len))
5128 break;
5129
5130 goto out_err;
5131 }
5132 }
5133 idx++;
5134 }
5135 }
5136 err = skb->len;
5137 out_err:
5138 rcu_read_unlock();
5139 cb->args[0] = idx;
5140
5141 return err;
5142 }
5143
bridge_nlmsg_size(void)5144 static inline size_t bridge_nlmsg_size(void)
5145 {
5146 return NLMSG_ALIGN(sizeof(struct ifinfomsg))
5147 + nla_total_size(IFNAMSIZ) /* IFLA_IFNAME */
5148 + nla_total_size(MAX_ADDR_LEN) /* IFLA_ADDRESS */
5149 + nla_total_size(sizeof(u32)) /* IFLA_MASTER */
5150 + nla_total_size(sizeof(u32)) /* IFLA_MTU */
5151 + nla_total_size(sizeof(u32)) /* IFLA_LINK */
5152 + nla_total_size(sizeof(u32)) /* IFLA_OPERSTATE */
5153 + nla_total_size(sizeof(u8)) /* IFLA_PROTINFO */
5154 + nla_total_size(sizeof(struct nlattr)) /* IFLA_AF_SPEC */
5155 + nla_total_size(sizeof(u16)) /* IFLA_BRIDGE_FLAGS */
5156 + nla_total_size(sizeof(u16)); /* IFLA_BRIDGE_MODE */
5157 }
5158
rtnl_bridge_notify(struct net_device * dev)5159 static int rtnl_bridge_notify(struct net_device *dev)
5160 {
5161 struct net *net = dev_net(dev);
5162 struct sk_buff *skb;
5163 int err = -EOPNOTSUPP;
5164
5165 if (!dev->netdev_ops->ndo_bridge_getlink)
5166 return 0;
5167
5168 skb = nlmsg_new(bridge_nlmsg_size(), GFP_ATOMIC);
5169 if (!skb) {
5170 err = -ENOMEM;
5171 goto errout;
5172 }
5173
5174 err = dev->netdev_ops->ndo_bridge_getlink(skb, 0, 0, dev, 0, 0);
5175 if (err < 0)
5176 goto errout;
5177
5178 /* Notification info is only filled for bridge ports, not the bridge
5179 * device itself. Therefore, a zero notification length is valid and
5180 * should not result in an error.
5181 */
5182 if (!skb->len)
5183 goto errout;
5184
5185 rtnl_notify(skb, net, 0, RTNLGRP_LINK, NULL, GFP_ATOMIC);
5186 return 0;
5187 errout:
5188 WARN_ON(err == -EMSGSIZE);
5189 kfree_skb(skb);
5190 if (err)
5191 rtnl_set_sk_err(net, RTNLGRP_LINK, err);
5192 return err;
5193 }
5194
rtnl_bridge_setlink(struct sk_buff * skb,struct nlmsghdr * nlh,struct netlink_ext_ack * extack)5195 static int rtnl_bridge_setlink(struct sk_buff *skb, struct nlmsghdr *nlh,
5196 struct netlink_ext_ack *extack)
5197 {
5198 struct net *net = sock_net(skb->sk);
5199 struct ifinfomsg *ifm;
5200 struct net_device *dev;
5201 struct nlattr *br_spec, *attr, *br_flags_attr = NULL;
5202 int rem, err = -EOPNOTSUPP;
5203 u16 flags = 0;
5204
5205 if (nlmsg_len(nlh) < sizeof(*ifm))
5206 return -EINVAL;
5207
5208 ifm = nlmsg_data(nlh);
5209 if (ifm->ifi_family != AF_BRIDGE)
5210 return -EPFNOSUPPORT;
5211
5212 dev = __dev_get_by_index(net, ifm->ifi_index);
5213 if (!dev) {
5214 NL_SET_ERR_MSG(extack, "unknown ifindex");
5215 return -ENODEV;
5216 }
5217
5218 br_spec = nlmsg_find_attr(nlh, sizeof(struct ifinfomsg), IFLA_AF_SPEC);
5219 if (br_spec) {
5220 nla_for_each_nested(attr, br_spec, rem) {
5221 if (nla_type(attr) == IFLA_BRIDGE_FLAGS && !br_flags_attr) {
5222 if (nla_len(attr) < sizeof(flags))
5223 return -EINVAL;
5224
5225 br_flags_attr = attr;
5226 flags = nla_get_u16(attr);
5227 }
5228
5229 if (nla_type(attr) == IFLA_BRIDGE_MODE) {
5230 if (nla_len(attr) < sizeof(u16))
5231 return -EINVAL;
5232 }
5233 }
5234 }
5235
5236 if (!flags || (flags & BRIDGE_FLAGS_MASTER)) {
5237 struct net_device *br_dev = netdev_master_upper_dev_get(dev);
5238
5239 if (!br_dev || !br_dev->netdev_ops->ndo_bridge_setlink) {
5240 err = -EOPNOTSUPP;
5241 goto out;
5242 }
5243
5244 err = br_dev->netdev_ops->ndo_bridge_setlink(dev, nlh, flags,
5245 extack);
5246 if (err)
5247 goto out;
5248
5249 flags &= ~BRIDGE_FLAGS_MASTER;
5250 }
5251
5252 if ((flags & BRIDGE_FLAGS_SELF)) {
5253 if (!dev->netdev_ops->ndo_bridge_setlink)
5254 err = -EOPNOTSUPP;
5255 else
5256 err = dev->netdev_ops->ndo_bridge_setlink(dev, nlh,
5257 flags,
5258 extack);
5259 if (!err) {
5260 flags &= ~BRIDGE_FLAGS_SELF;
5261
5262 /* Generate event to notify upper layer of bridge
5263 * change
5264 */
5265 err = rtnl_bridge_notify(dev);
5266 }
5267 }
5268
5269 if (br_flags_attr)
5270 memcpy(nla_data(br_flags_attr), &flags, sizeof(flags));
5271 out:
5272 return err;
5273 }
5274
rtnl_bridge_dellink(struct sk_buff * skb,struct nlmsghdr * nlh,struct netlink_ext_ack * extack)5275 static int rtnl_bridge_dellink(struct sk_buff *skb, struct nlmsghdr *nlh,
5276 struct netlink_ext_ack *extack)
5277 {
5278 struct net *net = sock_net(skb->sk);
5279 struct ifinfomsg *ifm;
5280 struct net_device *dev;
5281 struct nlattr *br_spec, *attr = NULL;
5282 int rem, err = -EOPNOTSUPP;
5283 u16 flags = 0;
5284 bool have_flags = false;
5285
5286 if (nlmsg_len(nlh) < sizeof(*ifm))
5287 return -EINVAL;
5288
5289 ifm = nlmsg_data(nlh);
5290 if (ifm->ifi_family != AF_BRIDGE)
5291 return -EPFNOSUPPORT;
5292
5293 dev = __dev_get_by_index(net, ifm->ifi_index);
5294 if (!dev) {
5295 NL_SET_ERR_MSG(extack, "unknown ifindex");
5296 return -ENODEV;
5297 }
5298
5299 br_spec = nlmsg_find_attr(nlh, sizeof(struct ifinfomsg), IFLA_AF_SPEC);
5300 if (br_spec) {
5301 nla_for_each_nested_type(attr, IFLA_BRIDGE_FLAGS, br_spec,
5302 rem) {
5303 if (nla_len(attr) < sizeof(flags))
5304 return -EINVAL;
5305
5306 have_flags = true;
5307 flags = nla_get_u16(attr);
5308 break;
5309 }
5310 }
5311
5312 if (!flags || (flags & BRIDGE_FLAGS_MASTER)) {
5313 struct net_device *br_dev = netdev_master_upper_dev_get(dev);
5314
5315 if (!br_dev || !br_dev->netdev_ops->ndo_bridge_dellink) {
5316 err = -EOPNOTSUPP;
5317 goto out;
5318 }
5319
5320 err = br_dev->netdev_ops->ndo_bridge_dellink(dev, nlh, flags);
5321 if (err)
5322 goto out;
5323
5324 flags &= ~BRIDGE_FLAGS_MASTER;
5325 }
5326
5327 if ((flags & BRIDGE_FLAGS_SELF)) {
5328 if (!dev->netdev_ops->ndo_bridge_dellink)
5329 err = -EOPNOTSUPP;
5330 else
5331 err = dev->netdev_ops->ndo_bridge_dellink(dev, nlh,
5332 flags);
5333
5334 if (!err) {
5335 flags &= ~BRIDGE_FLAGS_SELF;
5336
5337 /* Generate event to notify upper layer of bridge
5338 * change
5339 */
5340 err = rtnl_bridge_notify(dev);
5341 }
5342 }
5343
5344 if (have_flags)
5345 memcpy(nla_data(attr), &flags, sizeof(flags));
5346 out:
5347 return err;
5348 }
5349
stats_attr_valid(unsigned int mask,int attrid,int idxattr)5350 static bool stats_attr_valid(unsigned int mask, int attrid, int idxattr)
5351 {
5352 return (mask & IFLA_STATS_FILTER_BIT(attrid)) &&
5353 (!idxattr || idxattr == attrid);
5354 }
5355
5356 static bool
rtnl_offload_xstats_have_ndo(const struct net_device * dev,int attr_id)5357 rtnl_offload_xstats_have_ndo(const struct net_device *dev, int attr_id)
5358 {
5359 return dev->netdev_ops &&
5360 dev->netdev_ops->ndo_has_offload_stats &&
5361 dev->netdev_ops->ndo_get_offload_stats &&
5362 dev->netdev_ops->ndo_has_offload_stats(dev, attr_id);
5363 }
5364
5365 static unsigned int
rtnl_offload_xstats_get_size_ndo(const struct net_device * dev,int attr_id)5366 rtnl_offload_xstats_get_size_ndo(const struct net_device *dev, int attr_id)
5367 {
5368 return rtnl_offload_xstats_have_ndo(dev, attr_id) ?
5369 sizeof(struct rtnl_link_stats64) : 0;
5370 }
5371
5372 static int
rtnl_offload_xstats_fill_ndo(struct net_device * dev,int attr_id,struct sk_buff * skb)5373 rtnl_offload_xstats_fill_ndo(struct net_device *dev, int attr_id,
5374 struct sk_buff *skb)
5375 {
5376 unsigned int size = rtnl_offload_xstats_get_size_ndo(dev, attr_id);
5377 struct nlattr *attr = NULL;
5378 void *attr_data;
5379 int err;
5380
5381 if (!size)
5382 return -ENODATA;
5383
5384 attr = nla_reserve_64bit(skb, attr_id, size,
5385 IFLA_OFFLOAD_XSTATS_UNSPEC);
5386 if (!attr)
5387 return -EMSGSIZE;
5388
5389 attr_data = nla_data(attr);
5390 memset(attr_data, 0, size);
5391
5392 err = dev->netdev_ops->ndo_get_offload_stats(attr_id, dev, attr_data);
5393 if (err)
5394 return err;
5395
5396 return 0;
5397 }
5398
5399 static unsigned int
rtnl_offload_xstats_get_size_stats(const struct net_device * dev,enum netdev_offload_xstats_type type)5400 rtnl_offload_xstats_get_size_stats(const struct net_device *dev,
5401 enum netdev_offload_xstats_type type)
5402 {
5403 bool enabled = netdev_offload_xstats_enabled(dev, type);
5404
5405 return enabled ? sizeof(struct rtnl_hw_stats64) : 0;
5406 }
5407
/* Request/usage state of one offload xstats type, as emitted in the
 * IFLA_OFFLOAD_XSTATS_HW_S_INFO_REQUEST and
 * IFLA_OFFLOAD_XSTATS_HW_S_INFO_USED attributes.
 */
struct rtnl_offload_xstats_request_used {
	/* Result of netdev_offload_xstats_enabled() for the type. */
	bool request;
	/* "used" value reported by netdev_offload_xstats_get(); false when
	 * the type is not enabled.
	 */
	bool used;
};
5412
5413 static int
rtnl_offload_xstats_get_stats(struct net_device * dev,enum netdev_offload_xstats_type type,struct rtnl_offload_xstats_request_used * ru,struct rtnl_hw_stats64 * stats,struct netlink_ext_ack * extack)5414 rtnl_offload_xstats_get_stats(struct net_device *dev,
5415 enum netdev_offload_xstats_type type,
5416 struct rtnl_offload_xstats_request_used *ru,
5417 struct rtnl_hw_stats64 *stats,
5418 struct netlink_ext_ack *extack)
5419 {
5420 bool request;
5421 bool used;
5422 int err;
5423
5424 request = netdev_offload_xstats_enabled(dev, type);
5425 if (!request) {
5426 used = false;
5427 goto out;
5428 }
5429
5430 err = netdev_offload_xstats_get(dev, type, stats, &used, extack);
5431 if (err)
5432 return err;
5433
5434 out:
5435 if (ru) {
5436 ru->request = request;
5437 ru->used = used;
5438 }
5439 return 0;
5440 }
5441
5442 static int
rtnl_offload_xstats_fill_hw_s_info_one(struct sk_buff * skb,int attr_id,struct rtnl_offload_xstats_request_used * ru)5443 rtnl_offload_xstats_fill_hw_s_info_one(struct sk_buff *skb, int attr_id,
5444 struct rtnl_offload_xstats_request_used *ru)
5445 {
5446 struct nlattr *nest;
5447
5448 nest = nla_nest_start(skb, attr_id);
5449 if (!nest)
5450 return -EMSGSIZE;
5451
5452 if (nla_put_u8(skb, IFLA_OFFLOAD_XSTATS_HW_S_INFO_REQUEST, ru->request))
5453 goto nla_put_failure;
5454
5455 if (nla_put_u8(skb, IFLA_OFFLOAD_XSTATS_HW_S_INFO_USED, ru->used))
5456 goto nla_put_failure;
5457
5458 nla_nest_end(skb, nest);
5459 return 0;
5460
5461 nla_put_failure:
5462 nla_nest_cancel(skb, nest);
5463 return -EMSGSIZE;
5464 }
5465
5466 static int
rtnl_offload_xstats_fill_hw_s_info(struct sk_buff * skb,struct net_device * dev,struct netlink_ext_ack * extack)5467 rtnl_offload_xstats_fill_hw_s_info(struct sk_buff *skb, struct net_device *dev,
5468 struct netlink_ext_ack *extack)
5469 {
5470 enum netdev_offload_xstats_type t_l3 = NETDEV_OFFLOAD_XSTATS_TYPE_L3;
5471 struct rtnl_offload_xstats_request_used ru_l3;
5472 struct nlattr *nest;
5473 int err;
5474
5475 err = rtnl_offload_xstats_get_stats(dev, t_l3, &ru_l3, NULL, extack);
5476 if (err)
5477 return err;
5478
5479 nest = nla_nest_start(skb, IFLA_OFFLOAD_XSTATS_HW_S_INFO);
5480 if (!nest)
5481 return -EMSGSIZE;
5482
5483 if (rtnl_offload_xstats_fill_hw_s_info_one(skb,
5484 IFLA_OFFLOAD_XSTATS_L3_STATS,
5485 &ru_l3))
5486 goto nla_put_failure;
5487
5488 nla_nest_end(skb, nest);
5489 return 0;
5490
5491 nla_put_failure:
5492 nla_nest_cancel(skb, nest);
5493 return -EMSGSIZE;
5494 }
5495
/*
 * Emit the attributes that live inside IFLA_STATS_LINK_OFFLOAD_XSTATS.
 *
 * @off_filter_mask selects which of the CPU_HIT, HW_S_INFO and L3_STATS
 * attributes are attempted.  @prividx is the resume marker: an attribute is
 * only attempted when *prividx is not greater than its id.  When an error is
 * returned, *prividx holds the id of the attribute that failed; on success
 * it is reset to 0.
 *
 * Returns 0 if at least one attribute was emitted, -ENODATA if none was,
 * or another negative errno on failure.
 */
static int rtnl_offload_xstats_fill(struct sk_buff *skb, struct net_device *dev,
				    int *prividx, u32 off_filter_mask,
				    struct netlink_ext_ack *extack)
{
	enum netdev_offload_xstats_type t_l3 = NETDEV_OFFLOAD_XSTATS_TYPE_L3;
	int attr_id_hw_s_info = IFLA_OFFLOAD_XSTATS_HW_S_INFO;
	int attr_id_l3_stats = IFLA_OFFLOAD_XSTATS_L3_STATS;
	int attr_id_cpu_hit = IFLA_OFFLOAD_XSTATS_CPU_HIT;
	bool have_data = false;
	int err;

	/* CPU hit stats come from the driver's ndo callback; a device that
	 * has none (-ENODATA) is silently skipped.
	 */
	if (*prividx <= attr_id_cpu_hit &&
	    (off_filter_mask &
	     IFLA_STATS_FILTER_BIT(attr_id_cpu_hit))) {
		err = rtnl_offload_xstats_fill_ndo(dev, attr_id_cpu_hit, skb);
		if (!err) {
			have_data = true;
		} else if (err != -ENODATA) {
			*prividx = attr_id_cpu_hit;
			return err;
		}
	}

	if (*prividx <= attr_id_hw_s_info &&
	    (off_filter_mask & IFLA_STATS_FILTER_BIT(attr_id_hw_s_info))) {
		/* Record the position first so that an error return leaves
		 * the marker on this attribute.
		 */
		*prividx = attr_id_hw_s_info;

		err = rtnl_offload_xstats_fill_hw_s_info(skb, dev, extack);
		if (err)
			return err;

		have_data = true;
		*prividx = 0;
	}

	if (*prividx <= attr_id_l3_stats &&
	    (off_filter_mask & IFLA_STATS_FILTER_BIT(attr_id_l3_stats))) {
		unsigned int size_l3;
		struct nlattr *attr;

		*prividx = attr_id_l3_stats;

		/* A zero size means L3 stats are not enabled on the device;
		 * nothing is emitted for them.
		 */
		size_l3 = rtnl_offload_xstats_get_size_stats(dev, t_l3);
		if (!size_l3)
			goto skip_l3_stats;
		attr = nla_reserve_64bit(skb, attr_id_l3_stats, size_l3,
					 IFLA_OFFLOAD_XSTATS_UNSPEC);
		if (!attr)
			return -EMSGSIZE;

		/* The stats are written straight into the reserved payload. */
		err = rtnl_offload_xstats_get_stats(dev, t_l3, NULL,
						    nla_data(attr), extack);
		if (err)
			return err;

		have_data = true;
skip_l3_stats:
		*prividx = 0;
	}

	if (!have_data)
		return -ENODATA;

	*prividx = 0;
	return 0;
}
5562
5563 static unsigned int
rtnl_offload_xstats_get_size_hw_s_info_one(const struct net_device * dev,enum netdev_offload_xstats_type type)5564 rtnl_offload_xstats_get_size_hw_s_info_one(const struct net_device *dev,
5565 enum netdev_offload_xstats_type type)
5566 {
5567 return nla_total_size(0) +
5568 /* IFLA_OFFLOAD_XSTATS_HW_S_INFO_REQUEST */
5569 nla_total_size(sizeof(u8)) +
5570 /* IFLA_OFFLOAD_XSTATS_HW_S_INFO_USED */
5571 nla_total_size(sizeof(u8)) +
5572 0;
5573 }
5574
5575 static unsigned int
rtnl_offload_xstats_get_size_hw_s_info(const struct net_device * dev)5576 rtnl_offload_xstats_get_size_hw_s_info(const struct net_device *dev)
5577 {
5578 enum netdev_offload_xstats_type t_l3 = NETDEV_OFFLOAD_XSTATS_TYPE_L3;
5579
5580 return nla_total_size(0) +
5581 /* IFLA_OFFLOAD_XSTATS_L3_STATS */
5582 rtnl_offload_xstats_get_size_hw_s_info_one(dev, t_l3) +
5583 0;
5584 }
5585
/*
 * Space needed for the IFLA_STATS_LINK_OFFLOAD_XSTATS nest of @dev, given
 * the nested attributes selected by @off_filter_mask.  Returns 0 when no
 * nested attribute is selected; otherwise the nest header is included.
 */
static int rtnl_offload_xstats_get_size(const struct net_device *dev,
					u32 off_filter_mask)
{
	int payload;
	int total = 0;

	if (off_filter_mask &
	    IFLA_STATS_FILTER_BIT(IFLA_OFFLOAD_XSTATS_CPU_HIT)) {
		payload = rtnl_offload_xstats_get_size_ndo(dev,
						IFLA_OFFLOAD_XSTATS_CPU_HIT);
		total += nla_total_size_64bit(payload);
	}

	if (off_filter_mask &
	    IFLA_STATS_FILTER_BIT(IFLA_OFFLOAD_XSTATS_HW_S_INFO))
		total += rtnl_offload_xstats_get_size_hw_s_info(dev);

	if (off_filter_mask &
	    IFLA_STATS_FILTER_BIT(IFLA_OFFLOAD_XSTATS_L3_STATS)) {
		payload = rtnl_offload_xstats_get_size_stats(dev,
						NETDEV_OFFLOAD_XSTATS_TYPE_L3);
		total += nla_total_size_64bit(payload);
	}

	/* Account for the enclosing nest only if something goes inside. */
	if (total)
		total += nla_total_size(0);

	return total;
}
5615
/* Filter masks that select which stats attributes a get/dump reports. */
struct rtnl_stats_dump_filters {
	/* mask[0] filters outer attributes. Then individual nests have their
	 * filtering mask at the index of the nested attribute.
	 */
	u32 mask[IFLA_STATS_MAX + 1];
};
5622
/*
 * Build one stats message of netlink type @type for @dev in @skb.
 *
 * @filters->mask[0] selects the top-level IFLA_STATS_* attributes; the
 * per-nest masks are passed on to the nest fillers.  @idxattr and @prividx
 * are resume markers: while an attribute is being emitted *idxattr holds
 * its id, and it is reset to 0 once the attribute is complete; *prividx is
 * handed to the nested fillers.  @change is not used by this function.
 *
 * Returns 0 on success or a negative errno.  On failure the message is
 * cancelled, unless NLM_F_MULTI is set in @flags and *prividx changed, in
 * which case the partially filled message is finalised and kept.
 */
static int rtnl_fill_statsinfo(struct sk_buff *skb, struct net_device *dev,
			       int type, u32 pid, u32 seq, u32 change,
			       unsigned int flags,
			       const struct rtnl_stats_dump_filters *filters,
			       int *idxattr, int *prividx,
			       struct netlink_ext_ack *extack)
{
	unsigned int filter_mask = filters->mask[0];
	struct if_stats_msg *ifsm;
	struct nlmsghdr *nlh;
	struct nlattr *attr;
	int s_prividx = *prividx;
	int err;

	ASSERT_RTNL();

	nlh = nlmsg_put(skb, pid, seq, type, sizeof(*ifsm), flags);
	if (!nlh)
		return -EMSGSIZE;

	ifsm = nlmsg_data(nlh);
	ifsm->family = PF_UNSPEC;
	ifsm->pad1 = 0;
	ifsm->pad2 = 0;
	ifsm->ifindex = dev->ifindex;
	ifsm->filter_mask = filter_mask;

	if (stats_attr_valid(filter_mask, IFLA_STATS_LINK_64, *idxattr)) {
		struct rtnl_link_stats64 *sp;

		attr = nla_reserve_64bit(skb, IFLA_STATS_LINK_64,
					 sizeof(struct rtnl_link_stats64),
					 IFLA_STATS_UNSPEC);
		if (!attr) {
			err = -EMSGSIZE;
			goto nla_put_failure;
		}

		sp = nla_data(attr);
		dev_get_stats(dev, sp);
	}

	if (stats_attr_valid(filter_mask, IFLA_STATS_LINK_XSTATS, *idxattr)) {
		const struct rtnl_link_ops *ops = dev->rtnl_link_ops;

		if (ops && ops->fill_linkxstats) {
			*idxattr = IFLA_STATS_LINK_XSTATS;
			attr = nla_nest_start_noflag(skb,
						     IFLA_STATS_LINK_XSTATS);
			if (!attr) {
				err = -EMSGSIZE;
				goto nla_put_failure;
			}

			/* The nest is closed even on error so that partial
			 * content stays well-formed if the message is kept.
			 */
			err = ops->fill_linkxstats(skb, dev, prividx, *idxattr);
			nla_nest_end(skb, attr);
			if (err)
				goto nla_put_failure;
			*idxattr = 0;
		}
	}

	if (stats_attr_valid(filter_mask, IFLA_STATS_LINK_XSTATS_SLAVE,
			     *idxattr)) {
		const struct rtnl_link_ops *ops = NULL;
		const struct net_device *master;

		/* The master's link ops report the xstats of its slave. */
		master = netdev_master_upper_dev_get(dev);
		if (master)
			ops = master->rtnl_link_ops;
		if (ops && ops->fill_linkxstats) {
			*idxattr = IFLA_STATS_LINK_XSTATS_SLAVE;
			attr = nla_nest_start_noflag(skb,
						     IFLA_STATS_LINK_XSTATS_SLAVE);
			if (!attr) {
				err = -EMSGSIZE;
				goto nla_put_failure;
			}

			err = ops->fill_linkxstats(skb, dev, prividx, *idxattr);
			nla_nest_end(skb, attr);
			if (err)
				goto nla_put_failure;
			*idxattr = 0;
		}
	}

	if (stats_attr_valid(filter_mask, IFLA_STATS_LINK_OFFLOAD_XSTATS,
			     *idxattr)) {
		u32 off_filter_mask;

		off_filter_mask = filters->mask[IFLA_STATS_LINK_OFFLOAD_XSTATS];
		*idxattr = IFLA_STATS_LINK_OFFLOAD_XSTATS;
		attr = nla_nest_start_noflag(skb,
					     IFLA_STATS_LINK_OFFLOAD_XSTATS);
		if (!attr) {
			err = -EMSGSIZE;
			goto nla_put_failure;
		}

		/* -ENODATA only means "nothing to report": drop the empty
		 * nest and carry on.
		 */
		err = rtnl_offload_xstats_fill(skb, dev, prividx,
					       off_filter_mask, extack);
		if (err == -ENODATA)
			nla_nest_cancel(skb, attr);
		else
			nla_nest_end(skb, attr);

		if (err && err != -ENODATA)
			goto nla_put_failure;
		*idxattr = 0;
	}

	if (stats_attr_valid(filter_mask, IFLA_STATS_AF_SPEC, *idxattr)) {
		struct rtnl_af_ops *af_ops;

		*idxattr = IFLA_STATS_AF_SPEC;
		attr = nla_nest_start_noflag(skb, IFLA_STATS_AF_SPEC);
		if (!attr) {
			err = -EMSGSIZE;
			goto nla_put_failure;
		}

		rcu_read_lock();
		list_for_each_entry_rcu(af_ops, &rtnl_af_ops, list) {
			struct nlattr *af;

			if (!af_ops->fill_stats_af)
				continue;

			af = nla_nest_start_noflag(skb, af_ops->family);
			if (!af) {
				rcu_read_unlock();
				err = -EMSGSIZE;
				goto nla_put_failure;
			}
			err = af_ops->fill_stats_af(skb, dev);

			if (err == -ENODATA) {
				/* The nest has been trimmed away; it must
				 * not be finalised afterwards, as that would
				 * write a length past the skb tail.
				 */
				nla_nest_cancel(skb, af);
				continue;
			}
			if (err < 0) {
				rcu_read_unlock();
				goto nla_put_failure;
			}

			nla_nest_end(skb, af);
		}
		rcu_read_unlock();

		nla_nest_end(skb, attr);

		*idxattr = 0;
	}

	nlmsg_end(skb, nlh);

	return 0;

nla_put_failure:
	/* Not a multi-part message, or no progress made: a real error. */
	if (!(flags & NLM_F_MULTI) || s_prividx == *prividx)
		nlmsg_cancel(skb, nlh);
	else
		nlmsg_end(skb, nlh);

	return err;
}
5789
if_nlmsg_stats_size(const struct net_device * dev,const struct rtnl_stats_dump_filters * filters)5790 static size_t if_nlmsg_stats_size(const struct net_device *dev,
5791 const struct rtnl_stats_dump_filters *filters)
5792 {
5793 size_t size = NLMSG_ALIGN(sizeof(struct if_stats_msg));
5794 unsigned int filter_mask = filters->mask[0];
5795
5796 if (stats_attr_valid(filter_mask, IFLA_STATS_LINK_64, 0))
5797 size += nla_total_size_64bit(sizeof(struct rtnl_link_stats64));
5798
5799 if (stats_attr_valid(filter_mask, IFLA_STATS_LINK_XSTATS, 0)) {
5800 const struct rtnl_link_ops *ops = dev->rtnl_link_ops;
5801 int attr = IFLA_STATS_LINK_XSTATS;
5802
5803 if (ops && ops->get_linkxstats_size) {
5804 size += nla_total_size(ops->get_linkxstats_size(dev,
5805 attr));
5806 /* for IFLA_STATS_LINK_XSTATS */
5807 size += nla_total_size(0);
5808 }
5809 }
5810
5811 if (stats_attr_valid(filter_mask, IFLA_STATS_LINK_XSTATS_SLAVE, 0)) {
5812 struct net_device *_dev = (struct net_device *)dev;
5813 const struct rtnl_link_ops *ops = NULL;
5814 const struct net_device *master;
5815
5816 /* netdev_master_upper_dev_get can't take const */
5817 master = netdev_master_upper_dev_get(_dev);
5818 if (master)
5819 ops = master->rtnl_link_ops;
5820 if (ops && ops->get_linkxstats_size) {
5821 int attr = IFLA_STATS_LINK_XSTATS_SLAVE;
5822
5823 size += nla_total_size(ops->get_linkxstats_size(dev,
5824 attr));
5825 /* for IFLA_STATS_LINK_XSTATS_SLAVE */
5826 size += nla_total_size(0);
5827 }
5828 }
5829
5830 if (stats_attr_valid(filter_mask, IFLA_STATS_LINK_OFFLOAD_XSTATS, 0)) {
5831 u32 off_filter_mask;
5832
5833 off_filter_mask = filters->mask[IFLA_STATS_LINK_OFFLOAD_XSTATS];
5834 size += rtnl_offload_xstats_get_size(dev, off_filter_mask);
5835 }
5836
5837 if (stats_attr_valid(filter_mask, IFLA_STATS_AF_SPEC, 0)) {
5838 struct rtnl_af_ops *af_ops;
5839
5840 /* for IFLA_STATS_AF_SPEC */
5841 size += nla_total_size(0);
5842
5843 rcu_read_lock();
5844 list_for_each_entry_rcu(af_ops, &rtnl_af_ops, list) {
5845 if (af_ops->get_stats_af_size) {
5846 size += nla_total_size(
5847 af_ops->get_stats_af_size(dev));
5848
5849 /* for AF_* */
5850 size += nla_total_size(0);
5851 }
5852 }
5853 rcu_read_unlock();
5854 }
5855
5856 return size;
5857 }
5858
/* Mask with every bit below position __IFLA_OFFLOAD_XSTATS_MAX set. */
#define RTNL_STATS_OFFLOAD_XSTATS_VALID ((1 << __IFLA_OFFLOAD_XSTATS_MAX) - 1)

/* Policy for the attributes nested in IFLA_STATS_GET_FILTERS.  Only a
 * filter for IFLA_STATS_LINK_OFFLOAD_XSTATS is described: a u32 checked
 * against RTNL_STATS_OFFLOAD_XSTATS_VALID.
 */
static const struct nla_policy
rtnl_stats_get_policy_filters[IFLA_STATS_MAX + 1] = {
	[IFLA_STATS_LINK_OFFLOAD_XSTATS] =
		    NLA_POLICY_MASK(NLA_U32, RTNL_STATS_OFFLOAD_XSTATS_VALID),
};
5866
/* Top-level attribute policy used by rtnl_stats_get_parse():
 * IFLA_STATS_GET_FILTERS is a nest validated with
 * rtnl_stats_get_policy_filters.
 */
static const struct nla_policy
rtnl_stats_get_policy[IFLA_STATS_GETSET_MAX + 1] = {
	[IFLA_STATS_GET_FILTERS] =
		    NLA_POLICY_NESTED(rtnl_stats_get_policy_filters),
};
5872
/* Attribute policy used by rtnl_stats_set():
 * IFLA_STATS_SET_OFFLOAD_XSTATS_L3_STATS is a u8 limited to a maximum of 1
 * (rtnl_stats_set() enables L3 stats on non-zero and disables them on zero).
 */
static const struct nla_policy
ifla_stats_set_policy[IFLA_STATS_GETSET_MAX + 1] = {
	[IFLA_STATS_SET_OFFLOAD_XSTATS_L3_STATS] = NLA_POLICY_MAX(NLA_U8, 1),
};
5877
rtnl_stats_get_parse_filters(struct nlattr * ifla_filters,struct rtnl_stats_dump_filters * filters,struct netlink_ext_ack * extack)5878 static int rtnl_stats_get_parse_filters(struct nlattr *ifla_filters,
5879 struct rtnl_stats_dump_filters *filters,
5880 struct netlink_ext_ack *extack)
5881 {
5882 struct nlattr *tb[IFLA_STATS_MAX + 1];
5883 int err;
5884 int at;
5885
5886 err = nla_parse_nested(tb, IFLA_STATS_MAX, ifla_filters,
5887 rtnl_stats_get_policy_filters, extack);
5888 if (err < 0)
5889 return err;
5890
5891 for (at = 1; at <= IFLA_STATS_MAX; at++) {
5892 if (tb[at]) {
5893 if (!(filters->mask[0] & IFLA_STATS_FILTER_BIT(at))) {
5894 NL_SET_ERR_MSG(extack, "Filtered attribute not enabled in filter_mask");
5895 return -EINVAL;
5896 }
5897 filters->mask[at] = nla_get_u32(tb[at]);
5898 }
5899 }
5900
5901 return 0;
5902 }
5903
/*
 * Initialise @filters from a stats request: mask[0] is @filter_mask, every
 * nested mask defaults to all ones, and an IFLA_STATS_GET_FILTERS attribute
 * in @nlh, if present, overrides the nested masks it names.
 *
 * Returns 0 on success or a negative errno.
 */
static int rtnl_stats_get_parse(const struct nlmsghdr *nlh,
				u32 filter_mask,
				struct rtnl_stats_dump_filters *filters,
				struct netlink_ext_ack *extack)
{
	struct nlattr *tb[IFLA_STATS_GETSET_MAX + 1];
	int slot;
	int err;

	filters->mask[0] = filter_mask;
	for (slot = 1; slot < ARRAY_SIZE(filters->mask); slot++)
		filters->mask[slot] = ~0U;

	err = nlmsg_parse(nlh, sizeof(struct if_stats_msg), tb,
			  IFLA_STATS_GETSET_MAX, rtnl_stats_get_policy, extack);
	if (err < 0)
		return err;

	if (!tb[IFLA_STATS_GET_FILTERS])
		return 0;

	return rtnl_stats_get_parse_filters(tb[IFLA_STATS_GET_FILTERS],
					    filters, extack);
}
5931
/*
 * Validate the header of a stats request.
 *
 * The message must be large enough for struct if_stats_msg.  With
 * @strict_check the padding must be zero, a dump (@is_dump) must not carry
 * an ifindex, and filter_mask must not have bits beyond IFLA_STATS_MAX.
 *
 * Returns 0 when the request is acceptable, -EINVAL otherwise.
 */
static int rtnl_valid_stats_req(const struct nlmsghdr *nlh, bool strict_check,
				bool is_dump, struct netlink_ext_ack *extack)
{
	const struct if_stats_msg *hdr;
	bool bad_header;

	if (nlh->nlmsg_len < nlmsg_msg_size(sizeof(*hdr))) {
		NL_SET_ERR_MSG(extack, "Invalid header for stats dump");
		return -EINVAL;
	}

	if (!strict_check)
		return 0;

	hdr = nlmsg_data(nlh);

	/* only requests using strict checks can pass data to influence
	 * the dump. The legacy exception is filter_mask.
	 */
	bad_header = hdr->pad1 || hdr->pad2 || (is_dump && hdr->ifindex);
	if (bad_header) {
		NL_SET_ERR_MSG(extack, "Invalid values in header for stats dump request");
		return -EINVAL;
	}

	if (hdr->filter_mask >= IFLA_STATS_FILTER_BIT(IFLA_STATS_MAX + 1)) {
		NL_SET_ERR_MSG(extack, "Invalid stats requested through filter mask");
		return -EINVAL;
	}

	return 0;
}
5961
rtnl_stats_get(struct sk_buff * skb,struct nlmsghdr * nlh,struct netlink_ext_ack * extack)5962 static int rtnl_stats_get(struct sk_buff *skb, struct nlmsghdr *nlh,
5963 struct netlink_ext_ack *extack)
5964 {
5965 struct rtnl_stats_dump_filters filters;
5966 struct net *net = sock_net(skb->sk);
5967 struct net_device *dev = NULL;
5968 int idxattr = 0, prividx = 0;
5969 struct if_stats_msg *ifsm;
5970 struct sk_buff *nskb;
5971 int err;
5972
5973 err = rtnl_valid_stats_req(nlh, netlink_strict_get_check(skb),
5974 false, extack);
5975 if (err)
5976 return err;
5977
5978 ifsm = nlmsg_data(nlh);
5979 if (ifsm->ifindex > 0)
5980 dev = __dev_get_by_index(net, ifsm->ifindex);
5981 else
5982 return -EINVAL;
5983
5984 if (!dev)
5985 return -ENODEV;
5986
5987 if (!ifsm->filter_mask) {
5988 NL_SET_ERR_MSG(extack, "Filter mask must be set for stats get");
5989 return -EINVAL;
5990 }
5991
5992 err = rtnl_stats_get_parse(nlh, ifsm->filter_mask, &filters, extack);
5993 if (err)
5994 return err;
5995
5996 nskb = nlmsg_new(if_nlmsg_stats_size(dev, &filters), GFP_KERNEL);
5997 if (!nskb)
5998 return -ENOBUFS;
5999
6000 err = rtnl_fill_statsinfo(nskb, dev, RTM_NEWSTATS,
6001 NETLINK_CB(skb).portid, nlh->nlmsg_seq, 0,
6002 0, &filters, &idxattr, &prividx, extack);
6003 if (err < 0) {
6004 /* -EMSGSIZE implies BUG in if_nlmsg_stats_size */
6005 WARN_ON(err == -EMSGSIZE);
6006 kfree_skb(nskb);
6007 } else {
6008 err = rtnl_unicast(nskb, net, NETLINK_CB(skb).portid);
6009 }
6010
6011 return err;
6012 }
6013
/*
 * Dump callback for stats: emits one RTM_NEWSTATS message per device of
 * the requesting socket's namespace into @skb.
 *
 * Progress is kept in cb->ctx (the ifindex cursor used by
 * for_each_netdev_dump() plus the idxattr/prividx markers passed to
 * rtnl_fill_statsinfo()).
 *
 * Returns a negative errno from validation, parsing or filling, or 0 once
 * the device walk completes without error.
 */
static int rtnl_stats_dump(struct sk_buff *skb, struct netlink_callback *cb)
{
	struct netlink_ext_ack *extack = cb->extack;
	struct rtnl_stats_dump_filters filters;
	struct net *net = sock_net(skb->sk);
	unsigned int flags = NLM_F_MULTI;
	struct if_stats_msg *ifsm;
	/* Dump state overlaid on the callback's context area. */
	struct {
		unsigned long ifindex;
		int idxattr;
		int prividx;
	} *ctx = (void *)cb->ctx;
	struct net_device *dev;
	int err;

	cb->seq = net->dev_base_seq;

	err = rtnl_valid_stats_req(cb->nlh, cb->strict_check, true, extack);
	if (err)
		return err;

	ifsm = nlmsg_data(cb->nlh);
	if (!ifsm->filter_mask) {
		NL_SET_ERR_MSG(extack, "Filter mask must be set for stats dump");
		return -EINVAL;
	}

	err = rtnl_stats_get_parse(cb->nlh, ifsm->filter_mask, &filters,
				   extack);
	if (err)
		return err;

	for_each_netdev_dump(net, dev, ctx->ifindex) {
		err = rtnl_fill_statsinfo(skb, dev, RTM_NEWSTATS,
					  NETLINK_CB(cb->skb).portid,
					  cb->nlh->nlmsg_seq, 0,
					  flags, &filters,
					  &ctx->idxattr, &ctx->prividx,
					  extack);
		/* If we ran out of room on the first message,
		 * we're in trouble.
		 */
		WARN_ON((err == -EMSGSIZE) && (skb->len == 0));

		if (err < 0)
			break;
		/* Device fully dumped: clear the per-device resume markers. */
		ctx->prividx = 0;
		ctx->idxattr = 0;
		nl_dump_check_consistent(cb, nlmsg_hdr(skb));
	}

	return err;
}
6067
rtnl_offload_xstats_notify(struct net_device * dev)6068 void rtnl_offload_xstats_notify(struct net_device *dev)
6069 {
6070 struct rtnl_stats_dump_filters response_filters = {};
6071 struct net *net = dev_net(dev);
6072 int idxattr = 0, prividx = 0;
6073 struct sk_buff *skb;
6074 int err = -ENOBUFS;
6075
6076 ASSERT_RTNL();
6077
6078 response_filters.mask[0] |=
6079 IFLA_STATS_FILTER_BIT(IFLA_STATS_LINK_OFFLOAD_XSTATS);
6080 response_filters.mask[IFLA_STATS_LINK_OFFLOAD_XSTATS] |=
6081 IFLA_STATS_FILTER_BIT(IFLA_OFFLOAD_XSTATS_HW_S_INFO);
6082
6083 skb = nlmsg_new(if_nlmsg_stats_size(dev, &response_filters),
6084 GFP_KERNEL);
6085 if (!skb)
6086 goto errout;
6087
6088 err = rtnl_fill_statsinfo(skb, dev, RTM_NEWSTATS, 0, 0, 0, 0,
6089 &response_filters, &idxattr, &prividx, NULL);
6090 if (err < 0) {
6091 kfree_skb(skb);
6092 goto errout;
6093 }
6094
6095 rtnl_notify(skb, net, 0, RTNLGRP_STATS, NULL, GFP_KERNEL);
6096 return;
6097
6098 errout:
6099 rtnl_set_sk_err(net, RTNLGRP_STATS, err);
6100 }
6101 EXPORT_SYMBOL(rtnl_offload_xstats_notify);
6102
rtnl_stats_set(struct sk_buff * skb,struct nlmsghdr * nlh,struct netlink_ext_ack * extack)6103 static int rtnl_stats_set(struct sk_buff *skb, struct nlmsghdr *nlh,
6104 struct netlink_ext_ack *extack)
6105 {
6106 enum netdev_offload_xstats_type t_l3 = NETDEV_OFFLOAD_XSTATS_TYPE_L3;
6107 struct rtnl_stats_dump_filters response_filters = {};
6108 struct nlattr *tb[IFLA_STATS_GETSET_MAX + 1];
6109 struct net *net = sock_net(skb->sk);
6110 struct net_device *dev = NULL;
6111 struct if_stats_msg *ifsm;
6112 bool notify = false;
6113 int err;
6114
6115 err = rtnl_valid_stats_req(nlh, netlink_strict_get_check(skb),
6116 false, extack);
6117 if (err)
6118 return err;
6119
6120 ifsm = nlmsg_data(nlh);
6121 if (ifsm->family != AF_UNSPEC) {
6122 NL_SET_ERR_MSG(extack, "Address family should be AF_UNSPEC");
6123 return -EINVAL;
6124 }
6125
6126 if (ifsm->ifindex > 0)
6127 dev = __dev_get_by_index(net, ifsm->ifindex);
6128 else
6129 return -EINVAL;
6130
6131 if (!dev)
6132 return -ENODEV;
6133
6134 if (ifsm->filter_mask) {
6135 NL_SET_ERR_MSG(extack, "Filter mask must be 0 for stats set");
6136 return -EINVAL;
6137 }
6138
6139 err = nlmsg_parse(nlh, sizeof(*ifsm), tb, IFLA_STATS_GETSET_MAX,
6140 ifla_stats_set_policy, extack);
6141 if (err < 0)
6142 return err;
6143
6144 if (tb[IFLA_STATS_SET_OFFLOAD_XSTATS_L3_STATS]) {
6145 u8 req = nla_get_u8(tb[IFLA_STATS_SET_OFFLOAD_XSTATS_L3_STATS]);
6146
6147 if (req)
6148 err = netdev_offload_xstats_enable(dev, t_l3, extack);
6149 else
6150 err = netdev_offload_xstats_disable(dev, t_l3);
6151
6152 if (!err)
6153 notify = true;
6154 else if (err != -EALREADY)
6155 return err;
6156
6157 response_filters.mask[0] |=
6158 IFLA_STATS_FILTER_BIT(IFLA_STATS_LINK_OFFLOAD_XSTATS);
6159 response_filters.mask[IFLA_STATS_LINK_OFFLOAD_XSTATS] |=
6160 IFLA_STATS_FILTER_BIT(IFLA_OFFLOAD_XSTATS_HW_S_INFO);
6161 }
6162
6163 if (notify)
6164 rtnl_offload_xstats_notify(dev);
6165
6166 return 0;
6167 }
6168
rtnl_mdb_valid_dump_req(const struct nlmsghdr * nlh,struct netlink_ext_ack * extack)6169 static int rtnl_mdb_valid_dump_req(const struct nlmsghdr *nlh,
6170 struct netlink_ext_ack *extack)
6171 {
6172 struct br_port_msg *bpm;
6173
6174 if (nlh->nlmsg_len < nlmsg_msg_size(sizeof(*bpm))) {
6175 NL_SET_ERR_MSG(extack, "Invalid header for mdb dump request");
6176 return -EINVAL;
6177 }
6178
6179 bpm = nlmsg_data(nlh);
6180 if (bpm->ifindex) {
6181 NL_SET_ERR_MSG(extack, "Filtering by device index is not supported for mdb dump request");
6182 return -EINVAL;
6183 }
6184 if (nlmsg_attrlen(nlh, sizeof(*bpm))) {
6185 NL_SET_ERR_MSG(extack, "Invalid data after header in mdb dump request");
6186 return -EINVAL;
6187 }
6188
6189 return 0;
6190 }
6191
/* Dump state that rtnl_mdb_dump() overlays on netlink_callback::ctx. */
struct rtnl_mdb_dump_ctx {
	/* Position in the device walk at which the next dump call resumes. */
	long idx;
};
6195
/*
 * Dump callback for MDB entries: walks the devices of the requesting
 * socket's namespace and calls ndo_mdb_dump() on each one that has it.
 *
 * The walk stops when a device reports -EMSGSIZE, and the position reached
 * is stored in the dump context so the next call resumes at that device.
 * Other return values of ndo_mdb_dump() are not propagated.
 *
 * Returns skb->len, or a negative errno if strict validation fails.
 */
static int rtnl_mdb_dump(struct sk_buff *skb, struct netlink_callback *cb)
{
	struct rtnl_mdb_dump_ctx *ctx = (void *)cb->ctx;
	struct net *net = sock_net(skb->sk);
	struct net_device *dev;
	int idx, s_idx;
	int err;

	NL_ASSERT_DUMP_CTX_FITS(struct rtnl_mdb_dump_ctx);

	if (cb->strict_check) {
		err = rtnl_mdb_valid_dump_req(cb->nlh, cb->extack);
		if (err)
			return err;
	}

	/* s_idx is where the previous call stopped; idx counts devices
	 * seen during this call.
	 */
	s_idx = ctx->idx;
	idx = 0;

	for_each_netdev(net, dev) {
		if (idx < s_idx)
			goto skip;
		if (!dev->netdev_ops->ndo_mdb_dump)
			goto skip;

		/* On -EMSGSIZE idx is left on this device, so the next call
		 * resumes with it.
		 */
		err = dev->netdev_ops->ndo_mdb_dump(dev, skb, cb);
		if (err == -EMSGSIZE)
			goto out;
		/* Moving on to next device, reset markers and sequence
		 * counters since they are all maintained per-device.
		 */
		memset(cb->ctx, 0, sizeof(cb->ctx));
		cb->prev_seq = 0;
		cb->seq = 0;
skip:
		idx++;
	}

out:
	ctx->idx = idx;
	return skb->len;
}
6238
rtnl_validate_mdb_entry_get(const struct nlattr * attr,struct netlink_ext_ack * extack)6239 static int rtnl_validate_mdb_entry_get(const struct nlattr *attr,
6240 struct netlink_ext_ack *extack)
6241 {
6242 struct br_mdb_entry *entry = nla_data(attr);
6243
6244 if (nla_len(attr) != sizeof(struct br_mdb_entry)) {
6245 NL_SET_ERR_MSG_ATTR(extack, attr, "Invalid attribute length");
6246 return -EINVAL;
6247 }
6248
6249 if (entry->ifindex) {
6250 NL_SET_ERR_MSG(extack, "Entry ifindex cannot be specified");
6251 return -EINVAL;
6252 }
6253
6254 if (entry->state) {
6255 NL_SET_ERR_MSG(extack, "Entry state cannot be specified");
6256 return -EINVAL;
6257 }
6258
6259 if (entry->flags) {
6260 NL_SET_ERR_MSG(extack, "Entry flags cannot be specified");
6261 return -EINVAL;
6262 }
6263
6264 if (entry->vid >= VLAN_VID_MASK) {
6265 NL_SET_ERR_MSG(extack, "Invalid entry VLAN id");
6266 return -EINVAL;
6267 }
6268
6269 if (entry->addr.proto != htons(ETH_P_IP) &&
6270 entry->addr.proto != htons(ETH_P_IPV6) &&
6271 entry->addr.proto != 0) {
6272 NL_SET_ERR_MSG(extack, "Unknown entry protocol");
6273 return -EINVAL;
6274 }
6275
6276 return 0;
6277 }
6278
/* Attribute policy used by rtnl_mdb_get(): MDBA_GET_ENTRY is binary data
 * checked by rtnl_validate_mdb_entry_get(), MDBA_GET_ENTRY_ATTRS is a nest.
 */
static const struct nla_policy mdba_get_policy[MDBA_GET_ENTRY_MAX + 1] = {
	[MDBA_GET_ENTRY] = NLA_POLICY_VALIDATE_FN(NLA_BINARY,
						  rtnl_validate_mdb_entry_get,
						  sizeof(struct br_mdb_entry)),
	[MDBA_GET_ENTRY_ATTRS] = { .type = NLA_NESTED },
};
6285
rtnl_mdb_get(struct sk_buff * in_skb,struct nlmsghdr * nlh,struct netlink_ext_ack * extack)6286 static int rtnl_mdb_get(struct sk_buff *in_skb, struct nlmsghdr *nlh,
6287 struct netlink_ext_ack *extack)
6288 {
6289 struct nlattr *tb[MDBA_GET_ENTRY_MAX + 1];
6290 struct net *net = sock_net(in_skb->sk);
6291 struct br_port_msg *bpm;
6292 struct net_device *dev;
6293 int err;
6294
6295 err = nlmsg_parse(nlh, sizeof(struct br_port_msg), tb,
6296 MDBA_GET_ENTRY_MAX, mdba_get_policy, extack);
6297 if (err)
6298 return err;
6299
6300 bpm = nlmsg_data(nlh);
6301 if (!bpm->ifindex) {
6302 NL_SET_ERR_MSG(extack, "Invalid ifindex");
6303 return -EINVAL;
6304 }
6305
6306 dev = __dev_get_by_index(net, bpm->ifindex);
6307 if (!dev) {
6308 NL_SET_ERR_MSG(extack, "Device doesn't exist");
6309 return -ENODEV;
6310 }
6311
6312 if (NL_REQ_ATTR_CHECK(extack, NULL, tb, MDBA_GET_ENTRY)) {
6313 NL_SET_ERR_MSG(extack, "Missing MDBA_GET_ENTRY attribute");
6314 return -EINVAL;
6315 }
6316
6317 if (!dev->netdev_ops->ndo_mdb_get) {
6318 NL_SET_ERR_MSG(extack, "Device does not support MDB operations");
6319 return -EOPNOTSUPP;
6320 }
6321
6322 return dev->netdev_ops->ndo_mdb_get(dev, tb, NETLINK_CB(in_skb).portid,
6323 nlh->nlmsg_seq, extack);
6324 }
6325
rtnl_validate_mdb_entry(const struct nlattr * attr,struct netlink_ext_ack * extack)6326 static int rtnl_validate_mdb_entry(const struct nlattr *attr,
6327 struct netlink_ext_ack *extack)
6328 {
6329 struct br_mdb_entry *entry = nla_data(attr);
6330
6331 if (nla_len(attr) != sizeof(struct br_mdb_entry)) {
6332 NL_SET_ERR_MSG_ATTR(extack, attr, "Invalid attribute length");
6333 return -EINVAL;
6334 }
6335
6336 if (entry->ifindex == 0) {
6337 NL_SET_ERR_MSG(extack, "Zero entry ifindex is not allowed");
6338 return -EINVAL;
6339 }
6340
6341 if (entry->addr.proto == htons(ETH_P_IP)) {
6342 if (!ipv4_is_multicast(entry->addr.u.ip4) &&
6343 !ipv4_is_zeronet(entry->addr.u.ip4)) {
6344 NL_SET_ERR_MSG(extack, "IPv4 entry group address is not multicast or 0.0.0.0");
6345 return -EINVAL;
6346 }
6347 if (ipv4_is_local_multicast(entry->addr.u.ip4)) {
6348 NL_SET_ERR_MSG(extack, "IPv4 entry group address is local multicast");
6349 return -EINVAL;
6350 }
6351 #if IS_ENABLED(CONFIG_IPV6)
6352 } else if (entry->addr.proto == htons(ETH_P_IPV6)) {
6353 if (ipv6_addr_is_ll_all_nodes(&entry->addr.u.ip6)) {
6354 NL_SET_ERR_MSG(extack, "IPv6 entry group address is link-local all nodes");
6355 return -EINVAL;
6356 }
6357 #endif
6358 } else if (entry->addr.proto == 0) {
6359 /* L2 mdb */
6360 if (!is_multicast_ether_addr(entry->addr.u.mac_addr)) {
6361 NL_SET_ERR_MSG(extack, "L2 entry group is not multicast");
6362 return -EINVAL;
6363 }
6364 } else {
6365 NL_SET_ERR_MSG(extack, "Unknown entry protocol");
6366 return -EINVAL;
6367 }
6368
6369 if (entry->state != MDB_PERMANENT && entry->state != MDB_TEMPORARY) {
6370 NL_SET_ERR_MSG(extack, "Unknown entry state");
6371 return -EINVAL;
6372 }
6373 if (entry->vid >= VLAN_VID_MASK) {
6374 NL_SET_ERR_MSG(extack, "Invalid entry VLAN id");
6375 return -EINVAL;
6376 }
6377
6378 return 0;
6379 }
6380
6381 static const struct nla_policy mdba_policy[MDBA_SET_ENTRY_MAX + 1] = {
6382 [MDBA_SET_ENTRY_UNSPEC] = { .strict_start_type = MDBA_SET_ENTRY_ATTRS + 1 },
6383 [MDBA_SET_ENTRY] = NLA_POLICY_VALIDATE_FN(NLA_BINARY,
6384 rtnl_validate_mdb_entry,
6385 sizeof(struct br_mdb_entry)),
6386 [MDBA_SET_ENTRY_ATTRS] = { .type = NLA_NESTED },
6387 };
6388
rtnl_mdb_add(struct sk_buff * skb,struct nlmsghdr * nlh,struct netlink_ext_ack * extack)6389 static int rtnl_mdb_add(struct sk_buff *skb, struct nlmsghdr *nlh,
6390 struct netlink_ext_ack *extack)
6391 {
6392 struct nlattr *tb[MDBA_SET_ENTRY_MAX + 1];
6393 struct net *net = sock_net(skb->sk);
6394 struct br_port_msg *bpm;
6395 struct net_device *dev;
6396 int err;
6397
6398 err = nlmsg_parse_deprecated(nlh, sizeof(*bpm), tb,
6399 MDBA_SET_ENTRY_MAX, mdba_policy, extack);
6400 if (err)
6401 return err;
6402
6403 bpm = nlmsg_data(nlh);
6404 if (!bpm->ifindex) {
6405 NL_SET_ERR_MSG(extack, "Invalid ifindex");
6406 return -EINVAL;
6407 }
6408
6409 dev = __dev_get_by_index(net, bpm->ifindex);
6410 if (!dev) {
6411 NL_SET_ERR_MSG(extack, "Device doesn't exist");
6412 return -ENODEV;
6413 }
6414
6415 if (NL_REQ_ATTR_CHECK(extack, NULL, tb, MDBA_SET_ENTRY)) {
6416 NL_SET_ERR_MSG(extack, "Missing MDBA_SET_ENTRY attribute");
6417 return -EINVAL;
6418 }
6419
6420 if (!dev->netdev_ops->ndo_mdb_add) {
6421 NL_SET_ERR_MSG(extack, "Device does not support MDB operations");
6422 return -EOPNOTSUPP;
6423 }
6424
6425 return dev->netdev_ops->ndo_mdb_add(dev, tb, nlh->nlmsg_flags, extack);
6426 }
6427
rtnl_validate_mdb_entry_del_bulk(const struct nlattr * attr,struct netlink_ext_ack * extack)6428 static int rtnl_validate_mdb_entry_del_bulk(const struct nlattr *attr,
6429 struct netlink_ext_ack *extack)
6430 {
6431 struct br_mdb_entry *entry = nla_data(attr);
6432 struct br_mdb_entry zero_entry = {};
6433
6434 if (nla_len(attr) != sizeof(struct br_mdb_entry)) {
6435 NL_SET_ERR_MSG_ATTR(extack, attr, "Invalid attribute length");
6436 return -EINVAL;
6437 }
6438
6439 if (entry->state != MDB_PERMANENT && entry->state != MDB_TEMPORARY) {
6440 NL_SET_ERR_MSG(extack, "Unknown entry state");
6441 return -EINVAL;
6442 }
6443
6444 if (entry->flags) {
6445 NL_SET_ERR_MSG(extack, "Entry flags cannot be set");
6446 return -EINVAL;
6447 }
6448
6449 if (entry->vid >= VLAN_N_VID - 1) {
6450 NL_SET_ERR_MSG(extack, "Invalid entry VLAN id");
6451 return -EINVAL;
6452 }
6453
6454 if (memcmp(&entry->addr, &zero_entry.addr, sizeof(entry->addr))) {
6455 NL_SET_ERR_MSG(extack, "Entry address cannot be set");
6456 return -EINVAL;
6457 }
6458
6459 return 0;
6460 }
6461
6462 static const struct nla_policy mdba_del_bulk_policy[MDBA_SET_ENTRY_MAX + 1] = {
6463 [MDBA_SET_ENTRY] = NLA_POLICY_VALIDATE_FN(NLA_BINARY,
6464 rtnl_validate_mdb_entry_del_bulk,
6465 sizeof(struct br_mdb_entry)),
6466 [MDBA_SET_ENTRY_ATTRS] = { .type = NLA_NESTED },
6467 };
6468
rtnl_mdb_del(struct sk_buff * skb,struct nlmsghdr * nlh,struct netlink_ext_ack * extack)6469 static int rtnl_mdb_del(struct sk_buff *skb, struct nlmsghdr *nlh,
6470 struct netlink_ext_ack *extack)
6471 {
6472 bool del_bulk = !!(nlh->nlmsg_flags & NLM_F_BULK);
6473 struct nlattr *tb[MDBA_SET_ENTRY_MAX + 1];
6474 struct net *net = sock_net(skb->sk);
6475 struct br_port_msg *bpm;
6476 struct net_device *dev;
6477 int err;
6478
6479 if (!del_bulk)
6480 err = nlmsg_parse_deprecated(nlh, sizeof(*bpm), tb,
6481 MDBA_SET_ENTRY_MAX, mdba_policy,
6482 extack);
6483 else
6484 err = nlmsg_parse(nlh, sizeof(*bpm), tb, MDBA_SET_ENTRY_MAX,
6485 mdba_del_bulk_policy, extack);
6486 if (err)
6487 return err;
6488
6489 bpm = nlmsg_data(nlh);
6490 if (!bpm->ifindex) {
6491 NL_SET_ERR_MSG(extack, "Invalid ifindex");
6492 return -EINVAL;
6493 }
6494
6495 dev = __dev_get_by_index(net, bpm->ifindex);
6496 if (!dev) {
6497 NL_SET_ERR_MSG(extack, "Device doesn't exist");
6498 return -ENODEV;
6499 }
6500
6501 if (NL_REQ_ATTR_CHECK(extack, NULL, tb, MDBA_SET_ENTRY)) {
6502 NL_SET_ERR_MSG(extack, "Missing MDBA_SET_ENTRY attribute");
6503 return -EINVAL;
6504 }
6505
6506 if (del_bulk) {
6507 if (!dev->netdev_ops->ndo_mdb_del_bulk) {
6508 NL_SET_ERR_MSG(extack, "Device does not support MDB bulk deletion");
6509 return -EOPNOTSUPP;
6510 }
6511 return dev->netdev_ops->ndo_mdb_del_bulk(dev, tb, extack);
6512 }
6513
6514 if (!dev->netdev_ops->ndo_mdb_del) {
6515 NL_SET_ERR_MSG(extack, "Device does not support MDB operations");
6516 return -EOPNOTSUPP;
6517 }
6518
6519 return dev->netdev_ops->ndo_mdb_del(dev, tb, extack);
6520 }
6521
/* Dump helpers, followed by rtnetlink_rcv_msg() which processes one rtnetlink message. */
6523
rtnl_dumpit(struct sk_buff * skb,struct netlink_callback * cb)6524 static int rtnl_dumpit(struct sk_buff *skb, struct netlink_callback *cb)
6525 {
6526 const bool needs_lock = !(cb->flags & RTNL_FLAG_DUMP_UNLOCKED);
6527 rtnl_dumpit_func dumpit = cb->data;
6528 int err;
6529
6530 /* Previous iteration have already finished, avoid calling->dumpit()
6531 * again, it may not expect to be called after it reached the end.
6532 */
6533 if (!dumpit)
6534 return 0;
6535
6536 if (needs_lock)
6537 rtnl_lock();
6538 err = dumpit(skb, cb);
6539 if (needs_lock)
6540 rtnl_unlock();
6541
6542 /* Old dump handlers used to send NLM_DONE as in a separate recvmsg().
6543 * Some applications which parse netlink manually depend on this.
6544 */
6545 if (cb->flags & RTNL_FLAG_DUMP_SPLIT_NLM_DONE) {
6546 if (err < 0 && err != -EMSGSIZE)
6547 return err;
6548 if (!err)
6549 cb->data = NULL;
6550
6551 return skb->len;
6552 }
6553 return err;
6554 }
6555
rtnetlink_dump_start(struct sock * ssk,struct sk_buff * skb,const struct nlmsghdr * nlh,struct netlink_dump_control * control)6556 static int rtnetlink_dump_start(struct sock *ssk, struct sk_buff *skb,
6557 const struct nlmsghdr *nlh,
6558 struct netlink_dump_control *control)
6559 {
6560 if (control->flags & RTNL_FLAG_DUMP_SPLIT_NLM_DONE ||
6561 !(control->flags & RTNL_FLAG_DUMP_UNLOCKED)) {
6562 WARN_ON(control->data);
6563 control->data = control->dump;
6564 control->dump = rtnl_dumpit;
6565 }
6566
6567 return netlink_dump_start(ssk, skb, nlh, control);
6568 }
6569
rtnetlink_rcv_msg(struct sk_buff * skb,struct nlmsghdr * nlh,struct netlink_ext_ack * extack)6570 static int rtnetlink_rcv_msg(struct sk_buff *skb, struct nlmsghdr *nlh,
6571 struct netlink_ext_ack *extack)
6572 {
6573 struct net *net = sock_net(skb->sk);
6574 struct rtnl_link *link;
6575 enum rtnl_kinds kind;
6576 struct module *owner;
6577 int err = -EOPNOTSUPP;
6578 rtnl_doit_func doit;
6579 unsigned int flags;
6580 int family;
6581 int type;
6582
6583 type = nlh->nlmsg_type;
6584 if (type > RTM_MAX)
6585 return -EOPNOTSUPP;
6586
6587 type -= RTM_BASE;
6588
6589 /* All the messages must have at least 1 byte length */
6590 if (nlmsg_len(nlh) < sizeof(struct rtgenmsg))
6591 return 0;
6592
6593 family = ((struct rtgenmsg *)nlmsg_data(nlh))->rtgen_family;
6594 kind = rtnl_msgtype_kind(type);
6595
6596 if (kind != RTNL_KIND_GET && !netlink_net_capable(skb, CAP_NET_ADMIN))
6597 return -EPERM;
6598
6599 rcu_read_lock();
6600 if (kind == RTNL_KIND_GET && (nlh->nlmsg_flags & NLM_F_DUMP)) {
6601 struct sock *rtnl;
6602 rtnl_dumpit_func dumpit;
6603 u32 min_dump_alloc = 0;
6604
6605 link = rtnl_get_link(family, type);
6606 if (!link || !link->dumpit) {
6607 family = PF_UNSPEC;
6608 link = rtnl_get_link(family, type);
6609 if (!link || !link->dumpit)
6610 goto err_unlock;
6611 }
6612 owner = link->owner;
6613 dumpit = link->dumpit;
6614 flags = link->flags;
6615
6616 if (type == RTM_GETLINK - RTM_BASE)
6617 min_dump_alloc = rtnl_calcit(skb, nlh);
6618
6619 err = 0;
6620 /* need to do this before rcu_read_unlock() */
6621 if (!try_module_get(owner))
6622 err = -EPROTONOSUPPORT;
6623
6624 rcu_read_unlock();
6625
6626 rtnl = net->rtnl;
6627 if (err == 0) {
6628 struct netlink_dump_control c = {
6629 .dump = dumpit,
6630 .min_dump_alloc = min_dump_alloc,
6631 .module = owner,
6632 .flags = flags,
6633 };
6634 err = rtnetlink_dump_start(rtnl, skb, nlh, &c);
6635 /* netlink_dump_start() will keep a reference on
6636 * module if dump is still in progress.
6637 */
6638 module_put(owner);
6639 }
6640 return err;
6641 }
6642
6643 link = rtnl_get_link(family, type);
6644 if (!link || !link->doit) {
6645 family = PF_UNSPEC;
6646 link = rtnl_get_link(PF_UNSPEC, type);
6647 if (!link || !link->doit)
6648 goto out_unlock;
6649 }
6650
6651 owner = link->owner;
6652 if (!try_module_get(owner)) {
6653 err = -EPROTONOSUPPORT;
6654 goto out_unlock;
6655 }
6656
6657 flags = link->flags;
6658 if (kind == RTNL_KIND_DEL && (nlh->nlmsg_flags & NLM_F_BULK) &&
6659 !(flags & RTNL_FLAG_BULK_DEL_SUPPORTED)) {
6660 NL_SET_ERR_MSG(extack, "Bulk delete is not supported");
6661 module_put(owner);
6662 goto err_unlock;
6663 }
6664
6665 if (flags & RTNL_FLAG_DOIT_UNLOCKED) {
6666 doit = link->doit;
6667 rcu_read_unlock();
6668 if (doit)
6669 err = doit(skb, nlh, extack);
6670 module_put(owner);
6671 return err;
6672 }
6673 rcu_read_unlock();
6674
6675 rtnl_lock();
6676 link = rtnl_get_link(family, type);
6677 if (link && link->doit)
6678 err = link->doit(skb, nlh, extack);
6679 rtnl_unlock();
6680
6681 module_put(owner);
6682
6683 return err;
6684
6685 out_unlock:
6686 rcu_read_unlock();
6687 return err;
6688
6689 err_unlock:
6690 rcu_read_unlock();
6691 return -EOPNOTSUPP;
6692 }
6693
rtnetlink_rcv(struct sk_buff * skb)6694 static void rtnetlink_rcv(struct sk_buff *skb)
6695 {
6696 netlink_rcv_skb(skb, &rtnetlink_rcv_msg);
6697 }
6698
rtnetlink_bind(struct net * net,int group)6699 static int rtnetlink_bind(struct net *net, int group)
6700 {
6701 switch (group) {
6702 case RTNLGRP_IPV4_MROUTE_R:
6703 case RTNLGRP_IPV6_MROUTE_R:
6704 if (!ns_capable(net->user_ns, CAP_NET_ADMIN))
6705 return -EPERM;
6706 break;
6707 }
6708 return 0;
6709 }
6710
rtnetlink_event(struct notifier_block * this,unsigned long event,void * ptr)6711 static int rtnetlink_event(struct notifier_block *this, unsigned long event, void *ptr)
6712 {
6713 struct net_device *dev = netdev_notifier_info_to_dev(ptr);
6714
6715 switch (event) {
6716 case NETDEV_REBOOT:
6717 case NETDEV_CHANGEMTU:
6718 case NETDEV_CHANGEADDR:
6719 case NETDEV_CHANGENAME:
6720 case NETDEV_FEAT_CHANGE:
6721 case NETDEV_BONDING_FAILOVER:
6722 case NETDEV_POST_TYPE_CHANGE:
6723 case NETDEV_NOTIFY_PEERS:
6724 case NETDEV_CHANGEUPPER:
6725 case NETDEV_RESEND_IGMP:
6726 case NETDEV_CHANGEINFODATA:
6727 case NETDEV_CHANGELOWERSTATE:
6728 case NETDEV_CHANGE_TX_QUEUE_LEN:
6729 rtmsg_ifinfo_event(RTM_NEWLINK, dev, 0, rtnl_get_event(event),
6730 GFP_KERNEL, NULL, 0, 0, NULL);
6731 break;
6732 default:
6733 break;
6734 }
6735 return NOTIFY_DONE;
6736 }
6737
6738 static struct notifier_block rtnetlink_dev_notifier = {
6739 .notifier_call = rtnetlink_event,
6740 };
6741
6742
rtnetlink_net_init(struct net * net)6743 static int __net_init rtnetlink_net_init(struct net *net)
6744 {
6745 struct sock *sk;
6746 struct netlink_kernel_cfg cfg = {
6747 .groups = RTNLGRP_MAX,
6748 .input = rtnetlink_rcv,
6749 .flags = NL_CFG_F_NONROOT_RECV,
6750 .bind = rtnetlink_bind,
6751 };
6752
6753 sk = netlink_kernel_create(net, NETLINK_ROUTE, &cfg);
6754 if (!sk)
6755 return -ENOMEM;
6756 net->rtnl = sk;
6757 return 0;
6758 }
6759
rtnetlink_net_exit(struct net * net)6760 static void __net_exit rtnetlink_net_exit(struct net *net)
6761 {
6762 netlink_kernel_release(net->rtnl);
6763 net->rtnl = NULL;
6764 }
6765
6766 static struct pernet_operations rtnetlink_net_ops = {
6767 .init = rtnetlink_net_init,
6768 .exit = rtnetlink_net_exit,
6769 };
6770
rtnetlink_init(void)6771 void __init rtnetlink_init(void)
6772 {
6773 if (register_pernet_subsys(&rtnetlink_net_ops))
6774 panic("rtnetlink_init: cannot initialize rtnetlink\n");
6775
6776 register_netdevice_notifier(&rtnetlink_dev_notifier);
6777
6778 rtnl_register(PF_UNSPEC, RTM_GETLINK, rtnl_getlink,
6779 rtnl_dump_ifinfo, RTNL_FLAG_DUMP_SPLIT_NLM_DONE);
6780 rtnl_register(PF_UNSPEC, RTM_SETLINK, rtnl_setlink, NULL, 0);
6781 rtnl_register(PF_UNSPEC, RTM_NEWLINK, rtnl_newlink, NULL, 0);
6782 rtnl_register(PF_UNSPEC, RTM_DELLINK, rtnl_dellink, NULL, 0);
6783
6784 rtnl_register(PF_UNSPEC, RTM_GETADDR, NULL, rtnl_dump_all, 0);
6785 rtnl_register(PF_UNSPEC, RTM_GETROUTE, NULL, rtnl_dump_all, 0);
6786 rtnl_register(PF_UNSPEC, RTM_GETNETCONF, NULL, rtnl_dump_all, 0);
6787
6788 rtnl_register(PF_UNSPEC, RTM_NEWLINKPROP, rtnl_newlinkprop, NULL, 0);
6789 rtnl_register(PF_UNSPEC, RTM_DELLINKPROP, rtnl_dellinkprop, NULL, 0);
6790
6791 rtnl_register(PF_BRIDGE, RTM_NEWNEIGH, rtnl_fdb_add, NULL, 0);
6792 rtnl_register(PF_BRIDGE, RTM_DELNEIGH, rtnl_fdb_del, NULL,
6793 RTNL_FLAG_BULK_DEL_SUPPORTED);
6794 rtnl_register(PF_BRIDGE, RTM_GETNEIGH, rtnl_fdb_get, rtnl_fdb_dump, 0);
6795
6796 rtnl_register(PF_BRIDGE, RTM_GETLINK, NULL, rtnl_bridge_getlink, 0);
6797 rtnl_register(PF_BRIDGE, RTM_DELLINK, rtnl_bridge_dellink, NULL, 0);
6798 rtnl_register(PF_BRIDGE, RTM_SETLINK, rtnl_bridge_setlink, NULL, 0);
6799
6800 rtnl_register(PF_UNSPEC, RTM_GETSTATS, rtnl_stats_get, rtnl_stats_dump,
6801 0);
6802 rtnl_register(PF_UNSPEC, RTM_SETSTATS, rtnl_stats_set, NULL, 0);
6803
6804 rtnl_register(PF_BRIDGE, RTM_GETMDB, rtnl_mdb_get, rtnl_mdb_dump, 0);
6805 rtnl_register(PF_BRIDGE, RTM_NEWMDB, rtnl_mdb_add, NULL, 0);
6806 rtnl_register(PF_BRIDGE, RTM_DELMDB, rtnl_mdb_del, NULL,
6807 RTNL_FLAG_BULK_DEL_SUPPORTED);
6808 }
6809