1 // SPDX-License-Identifier: GPL-2.0-or-later
3 * INET An implementation of the TCP/IP protocol suite for the LINUX
4 * operating system. INET is implemented using the BSD Socket
5 * interface as the means of communication with the user level.
7 * Routing netlink socket interface: protocol independent part.
12 * Vitaly E. Lavrov RTA_OK arithmetic was wrong.
15 #include <linux/bitops.h>
16 #include <linux/errno.h>
17 #include <linux/module.h>
18 #include <linux/types.h>
19 #include <linux/socket.h>
20 #include <linux/kernel.h>
21 #include <linux/timer.h>
22 #include <linux/string.h>
23 #include <linux/sockios.h>
24 #include <linux/net.h>
25 #include <linux/fcntl.h>
27 #include <linux/slab.h>
28 #include <linux/interrupt.h>
29 #include <linux/capability.h>
30 #include <linux/skbuff.h>
31 #include <linux/init.h>
32 #include <linux/security.h>
33 #include <linux/mutex.h>
34 #include <linux/if_addr.h>
35 #include <linux/if_bridge.h>
36 #include <linux/if_vlan.h>
37 #include <linux/pci.h>
38 #include <linux/etherdevice.h>
39 #include <linux/bpf.h>
41 #include <linux/uaccess.h>
43 #include <linux/inet.h>
44 #include <linux/netdevice.h>
46 #include <net/protocol.h>
48 #include <net/route.h>
52 #include <net/pkt_sched.h>
53 #include <net/fib_rules.h>
54 #include <net/rtnetlink.h>
55 #include <net/net_namespace.h>
56 #include <net/devlink.h>
57 #if IS_ENABLED(CONFIG_IPV6)
58 #include <net/addrconf.h>
60 #include <linux/dpll.h>
64 #define RTNL_MAX_TYPE 50
65 #define RTNL_SLAVE_MAX_TYPE 44
69 rtnl_dumpit_func dumpit;
75 static DEFINE_MUTEX(rtnl_mutex);
79 mutex_lock(&rtnl_mutex);
81 EXPORT_SYMBOL(rtnl_lock);
83 int rtnl_lock_killable(void)
85 return mutex_lock_killable(&rtnl_mutex);
87 EXPORT_SYMBOL(rtnl_lock_killable);
89 static struct sk_buff *defer_kfree_skb_list;
90 void rtnl_kfree_skbs(struct sk_buff *head, struct sk_buff *tail)
93 tail->next = defer_kfree_skb_list;
94 defer_kfree_skb_list = head;
97 EXPORT_SYMBOL(rtnl_kfree_skbs);
99 void __rtnl_unlock(void)
101 struct sk_buff *head = defer_kfree_skb_list;
103 defer_kfree_skb_list = NULL;
105 /* Ensure that we didn't actually add any TODO item when __rtnl_unlock()
106 * is used. In some places, e.g. in cfg80211, we have code that will do
113 * and because netdev_run_todo() acquires the RTNL for items on the list
114 * we could cause a situation such as this:
117 * unregister_netdevice()
125 * // list not empty now
126 * // because of thread 2
128 * while (!list_empty(...))
133 * However, usage of __rtnl_unlock() is rare, and so we can ensure that
134 * it's not used in cases where something is added to the todo list.
136 WARN_ON(!list_empty(&net_todo_list));
138 mutex_unlock(&rtnl_mutex);
141 struct sk_buff *next = head->next;
149 void rtnl_unlock(void)
151 /* This fellow will unlock it for us. */
154 EXPORT_SYMBOL(rtnl_unlock);
156 int rtnl_trylock(void)
158 return mutex_trylock(&rtnl_mutex);
160 EXPORT_SYMBOL(rtnl_trylock);
162 int rtnl_is_locked(void)
164 return mutex_is_locked(&rtnl_mutex);
166 EXPORT_SYMBOL(rtnl_is_locked);
168 bool refcount_dec_and_rtnl_lock(refcount_t *r)
170 return refcount_dec_and_mutex_lock(r, &rtnl_mutex);
172 EXPORT_SYMBOL(refcount_dec_and_rtnl_lock);
174 #ifdef CONFIG_PROVE_LOCKING
175 bool lockdep_rtnl_is_held(void)
177 return lockdep_is_held(&rtnl_mutex);
179 EXPORT_SYMBOL(lockdep_rtnl_is_held);
180 #endif /* #ifdef CONFIG_PROVE_LOCKING */
182 static struct rtnl_link __rcu *__rcu *rtnl_msg_handlers[RTNL_FAMILY_MAX + 1];
184 static inline int rtm_msgindex(int msgtype)
186 int msgindex = msgtype - RTM_BASE;
189 * msgindex < 0 implies someone tried to register a netlink
190 * control code. msgindex >= RTM_NR_MSGTYPES may indicate that
191 * the message type has not been added to linux/rtnetlink.h
193 BUG_ON(msgindex < 0 || msgindex >= RTM_NR_MSGTYPES);
198 static struct rtnl_link *rtnl_get_link(int protocol, int msgtype)
200 struct rtnl_link __rcu **tab;
202 if (protocol >= ARRAY_SIZE(rtnl_msg_handlers))
203 protocol = PF_UNSPEC;
205 tab = rcu_dereference_rtnl(rtnl_msg_handlers[protocol]);
207 tab = rcu_dereference_rtnl(rtnl_msg_handlers[PF_UNSPEC]);
209 return rcu_dereference_rtnl(tab[msgtype]);
212 static int rtnl_register_internal(struct module *owner,
213 int protocol, int msgtype,
214 rtnl_doit_func doit, rtnl_dumpit_func dumpit,
217 struct rtnl_link *link, *old;
218 struct rtnl_link __rcu **tab;
222 BUG_ON(protocol < 0 || protocol > RTNL_FAMILY_MAX);
223 msgindex = rtm_msgindex(msgtype);
226 tab = rtnl_dereference(rtnl_msg_handlers[protocol]);
228 tab = kcalloc(RTM_NR_MSGTYPES, sizeof(void *), GFP_KERNEL);
232 /* ensures we see the 0 stores */
233 rcu_assign_pointer(rtnl_msg_handlers[protocol], tab);
236 old = rtnl_dereference(tab[msgindex]);
238 link = kmemdup(old, sizeof(*old), GFP_KERNEL);
242 link = kzalloc(sizeof(*link), GFP_KERNEL);
247 WARN_ON(link->owner && link->owner != owner);
250 WARN_ON(doit && link->doit && link->doit != doit);
253 WARN_ON(dumpit && link->dumpit && link->dumpit != dumpit);
255 link->dumpit = dumpit;
257 WARN_ON(rtnl_msgtype_kind(msgtype) != RTNL_KIND_DEL &&
258 (flags & RTNL_FLAG_BULK_DEL_SUPPORTED));
259 link->flags |= flags;
261 /* publish protocol:msgtype */
262 rcu_assign_pointer(tab[msgindex], link);
272 * rtnl_register_module - Register a rtnetlink message type
274 * @owner: module registering the hook (THIS_MODULE)
275 * @protocol: Protocol family or PF_UNSPEC
276 * @msgtype: rtnetlink message type
277 * @doit: Function pointer called for each request message
278 * @dumpit: Function pointer called for each dump request (NLM_F_DUMP) message
279 * @flags: rtnl_link_flags to modify behaviour of doit/dumpit functions
281 * Like rtnl_register, but for use by removable modules.
283 int rtnl_register_module(struct module *owner,
284 int protocol, int msgtype,
285 rtnl_doit_func doit, rtnl_dumpit_func dumpit,
288 return rtnl_register_internal(owner, protocol, msgtype,
289 doit, dumpit, flags);
291 EXPORT_SYMBOL_GPL(rtnl_register_module);
294 * rtnl_register - Register a rtnetlink message type
295 * @protocol: Protocol family or PF_UNSPEC
296 * @msgtype: rtnetlink message type
297 * @doit: Function pointer called for each request message
298 * @dumpit: Function pointer called for each dump request (NLM_F_DUMP) message
299 * @flags: rtnl_link_flags to modify behaviour of doit/dumpit functions
301 * Registers the specified function pointers (at least one of them has
302 * to be non-NULL) to be called whenever a request message for the
303 * specified protocol family and message type is received.
305 * The special protocol family PF_UNSPEC may be used to define fallback
306 * function pointers for the case when no entry for the specific protocol
309 void rtnl_register(int protocol, int msgtype,
310 rtnl_doit_func doit, rtnl_dumpit_func dumpit,
315 err = rtnl_register_internal(NULL, protocol, msgtype, doit, dumpit,
318 pr_err("Unable to register rtnetlink message handler, "
319 "protocol = %d, message type = %d\n", protocol, msgtype);
323 * rtnl_unregister - Unregister a rtnetlink message type
324 * @protocol: Protocol family or PF_UNSPEC
325 * @msgtype: rtnetlink message type
327 * Returns 0 on success or a negative error code.
329 int rtnl_unregister(int protocol, int msgtype)
331 struct rtnl_link __rcu **tab;
332 struct rtnl_link *link;
335 BUG_ON(protocol < 0 || protocol > RTNL_FAMILY_MAX);
336 msgindex = rtm_msgindex(msgtype);
339 tab = rtnl_dereference(rtnl_msg_handlers[protocol]);
345 link = rtnl_dereference(tab[msgindex]);
346 RCU_INIT_POINTER(tab[msgindex], NULL);
349 kfree_rcu(link, rcu);
353 EXPORT_SYMBOL_GPL(rtnl_unregister);
356 * rtnl_unregister_all - Unregister all rtnetlink message types of a protocol
357 * @protocol : Protocol family or PF_UNSPEC
359 * Identical to calling rtnl_unregister() for all registered message types
360 * of a certain protocol family.
362 void rtnl_unregister_all(int protocol)
364 struct rtnl_link __rcu **tab;
365 struct rtnl_link *link;
368 BUG_ON(protocol < 0 || protocol > RTNL_FAMILY_MAX);
371 tab = rtnl_dereference(rtnl_msg_handlers[protocol]);
376 RCU_INIT_POINTER(rtnl_msg_handlers[protocol], NULL);
377 for (msgindex = 0; msgindex < RTM_NR_MSGTYPES; msgindex++) {
378 link = rtnl_dereference(tab[msgindex]);
382 RCU_INIT_POINTER(tab[msgindex], NULL);
383 kfree_rcu(link, rcu);
391 EXPORT_SYMBOL_GPL(rtnl_unregister_all);
393 static LIST_HEAD(link_ops);
395 static const struct rtnl_link_ops *rtnl_link_ops_get(const char *kind)
397 const struct rtnl_link_ops *ops;
399 list_for_each_entry(ops, &link_ops, list) {
400 if (!strcmp(ops->kind, kind))
407 * __rtnl_link_register - Register rtnl_link_ops with rtnetlink.
408 * @ops: struct rtnl_link_ops * to register
410 * The caller must hold the rtnl_mutex. This function should be used
411 * by drivers that create devices during module initialization. It
412 * must be called before registering the devices.
414 * Returns 0 on success or a negative error code.
416 int __rtnl_link_register(struct rtnl_link_ops *ops)
418 if (rtnl_link_ops_get(ops->kind))
421 /* The check for alloc/setup is here because if ops
422 * does not have that filled up, it is not possible
423 * to use the ops for creating device. So do not
424 * fill up dellink as well. That disables rtnl_dellink.
426 if ((ops->alloc || ops->setup) && !ops->dellink)
427 ops->dellink = unregister_netdevice_queue;
429 list_add_tail(&ops->list, &link_ops);
432 EXPORT_SYMBOL_GPL(__rtnl_link_register);
435 * rtnl_link_register - Register rtnl_link_ops with rtnetlink.
436 * @ops: struct rtnl_link_ops * to register
438 * Returns 0 on success or a negative error code.
440 int rtnl_link_register(struct rtnl_link_ops *ops)
444 /* Sanity-check max sizes to avoid stack buffer overflow. */
445 if (WARN_ON(ops->maxtype > RTNL_MAX_TYPE ||
446 ops->slave_maxtype > RTNL_SLAVE_MAX_TYPE))
450 err = __rtnl_link_register(ops);
454 EXPORT_SYMBOL_GPL(rtnl_link_register);
456 static void __rtnl_kill_links(struct net *net, struct rtnl_link_ops *ops)
458 struct net_device *dev;
459 LIST_HEAD(list_kill);
461 for_each_netdev(net, dev) {
462 if (dev->rtnl_link_ops == ops)
463 ops->dellink(dev, &list_kill);
465 unregister_netdevice_many(&list_kill);
469 * __rtnl_link_unregister - Unregister rtnl_link_ops from rtnetlink.
470 * @ops: struct rtnl_link_ops * to unregister
472 * The caller must hold the rtnl_mutex and guarantee net_namespace_list
473 * integrity (hold pernet_ops_rwsem for writing to close the race
474 * with setup_net() and cleanup_net()).
476 void __rtnl_link_unregister(struct rtnl_link_ops *ops)
481 __rtnl_kill_links(net, ops);
483 list_del(&ops->list);
485 EXPORT_SYMBOL_GPL(__rtnl_link_unregister);
487 /* Return with the rtnl_lock held when there are no network
488 * devices unregistering in any network namespace.
490 static void rtnl_lock_unregistering_all(void)
494 DEFINE_WAIT_FUNC(wait, woken_wake_function);
496 add_wait_queue(&netdev_unregistering_wq, &wait);
498 unregistering = false;
500 /* We hold pernet_ops_rwsem for writing, so parallel
501 * setup_net() and cleanup_net() are not possible.
504 if (atomic_read(&net->dev_unreg_count) > 0) {
505 unregistering = true;
513 wait_woken(&wait, TASK_UNINTERRUPTIBLE, MAX_SCHEDULE_TIMEOUT);
515 remove_wait_queue(&netdev_unregistering_wq, &wait);
519 * rtnl_link_unregister - Unregister rtnl_link_ops from rtnetlink.
520 * @ops: struct rtnl_link_ops * to unregister
522 void rtnl_link_unregister(struct rtnl_link_ops *ops)
524 /* Close the race with setup_net() and cleanup_net() */
525 down_write(&pernet_ops_rwsem);
526 rtnl_lock_unregistering_all();
527 __rtnl_link_unregister(ops);
529 up_write(&pernet_ops_rwsem);
531 EXPORT_SYMBOL_GPL(rtnl_link_unregister);
533 static size_t rtnl_link_get_slave_info_data_size(const struct net_device *dev)
535 struct net_device *master_dev;
536 const struct rtnl_link_ops *ops;
541 master_dev = netdev_master_upper_dev_get_rcu((struct net_device *)dev);
545 ops = master_dev->rtnl_link_ops;
546 if (!ops || !ops->get_slave_size)
548 /* IFLA_INFO_SLAVE_DATA + nested data */
549 size = nla_total_size(sizeof(struct nlattr)) +
550 ops->get_slave_size(master_dev, dev);
557 static size_t rtnl_link_get_size(const struct net_device *dev)
559 const struct rtnl_link_ops *ops = dev->rtnl_link_ops;
565 size = nla_total_size(sizeof(struct nlattr)) + /* IFLA_LINKINFO */
566 nla_total_size(strlen(ops->kind) + 1); /* IFLA_INFO_KIND */
569 /* IFLA_INFO_DATA + nested data */
570 size += nla_total_size(sizeof(struct nlattr)) +
573 if (ops->get_xstats_size)
574 /* IFLA_INFO_XSTATS */
575 size += nla_total_size(ops->get_xstats_size(dev));
577 size += rtnl_link_get_slave_info_data_size(dev);
582 static LIST_HEAD(rtnl_af_ops);
584 static const struct rtnl_af_ops *rtnl_af_lookup(const int family)
586 const struct rtnl_af_ops *ops;
590 list_for_each_entry(ops, &rtnl_af_ops, list) {
591 if (ops->family == family)
599 * rtnl_af_register - Register rtnl_af_ops with rtnetlink.
600 * @ops: struct rtnl_af_ops * to register
602 * This function does not return a value.
604 void rtnl_af_register(struct rtnl_af_ops *ops)
607 list_add_tail_rcu(&ops->list, &rtnl_af_ops);
610 EXPORT_SYMBOL_GPL(rtnl_af_register);
613 * rtnl_af_unregister - Unregister rtnl_af_ops from rtnetlink.
614 * @ops: struct rtnl_af_ops * to unregister
616 void rtnl_af_unregister(struct rtnl_af_ops *ops)
619 list_del_rcu(&ops->list);
624 EXPORT_SYMBOL_GPL(rtnl_af_unregister);
626 static size_t rtnl_link_get_af_size(const struct net_device *dev,
629 struct rtnl_af_ops *af_ops;
633 size = nla_total_size(sizeof(struct nlattr));
636 list_for_each_entry_rcu(af_ops, &rtnl_af_ops, list) {
637 if (af_ops->get_link_af_size) {
638 /* AF_* + nested data */
639 size += nla_total_size(sizeof(struct nlattr)) +
640 af_ops->get_link_af_size(dev, ext_filter_mask);
648 static bool rtnl_have_link_slave_info(const struct net_device *dev)
650 struct net_device *master_dev;
655 master_dev = netdev_master_upper_dev_get_rcu((struct net_device *)dev);
656 if (master_dev && master_dev->rtnl_link_ops)
662 static int rtnl_link_slave_info_fill(struct sk_buff *skb,
663 const struct net_device *dev)
665 struct net_device *master_dev;
666 const struct rtnl_link_ops *ops;
667 struct nlattr *slave_data;
670 master_dev = netdev_master_upper_dev_get((struct net_device *) dev);
673 ops = master_dev->rtnl_link_ops;
676 if (nla_put_string(skb, IFLA_INFO_SLAVE_KIND, ops->kind) < 0)
678 if (ops->fill_slave_info) {
679 slave_data = nla_nest_start_noflag(skb, IFLA_INFO_SLAVE_DATA);
682 err = ops->fill_slave_info(skb, master_dev, dev);
684 goto err_cancel_slave_data;
685 nla_nest_end(skb, slave_data);
689 err_cancel_slave_data:
690 nla_nest_cancel(skb, slave_data);
694 static int rtnl_link_info_fill(struct sk_buff *skb,
695 const struct net_device *dev)
697 const struct rtnl_link_ops *ops = dev->rtnl_link_ops;
703 if (nla_put_string(skb, IFLA_INFO_KIND, ops->kind) < 0)
705 if (ops->fill_xstats) {
706 err = ops->fill_xstats(skb, dev);
710 if (ops->fill_info) {
711 data = nla_nest_start_noflag(skb, IFLA_INFO_DATA);
714 err = ops->fill_info(skb, dev);
716 goto err_cancel_data;
717 nla_nest_end(skb, data);
722 nla_nest_cancel(skb, data);
726 static int rtnl_link_fill(struct sk_buff *skb, const struct net_device *dev)
728 struct nlattr *linkinfo;
731 linkinfo = nla_nest_start_noflag(skb, IFLA_LINKINFO);
732 if (linkinfo == NULL)
735 err = rtnl_link_info_fill(skb, dev);
737 goto err_cancel_link;
739 err = rtnl_link_slave_info_fill(skb, dev);
741 goto err_cancel_link;
743 nla_nest_end(skb, linkinfo);
747 nla_nest_cancel(skb, linkinfo);
752 int rtnetlink_send(struct sk_buff *skb, struct net *net, u32 pid, unsigned int group, int echo)
754 struct sock *rtnl = net->rtnl;
756 return nlmsg_notify(rtnl, skb, pid, group, echo, GFP_KERNEL);
759 int rtnl_unicast(struct sk_buff *skb, struct net *net, u32 pid)
761 struct sock *rtnl = net->rtnl;
763 return nlmsg_unicast(rtnl, skb, pid);
765 EXPORT_SYMBOL(rtnl_unicast);
767 void rtnl_notify(struct sk_buff *skb, struct net *net, u32 pid, u32 group,
768 const struct nlmsghdr *nlh, gfp_t flags)
770 struct sock *rtnl = net->rtnl;
772 nlmsg_notify(rtnl, skb, pid, group, nlmsg_report(nlh), flags);
774 EXPORT_SYMBOL(rtnl_notify);
776 void rtnl_set_sk_err(struct net *net, u32 group, int error)
778 struct sock *rtnl = net->rtnl;
780 netlink_set_err(rtnl, 0, group, error);
782 EXPORT_SYMBOL(rtnl_set_sk_err);
784 int rtnetlink_put_metrics(struct sk_buff *skb, u32 *metrics)
789 /* nothing is dumped for dst_default_metrics, so just skip the loop */
790 if (metrics == dst_default_metrics.metrics)
793 mx = nla_nest_start_noflag(skb, RTA_METRICS);
797 for (i = 0; i < RTAX_MAX; i++) {
799 if (i == RTAX_CC_ALGO - 1) {
800 char tmp[TCP_CA_NAME_MAX], *name;
802 name = tcp_ca_get_name_by_key(metrics[i], tmp);
805 if (nla_put_string(skb, i + 1, name))
806 goto nla_put_failure;
807 } else if (i == RTAX_FEATURES - 1) {
808 u32 user_features = metrics[i] & RTAX_FEATURE_MASK;
812 BUILD_BUG_ON(RTAX_FEATURE_MASK & DST_FEATURE_MASK);
813 if (nla_put_u32(skb, i + 1, user_features))
814 goto nla_put_failure;
816 if (nla_put_u32(skb, i + 1, metrics[i]))
817 goto nla_put_failure;
824 nla_nest_cancel(skb, mx);
828 return nla_nest_end(skb, mx);
831 nla_nest_cancel(skb, mx);
834 EXPORT_SYMBOL(rtnetlink_put_metrics);
836 int rtnl_put_cacheinfo(struct sk_buff *skb, struct dst_entry *dst, u32 id,
837 long expires, u32 error)
839 struct rta_cacheinfo ci = {
845 ci.rta_lastuse = jiffies_delta_to_clock_t(jiffies - dst->lastuse);
846 ci.rta_used = dst->__use;
847 ci.rta_clntref = rcuref_read(&dst->__rcuref);
852 clock = jiffies_to_clock_t(abs(expires));
853 clock = min_t(unsigned long, clock, INT_MAX);
854 ci.rta_expires = (expires > 0) ? clock : -clock;
856 return nla_put(skb, RTA_CACHEINFO, sizeof(ci), &ci);
858 EXPORT_SYMBOL_GPL(rtnl_put_cacheinfo);
860 static void set_operstate(struct net_device *dev, unsigned char transition)
862 unsigned char operstate = dev->operstate;
864 switch (transition) {
866 if ((operstate == IF_OPER_DORMANT ||
867 operstate == IF_OPER_TESTING ||
868 operstate == IF_OPER_UNKNOWN) &&
869 !netif_dormant(dev) && !netif_testing(dev))
870 operstate = IF_OPER_UP;
873 case IF_OPER_TESTING:
874 if (netif_oper_up(dev))
875 operstate = IF_OPER_TESTING;
878 case IF_OPER_DORMANT:
879 if (netif_oper_up(dev))
880 operstate = IF_OPER_DORMANT;
884 if (dev->operstate != operstate) {
885 write_lock(&dev_base_lock);
886 dev->operstate = operstate;
887 write_unlock(&dev_base_lock);
888 netdev_state_change(dev);
892 static unsigned int rtnl_dev_get_flags(const struct net_device *dev)
894 return (dev->flags & ~(IFF_PROMISC | IFF_ALLMULTI)) |
895 (dev->gflags & (IFF_PROMISC | IFF_ALLMULTI));
898 static unsigned int rtnl_dev_combine_flags(const struct net_device *dev,
899 const struct ifinfomsg *ifm)
901 unsigned int flags = ifm->ifi_flags;
903 /* bugwards compatibility: ifi_change == 0 is treated as ~0 */
905 flags = (flags & ifm->ifi_change) |
906 (rtnl_dev_get_flags(dev) & ~ifm->ifi_change);
911 static void copy_rtnl_link_stats(struct rtnl_link_stats *a,
912 const struct rtnl_link_stats64 *b)
914 a->rx_packets = b->rx_packets;
915 a->tx_packets = b->tx_packets;
916 a->rx_bytes = b->rx_bytes;
917 a->tx_bytes = b->tx_bytes;
918 a->rx_errors = b->rx_errors;
919 a->tx_errors = b->tx_errors;
920 a->rx_dropped = b->rx_dropped;
921 a->tx_dropped = b->tx_dropped;
923 a->multicast = b->multicast;
924 a->collisions = b->collisions;
926 a->rx_length_errors = b->rx_length_errors;
927 a->rx_over_errors = b->rx_over_errors;
928 a->rx_crc_errors = b->rx_crc_errors;
929 a->rx_frame_errors = b->rx_frame_errors;
930 a->rx_fifo_errors = b->rx_fifo_errors;
931 a->rx_missed_errors = b->rx_missed_errors;
933 a->tx_aborted_errors = b->tx_aborted_errors;
934 a->tx_carrier_errors = b->tx_carrier_errors;
935 a->tx_fifo_errors = b->tx_fifo_errors;
936 a->tx_heartbeat_errors = b->tx_heartbeat_errors;
937 a->tx_window_errors = b->tx_window_errors;
939 a->rx_compressed = b->rx_compressed;
940 a->tx_compressed = b->tx_compressed;
942 a->rx_nohandler = b->rx_nohandler;
946 static inline int rtnl_vfinfo_size(const struct net_device *dev,
949 if (dev->dev.parent && (ext_filter_mask & RTEXT_FILTER_VF)) {
950 int num_vfs = dev_num_vf(dev->dev.parent);
951 size_t size = nla_total_size(0);
954 nla_total_size(sizeof(struct ifla_vf_mac)) +
955 nla_total_size(sizeof(struct ifla_vf_broadcast)) +
956 nla_total_size(sizeof(struct ifla_vf_vlan)) +
957 nla_total_size(0) + /* nest IFLA_VF_VLAN_LIST */
958 nla_total_size(MAX_VLAN_LIST_LEN *
959 sizeof(struct ifla_vf_vlan_info)) +
960 nla_total_size(sizeof(struct ifla_vf_spoofchk)) +
961 nla_total_size(sizeof(struct ifla_vf_tx_rate)) +
962 nla_total_size(sizeof(struct ifla_vf_rate)) +
963 nla_total_size(sizeof(struct ifla_vf_link_state)) +
964 nla_total_size(sizeof(struct ifla_vf_rss_query_en)) +
965 nla_total_size(sizeof(struct ifla_vf_trust)));
966 if (~ext_filter_mask & RTEXT_FILTER_SKIP_STATS) {
968 (nla_total_size(0) + /* nest IFLA_VF_STATS */
969 /* IFLA_VF_STATS_RX_PACKETS */
970 nla_total_size_64bit(sizeof(__u64)) +
971 /* IFLA_VF_STATS_TX_PACKETS */
972 nla_total_size_64bit(sizeof(__u64)) +
973 /* IFLA_VF_STATS_RX_BYTES */
974 nla_total_size_64bit(sizeof(__u64)) +
975 /* IFLA_VF_STATS_TX_BYTES */
976 nla_total_size_64bit(sizeof(__u64)) +
977 /* IFLA_VF_STATS_BROADCAST */
978 nla_total_size_64bit(sizeof(__u64)) +
979 /* IFLA_VF_STATS_MULTICAST */
980 nla_total_size_64bit(sizeof(__u64)) +
981 /* IFLA_VF_STATS_RX_DROPPED */
982 nla_total_size_64bit(sizeof(__u64)) +
983 /* IFLA_VF_STATS_TX_DROPPED */
984 nla_total_size_64bit(sizeof(__u64)));
991 static size_t rtnl_port_size(const struct net_device *dev,
994 size_t port_size = nla_total_size(4) /* PORT_VF */
995 + nla_total_size(PORT_PROFILE_MAX) /* PORT_PROFILE */
996 + nla_total_size(PORT_UUID_MAX) /* PORT_INSTANCE_UUID */
997 + nla_total_size(PORT_UUID_MAX) /* PORT_HOST_UUID */
998 + nla_total_size(1) /* PROT_VDP_REQUEST */
999 + nla_total_size(2); /* PORT_VDP_RESPONSE */
1000 size_t vf_ports_size = nla_total_size(sizeof(struct nlattr));
1001 size_t vf_port_size = nla_total_size(sizeof(struct nlattr))
1003 size_t port_self_size = nla_total_size(sizeof(struct nlattr))
1006 if (!dev->netdev_ops->ndo_get_vf_port || !dev->dev.parent ||
1007 !(ext_filter_mask & RTEXT_FILTER_VF))
1009 if (dev_num_vf(dev->dev.parent))
1010 return port_self_size + vf_ports_size +
1011 vf_port_size * dev_num_vf(dev->dev.parent);
1013 return port_self_size;
1016 static size_t rtnl_xdp_size(void)
1018 size_t xdp_size = nla_total_size(0) + /* nest IFLA_XDP */
1019 nla_total_size(1) + /* XDP_ATTACHED */
1020 nla_total_size(4) + /* XDP_PROG_ID (or 1st mode) */
1021 nla_total_size(4); /* XDP_<mode>_PROG_ID */
1026 static size_t rtnl_prop_list_size(const struct net_device *dev)
1028 struct netdev_name_node *name_node;
1031 if (list_empty(&dev->name_node->list))
1033 size = nla_total_size(0);
1034 list_for_each_entry(name_node, &dev->name_node->list, list)
1035 size += nla_total_size(ALTIFNAMSIZ);
1039 static size_t rtnl_proto_down_size(const struct net_device *dev)
1041 size_t size = nla_total_size(1);
1043 if (dev->proto_down_reason)
1044 size += nla_total_size(0) + nla_total_size(4);
1049 static size_t rtnl_devlink_port_size(const struct net_device *dev)
1051 size_t size = nla_total_size(0); /* nest IFLA_DEVLINK_PORT */
1053 if (dev->devlink_port)
1054 size += devlink_nl_port_handle_size(dev->devlink_port);
1059 static size_t rtnl_dpll_pin_size(const struct net_device *dev)
1061 size_t size = nla_total_size(0); /* nest IFLA_DPLL_PIN */
1063 size += dpll_msg_pin_handle_size(netdev_dpll_pin(dev));
1068 static noinline size_t if_nlmsg_size(const struct net_device *dev,
1069 u32 ext_filter_mask)
1071 return NLMSG_ALIGN(sizeof(struct ifinfomsg))
1072 + nla_total_size(IFNAMSIZ) /* IFLA_IFNAME */
1073 + nla_total_size(IFALIASZ) /* IFLA_IFALIAS */
1074 + nla_total_size(IFNAMSIZ) /* IFLA_QDISC */
1075 + nla_total_size_64bit(sizeof(struct rtnl_link_ifmap))
1076 + nla_total_size(sizeof(struct rtnl_link_stats))
1077 + nla_total_size_64bit(sizeof(struct rtnl_link_stats64))
1078 + nla_total_size(MAX_ADDR_LEN) /* IFLA_ADDRESS */
1079 + nla_total_size(MAX_ADDR_LEN) /* IFLA_BROADCAST */
1080 + nla_total_size(4) /* IFLA_TXQLEN */
1081 + nla_total_size(4) /* IFLA_WEIGHT */
1082 + nla_total_size(4) /* IFLA_MTU */
1083 + nla_total_size(4) /* IFLA_LINK */
1084 + nla_total_size(4) /* IFLA_MASTER */
1085 + nla_total_size(1) /* IFLA_CARRIER */
1086 + nla_total_size(4) /* IFLA_PROMISCUITY */
1087 + nla_total_size(4) /* IFLA_ALLMULTI */
1088 + nla_total_size(4) /* IFLA_NUM_TX_QUEUES */
1089 + nla_total_size(4) /* IFLA_NUM_RX_QUEUES */
1090 + nla_total_size(4) /* IFLA_GSO_MAX_SEGS */
1091 + nla_total_size(4) /* IFLA_GSO_MAX_SIZE */
1092 + nla_total_size(4) /* IFLA_GRO_MAX_SIZE */
1093 + nla_total_size(4) /* IFLA_GSO_IPV4_MAX_SIZE */
1094 + nla_total_size(4) /* IFLA_GRO_IPV4_MAX_SIZE */
1095 + nla_total_size(4) /* IFLA_TSO_MAX_SIZE */
1096 + nla_total_size(4) /* IFLA_TSO_MAX_SEGS */
1097 + nla_total_size(1) /* IFLA_OPERSTATE */
1098 + nla_total_size(1) /* IFLA_LINKMODE */
1099 + nla_total_size(4) /* IFLA_CARRIER_CHANGES */
1100 + nla_total_size(4) /* IFLA_LINK_NETNSID */
1101 + nla_total_size(4) /* IFLA_GROUP */
1102 + nla_total_size(ext_filter_mask
1103 & RTEXT_FILTER_VF ? 4 : 0) /* IFLA_NUM_VF */
1104 + rtnl_vfinfo_size(dev, ext_filter_mask) /* IFLA_VFINFO_LIST */
1105 + rtnl_port_size(dev, ext_filter_mask) /* IFLA_VF_PORTS + IFLA_PORT_SELF */
1106 + rtnl_link_get_size(dev) /* IFLA_LINKINFO */
1107 + rtnl_link_get_af_size(dev, ext_filter_mask) /* IFLA_AF_SPEC */
1108 + nla_total_size(MAX_PHYS_ITEM_ID_LEN) /* IFLA_PHYS_PORT_ID */
1109 + nla_total_size(MAX_PHYS_ITEM_ID_LEN) /* IFLA_PHYS_SWITCH_ID */
1110 + nla_total_size(IFNAMSIZ) /* IFLA_PHYS_PORT_NAME */
1111 + rtnl_xdp_size() /* IFLA_XDP */
1112 + nla_total_size(4) /* IFLA_EVENT */
1113 + nla_total_size(4) /* IFLA_NEW_NETNSID */
1114 + nla_total_size(4) /* IFLA_NEW_IFINDEX */
1115 + rtnl_proto_down_size(dev) /* proto down */
1116 + nla_total_size(4) /* IFLA_TARGET_NETNSID */
1117 + nla_total_size(4) /* IFLA_CARRIER_UP_COUNT */
1118 + nla_total_size(4) /* IFLA_CARRIER_DOWN_COUNT */
1119 + nla_total_size(4) /* IFLA_MIN_MTU */
1120 + nla_total_size(4) /* IFLA_MAX_MTU */
1121 + rtnl_prop_list_size(dev)
1122 + nla_total_size(MAX_ADDR_LEN) /* IFLA_PERM_ADDRESS */
1123 + rtnl_devlink_port_size(dev)
1124 + rtnl_dpll_pin_size(dev)
1128 static int rtnl_vf_ports_fill(struct sk_buff *skb, struct net_device *dev)
1130 struct nlattr *vf_ports;
1131 struct nlattr *vf_port;
1135 vf_ports = nla_nest_start_noflag(skb, IFLA_VF_PORTS);
1139 for (vf = 0; vf < dev_num_vf(dev->dev.parent); vf++) {
1140 vf_port = nla_nest_start_noflag(skb, IFLA_VF_PORT);
1142 goto nla_put_failure;
1143 if (nla_put_u32(skb, IFLA_PORT_VF, vf))
1144 goto nla_put_failure;
1145 err = dev->netdev_ops->ndo_get_vf_port(dev, vf, skb);
1146 if (err == -EMSGSIZE)
1147 goto nla_put_failure;
1149 nla_nest_cancel(skb, vf_port);
1152 nla_nest_end(skb, vf_port);
1155 nla_nest_end(skb, vf_ports);
1160 nla_nest_cancel(skb, vf_ports);
1164 static int rtnl_port_self_fill(struct sk_buff *skb, struct net_device *dev)
1166 struct nlattr *port_self;
1169 port_self = nla_nest_start_noflag(skb, IFLA_PORT_SELF);
1173 err = dev->netdev_ops->ndo_get_vf_port(dev, PORT_SELF_VF, skb);
1175 nla_nest_cancel(skb, port_self);
1176 return (err == -EMSGSIZE) ? err : 0;
1179 nla_nest_end(skb, port_self);
1184 static int rtnl_port_fill(struct sk_buff *skb, struct net_device *dev,
1185 u32 ext_filter_mask)
1189 if (!dev->netdev_ops->ndo_get_vf_port || !dev->dev.parent ||
1190 !(ext_filter_mask & RTEXT_FILTER_VF))
1193 err = rtnl_port_self_fill(skb, dev);
1197 if (dev_num_vf(dev->dev.parent)) {
1198 err = rtnl_vf_ports_fill(skb, dev);
1206 static int rtnl_phys_port_id_fill(struct sk_buff *skb, struct net_device *dev)
1209 struct netdev_phys_item_id ppid;
1211 err = dev_get_phys_port_id(dev, &ppid);
1213 if (err == -EOPNOTSUPP)
1218 if (nla_put(skb, IFLA_PHYS_PORT_ID, ppid.id_len, ppid.id))
1224 static int rtnl_phys_port_name_fill(struct sk_buff *skb, struct net_device *dev)
1226 char name[IFNAMSIZ];
1229 err = dev_get_phys_port_name(dev, name, sizeof(name));
1231 if (err == -EOPNOTSUPP)
1236 if (nla_put_string(skb, IFLA_PHYS_PORT_NAME, name))
1242 static int rtnl_phys_switch_id_fill(struct sk_buff *skb, struct net_device *dev)
1244 struct netdev_phys_item_id ppid = { };
1247 err = dev_get_port_parent_id(dev, &ppid, false);
1249 if (err == -EOPNOTSUPP)
1254 if (nla_put(skb, IFLA_PHYS_SWITCH_ID, ppid.id_len, ppid.id))
1260 static noinline_for_stack int rtnl_fill_stats(struct sk_buff *skb,
1261 struct net_device *dev)
1263 struct rtnl_link_stats64 *sp;
1264 struct nlattr *attr;
1266 attr = nla_reserve_64bit(skb, IFLA_STATS64,
1267 sizeof(struct rtnl_link_stats64), IFLA_PAD);
1271 sp = nla_data(attr);
1272 dev_get_stats(dev, sp);
1274 attr = nla_reserve(skb, IFLA_STATS,
1275 sizeof(struct rtnl_link_stats));
1279 copy_rtnl_link_stats(nla_data(attr), sp);
1284 static noinline_for_stack int rtnl_fill_vfinfo(struct sk_buff *skb,
1285 struct net_device *dev,
1287 u32 ext_filter_mask)
1289 struct ifla_vf_rss_query_en vf_rss_query_en;
1290 struct nlattr *vf, *vfstats, *vfvlanlist;
1291 struct ifla_vf_link_state vf_linkstate;
1292 struct ifla_vf_vlan_info vf_vlan_info;
1293 struct ifla_vf_spoofchk vf_spoofchk;
1294 struct ifla_vf_tx_rate vf_tx_rate;
1295 struct ifla_vf_stats vf_stats;
1296 struct ifla_vf_trust vf_trust;
1297 struct ifla_vf_vlan vf_vlan;
1298 struct ifla_vf_rate vf_rate;
1299 struct ifla_vf_mac vf_mac;
1300 struct ifla_vf_broadcast vf_broadcast;
1301 struct ifla_vf_info ivi;
1302 struct ifla_vf_guid node_guid;
1303 struct ifla_vf_guid port_guid;
1305 memset(&ivi, 0, sizeof(ivi));
1307 /* Not all SR-IOV capable drivers support the
1308 * spoofcheck and "RSS query enable" query. Preset to
1309 * -1 so the user space tool can detect that the driver
1310 * didn't report anything.
1313 ivi.rss_query_en = -1;
1315 /* The default value for VF link state is "auto"
1316 * IFLA_VF_LINK_STATE_AUTO which equals zero
1319 /* VLAN Protocol by default is 802.1Q */
1320 ivi.vlan_proto = htons(ETH_P_8021Q);
1321 if (dev->netdev_ops->ndo_get_vf_config(dev, vfs_num, &ivi))
1324 memset(&vf_vlan_info, 0, sizeof(vf_vlan_info));
1325 memset(&node_guid, 0, sizeof(node_guid));
1326 memset(&port_guid, 0, sizeof(port_guid));
1335 vf_rss_query_en.vf =
1338 port_guid.vf = ivi.vf;
1340 memcpy(vf_mac.mac, ivi.mac, sizeof(ivi.mac));
1341 memcpy(vf_broadcast.broadcast, dev->broadcast, dev->addr_len);
1342 vf_vlan.vlan = ivi.vlan;
1343 vf_vlan.qos = ivi.qos;
1344 vf_vlan_info.vlan = ivi.vlan;
1345 vf_vlan_info.qos = ivi.qos;
1346 vf_vlan_info.vlan_proto = ivi.vlan_proto;
1347 vf_tx_rate.rate = ivi.max_tx_rate;
1348 vf_rate.min_tx_rate = ivi.min_tx_rate;
1349 vf_rate.max_tx_rate = ivi.max_tx_rate;
1350 vf_spoofchk.setting = ivi.spoofchk;
1351 vf_linkstate.link_state = ivi.linkstate;
1352 vf_rss_query_en.setting = ivi.rss_query_en;
1353 vf_trust.setting = ivi.trusted;
1354 vf = nla_nest_start_noflag(skb, IFLA_VF_INFO);
1357 if (nla_put(skb, IFLA_VF_MAC, sizeof(vf_mac), &vf_mac) ||
1358 nla_put(skb, IFLA_VF_BROADCAST, sizeof(vf_broadcast), &vf_broadcast) ||
1359 nla_put(skb, IFLA_VF_VLAN, sizeof(vf_vlan), &vf_vlan) ||
1360 nla_put(skb, IFLA_VF_RATE, sizeof(vf_rate),
1362 nla_put(skb, IFLA_VF_TX_RATE, sizeof(vf_tx_rate),
1364 nla_put(skb, IFLA_VF_SPOOFCHK, sizeof(vf_spoofchk),
1366 nla_put(skb, IFLA_VF_LINK_STATE, sizeof(vf_linkstate),
1368 nla_put(skb, IFLA_VF_RSS_QUERY_EN,
1369 sizeof(vf_rss_query_en),
1370 &vf_rss_query_en) ||
1371 nla_put(skb, IFLA_VF_TRUST,
1372 sizeof(vf_trust), &vf_trust))
1373 goto nla_put_vf_failure;
1375 if (dev->netdev_ops->ndo_get_vf_guid &&
1376 !dev->netdev_ops->ndo_get_vf_guid(dev, vfs_num, &node_guid,
1378 if (nla_put(skb, IFLA_VF_IB_NODE_GUID, sizeof(node_guid),
1380 nla_put(skb, IFLA_VF_IB_PORT_GUID, sizeof(port_guid),
1382 goto nla_put_vf_failure;
1384 vfvlanlist = nla_nest_start_noflag(skb, IFLA_VF_VLAN_LIST);
1386 goto nla_put_vf_failure;
1387 if (nla_put(skb, IFLA_VF_VLAN_INFO, sizeof(vf_vlan_info),
1389 nla_nest_cancel(skb, vfvlanlist);
1390 goto nla_put_vf_failure;
1392 nla_nest_end(skb, vfvlanlist);
1393 if (~ext_filter_mask & RTEXT_FILTER_SKIP_STATS) {
1394 memset(&vf_stats, 0, sizeof(vf_stats));
1395 if (dev->netdev_ops->ndo_get_vf_stats)
1396 dev->netdev_ops->ndo_get_vf_stats(dev, vfs_num,
1398 vfstats = nla_nest_start_noflag(skb, IFLA_VF_STATS);
1400 goto nla_put_vf_failure;
1401 if (nla_put_u64_64bit(skb, IFLA_VF_STATS_RX_PACKETS,
1402 vf_stats.rx_packets, IFLA_VF_STATS_PAD) ||
1403 nla_put_u64_64bit(skb, IFLA_VF_STATS_TX_PACKETS,
1404 vf_stats.tx_packets, IFLA_VF_STATS_PAD) ||
1405 nla_put_u64_64bit(skb, IFLA_VF_STATS_RX_BYTES,
1406 vf_stats.rx_bytes, IFLA_VF_STATS_PAD) ||
1407 nla_put_u64_64bit(skb, IFLA_VF_STATS_TX_BYTES,
1408 vf_stats.tx_bytes, IFLA_VF_STATS_PAD) ||
1409 nla_put_u64_64bit(skb, IFLA_VF_STATS_BROADCAST,
1410 vf_stats.broadcast, IFLA_VF_STATS_PAD) ||
1411 nla_put_u64_64bit(skb, IFLA_VF_STATS_MULTICAST,
1412 vf_stats.multicast, IFLA_VF_STATS_PAD) ||
1413 nla_put_u64_64bit(skb, IFLA_VF_STATS_RX_DROPPED,
1414 vf_stats.rx_dropped, IFLA_VF_STATS_PAD) ||
1415 nla_put_u64_64bit(skb, IFLA_VF_STATS_TX_DROPPED,
1416 vf_stats.tx_dropped, IFLA_VF_STATS_PAD)) {
1417 nla_nest_cancel(skb, vfstats);
1418 goto nla_put_vf_failure;
1420 nla_nest_end(skb, vfstats);
1422 nla_nest_end(skb, vf);
1426 nla_nest_cancel(skb, vf);
// rtnl_fill_vf - add the virtual function (VF) attributes of @dev to @skb.
// @skb: netlink message being built
// @dev: device whose VFs are described
// @ext_filter_mask: RTEXT_FILTER_* bits from the request
//
// Emits IFLA_NUM_VF and then an IFLA_VFINFO_LIST nest holding one
// rtnl_fill_vfinfo() entry per VF.
// NOTE(review): the statements executed on each early-exit branch (and thus
// the exact return values) are not visible in this listing.
1430 static noinline_for_stack int rtnl_fill_vf(struct sk_buff *skb,
1431 struct net_device *dev,
1432 u32 ext_filter_mask)
1434 struct nlattr *vfinfo;
// VF data is only considered for devices with a parent device and only when
// the request set RTEXT_FILTER_VF.
1437 if (!dev->dev.parent || ((ext_filter_mask & RTEXT_FILTER_VF) == 0))
1440 num_vfs = dev_num_vf(dev->dev.parent);
1441 if (nla_put_u32(skb, IFLA_NUM_VF, num_vfs))
// Per-VF details need the driver's ndo_get_vf_config hook.
1444 if (!dev->netdev_ops->ndo_get_vf_config)
1447 vfinfo = nla_nest_start_noflag(skb, IFLA_VFINFO_LIST);
1451 for (i = 0; i < num_vfs; i++) {
1452 if (rtnl_fill_vfinfo(skb, dev, i, ext_filter_mask)) {
// A failing VF entry discards the whole IFLA_VFINFO_LIST nest.
1453 nla_nest_cancel(skb, vfinfo);
1458 nla_nest_end(skb, vfinfo);
// rtnl_fill_link_ifmap - emit the IFLA_MAP attribute for @dev.
// Copies mem_start, mem_end, base_addr and if_port (plus any fields assigned
// on lines not visible in this listing) into a struct rtnl_link_ifmap and
// adds it to @skb with nla_put_64bit(), using IFLA_PAD as padding attribute.
1462 static int rtnl_fill_link_ifmap(struct sk_buff *skb, struct net_device *dev)
1464 struct rtnl_link_ifmap map;
// Zero the whole struct first so anything not assigned below is emitted as 0.
1466 memset(&map, 0, sizeof(map));
1467 map.mem_start = dev->mem_start;
1468 map.mem_end = dev->mem_end;
1469 map.base_addr = dev->base_addr;
1472 map.port = dev->if_port;
1474 if (nla_put_64bit(skb, IFLA_MAP, sizeof(map), &map, IFLA_PAD))
// rtnl_xdp_prog_skb - id of the XDP program stored in dev->xdp_prog.
// The pointer is read with rtnl_dereference(); when a program is present its
// aux->id is returned. The value returned for a NULL program is not visible
// in this listing (presumably 0 - confirm).
1480 static u32 rtnl_xdp_prog_skb(struct net_device *dev)
1482 const struct bpf_prog *generic_xdp_prog;
1486 generic_xdp_prog = rtnl_dereference(dev->xdp_prog);
1487 if (!generic_xdp_prog)
1489 return generic_xdp_prog->aux->id;
// rtnl_xdp_prog_drv - program id reported by dev_xdp_prog_id() for
// XDP_MODE_DRV. Shaped to match the get_prog_id callback of
// rtnl_xdp_report_one().
1492 static u32 rtnl_xdp_prog_drv(struct net_device *dev)
1494 return dev_xdp_prog_id(dev, XDP_MODE_DRV);
// rtnl_xdp_prog_hw - program id reported by dev_xdp_prog_id() for
// XDP_MODE_HW. Shaped to match the get_prog_id callback of
// rtnl_xdp_report_one().
1497 static u32 rtnl_xdp_prog_hw(struct net_device *dev)
1499 return dev_xdp_prog_id(dev, XDP_MODE_HW);
// rtnl_xdp_report_one - report the XDP program of one attachment mode.
// @skb: message being built
// @dev: device queried
// @prog_id: in/out program id shared across the calls made by the caller
// @mode: in/out XDP_ATTACHED_* summary shared across the calls
// @tgt_mode: XDP_ATTACHED_* value that corresponds to this call
// @attr: attribute type used to emit the program id
// @get_prog_id: callback returning the program id for this mode
//
// The id returned by @get_prog_id is written as a u32 attribute of type
// @attr. If an earlier call already recorded a mode, *mode becomes
// XDP_ATTACHED_MULTI.
// NOTE(review): the lines that handle a zero id, the nla_put error, and the
// updates of *prog_id / *mode from @tgt_mode are not visible in this listing.
1502 static int rtnl_xdp_report_one(struct sk_buff *skb, struct net_device *dev,
1503 u32 *prog_id, u8 *mode, u8 tgt_mode, u32 attr,
1504 u32 (*get_prog_id)(struct net_device *dev))
1509 curr_id = get_prog_id(dev);
1514 err = nla_put_u32(skb, attr, curr_id);
1518 if (*mode != XDP_ATTACHED_NONE)
1519 *mode = XDP_ATTACHED_MULTI;
// rtnl_xdp_fill - emit the IFLA_XDP nest for @dev.
// Inside the nest it reports the SKB, DRV and HW program ids in that order
// through rtnl_xdp_report_one(), then IFLA_XDP_ATTACHED with the resulting
// mode, and IFLA_XDP_PROG_ID when a program id was recorded and the mode is
// not XDP_ATTACHED_MULTI.
// NOTE(review): the error checks between the steps and the return statements
// are not visible in this listing.
1526 static int rtnl_xdp_fill(struct sk_buff *skb, struct net_device *dev)
1533 xdp = nla_nest_start_noflag(skb, IFLA_XDP);
1538 mode = XDP_ATTACHED_NONE;
1539 err = rtnl_xdp_report_one(skb, dev, &prog_id, &mode, XDP_ATTACHED_SKB,
1540 IFLA_XDP_SKB_PROG_ID, rtnl_xdp_prog_skb);
1543 err = rtnl_xdp_report_one(skb, dev, &prog_id, &mode, XDP_ATTACHED_DRV,
1544 IFLA_XDP_DRV_PROG_ID, rtnl_xdp_prog_drv);
1547 err = rtnl_xdp_report_one(skb, dev, &prog_id, &mode, XDP_ATTACHED_HW,
1548 IFLA_XDP_HW_PROG_ID, rtnl_xdp_prog_hw);
1552 err = nla_put_u8(skb, IFLA_XDP_ATTACHED, mode);
// The single-program attribute is only emitted when exactly one mode is in use.
1556 if (prog_id && mode != XDP_ATTACHED_MULTI) {
1557 err = nla_put_u32(skb, IFLA_XDP_PROG_ID, prog_id);
1562 nla_nest_end(skb, xdp);
// Presumably the error path: drop the partially built IFLA_XDP nest.
1566 nla_nest_cancel(skb, xdp);
// rtnl_get_event - translate a NETDEV_* notifier event into an IFLA_EVENT_*
// value. The result starts as IFLA_EVENT_NONE and is overwritten by the
// matching case.
// NOTE(review): the switch header, the case label for IFLA_EVENT_REBOOT and
// the break/default lines are not visible in this listing.
1570 static u32 rtnl_get_event(unsigned long event)
1572 u32 rtnl_event_type = IFLA_EVENT_NONE;
1576 rtnl_event_type = IFLA_EVENT_REBOOT;
1578 case NETDEV_FEAT_CHANGE:
1579 rtnl_event_type = IFLA_EVENT_FEATURES;
1581 case NETDEV_BONDING_FAILOVER:
1582 rtnl_event_type = IFLA_EVENT_BONDING_FAILOVER;
1584 case NETDEV_NOTIFY_PEERS:
1585 rtnl_event_type = IFLA_EVENT_NOTIFY_PEERS;
1587 case NETDEV_RESEND_IGMP:
1588 rtnl_event_type = IFLA_EVENT_IGMP_RESEND;
1590 case NETDEV_CHANGEINFODATA:
1591 rtnl_event_type = IFLA_EVENT_BONDING_OPTIONS;
1597 return rtnl_event_type;
// put_master_ifindex - emit IFLA_MASTER with the ifindex of @dev's master.
// The master is looked up with netdev_master_upper_dev_get_rcu().
// NOTE(review): the RCU locking and the NULL check on upper_dev are
// presumably on lines not visible in this listing - confirm.
1600 static int put_master_ifindex(struct sk_buff *skb, struct net_device *dev)
1602 const struct net_device *upper_dev;
1607 upper_dev = netdev_master_upper_dev_get_rcu(dev);
1609 ret = nla_put_u32(skb, IFLA_MASTER, upper_dev->ifindex);
// nla_put_iflink - emit IFLA_LINK with the value of dev_get_iflink(@dev).
// The attribute is written when `force` is set or when the link ifindex
// differs from the device's own ifindex. The return value of the other case
// is not visible in this listing (the `force` parameter declaration is on a
// dropped line as well).
1615 static int nla_put_iflink(struct sk_buff *skb, const struct net_device *dev,
1618 int ifindex = dev_get_iflink(dev);
1620 if (force || dev->ifindex != ifindex)
1621 return nla_put_u32(skb, IFLA_LINK, ifindex);
// nla_put_ifalias - emit IFLA_IFALIAS when @dev has an alias.
// dev_get_alias() copies the alias into a local buffer; a positive result
// means there is something to emit as a string attribute. Any other result
// makes the function return 0 without writing an attribute.
1626 static noinline_for_stack int nla_put_ifalias(struct sk_buff *skb,
1627 struct net_device *dev)
1632 ret = dev_get_alias(dev, buf, sizeof(buf));
1633 return ret > 0 ? nla_put_string(skb, IFLA_IFALIAS, buf) : 0;
// rtnl_fill_link_netnsid - emit IFLA_LINK_NETNSID (when needed) and IFLA_LINK.
// @skb: message being built
// @dev: device described
// @src_net: namespace in which the peer namespace id is allocated
// @gfp: allocation flags passed to peernet2id_alloc()
//
// When the link ops provide get_link_net() and the link namespace differs
// from the device's namespace, the id of that namespace relative to @src_net
// is emitted. The function finishes through nla_put_iflink().
// NOTE(review): the place where put_iflink is set to true and the error
// return after the failed nla_put_s32() are not visible in this listing.
1636 static int rtnl_fill_link_netnsid(struct sk_buff *skb,
1637 const struct net_device *dev,
1638 struct net *src_net, gfp_t gfp)
1640 bool put_iflink = false;
1642 if (dev->rtnl_link_ops && dev->rtnl_link_ops->get_link_net) {
1643 struct net *link_net = dev->rtnl_link_ops->get_link_net(dev);
1645 if (!net_eq(dev_net(dev), link_net)) {
1646 int id = peernet2id_alloc(src_net, link_net, gfp);
1648 if (nla_put_s32(skb, IFLA_LINK_NETNSID, id))
1655 return nla_put_iflink(skb, dev, put_iflink);
// rtnl_fill_link_af - emit the IFLA_AF_SPEC nest for @dev.
// Walks the registered rtnl_af_ops list (RCU list iterator) and, for every
// entry that implements fill_link_af, opens a nest typed by af_ops->family
// and lets the callback fill it.
// NOTE(review): the NULL checks on the nests, the statement following the
// missing-callback check (presumably `continue`), the handling of other
// errors and the return statements are not visible in this listing.
1658 static int rtnl_fill_link_af(struct sk_buff *skb,
1659 const struct net_device *dev,
1660 u32 ext_filter_mask)
1662 const struct rtnl_af_ops *af_ops;
1663 struct nlattr *af_spec;
1665 af_spec = nla_nest_start_noflag(skb, IFLA_AF_SPEC);
1669 list_for_each_entry_rcu(af_ops, &rtnl_af_ops, list) {
1673 if (!af_ops->fill_link_af)
1676 af = nla_nest_start_noflag(skb, af_ops->family);
1680 err = af_ops->fill_link_af(skb, dev, ext_filter_mask);
1682 * Caller may return ENODATA to indicate that there
1683 * was no data to be dumped. This is not an error, it
1684 * means we should trim the attribute header and
// -ENODATA: remove the empty per-family nest instead of failing the dump.
1687 if (err == -ENODATA)
1688 nla_nest_cancel(skb, af);
1692 nla_nest_end(skb, af);
1695 nla_nest_end(skb, af_spec);
// rtnl_fill_alt_ifnames - emit one IFLA_ALT_IFNAME string per entry on
// dev->name_node->list.
// NOTE(review): the return values (failure of nla_put_string and the normal
// end of the loop) are not visible in this listing.
1699 static int rtnl_fill_alt_ifnames(struct sk_buff *skb,
1700 const struct net_device *dev)
1702 struct netdev_name_node *name_node;
1705 list_for_each_entry(name_node, &dev->name_node->list, list) {
1706 if (nla_put_string(skb, IFLA_ALT_IFNAME, name_node->name))
// rtnl_fill_prop_list - emit the IFLA_PROP_LIST nest for @dev.
// The nest is opened with nla_nest_start() and filled by
// rtnl_fill_alt_ifnames(); it is then either closed or cancelled.
// NOTE(review): the conditions selecting nla_nest_end() versus
// nla_nest_cancel() and the return statements are not visible here.
1713 static int rtnl_fill_prop_list(struct sk_buff *skb,
1714 const struct net_device *dev)
1716 struct nlattr *prop_list;
1719 prop_list = nla_nest_start(skb, IFLA_PROP_LIST);
1723 ret = rtnl_fill_alt_ifnames(skb, dev);
1727 nla_nest_end(skb, prop_list);
1731 nla_nest_cancel(skb, prop_list);
// rtnl_fill_proto_down - emit IFLA_PROTO_DOWN and its reason nest.
// Writes dev->proto_down as a u8, then an IFLA_PROTO_DOWN_REASON nest that
// carries dev->proto_down_reason as IFLA_PROTO_DOWN_REASON_VALUE.
// NOTE(review): the check that decides whether the reason nest is emitted
// at all (between reading preason and opening the nest) and the return
// statements are not visible in this listing.
1735 static int rtnl_fill_proto_down(struct sk_buff *skb,
1736 const struct net_device *dev)
1741 if (nla_put_u8(skb, IFLA_PROTO_DOWN, dev->proto_down))
1742 goto nla_put_failure;
1744 preason = dev->proto_down_reason;
1748 pr = nla_nest_start(skb, IFLA_PROTO_DOWN_REASON);
1752 if (nla_put_u32(skb, IFLA_PROTO_DOWN_REASON_VALUE, preason)) {
// Undo the partially written nest before taking the failure path.
1753 nla_nest_cancel(skb, pr);
1754 goto nla_put_failure;
1757 nla_nest_end(skb, pr);
// rtnl_fill_devlink_port - emit the IFLA_DEVLINK_PORT nest for @dev.
// The nest is always opened; it is filled through
// devlink_nl_port_handle_fill() only when dev->devlink_port is set.
// NOTE(review): return values and the branch leading to nla_nest_cancel()
// are not visible in this listing.
1764 static int rtnl_fill_devlink_port(struct sk_buff *skb,
1765 const struct net_device *dev)
1767 struct nlattr *devlink_port_nest;
1770 devlink_port_nest = nla_nest_start(skb, IFLA_DEVLINK_PORT);
1771 if (!devlink_port_nest)
1774 if (dev->devlink_port) {
1775 ret = devlink_nl_port_handle_fill(skb, dev->devlink_port);
1780 nla_nest_end(skb, devlink_port_nest);
1784 nla_nest_cancel(skb, devlink_port_nest);
// rtnl_fill_dpll_pin - emit the IFLA_DPLL_PIN nest for @dev.
// The nest content comes from dpll_msg_add_pin_handle(), called with the
// pin returned by netdev_dpll_pin(@dev).
// NOTE(review): return values and the branch leading to nla_nest_cancel()
// are not visible in this listing.
1788 static int rtnl_fill_dpll_pin(struct sk_buff *skb,
1789 const struct net_device *dev)
1791 struct nlattr *dpll_pin_nest;
1794 dpll_pin_nest = nla_nest_start(skb, IFLA_DPLL_PIN);
1798 ret = dpll_msg_add_pin_handle(skb, netdev_dpll_pin(dev));
1802 nla_nest_end(skb, dpll_pin_nest);
1806 nla_nest_cancel(skb, dpll_pin_nest);
// rtnl_fill_ifinfo - build one complete link message for @dev in @skb.
// @skb: buffer receiving the message
// @dev: device described
// @src_net: namespace passed on to rtnl_fill_link_netnsid()
// @type, @pid, @seq, @flags: netlink header values handed to nlmsg_put()
// @change: stored in ifinfomsg.ifi_change
// @ext_filter_mask: RTEXT_FILTER_* bits forwarded to the VF, port and
//                   AF-spec helpers
// @event: IFLA_EVENT_* value; emitted unless it is IFLA_EVENT_NONE
// @new_nsid, @new_ifindex: optional values emitted as IFLA_NEW_NETNSID and
//                   IFLA_NEW_IFINDEX (their guarding conditions are on lines
//                   not visible in this listing)
// @tgt_netnsid: emitted as IFLA_TARGET_NETNSID when >= 0
// @gfp: allocation flags forwarded to rtnl_fill_link_netnsid()
//
// Every failing step jumps to a failure label, where the half-built message
// is removed with nlmsg_cancel(); success ends with nlmsg_end().
// NOTE(review): return statements, the NULL check after nlmsg_put() and a
// few condition lines are not visible in this listing.
1810 static int rtnl_fill_ifinfo(struct sk_buff *skb,
1811 struct net_device *dev, struct net *src_net,
1812 int type, u32 pid, u32 seq, u32 change,
1813 unsigned int flags, u32 ext_filter_mask,
1814 u32 event, int *new_nsid, int new_ifindex,
1815 int tgt_netnsid, gfp_t gfp)
1817 struct ifinfomsg *ifm;
1818 struct nlmsghdr *nlh;
1819 struct Qdisc *qdisc;
1822 nlh = nlmsg_put(skb, pid, seq, type, sizeof(*ifm), flags);
// Fixed-size ifinfomsg header.
1826 ifm = nlmsg_data(nlh);
1827 ifm->ifi_family = AF_UNSPEC;
1829 ifm->ifi_type = dev->type;
1830 ifm->ifi_index = dev->ifindex;
1831 ifm->ifi_flags = dev_get_flags(dev);
1832 ifm->ifi_change = change;
1834 if (tgt_netnsid >= 0 && nla_put_s32(skb, IFLA_TARGET_NETNSID, tgt_netnsid))
1835 goto nla_put_failure;
// Scalar attributes; the first failing put aborts the whole message.
1837 qdisc = rtnl_dereference(dev->qdisc);
1838 if (nla_put_string(skb, IFLA_IFNAME, dev->name) ||
1839 nla_put_u32(skb, IFLA_TXQLEN, dev->tx_queue_len) ||
1840 nla_put_u8(skb, IFLA_OPERSTATE,
// A device that is not running is always reported as IF_OPER_DOWN.
1841 netif_running(dev) ? dev->operstate : IF_OPER_DOWN) ||
1842 nla_put_u8(skb, IFLA_LINKMODE, dev->link_mode) ||
1843 nla_put_u32(skb, IFLA_MTU, dev->mtu) ||
1844 nla_put_u32(skb, IFLA_MIN_MTU, dev->min_mtu) ||
1845 nla_put_u32(skb, IFLA_MAX_MTU, dev->max_mtu) ||
1846 nla_put_u32(skb, IFLA_GROUP, dev->group) ||
1847 nla_put_u32(skb, IFLA_PROMISCUITY, dev->promiscuity) ||
1848 nla_put_u32(skb, IFLA_ALLMULTI, dev->allmulti) ||
1849 nla_put_u32(skb, IFLA_NUM_TX_QUEUES, dev->num_tx_queues) ||
1850 nla_put_u32(skb, IFLA_GSO_MAX_SEGS, dev->gso_max_segs) ||
1851 nla_put_u32(skb, IFLA_GSO_MAX_SIZE, dev->gso_max_size) ||
1852 nla_put_u32(skb, IFLA_GRO_MAX_SIZE, dev->gro_max_size) ||
1853 nla_put_u32(skb, IFLA_GSO_IPV4_MAX_SIZE, dev->gso_ipv4_max_size) ||
1854 nla_put_u32(skb, IFLA_GRO_IPV4_MAX_SIZE, dev->gro_ipv4_max_size) ||
1855 nla_put_u32(skb, IFLA_TSO_MAX_SIZE, dev->tso_max_size) ||
1856 nla_put_u32(skb, IFLA_TSO_MAX_SEGS, dev->tso_max_segs) ||
1858 nla_put_u32(skb, IFLA_NUM_RX_QUEUES, dev->num_rx_queues) ||
1860 put_master_ifindex(skb, dev) ||
1861 nla_put_u8(skb, IFLA_CARRIER, netif_carrier_ok(dev)) ||
1863 nla_put_string(skb, IFLA_QDISC, qdisc->ops->id)) ||
1864 nla_put_ifalias(skb, dev) ||
// IFLA_CARRIER_CHANGES is the sum of the up and down counters.
1865 nla_put_u32(skb, IFLA_CARRIER_CHANGES,
1866 atomic_read(&dev->carrier_up_count) +
1867 atomic_read(&dev->carrier_down_count)) ||
1868 nla_put_u32(skb, IFLA_CARRIER_UP_COUNT,
1869 atomic_read(&dev->carrier_up_count)) ||
1870 nla_put_u32(skb, IFLA_CARRIER_DOWN_COUNT,
1871 atomic_read(&dev->carrier_down_count)))
1872 goto nla_put_failure;
1874 if (rtnl_fill_proto_down(skb, dev))
1875 goto nla_put_failure;
1877 if (event != IFLA_EVENT_NONE) {
1878 if (nla_put_u32(skb, IFLA_EVENT, event))
1879 goto nla_put_failure;
1882 if (rtnl_fill_link_ifmap(skb, dev))
1883 goto nla_put_failure;
// Hardware and broadcast addresses are only emitted for devices that have
// an address length.
1885 if (dev->addr_len) {
1886 if (nla_put(skb, IFLA_ADDRESS, dev->addr_len, dev->dev_addr) ||
1887 nla_put(skb, IFLA_BROADCAST, dev->addr_len, dev->broadcast))
1888 goto nla_put_failure;
1891 if (rtnl_phys_port_id_fill(skb, dev))
1892 goto nla_put_failure;
1894 if (rtnl_phys_port_name_fill(skb, dev))
1895 goto nla_put_failure;
1897 if (rtnl_phys_switch_id_fill(skb, dev))
1898 goto nla_put_failure;
1900 if (rtnl_fill_stats(skb, dev))
1901 goto nla_put_failure;
1903 if (rtnl_fill_vf(skb, dev, ext_filter_mask))
1904 goto nla_put_failure;
1906 if (rtnl_port_fill(skb, dev, ext_filter_mask))
1907 goto nla_put_failure;
1909 if (rtnl_xdp_fill(skb, dev))
1910 goto nla_put_failure;
1912 if (dev->rtnl_link_ops || rtnl_have_link_slave_info(dev)) {
1913 if (rtnl_link_fill(skb, dev) < 0)
1914 goto nla_put_failure;
1917 if (rtnl_fill_link_netnsid(skb, dev, src_net, gfp))
1918 goto nla_put_failure;
1921 nla_put_s32(skb, IFLA_NEW_NETNSID, *new_nsid) < 0)
1922 goto nla_put_failure;
1924 nla_put_s32(skb, IFLA_NEW_IFINDEX, new_ifindex) < 0)
1925 goto nla_put_failure;
// memchr_inv() returns non-NULL when some byte differs from 0, so an
// all-zero permanent address is not reported.
1927 if (memchr_inv(dev->perm_addr, '\0', dev->addr_len) &&
1928 nla_put(skb, IFLA_PERM_ADDRESS, dev->addr_len, dev->perm_addr))
1929 goto nla_put_failure;
// This step uses its own failure label; presumably it runs under an RCU
// read lock taken on a line not visible here - confirm.
1932 if (rtnl_fill_link_af(skb, dev, ext_filter_mask))
1933 goto nla_put_failure_rcu;
1936 if (rtnl_fill_prop_list(skb, dev))
1937 goto nla_put_failure;
1939 if (dev->dev.parent &&
1940 nla_put_string(skb, IFLA_PARENT_DEV_NAME,
1941 dev_name(dev->dev.parent)))
1942 goto nla_put_failure;
1944 if (dev->dev.parent && dev->dev.parent->bus &&
1945 nla_put_string(skb, IFLA_PARENT_DEV_BUS_NAME,
1946 dev->dev.parent->bus->name))
1947 goto nla_put_failure;
1949 if (rtnl_fill_devlink_port(skb, dev))
1950 goto nla_put_failure;
1952 if (rtnl_fill_dpll_pin(skb, dev))
1953 goto nla_put_failure;
1955 nlmsg_end(skb, nlh);
1958 nla_put_failure_rcu:
// Failure path: remove everything written since nlmsg_put().
1961 nlmsg_cancel(skb, nlh);
// ifla_policy - validation policy for the top-level IFLA_* link attributes,
// indexed by attribute type (IFLA_MAX + 1 slots).
// Entries typed NLA_REJECT (IFLA_PERM_ADDRESS, IFLA_TSO_MAX_SIZE,
// IFLA_TSO_MAX_SEGS, IFLA_ALLMULTI) are refused on input; the fill code in
// this file still emits them, i.e. they are output-only.
// Used by the link request parsers in this file (e.g. the dump request
// validation and rtnl_nla_parse_ifinfomsg()).
1965 static const struct nla_policy ifla_policy[IFLA_MAX+1] = {
1966 [IFLA_IFNAME] = { .type = NLA_STRING, .len = IFNAMSIZ-1 },
1967 [IFLA_ADDRESS] = { .type = NLA_BINARY, .len = MAX_ADDR_LEN },
1968 [IFLA_BROADCAST] = { .type = NLA_BINARY, .len = MAX_ADDR_LEN },
1969 [IFLA_MAP] = { .len = sizeof(struct rtnl_link_ifmap) },
1970 [IFLA_MTU] = { .type = NLA_U32 },
1971 [IFLA_LINK] = { .type = NLA_U32 },
1972 [IFLA_MASTER] = { .type = NLA_U32 },
1973 [IFLA_CARRIER] = { .type = NLA_U8 },
1974 [IFLA_TXQLEN] = { .type = NLA_U32 },
1975 [IFLA_WEIGHT] = { .type = NLA_U32 },
1976 [IFLA_OPERSTATE] = { .type = NLA_U8 },
1977 [IFLA_LINKMODE] = { .type = NLA_U8 },
1978 [IFLA_LINKINFO] = { .type = NLA_NESTED },
1979 [IFLA_NET_NS_PID] = { .type = NLA_U32 },
1980 [IFLA_NET_NS_FD] = { .type = NLA_U32 },
1981 /* IFLA_IFALIAS is a string, but policy is set to NLA_BINARY to
1982 * allow 0-length string (needed to remove an alias).
1984 [IFLA_IFALIAS] = { .type = NLA_BINARY, .len = IFALIASZ - 1 },
1985 [IFLA_VFINFO_LIST] = {. type = NLA_NESTED },
1986 [IFLA_VF_PORTS] = { .type = NLA_NESTED },
1987 [IFLA_PORT_SELF] = { .type = NLA_NESTED },
1988 [IFLA_AF_SPEC] = { .type = NLA_NESTED },
1989 [IFLA_EXT_MASK] = { .type = NLA_U32 },
1990 [IFLA_PROMISCUITY] = { .type = NLA_U32 },
1991 [IFLA_NUM_TX_QUEUES] = { .type = NLA_U32 },
1992 [IFLA_NUM_RX_QUEUES] = { .type = NLA_U32 },
1993 [IFLA_GSO_MAX_SEGS] = { .type = NLA_U32 },
1994 [IFLA_GSO_MAX_SIZE] = { .type = NLA_U32 },
1995 [IFLA_PHYS_PORT_ID] = { .type = NLA_BINARY, .len = MAX_PHYS_ITEM_ID_LEN },
1996 [IFLA_CARRIER_CHANGES] = { .type = NLA_U32 }, /* ignored */
1997 [IFLA_PHYS_SWITCH_ID] = { .type = NLA_BINARY, .len = MAX_PHYS_ITEM_ID_LEN },
1998 [IFLA_LINK_NETNSID] = { .type = NLA_S32 },
1999 [IFLA_PROTO_DOWN] = { .type = NLA_U8 },
2000 [IFLA_XDP] = { .type = NLA_NESTED },
2001 [IFLA_EVENT] = { .type = NLA_U32 },
2002 [IFLA_GROUP] = { .type = NLA_U32 },
2003 [IFLA_TARGET_NETNSID] = { .type = NLA_S32 },
2004 [IFLA_CARRIER_UP_COUNT] = { .type = NLA_U32 },
2005 [IFLA_CARRIER_DOWN_COUNT] = { .type = NLA_U32 },
2006 [IFLA_MIN_MTU] = { .type = NLA_U32 },
2007 [IFLA_MAX_MTU] = { .type = NLA_U32 },
2008 [IFLA_PROP_LIST] = { .type = NLA_NESTED },
2009 [IFLA_ALT_IFNAME] = { .type = NLA_STRING,
2010 .len = ALTIFNAMSIZ - 1 },
2011 [IFLA_PERM_ADDRESS] = { .type = NLA_REJECT },
2012 [IFLA_PROTO_DOWN_REASON] = { .type = NLA_NESTED },
// A requested new ifindex must be at least 1.
2013 [IFLA_NEW_IFINDEX] = NLA_POLICY_MIN(NLA_S32, 1),
2014 [IFLA_PARENT_DEV_NAME] = { .type = NLA_NUL_STRING },
2015 [IFLA_GRO_MAX_SIZE] = { .type = NLA_U32 },
2016 [IFLA_TSO_MAX_SIZE] = { .type = NLA_REJECT },
2017 [IFLA_TSO_MAX_SEGS] = { .type = NLA_REJECT },
2018 [IFLA_ALLMULTI] = { .type = NLA_REJECT },
2019 [IFLA_GSO_IPV4_MAX_SIZE] = { .type = NLA_U32 },
2020 [IFLA_GRO_IPV4_MAX_SIZE] = { .type = NLA_U32 },
// ifla_info_policy - policy for the attributes nested inside IFLA_LINKINFO:
// the kind names are strings, the data containers are nested attributes.
// Used by linkinfo_to_kind_ops() in this file.
2023 static const struct nla_policy ifla_info_policy[IFLA_INFO_MAX+1] = {
2024 [IFLA_INFO_KIND] = { .type = NLA_STRING },
2025 [IFLA_INFO_DATA] = { .type = NLA_NESTED },
2026 [IFLA_INFO_SLAVE_KIND] = { .type = NLA_STRING },
2027 [IFLA_INFO_SLAVE_DATA] = { .type = NLA_NESTED },
// ifla_vf_policy - policy for the per-VF attributes (IFLA_VF_*).
// Most entries only set .len to the size of the matching uapi struct;
// IFLA_VF_BROADCAST is NLA_REJECT (not accepted on input) and the VLAN list
// and stats are nested containers.
2030 static const struct nla_policy ifla_vf_policy[IFLA_VF_MAX+1] = {
2031 [IFLA_VF_MAC] = { .len = sizeof(struct ifla_vf_mac) },
2032 [IFLA_VF_BROADCAST] = { .type = NLA_REJECT },
2033 [IFLA_VF_VLAN] = { .len = sizeof(struct ifla_vf_vlan) },
2034 [IFLA_VF_VLAN_LIST] = { .type = NLA_NESTED },
2035 [IFLA_VF_TX_RATE] = { .len = sizeof(struct ifla_vf_tx_rate) },
2036 [IFLA_VF_SPOOFCHK] = { .len = sizeof(struct ifla_vf_spoofchk) },
2037 [IFLA_VF_RATE] = { .len = sizeof(struct ifla_vf_rate) },
2038 [IFLA_VF_LINK_STATE] = { .len = sizeof(struct ifla_vf_link_state) },
2039 [IFLA_VF_RSS_QUERY_EN] = { .len = sizeof(struct ifla_vf_rss_query_en) },
2040 [IFLA_VF_STATS] = { .type = NLA_NESTED },
2041 [IFLA_VF_TRUST] = { .len = sizeof(struct ifla_vf_trust) },
2042 [IFLA_VF_IB_NODE_GUID] = { .len = sizeof(struct ifla_vf_guid) },
2043 [IFLA_VF_IB_PORT_GUID] = { .len = sizeof(struct ifla_vf_guid) },
// ifla_port_policy - policy for the IFLA_PORT_* attributes: VF index,
// profile name, instance/host UUIDs, request and response codes, and the
// legacy IFLA_PORT_VSI_TYPE entry described by the comment below.
2046 static const struct nla_policy ifla_port_policy[IFLA_PORT_MAX+1] = {
2047 [IFLA_PORT_VF] = { .type = NLA_U32 },
2048 [IFLA_PORT_PROFILE] = { .type = NLA_STRING,
2049 .len = PORT_PROFILE_MAX },
2050 [IFLA_PORT_INSTANCE_UUID] = { .type = NLA_BINARY,
2051 .len = PORT_UUID_MAX },
2052 [IFLA_PORT_HOST_UUID] = { .type = NLA_STRING,
2053 .len = PORT_UUID_MAX },
2054 [IFLA_PORT_REQUEST] = { .type = NLA_U8, },
2055 [IFLA_PORT_RESPONSE] = { .type = NLA_U16, },
2057 /* Unused, but we need to keep it here since user space could
2058 * fill it. It's also broken with regard to NLA_BINARY use in
2059 * combination with structs.
2061 [IFLA_PORT_VSI_TYPE] = { .type = NLA_BINARY,
2062 .len = sizeof(struct ifla_port_vsi) },
// ifla_xdp_policy - policy for the attributes nested inside IFLA_XDP.
// The IFLA_XDP_UNSPEC slot only carries .strict_start_type, set to
// IFLA_XDP_EXPECTED_FD.
2065 static const struct nla_policy ifla_xdp_policy[IFLA_XDP_MAX + 1] = {
2066 [IFLA_XDP_UNSPEC] = { .strict_start_type = IFLA_XDP_EXPECTED_FD },
2067 [IFLA_XDP_FD] = { .type = NLA_S32 },
2068 [IFLA_XDP_EXPECTED_FD] = { .type = NLA_S32 },
2069 [IFLA_XDP_ATTACHED] = { .type = NLA_U8 },
2070 [IFLA_XDP_FLAGS] = { .type = NLA_U32 },
2071 [IFLA_XDP_PROG_ID] = { .type = NLA_U32 },
// linkinfo_to_kind_ops - resolve an IFLA_LINKINFO attribute to link ops.
// @nla: the nested IFLA_LINKINFO attribute
//
// Parses the nest against ifla_info_policy; when IFLA_INFO_KIND is present
// its string is copied into a MODULE_NAME_LEN buffer and looked up with
// rtnl_link_ops_get(). `ops` starts as NULL, so that is presumably the
// result when no kind is given (return statements are not visible here).
2074 static const struct rtnl_link_ops *linkinfo_to_kind_ops(const struct nlattr *nla)
2076 const struct rtnl_link_ops *ops = NULL;
2077 struct nlattr *linfo[IFLA_INFO_MAX + 1];
2079 if (nla_parse_nested_deprecated(linfo, IFLA_INFO_MAX, nla, ifla_info_policy, NULL) < 0)
2082 if (linfo[IFLA_INFO_KIND]) {
2083 char kind[MODULE_NAME_LEN];
2085 nla_strscpy(kind, linfo[IFLA_INFO_KIND], sizeof(kind));
2086 ops = rtnl_link_ops_get(kind);
// link_master_filtered - master-index filter predicate for link dumps.
// @dev: candidate device
// @master_idx: requested master ifindex; -1 is the sentinel for "no master"
//              (see the comment below), 0 means no filter was requested
//
// Compares @master_idx with the ifindex of @dev's master as returned by
// netdev_master_upper_dev_get().
// NOTE(review): the return statements of each branch are not visible in
// this listing.
2092 static bool link_master_filtered(struct net_device *dev, int master_idx)
2094 struct net_device *master;
2099 master = netdev_master_upper_dev_get(dev);
2101 /* 0 is already used to denote IFLA_MASTER wasn't passed, therefore need
2102 * another invalid value for ifindex to denote "no master".
2104 if (master_idx == -1)
2107 if (!master || master->ifindex != master_idx)
// link_kind_filtered - link-kind filter predicate for link dumps.
// The visible test matches when a kind filter is set and @dev's
// rtnl_link_ops differ from it; the returned values are on lines not
// visible in this listing.
2113 static bool link_kind_filtered(const struct net_device *dev,
2114 const struct rtnl_link_ops *kind_ops)
2116 if (kind_ops && dev->rtnl_link_ops != kind_ops)
// link_dump_filtered - combined dump filter: the visible test matches when
// either link_master_filtered() or link_kind_filtered() matches for @dev.
// The returned values are on lines not visible in this listing.
2122 static bool link_dump_filtered(struct net_device *dev,
2124 const struct rtnl_link_ops *kind_ops)
2126 if (link_master_filtered(dev, master_idx) ||
2127 link_kind_filtered(dev, kind_ops))
2134 * rtnl_get_net_ns_capable - Get netns if sufficiently privileged.
2135 * @sk: netlink socket
2136 * @netnsid: network namespace identifier
2138 * Returns the network namespace identified by netnsid on success or an error
2139 * pointer on failure.
// Error pointers visible below: -EINVAL on the lookup-failure path and
// -EACCES when the socket lacks CAP_NET_ADMIN in the target's user namespace.
2141 struct net *rtnl_get_net_ns_capable(struct sock *sk, int netnsid)
// The id is resolved relative to the socket's own namespace.
2145 net = get_net_ns_by_id(sock_net(sk), netnsid);
2147 return ERR_PTR(-EINVAL);
2149 /* For now, the caller is required to have CAP_NET_ADMIN in
2150 * the user namespace owning the target net ns.
2152 if (!sk_ns_capable(sk, net->user_ns, CAP_NET_ADMIN)) {
// NOTE(review): a line is missing here in this listing; presumably it drops
// the reference obtained by the lookup before returning - confirm.
2154 return ERR_PTR(-EACCES);
2158 EXPORT_SYMBOL_GPL(rtnl_get_net_ns_capable);
// rtnl_valid_dump_ifinfo_req - validate and parse a link dump request.
// @nlh: request header
// @strict_check: selects strict validation (the branch line itself is not
//                visible in this listing)
// @tb: output attribute table, IFLA_MAX + 1 entries
// @extack: extended ack used for error messages
//
// Two parsing paths are visible. The first requires a full ifinfomsg header,
// rejects non-zero header fields and a non-zero ifi_index, and parses with
// nlmsg_parse_deprecated_strict(). The second is the legacy path described
// by the "hack" comment below and parses with nlmsg_parse_deprecated().
2160 static int rtnl_valid_dump_ifinfo_req(const struct nlmsghdr *nlh,
2161 bool strict_check, struct nlattr **tb,
2162 struct netlink_ext_ack *extack)
2167 struct ifinfomsg *ifm;
2169 if (nlh->nlmsg_len < nlmsg_msg_size(sizeof(*ifm))) {
2170 NL_SET_ERR_MSG(extack, "Invalid header for link dump");
2174 ifm = nlmsg_data(nlh);
2175 if (ifm->__ifi_pad || ifm->ifi_type || ifm->ifi_flags ||
2177 NL_SET_ERR_MSG(extack, "Invalid values in header for link dump request");
2180 if (ifm->ifi_index) {
2181 NL_SET_ERR_MSG(extack, "Filter by device index not supported for link dumps");
2185 return nlmsg_parse_deprecated_strict(nlh, sizeof(*ifm), tb,
2186 IFLA_MAX, ifla_policy,
2190 /* A hack to preserve kernel<->userspace interface.
2191 * The correct header is ifinfomsg. It is consistent with rtnl_getlink.
2192 * However, before Linux v3.9 the code here assumed rtgenmsg and that's
2193 * what iproute2 < v3.9.0 used.
2194 * We can detect the old iproute2. Even including the IFLA_EXT_MASK
2195 * attribute, its netlink message is shorter than struct ifinfomsg.
// Payload shorter than ifinfomsg: treat the header as the old rtgenmsg.
2197 hdrlen = nlmsg_len(nlh) < sizeof(struct ifinfomsg) ?
2198 sizeof(struct rtgenmsg) : sizeof(struct ifinfomsg);
2200 return nlmsg_parse_deprecated(nlh, hdrlen, tb, IFLA_MAX, ifla_policy,
// rtnl_dump_ifinfo - netlink dump callback that emits one message per device.
// @skb: buffer receiving the dump messages
// @cb: dump state; cb->args[] holds the resume position, cb->nlh the request
//
// Parses the request, applies the optional target-netns, ext-mask, master
// and kind filters, then walks the target namespace's dev_index_head hash
// buckets and fills one link message per device that passes
// link_dump_filtered().
// NOTE(review): many short lines (case labels, continue/goto statements,
// resume bookkeeping, reference drops, return) are not visible in this
// listing; the comments below cover the visible statements only.
2204 static int rtnl_dump_ifinfo(struct sk_buff *skb, struct netlink_callback *cb)
2206 struct netlink_ext_ack *extack = cb->extack;
2207 const struct nlmsghdr *nlh = cb->nlh;
2208 struct net *net = sock_net(skb->sk);
2209 struct net *tgt_net = net;
2212 struct net_device *dev;
2213 struct hlist_head *head;
2214 struct nlattr *tb[IFLA_MAX+1];
2215 u32 ext_filter_mask = 0;
2216 const struct rtnl_link_ops *kind_ops = NULL;
2217 unsigned int flags = NLM_F_MULTI;
2223 s_idx = cb->args[1];
2225 err = rtnl_valid_dump_ifinfo_req(nlh, cb->strict_check, tb, extack);
2227 if (cb->strict_check)
2233 for (i = 0; i <= IFLA_MAX; ++i) {
2237 /* new attributes should only be added with strict checking */
2239 case IFLA_TARGET_NETNSID:
2240 netnsid = nla_get_s32(tb[i]);
// Switching to another namespace requires the capability check done by
// rtnl_get_net_ns_capable().
2241 tgt_net = rtnl_get_net_ns_capable(skb->sk, netnsid);
2242 if (IS_ERR(tgt_net)) {
2243 NL_SET_ERR_MSG(extack, "Invalid target network namespace id");
2244 return PTR_ERR(tgt_net);
2248 ext_filter_mask = nla_get_u32(tb[i]);
2251 master_idx = nla_get_u32(tb[i]);
2254 kind_ops = linkinfo_to_kind_ops(tb[i]);
2257 if (cb->strict_check) {
2258 NL_SET_ERR_MSG(extack, "Unsupported attribute in link dump request");
// Tell user space that the result set was filtered.
2264 if (master_idx || kind_ops)
2265 flags |= NLM_F_DUMP_FILTERED;
// s_idx only applies to the first bucket visited; it is reset to 0 for the
// following buckets.
2268 for (h = s_h; h < NETDEV_HASHENTRIES; h++, s_idx = 0) {
2270 head = &tgt_net->dev_index_head[h];
2271 hlist_for_each_entry(dev, head, index_hlist) {
2272 if (link_dump_filtered(dev, master_idx, kind_ops))
2276 err = rtnl_fill_ifinfo(skb, dev, net,
2278 NETLINK_CB(cb->skb).portid,
2279 nlh->nlmsg_seq, 0, flags,
2280 ext_filter_mask, 0, NULL, 0,
2281 netnsid, GFP_KERNEL);
2284 if (likely(skb->len))
// Record the device-list sequence so the consistency check can compare it
// across dump passes.
2298 cb->seq = tgt_net->dev_base_seq;
2299 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
// rtnl_nla_parse_ifinfomsg - parse an attribute whose payload is a struct
// ifinfomsg followed by IFLA_* attributes.
// @tb: output table, IFLA_MAX + 1 entries
// @nla_peer: attribute carrying the embedded ifinfomsg and attributes
// @exterr: extended ack used for error messages
//
// Rejects a negative ifi_index, then parses the trailing attributes against
// ifla_policy.
// NOTE(review): no check that the payload is at least sizeof(struct
// ifinfomsg) is visible here; callers presumably guarantee it - confirm.
2306 int rtnl_nla_parse_ifinfomsg(struct nlattr **tb, const struct nlattr *nla_peer,
2307 struct netlink_ext_ack *exterr)
2309 const struct ifinfomsg *ifmp;
2310 const struct nlattr *attrs;
2313 ifmp = nla_data(nla_peer);
// The attributes start right after the embedded header.
2314 attrs = nla_data(nla_peer) + sizeof(struct ifinfomsg);
2315 len = nla_len(nla_peer) - sizeof(struct ifinfomsg);
2317 if (ifmp->ifi_index < 0) {
2318 NL_SET_ERR_MSG_ATTR(exterr, nla_peer,
2319 "ifindex can't be negative");
2323 return nla_parse_deprecated(tb, IFLA_MAX, attrs, len, ifla_policy,
2326 EXPORT_SYMBOL(rtnl_nla_parse_ifinfomsg);
// rtnl_link_get_net - pick the namespace a link request refers to.
// @src_net: namespace used when no namespace attribute is present
// @tb: parsed IFLA_* attributes
//
// IFLA_NET_NS_PID takes precedence over IFLA_NET_NS_FD; without either, a
// reference on @src_net is taken with get_net(). The return statement is
// not visible in this listing.
2328 struct net *rtnl_link_get_net(struct net *src_net, struct nlattr *tb[])
2331 /* Examine the link attributes and figure out which
2332 * network namespace we are talking about.
2334 if (tb[IFLA_NET_NS_PID])
2335 net = get_net_ns_by_pid(nla_get_u32(tb[IFLA_NET_NS_PID]));
2336 else if (tb[IFLA_NET_NS_FD])
2337 net = get_net_ns_by_fd(nla_get_u32(tb[IFLA_NET_NS_FD]));
2339 net = get_net(src_net);
2342 EXPORT_SYMBOL(rtnl_link_get_net);
2344 /* Figure out which network namespace we are talking about by
2345 * examining the link attributes in the following order:
2347 * 1. IFLA_NET_NS_PID
2349 * 3. IFLA_TARGET_NETNSID
// Returns ERR_PTR(-EINVAL) on the failure path of the id lookup; the
// success return is not visible in this listing.
2351 static struct net *rtnl_link_get_net_by_nlattr(struct net *src_net,
2352 struct nlattr *tb[])
// PID and FD attributes are delegated to rtnl_link_get_net().
2356 if (tb[IFLA_NET_NS_PID] || tb[IFLA_NET_NS_FD])
2357 return rtnl_link_get_net(src_net, tb);
2359 if (!tb[IFLA_TARGET_NETNSID])
2360 return get_net(src_net);
// NOTE(review): ifla_policy declares IFLA_TARGET_NETNSID as NLA_S32 and the
// dump path reads it with nla_get_s32(), but it is read with nla_get_u32()
// here - confirm this is intended.
2362 net = get_net_ns_by_id(src_net, nla_get_u32(tb[IFLA_TARGET_NETNSID]));
2364 return ERR_PTR(-EINVAL);
// rtnl_link_get_net_capable - resolve the target namespace of a request and
// check that the sender holds capability @cap in that namespace's user
// namespace.
// Returns ERR_PTR(-EPERM) when the capability check fails.
// NOTE(review): the IS_ERR() check on the lookup result, the reference drop
// before the -EPERM return and the success return are presumably on lines
// not visible in this listing - confirm.
2369 static struct net *rtnl_link_get_net_capable(const struct sk_buff *skb,
2370 struct net *src_net,
2371 struct nlattr *tb[], int cap)
2375 net = rtnl_link_get_net_by_nlattr(src_net, tb);
2379 if (!netlink_ns_capable(skb, net->user_ns, cap)) {
2381 return ERR_PTR(-EPERM);
2387 /* Verify that rtnetlink requests do not pass additional properties
2388 * potentially referring to different network namespaces.
// With netns_id_only set, only requests without IFLA_NET_NS_PID and
// IFLA_NET_NS_FD pass the first test. Otherwise the three namespace
// attributes are checked pairwise so that at most one of them is present.
// NOTE(review): the third parameter declaration, the goto/return statements
// and the error codes are on lines not visible in this listing.
2390 static int rtnl_ensure_unique_netns(struct nlattr *tb[],
2391 struct netlink_ext_ack *extack,
2395 if (netns_id_only) {
2396 if (!tb[IFLA_NET_NS_PID] && !tb[IFLA_NET_NS_FD])
2399 NL_SET_ERR_MSG(extack, "specified netns attribute not supported");
2403 if (tb[IFLA_TARGET_NETNSID] && (tb[IFLA_NET_NS_PID] || tb[IFLA_NET_NS_FD]))
2406 if (tb[IFLA_NET_NS_PID] && (tb[IFLA_TARGET_NETNSID] || tb[IFLA_NET_NS_FD]))
2409 if (tb[IFLA_NET_NS_FD] && (tb[IFLA_TARGET_NETNSID] || tb[IFLA_NET_NS_PID]))
2415 NL_SET_ERR_MSG(extack, "multiple netns identifying attributes specified");
// rtnl_set_vf_rate - validate and apply VF transmit rate limits.
// @dev: device owning the VF
// @vf: VF index
// @min_tx_rate: minimum rate
// (the max_tx_rate parameter declaration is on a line not visible here)
//
// Requires the driver's ndo_set_vf_rate hook. A non-zero max_tx_rate must
// not be below min_tx_rate; max_tx_rate == 0 skips that comparison.
// The error codes of the two rejected cases are not visible in this listing.
2419 static int rtnl_set_vf_rate(struct net_device *dev, int vf, int min_tx_rate,
2422 const struct net_device_ops *ops = dev->netdev_ops;
2424 if (!ops->ndo_set_vf_rate)
2426 if (max_tx_rate && max_tx_rate < min_tx_rate)
2429 return ops->ndo_set_vf_rate(dev, vf, min_tx_rate, max_tx_rate);
// validate_linkmsg - sanity-check link attributes against @dev before they
// are applied.
// @dev: device the request targets
// @tb: parsed IFLA_* attributes
// @extack: extended ack used for error messages
//
// Checks visible below: address and broadcast payloads must cover
// dev->addr_len; GSO sizes are bounded by dev->tso_max_size; GSO segments by
// GSO_MAX_SEGS and dev->tso_max_segs; GRO sizes by GRO_MAX_SIZE; every
// family nested in IFLA_AF_SPEC must have registered af_ops and passes
// through its validate_link_af hook when present.
// NOTE(review): the return statements (error codes) of most branches are
// not visible in this listing.
2432 static int validate_linkmsg(struct net_device *dev, struct nlattr *tb[],
2433 struct netlink_ext_ack *extack)
2435 if (tb[IFLA_ADDRESS] &&
2436 nla_len(tb[IFLA_ADDRESS]) < dev->addr_len)
2439 if (tb[IFLA_BROADCAST] &&
2440 nla_len(tb[IFLA_BROADCAST]) < dev->addr_len)
2443 if (tb[IFLA_GSO_MAX_SIZE] &&
2444 nla_get_u32(tb[IFLA_GSO_MAX_SIZE]) > dev->tso_max_size) {
2445 NL_SET_ERR_MSG(extack, "too big gso_max_size");
2449 if (tb[IFLA_GSO_MAX_SEGS] &&
2450 (nla_get_u32(tb[IFLA_GSO_MAX_SEGS]) > GSO_MAX_SEGS ||
2451 nla_get_u32(tb[IFLA_GSO_MAX_SEGS]) > dev->tso_max_segs)) {
2452 NL_SET_ERR_MSG(extack, "too big gso_max_segs");
2456 if (tb[IFLA_GRO_MAX_SIZE] &&
2457 nla_get_u32(tb[IFLA_GRO_MAX_SIZE]) > GRO_MAX_SIZE) {
2458 NL_SET_ERR_MSG(extack, "too big gro_max_size");
2462 if (tb[IFLA_GSO_IPV4_MAX_SIZE] &&
2463 nla_get_u32(tb[IFLA_GSO_IPV4_MAX_SIZE]) > dev->tso_max_size) {
2464 NL_SET_ERR_MSG(extack, "too big gso_ipv4_max_size");
2468 if (tb[IFLA_GRO_IPV4_MAX_SIZE] &&
2469 nla_get_u32(tb[IFLA_GRO_IPV4_MAX_SIZE]) > GRO_MAX_SIZE) {
2470 NL_SET_ERR_MSG(extack, "too big gro_ipv4_max_size");
2474 if (tb[IFLA_AF_SPEC]) {
2478 nla_for_each_nested(af, tb[IFLA_AF_SPEC], rem) {
2479 const struct rtnl_af_ops *af_ops;
// The nested attribute type is the address family number.
2481 af_ops = rtnl_af_lookup(nla_type(af));
2483 return -EAFNOSUPPORT;
2485 if (!af_ops->set_link_af)
2488 if (af_ops->validate_link_af) {
2489 err = af_ops->validate_link_af(dev, af, extack);
// handle_infiniband_guid - forward a VF GUID change to the driver.
// Calls ndo_set_vf_guid() with the VF index and GUID taken from @ivt and the
// guid type supplied by the caller (that parameter's declaration is on a
// line not visible here). The hook is called unconditionally, so callers
// must have checked that it is set.
2499 static int handle_infiniband_guid(struct net_device *dev, struct ifla_vf_guid *ivt,
2502 const struct net_device_ops *ops = dev->netdev_ops;
2504 return ops->ndo_set_vf_guid(dev, ivt->vf, ivt->guid, guid_type);
// handle_vf_guid - apply a VF GUID change when the device type allows it.
// Devices of type ARPHRD_INFINIBAND are passed on to
// handle_infiniband_guid(); the value returned for other device types is on
// a line not visible in this listing.
2507 static int handle_vf_guid(struct net_device *dev, struct ifla_vf_guid *ivt, int guid_type)
2509 if (dev->type != ARPHRD_INFINIBAND)
2512 return handle_infiniband_guid(dev, ivt, guid_type);
// do_setvfinfo - apply the per-VF settings contained in one VF info entry.
// @dev: device owning the VF
// @tb: parsed IFLA_VF_* attributes of that entry
//
// Each attribute present is handed to the matching ndo_set_vf_* driver hook
// (rates go through rtnl_set_vf_rate(), GUIDs through handle_vf_guid()).
// Every VF index is rejected when it is >= INT_MAX because the driver hooks
// take a signed int.
// NOTE(review): the error-code assignments and return statements between
// the visible lines are not part of this listing.
2515 static int do_setvfinfo(struct net_device *dev, struct nlattr **tb)
2517 const struct net_device_ops *ops = dev->netdev_ops;
2520 if (tb[IFLA_VF_MAC]) {
2521 struct ifla_vf_mac *ivm = nla_data(tb[IFLA_VF_MAC]);
2523 if (ivm->vf >= INT_MAX)
2526 if (ops->ndo_set_vf_mac)
2527 err = ops->ndo_set_vf_mac(dev, ivm->vf,
2533 if (tb[IFLA_VF_VLAN]) {
2534 struct ifla_vf_vlan *ivv = nla_data(tb[IFLA_VF_VLAN]);
2536 if (ivv->vf >= INT_MAX)
2539 if (ops->ndo_set_vf_vlan)
// The legacy single-VLAN attribute always uses the 802.1Q protocol.
2540 err = ops->ndo_set_vf_vlan(dev, ivv->vf, ivv->vlan,
2542 htons(ETH_P_8021Q));
2547 if (tb[IFLA_VF_VLAN_LIST]) {
2548 struct ifla_vf_vlan_info *ivvl[MAX_VLAN_LIST_LEN];
2549 struct nlattr *attr;
2553 if (!ops->ndo_set_vf_vlan)
2556 nla_for_each_nested(attr, tb[IFLA_VF_VLAN_LIST], rem) {
// The payload is dereferenced below as struct ifla_vf_vlan_info, so it must
// be at least that large. The previous bound (NLA_HDRLEN) accepted shorter
// payloads and allowed reads past the end of the attribute.
2557 if (nla_type(attr) != IFLA_VF_VLAN_INFO ||
2558 nla_len(attr) < sizeof(struct ifla_vf_vlan_info)) {
2561 if (len >= MAX_VLAN_LIST_LEN)
2563 ivvl[len] = nla_data(attr);
2570 if (ivvl[0]->vf >= INT_MAX)
// Only the first list entry is passed to the driver.
2572 err = ops->ndo_set_vf_vlan(dev, ivvl[0]->vf, ivvl[0]->vlan,
2573 ivvl[0]->qos, ivvl[0]->vlan_proto);
2578 if (tb[IFLA_VF_TX_RATE]) {
2579 struct ifla_vf_tx_rate *ivt = nla_data(tb[IFLA_VF_TX_RATE]);
2580 struct ifla_vf_info ivf;
2582 if (ivt->vf >= INT_MAX)
// The legacy attribute only carries a max rate; the current min rate is
// read back from the driver so it can be passed along unchanged.
2585 if (ops->ndo_get_vf_config)
2586 err = ops->ndo_get_vf_config(dev, ivt->vf, &ivf);
2590 err = rtnl_set_vf_rate(dev, ivt->vf,
2591 ivf.min_tx_rate, ivt->rate);
2596 if (tb[IFLA_VF_RATE]) {
2597 struct ifla_vf_rate *ivt = nla_data(tb[IFLA_VF_RATE]);
2599 if (ivt->vf >= INT_MAX)
2602 err = rtnl_set_vf_rate(dev, ivt->vf,
2603 ivt->min_tx_rate, ivt->max_tx_rate);
2608 if (tb[IFLA_VF_SPOOFCHK]) {
2609 struct ifla_vf_spoofchk *ivs = nla_data(tb[IFLA_VF_SPOOFCHK]);
2611 if (ivs->vf >= INT_MAX)
2614 if (ops->ndo_set_vf_spoofchk)
2615 err = ops->ndo_set_vf_spoofchk(dev, ivs->vf,
2621 if (tb[IFLA_VF_LINK_STATE]) {
2622 struct ifla_vf_link_state *ivl = nla_data(tb[IFLA_VF_LINK_STATE]);
2624 if (ivl->vf >= INT_MAX)
2627 if (ops->ndo_set_vf_link_state)
2628 err = ops->ndo_set_vf_link_state(dev, ivl->vf,
2634 if (tb[IFLA_VF_RSS_QUERY_EN]) {
2635 struct ifla_vf_rss_query_en *ivrssq_en;
2638 ivrssq_en = nla_data(tb[IFLA_VF_RSS_QUERY_EN]);
2639 if (ivrssq_en->vf >= INT_MAX)
2641 if (ops->ndo_set_vf_rss_query_en)
2642 err = ops->ndo_set_vf_rss_query_en(dev, ivrssq_en->vf,
2643 ivrssq_en->setting);
2648 if (tb[IFLA_VF_TRUST]) {
2649 struct ifla_vf_trust *ivt = nla_data(tb[IFLA_VF_TRUST]);
2651 if (ivt->vf >= INT_MAX)
2654 if (ops->ndo_set_vf_trust)
2655 err = ops->ndo_set_vf_trust(dev, ivt->vf, ivt->setting);
2660 if (tb[IFLA_VF_IB_NODE_GUID]) {
2661 struct ifla_vf_guid *ivt = nla_data(tb[IFLA_VF_IB_NODE_GUID]);
2663 if (ivt->vf >= INT_MAX)
2665 if (!ops->ndo_set_vf_guid)
2667 return handle_vf_guid(dev, ivt, IFLA_VF_IB_NODE_GUID);
2670 if (tb[IFLA_VF_IB_PORT_GUID]) {
2671 struct ifla_vf_guid *ivt = nla_data(tb[IFLA_VF_IB_PORT_GUID]);
2673 if (ivt->vf >= INT_MAX)
2675 if (!ops->ndo_set_vf_guid)
2678 return handle_vf_guid(dev, ivt, IFLA_VF_IB_PORT_GUID);
// do_set_master - change the master device of @dev.
// @dev: device being enslaved or released
// @ifindex: ifindex of the new master
// @extack: extended ack passed to ndo_add_slave()
//
// If @dev already has a master, it is released through that master's
// ndo_del_slave() hook unless the master already has the requested ifindex.
// The new master is then looked up by ifindex in @dev's namespace and @dev
// is attached with ndo_add_slave().
// NOTE(review): the conditions guarding each stage, the handling of missing
// hooks and the return statements are not visible in this listing.
2684 static int do_set_master(struct net_device *dev, int ifindex,
2685 struct netlink_ext_ack *extack)
2687 struct net_device *upper_dev = netdev_master_upper_dev_get(dev);
2688 const struct net_device_ops *ops;
2692 if (upper_dev->ifindex == ifindex)
2694 ops = upper_dev->netdev_ops;
2695 if (ops->ndo_del_slave) {
2696 err = ops->ndo_del_slave(upper_dev, dev);
2705 upper_dev = __dev_get_by_index(dev_net(dev), ifindex);
2708 ops = upper_dev->netdev_ops;
2709 if (ops->ndo_add_slave) {
2710 err = ops->ndo_add_slave(upper_dev, dev, extack);
// ifla_proto_down_reason_policy - policy for the attributes nested inside
// IFLA_PROTO_DOWN_REASON: a u32 mask and a u32 value.
// NOTE(review): the array is sized by IFLA_PROTO_DOWN_REASON_VALUE + 1 while
// do_set_proto_down() parses with IFLA_PROTO_DOWN_REASON_MAX; this is only
// safe while VALUE is the highest attribute - confirm against the uapi enum.
2720 static const struct nla_policy ifla_proto_down_reason_policy[IFLA_PROTO_DOWN_REASON_VALUE + 1] = {
2721 [IFLA_PROTO_DOWN_REASON_MASK] = { .type = NLA_U32 },
2722 [IFLA_PROTO_DOWN_REASON_VALUE] = { .type = NLA_U32 },
// do_set_proto_down - apply IFLA_PROTO_DOWN and/or IFLA_PROTO_DOWN_REASON.
// @dev: target device
// @nl_proto_down: optional IFLA_PROTO_DOWN attribute (u8)
// @nl_proto_down_reason: optional nested IFLA_PROTO_DOWN_REASON attribute
// @extack: extended ack used for error messages
//
// The device must have IFF_CHANGE_PROTO_DOWN set in priv_flags. The reason
// nest needs a VALUE and may carry a MASK (mask defaults to 0 when absent);
// both go to dev_change_proto_down_reason(). Protodown cannot be cleared
// while dev->proto_down_reason is non-zero.
// NOTE(review): error codes and return statements are not visible in this
// listing.
2725 static int do_set_proto_down(struct net_device *dev,
2726 struct nlattr *nl_proto_down,
2727 struct nlattr *nl_proto_down_reason,
2728 struct netlink_ext_ack *extack)
2730 struct nlattr *pdreason[IFLA_PROTO_DOWN_REASON_MAX + 1];
2731 unsigned long mask = 0;
2736 if (!(dev->priv_flags & IFF_CHANGE_PROTO_DOWN)) {
2737 NL_SET_ERR_MSG(extack, "Protodown not supported by device");
2741 if (nl_proto_down_reason) {
2742 err = nla_parse_nested_deprecated(pdreason,
2743 IFLA_PROTO_DOWN_REASON_MAX,
2744 nl_proto_down_reason,
2745 ifla_proto_down_reason_policy,
2750 if (!pdreason[IFLA_PROTO_DOWN_REASON_VALUE]) {
2751 NL_SET_ERR_MSG(extack, "Invalid protodown reason value");
2755 value = nla_get_u32(pdreason[IFLA_PROTO_DOWN_REASON_VALUE]);
2757 if (pdreason[IFLA_PROTO_DOWN_REASON_MASK])
2758 mask = nla_get_u32(pdreason[IFLA_PROTO_DOWN_REASON_MASK]);
2760 dev_change_proto_down_reason(dev, mask, value);
2763 if (nl_proto_down) {
2764 proto_down = nla_get_u8(nl_proto_down);
2766 /* Don't turn off protodown if there are active reasons */
2767 if (!proto_down && dev->proto_down_reason) {
2768 NL_SET_ERR_MSG(extack, "Cannot clear protodown, active reasons");
2771 err = dev_change_proto_down(dev,
/*
 * Status bits accumulated by do_setlink().  DO_SETLINK_NOTIFY (0x03)
 * includes the DO_SETLINK_MODIFIED bit (0x01).
 */
2780 #define DO_SETLINK_MODIFIED 0x01
2781 /* notify flag means notify + modified. */
2782 #define DO_SETLINK_NOTIFY 0x03
/*
 * do_setlink - apply the attributes in @tb and the flags in @ifm to @dev.
 * @skb: request skb, passed to rtnl_link_get_net_capable() for netns moves
 * @dev: device being modified
 * @ifm: message header; ifi_index, ifi_flags and ifi_change are read
 * @extack: extended ack forwarded to the helpers that accept one
 * @tb: parsed IFLA_* attribute table
 * @status: DO_SETLINK_* bits already accumulated by the caller
 *
 * Attributes are handled one after another in the order written below.
 * Each handled attribute ORs either DO_SETLINK_MODIFIED or
 * DO_SETLINK_NOTIFY into @status; IFLA_BROADCAST instead raises
 * NETDEV_CHANGEADDR directly.  At the end netdev_state_change() is called
 * only when both notify bits are set, and a rate-limited warning reports
 * a request that failed after some changes were already committed.
 *
 * NOTE(review): this excerpt omits most error checks, several attribute
 * guards (e.g. the tests in front of the IFLA_MAP, IFLA_MTU and IFLA_XDP
 * sections) and the closing braces; consult the full file before editing.
 */
2783 static int do_setlink(const struct sk_buff *skb,
2784 struct net_device *dev, struct ifinfomsg *ifm,
2785 struct netlink_ext_ack *extack,
2786 struct nlattr **tb, int status)
2788 const struct net_device_ops *ops = dev->netdev_ops;
2789 char ifname[IFNAMSIZ];
2792 if (tb[IFLA_IFNAME])
2793 nla_strscpy(ifname, tb[IFLA_IFNAME], IFNAMSIZ);
/*
 * Namespace move: the (possibly empty) requested name is passed as the
 * name pattern, together with an optional new ifindex.
 */
2797 if (tb[IFLA_NET_NS_PID] || tb[IFLA_NET_NS_FD] || tb[IFLA_TARGET_NETNSID]) {
2798 const char *pat = ifname[0] ? ifname : NULL;
2802 net = rtnl_link_get_net_capable(skb, dev_net(dev),
2809 if (tb[IFLA_NEW_IFINDEX])
2810 new_ifindex = nla_get_s32(tb[IFLA_NEW_IFINDEX]);
2814 err = __dev_change_net_namespace(dev, net, pat, new_ifindex);
2818 status |= DO_SETLINK_MODIFIED;
2822 struct rtnl_link_ifmap *u_map;
2825 if (!ops->ndo_set_config) {
2830 if (!netif_device_present(dev)) {
2835 u_map = nla_data(tb[IFLA_MAP]);
2836 k_map.mem_start = (unsigned long) u_map->mem_start;
2837 k_map.mem_end = (unsigned long) u_map->mem_end;
2838 k_map.base_addr = (unsigned short) u_map->base_addr;
2839 k_map.irq = (unsigned char) u_map->irq;
2840 k_map.dma = (unsigned char) u_map->dma;
2841 k_map.port = (unsigned char) u_map->port;
2843 err = ops->ndo_set_config(dev, &k_map);
2847 status |= DO_SETLINK_NOTIFY;
2850 if (tb[IFLA_ADDRESS]) {
2851 struct sockaddr *sa;
2854 len = sizeof(sa_family_t) + max_t(size_t, dev->addr_len,
2856 sa = kmalloc(len, GFP_KERNEL);
2861 sa->sa_family = dev->type;
2862 memcpy(sa->sa_data, nla_data(tb[IFLA_ADDRESS]),
2864 err = dev_set_mac_address_user(dev, sa, extack);
2868 status |= DO_SETLINK_MODIFIED;
2872 err = dev_set_mtu_ext(dev, nla_get_u32(tb[IFLA_MTU]), extack);
2875 status |= DO_SETLINK_MODIFIED;
2878 if (tb[IFLA_GROUP]) {
2879 dev_set_group(dev, nla_get_u32(tb[IFLA_GROUP]));
2880 status |= DO_SETLINK_NOTIFY;
2884 * Interface selected by interface index but interface
2885 * name provided implies that a name change has been
2888 if (ifm->ifi_index > 0 && ifname[0]) {
2889 err = dev_change_name(dev, ifname);
2892 status |= DO_SETLINK_MODIFIED;
2895 if (tb[IFLA_IFALIAS]) {
2896 err = dev_set_alias(dev, nla_data(tb[IFLA_IFALIAS]),
2897 nla_len(tb[IFLA_IFALIAS]));
2900 status |= DO_SETLINK_NOTIFY;
2903 if (tb[IFLA_BROADCAST]) {
2904 nla_memcpy(dev->broadcast, tb[IFLA_BROADCAST], dev->addr_len);
2905 call_netdevice_notifiers(NETDEV_CHANGEADDR, dev);
2908 if (tb[IFLA_MASTER]) {
2909 err = do_set_master(dev, nla_get_u32(tb[IFLA_MASTER]), extack);
2912 status |= DO_SETLINK_MODIFIED;
/* Flag changes come from the ifinfomsg header, not from an attribute. */
2915 if (ifm->ifi_flags || ifm->ifi_change) {
2916 err = dev_change_flags(dev, rtnl_dev_combine_flags(dev, ifm),
2922 if (tb[IFLA_CARRIER]) {
2923 err = dev_change_carrier(dev, nla_get_u8(tb[IFLA_CARRIER]));
2926 status |= DO_SETLINK_MODIFIED;
2929 if (tb[IFLA_TXQLEN]) {
2930 unsigned int value = nla_get_u32(tb[IFLA_TXQLEN]);
2932 err = dev_change_tx_queue_len(dev, value);
2935 status |= DO_SETLINK_MODIFIED;
/*
 * The GSO/GRO limits below are only written, and only counted as a
 * modification, when the requested value differs from the current one.
 */
2938 if (tb[IFLA_GSO_MAX_SIZE]) {
2939 u32 max_size = nla_get_u32(tb[IFLA_GSO_MAX_SIZE]);
2941 if (dev->gso_max_size ^ max_size) {
2942 netif_set_gso_max_size(dev, max_size);
2943 status |= DO_SETLINK_MODIFIED;
2947 if (tb[IFLA_GSO_MAX_SEGS]) {
2948 u32 max_segs = nla_get_u32(tb[IFLA_GSO_MAX_SEGS]);
2950 if (dev->gso_max_segs ^ max_segs) {
2951 netif_set_gso_max_segs(dev, max_segs);
2952 status |= DO_SETLINK_MODIFIED;
2956 if (tb[IFLA_GRO_MAX_SIZE]) {
2957 u32 gro_max_size = nla_get_u32(tb[IFLA_GRO_MAX_SIZE]);
2959 if (dev->gro_max_size ^ gro_max_size) {
2960 netif_set_gro_max_size(dev, gro_max_size);
2961 status |= DO_SETLINK_MODIFIED;
2965 if (tb[IFLA_GSO_IPV4_MAX_SIZE]) {
2966 u32 max_size = nla_get_u32(tb[IFLA_GSO_IPV4_MAX_SIZE]);
2968 if (dev->gso_ipv4_max_size ^ max_size) {
2969 netif_set_gso_ipv4_max_size(dev, max_size);
2970 status |= DO_SETLINK_MODIFIED;
2974 if (tb[IFLA_GRO_IPV4_MAX_SIZE]) {
2975 u32 gro_max_size = nla_get_u32(tb[IFLA_GRO_IPV4_MAX_SIZE]);
2977 if (dev->gro_ipv4_max_size ^ gro_max_size) {
2978 netif_set_gro_ipv4_max_size(dev, gro_max_size);
2979 status |= DO_SETLINK_MODIFIED;
2983 if (tb[IFLA_OPERSTATE])
2984 set_operstate(dev, nla_get_u8(tb[IFLA_OPERSTATE]));
/* link_mode is updated under dev_base_lock held for writing. */
2986 if (tb[IFLA_LINKMODE]) {
2987 unsigned char value = nla_get_u8(tb[IFLA_LINKMODE]);
2989 write_lock(&dev_base_lock);
2990 if (dev->link_mode ^ value)
2991 status |= DO_SETLINK_NOTIFY;
2992 dev->link_mode = value;
2993 write_unlock(&dev_base_lock);
2996 if (tb[IFLA_VFINFO_LIST]) {
2997 struct nlattr *vfinfo[IFLA_VF_MAX + 1];
2998 struct nlattr *attr;
3001 nla_for_each_nested(attr, tb[IFLA_VFINFO_LIST], rem) {
3002 if (nla_type(attr) != IFLA_VF_INFO ||
3003 nla_len(attr) < NLA_HDRLEN) {
3007 err = nla_parse_nested_deprecated(vfinfo, IFLA_VF_MAX,
3013 err = do_setvfinfo(dev, vfinfo);
3016 status |= DO_SETLINK_NOTIFY;
3021 if (tb[IFLA_VF_PORTS]) {
3022 struct nlattr *port[IFLA_PORT_MAX+1];
3023 struct nlattr *attr;
3028 if (!ops->ndo_set_vf_port)
3031 nla_for_each_nested(attr, tb[IFLA_VF_PORTS], rem) {
3032 if (nla_type(attr) != IFLA_VF_PORT ||
3033 nla_len(attr) < NLA_HDRLEN) {
3037 err = nla_parse_nested_deprecated(port, IFLA_PORT_MAX,
3043 if (!port[IFLA_PORT_VF]) {
3047 vf = nla_get_u32(port[IFLA_PORT_VF]);
3048 err = ops->ndo_set_vf_port(dev, vf, port);
3051 status |= DO_SETLINK_NOTIFY;
3056 if (tb[IFLA_PORT_SELF]) {
3057 struct nlattr *port[IFLA_PORT_MAX+1];
3059 err = nla_parse_nested_deprecated(port, IFLA_PORT_MAX,
3061 ifla_port_policy, NULL);
3066 if (ops->ndo_set_vf_port)
3067 err = ops->ndo_set_vf_port(dev, PORT_SELF_VF, port);
3070 status |= DO_SETLINK_NOTIFY;
3073 if (tb[IFLA_AF_SPEC]) {
3077 nla_for_each_nested(af, tb[IFLA_AF_SPEC], rem) {
3078 const struct rtnl_af_ops *af_ops;
3080 BUG_ON(!(af_ops = rtnl_af_lookup(nla_type(af))));
3082 err = af_ops->set_link_af(dev, af, extack);
3086 status |= DO_SETLINK_NOTIFY;
3091 if (tb[IFLA_PROTO_DOWN] || tb[IFLA_PROTO_DOWN_REASON]) {
3092 err = do_set_proto_down(dev, tb[IFLA_PROTO_DOWN],
3093 tb[IFLA_PROTO_DOWN_REASON], extack);
3096 status |= DO_SETLINK_NOTIFY;
3100 struct nlattr *xdp[IFLA_XDP_MAX + 1];
3103 err = nla_parse_nested_deprecated(xdp, IFLA_XDP_MAX,
3105 ifla_xdp_policy, NULL);
3109 if (xdp[IFLA_XDP_ATTACHED] || xdp[IFLA_XDP_PROG_ID]) {
3114 if (xdp[IFLA_XDP_FLAGS]) {
3115 xdp_flags = nla_get_u32(xdp[IFLA_XDP_FLAGS]);
3116 if (xdp_flags & ~XDP_FLAGS_MASK) {
3120 if (hweight32(xdp_flags & XDP_FLAGS_MODES) > 1) {
3126 if (xdp[IFLA_XDP_FD]) {
3127 int expected_fd = -1;
3129 if (xdp_flags & XDP_FLAGS_REPLACE) {
3130 if (!xdp[IFLA_XDP_EXPECTED_FD]) {
3135 nla_get_s32(xdp[IFLA_XDP_EXPECTED_FD]);
3138 err = dev_change_xdp_fd(dev, extack,
3139 nla_get_s32(xdp[IFLA_XDP_FD]),
3144 status |= DO_SETLINK_NOTIFY;
/*
 * Common exit: notify only when both DO_SETLINK_NOTIFY bits are set; the
 * warning below covers a failure after a partial update.
 */
3149 if (status & DO_SETLINK_MODIFIED) {
3150 if ((status & DO_SETLINK_NOTIFY) == DO_SETLINK_NOTIFY)
3151 netdev_state_change(dev);
3154 net_warn_ratelimited("A link change request failed with some changes committed already. Interface %s may have been left with an inconsistent configuration, please check.\n",
/*
 * rtnl_dev_get - look up a device in @net by the name carried in @tb.
 * @net: namespace to search
 * @tb: parsed IFLA_* attributes
 *
 * IFLA_IFNAME takes precedence over IFLA_ALT_IFNAME.  The local buffer is
 * sized for the longer alternative name (ALTIFNAMSIZ); a primary name is
 * copied with the IFNAMSIZ bound.  The result of __dev_get_by_name() is
 * returned as-is.
 * NOTE(review): the branch taken when neither attribute is present is
 * not visible in this excerpt.
 */
3161 static struct net_device *rtnl_dev_get(struct net *net,
3162 struct nlattr *tb[])
3164 char ifname[ALTIFNAMSIZ];
3166 if (tb[IFLA_IFNAME])
3167 nla_strscpy(ifname, tb[IFLA_IFNAME], IFNAMSIZ);
3168 else if (tb[IFLA_ALT_IFNAME])
3169 nla_strscpy(ifname, tb[IFLA_ALT_IFNAME], ALTIFNAMSIZ);
3173 return __dev_get_by_name(net, ifname);
/*
 * rtnl_setlink - modify an existing device from a netlink request.
 * @skb: request skb; its socket selects the namespace that is searched
 * @nlh: netlink header followed by a struct ifinfomsg and IFLA_* attributes
 * @extack: extended ack for parse and validation errors
 *
 * The message is parsed against ifla_policy and checked with
 * rtnl_ensure_unique_netns().  The device is resolved by ifi_index when
 * that is positive, otherwise by IFLA_IFNAME/IFLA_ALT_IFNAME.  After
 * validate_linkmsg() the work is delegated to do_setlink() with an
 * initial status of 0.
 * NOTE(review): the error checks between these calls are elided here.
 */
3176 static int rtnl_setlink(struct sk_buff *skb, struct nlmsghdr *nlh,
3177 struct netlink_ext_ack *extack)
3179 struct net *net = sock_net(skb->sk);
3180 struct ifinfomsg *ifm;
3181 struct net_device *dev;
3183 struct nlattr *tb[IFLA_MAX+1];
3185 err = nlmsg_parse_deprecated(nlh, sizeof(*ifm), tb, IFLA_MAX,
3186 ifla_policy, extack);
3190 err = rtnl_ensure_unique_netns(tb, extack, false);
3195 ifm = nlmsg_data(nlh);
3196 if (ifm->ifi_index > 0)
3197 dev = __dev_get_by_index(net, ifm->ifi_index);
3198 else if (tb[IFLA_IFNAME] || tb[IFLA_ALT_IFNAME])
3199 dev = rtnl_dev_get(net, tb);
3208 err = validate_linkmsg(dev, tb, extack);
3212 err = do_setlink(skb, dev, ifm, extack, tb, 0);
/*
 * rtnl_group_dellink - delete every device in @net that belongs to @group.
 * @net: namespace whose device list is walked
 * @group: device group number to match against dev->group
 *
 * Two passes are made.  The first only inspects: each matching device is
 * tested for rtnl_link_ops with a dellink callback (the statement under
 * that test is not visible here).  The second pass calls dellink() for
 * each matching device with a shared list head, which is then passed to
 * unregister_netdevice_many() in one call.
 */
3217 static int rtnl_group_dellink(const struct net *net, int group)
3219 struct net_device *dev, *aux;
3220 LIST_HEAD(list_kill);
3226 for_each_netdev(net, dev) {
3227 if (dev->group == group) {
3228 const struct rtnl_link_ops *ops;
3231 ops = dev->rtnl_link_ops;
3232 if (!ops || !ops->dellink)
/* Second pass: uses the _safe iterator while dellink() is being called. */
3240 for_each_netdev_safe(net, dev, aux) {
3241 if (dev->group == group) {
3242 const struct rtnl_link_ops *ops;
3244 ops = dev->rtnl_link_ops;
3245 ops->dellink(dev, &list_kill);
3248 unregister_netdevice_many(&list_kill);
/*
 * rtnl_delete_link - delete @dev through its rtnl_link_ops.
 * @dev: device to remove
 * @portid: forwarded to unregister_netdevice_many_notify()
 * @nlh: forwarded to unregister_netdevice_many_notify()
 *
 * The device must have rtnl_link_ops with a dellink callback (the value
 * returned when it does not is not visible in this excerpt).  dellink()
 * is given a local list head, which is then handed to
 * unregister_netdevice_many_notify().  Exported GPL-only.
 */
3253 int rtnl_delete_link(struct net_device *dev, u32 portid, const struct nlmsghdr *nlh)
3255 const struct rtnl_link_ops *ops;
3256 LIST_HEAD(list_kill);
3258 ops = dev->rtnl_link_ops;
3259 if (!ops || !ops->dellink)
3262 ops->dellink(dev, &list_kill);
3263 unregister_netdevice_many_notify(&list_kill, portid, nlh);
3267 EXPORT_SYMBOL_GPL(rtnl_delete_link);
/*
 * rtnl_dellink - delete a device, or a whole device group, on request.
 * @skb: request skb; supplies the sender's namespace and netlink portid
 * @nlh: netlink header followed by a struct ifinfomsg and IFLA_* attributes
 * @extack: extended ack for parse errors
 *
 * When IFLA_TARGET_NETNSID is present the operation is applied to that
 * namespace (tgt_net) instead of the sender's.  The device is selected by
 * ifi_index when positive, otherwise by IFLA_IFNAME/IFLA_ALT_IFNAME;
 * failing both, IFLA_GROUP deletes every device of the given group.
 *
 * All three selectors operate on tgt_net.  The by-name lookup previously
 * searched the sender's namespace, so a delete by name combined with
 * IFLA_TARGET_NETNSID could miss the device or pick a same-named device
 * in the wrong namespace.
 *
 * NOTE(review): error checks, some local declarations and the release of
 * tgt_net are not visible in this excerpt.
 */
3269 static int rtnl_dellink(struct sk_buff *skb, struct nlmsghdr *nlh,
3270 struct netlink_ext_ack *extack)
3272 struct net *net = sock_net(skb->sk);
3273 u32 portid = NETLINK_CB(skb).portid;
3274 struct net *tgt_net = net;
3275 struct net_device *dev = NULL;
3276 struct ifinfomsg *ifm;
3277 struct nlattr *tb[IFLA_MAX+1];
3281 err = nlmsg_parse_deprecated(nlh, sizeof(*ifm), tb, IFLA_MAX,
3282 ifla_policy, extack);
3286 err = rtnl_ensure_unique_netns(tb, extack, true);
3290 if (tb[IFLA_TARGET_NETNSID]) {
3291 netnsid = nla_get_s32(tb[IFLA_TARGET_NETNSID]);
3292 tgt_net = rtnl_get_net_ns_capable(NETLINK_CB(skb).sk, netnsid);
3293 if (IS_ERR(tgt_net))
3294 return PTR_ERR(tgt_net);
3298 ifm = nlmsg_data(nlh);
3299 if (ifm->ifi_index > 0)
3300 dev = __dev_get_by_index(tgt_net, ifm->ifi_index);
3301 else if (tb[IFLA_IFNAME] || tb[IFLA_ALT_IFNAME])
3302 dev = rtnl_dev_get(tgt_net, tb);
3303 else if (tb[IFLA_GROUP])
3304 err = rtnl_group_dellink(tgt_net, nla_get_u32(tb[IFLA_GROUP]));
3309 if (tb[IFLA_IFNAME] || tb[IFLA_ALT_IFNAME] || ifm->ifi_index > 0)
3315 err = rtnl_delete_link(dev, portid, nlh);
/*
 * rtnl_configure_link - apply header flags to @dev and send flag notifications.
 * @dev: device being configured
 * @ifm: optional message header; when non-NULL and it carries ifi_flags or
 *	ifi_change, the combined flags are applied with __dev_change_flags()
 * @portid: forwarded to __dev_notify_flags()
 * @nlh: forwarded to __dev_notify_flags()
 *
 * The flags in effect on entry are saved first.  A device already in
 * RTNL_LINK_INITIALIZED state is notified with only the bits that differ
 * from the saved flags.  The other visible path marks the device
 * RTNL_LINK_INITIALIZED and notifies with a change mask of ~0U.
 * NOTE(review): the else keyword, error handling and return are elided.
 */
3324 int rtnl_configure_link(struct net_device *dev, const struct ifinfomsg *ifm,
3325 u32 portid, const struct nlmsghdr *nlh)
3327 unsigned int old_flags;
3330 old_flags = dev->flags;
3331 if (ifm && (ifm->ifi_flags || ifm->ifi_change)) {
3332 err = __dev_change_flags(dev, rtnl_dev_combine_flags(dev, ifm),
3338 if (dev->rtnl_link_state == RTNL_LINK_INITIALIZED) {
3339 __dev_notify_flags(dev, old_flags, (old_flags ^ dev->flags), portid, nlh);
3341 dev->rtnl_link_state = RTNL_LINK_INITIALIZED;
3342 __dev_notify_flags(dev, old_flags, ~0U, portid, nlh);
3346 EXPORT_SYMBOL(rtnl_configure_link);
/*
 * rtnl_create_link - allocate a net_device and pre-configure it from @tb.
 * @net: namespace assigned to the new device with dev_net_set()
 * @ifname: name (or name pattern) passed to the allocator
 * @name_assign_type: passed through to the allocator
 * @ops: link ops of the requested kind; stored in dev->rtnl_link_ops
 * @tb: parsed IFLA_* attributes
 * @extack: receives messages for invalid queue counts and MTU validation
 *
 * Queue counts default to 1, can be overridden by IFLA_NUM_TX_QUEUES /
 * IFLA_NUM_RX_QUEUES or else by the ops callbacks, and must each lie in
 * the range 1..4096.  The device comes from ops->alloc() or from
 * alloc_netdev_mqs() with ops->setup (the test choosing between them is
 * not visible here).  After validate_linkmsg() the device is marked
 * RTNL_LINK_INITIALIZING and the optional attributes below are copied in.
 *
 * Failures visible here are returned as ERR_PTR() values.
 */
3348 struct net_device *rtnl_create_link(struct net *net, const char *ifname,
3349 unsigned char name_assign_type,
3350 const struct rtnl_link_ops *ops,
3351 struct nlattr *tb[],
3352 struct netlink_ext_ack *extack)
3354 struct net_device *dev;
3355 unsigned int num_tx_queues = 1;
3356 unsigned int num_rx_queues = 1;
3359 if (tb[IFLA_NUM_TX_QUEUES])
3360 num_tx_queues = nla_get_u32(tb[IFLA_NUM_TX_QUEUES]);
3361 else if (ops->get_num_tx_queues)
3362 num_tx_queues = ops->get_num_tx_queues();
3364 if (tb[IFLA_NUM_RX_QUEUES])
3365 num_rx_queues = nla_get_u32(tb[IFLA_NUM_RX_QUEUES]);
3366 else if (ops->get_num_rx_queues)
3367 num_rx_queues = ops->get_num_rx_queues();
/* Reject queue counts outside 1..4096 before allocating anything. */
3369 if (num_tx_queues < 1 || num_tx_queues > 4096) {
3370 NL_SET_ERR_MSG(extack, "Invalid number of transmit queues");
3371 return ERR_PTR(-EINVAL);
3374 if (num_rx_queues < 1 || num_rx_queues > 4096) {
3375 NL_SET_ERR_MSG(extack, "Invalid number of receive queues");
3376 return ERR_PTR(-EINVAL);
3380 dev = ops->alloc(tb, ifname, name_assign_type,
3381 num_tx_queues, num_rx_queues);
3385 dev = alloc_netdev_mqs(ops->priv_size, ifname,
3386 name_assign_type, ops->setup,
3387 num_tx_queues, num_rx_queues);
3391 return ERR_PTR(-ENOMEM);
3393 err = validate_linkmsg(dev, tb, extack);
3396 return ERR_PTR(err);
3399 dev_net_set(dev, net);
3400 dev->rtnl_link_ops = ops;
3401 dev->rtnl_link_state = RTNL_LINK_INITIALIZING;
3404 u32 mtu = nla_get_u32(tb[IFLA_MTU]);
3406 err = dev_validate_mtu(dev, mtu, extack);
3409 return ERR_PTR(err);
/* A user-supplied address marks the device as NET_ADDR_SET. */
3413 if (tb[IFLA_ADDRESS]) {
3414 __dev_addr_set(dev, nla_data(tb[IFLA_ADDRESS]),
3415 nla_len(tb[IFLA_ADDRESS]));
3416 dev->addr_assign_type = NET_ADDR_SET;
3418 if (tb[IFLA_BROADCAST])
3419 memcpy(dev->broadcast, nla_data(tb[IFLA_BROADCAST]),
3420 nla_len(tb[IFLA_BROADCAST]));
3421 if (tb[IFLA_TXQLEN])
3422 dev->tx_queue_len = nla_get_u32(tb[IFLA_TXQLEN]);
3423 if (tb[IFLA_OPERSTATE])
3424 set_operstate(dev, nla_get_u8(tb[IFLA_OPERSTATE]));
3425 if (tb[IFLA_LINKMODE])
3426 dev->link_mode = nla_get_u8(tb[IFLA_LINKMODE]);
3428 dev_set_group(dev, nla_get_u32(tb[IFLA_GROUP]));
3429 if (tb[IFLA_GSO_MAX_SIZE])
3430 netif_set_gso_max_size(dev, nla_get_u32(tb[IFLA_GSO_MAX_SIZE]));
3431 if (tb[IFLA_GSO_MAX_SEGS])
3432 netif_set_gso_max_segs(dev, nla_get_u32(tb[IFLA_GSO_MAX_SEGS]));
3433 if (tb[IFLA_GRO_MAX_SIZE])
3434 netif_set_gro_max_size(dev, nla_get_u32(tb[IFLA_GRO_MAX_SIZE]));
3435 if (tb[IFLA_GSO_IPV4_MAX_SIZE])
3436 netif_set_gso_ipv4_max_size(dev, nla_get_u32(tb[IFLA_GSO_IPV4_MAX_SIZE]));
3437 if (tb[IFLA_GRO_IPV4_MAX_SIZE])
3438 netif_set_gro_ipv4_max_size(dev, nla_get_u32(tb[IFLA_GRO_IPV4_MAX_SIZE]));
3442 EXPORT_SYMBOL(rtnl_create_link);
/*
 * rtnl_group_changelink - apply one set-link request to a device group.
 * @skb: request skb, forwarded to do_setlink()
 * @net: namespace whose device list is walked
 * @group: device group number to match against dev->group
 * @ifm: message header, forwarded to do_setlink()
 * @extack: extended ack, forwarded to validation and do_setlink()
 *
 * Every device in @group is validated with validate_linkmsg() and then
 * updated through do_setlink() with an initial status of 0.
 * NOTE(review): the last parameter line and the error handling inside the
 * loop are not visible in this excerpt.
 */
3444 static int rtnl_group_changelink(const struct sk_buff *skb,
3445 struct net *net, int group,
3446 struct ifinfomsg *ifm,
3447 struct netlink_ext_ack *extack,
3450 struct net_device *dev, *aux;
3453 for_each_netdev_safe(net, dev, aux) {
3454 if (dev->group == group) {
3455 err = validate_linkmsg(dev, tb, extack);
3458 err = do_setlink(skb, dev, ifm, extack, tb, 0);
/*
 * rtnl_newlink_create - create, register and configure a new link.
 * @skb: request skb; supplies namespace, portid and capability checks
 * @ifm: message header; ifi_index is copied into dev->ifindex on a path
 *	whose guard is not visible here
 * @ops: link ops of the requested kind
 * @nlh: request header, forwarded to rtnl_configure_link()
 * @tb: parsed IFLA_* attributes
 * @data: parsed kind-specific attributes, forwarded to ops->newlink()
 * @extack: extended ack
 *
 * Without IFLA_IFNAME the name pattern "<kind>%d" is used and the name is
 * marked NET_NAME_ENUM.  The destination namespace needs CAP_NET_ADMIN;
 * an optional IFLA_LINK_NETNSID selects a separate link namespace, which
 * is capability-checked as well.  The device is created in the link
 * namespace when one was given, otherwise in the destination namespace.
 * It is then registered through ops->newlink() or register_netdevice(),
 * configured, moved to the destination namespace and enslaved to
 * IFLA_MASTER.
 *
 * Failures after registration jump to out_unregister, where the device is
 * torn down with ops->dellink() or unregister_netdevice().
 * NOTE(review): several guards and the namespace reference handling are
 * elided in this excerpt.
 */
3467 static int rtnl_newlink_create(struct sk_buff *skb, struct ifinfomsg *ifm,
3468 const struct rtnl_link_ops *ops,
3469 const struct nlmsghdr *nlh,
3470 struct nlattr **tb, struct nlattr **data,
3471 struct netlink_ext_ack *extack)
3473 unsigned char name_assign_type = NET_NAME_USER;
3474 struct net *net = sock_net(skb->sk);
3475 u32 portid = NETLINK_CB(skb).portid;
3476 struct net *dest_net, *link_net;
3477 struct net_device *dev;
3478 char ifname[IFNAMSIZ];
3481 if (!ops->alloc && !ops->setup)
3484 if (tb[IFLA_IFNAME]) {
3485 nla_strscpy(ifname, tb[IFLA_IFNAME], IFNAMSIZ);
3487 snprintf(ifname, IFNAMSIZ, "%s%%d", ops->kind);
3488 name_assign_type = NET_NAME_ENUM;
3491 dest_net = rtnl_link_get_net_capable(skb, net, tb, CAP_NET_ADMIN);
3492 if (IS_ERR(dest_net))
3493 return PTR_ERR(dest_net);
3495 if (tb[IFLA_LINK_NETNSID]) {
3496 int id = nla_get_s32(tb[IFLA_LINK_NETNSID]);
3498 link_net = get_net_ns_by_id(dest_net, id);
3500 NL_SET_ERR_MSG(extack, "Unknown network namespace id");
3505 if (!netlink_ns_capable(skb, link_net->user_ns, CAP_NET_ADMIN))
3511 dev = rtnl_create_link(link_net ? : dest_net, ifname,
3512 name_assign_type, ops, tb, extack);
3518 dev->ifindex = ifm->ifi_index;
3521 err = ops->newlink(link_net ? : net, dev, tb, data, extack);
3523 err = register_netdevice(dev);
3529 err = rtnl_configure_link(dev, ifm, portid, nlh);
3531 goto out_unregister;
3533 err = dev_change_net_namespace(dev, dest_net, ifname);
3535 goto out_unregister;
3537 if (tb[IFLA_MASTER]) {
3538 err = do_set_master(dev, nla_get_u32(tb[IFLA_MASTER]), extack);
3540 goto out_unregister;
3549 LIST_HEAD(list_kill);
3551 ops->dellink(dev, &list_kill);
3552 unregister_netdevice_many(&list_kill);
3554 unregister_netdevice(dev);
/*
 * Scratch attribute tables used while handling a new-link request:
 * @tb holds the top-level IFLA_* attributes, @attr the kind-specific
 * attributes (at most RTNL_MAX_TYPE) and @slave_attr the slave attributes
 * of the master's kind (at most RTNL_SLAVE_MAX_TYPE).
 */
3559 struct rtnl_newlink_tbs {
3560 struct nlattr *tb[IFLA_MAX + 1];
3561 struct nlattr *attr[RTNL_MAX_TYPE + 1];
3562 struct nlattr *slave_attr[RTNL_SLAVE_MAX_TYPE + 1];
/*
 * __rtnl_newlink - core of the new-link request: change or create a link.
 * @skb: request skb; its socket selects the namespace that is searched
 * @nlh: netlink header; NLM_F_EXCL, NLM_F_REPLACE and NLM_F_CREATE are tested
 * @tbs: caller-provided scratch attribute tables
 * @extack: extended ack
 *
 * Visible flow:
 *  - parse the message and locate an existing device by ifi_index or by
 *    name; a negative ifi_index is rejected with an extack message;
 *  - pick up the rtnl_link_ops of the device's master, if any;
 *  - parse IFLA_LINKINFO and resolve the ops for IFLA_INFO_KIND;
 *  - compare ops->maxtype with RTNL_MAX_TYPE and m_ops->slave_maxtype with
 *    RTNL_SLAVE_MAX_TYPE before the nested attributes are parsed into the
 *    fixed-size tables in @tbs;
 *  - with an existing device: run changelink()/slave_changelink(), each
 *    adding DO_SETLINK_NOTIFY to status, then finish through do_setlink();
 *  - without NLM_F_CREATE: fall back to a group change keyed by IFLA_GROUP;
 *  - otherwise, under CONFIG_MODULES, request the "rtnl-link-<kind>" module
 *    and look the ops up again, report "Unknown device type" if that still
 *    fails, and create the device through rtnl_newlink_create().
 *
 * NOTE(review): most guards, error returns and the retry label are elided
 * in this excerpt.
 */
3565 static int __rtnl_newlink(struct sk_buff *skb, struct nlmsghdr *nlh,
3566 struct rtnl_newlink_tbs *tbs,
3567 struct netlink_ext_ack *extack)
3569 struct nlattr *linkinfo[IFLA_INFO_MAX + 1];
3570 struct nlattr ** const tb = tbs->tb;
3571 const struct rtnl_link_ops *m_ops;
3572 struct net_device *master_dev;
3573 struct net *net = sock_net(skb->sk);
3574 const struct rtnl_link_ops *ops;
3575 struct nlattr **slave_data;
3576 char kind[MODULE_NAME_LEN];
3577 struct net_device *dev;
3578 struct ifinfomsg *ifm;
3579 struct nlattr **data;
3580 bool link_specified;
3583 #ifdef CONFIG_MODULES
3586 err = nlmsg_parse_deprecated(nlh, sizeof(*ifm), tb, IFLA_MAX,
3587 ifla_policy, extack);
3591 err = rtnl_ensure_unique_netns(tb, extack, false);
3595 ifm = nlmsg_data(nlh);
3596 if (ifm->ifi_index > 0) {
3597 link_specified = true;
3598 dev = __dev_get_by_index(net, ifm->ifi_index);
3599 } else if (ifm->ifi_index < 0) {
3600 NL_SET_ERR_MSG(extack, "ifindex can't be negative");
3602 } else if (tb[IFLA_IFNAME] || tb[IFLA_ALT_IFNAME]) {
3603 link_specified = true;
3604 dev = rtnl_dev_get(net, tb);
3606 link_specified = false;
3613 master_dev = netdev_master_upper_dev_get(dev);
3615 m_ops = master_dev->rtnl_link_ops;
3618 if (tb[IFLA_LINKINFO]) {
3619 err = nla_parse_nested_deprecated(linkinfo, IFLA_INFO_MAX,
3621 ifla_info_policy, NULL);
3625 memset(linkinfo, 0, sizeof(linkinfo));
3627 if (linkinfo[IFLA_INFO_KIND]) {
3628 nla_strscpy(kind, linkinfo[IFLA_INFO_KIND], sizeof(kind));
3629 ops = rtnl_link_ops_get(kind);
3637 if (ops->maxtype > RTNL_MAX_TYPE)
3640 if (ops->maxtype && linkinfo[IFLA_INFO_DATA]) {
3641 err = nla_parse_nested_deprecated(tbs->attr, ops->maxtype,
3642 linkinfo[IFLA_INFO_DATA],
3643 ops->policy, extack);
3648 if (ops->validate) {
3649 err = ops->validate(tb, data, extack);
3657 if (m_ops->slave_maxtype > RTNL_SLAVE_MAX_TYPE)
3660 if (m_ops->slave_maxtype &&
3661 linkinfo[IFLA_INFO_SLAVE_DATA]) {
3662 err = nla_parse_nested_deprecated(tbs->slave_attr,
3663 m_ops->slave_maxtype,
3664 linkinfo[IFLA_INFO_SLAVE_DATA],
3665 m_ops->slave_policy,
3669 slave_data = tbs->slave_attr;
3676 if (nlh->nlmsg_flags & NLM_F_EXCL)
3678 if (nlh->nlmsg_flags & NLM_F_REPLACE)
3681 err = validate_linkmsg(dev, tb, extack);
3685 if (linkinfo[IFLA_INFO_DATA]) {
3686 if (!ops || ops != dev->rtnl_link_ops ||
3690 err = ops->changelink(dev, tb, data, extack);
3693 status |= DO_SETLINK_NOTIFY;
3696 if (linkinfo[IFLA_INFO_SLAVE_DATA]) {
3697 if (!m_ops || !m_ops->slave_changelink)
3700 err = m_ops->slave_changelink(master_dev, dev, tb,
3701 slave_data, extack);
3704 status |= DO_SETLINK_NOTIFY;
3707 return do_setlink(skb, dev, ifm, extack, tb, status);
3710 if (!(nlh->nlmsg_flags & NLM_F_CREATE)) {
3711 /* No dev found and NLM_F_CREATE not set. Requested dev does not exist,
3712 * or it's for a group
3717 return rtnl_group_changelink(skb, net,
3718 nla_get_u32(tb[IFLA_GROUP]),
3723 if (tb[IFLA_MAP] || tb[IFLA_PROTINFO])
3727 #ifdef CONFIG_MODULES
3730 request_module("rtnl-link-%s", kind);
3732 ops = rtnl_link_ops_get(kind);
3737 NL_SET_ERR_MSG(extack, "Unknown device type");
3741 return rtnl_newlink_create(skb, ifm, ops, nlh, tb, data, extack);
/*
 * rtnl_newlink - wrapper that supplies scratch tables to __rtnl_newlink().
 * @skb: request skb
 * @nlh: netlink request header
 * @extack: extended ack
 *
 * The struct rtnl_newlink_tbs is allocated with kmalloc(GFP_KERNEL)
 * rather than placed on the stack (presumably because of its size).
 * NOTE(review): the allocation-failure check and the matching free are
 * not visible in this excerpt.
 */
3744 static int rtnl_newlink(struct sk_buff *skb, struct nlmsghdr *nlh,
3745 struct netlink_ext_ack *extack)
3747 struct rtnl_newlink_tbs *tbs;
3750 tbs = kmalloc(sizeof(*tbs), GFP_KERNEL);
3754 ret = __rtnl_newlink(skb, nlh, tbs, extack);
/*
 * rtnl_valid_getlink_req - parse and sanity-check a get-link request.
 * @skb: request skb; decides whether strict checking applies
 * @nlh: netlink header followed by a struct ifinfomsg
 * @extack: extended ack receiving the rejection messages
 *
 * A message too short for the ifinfomsg header is rejected.  Without
 * strict checking the message is parsed with the legacy, lenient parser
 * and its result returned directly.  With strict checking the header must
 * not carry values in the tested fields, the strict parser is used, and
 * only an allow-list of attributes (including IFLA_ALT_IFNAME and
 * IFLA_TARGET_NETNSID) is accepted.
 * NOTE(review): the tb parameter line, part of the header test and most of
 * the switch are elided in this excerpt.
 */
3759 static int rtnl_valid_getlink_req(struct sk_buff *skb,
3760 const struct nlmsghdr *nlh,
3762 struct netlink_ext_ack *extack)
3764 struct ifinfomsg *ifm;
3767 if (nlh->nlmsg_len < nlmsg_msg_size(sizeof(*ifm))) {
3768 NL_SET_ERR_MSG(extack, "Invalid header for get link");
3772 if (!netlink_strict_get_check(skb))
3773 return nlmsg_parse_deprecated(nlh, sizeof(*ifm), tb, IFLA_MAX,
3774 ifla_policy, extack);
3776 ifm = nlmsg_data(nlh);
3777 if (ifm->__ifi_pad || ifm->ifi_type || ifm->ifi_flags ||
3779 NL_SET_ERR_MSG(extack, "Invalid values in header for get link request");
3783 err = nlmsg_parse_deprecated_strict(nlh, sizeof(*ifm), tb, IFLA_MAX,
3784 ifla_policy, extack);
3788 for (i = 0; i <= IFLA_MAX; i++) {
3794 case IFLA_ALT_IFNAME:
3796 case IFLA_TARGET_NETNSID:
3799 NL_SET_ERR_MSG(extack, "Unsupported attribute in get link request");
/*
 * rtnl_getlink - answer a request for one link with a unicast RTM_NEWLINK.
 * @skb: request skb; supplies the sender's namespace and portid
 * @nlh: netlink request header
 * @extack: extended ack
 *
 * The request is validated by rtnl_valid_getlink_req().  When
 * IFLA_TARGET_NETNSID is present, the device is looked up in that
 * namespace (tgt_net), both by index and by name.  The reply is built
 * with rtnl_fill_ifinfo() and sent with rtnl_unicast(), both of which are
 * passed the sender's namespace (net), not tgt_net.
 * IFLA_EXT_MASK, when present, is used both to size and to fill the reply.
 * NOTE(review): error checks and the release of tgt_net are elided here.
 */
3807 static int rtnl_getlink(struct sk_buff *skb, struct nlmsghdr *nlh,
3808 struct netlink_ext_ack *extack)
3810 struct net *net = sock_net(skb->sk);
3811 struct net *tgt_net = net;
3812 struct ifinfomsg *ifm;
3813 struct nlattr *tb[IFLA_MAX+1];
3814 struct net_device *dev = NULL;
3815 struct sk_buff *nskb;
3818 u32 ext_filter_mask = 0;
3820 err = rtnl_valid_getlink_req(skb, nlh, tb, extack);
3824 err = rtnl_ensure_unique_netns(tb, extack, true);
3828 if (tb[IFLA_TARGET_NETNSID]) {
3829 netnsid = nla_get_s32(tb[IFLA_TARGET_NETNSID]);
3830 tgt_net = rtnl_get_net_ns_capable(NETLINK_CB(skb).sk, netnsid);
3831 if (IS_ERR(tgt_net))
3832 return PTR_ERR(tgt_net);
3835 if (tb[IFLA_EXT_MASK])
3836 ext_filter_mask = nla_get_u32(tb[IFLA_EXT_MASK]);
3839 ifm = nlmsg_data(nlh);
3840 if (ifm->ifi_index > 0)
3841 dev = __dev_get_by_index(tgt_net, ifm->ifi_index);
3842 else if (tb[IFLA_IFNAME] || tb[IFLA_ALT_IFNAME])
3843 dev = rtnl_dev_get(tgt_net, tb);
3852 nskb = nlmsg_new(if_nlmsg_size(dev, ext_filter_mask), GFP_KERNEL);
3856 err = rtnl_fill_ifinfo(nskb, dev, net,
3857 RTM_NEWLINK, NETLINK_CB(skb).portid,
3858 nlh->nlmsg_seq, 0, 0, ext_filter_mask,
3859 0, NULL, 0, netnsid, GFP_KERNEL);
3861 /* -EMSGSIZE implies BUG in if_nlmsg_size */
3862 WARN_ON(err == -EMSGSIZE);
3865 err = rtnl_unicast(nskb, net, NETLINK_CB(skb).portid);
/*
 * rtnl_alt_ifname - add or remove one alternative name on @dev.
 * @cmd: RTM_NEWLINKPROP to add the name, RTM_DELLINKPROP to remove it
 * @dev: device whose alternative-name list is modified
 * @attr: IFLA_ALT_IFNAME attribute carrying the name
 * @changed: output flag (the statement that sets it is not visible here)
 * @extack: extended ack
 *
 * The attribute is validated against ifla_policy.  For an add, the size
 * of the existing property list plus one maximum-length name must stay
 * below U16_MAX, otherwise the request is rejected with "effective
 * property list too long".  The name is duplicated with
 * nla_strdup(GFP_KERNEL_ACCOUNT) before it is given to the name-node
 * helpers.
 * NOTE(review): the ownership of alt_ifname after each helper call is not
 * visible in this excerpt.
 */
3873 static int rtnl_alt_ifname(int cmd, struct net_device *dev, struct nlattr *attr,
3874 bool *changed, struct netlink_ext_ack *extack)
3880 err = nla_validate(attr, attr->nla_len, IFLA_MAX, ifla_policy, extack);
3884 if (cmd == RTM_NEWLINKPROP) {
3885 size = rtnl_prop_list_size(dev);
3886 size += nla_total_size(ALTIFNAMSIZ);
3887 if (size >= U16_MAX) {
3888 NL_SET_ERR_MSG(extack,
3889 "effective property list too long");
3894 alt_ifname = nla_strdup(attr, GFP_KERNEL_ACCOUNT);
3898 if (cmd == RTM_NEWLINKPROP) {
3899 err = netdev_name_node_alt_create(dev, alt_ifname);
3902 } else if (cmd == RTM_DELLINKPROP) {
3903 err = netdev_name_node_alt_destroy(dev, alt_ifname);
/*
 * rtnl_linkprop - shared implementation of the link-property requests.
 * @cmd: RTM_NEWLINKPROP or RTM_DELLINKPROP, forwarded to rtnl_alt_ifname()
 * @skb: request skb; its socket selects the namespace that is searched
 * @nlh: netlink request header
 * @extack: extended ack
 *
 * Unlike the legacy link handlers this one uses nlmsg_parse(), not the
 * deprecated parser.  The device is resolved by index or name, then each
 * IFLA_ALT_IFNAME nested in IFLA_PROP_LIST is processed in turn.
 * netdev_state_change() is called at the end (presumably only when a
 * name actually changed; the guard is not visible here).
 */
3915 static int rtnl_linkprop(int cmd, struct sk_buff *skb, struct nlmsghdr *nlh,
3916 struct netlink_ext_ack *extack)
3918 struct net *net = sock_net(skb->sk);
3919 struct nlattr *tb[IFLA_MAX + 1];
3920 struct net_device *dev;
3921 struct ifinfomsg *ifm;
3922 bool changed = false;
3923 struct nlattr *attr;
3926 err = nlmsg_parse(nlh, sizeof(*ifm), tb, IFLA_MAX, ifla_policy, extack);
3930 err = rtnl_ensure_unique_netns(tb, extack, true);
3934 ifm = nlmsg_data(nlh);
3935 if (ifm->ifi_index > 0)
3936 dev = __dev_get_by_index(net, ifm->ifi_index);
3937 else if (tb[IFLA_IFNAME] || tb[IFLA_ALT_IFNAME])
3938 dev = rtnl_dev_get(net, tb);
3945 if (!tb[IFLA_PROP_LIST])
3948 nla_for_each_nested(attr, tb[IFLA_PROP_LIST], rem) {
3949 switch (nla_type(attr)) {
3950 case IFLA_ALT_IFNAME:
3951 err = rtnl_alt_ifname(cmd, dev, attr, &changed, extack);
3959 netdev_state_change(dev);
/* Thin wrapper: runs rtnl_linkprop() with cmd fixed to RTM_NEWLINKPROP. */
3963 static int rtnl_newlinkprop(struct sk_buff *skb, struct nlmsghdr *nlh,
3964 struct netlink_ext_ack *extack)
3966 return rtnl_linkprop(RTM_NEWLINKPROP, skb, nlh, extack);
/* Thin wrapper: runs rtnl_linkprop() with cmd fixed to RTM_DELLINKPROP. */
3969 static int rtnl_dellinkprop(struct sk_buff *skb, struct nlmsghdr *nlh,
3970 struct netlink_ext_ack *extack)
3972 return rtnl_linkprop(RTM_DELLINKPROP, skb, nlh, extack);
/*
 * rtnl_calcit - compute the buffer size needed for a link dump.
 * @skb: request skb; its socket selects the namespace whose devices count
 * @nlh: dump request header
 *
 * The header length used for parsing depends on the payload size: a
 * payload shorter than struct ifinfomsg is treated as a struct rtgenmsg.
 * Parse failures are tolerated and simply leave the filter mask at 0.
 *
 * Return: NLMSG_GOODSIZE when no IFLA_EXT_MASK was supplied; otherwise
 * the largest if_nlmsg_size() over all devices in the namespace, wrapped
 * by nlmsg_total_size().
 */
3975 static u32 rtnl_calcit(struct sk_buff *skb, struct nlmsghdr *nlh)
3977 struct net *net = sock_net(skb->sk);
3978 size_t min_ifinfo_dump_size = 0;
3979 struct nlattr *tb[IFLA_MAX+1];
3980 u32 ext_filter_mask = 0;
3981 struct net_device *dev;
3984 /* Same kernel<->userspace interface hack as in rtnl_dump_ifinfo. */
3985 hdrlen = nlmsg_len(nlh) < sizeof(struct ifinfomsg) ?
3986 sizeof(struct rtgenmsg) : sizeof(struct ifinfomsg);
3988 if (nlmsg_parse_deprecated(nlh, hdrlen, tb, IFLA_MAX, ifla_policy, NULL) >= 0) {
3989 if (tb[IFLA_EXT_MASK])
3990 ext_filter_mask = nla_get_u32(tb[IFLA_EXT_MASK]);
3993 if (!ext_filter_mask)
3994 return NLMSG_GOODSIZE;
3996 * traverse the list of net devices and compute the minimum
3997 * buffer size based upon the filter mask.
4000 for_each_netdev_rcu(net, dev) {
4001 min_ifinfo_dump_size = max(min_ifinfo_dump_size,
4002 if_nlmsg_size(dev, ext_filter_mask));
4006 return nlmsg_total_size(min_ifinfo_dump_size);
/*
 * rtnl_dump_all - run the dump callback of every family for one message type.
 * @skb: dump buffer being filled
 * @cb: netlink dump state; cb->family holds the family index to resume at
 *
 * The message type is taken relative to RTM_BASE.  Families are walked
 * from 1 to RTNL_FAMILY_MAX; indices below the resume point and PF_PACKET
 * are skipped, as are types outside 0..RTM_NR_MSGTYPES-1.  For each
 * family the handler table and the handler entry are read with
 * rcu_dereference_rtnl().  cb->args is zeroed before a dumpit call (the
 * guard on that memset is not visible here).
 *
 * Return: skb->len when non-zero, otherwise the last dumpit result.
 */
4009 static int rtnl_dump_all(struct sk_buff *skb, struct netlink_callback *cb)
4012 int s_idx = cb->family;
4013 int type = cb->nlh->nlmsg_type - RTM_BASE;
4019 for (idx = 1; idx <= RTNL_FAMILY_MAX; idx++) {
4020 struct rtnl_link __rcu **tab;
4021 struct rtnl_link *link;
4022 rtnl_dumpit_func dumpit;
4024 if (idx < s_idx || idx == PF_PACKET)
4027 if (type < 0 || type >= RTM_NR_MSGTYPES)
4030 tab = rcu_dereference_rtnl(rtnl_msg_handlers[idx]);
4034 link = rcu_dereference_rtnl(tab[type]);
4038 dumpit = link->dumpit;
4043 memset(&cb->args[0], 0, sizeof(cb->args));
4047 ret = dumpit(skb, cb);
4053 return skb->len ? : ret;
/*
 * rtmsg_ifinfo_build_skb - build a link notification message for @dev.
 * @type: netlink message type placed in the notification
 * @dev: device being described; its own namespace is used for the fill
 * @change: change mask forwarded to rtnl_fill_ifinfo()
 * @event: event code forwarded to rtnl_fill_ifinfo()
 * @flags: allocation flags for the skb and the fill
 * @new_nsid: forwarded to rtnl_fill_ifinfo()
 * @new_ifindex: forwarded to rtnl_fill_ifinfo()
 * @portid: forwarded to rtnl_fill_ifinfo()
 * @nlh: optional originating request; when nlmsg_report() is true for it,
 *	its sequence number is reused in the notification
 *
 * The skb is sized with if_nlmsg_size(dev, 0).  On a path whose condition
 * is not visible here the error is recorded on RTNLGRP_LINK listeners
 * with rtnl_set_sk_err().
 */
4056 struct sk_buff *rtmsg_ifinfo_build_skb(int type, struct net_device *dev,
4057 unsigned int change,
4058 u32 event, gfp_t flags, int *new_nsid,
4059 int new_ifindex, u32 portid,
4060 const struct nlmsghdr *nlh)
4062 struct net *net = dev_net(dev);
4063 struct sk_buff *skb;
4067 skb = nlmsg_new(if_nlmsg_size(dev, 0), flags);
4071 if (nlmsg_report(nlh))
4072 seq = nlmsg_seq(nlh);
4076 err = rtnl_fill_ifinfo(skb, dev, dev_net(dev),
4077 type, portid, seq, change, 0, 0, event,
4078 new_nsid, new_ifindex, -1, flags);
4080 /* -EMSGSIZE implies BUG in if_nlmsg_size() */
4081 WARN_ON(err == -EMSGSIZE);
4088 rtnl_set_sk_err(net, RTNLGRP_LINK, err);
/*
 * rtmsg_ifinfo_send - deliver a prepared link notification.
 * @skb: message to send
 * @dev: device the message describes; its namespace selects the listeners
 * @flags: allocation flags forwarded to rtnl_notify()
 * @portid: forwarded to rtnl_notify()
 * @nlh: forwarded to rtnl_notify()
 *
 * The message goes to the RTNLGRP_LINK multicast group.
 */
4092 void rtmsg_ifinfo_send(struct sk_buff *skb, struct net_device *dev, gfp_t flags,
4093 u32 portid, const struct nlmsghdr *nlh)
4095 struct net *net = dev_net(dev);
4097 rtnl_notify(skb, net, portid, RTNLGRP_LINK, nlh, flags);
/*
 * rtmsg_ifinfo_event - build and send a link notification in one step.
 *
 * All arguments are forwarded to rtmsg_ifinfo_build_skb() and
 * rtmsg_ifinfo_send().  The device's reg_state is compared with
 * NETREG_REGISTERED first (presumably to skip devices that are not fully
 * registered; the statement under that test is not visible here).
 */
4100 static void rtmsg_ifinfo_event(int type, struct net_device *dev,
4101 unsigned int change, u32 event,
4102 gfp_t flags, int *new_nsid, int new_ifindex,
4103 u32 portid, const struct nlmsghdr *nlh)
4105 struct sk_buff *skb;
4107 if (dev->reg_state != NETREG_REGISTERED)
4110 skb = rtmsg_ifinfo_build_skb(type, dev, change, event, flags, new_nsid,
4111 new_ifindex, portid, nlh);
4113 rtmsg_ifinfo_send(skb, dev, flags, portid, nlh);
/*
 * rtmsg_ifinfo - send a link notification for @dev.
 *
 * Calls rtmsg_ifinfo_event() with the event from rtnl_get_event(0), no
 * new namespace id and a new ifindex of 0; @portid and @nlh are passed
 * through.
 */
4116 void rtmsg_ifinfo(int type, struct net_device *dev, unsigned int change,
4117 gfp_t flags, u32 portid, const struct nlmsghdr *nlh)
4119 rtmsg_ifinfo_event(type, dev, change, rtnl_get_event(0), flags,
4120 NULL, 0, portid, nlh);
/*
 * rtmsg_ifinfo_newnet - send a link notification that carries a new
 * namespace id and a new ifindex.
 *
 * Calls rtmsg_ifinfo_event() with the event from rtnl_get_event(0), a
 * portid of 0 and no originating request header.
 */
4123 void rtmsg_ifinfo_newnet(int type, struct net_device *dev, unsigned int change,
4124 gfp_t flags, int *new_nsid, int new_ifindex)
4126 rtmsg_ifinfo_event(type, dev, change, rtnl_get_event(0), flags,
4127 new_nsid, new_ifindex, 0, NULL);
/*
 * nlmsg_populate_fdb_fill - write one FDB entry into @skb.
 * @skb: message buffer being filled
 * @dev: device owning the entry; supplies ifindex and address length
 * @addr: link-layer address, dev->addr_len bytes are copied
 * @vid: VLAN id written as NDA_VLAN (the guard in front of that put is
 *	not visible here)
 * @pid: netlink portid for the message header
 * @seq: sequence number for the message header
 * @type: netlink message type
 * @flags: value stored in ndm_flags
 * @nlflags: netlink header flags
 * @ndm_state: value stored in ndm_state
 *
 * The ndmsg header is filled with family AF_BRIDGE.  Any attribute that
 * does not fit jumps to nla_put_failure, where the partially built
 * message is cancelled with nlmsg_cancel().
 */
4130 static int nlmsg_populate_fdb_fill(struct sk_buff *skb,
4131 struct net_device *dev,
4132 u8 *addr, u16 vid, u32 pid, u32 seq,
4133 int type, unsigned int flags,
4134 int nlflags, u16 ndm_state)
4136 struct nlmsghdr *nlh;
4139 nlh = nlmsg_put(skb, pid, seq, type, sizeof(*ndm), nlflags);
4143 ndm = nlmsg_data(nlh);
4144 ndm->ndm_family = AF_BRIDGE;
4147 ndm->ndm_flags = flags;
4149 ndm->ndm_ifindex = dev->ifindex;
4150 ndm->ndm_state = ndm_state;
4152 if (nla_put(skb, NDA_LLADDR, dev->addr_len, addr))
4153 goto nla_put_failure;
4155 if (nla_put(skb, NDA_VLAN, sizeof(u16), &vid))
4156 goto nla_put_failure;
4158 nlmsg_end(skb, nlh);
4162 nlmsg_cancel(skb, nlh);
/*
 * rtnl_fdb_nlmsg_size - payload size needed for one FDB notification on
 * @dev: the aligned ndmsg header plus room for the NDA_LLADDR and
 * NDA_VLAN attributes.
 * NOTE(review): the final term of the sum is not visible in this excerpt.
 */
4166 static inline size_t rtnl_fdb_nlmsg_size(const struct net_device *dev)
4168 return NLMSG_ALIGN(sizeof(struct ndmsg)) +
4169 nla_total_size(dev->addr_len) + /* NDA_LLADDR */
4170 nla_total_size(sizeof(u16)) + /* NDA_VLAN */
/*
 * rtnl_fdb_notify - multicast an FDB change for @dev to RTNLGRP_NEIGH.
 * @dev: device the entry belongs to
 * @addr: link-layer address of the entry
 * @vid: VLAN id of the entry
 * @type: netlink message type of the notification
 *
 * The skb is allocated with GFP_ATOMIC and filled through
 * nlmsg_populate_fdb_fill() with flags NTF_SELF, portid 0 and sequence 0.
 * On the failure path visible at the end, the error is recorded on the
 * group's listeners with rtnl_set_sk_err().
 * NOTE(review): the last parameter line is elided in this excerpt.
 */
4174 static void rtnl_fdb_notify(struct net_device *dev, u8 *addr, u16 vid, int type,
4177 struct net *net = dev_net(dev);
4178 struct sk_buff *skb;
4181 skb = nlmsg_new(rtnl_fdb_nlmsg_size(dev), GFP_ATOMIC);
4185 err = nlmsg_populate_fdb_fill(skb, dev, addr, vid,
4186 0, 0, type, NTF_SELF, 0, ndm_state);
4192 rtnl_notify(skb, net, 0, RTNLGRP_NEIGH, NULL, GFP_ATOMIC);
4195 rtnl_set_sk_err(net, RTNLGRP_NEIGH, err);
4199 * ndo_dflt_fdb_add - default netdevice operation to add an FDB entry
/*
 * Default FDB add: the entry is installed in the device's unicast or
 * multicast address list.
 * @ndm: request header; a non-zero ndm_state must include NUD_PERMANENT
 * @tb: parsed NDA_* attributes; NDA_FLAGS_EXT is not accepted
 * @dev: device receiving the address
 * @addr: Ethernet address to add
 * @vid: VLAN id (not supported by this default, per the message below)
 *
 * Unicast and link-local addresses go through dev_uc_add_excl(), other
 * multicast addresses through dev_mc_add_excl().  An -EEXIST result is
 * treated specially when NLM_F_EXCL is not set in the request flags.
 * NOTE(review): the trailing parameters and the return statements are not
 * visible in this excerpt.
 */
4201 int ndo_dflt_fdb_add(struct ndmsg *ndm,
4202 struct nlattr *tb[],
4203 struct net_device *dev,
4204 const unsigned char *addr, u16 vid,
4209 /* If aging addresses are supported device will need to
4210 * implement its own handler for this.
4212 if (ndm->ndm_state && !(ndm->ndm_state & NUD_PERMANENT)) {
4213 netdev_info(dev, "default FDB implementation only supports local addresses\n");
4217 if (tb[NDA_FLAGS_EXT]) {
4218 netdev_info(dev, "invalid flags given to default FDB implementation\n");
4223 netdev_info(dev, "vlans aren't supported yet for dev_uc|mc_add()\n");
4227 if (is_unicast_ether_addr(addr) || is_link_local_ether_addr(addr))
4228 err = dev_uc_add_excl(dev, addr);
4229 else if (is_multicast_ether_addr(addr))
4230 err = dev_mc_add_excl(dev, addr);
4232 /* Only return duplicate errors if NLM_F_EXCL is set */
4233 if (err == -EEXIST && !(flags & NLM_F_EXCL))
4238 EXPORT_SYMBOL(ndo_dflt_fdb_add);
/*
 * fdb_vid_parse - extract and range-check a VLAN id attribute.
 * @vlan_attr: NDA_VLAN attribute (callers pass tb[NDA_VLAN] directly)
 * @p_vid: output VLAN id (the store is not visible in this excerpt)
 * @extack: receives "invalid vlan attribute size" or "invalid vlan id"
 *
 * The payload must be exactly sizeof(u16) bytes.  A VLAN id of 0, or one
 * at or above VLAN_VID_MASK, is rejected.
 */
4240 static int fdb_vid_parse(struct nlattr *vlan_attr, u16 *p_vid,
4241 struct netlink_ext_ack *extack)
4246 if (nla_len(vlan_attr) != sizeof(u16)) {
4247 NL_SET_ERR_MSG(extack, "invalid vlan attribute size");
4251 vid = nla_get_u16(vlan_attr);
4253 if (!vid || vid >= VLAN_VID_MASK) {
4254 NL_SET_ERR_MSG(extack, "invalid vlan id");
/*
 * rtnl_fdb_add - add an FDB entry on request.
 * @skb: request skb; its socket selects the namespace that is searched
 * @nlh: netlink header followed by a struct ndmsg and NDA_* attributes
 * @extack: receives a message for each rejection visible below
 *
 * The request must name a non-zero, existing ifindex, carry an
 * NDA_LLADDR of exactly ETH_ALEN bytes and target an ARPHRD_ETHER device.
 *
 * Two delivery paths follow, and both may run for one request:
 *  - master path: when ndm_flags is 0 or has NTF_MASTER and the device is
 *    a bridge port, the master's ndo_fdb_add() is called and NTF_MASTER
 *    is cleared from ndm_flags;
 *  - self path: when NTF_SELF is set, the device's own ndo_fdb_add() is
 *    used if present, otherwise ndo_dflt_fdb_add(); an RTM_NEWNEIGH
 *    notification is sent and NTF_SELF is cleared.
 * NOTE(review): the error checks between these steps are elided here.
 */
4262 static int rtnl_fdb_add(struct sk_buff *skb, struct nlmsghdr *nlh,
4263 struct netlink_ext_ack *extack)
4265 struct net *net = sock_net(skb->sk);
4267 struct nlattr *tb[NDA_MAX+1];
4268 struct net_device *dev;
4273 err = nlmsg_parse_deprecated(nlh, sizeof(*ndm), tb, NDA_MAX, NULL,
4278 ndm = nlmsg_data(nlh);
4279 if (ndm->ndm_ifindex == 0) {
4280 NL_SET_ERR_MSG(extack, "invalid ifindex");
4284 dev = __dev_get_by_index(net, ndm->ndm_ifindex);
4286 NL_SET_ERR_MSG(extack, "unknown ifindex");
4290 if (!tb[NDA_LLADDR] || nla_len(tb[NDA_LLADDR]) != ETH_ALEN) {
4291 NL_SET_ERR_MSG(extack, "invalid address");
4295 if (dev->type != ARPHRD_ETHER) {
4296 NL_SET_ERR_MSG(extack, "FDB add only supported for Ethernet devices");
4300 addr = nla_data(tb[NDA_LLADDR]);
4302 err = fdb_vid_parse(tb[NDA_VLAN], &vid, extack);
4308 /* Support fdb on master device the net/bridge default case */
4309 if ((!ndm->ndm_flags || ndm->ndm_flags & NTF_MASTER) &&
4310 netif_is_bridge_port(dev)) {
4311 struct net_device *br_dev = netdev_master_upper_dev_get(dev);
4312 const struct net_device_ops *ops = br_dev->netdev_ops;
4314 err = ops->ndo_fdb_add(ndm, tb, dev, addr, vid,
4315 nlh->nlmsg_flags, extack);
4319 ndm->ndm_flags &= ~NTF_MASTER;
4322 /* Embedded bridge, macvlan, and any other device support */
4323 if ((ndm->ndm_flags & NTF_SELF)) {
4324 if (dev->netdev_ops->ndo_fdb_add)
4325 err = dev->netdev_ops->ndo_fdb_add(ndm, tb, dev, addr,
4330 err = ndo_dflt_fdb_add(ndm, tb, dev, addr, vid,
4334 rtnl_fdb_notify(dev, addr, vid, RTM_NEWNEIGH,
4336 ndm->ndm_flags &= ~NTF_SELF;
4344 * ndo_dflt_fdb_del - default netdevice operation to delete an FDB entry
/*
 * Default FDB delete: the entry is removed from the device's unicast or
 * multicast address list.
 * @ndm: request header; ndm_state must include NUD_PERMANENT
 * @tb: parsed NDA_* attributes (not referenced in the visible lines)
 * @dev: device losing the address
 * @addr: Ethernet address to remove
 * @vid: VLAN id (not referenced in the visible lines)
 *
 * Unicast and link-local addresses go through dev_uc_del(), other
 * multicast addresses through dev_mc_del().
 * NOTE(review): the return statements are not visible in this excerpt.
 */
4346 int ndo_dflt_fdb_del(struct ndmsg *ndm,
4347 struct nlattr *tb[],
4348 struct net_device *dev,
4349 const unsigned char *addr, u16 vid)
4353 /* If aging addresses are supported device will need to
4354 * implement its own handler for this.
4356 if (!(ndm->ndm_state & NUD_PERMANENT)) {
4357 netdev_info(dev, "default FDB implementation only supports local addresses\n");
4361 if (is_unicast_ether_addr(addr) || is_link_local_ether_addr(addr))
4362 err = dev_uc_del(dev, addr);
4363 else if (is_multicast_ether_addr(addr))
4364 err = dev_mc_del(dev, addr);
4368 EXPORT_SYMBOL(ndo_dflt_fdb_del);
/*
 * rtnl_fdb_del - delete one FDB entry, or a bulk of entries, on request.
 * @skb: request skb; the sender must have CAP_NET_ADMIN
 * @nlh: netlink header; NLM_F_BULK selects bulk deletion
 * @extack: receives a message for each rejection visible below
 *
 * Two parsers appear: the deprecated one and, next to the bulk-delete
 * comment, nlmsg_parse().  The request must name a non-zero, existing
 * ifindex and an ARPHRD_ETHER device.  An NDA_LLADDR of exactly ETH_ALEN
 * bytes is required on a path whose guard is not visible here.
 *
 * As in the add path, a master path (bridge port with ndm_flags 0 or
 * NTF_MASTER) and a self path (NTF_SELF) may both run.  Each calls
 * ndo_fdb_del() or ndo_fdb_del_bulk() when the ops provide it; the self
 * path also has ndo_dflt_fdb_del() as a fallback and sends an
 * RTM_DELNEIGH notification.
 * NOTE(review): the bulk/non-bulk branch conditions and the error checks
 * are elided in this excerpt.
 */
4370 static int rtnl_fdb_del(struct sk_buff *skb, struct nlmsghdr *nlh,
4371 struct netlink_ext_ack *extack)
4373 bool del_bulk = !!(nlh->nlmsg_flags & NLM_F_BULK);
4374 struct net *net = sock_net(skb->sk);
4375 const struct net_device_ops *ops;
4377 struct nlattr *tb[NDA_MAX+1];
4378 struct net_device *dev;
4383 if (!netlink_capable(skb, CAP_NET_ADMIN))
4387 err = nlmsg_parse_deprecated(nlh, sizeof(*ndm), tb, NDA_MAX,
4390 /* For bulk delete, the drivers will parse the message with
4393 err = nlmsg_parse(nlh, sizeof(*ndm), tb, NDA_MAX, NULL, extack);
4398 ndm = nlmsg_data(nlh);
4399 if (ndm->ndm_ifindex == 0) {
4400 NL_SET_ERR_MSG(extack, "invalid ifindex");
4404 dev = __dev_get_by_index(net, ndm->ndm_ifindex);
4406 NL_SET_ERR_MSG(extack, "unknown ifindex");
4411 if (!tb[NDA_LLADDR] || nla_len(tb[NDA_LLADDR]) != ETH_ALEN) {
4412 NL_SET_ERR_MSG(extack, "invalid address");
4415 addr = nla_data(tb[NDA_LLADDR]);
4417 err = fdb_vid_parse(tb[NDA_VLAN], &vid, extack);
4422 if (dev->type != ARPHRD_ETHER) {
4423 NL_SET_ERR_MSG(extack, "FDB delete only supported for Ethernet devices");
4429 /* Support fdb on master device the net/bridge default case */
4430 if ((!ndm->ndm_flags || ndm->ndm_flags & NTF_MASTER) &&
4431 netif_is_bridge_port(dev)) {
4432 struct net_device *br_dev = netdev_master_upper_dev_get(dev);
4434 ops = br_dev->netdev_ops;
4436 if (ops->ndo_fdb_del)
4437 err = ops->ndo_fdb_del(ndm, tb, dev, addr, vid, extack);
4439 if (ops->ndo_fdb_del_bulk)
4440 err = ops->ndo_fdb_del_bulk(nlh, dev, extack);
4446 ndm->ndm_flags &= ~NTF_MASTER;
4449 /* Embedded bridge, macvlan, and any other device support */
4450 if (ndm->ndm_flags & NTF_SELF) {
4451 ops = dev->netdev_ops;
4453 if (ops->ndo_fdb_del)
4454 err = ops->ndo_fdb_del(ndm, tb, dev, addr, vid, extack);
4456 err = ndo_dflt_fdb_del(ndm, tb, dev, addr, vid);
4458 /* in case err was cleared by NTF_MASTER call */
4460 if (ops->ndo_fdb_del_bulk)
4461 err = ops->ndo_fdb_del_bulk(nlh, dev, extack);
4466 rtnl_fdb_notify(dev, addr, vid, RTM_DELNEIGH,
4468 ndm->ndm_flags &= ~NTF_SELF;
// nlmsg_populate_fdb - emit one FDB message per address in a hw address list.
// @skb:  dump buffer being filled
// @cb:   dump callback state; portid and sequence number are taken from it
// @dev:  device the addresses belong to
// @list: hardware address list to walk
// Entries are reported as RTM_NEWNEIGH with NTF_SELF, NLM_F_MULTI and
// NUD_PERMANENT, and with 0 passed after the address.
4475 static int nlmsg_populate_fdb(struct sk_buff *skb,
4476 struct netlink_callback *cb,
4477 struct net_device *dev,
4479 struct netdev_hw_addr_list *list)
4481 struct netdev_hw_addr *ha;
4485 portid = NETLINK_CB(cb->skb).portid;
4486 seq = cb->nlh->nlmsg_seq;
4488 list_for_each_entry(ha, &list->list, list) {
// *idx is compared with cb->args[2]; presumably entries below that value
// were already dumped and are skipped - the skip line is not visible.
4489 if (*idx < cb->args[2])
4492 err = nlmsg_populate_fdb_fill(skb, dev, ha->addr, 0,
4494 RTM_NEWNEIGH, NTF_SELF,
4495 NLM_F_MULTI, NUD_PERMANENT);
4505 * ndo_dflt_fdb_dump - default netdevice operation to dump an FDB table.
4506 * @skb: socket buffer to store message in
4507 * @cb: netlink callback
4509 * @filter_dev: ignored
4510 * @idx: the number of FDB table entries dumped is added to *@idx
4512 * Default netdevice operation to dump the existing unicast address list.
4513 * Returns number of addresses from list put in skb.
// NOTE(review): the visible body stores the result of nlmsg_populate_fdb()
// in err and also walks the multicast list; the return statement is not
// visible here, so confirm the two sentences above against it.
4515 int ndo_dflt_fdb_dump(struct sk_buff *skb,
4516 struct netlink_callback *cb,
4517 struct net_device *dev,
4518 struct net_device *filter_dev,
// Only ARPHRD_ETHER devices are handled.
4523 if (dev->type != ARPHRD_ETHER)
// Both address lists are walked under netif_addr_lock_bh(): dev->uc first,
// then dev->mc.
4526 netif_addr_lock_bh(dev);
4527 err = nlmsg_populate_fdb(skb, cb, dev, idx, &dev->uc);
4530 err = nlmsg_populate_fdb(skb, cb, dev, idx, &dev->mc);
4532 netif_addr_unlock_bh(dev);
4535 EXPORT_SYMBOL(ndo_dflt_fdb_dump);
// valid_fdb_dump_strict - validate an FDB dump request under strict checking.
// @nlh:        request header
// @br_idx:     receives the NDA_MASTER value
// @brport_idx: receives ndm_ifindex, then the NDA_IFINDEX value
// @extack:     extended ack used for error messages
4537 static int valid_fdb_dump_strict(const struct nlmsghdr *nlh,
4538 int *br_idx, int *brport_idx,
4539 struct netlink_ext_ack *extack)
4541 struct nlattr *tb[NDA_MAX + 1];
// The message must be large enough to hold a struct ndmsg header.
4545 if (nlh->nlmsg_len < nlmsg_msg_size(sizeof(*ndm))) {
4546 NL_SET_ERR_MSG(extack, "Invalid header for fdb dump request");
4550 ndm = nlmsg_data(nlh);
// Padding, state, flags and type are all expected to be zero.
4551 if (ndm->ndm_pad1 || ndm->ndm_pad2 || ndm->ndm_state ||
4552 ndm->ndm_flags || ndm->ndm_type) {
4553 NL_SET_ERR_MSG(extack, "Invalid values in header for fdb dump request");
// The parse is given no policy (NULL); the u32 length of the IFINDEX and
// MASTER attributes is checked explicitly below.
4557 err = nlmsg_parse_deprecated_strict(nlh, sizeof(struct ndmsg), tb,
4558 NDA_MAX, NULL, extack);
4562 *brport_idx = ndm->ndm_ifindex;
// NOTE(review): the per-attribute dispatch lines inside this loop are not
// visible in this listing.
4563 for (i = 0; i <= NDA_MAX; ++i) {
4569 if (nla_len(tb[i]) != sizeof(u32)) {
4570 NL_SET_ERR_MSG(extack, "Invalid IFINDEX attribute in fdb dump request");
4573 *brport_idx = nla_get_u32(tb[NDA_IFINDEX]);
4576 if (nla_len(tb[i]) != sizeof(u32)) {
4577 NL_SET_ERR_MSG(extack, "Invalid MASTER attribute in fdb dump request");
4580 *br_idx = nla_get_u32(tb[NDA_MASTER]);
4583 NL_SET_ERR_MSG(extack, "Unsupported attribute in fdb dump request");
// valid_fdb_dump_legacy - validate an FDB dump request without strict checks.
// @nlh:        request header
// @br_idx:     receives IFLA_MASTER when that attribute is present
// @brport_idx: receives ifi_index from the ifinfomsg header
// @extack:     extended ack used for error messages
// The ifinfomsg parse is attempted only when the payload length is neither
// a bare ndmsg nor an ndmsg followed by one u32 attribute.
4591 static int valid_fdb_dump_legacy(const struct nlmsghdr *nlh,
4592 int *br_idx, int *brport_idx,
4593 struct netlink_ext_ack *extack)
4595 struct nlattr *tb[IFLA_MAX+1];
4598 /* A hack to preserve kernel<->userspace interface.
4599 * Before Linux v4.12 this code accepted ndmsg since iproute2 v3.3.0.
4600 * However, ndmsg is shorter than ifinfomsg thus nlmsg_parse() bails.
4601 * So, check for ndmsg with an optional u32 attribute (not used here).
4602 * Fortunately these sizes don't conflict with the size of ifinfomsg
4603 * with an optional attribute.
4605 if (nlmsg_len(nlh) != sizeof(struct ndmsg) &&
4606 (nlmsg_len(nlh) != sizeof(struct ndmsg) +
4607 nla_attr_size(sizeof(u32)))) {
4608 struct ifinfomsg *ifm;
4610 err = nlmsg_parse_deprecated(nlh, sizeof(struct ifinfomsg),
4611 tb, IFLA_MAX, ifla_policy,
// On a successful parse the master index comes from IFLA_MASTER.
4615 } else if (err == 0) {
4616 if (tb[IFLA_MASTER])
4617 *br_idx = nla_get_u32(tb[IFLA_MASTER]);
4620 ifm = nlmsg_data(nlh);
4621 *brport_idx = ifm->ifi_index;
// rtnl_fdb_dump - dump callback that walks the devices of a namespace and
// asks each one for its FDB entries.
// @skb: dump buffer being filled
// @cb:  dump callback state (request header, strict_check, args[])
// Devices are visited bucket by bucket through net->dev_index_head.
4626 static int rtnl_fdb_dump(struct sk_buff *skb, struct netlink_callback *cb)
4628 struct net_device *dev;
4629 struct net_device *br_dev = NULL;
4630 const struct net_device_ops *ops = NULL;
4631 const struct net_device_ops *cops = NULL;
4632 struct net *net = sock_net(skb->sk);
4633 struct hlist_head *head;
// The request is validated by the strict or the legacy helper; both can
// fill br_idx and brport_idx.
4641 if (cb->strict_check)
4642 err = valid_fdb_dump_strict(cb->nlh, &br_idx, &brport_idx,
4645 err = valid_fdb_dump_legacy(cb->nlh, &br_idx, &brport_idx,
// br_idx is resolved to a device and its ops are remembered.
// NOTE(review): the guard around this lookup is not visible here.
4651 br_dev = __dev_get_by_index(net, br_idx);
4655 ops = br_dev->netdev_ops;
// The starting device index comes from cb->args[1]; it is reset to 0 each
// time the loop advances to the next hash bucket.
4659 s_idx = cb->args[1];
4661 for (h = s_h; h < NETDEV_HASHENTRIES; h++, s_idx = 0) {
4663 head = &net->dev_index_head[h];
4664 hlist_for_each_entry(dev, head, index_hlist) {
// A non-zero brport_idx restricts the dump to that one ifindex.
4666 if (brport_idx && (dev->ifindex != brport_idx))
4669 if (!br_idx) { /* user did not specify a specific bridge */
4670 if (netif_is_bridge_port(dev)) {
4671 br_dev = netdev_master_upper_dev_get(dev);
4672 cops = br_dev->netdev_ops;
// Visible filter conditions for the case where a bridge was specified.
// NOTE(review): the statements they guard are not visible in this listing.
4675 if (dev != br_dev &&
4676 !netif_is_bridge_port(dev))
4679 if (br_dev != netdev_master_upper_dev_get(dev) &&
4680 !netif_is_bridge_master(dev))
// Bridge ports are dumped through the master ndo_fdb_dump when it exists.
4688 if (netif_is_bridge_port(dev)) {
4689 if (cops && cops->ndo_fdb_dump) {
4690 err = cops->ndo_fdb_dump(skb, cb,
4693 if (err == -EMSGSIZE)
// The device ndo_fdb_dump is used when set; ndo_dflt_fdb_dump() is the
// other visible option (presumably the else branch - line not shown).
4698 if (dev->netdev_ops->ndo_fdb_dump)
4699 err = dev->netdev_ops->ndo_fdb_dump(skb, cb,
4703 err = ndo_dflt_fdb_dump(skb, cb, dev, NULL,
4705 if (err == -EMSGSIZE)
4710 /* reset fdb offset to 0 for rest of the interfaces */
// valid_fdb_get_strict - validate and decode an FDB get request.
// @nlh:        request header
// @tb:         attribute table filled by the parse (NDA_MAX + 1 slots)
// @ndm_flags:  receives ndm_flags from the header
// @br_idx:     receives a u32 attribute value (master index)
// @brport_idx: receives ndm_ifindex from the header
// @addr:       receives a pointer to the lookup address attribute payload
// @vid:        filled by fdb_vid_parse()
// @extack:     extended ack used for error messages
4726 static int valid_fdb_get_strict(const struct nlmsghdr *nlh,
4727 struct nlattr **tb, u8 *ndm_flags,
4728 int *br_idx, int *brport_idx, u8 **addr,
4729 u16 *vid, struct netlink_ext_ack *extack)
// The message must be large enough to hold a struct ndmsg header.
4734 if (nlh->nlmsg_len < nlmsg_msg_size(sizeof(*ndm))) {
4735 NL_SET_ERR_MSG(extack, "Invalid header for fdb get request");
4739 ndm = nlmsg_data(nlh);
// NOTE(review): the second line of this condition is not visible here.
4740 if (ndm->ndm_pad1 || ndm->ndm_pad2 || ndm->ndm_state ||
4742 NL_SET_ERR_MSG(extack, "Invalid values in header for fdb get request");
// Only NTF_MASTER and NTF_SELF are acceptable header flags.
4746 if (ndm->ndm_flags & ~(NTF_MASTER | NTF_SELF)) {
4747 NL_SET_ERR_MSG(extack, "Invalid flags in header for fdb get request");
// Attributes are parsed against nda_policy.
4751 err = nlmsg_parse_deprecated_strict(nlh, sizeof(struct ndmsg), tb,
4752 NDA_MAX, nda_policy, extack);
4756 *ndm_flags = ndm->ndm_flags;
4757 *brport_idx = ndm->ndm_ifindex;
// NOTE(review): the per-attribute dispatch lines inside this loop are not
// visible in this listing.
4758 for (i = 0; i <= NDA_MAX; ++i) {
4764 *br_idx = nla_get_u32(tb[i]);
// The address attribute must be exactly ETH_ALEN bytes long.
4767 if (nla_len(tb[i]) != ETH_ALEN) {
4768 NL_SET_ERR_MSG(extack, "Invalid address in fdb get request");
4771 *addr = nla_data(tb[i]);
4774 err = fdb_vid_parse(tb[i], vid, extack);
4781 NL_SET_ERR_MSG(extack, "Unsupported attribute in fdb get request");
// rtnl_fdb_get - netlink handler that looks up one FDB entry and unicasts
// the answer back to the requester.
// @in_skb: request buffer
// @nlh:    request header
// @extack: extended ack used for error messages
// The ops used for the lookup come from an explicit master index, from the
// master of a bridge port, or from the device itself (NTF_SELF).
4789 static int rtnl_fdb_get(struct sk_buff *in_skb, struct nlmsghdr *nlh,
4790 struct netlink_ext_ack *extack)
4792 struct net_device *dev = NULL, *br_dev = NULL;
4793 const struct net_device_ops *ops = NULL;
4794 struct net *net = sock_net(in_skb->sk);
4795 struct nlattr *tb[NDA_MAX + 1];
4796 struct sk_buff *skb;
4804 err = valid_fdb_get_strict(nlh, tb, &ndm_flags, &br_idx,
4805 &brport_idx, &addr, &vid, extack);
4810 NL_SET_ERR_MSG(extack, "Missing lookup address for fdb get request");
// The port device is looked up by brport_idx.
// NOTE(review): the guard around this lookup is not visible here.
4815 dev = __dev_get_by_index(net, brport_idx);
4817 NL_SET_ERR_MSG(extack, "Unknown device ifindex");
4824 NL_SET_ERR_MSG(extack, "Master and device are mutually exclusive");
// An explicit master index selects the master device ops.
4828 br_dev = __dev_get_by_index(net, br_idx);
4830 NL_SET_ERR_MSG(extack, "Invalid master ifindex");
4833 ops = br_dev->netdev_ops;
// With no flags or NTF_MASTER the device must be a bridge port and the
// ops of its master are used.
4837 if (!ndm_flags || (ndm_flags & NTF_MASTER)) {
4838 if (!netif_is_bridge_port(dev)) {
4839 NL_SET_ERR_MSG(extack, "Device is not a bridge port");
4842 br_dev = netdev_master_upper_dev_get(dev);
4844 NL_SET_ERR_MSG(extack, "Master of device not found");
4847 ops = br_dev->netdev_ops;
// Otherwise NTF_SELF is required and the device ops are used.
4849 if (!(ndm_flags & NTF_SELF)) {
4850 NL_SET_ERR_MSG(extack, "Missing NTF_SELF");
4853 ops = dev->netdev_ops;
4857 if (!br_dev && !dev) {
4858 NL_SET_ERR_MSG(extack, "No device specified");
4862 if (!ops || !ops->ndo_fdb_get) {
4863 NL_SET_ERR_MSG(extack, "Fdb get operation not supported by device");
// The reply buffer is allocated with NLMSG_GOODSIZE and filled by the
// driver callback, then sent to the portid of the request.
4867 skb = nlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
4873 err = ops->ndo_fdb_get(skb, tb, dev, addr, vid,
4874 NETLINK_CB(in_skb).portid,
4875 nlh->nlmsg_seq, extack);
4879 return rtnl_unicast(skb, net, NETLINK_CB(in_skb).portid);
// brport_nla_put_flag - add a u8 attribute @attrnum whose value is 1 when
// @flag is set in @flags and 0 otherwise.
// @mask is not referenced in the visible lines.
// NOTE(review): the guard before the put is not shown - presumably it tests
// @mask, confirm.
4885 static int brport_nla_put_flag(struct sk_buff *skb, u32 flags, u32 mask,
4886 unsigned int attrnum, unsigned int flag)
4889 return nla_put_u8(skb, attrnum, !!(flags & flag));
// ndo_dflt_bridge_getlink - build an AF_BRIDGE RTM_NEWLINK message for @dev.
// @skb:       buffer to fill
// @pid, @seq: netlink port id and sequence number for the message header
// @dev:       device being described
// @mode:      bridge mode; emitted unless it is BRIDGE_MODE_UNDEF
// @flags:     port flag bits reported inside IFLA_PROTINFO
// @mask:      passed to brport_nla_put_flag() together with @flags
// @nlflags:   netlink message flags
// @vlan_fill: callback invoked inside the IFLA_AF_SPEC nest
// On failure the message is cancelled and err (or -EMSGSIZE when err is 0)
// is returned.
4893 int ndo_dflt_bridge_getlink(struct sk_buff *skb, u32 pid, u32 seq,
4894 struct net_device *dev, u16 mode,
4895 u32 flags, u32 mask, int nlflags,
4897 int (*vlan_fill)(struct sk_buff *skb,
4898 struct net_device *dev,
4901 struct nlmsghdr *nlh;
4902 struct ifinfomsg *ifm;
4903 struct nlattr *br_afspec;
4904 struct nlattr *protinfo;
// A device that is not running is reported as IF_OPER_DOWN.
4905 u8 operstate = netif_running(dev) ? dev->operstate : IF_OPER_DOWN;
4906 struct net_device *br_dev = netdev_master_upper_dev_get(dev);
4909 nlh = nlmsg_put(skb, pid, seq, RTM_NEWLINK, sizeof(*ifm), nlflags);
4913 ifm = nlmsg_data(nlh);
4914 ifm->ifi_family = AF_BRIDGE;
4916 ifm->ifi_type = dev->type;
4917 ifm->ifi_index = dev->ifindex;
4918 ifm->ifi_flags = dev_get_flags(dev);
4919 ifm->ifi_change = 0;
// Top-level link attributes. IFLA_LINK is only added when the iflink
// differs from the ifindex.
// NOTE(review): the guards in front of IFLA_MASTER and IFLA_ADDRESS are
// not visible in this listing.
4922 if (nla_put_string(skb, IFLA_IFNAME, dev->name) ||
4923 nla_put_u32(skb, IFLA_MTU, dev->mtu) ||
4924 nla_put_u8(skb, IFLA_OPERSTATE, operstate) ||
4926 nla_put_u32(skb, IFLA_MASTER, br_dev->ifindex)) ||
4928 nla_put(skb, IFLA_ADDRESS, dev->addr_len, dev->dev_addr)) ||
4929 (dev->ifindex != dev_get_iflink(dev) &&
4930 nla_put_u32(skb, IFLA_LINK, dev_get_iflink(dev))))
4931 goto nla_put_failure;
// IFLA_AF_SPEC nest: BRIDGE_FLAGS_SELF, optional mode, then vlan_fill().
4933 br_afspec = nla_nest_start_noflag(skb, IFLA_AF_SPEC);
4935 goto nla_put_failure;
4937 if (nla_put_u16(skb, IFLA_BRIDGE_FLAGS, BRIDGE_FLAGS_SELF)) {
4938 nla_nest_cancel(skb, br_afspec);
4939 goto nla_put_failure;
4942 if (mode != BRIDGE_MODE_UNDEF) {
4943 if (nla_put_u16(skb, IFLA_BRIDGE_MODE, mode)) {
4944 nla_nest_cancel(skb, br_afspec);
4945 goto nla_put_failure;
4949 err = vlan_fill(skb, dev, filter_mask);
4951 nla_nest_cancel(skb, br_afspec);
4952 goto nla_put_failure;
4955 nla_nest_end(skb, br_afspec);
// IFLA_PROTINFO nest: one u8 attribute per bridge port flag listed below.
4957 protinfo = nla_nest_start(skb, IFLA_PROTINFO);
4959 goto nla_put_failure;
4961 if (brport_nla_put_flag(skb, flags, mask,
4962 IFLA_BRPORT_MODE, BR_HAIRPIN_MODE) ||
4963 brport_nla_put_flag(skb, flags, mask,
4964 IFLA_BRPORT_GUARD, BR_BPDU_GUARD) ||
4965 brport_nla_put_flag(skb, flags, mask,
4966 IFLA_BRPORT_FAST_LEAVE,
4967 BR_MULTICAST_FAST_LEAVE) ||
4968 brport_nla_put_flag(skb, flags, mask,
4969 IFLA_BRPORT_PROTECT, BR_ROOT_BLOCK) ||
4970 brport_nla_put_flag(skb, flags, mask,
4971 IFLA_BRPORT_LEARNING, BR_LEARNING) ||
4972 brport_nla_put_flag(skb, flags, mask,
4973 IFLA_BRPORT_LEARNING_SYNC, BR_LEARNING_SYNC) ||
4974 brport_nla_put_flag(skb, flags, mask,
4975 IFLA_BRPORT_UNICAST_FLOOD, BR_FLOOD) ||
4976 brport_nla_put_flag(skb, flags, mask,
4977 IFLA_BRPORT_PROXYARP, BR_PROXYARP) ||
4978 brport_nla_put_flag(skb, flags, mask,
4979 IFLA_BRPORT_MCAST_FLOOD, BR_MCAST_FLOOD) ||
4980 brport_nla_put_flag(skb, flags, mask,
4981 IFLA_BRPORT_BCAST_FLOOD, BR_BCAST_FLOOD)) {
4982 nla_nest_cancel(skb, protinfo);
4983 goto nla_put_failure;
4986 nla_nest_end(skb, protinfo);
4988 nlmsg_end(skb, nlh);
// Failure path: drop the partial message; a zero err becomes -EMSGSIZE.
4991 nlmsg_cancel(skb, nlh);
4992 return err ? err : -EMSGSIZE;
4994 EXPORT_SYMBOL_GPL(ndo_dflt_bridge_getlink);
// valid_bridge_getlink_req - validate a bridge link dump request.
// @nlh:          request header
// @strict_check: selects strict header validation and strict parsing
//                (presumably - the branch lines are not visible here)
// @filter_mask:  receives a u32 attribute value from the request
// @extack:       extended ack used for error messages
4996 static int valid_bridge_getlink_req(const struct nlmsghdr *nlh,
4997 bool strict_check, u32 *filter_mask,
4998 struct netlink_ext_ack *extack)
5000 struct nlattr *tb[IFLA_MAX+1];
5004 struct ifinfomsg *ifm;
// The message must be large enough to hold a struct ifinfomsg header.
5006 if (nlh->nlmsg_len < nlmsg_msg_size(sizeof(*ifm))) {
5007 NL_SET_ERR_MSG(extack, "Invalid header for bridge link dump");
5011 ifm = nlmsg_data(nlh);
// Pad, type, flags, change and index are all expected to be zero.
5012 if (ifm->__ifi_pad || ifm->ifi_type || ifm->ifi_flags ||
5013 ifm->ifi_change || ifm->ifi_index) {
5014 NL_SET_ERR_MSG(extack, "Invalid values in header for bridge link dump request");
// Two parse variants, both against ifla_policy.
5018 err = nlmsg_parse_deprecated_strict(nlh,
5019 sizeof(struct ifinfomsg),
5020 tb, IFLA_MAX, ifla_policy,
5023 err = nlmsg_parse_deprecated(nlh, sizeof(struct ifinfomsg),
5024 tb, IFLA_MAX, ifla_policy,
5030 /* new attributes should only be added with strict checking */
// NOTE(review): the per-attribute dispatch lines inside this loop are not
// visible in this listing.
5031 for (i = 0; i <= IFLA_MAX; ++i) {
5037 *filter_mask = nla_get_u32(tb[i]);
5041 NL_SET_ERR_MSG(extack, "Unsupported attribute in bridge link dump request");
// rtnl_bridge_getlink - dump callback reporting bridge link information for
// every device in the namespace.
// @skb: dump buffer being filled
// @cb:  dump callback state; cb->args[0] is the index to start from
// For each device the master ndo_bridge_getlink (if any) and the device
// ndo_bridge_getlink (if any) are both consulted.
5050 static int rtnl_bridge_getlink(struct sk_buff *skb, struct netlink_callback *cb)
5052 const struct nlmsghdr *nlh = cb->nlh;
5053 struct net *net = sock_net(skb->sk);
5054 struct net_device *dev;
5056 u32 portid = NETLINK_CB(cb->skb).portid;
5057 u32 seq = nlh->nlmsg_seq;
5058 u32 filter_mask = 0;
// A validation failure is only acted upon under strict checking.
5061 err = valid_bridge_getlink_req(nlh, cb->strict_check, &filter_mask,
5063 if (err < 0 && cb->strict_check)
5067 for_each_netdev_rcu(net, dev) {
5068 const struct net_device_ops *ops = dev->netdev_ops;
5069 struct net_device *br_dev = netdev_master_upper_dev_get(dev);
// Master path: -EOPNOTSUPP from the callback is not treated as a failure.
5071 if (br_dev && br_dev->netdev_ops->ndo_bridge_getlink) {
5072 if (idx >= cb->args[0]) {
5073 err = br_dev->netdev_ops->ndo_bridge_getlink(
5074 skb, portid, seq, dev,
5075 filter_mask, NLM_F_MULTI);
5076 if (err < 0 && err != -EOPNOTSUPP) {
5077 if (likely(skb->len))
// Device path: same error handling as the master path above.
5086 if (ops->ndo_bridge_getlink) {
5087 if (idx >= cb->args[0]) {
5088 err = ops->ndo_bridge_getlink(skb, portid,
5092 if (err < 0 && err != -EOPNOTSUPP) {
5093 if (likely(skb->len))
// bridge_nlmsg_size - size estimate for a bridge link notification: the
// aligned ifinfomsg header plus one attribute per line below.
// Used by rtnl_bridge_notify() to size its skb.
5110 static inline size_t bridge_nlmsg_size(void)
5112 return NLMSG_ALIGN(sizeof(struct ifinfomsg))
5113 + nla_total_size(IFNAMSIZ) /* IFLA_IFNAME */
5114 + nla_total_size(MAX_ADDR_LEN) /* IFLA_ADDRESS */
5115 + nla_total_size(sizeof(u32)) /* IFLA_MASTER */
5116 + nla_total_size(sizeof(u32)) /* IFLA_MTU */
5117 + nla_total_size(sizeof(u32)) /* IFLA_LINK */
5118 + nla_total_size(sizeof(u32)) /* IFLA_OPERSTATE */
5119 + nla_total_size(sizeof(u8)) /* IFLA_PROTINFO */
5120 + nla_total_size(sizeof(struct nlattr)) /* IFLA_AF_SPEC */
5121 + nla_total_size(sizeof(u16)) /* IFLA_BRIDGE_FLAGS */
5122 + nla_total_size(sizeof(u16)); /* IFLA_BRIDGE_MODE */
// rtnl_bridge_notify - send an RTNLGRP_LINK notification describing the
// bridge state of @dev, built by the device ndo_bridge_getlink.
// err starts as -EOPNOTSUPP, the value in place when the device has no
// ndo_bridge_getlink.
5125 static int rtnl_bridge_notify(struct net_device *dev)
5127 struct net *net = dev_net(dev);
5128 struct sk_buff *skb;
5129 int err = -EOPNOTSUPP;
5131 if (!dev->netdev_ops->ndo_bridge_getlink)
// Atomic allocation sized by bridge_nlmsg_size().
5134 skb = nlmsg_new(bridge_nlmsg_size(), GFP_ATOMIC);
// pid, seq, filter mask and nlflags are all passed as 0.
5140 err = dev->netdev_ops->ndo_bridge_getlink(skb, 0, 0, dev, 0, 0);
5144 /* Notification info is only filled for bridge ports, not the bridge
5145 * device itself. Therefore, a zero notification length is valid and
5146 * should not result in an error.
5151 rtnl_notify(skb, net, 0, RTNLGRP_LINK, NULL, GFP_ATOMIC);
// -EMSGSIZE triggers a warning; the error is also recorded on the
// RTNLGRP_LINK group via rtnl_set_sk_err().
5154 WARN_ON(err == -EMSGSIZE);
5157 rtnl_set_sk_err(net, RTNLGRP_LINK, err);
// rtnl_bridge_setlink - netlink handler that forwards a bridge setlink
// request to the master device, the device itself, or both.
// @skb:    request buffer
// @nlh:    request header carrying an ifinfomsg and IFLA_AF_SPEC
// @extack: extended ack used for error messages
// err starts as -EOPNOTSUPP.
5161 static int rtnl_bridge_setlink(struct sk_buff *skb, struct nlmsghdr *nlh,
5162 struct netlink_ext_ack *extack)
5164 struct net *net = sock_net(skb->sk);
5165 struct ifinfomsg *ifm;
5166 struct net_device *dev;
5167 struct nlattr *br_spec, *attr = NULL;
5168 int rem, err = -EOPNOTSUPP;
5170 bool have_flags = false;
5172 if (nlmsg_len(nlh) < sizeof(*ifm))
5175 ifm = nlmsg_data(nlh);
// Only AF_BRIDGE requests are accepted.
5176 if (ifm->ifi_family != AF_BRIDGE)
5177 return -EPFNOSUPPORT;
5179 dev = __dev_get_by_index(net, ifm->ifi_index);
5181 NL_SET_ERR_MSG(extack, "unknown ifindex");
// Scan the IFLA_AF_SPEC nest: IFLA_BRIDGE_FLAGS is read as long as
// have_flags is still false; IFLA_BRIDGE_MODE is length-checked.
5185 br_spec = nlmsg_find_attr(nlh, sizeof(struct ifinfomsg), IFLA_AF_SPEC);
5187 nla_for_each_nested(attr, br_spec, rem) {
5188 if (nla_type(attr) == IFLA_BRIDGE_FLAGS && !have_flags) {
5189 if (nla_len(attr) < sizeof(flags))
5193 flags = nla_get_u16(attr);
5196 if (nla_type(attr) == IFLA_BRIDGE_MODE) {
5197 if (nla_len(attr) < sizeof(u16))
// No flags, or BRIDGE_FLAGS_MASTER: hand the request to the master.
5203 if (!flags || (flags & BRIDGE_FLAGS_MASTER)) {
5204 struct net_device *br_dev = netdev_master_upper_dev_get(dev);
5206 if (!br_dev || !br_dev->netdev_ops->ndo_bridge_setlink) {
5211 err = br_dev->netdev_ops->ndo_bridge_setlink(dev, nlh, flags,
5216 flags &= ~BRIDGE_FLAGS_MASTER;
// BRIDGE_FLAGS_SELF: hand the request to the device itself.
5219 if ((flags & BRIDGE_FLAGS_SELF)) {
5220 if (!dev->netdev_ops->ndo_bridge_setlink)
5223 err = dev->netdev_ops->ndo_bridge_setlink(dev, nlh,
5227 flags &= ~BRIDGE_FLAGS_SELF;
5229 /* Generate event to notify upper layer of bridge
5232 err = rtnl_bridge_notify(dev);
// The remaining flag bits are written back into the attribute payload.
// NOTE(review): the guard in front of this memcpy is not visible here.
5237 memcpy(nla_data(attr), &flags, sizeof(flags));
// rtnl_bridge_dellink - netlink handler that forwards a bridge dellink
// request to the master device, the device itself, or both.
// @skb:    request buffer
// @nlh:    request header carrying an ifinfomsg and IFLA_AF_SPEC
// @extack: extended ack used for error messages
// err starts as -EOPNOTSUPP.
5242 static int rtnl_bridge_dellink(struct sk_buff *skb, struct nlmsghdr *nlh,
5243 struct netlink_ext_ack *extack)
5245 struct net *net = sock_net(skb->sk);
5246 struct ifinfomsg *ifm;
5247 struct net_device *dev;
5248 struct nlattr *br_spec, *attr = NULL;
5249 int rem, err = -EOPNOTSUPP;
5251 bool have_flags = false;
5253 if (nlmsg_len(nlh) < sizeof(*ifm))
5256 ifm = nlmsg_data(nlh);
// Only AF_BRIDGE requests are accepted.
5257 if (ifm->ifi_family != AF_BRIDGE)
5258 return -EPFNOSUPPORT;
5260 dev = __dev_get_by_index(net, ifm->ifi_index);
5262 NL_SET_ERR_MSG(extack, "unknown ifindex");
// Scan the IFLA_AF_SPEC nest for IFLA_BRIDGE_FLAGS.
5266 br_spec = nlmsg_find_attr(nlh, sizeof(struct ifinfomsg), IFLA_AF_SPEC);
5268 nla_for_each_nested(attr, br_spec, rem) {
5269 if (nla_type(attr) == IFLA_BRIDGE_FLAGS) {
5270 if (nla_len(attr) < sizeof(flags))
5274 flags = nla_get_u16(attr);
// No flags, or BRIDGE_FLAGS_MASTER: hand the request to the master.
5280 if (!flags || (flags & BRIDGE_FLAGS_MASTER)) {
5281 struct net_device *br_dev = netdev_master_upper_dev_get(dev);
5283 if (!br_dev || !br_dev->netdev_ops->ndo_bridge_dellink) {
5288 err = br_dev->netdev_ops->ndo_bridge_dellink(dev, nlh, flags);
5292 flags &= ~BRIDGE_FLAGS_MASTER;
// BRIDGE_FLAGS_SELF: hand the request to the device itself.
5295 if ((flags & BRIDGE_FLAGS_SELF)) {
5296 if (!dev->netdev_ops->ndo_bridge_dellink)
5299 err = dev->netdev_ops->ndo_bridge_dellink(dev, nlh,
5303 flags &= ~BRIDGE_FLAGS_SELF;
5305 /* Generate event to notify upper layer of bridge
5308 err = rtnl_bridge_notify(dev);
// The remaining flag bits are written back into the attribute payload.
// NOTE(review): the guard in front of this memcpy is not visible here.
5313 memcpy(nla_data(attr), &flags, sizeof(flags));
// stats_attr_valid - true when @attrid is selected by @mask and, if
// @idxattr is non-zero, @idxattr equals @attrid.
5318 static bool stats_attr_valid(unsigned int mask, int attrid, int idxattr)
5320 return (mask & IFLA_STATS_FILTER_BIT(attrid)) &&
5321 (!idxattr || idxattr == attrid);
// rtnl_offload_xstats_have_ndo - true when @dev has netdev_ops with both
// offload-stats callbacks set and ndo_has_offload_stats() accepts @attr_id.
5325 rtnl_offload_xstats_have_ndo(const struct net_device *dev, int attr_id)
5327 return dev->netdev_ops &&
5328 dev->netdev_ops->ndo_has_offload_stats &&
5329 dev->netdev_ops->ndo_get_offload_stats &&
5330 dev->netdev_ops->ndo_has_offload_stats(dev, attr_id);
// rtnl_offload_xstats_get_size_ndo - payload size for @attr_id:
// sizeof(struct rtnl_link_stats64) when the device can supply the stats
// through its ndo callbacks, 0 otherwise.
5334 rtnl_offload_xstats_get_size_ndo(const struct net_device *dev, int attr_id)
5336 return rtnl_offload_xstats_have_ndo(dev, attr_id) ?
5337 sizeof(struct rtnl_link_stats64) : 0;
// rtnl_offload_xstats_fill_ndo - reserve attribute @attr_id in @skb and let
// the device fill it through ndo_get_offload_stats().
// The payload size comes from rtnl_offload_xstats_get_size_ndo().
5341 rtnl_offload_xstats_fill_ndo(struct net_device *dev, int attr_id,
5342 struct sk_buff *skb)
5344 unsigned int size = rtnl_offload_xstats_get_size_ndo(dev, attr_id);
5345 struct nlattr *attr = NULL;
// 64-bit aligned reservation, padded with IFLA_OFFLOAD_XSTATS_UNSPEC.
5352 attr = nla_reserve_64bit(skb, attr_id, size,
5353 IFLA_OFFLOAD_XSTATS_UNSPEC);
// The payload is zeroed before the driver callback writes into it.
5357 attr_data = nla_data(attr);
5358 memset(attr_data, 0, size);
5360 err = dev->netdev_ops->ndo_get_offload_stats(attr_id, dev, attr_data);
// rtnl_offload_xstats_get_size_stats - payload size for HW stats of @type:
// sizeof(struct rtnl_hw_stats64) when that type is enabled on @dev,
// 0 otherwise.
5368 rtnl_offload_xstats_get_size_stats(const struct net_device *dev,
5369 enum netdev_offload_xstats_type type)
5371 bool enabled = netdev_offload_xstats_enabled(dev, type);
5373 return enabled ? sizeof(struct rtnl_hw_stats64) : 0;
// Request/used state of one offload stats type. The members are not visible
// in this listing; other code in this file accesses ru->request and ru->used.
5376 struct rtnl_offload_xstats_request_used {
// rtnl_offload_xstats_get_stats - query HW stats of @type for @dev.
// @ru:     receives the request state (see the last visible line)
// @stats:  passed through to netdev_offload_xstats_get()
// @extack: extended ack used for error messages
// Callers in this file pass NULL for @stats or for @ru.
// NOTE(review): the NULL guards are not visible in this listing.
5382 rtnl_offload_xstats_get_stats(struct net_device *dev,
5383 enum netdev_offload_xstats_type type,
5384 struct rtnl_offload_xstats_request_used *ru,
5385 struct rtnl_hw_stats64 *stats,
5386 struct netlink_ext_ack *extack)
5392 request = netdev_offload_xstats_enabled(dev, type);
5398 err = netdev_offload_xstats_get(dev, type, stats, &used, extack);
5404 ru->request = request;
// rtnl_offload_xstats_fill_hw_s_info_one - emit a nest @attr_id holding two
// u8 attributes: HW_S_INFO_REQUEST (ru->request) and HW_S_INFO_USED
// (ru->used). The nest is cancelled if either put fails.
5411 rtnl_offload_xstats_fill_hw_s_info_one(struct sk_buff *skb, int attr_id,
5412 struct rtnl_offload_xstats_request_used *ru)
5414 struct nlattr *nest;
5416 nest = nla_nest_start(skb, attr_id);
5420 if (nla_put_u8(skb, IFLA_OFFLOAD_XSTATS_HW_S_INFO_REQUEST, ru->request))
5421 goto nla_put_failure;
5423 if (nla_put_u8(skb, IFLA_OFFLOAD_XSTATS_HW_S_INFO_USED, ru->used))
5424 goto nla_put_failure;
5426 nla_nest_end(skb, nest);
5430 nla_nest_cancel(skb, nest);
// rtnl_offload_xstats_fill_hw_s_info - emit the
// IFLA_OFFLOAD_XSTATS_HW_S_INFO nest with the request/used state of the
// L3 stats type. The nest is cancelled on failure.
5435 rtnl_offload_xstats_fill_hw_s_info(struct sk_buff *skb, struct net_device *dev,
5436 struct netlink_ext_ack *extack)
5438 enum netdev_offload_xstats_type t_l3 = NETDEV_OFFLOAD_XSTATS_TYPE_L3;
5439 struct rtnl_offload_xstats_request_used ru_l3;
5440 struct nlattr *nest;
// Only the request/used state is fetched here; stats is passed as NULL.
5443 err = rtnl_offload_xstats_get_stats(dev, t_l3, &ru_l3, NULL, extack);
5447 nest = nla_nest_start(skb, IFLA_OFFLOAD_XSTATS_HW_S_INFO);
5451 if (rtnl_offload_xstats_fill_hw_s_info_one(skb,
5452 IFLA_OFFLOAD_XSTATS_L3_STATS,
5454 goto nla_put_failure;
5456 nla_nest_end(skb, nest);
5460 nla_nest_cancel(skb, nest);
// rtnl_offload_xstats_fill - fill the offload xstats attributes selected by
// @off_filter_mask into @skb.
// @prividx: position marker; an attribute is only attempted when *prividx
//           is not beyond its id, and it is updated to the attribute in
//           progress
// @extack:  extended ack used for error messages
// Three attributes are handled in order: CPU_HIT, HW_S_INFO, L3_STATS.
5464 static int rtnl_offload_xstats_fill(struct sk_buff *skb, struct net_device *dev,
5465 int *prividx, u32 off_filter_mask,
5466 struct netlink_ext_ack *extack)
5468 enum netdev_offload_xstats_type t_l3 = NETDEV_OFFLOAD_XSTATS_TYPE_L3;
5469 int attr_id_hw_s_info = IFLA_OFFLOAD_XSTATS_HW_S_INFO;
5470 int attr_id_l3_stats = IFLA_OFFLOAD_XSTATS_L3_STATS;
5471 int attr_id_cpu_hit = IFLA_OFFLOAD_XSTATS_CPU_HIT;
5472 bool have_data = false;
// CPU_HIT is filled through the driver ndo callbacks; -ENODATA is treated
// differently from other errors.
5475 if (*prividx <= attr_id_cpu_hit &&
5477 IFLA_STATS_FILTER_BIT(attr_id_cpu_hit))) {
5478 err = rtnl_offload_xstats_fill_ndo(dev, attr_id_cpu_hit, skb);
5481 } else if (err != -ENODATA) {
5482 *prividx = attr_id_cpu_hit;
// HW_S_INFO nest.
5487 if (*prividx <= attr_id_hw_s_info &&
5488 (off_filter_mask & IFLA_STATS_FILTER_BIT(attr_id_hw_s_info))) {
5489 *prividx = attr_id_hw_s_info;
5491 err = rtnl_offload_xstats_fill_hw_s_info(skb, dev, extack);
// L3_STATS: space is reserved in the skb and the stats are written
// directly into the reserved payload.
5499 if (*prividx <= attr_id_l3_stats &&
5500 (off_filter_mask & IFLA_STATS_FILTER_BIT(attr_id_l3_stats))) {
5501 unsigned int size_l3;
5502 struct nlattr *attr;
5504 *prividx = attr_id_l3_stats;
5506 size_l3 = rtnl_offload_xstats_get_size_stats(dev, t_l3);
5509 attr = nla_reserve_64bit(skb, attr_id_l3_stats, size_l3,
5510 IFLA_OFFLOAD_XSTATS_UNSPEC);
5514 err = rtnl_offload_xstats_get_stats(dev, t_l3, NULL,
5515 nla_data(attr), extack);
// rtnl_offload_xstats_get_size_hw_s_info_one - size of one HW_S_INFO entry:
// an empty nest header plus the two u8 attributes named below.
// NOTE(review): the final term of the sum is not visible in this listing.
5532 rtnl_offload_xstats_get_size_hw_s_info_one(const struct net_device *dev,
5533 enum netdev_offload_xstats_type type)
5535 return nla_total_size(0) +
5536 /* IFLA_OFFLOAD_XSTATS_HW_S_INFO_REQUEST */
5537 nla_total_size(sizeof(u8)) +
5538 /* IFLA_OFFLOAD_XSTATS_HW_S_INFO_USED */
5539 nla_total_size(sizeof(u8)) +
// rtnl_offload_xstats_get_size_hw_s_info - size of the HW_S_INFO nest: an
// empty nest header plus the per-type entry for L3 stats.
// NOTE(review): the final term of the sum is not visible in this listing.
5544 rtnl_offload_xstats_get_size_hw_s_info(const struct net_device *dev)
5546 enum netdev_offload_xstats_type t_l3 = NETDEV_OFFLOAD_XSTATS_TYPE_L3;
5548 return nla_total_size(0) +
5549 /* IFLA_OFFLOAD_XSTATS_L3_STATS */
5550 rtnl_offload_xstats_get_size_hw_s_info_one(dev, t_l3) +
// rtnl_offload_xstats_get_size - space needed for the offload xstats
// attributes selected by @off_filter_mask on @dev.
// Each selected attribute adds its own size; an empty nest header is added
// at the end (the guard for that addition is not visible here).
5554 static int rtnl_offload_xstats_get_size(const struct net_device *dev,
5555 u32 off_filter_mask)
5557 enum netdev_offload_xstats_type t_l3 = NETDEV_OFFLOAD_XSTATS_TYPE_L3;
5558 int attr_id_cpu_hit = IFLA_OFFLOAD_XSTATS_CPU_HIT;
// CPU_HIT: 64-bit aligned attribute sized by the ndo helper.
5562 if (off_filter_mask &
5563 IFLA_STATS_FILTER_BIT(attr_id_cpu_hit)) {
5564 size = rtnl_offload_xstats_get_size_ndo(dev, attr_id_cpu_hit);
5565 nla_size += nla_total_size_64bit(size);
// HW_S_INFO nest.
5568 if (off_filter_mask &
5569 IFLA_STATS_FILTER_BIT(IFLA_OFFLOAD_XSTATS_HW_S_INFO))
5570 nla_size += rtnl_offload_xstats_get_size_hw_s_info(dev);
// L3_STATS: 64-bit aligned attribute sized by the stats helper.
5572 if (off_filter_mask &
5573 IFLA_STATS_FILTER_BIT(IFLA_OFFLOAD_XSTATS_L3_STATS)) {
5574 size = rtnl_offload_xstats_get_size_stats(dev, t_l3);
5575 nla_size += nla_total_size_64bit(size);
5579 nla_size += nla_total_size(0);
// Attribute filters for one stats get/dump request. rtnl_stats_get_parse()
// stores the header filter_mask in mask[0] and initialises every other
// slot to -1U before applying any filters from the request.
5584 struct rtnl_stats_dump_filters {
5585 /* mask[0] filters outer attributes. Then individual nests have their
5586 * filtering mask at the index of the nested attribute.
5588 u32 mask[IFLA_STATS_MAX + 1];
// rtnl_fill_statsinfo - build one stats message for @dev in @skb.
// @type, @pid, @seq: netlink message type, port id and sequence number
// @change:  not referenced in the visible lines
// @filters: attribute filters; mask[0] selects the top-level attributes
// @idxattr: attribute currently being filled; also restricts which
//           attribute is attempted (see stats_attr_valid())
// @prividx: position inside the current attribute, owned by the fillers
// @extack:  extended ack used for error messages
// Sections are emitted in this order: LINK_64, LINK_XSTATS,
// LINK_XSTATS_SLAVE, LINK_OFFLOAD_XSTATS, AF_SPEC.
5591 static int rtnl_fill_statsinfo(struct sk_buff *skb, struct net_device *dev,
5592 int type, u32 pid, u32 seq, u32 change,
5594 const struct rtnl_stats_dump_filters *filters,
5595 int *idxattr, int *prividx,
5596 struct netlink_ext_ack *extack)
5598 unsigned int filter_mask = filters->mask[0];
5599 struct if_stats_msg *ifsm;
5600 struct nlmsghdr *nlh;
5601 struct nlattr *attr;
// Remembered so the failure path can tell whether any progress was made.
5602 int s_prividx = *prividx;
5607 nlh = nlmsg_put(skb, pid, seq, type, sizeof(*ifsm), flags);
5611 ifsm = nlmsg_data(nlh);
5612 ifsm->family = PF_UNSPEC;
5615 ifsm->ifindex = dev->ifindex;
5616 ifsm->filter_mask = filter_mask;
// LINK_64: space is reserved and dev_get_stats() writes into it directly.
5618 if (stats_attr_valid(filter_mask, IFLA_STATS_LINK_64, *idxattr)) {
5619 struct rtnl_link_stats64 *sp;
5621 attr = nla_reserve_64bit(skb, IFLA_STATS_LINK_64,
5622 sizeof(struct rtnl_link_stats64),
5626 goto nla_put_failure;
5629 sp = nla_data(attr);
5630 dev_get_stats(dev, sp);
// LINK_XSTATS: filled by the link ops of the device itself.
5633 if (stats_attr_valid(filter_mask, IFLA_STATS_LINK_XSTATS, *idxattr)) {
5634 const struct rtnl_link_ops *ops = dev->rtnl_link_ops;
5636 if (ops && ops->fill_linkxstats) {
5637 *idxattr = IFLA_STATS_LINK_XSTATS;
5638 attr = nla_nest_start_noflag(skb,
5639 IFLA_STATS_LINK_XSTATS);
5642 goto nla_put_failure;
5645 err = ops->fill_linkxstats(skb, dev, prividx, *idxattr);
5646 nla_nest_end(skb, attr);
5648 goto nla_put_failure;
// LINK_XSTATS_SLAVE: filled by the link ops of the master device.
5653 if (stats_attr_valid(filter_mask, IFLA_STATS_LINK_XSTATS_SLAVE,
5655 const struct rtnl_link_ops *ops = NULL;
5656 const struct net_device *master;
5658 master = netdev_master_upper_dev_get(dev);
5660 ops = master->rtnl_link_ops;
5661 if (ops && ops->fill_linkxstats) {
5662 *idxattr = IFLA_STATS_LINK_XSTATS_SLAVE;
5663 attr = nla_nest_start_noflag(skb,
5664 IFLA_STATS_LINK_XSTATS_SLAVE);
5667 goto nla_put_failure;
5670 err = ops->fill_linkxstats(skb, dev, prividx, *idxattr);
5671 nla_nest_end(skb, attr);
5673 goto nla_put_failure;
// LINK_OFFLOAD_XSTATS: uses the nested filter mask stored at that index.
// -ENODATA cancels the nest and is not treated as a failure.
5678 if (stats_attr_valid(filter_mask, IFLA_STATS_LINK_OFFLOAD_XSTATS,
5680 u32 off_filter_mask;
5682 off_filter_mask = filters->mask[IFLA_STATS_LINK_OFFLOAD_XSTATS];
5683 *idxattr = IFLA_STATS_LINK_OFFLOAD_XSTATS;
5684 attr = nla_nest_start_noflag(skb,
5685 IFLA_STATS_LINK_OFFLOAD_XSTATS);
5688 goto nla_put_failure;
5691 err = rtnl_offload_xstats_fill(skb, dev, prividx,
5692 off_filter_mask, extack);
5693 if (err == -ENODATA)
5694 nla_nest_cancel(skb, attr);
5696 nla_nest_end(skb, attr);
5698 if (err && err != -ENODATA)
5699 goto nla_put_failure;
// AF_SPEC: one nested attribute per address family that implements
// fill_stats_af; a family returning -ENODATA has its nest cancelled.
5703 if (stats_attr_valid(filter_mask, IFLA_STATS_AF_SPEC, *idxattr)) {
5704 struct rtnl_af_ops *af_ops;
5706 *idxattr = IFLA_STATS_AF_SPEC;
5707 attr = nla_nest_start_noflag(skb, IFLA_STATS_AF_SPEC);
5710 goto nla_put_failure;
5714 list_for_each_entry_rcu(af_ops, &rtnl_af_ops, list) {
5715 if (af_ops->fill_stats_af) {
5718 af = nla_nest_start_noflag(skb,
5723 goto nla_put_failure;
5725 err = af_ops->fill_stats_af(skb, dev);
5727 if (err == -ENODATA) {
5728 nla_nest_cancel(skb, af);
5729 } else if (err < 0) {
5731 goto nla_put_failure;
5734 nla_nest_end(skb, af);
5739 nla_nest_end(skb, attr);
5744 nlmsg_end(skb, nlh);
5749 /* not a multi message or no progress mean a real error */
5750 if (!(flags & NLM_F_MULTI) || s_prividx == *prividx)
5751 nlmsg_cancel(skb, nlh);
5753 nlmsg_end(skb, nlh);
// if_nlmsg_stats_size - buffer size needed for a stats message about @dev
// under @filters. Starts from the aligned if_stats_msg header and adds
// space for every section selected by filters->mask[0], in the same order
// that rtnl_fill_statsinfo() emits them.
5758 static size_t if_nlmsg_stats_size(const struct net_device *dev,
5759 const struct rtnl_stats_dump_filters *filters)
5761 size_t size = NLMSG_ALIGN(sizeof(struct if_stats_msg));
5762 unsigned int filter_mask = filters->mask[0];
5764 if (stats_attr_valid(filter_mask, IFLA_STATS_LINK_64, 0))
5765 size += nla_total_size_64bit(sizeof(struct rtnl_link_stats64));
// LINK_XSTATS: sized by the link ops of the device, plus the nest header.
5767 if (stats_attr_valid(filter_mask, IFLA_STATS_LINK_XSTATS, 0)) {
5768 const struct rtnl_link_ops *ops = dev->rtnl_link_ops;
5769 int attr = IFLA_STATS_LINK_XSTATS;
5771 if (ops && ops->get_linkxstats_size) {
5772 size += nla_total_size(ops->get_linkxstats_size(dev,
5774 /* for IFLA_STATS_LINK_XSTATS */
5775 size += nla_total_size(0);
// LINK_XSTATS_SLAVE: sized by the link ops of the master device.
5779 if (stats_attr_valid(filter_mask, IFLA_STATS_LINK_XSTATS_SLAVE, 0)) {
5780 struct net_device *_dev = (struct net_device *)dev;
5781 const struct rtnl_link_ops *ops = NULL;
5782 const struct net_device *master;
5784 /* netdev_master_upper_dev_get can't take const */
5785 master = netdev_master_upper_dev_get(_dev);
5787 ops = master->rtnl_link_ops;
5788 if (ops && ops->get_linkxstats_size) {
5789 int attr = IFLA_STATS_LINK_XSTATS_SLAVE;
5791 size += nla_total_size(ops->get_linkxstats_size(dev,
5793 /* for IFLA_STATS_LINK_XSTATS_SLAVE */
5794 size += nla_total_size(0);
// LINK_OFFLOAD_XSTATS: sized with the nested filter mask.
5798 if (stats_attr_valid(filter_mask, IFLA_STATS_LINK_OFFLOAD_XSTATS, 0)) {
5799 u32 off_filter_mask;
5801 off_filter_mask = filters->mask[IFLA_STATS_LINK_OFFLOAD_XSTATS];
5802 size += rtnl_offload_xstats_get_size(dev, off_filter_mask);
// AF_SPEC: nest header plus one entry per address family that implements
// get_stats_af_size.
5805 if (stats_attr_valid(filter_mask, IFLA_STATS_AF_SPEC, 0)) {
5806 struct rtnl_af_ops *af_ops;
5808 /* for IFLA_STATS_AF_SPEC */
5809 size += nla_total_size(0);
5812 list_for_each_entry_rcu(af_ops, &rtnl_af_ops, list) {
5813 if (af_ops->get_stats_af_size) {
5814 size += nla_total_size(
5815 af_ops->get_stats_af_size(dev));
5818 size += nla_total_size(0);
// Mask with one bit set for every position below __IFLA_OFFLOAD_XSTATS_MAX.
5827 #define RTNL_STATS_OFFLOAD_XSTATS_VALID ((1 << __IFLA_OFFLOAD_XSTATS_MAX) - 1)
// Policy for the attributes nested inside IFLA_STATS_GET_FILTERS: the
// LINK_OFFLOAD_XSTATS filter is a u32 restricted to the mask above.
5829 static const struct nla_policy
5830 rtnl_stats_get_policy_filters[IFLA_STATS_MAX + 1] = {
5831 [IFLA_STATS_LINK_OFFLOAD_XSTATS] =
5832 NLA_POLICY_MASK(NLA_U32, RTNL_STATS_OFFLOAD_XSTATS_VALID),
// Top-level policy for stats get/dump requests: IFLA_STATS_GET_FILTERS is a
// nest validated against rtnl_stats_get_policy_filters.
5835 static const struct nla_policy
5836 rtnl_stats_get_policy[IFLA_STATS_GETSET_MAX + 1] = {
5837 [IFLA_STATS_GET_FILTERS] =
5838 NLA_POLICY_NESTED(rtnl_stats_get_policy_filters),
// Policy for stats set requests: the L3 stats toggle is a u8 with a
// maximum value of 1.
5841 static const struct nla_policy
5842 ifla_stats_set_policy[IFLA_STATS_GETSET_MAX + 1] = {
5843 [IFLA_STATS_SET_OFFLOAD_XSTATS_L3_STATS] = NLA_POLICY_MAX(NLA_U8, 1),
// rtnl_stats_get_parse_filters - decode the IFLA_STATS_GET_FILTERS nest.
// @ifla_filters: the nested attribute
// @filters:      per-attribute masks to update; mask[0] must already hold
//                the top-level filter mask
// @extack:       extended ack used for error messages
// A nested filter is only meaningful for an attribute that is enabled in
// filters->mask[0]; otherwise an error message is set.
5846 static int rtnl_stats_get_parse_filters(struct nlattr *ifla_filters,
5847 struct rtnl_stats_dump_filters *filters,
5848 struct netlink_ext_ack *extack)
5850 struct nlattr *tb[IFLA_STATS_MAX + 1];
5854 err = nla_parse_nested(tb, IFLA_STATS_MAX, ifla_filters,
5855 rtnl_stats_get_policy_filters, extack);
5859 for (at = 1; at <= IFLA_STATS_MAX; at++) {
5861 if (!(filters->mask[0] & IFLA_STATS_FILTER_BIT(at))) {
5862 NL_SET_ERR_MSG(extack, "Filtered attribute not enabled in filter_mask");
5865 filters->mask[at] = nla_get_u32(tb[at]);
// rtnl_stats_get_parse - initialise @filters from a stats request.
// mask[0] takes the header filter mask; all other slots start as -1U and
// are then narrowed by IFLA_STATS_GET_FILTERS when that attribute is
// present in the request.
5872 static int rtnl_stats_get_parse(const struct nlmsghdr *nlh,
5874 struct rtnl_stats_dump_filters *filters,
5875 struct netlink_ext_ack *extack)
5877 struct nlattr *tb[IFLA_STATS_GETSET_MAX + 1];
5881 filters->mask[0] = filter_mask;
5882 for (i = 1; i < ARRAY_SIZE(filters->mask); i++)
5883 filters->mask[i] = -1U;
5885 err = nlmsg_parse(nlh, sizeof(struct if_stats_msg), tb,
5886 IFLA_STATS_GETSET_MAX, rtnl_stats_get_policy, extack);
5890 if (tb[IFLA_STATS_GET_FILTERS]) {
5891 err = rtnl_stats_get_parse_filters(tb[IFLA_STATS_GET_FILTERS],
// rtnl_valid_stats_req - validate the if_stats_msg header of a stats
// request.
// @strict_check: not referenced in the visible lines
// @is_dump:      when true, a non-zero ifindex is also rejected
// @extack:       extended ack used for error messages
5900 static int rtnl_valid_stats_req(const struct nlmsghdr *nlh, bool strict_check,
5901 bool is_dump, struct netlink_ext_ack *extack)
5903 struct if_stats_msg *ifsm;
// The message must be large enough to hold the if_stats_msg header.
5905 if (nlh->nlmsg_len < nlmsg_msg_size(sizeof(*ifsm))) {
5906 NL_SET_ERR_MSG(extack, "Invalid header for stats dump");
5913 ifsm = nlmsg_data(nlh);
5915 /* only requests using strict checks can pass data to influence
5916 * the dump. The legacy exception is filter_mask.
5918 if (ifsm->pad1 || ifsm->pad2 || (is_dump && ifsm->ifindex)) {
5919 NL_SET_ERR_MSG(extack, "Invalid values in header for stats dump request");
// No bit at or above the position for IFLA_STATS_MAX + 1 may be set.
5922 if (ifsm->filter_mask >= IFLA_STATS_FILTER_BIT(IFLA_STATS_MAX + 1)) {
5923 NL_SET_ERR_MSG(extack, "Invalid stats requested through filter mask");
// rtnl_stats_get - netlink handler answering a stats request for a single
// device with a unicast RTM_NEWSTATS message.
// @skb:    request buffer
// @nlh:    request header carrying an if_stats_msg
// @extack: extended ack used for error messages
5930 static int rtnl_stats_get(struct sk_buff *skb, struct nlmsghdr *nlh,
5931 struct netlink_ext_ack *extack)
5933 struct rtnl_stats_dump_filters filters;
5934 struct net *net = sock_net(skb->sk);
5935 struct net_device *dev = NULL;
5936 int idxattr = 0, prividx = 0;
5937 struct if_stats_msg *ifsm;
5938 struct sk_buff *nskb;
5941 err = rtnl_valid_stats_req(nlh, netlink_strict_get_check(skb),
5946 ifsm = nlmsg_data(nlh);
// The device is looked up only for a positive ifindex.
5947 if (ifsm->ifindex > 0)
5948 dev = __dev_get_by_index(net, ifsm->ifindex);
// A zero filter mask is reported as an error.
5955 if (!ifsm->filter_mask) {
5956 NL_SET_ERR_MSG(extack, "Filter mask must be set for stats get");
5960 err = rtnl_stats_get_parse(nlh, ifsm->filter_mask, &filters, extack);
// The reply buffer is sized up front by if_nlmsg_stats_size().
5964 nskb = nlmsg_new(if_nlmsg_stats_size(dev, &filters), GFP_KERNEL);
5968 err = rtnl_fill_statsinfo(nskb, dev, RTM_NEWSTATS,
5969 NETLINK_CB(skb).portid, nlh->nlmsg_seq, 0,
5970 0, &filters, &idxattr, &prividx, extack);
5972 /* -EMSGSIZE implies BUG in if_nlmsg_stats_size */
5973 WARN_ON(err == -EMSGSIZE);
5976 err = rtnl_unicast(nskb, net, NETLINK_CB(skb).portid);
/*
 * rtnl_stats_dump - dump callback emitting RTM_NEWSTATS messages for the
 * devices of the requesting socket's netns.
 *
 * cb->args[1], cb->args[2] and cb->args[3] seed s_idx, s_idxattr and
 * s_prividx; s_idxattr and s_prividx are stored back into cb->args[2] and
 * cb->args[3] so a later invocation can pick them up. cb->seq is taken
 * from net->dev_base_seq and nl_dump_check_consistent() is applied to the
 * generated message header.
 *
 * The request header is validated as a dump (is_dump == true), a non-zero
 * filter_mask is required, and the filters are parsed with
 * rtnl_stats_get_parse(). Devices are visited by walking the
 * net->dev_index_head[] hash buckets, and each message is flagged
 * NLM_F_MULTI through the flags variable.
 */
5982 static int rtnl_stats_dump(struct sk_buff *skb, struct netlink_callback *cb)
5984 struct netlink_ext_ack *extack = cb->extack;
5985 int h, s_h, err, s_idx, s_idxattr, s_prividx;
5986 struct rtnl_stats_dump_filters filters;
5987 struct net *net = sock_net(skb->sk);
5988 unsigned int flags = NLM_F_MULTI;
5989 struct if_stats_msg *ifsm;
5990 struct hlist_head *head;
5991 struct net_device *dev;
5995 s_idx = cb->args[1];
5996 s_idxattr = cb->args[2];
5997 s_prividx = cb->args[3];
5999 cb->seq = net->dev_base_seq;
6001 err = rtnl_valid_stats_req(cb->nlh, cb->strict_check, true, extack);
6005 ifsm = nlmsg_data(cb->nlh);
6006 if (!ifsm->filter_mask) {
6007 NL_SET_ERR_MSG(extack, "Filter mask must be set for stats dump");
6011 err = rtnl_stats_get_parse(cb->nlh, ifsm->filter_mask, &filters,
/* s_idx is reset to 0 each time the walk advances to the next bucket. */
6016 for (h = s_h; h < NETDEV_HASHENTRIES; h++, s_idx = 0) {
6018 head = &net->dev_index_head[h];
6019 hlist_for_each_entry(dev, head, index_hlist) {
6022 err = rtnl_fill_statsinfo(skb, dev, RTM_NEWSTATS,
6023 NETLINK_CB(cb->skb).portid,
6024 cb->nlh->nlmsg_seq, 0,
6026 &s_idxattr, &s_prividx,
6028 /* If we ran out of room on the first message,
6031 WARN_ON((err == -EMSGSIZE) && (skb->len == 0));
6037 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
6043 cb->args[3] = s_prividx;
6044 cb->args[2] = s_idxattr;
/*
 * rtnl_offload_xstats_notify - notify RTNLGRP_STATS listeners about the
 * offload xstats state of @dev.
 *
 * An RTM_NEWSTATS message is built with a response filter that selects
 * only IFLA_STATS_LINK_OFFLOAD_XSTATS and, within it, only
 * IFLA_OFFLOAD_XSTATS_HW_S_INFO, then handed to rtnl_notify() for the
 * device's netns.
 *
 * NOTE(review): the rtnl_set_sk_err() call is presumably the failure path
 * for allocation/fill errors; confirm against the surrounding branches.
 */
6051 void rtnl_offload_xstats_notify(struct net_device *dev)
6053 struct rtnl_stats_dump_filters response_filters = {};
6054 struct net *net = dev_net(dev);
6055 int idxattr = 0, prividx = 0;
6056 struct sk_buff *skb;
/* Restrict the message to the HW_S_INFO part of the offload xstats group. */
6061 response_filters.mask[0] |=
6062 IFLA_STATS_FILTER_BIT(IFLA_STATS_LINK_OFFLOAD_XSTATS);
6063 response_filters.mask[IFLA_STATS_LINK_OFFLOAD_XSTATS] |=
6064 IFLA_STATS_FILTER_BIT(IFLA_OFFLOAD_XSTATS_HW_S_INFO);
6066 skb = nlmsg_new(if_nlmsg_stats_size(dev, &response_filters),
/* portid, seq, change and flags are all passed as 0 for this notification. */
6071 err = rtnl_fill_statsinfo(skb, dev, RTM_NEWSTATS, 0, 0, 0, 0,
6072 &response_filters, &idxattr, &prividx, NULL);
6078 rtnl_notify(skb, net, 0, RTNLGRP_STATS, NULL, GFP_KERNEL);
6082 rtnl_set_sk_err(net, RTNLGRP_STATS, err);
6084 EXPORT_SYMBOL(rtnl_offload_xstats_notify);
/*
 * rtnl_stats_set - handle a stats set request for one device.
 *
 * The header is validated with rtnl_valid_stats_req(); the family must be
 * AF_UNSPEC and filter_mask must be 0. The device is looked up by
 * ifsm->ifindex, and the attributes are parsed against
 * ifla_stats_set_policy.
 *
 * When IFLA_STATS_SET_OFFLOAD_XSTATS_L3_STATS is present, its u8 value
 * selects between netdev_offload_xstats_enable() and
 * netdev_offload_xstats_disable() for NETDEV_OFFLOAD_XSTATS_TYPE_L3.
 * An -EALREADY result from that call is handled separately from other
 * errors. rtnl_offload_xstats_notify() is used to announce the change.
 *
 * NOTE(review): presumably the notification is sent only when the notify
 * flag was set by a successful state change; confirm.
 */
6086 static int rtnl_stats_set(struct sk_buff *skb, struct nlmsghdr *nlh,
6087 struct netlink_ext_ack *extack)
6089 enum netdev_offload_xstats_type t_l3 = NETDEV_OFFLOAD_XSTATS_TYPE_L3;
6090 struct rtnl_stats_dump_filters response_filters = {};
6091 struct nlattr *tb[IFLA_STATS_GETSET_MAX + 1];
6092 struct net *net = sock_net(skb->sk);
6093 struct net_device *dev = NULL;
6094 struct if_stats_msg *ifsm;
6095 bool notify = false;
6098 err = rtnl_valid_stats_req(nlh, netlink_strict_get_check(skb),
6103 ifsm = nlmsg_data(nlh);
6104 if (ifsm->family != AF_UNSPEC) {
6105 NL_SET_ERR_MSG(extack, "Address family should be AF_UNSPEC");
/* Only a positive ifindex is looked up; otherwise dev keeps its NULL initializer. */
6109 if (ifsm->ifindex > 0)
6110 dev = __dev_get_by_index(net, ifsm->ifindex);
/* Unlike the get path, a set request must not carry a filter mask. */
6117 if (ifsm->filter_mask) {
6118 NL_SET_ERR_MSG(extack, "Filter mask must be 0 for stats set");
6122 err = nlmsg_parse(nlh, sizeof(*ifsm), tb, IFLA_STATS_GETSET_MAX,
6123 ifla_stats_set_policy, extack);
6127 if (tb[IFLA_STATS_SET_OFFLOAD_XSTATS_L3_STATS]) {
6128 u8 req = nla_get_u8(tb[IFLA_STATS_SET_OFFLOAD_XSTATS_L3_STATS]);
6131 err = netdev_offload_xstats_enable(dev, t_l3, extack);
6133 err = netdev_offload_xstats_disable(dev, t_l3);
6137 else if (err != -EALREADY)
6140 response_filters.mask[0] |=
6141 IFLA_STATS_FILTER_BIT(IFLA_STATS_LINK_OFFLOAD_XSTATS);
6142 response_filters.mask[IFLA_STATS_LINK_OFFLOAD_XSTATS] |=
6143 IFLA_STATS_FILTER_BIT(IFLA_OFFLOAD_XSTATS_HW_S_INFO);
6147 rtnl_offload_xstats_notify(dev);
/*
 * rtnl_mdb_valid_dump_req - validate the header of an MDB dump request.
 *
 * The message must be large enough for a struct br_port_msg and must not
 * carry any attribute data after that header. Filtering by device index
 * is rejected with its own extack message.
 */
6152 static int rtnl_mdb_valid_dump_req(const struct nlmsghdr *nlh,
6153 struct netlink_ext_ack *extack)
6155 struct br_port_msg *bpm;
6157 if (nlh->nlmsg_len < nlmsg_msg_size(sizeof(*bpm))) {
6158 NL_SET_ERR_MSG(extack, "Invalid header for mdb dump request");
6162 bpm = nlmsg_data(nlh);
6164 NL_SET_ERR_MSG(extack, "Filtering by device index is not supported for mdb dump request");
/* A dump request consists of the header only. */
6167 if (nlmsg_attrlen(nlh, sizeof(*bpm))) {
6168 NL_SET_ERR_MSG(extack, "Invalid data after header in mdb dump request");
/*
 * Dump state used by rtnl_mdb_dump(), which overlays this structure on
 * the cb->ctx area of the netlink callback.
 */
6175 struct rtnl_mdb_dump_ctx {
/*
 * rtnl_mdb_dump - dump callback that collects MDB entries from the devices
 * of the requesting socket's netns.
 *
 * The dump context lives in cb->ctx (NL_ASSERT_DUMP_CTX_FITS checks that
 * struct rtnl_mdb_dump_ctx fits there). With cb->strict_check set, the
 * request header is validated by rtnl_mdb_valid_dump_req(). Each device
 * from for_each_netdev() is dumped through its ndo_mdb_dump operation;
 * -EMSGSIZE from that call is tested for explicitly, and cb->ctx is zeroed
 * before the walk moves on to the next device.
 *
 * NOTE(review): devices without ndo_mdb_dump are presumably skipped;
 * confirm.
 */
6179 static int rtnl_mdb_dump(struct sk_buff *skb, struct netlink_callback *cb)
6181 struct rtnl_mdb_dump_ctx *ctx = (void *)cb->ctx;
6182 struct net *net = sock_net(skb->sk);
6183 struct net_device *dev;
6187 NL_ASSERT_DUMP_CTX_FITS(struct rtnl_mdb_dump_ctx);
6189 if (cb->strict_check) {
6190 err = rtnl_mdb_valid_dump_req(cb->nlh, cb->extack);
6198 for_each_netdev(net, dev) {
6201 if (!dev->netdev_ops->ndo_mdb_dump)
6204 err = dev->netdev_ops->ndo_mdb_dump(dev, skb, cb);
6205 if (err == -EMSGSIZE)
6207 /* Moving on to next device, reset markers and sequence
6208 * counters since they are all maintained per-device.
6210 memset(cb->ctx, 0, sizeof(cb->ctx));
/*
 * rtnl_validate_mdb_entry_get - policy validation callback for the
 * MDBA_GET_ENTRY attribute.
 *
 * The attribute payload must be exactly one struct br_mdb_entry. For a get
 * request the entry must not specify an ifindex; state and flags have
 * their own "cannot be specified" rejections. The VLAN id must be below
 * VLAN_VID_MASK, and addr.proto must be htons(ETH_P_IP),
 * htons(ETH_P_IPV6) or 0. Each rejection records a message in extack.
 */
6222 static int rtnl_validate_mdb_entry_get(const struct nlattr *attr,
6223 struct netlink_ext_ack *extack)
6225 struct br_mdb_entry *entry = nla_data(attr);
6227 if (nla_len(attr) != sizeof(struct br_mdb_entry)) {
6228 NL_SET_ERR_MSG_ATTR(extack, attr, "Invalid attribute length");
6232 if (entry->ifindex) {
6233 NL_SET_ERR_MSG(extack, "Entry ifindex cannot be specified");
6238 NL_SET_ERR_MSG(extack, "Entry state cannot be specified");
6243 NL_SET_ERR_MSG(extack, "Entry flags cannot be specified");
6247 if (entry->vid >= VLAN_VID_MASK) {
6248 NL_SET_ERR_MSG(extack, "Invalid entry VLAN id");
/* A protocol of 0 is accepted alongside IPv4 and IPv6. */
6252 if (entry->addr.proto != htons(ETH_P_IP) &&
6253 entry->addr.proto != htons(ETH_P_IPV6) &&
6254 entry->addr.proto != 0) {
6255 NL_SET_ERR_MSG(extack, "Unknown entry protocol");
/*
 * Attribute policy for MDB get requests: MDBA_GET_ENTRY is a binary
 * attribute bounded by sizeof(struct br_mdb_entry) and checked by
 * rtnl_validate_mdb_entry_get(); MDBA_GET_ENTRY_ATTRS is a nested
 * attribute.
 */
6262 static const struct nla_policy mdba_get_policy[MDBA_GET_ENTRY_MAX + 1] = {
6263 [MDBA_GET_ENTRY] = NLA_POLICY_VALIDATE_FN(NLA_BINARY,
6264 rtnl_validate_mdb_entry_get,
6265 sizeof(struct br_mdb_entry)),
6266 [MDBA_GET_ENTRY_ATTRS] = { .type = NLA_NESTED },
/*
 * rtnl_mdb_get - handle an MDB get request.
 *
 * The attributes after the struct br_port_msg header are parsed against
 * mdba_get_policy. The header must name a non-zero ifindex that resolves
 * to a device in the requesting socket's netns, MDBA_GET_ENTRY must be
 * present, and the device must implement ndo_mdb_get. The request is then
 * delegated to ndo_mdb_get() together with the requester's portid and the
 * message sequence number, and its return value is returned as is.
 */
6269 static int rtnl_mdb_get(struct sk_buff *in_skb, struct nlmsghdr *nlh,
6270 struct netlink_ext_ack *extack)
6272 struct nlattr *tb[MDBA_GET_ENTRY_MAX + 1];
6273 struct net *net = sock_net(in_skb->sk);
6274 struct br_port_msg *bpm;
6275 struct net_device *dev;
6278 err = nlmsg_parse(nlh, sizeof(struct br_port_msg), tb,
6279 MDBA_GET_ENTRY_MAX, mdba_get_policy, extack);
6283 bpm = nlmsg_data(nlh);
6284 if (!bpm->ifindex) {
6285 NL_SET_ERR_MSG(extack, "Invalid ifindex");
6289 dev = __dev_get_by_index(net, bpm->ifindex);
6291 NL_SET_ERR_MSG(extack, "Device doesn't exist");
6295 if (NL_REQ_ATTR_CHECK(extack, NULL, tb, MDBA_GET_ENTRY)) {
6296 NL_SET_ERR_MSG(extack, "Missing MDBA_GET_ENTRY attribute");
6300 if (!dev->netdev_ops->ndo_mdb_get) {
6301 NL_SET_ERR_MSG(extack, "Device does not support MDB operations");
6305 return dev->netdev_ops->ndo_mdb_get(dev, tb, NETLINK_CB(in_skb).portid,
6306 nlh->nlmsg_seq, extack);
/*
 * rtnl_validate_mdb_entry - policy validation callback for the
 * MDBA_SET_ENTRY attribute.
 *
 * The attribute payload must be exactly one struct br_mdb_entry with a
 * non-zero ifindex. The group address is checked according to addr.proto:
 *  - htons(ETH_P_IP): must be multicast or in the zero network, and must
 *    not be local multicast;
 *  - htons(ETH_P_IPV6), only when CONFIG_IPV6 is enabled: must not be the
 *    link-local all-nodes address;
 *  - 0: the MAC address must be a multicast Ethernet address;
 *  - anything else is reported as "Unknown entry protocol".
 * The state must be MDB_PERMANENT or MDB_TEMPORARY and the VLAN id must be
 * below VLAN_VID_MASK. Each rejection records a message in extack.
 */
6309 static int rtnl_validate_mdb_entry(const struct nlattr *attr,
6310 struct netlink_ext_ack *extack)
6312 struct br_mdb_entry *entry = nla_data(attr);
6314 if (nla_len(attr) != sizeof(struct br_mdb_entry)) {
6315 NL_SET_ERR_MSG_ATTR(extack, attr, "Invalid attribute length");
6319 if (entry->ifindex == 0) {
6320 NL_SET_ERR_MSG(extack, "Zero entry ifindex is not allowed");
6324 if (entry->addr.proto == htons(ETH_P_IP)) {
6325 if (!ipv4_is_multicast(entry->addr.u.ip4) &&
6326 !ipv4_is_zeronet(entry->addr.u.ip4)) {
6327 NL_SET_ERR_MSG(extack, "IPv4 entry group address is not multicast or 0.0.0.0");
6330 if (ipv4_is_local_multicast(entry->addr.u.ip4)) {
6331 NL_SET_ERR_MSG(extack, "IPv4 entry group address is local multicast");
6334 #if IS_ENABLED(CONFIG_IPV6)
6335 } else if (entry->addr.proto == htons(ETH_P_IPV6)) {
6336 if (ipv6_addr_is_ll_all_nodes(&entry->addr.u.ip6)) {
6337 NL_SET_ERR_MSG(extack, "IPv6 entry group address is link-local all nodes");
6341 } else if (entry->addr.proto == 0) {
6343 if (!is_multicast_ether_addr(entry->addr.u.mac_addr)) {
6344 NL_SET_ERR_MSG(extack, "L2 entry group is not multicast");
6348 NL_SET_ERR_MSG(extack, "Unknown entry protocol");
6352 if (entry->state != MDB_PERMANENT && entry->state != MDB_TEMPORARY) {
6353 NL_SET_ERR_MSG(extack, "Unknown entry state");
6356 if (entry->vid >= VLAN_VID_MASK) {
6357 NL_SET_ERR_MSG(extack, "Invalid entry VLAN id");
/*
 * Attribute policy shared by the MDB add and delete handlers.
 * strict_start_type is set to MDBA_SET_ENTRY_ATTRS + 1. MDBA_SET_ENTRY is
 * a binary attribute bounded by sizeof(struct br_mdb_entry) and checked by
 * rtnl_validate_mdb_entry(); MDBA_SET_ENTRY_ATTRS is a nested attribute.
 */
6364 static const struct nla_policy mdba_policy[MDBA_SET_ENTRY_MAX + 1] = {
6365 [MDBA_SET_ENTRY_UNSPEC] = { .strict_start_type = MDBA_SET_ENTRY_ATTRS + 1 },
6366 [MDBA_SET_ENTRY] = NLA_POLICY_VALIDATE_FN(NLA_BINARY,
6367 rtnl_validate_mdb_entry,
6368 sizeof(struct br_mdb_entry)),
6369 [MDBA_SET_ENTRY_ATTRS] = { .type = NLA_NESTED },
/*
 * rtnl_mdb_add - handle an MDB add request.
 *
 * The attributes after the struct br_port_msg header are parsed with
 * nlmsg_parse_deprecated() against mdba_policy. The header must name a
 * non-zero ifindex that resolves to a device in the requesting socket's
 * netns, MDBA_SET_ENTRY must be present, and the device must implement
 * ndo_mdb_add. The request is then delegated to ndo_mdb_add(), which also
 * receives nlh->nlmsg_flags; its return value is returned as is.
 */
6372 static int rtnl_mdb_add(struct sk_buff *skb, struct nlmsghdr *nlh,
6373 struct netlink_ext_ack *extack)
6375 struct nlattr *tb[MDBA_SET_ENTRY_MAX + 1];
6376 struct net *net = sock_net(skb->sk);
6377 struct br_port_msg *bpm;
6378 struct net_device *dev;
6381 err = nlmsg_parse_deprecated(nlh, sizeof(*bpm), tb,
6382 MDBA_SET_ENTRY_MAX, mdba_policy, extack);
6386 bpm = nlmsg_data(nlh);
6387 if (!bpm->ifindex) {
6388 NL_SET_ERR_MSG(extack, "Invalid ifindex");
6392 dev = __dev_get_by_index(net, bpm->ifindex);
6394 NL_SET_ERR_MSG(extack, "Device doesn't exist");
6398 if (NL_REQ_ATTR_CHECK(extack, NULL, tb, MDBA_SET_ENTRY)) {
6399 NL_SET_ERR_MSG(extack, "Missing MDBA_SET_ENTRY attribute");
6403 if (!dev->netdev_ops->ndo_mdb_add) {
6404 NL_SET_ERR_MSG(extack, "Device does not support MDB operations");
6408 return dev->netdev_ops->ndo_mdb_add(dev, tb, nlh->nlmsg_flags, extack);
/*
 * rtnl_mdb_del - handle an MDB delete request.
 *
 * The attributes after the struct br_port_msg header are parsed with
 * nlmsg_parse_deprecated() against mdba_policy. The header must name a
 * non-zero ifindex that resolves to a device in the requesting socket's
 * netns, MDBA_SET_ENTRY must be present, and the device must implement
 * ndo_mdb_del. The request is then delegated to ndo_mdb_del() and its
 * return value is returned as is.
 */
6411 static int rtnl_mdb_del(struct sk_buff *skb, struct nlmsghdr *nlh,
6412 struct netlink_ext_ack *extack)
6414 struct nlattr *tb[MDBA_SET_ENTRY_MAX + 1];
6415 struct net *net = sock_net(skb->sk);
6416 struct br_port_msg *bpm;
6417 struct net_device *dev;
6420 err = nlmsg_parse_deprecated(nlh, sizeof(*bpm), tb,
6421 MDBA_SET_ENTRY_MAX, mdba_policy, extack);
6425 bpm = nlmsg_data(nlh);
6426 if (!bpm->ifindex) {
6427 NL_SET_ERR_MSG(extack, "Invalid ifindex");
6431 dev = __dev_get_by_index(net, bpm->ifindex);
6433 NL_SET_ERR_MSG(extack, "Device doesn't exist");
6437 if (NL_REQ_ATTR_CHECK(extack, NULL, tb, MDBA_SET_ENTRY)) {
6438 NL_SET_ERR_MSG(extack, "Missing MDBA_SET_ENTRY attribute");
6442 if (!dev->netdev_ops->ndo_mdb_del) {
6443 NL_SET_ERR_MSG(extack, "Device does not support MDB operations");
6447 return dev->netdev_ops->ndo_mdb_del(dev, tb, extack);
6450 /* Process one rtnetlink message. */
/*
 * rtnetlink_rcv_msg - dispatch a single rtnetlink request to its handler.
 *
 * The payload must be at least sizeof(struct rtgenmsg) long; its
 * rtgen_family field together with the message type selects the
 * struct rtnl_link handler entry through rtnl_get_link(). Messages whose
 * kind is not RTNL_KIND_GET require CAP_NET_ADMIN, checked with
 * netlink_net_capable(). err starts out as -EOPNOTSUPP.
 *
 * GET requests carrying NLM_F_DUMP are started through
 * netlink_dump_start() using the link's dumpit callback; for RTM_GETLINK
 * the min_dump_alloc value comes from rtnl_calcit(). All other requests go
 * to the link's doit callback, with a second lookup under PF_UNSPEC when
 * the first one provides no doit handler.
 *
 * A delete carrying NLM_F_BULK is rejected with "Bulk delete is not
 * supported" unless the handler's flags include
 * RTNL_FLAG_BULK_DEL_SUPPORTED. Handlers flagged RTNL_FLAG_DOIT_UNLOCKED
 * take a separate branch from the remaining ones. A reference on the
 * owning module is taken with try_module_get(); -EPROTONOSUPPORT is the
 * error when that fails.
 */
6452 static int rtnetlink_rcv_msg(struct sk_buff *skb, struct nlmsghdr *nlh,
6453 struct netlink_ext_ack *extack)
6455 struct net *net = sock_net(skb->sk);
6456 struct rtnl_link *link;
6457 enum rtnl_kinds kind;
6458 struct module *owner;
6459 int err = -EOPNOTSUPP;
6460 rtnl_doit_func doit;
6465 type = nlh->nlmsg_type;
6471 /* All the messages must have at least 1 byte length */
6472 if (nlmsg_len(nlh) < sizeof(struct rtgenmsg))
6475 family = ((struct rtgenmsg *)nlmsg_data(nlh))->rtgen_family;
6476 kind = rtnl_msgtype_kind(type);
/* Everything except GET-kind messages needs CAP_NET_ADMIN. */
6478 if (kind != RTNL_KIND_GET && !netlink_net_capable(skb, CAP_NET_ADMIN))
/* Dump path: a GET-kind message with NLM_F_DUMP set. */
6482 if (kind == RTNL_KIND_GET && (nlh->nlmsg_flags & NLM_F_DUMP)) {
6484 rtnl_dumpit_func dumpit;
6485 u32 min_dump_alloc = 0;
6487 link = rtnl_get_link(family, type);
/* A second lookup is attempted when the first yields no dumpit handler. */
6488 if (!link || !link->dumpit) {
6490 link = rtnl_get_link(family, type);
6491 if (!link || !link->dumpit)
6494 owner = link->owner;
6495 dumpit = link->dumpit;
6497 if (type == RTM_GETLINK - RTM_BASE)
6498 min_dump_alloc = rtnl_calcit(skb, nlh);
6501 /* need to do this before rcu_read_unlock() */
6502 if (!try_module_get(owner))
6503 err = -EPROTONOSUPPORT;
6509 struct netlink_dump_control c = {
6511 .min_dump_alloc = min_dump_alloc,
6514 err = netlink_dump_start(rtnl, skb, nlh, &c);
6515 /* netlink_dump_start() will keep a reference on
6516 * module if dump is still in progress.
6523 link = rtnl_get_link(family, type);
6524 if (!link || !link->doit) {
6526 link = rtnl_get_link(PF_UNSPEC, type);
6527 if (!link || !link->doit)
6531 owner = link->owner;
6532 if (!try_module_get(owner)) {
6533 err = -EPROTONOSUPPORT;
6537 flags = link->flags;
6538 if (kind == RTNL_KIND_DEL && (nlh->nlmsg_flags & NLM_F_BULK) &&
6539 !(flags & RTNL_FLAG_BULK_DEL_SUPPORTED)) {
6540 NL_SET_ERR_MSG(extack, "Bulk delete is not supported");
6545 if (flags & RTNL_FLAG_DOIT_UNLOCKED) {
6549 err = doit(skb, nlh, extack);
6556 link = rtnl_get_link(family, type);
6557 if (link && link->doit)
6558 err = link->doit(skb, nlh, extack);
/*
 * rtnetlink_rcv - input handler of the rtnetlink kernel socket; passes the
 * skb to netlink_rcv_skb() with rtnetlink_rcv_msg() as the per-message
 * callback.
 */
6574 static void rtnetlink_rcv(struct sk_buff *skb)
6576 netlink_rcv_skb(skb, &rtnetlink_rcv_msg);
/*
 * rtnetlink_bind - bind hook of the rtnetlink kernel socket.
 *
 * For RTNLGRP_IPV4_MROUTE_R and RTNLGRP_IPV6_MROUTE_R the caller is
 * checked for CAP_NET_ADMIN in the user namespace of @net.
 *
 * NOTE(review): presumably binding is refused when the capability is
 * missing and allowed for all other groups; confirm.
 */
6579 static int rtnetlink_bind(struct net *net, int group)
6582 case RTNLGRP_IPV4_MROUTE_R:
6583 case RTNLGRP_IPV6_MROUTE_R:
6584 if (!ns_capable(net->user_ns, CAP_NET_ADMIN))
/*
 * rtnetlink_event - netdevice notifier callback.
 *
 * For the NETDEV_* events listed in the switch, an RTM_NEWLINK ifinfo
 * message is generated for the affected device through
 * rtmsg_ifinfo_event(), tagged with the value rtnl_get_event() derives
 * from the notifier event and allocated with GFP_KERNEL.
 */
6591 static int rtnetlink_event(struct notifier_block *this, unsigned long event, void *ptr)
6593 struct net_device *dev = netdev_notifier_info_to_dev(ptr);
6597 case NETDEV_CHANGEMTU:
6598 case NETDEV_CHANGEADDR:
6599 case NETDEV_CHANGENAME:
6600 case NETDEV_FEAT_CHANGE:
6601 case NETDEV_BONDING_FAILOVER:
6602 case NETDEV_POST_TYPE_CHANGE:
6603 case NETDEV_NOTIFY_PEERS:
6604 case NETDEV_CHANGEUPPER:
6605 case NETDEV_RESEND_IGMP:
6606 case NETDEV_CHANGEINFODATA:
6607 case NETDEV_CHANGELOWERSTATE:
6608 case NETDEV_CHANGE_TX_QUEUE_LEN:
6609 rtmsg_ifinfo_event(RTM_NEWLINK, dev, 0, rtnl_get_event(event),
6610 GFP_KERNEL, NULL, 0, 0, NULL);
/* Notifier block that routes netdevice events to rtnetlink_event(). */
6618 static struct notifier_block rtnetlink_dev_notifier = {
6619 .notifier_call = rtnetlink_event,
/*
 * rtnetlink_net_init - per-netns init: create the NETLINK_ROUTE kernel
 * socket for @net.
 *
 * The socket is configured with RTNLGRP_MAX groups, rtnetlink_rcv() as the
 * input handler, rtnl_mutex as the callback mutex, the
 * NL_CFG_F_NONROOT_RECV flag and rtnetlink_bind() as the bind hook.
 */
6623 static int __net_init rtnetlink_net_init(struct net *net)
6626 struct netlink_kernel_cfg cfg = {
6627 .groups = RTNLGRP_MAX,
6628 .input = rtnetlink_rcv,
6629 .cb_mutex = &rtnl_mutex,
6630 .flags = NL_CFG_F_NONROOT_RECV,
6631 .bind = rtnetlink_bind,
6634 sk = netlink_kernel_create(net, NETLINK_ROUTE, &cfg);
/* rtnetlink_net_exit - per-netns exit: release the kernel socket held in net->rtnl. */
6641 static void __net_exit rtnetlink_net_exit(struct net *net)
6643 netlink_kernel_release(net->rtnl);
/* Per-netns operations pairing rtnetlink_net_init() with rtnetlink_net_exit(). */
6647 static struct pernet_operations rtnetlink_net_ops = {
6648 .init = rtnetlink_net_init,
6649 .exit = rtnetlink_net_exit,
/*
 * rtnetlink_init - boot-time setup of the rtnetlink core.
 *
 * Registers the per-netns operations (panicking if that fails) and the
 * netdevice notifier, then registers the message handlers defined in this
 * file: PF_UNSPEC link, address/route/netconf dump, link property and
 * stats handlers, and PF_BRIDGE FDB (neigh), link and MDB handlers.
 */
6652 void __init rtnetlink_init(void)
6654 if (register_pernet_subsys(&rtnetlink_net_ops))
6655 panic("rtnetlink_init: cannot initialize rtnetlink\n");
6657 register_netdevice_notifier(&rtnetlink_dev_notifier);
/* PF_UNSPEC link handlers. */
6659 rtnl_register(PF_UNSPEC, RTM_GETLINK, rtnl_getlink,
6660 rtnl_dump_ifinfo, 0);
6661 rtnl_register(PF_UNSPEC, RTM_SETLINK, rtnl_setlink, NULL, 0);
6662 rtnl_register(PF_UNSPEC, RTM_NEWLINK, rtnl_newlink, NULL, 0);
6663 rtnl_register(PF_UNSPEC, RTM_DELLINK, rtnl_dellink, NULL, 0);
/* Dump-only entries served by rtnl_dump_all(). */
6665 rtnl_register(PF_UNSPEC, RTM_GETADDR, NULL, rtnl_dump_all, 0);
6666 rtnl_register(PF_UNSPEC, RTM_GETROUTE, NULL, rtnl_dump_all, 0);
6667 rtnl_register(PF_UNSPEC, RTM_GETNETCONF, NULL, rtnl_dump_all, 0);
6669 rtnl_register(PF_UNSPEC, RTM_NEWLINKPROP, rtnl_newlinkprop, NULL, 0);
6670 rtnl_register(PF_UNSPEC, RTM_DELLINKPROP, rtnl_dellinkprop, NULL, 0);
/* PF_BRIDGE FDB handlers; only the delete handler is registered with bulk-delete support. */
6672 rtnl_register(PF_BRIDGE, RTM_NEWNEIGH, rtnl_fdb_add, NULL, 0);
6673 rtnl_register(PF_BRIDGE, RTM_DELNEIGH, rtnl_fdb_del, NULL,
6674 RTNL_FLAG_BULK_DEL_SUPPORTED);
6675 rtnl_register(PF_BRIDGE, RTM_GETNEIGH, rtnl_fdb_get, rtnl_fdb_dump, 0);
/* PF_BRIDGE link handlers. */
6677 rtnl_register(PF_BRIDGE, RTM_GETLINK, NULL, rtnl_bridge_getlink, 0);
6678 rtnl_register(PF_BRIDGE, RTM_DELLINK, rtnl_bridge_dellink, NULL, 0);
6679 rtnl_register(PF_BRIDGE, RTM_SETLINK, rtnl_bridge_setlink, NULL, 0);
/* Stats handlers. */
6681 rtnl_register(PF_UNSPEC, RTM_GETSTATS, rtnl_stats_get, rtnl_stats_dump,
6683 rtnl_register(PF_UNSPEC, RTM_SETSTATS, rtnl_stats_set, NULL, 0);
/* PF_BRIDGE MDB handlers. */
6685 rtnl_register(PF_BRIDGE, RTM_GETMDB, rtnl_mdb_get, rtnl_mdb_dump, 0);
6686 rtnl_register(PF_BRIDGE, RTM_NEWMDB, rtnl_mdb_add, NULL, 0);
6687 rtnl_register(PF_BRIDGE, RTM_DELMDB, rtnl_mdb_del, NULL, 0);