2 * INET An implementation of the TCP/IP protocol suite for the LINUX
3 * operating system. INET is implemented using the BSD Socket
4 * interface as the means of communication with the user level.
6 * Routing netlink socket interface: protocol independent part.
8 * Authors: Alexey Kuznetsov, <kuznet@ms2.inr.ac.ru>
10 * This program is free software; you can redistribute it and/or
11 * modify it under the terms of the GNU General Public License
12 * as published by the Free Software Foundation; either version
13 * 2 of the License, or (at your option) any later version.
16 * Vitaly E. Lavrov RTA_OK arithmetics was wrong.
19 #include <linux/errno.h>
20 #include <linux/module.h>
21 #include <linux/types.h>
22 #include <linux/socket.h>
23 #include <linux/kernel.h>
24 #include <linux/timer.h>
25 #include <linux/string.h>
26 #include <linux/sockios.h>
27 #include <linux/net.h>
28 #include <linux/fcntl.h>
30 #include <linux/slab.h>
31 #include <linux/interrupt.h>
32 #include <linux/capability.h>
33 #include <linux/skbuff.h>
34 #include <linux/init.h>
35 #include <linux/security.h>
36 #include <linux/mutex.h>
37 #include <linux/if_addr.h>
38 #include <linux/if_bridge.h>
39 #include <linux/if_vlan.h>
40 #include <linux/pci.h>
41 #include <linux/etherdevice.h>
43 #include <asm/uaccess.h>
45 #include <linux/inet.h>
46 #include <linux/netdevice.h>
47 #include <net/switchdev.h>
49 #include <net/protocol.h>
51 #include <net/route.h>
55 #include <net/pkt_sched.h>
56 #include <net/fib_rules.h>
57 #include <net/rtnetlink.h>
58 #include <net/net_namespace.h>
62 rtnl_dumpit_func dumpit
;
63 rtnl_calcit_func calcit
;
66 static DEFINE_MUTEX(rtnl_mutex
);
70 mutex_lock(&rtnl_mutex
);
72 EXPORT_SYMBOL(rtnl_lock
);
74 void __rtnl_unlock(void)
76 mutex_unlock(&rtnl_mutex
);
79 void rtnl_unlock(void)
81 /* This fellow will unlock it for us. */
84 EXPORT_SYMBOL(rtnl_unlock
);
86 int rtnl_trylock(void)
88 return mutex_trylock(&rtnl_mutex
);
90 EXPORT_SYMBOL(rtnl_trylock
);
92 int rtnl_is_locked(void)
94 return mutex_is_locked(&rtnl_mutex
);
96 EXPORT_SYMBOL(rtnl_is_locked
);
98 #ifdef CONFIG_PROVE_LOCKING
99 bool lockdep_rtnl_is_held(void)
101 return lockdep_is_held(&rtnl_mutex
);
103 EXPORT_SYMBOL(lockdep_rtnl_is_held
);
104 #endif /* #ifdef CONFIG_PROVE_LOCKING */
106 static struct rtnl_link
*rtnl_msg_handlers
[RTNL_FAMILY_MAX
+ 1];
108 static inline int rtm_msgindex(int msgtype
)
110 int msgindex
= msgtype
- RTM_BASE
;
113 * msgindex < 0 implies someone tried to register a netlink
114 * control code. msgindex >= RTM_NR_MSGTYPES may indicate that
115 * the message type has not been added to linux/rtnetlink.h
117 BUG_ON(msgindex
< 0 || msgindex
>= RTM_NR_MSGTYPES
);
122 static rtnl_doit_func
rtnl_get_doit(int protocol
, int msgindex
)
124 struct rtnl_link
*tab
;
126 if (protocol
<= RTNL_FAMILY_MAX
)
127 tab
= rtnl_msg_handlers
[protocol
];
131 if (tab
== NULL
|| tab
[msgindex
].doit
== NULL
)
132 tab
= rtnl_msg_handlers
[PF_UNSPEC
];
134 return tab
[msgindex
].doit
;
137 static rtnl_dumpit_func
rtnl_get_dumpit(int protocol
, int msgindex
)
139 struct rtnl_link
*tab
;
141 if (protocol
<= RTNL_FAMILY_MAX
)
142 tab
= rtnl_msg_handlers
[protocol
];
146 if (tab
== NULL
|| tab
[msgindex
].dumpit
== NULL
)
147 tab
= rtnl_msg_handlers
[PF_UNSPEC
];
149 return tab
[msgindex
].dumpit
;
152 static rtnl_calcit_func
rtnl_get_calcit(int protocol
, int msgindex
)
154 struct rtnl_link
*tab
;
156 if (protocol
<= RTNL_FAMILY_MAX
)
157 tab
= rtnl_msg_handlers
[protocol
];
161 if (tab
== NULL
|| tab
[msgindex
].calcit
== NULL
)
162 tab
= rtnl_msg_handlers
[PF_UNSPEC
];
164 return tab
[msgindex
].calcit
;
168 * __rtnl_register - Register a rtnetlink message type
169 * @protocol: Protocol family or PF_UNSPEC
170 * @msgtype: rtnetlink message type
171 * @doit: Function pointer called for each request message
172 * @dumpit: Function pointer called for each dump request (NLM_F_DUMP) message
173 * @calcit: Function pointer to calc size of dump message
175 * Registers the specified function pointers (at least one of them has
176 * to be non-NULL) to be called whenever a request message for the
177 * specified protocol family and message type is received.
179 * The special protocol family PF_UNSPEC may be used to define fallback
180 * function pointers for the case when no entry for the specific protocol family exists.
183 * Returns 0 on success or a negative error code.
185 int __rtnl_register(int protocol
, int msgtype
,
186 rtnl_doit_func doit
, rtnl_dumpit_func dumpit
,
187 rtnl_calcit_func calcit
)
189 struct rtnl_link
*tab
;
192 BUG_ON(protocol
< 0 || protocol
> RTNL_FAMILY_MAX
);
193 msgindex
= rtm_msgindex(msgtype
);
195 tab
= rtnl_msg_handlers
[protocol
];
197 tab
= kcalloc(RTM_NR_MSGTYPES
, sizeof(*tab
), GFP_KERNEL
);
201 rtnl_msg_handlers
[protocol
] = tab
;
205 tab
[msgindex
].doit
= doit
;
208 tab
[msgindex
].dumpit
= dumpit
;
211 tab
[msgindex
].calcit
= calcit
;
215 EXPORT_SYMBOL_GPL(__rtnl_register
);
218 * rtnl_register - Register a rtnetlink message type
220 * Identical to __rtnl_register() but panics on failure. This is useful
221 * as failure of this function is very unlikely, it can only happen due
222 * to lack of memory when allocating the chain to store all message
223 * handlers for a protocol. Meant for use in init functions where lack
224 * of memory implies no sense in continuing.
226 void rtnl_register(int protocol
, int msgtype
,
227 rtnl_doit_func doit
, rtnl_dumpit_func dumpit
,
228 rtnl_calcit_func calcit
)
230 if (__rtnl_register(protocol
, msgtype
, doit
, dumpit
, calcit
) < 0)
231 panic("Unable to register rtnetlink message handler, "
232 "protocol = %d, message type = %d\n",
235 EXPORT_SYMBOL_GPL(rtnl_register
);
238 * rtnl_unregister - Unregister a rtnetlink message type
239 * @protocol: Protocol family or PF_UNSPEC
240 * @msgtype: rtnetlink message type
242 * Returns 0 on success or a negative error code.
244 int rtnl_unregister(int protocol
, int msgtype
)
248 BUG_ON(protocol
< 0 || protocol
> RTNL_FAMILY_MAX
);
249 msgindex
= rtm_msgindex(msgtype
);
251 if (rtnl_msg_handlers
[protocol
] == NULL
)
254 rtnl_msg_handlers
[protocol
][msgindex
].doit
= NULL
;
255 rtnl_msg_handlers
[protocol
][msgindex
].dumpit
= NULL
;
259 EXPORT_SYMBOL_GPL(rtnl_unregister
);
262 * rtnl_unregister_all - Unregister all rtnetlink message type of a protocol
263 * @protocol : Protocol family or PF_UNSPEC
265 * Identical to calling rtnl_unregster() for all registered message types
266 * of a certain protocol family.
268 void rtnl_unregister_all(int protocol
)
270 BUG_ON(protocol
< 0 || protocol
> RTNL_FAMILY_MAX
);
272 kfree(rtnl_msg_handlers
[protocol
]);
273 rtnl_msg_handlers
[protocol
] = NULL
;
275 EXPORT_SYMBOL_GPL(rtnl_unregister_all
);
277 static LIST_HEAD(link_ops
);
279 static const struct rtnl_link_ops
*rtnl_link_ops_get(const char *kind
)
281 const struct rtnl_link_ops
*ops
;
283 list_for_each_entry(ops
, &link_ops
, list
) {
284 if (!strcmp(ops
->kind
, kind
))
291 * __rtnl_link_register - Register rtnl_link_ops with rtnetlink.
292 * @ops: struct rtnl_link_ops * to register
294 * The caller must hold the rtnl_mutex. This function should be used
295 * by drivers that create devices during module initialization. It
296 * must be called before registering the devices.
298 * Returns 0 on success or a negative error code.
300 int __rtnl_link_register(struct rtnl_link_ops
*ops
)
302 if (rtnl_link_ops_get(ops
->kind
))
305 /* The check for setup is here because if ops
306 * does not have that filled up, it is not possible
307 * to use the ops for creating device. So do not
308 * fill up dellink as well. That disables rtnl_dellink.
310 if (ops
->setup
&& !ops
->dellink
)
311 ops
->dellink
= unregister_netdevice_queue
;
313 list_add_tail(&ops
->list
, &link_ops
);
316 EXPORT_SYMBOL_GPL(__rtnl_link_register
);
319 * rtnl_link_register - Register rtnl_link_ops with rtnetlink.
320 * @ops: struct rtnl_link_ops * to register
322 * Returns 0 on success or a negative error code.
324 int rtnl_link_register(struct rtnl_link_ops
*ops
)
329 err
= __rtnl_link_register(ops
);
333 EXPORT_SYMBOL_GPL(rtnl_link_register
);
335 static void __rtnl_kill_links(struct net
*net
, struct rtnl_link_ops
*ops
)
337 struct net_device
*dev
;
338 LIST_HEAD(list_kill
);
340 for_each_netdev(net
, dev
) {
341 if (dev
->rtnl_link_ops
== ops
)
342 ops
->dellink(dev
, &list_kill
);
344 unregister_netdevice_many(&list_kill
);
348 * __rtnl_link_unregister - Unregister rtnl_link_ops from rtnetlink.
349 * @ops: struct rtnl_link_ops * to unregister
351 * The caller must hold the rtnl_mutex.
353 void __rtnl_link_unregister(struct rtnl_link_ops
*ops
)
358 __rtnl_kill_links(net
, ops
);
360 list_del(&ops
->list
);
362 EXPORT_SYMBOL_GPL(__rtnl_link_unregister
);
364 /* Return with the rtnl_lock held when there are no network
365 * devices unregistering in any network namespace.
367 static void rtnl_lock_unregistering_all(void)
371 DEFINE_WAIT_FUNC(wait
, woken_wake_function
);
373 add_wait_queue(&netdev_unregistering_wq
, &wait
);
375 unregistering
= false;
378 if (net
->dev_unreg_count
> 0) {
379 unregistering
= true;
387 wait_woken(&wait
, TASK_UNINTERRUPTIBLE
, MAX_SCHEDULE_TIMEOUT
);
389 remove_wait_queue(&netdev_unregistering_wq
, &wait
);
393 * rtnl_link_unregister - Unregister rtnl_link_ops from rtnetlink.
394 * @ops: struct rtnl_link_ops * to unregister
396 void rtnl_link_unregister(struct rtnl_link_ops
*ops
)
398 /* Close the race with cleanup_net() */
399 mutex_lock(&net_mutex
);
400 rtnl_lock_unregistering_all();
401 __rtnl_link_unregister(ops
);
403 mutex_unlock(&net_mutex
);
405 EXPORT_SYMBOL_GPL(rtnl_link_unregister
);
407 static size_t rtnl_link_get_slave_info_data_size(const struct net_device
*dev
)
409 struct net_device
*master_dev
;
410 const struct rtnl_link_ops
*ops
;
412 master_dev
= netdev_master_upper_dev_get((struct net_device
*) dev
);
415 ops
= master_dev
->rtnl_link_ops
;
416 if (!ops
|| !ops
->get_slave_size
)
418 /* IFLA_INFO_SLAVE_DATA + nested data */
419 return nla_total_size(sizeof(struct nlattr
)) +
420 ops
->get_slave_size(master_dev
, dev
);
423 static size_t rtnl_link_get_size(const struct net_device
*dev
)
425 const struct rtnl_link_ops
*ops
= dev
->rtnl_link_ops
;
431 size
= nla_total_size(sizeof(struct nlattr
)) + /* IFLA_LINKINFO */
432 nla_total_size(strlen(ops
->kind
) + 1); /* IFLA_INFO_KIND */
435 /* IFLA_INFO_DATA + nested data */
436 size
+= nla_total_size(sizeof(struct nlattr
)) +
439 if (ops
->get_xstats_size
)
440 /* IFLA_INFO_XSTATS */
441 size
+= nla_total_size(ops
->get_xstats_size(dev
));
443 size
+= rtnl_link_get_slave_info_data_size(dev
);
448 static LIST_HEAD(rtnl_af_ops
);
450 static const struct rtnl_af_ops
*rtnl_af_lookup(const int family
)
452 const struct rtnl_af_ops
*ops
;
454 list_for_each_entry(ops
, &rtnl_af_ops
, list
) {
455 if (ops
->family
== family
)
463 * rtnl_af_register - Register rtnl_af_ops with rtnetlink.
464 * @ops: struct rtnl_af_ops * to register
466 * This function does not return a value.
468 void rtnl_af_register(struct rtnl_af_ops
*ops
)
471 list_add_tail(&ops
->list
, &rtnl_af_ops
);
474 EXPORT_SYMBOL_GPL(rtnl_af_register
);
477 * __rtnl_af_unregister - Unregister rtnl_af_ops from rtnetlink.
478 * @ops: struct rtnl_af_ops * to unregister
480 * The caller must hold the rtnl_mutex.
482 void __rtnl_af_unregister(struct rtnl_af_ops
*ops
)
484 list_del(&ops
->list
);
486 EXPORT_SYMBOL_GPL(__rtnl_af_unregister
);
489 * rtnl_af_unregister - Unregister rtnl_af_ops from rtnetlink.
490 * @ops: struct rtnl_af_ops * to unregister
492 void rtnl_af_unregister(struct rtnl_af_ops
*ops
)
495 __rtnl_af_unregister(ops
);
498 EXPORT_SYMBOL_GPL(rtnl_af_unregister
);
500 static size_t rtnl_link_get_af_size(const struct net_device
*dev
,
503 struct rtnl_af_ops
*af_ops
;
507 size
= nla_total_size(sizeof(struct nlattr
));
509 list_for_each_entry(af_ops
, &rtnl_af_ops
, list
) {
510 if (af_ops
->get_link_af_size
) {
511 /* AF_* + nested data */
512 size
+= nla_total_size(sizeof(struct nlattr
)) +
513 af_ops
->get_link_af_size(dev
, ext_filter_mask
);
520 static bool rtnl_have_link_slave_info(const struct net_device
*dev
)
522 struct net_device
*master_dev
;
524 master_dev
= netdev_master_upper_dev_get((struct net_device
*) dev
);
525 if (master_dev
&& master_dev
->rtnl_link_ops
)
530 static int rtnl_link_slave_info_fill(struct sk_buff
*skb
,
531 const struct net_device
*dev
)
533 struct net_device
*master_dev
;
534 const struct rtnl_link_ops
*ops
;
535 struct nlattr
*slave_data
;
538 master_dev
= netdev_master_upper_dev_get((struct net_device
*) dev
);
541 ops
= master_dev
->rtnl_link_ops
;
544 if (nla_put_string(skb
, IFLA_INFO_SLAVE_KIND
, ops
->kind
) < 0)
546 if (ops
->fill_slave_info
) {
547 slave_data
= nla_nest_start(skb
, IFLA_INFO_SLAVE_DATA
);
550 err
= ops
->fill_slave_info(skb
, master_dev
, dev
);
552 goto err_cancel_slave_data
;
553 nla_nest_end(skb
, slave_data
);
557 err_cancel_slave_data
:
558 nla_nest_cancel(skb
, slave_data
);
562 static int rtnl_link_info_fill(struct sk_buff
*skb
,
563 const struct net_device
*dev
)
565 const struct rtnl_link_ops
*ops
= dev
->rtnl_link_ops
;
571 if (nla_put_string(skb
, IFLA_INFO_KIND
, ops
->kind
) < 0)
573 if (ops
->fill_xstats
) {
574 err
= ops
->fill_xstats(skb
, dev
);
578 if (ops
->fill_info
) {
579 data
= nla_nest_start(skb
, IFLA_INFO_DATA
);
582 err
= ops
->fill_info(skb
, dev
);
584 goto err_cancel_data
;
585 nla_nest_end(skb
, data
);
590 nla_nest_cancel(skb
, data
);
594 static int rtnl_link_fill(struct sk_buff
*skb
, const struct net_device
*dev
)
596 struct nlattr
*linkinfo
;
599 linkinfo
= nla_nest_start(skb
, IFLA_LINKINFO
);
600 if (linkinfo
== NULL
)
603 err
= rtnl_link_info_fill(skb
, dev
);
605 goto err_cancel_link
;
607 err
= rtnl_link_slave_info_fill(skb
, dev
);
609 goto err_cancel_link
;
611 nla_nest_end(skb
, linkinfo
);
615 nla_nest_cancel(skb
, linkinfo
);
620 int rtnetlink_send(struct sk_buff
*skb
, struct net
*net
, u32 pid
, unsigned int group
, int echo
)
622 struct sock
*rtnl
= net
->rtnl
;
625 NETLINK_CB(skb
).dst_group
= group
;
627 atomic_inc(&skb
->users
);
628 netlink_broadcast(rtnl
, skb
, pid
, group
, GFP_KERNEL
);
630 err
= netlink_unicast(rtnl
, skb
, pid
, MSG_DONTWAIT
);
634 int rtnl_unicast(struct sk_buff
*skb
, struct net
*net
, u32 pid
)
636 struct sock
*rtnl
= net
->rtnl
;
638 return nlmsg_unicast(rtnl
, skb
, pid
);
640 EXPORT_SYMBOL(rtnl_unicast
);
642 void rtnl_notify(struct sk_buff
*skb
, struct net
*net
, u32 pid
, u32 group
,
643 struct nlmsghdr
*nlh
, gfp_t flags
)
645 struct sock
*rtnl
= net
->rtnl
;
649 report
= nlmsg_report(nlh
);
651 nlmsg_notify(rtnl
, skb
, pid
, group
, report
, flags
);
653 EXPORT_SYMBOL(rtnl_notify
);
655 void rtnl_set_sk_err(struct net
*net
, u32 group
, int error
)
657 struct sock
*rtnl
= net
->rtnl
;
659 netlink_set_err(rtnl
, 0, group
, error
);
661 EXPORT_SYMBOL(rtnl_set_sk_err
);
663 int rtnetlink_put_metrics(struct sk_buff
*skb
, u32
*metrics
)
668 mx
= nla_nest_start(skb
, RTA_METRICS
);
672 for (i
= 0; i
< RTAX_MAX
; i
++) {
674 if (i
== RTAX_CC_ALGO
- 1) {
675 char tmp
[TCP_CA_NAME_MAX
], *name
;
677 name
= tcp_ca_get_name_by_key(metrics
[i
], tmp
);
680 if (nla_put_string(skb
, i
+ 1, name
))
681 goto nla_put_failure
;
682 } else if (i
== RTAX_FEATURES
- 1) {
683 u32 user_features
= metrics
[i
] & RTAX_FEATURE_MASK
;
685 BUILD_BUG_ON(RTAX_FEATURE_MASK
& DST_FEATURE_MASK
);
686 if (nla_put_u32(skb
, i
+ 1, user_features
))
687 goto nla_put_failure
;
689 if (nla_put_u32(skb
, i
+ 1, metrics
[i
]))
690 goto nla_put_failure
;
697 nla_nest_cancel(skb
, mx
);
701 return nla_nest_end(skb
, mx
);
704 nla_nest_cancel(skb
, mx
);
707 EXPORT_SYMBOL(rtnetlink_put_metrics
);
709 int rtnl_put_cacheinfo(struct sk_buff
*skb
, struct dst_entry
*dst
, u32 id
,
710 long expires
, u32 error
)
712 struct rta_cacheinfo ci
= {
713 .rta_lastuse
= jiffies_delta_to_clock_t(jiffies
- dst
->lastuse
),
714 .rta_used
= dst
->__use
,
715 .rta_clntref
= atomic_read(&(dst
->__refcnt
)),
723 clock
= jiffies_to_clock_t(abs(expires
));
724 clock
= min_t(unsigned long, clock
, INT_MAX
);
725 ci
.rta_expires
= (expires
> 0) ? clock
: -clock
;
727 return nla_put(skb
, RTA_CACHEINFO
, sizeof(ci
), &ci
);
729 EXPORT_SYMBOL_GPL(rtnl_put_cacheinfo
);
731 static void set_operstate(struct net_device
*dev
, unsigned char transition
)
733 unsigned char operstate
= dev
->operstate
;
735 switch (transition
) {
737 if ((operstate
== IF_OPER_DORMANT
||
738 operstate
== IF_OPER_UNKNOWN
) &&
740 operstate
= IF_OPER_UP
;
743 case IF_OPER_DORMANT
:
744 if (operstate
== IF_OPER_UP
||
745 operstate
== IF_OPER_UNKNOWN
)
746 operstate
= IF_OPER_DORMANT
;
750 if (dev
->operstate
!= operstate
) {
751 write_lock_bh(&dev_base_lock
);
752 dev
->operstate
= operstate
;
753 write_unlock_bh(&dev_base_lock
);
754 netdev_state_change(dev
);
758 static unsigned int rtnl_dev_get_flags(const struct net_device
*dev
)
760 return (dev
->flags
& ~(IFF_PROMISC
| IFF_ALLMULTI
)) |
761 (dev
->gflags
& (IFF_PROMISC
| IFF_ALLMULTI
));
764 static unsigned int rtnl_dev_combine_flags(const struct net_device
*dev
,
765 const struct ifinfomsg
*ifm
)
767 unsigned int flags
= ifm
->ifi_flags
;
769 /* bugwards compatibility: ifi_change == 0 is treated as ~0 */
771 flags
= (flags
& ifm
->ifi_change
) |
772 (rtnl_dev_get_flags(dev
) & ~ifm
->ifi_change
);
777 static void copy_rtnl_link_stats(struct rtnl_link_stats
*a
,
778 const struct rtnl_link_stats64
*b
)
780 a
->rx_packets
= b
->rx_packets
;
781 a
->tx_packets
= b
->tx_packets
;
782 a
->rx_bytes
= b
->rx_bytes
;
783 a
->tx_bytes
= b
->tx_bytes
;
784 a
->rx_errors
= b
->rx_errors
;
785 a
->tx_errors
= b
->tx_errors
;
786 a
->rx_dropped
= b
->rx_dropped
;
787 a
->tx_dropped
= b
->tx_dropped
;
789 a
->multicast
= b
->multicast
;
790 a
->collisions
= b
->collisions
;
792 a
->rx_length_errors
= b
->rx_length_errors
;
793 a
->rx_over_errors
= b
->rx_over_errors
;
794 a
->rx_crc_errors
= b
->rx_crc_errors
;
795 a
->rx_frame_errors
= b
->rx_frame_errors
;
796 a
->rx_fifo_errors
= b
->rx_fifo_errors
;
797 a
->rx_missed_errors
= b
->rx_missed_errors
;
799 a
->tx_aborted_errors
= b
->tx_aborted_errors
;
800 a
->tx_carrier_errors
= b
->tx_carrier_errors
;
801 a
->tx_fifo_errors
= b
->tx_fifo_errors
;
802 a
->tx_heartbeat_errors
= b
->tx_heartbeat_errors
;
803 a
->tx_window_errors
= b
->tx_window_errors
;
805 a
->rx_compressed
= b
->rx_compressed
;
806 a
->tx_compressed
= b
->tx_compressed
;
808 a
->rx_nohandler
= b
->rx_nohandler
;
811 static void copy_rtnl_link_stats64(void *v
, const struct rtnl_link_stats64
*b
)
813 memcpy(v
, b
, sizeof(*b
));
817 static inline int rtnl_vfinfo_size(const struct net_device
*dev
,
820 if (dev
->dev
.parent
&& dev_is_pci(dev
->dev
.parent
) &&
821 (ext_filter_mask
& RTEXT_FILTER_VF
)) {
822 int num_vfs
= dev_num_vf(dev
->dev
.parent
);
823 size_t size
= nla_total_size(sizeof(struct nlattr
));
824 size
+= nla_total_size(num_vfs
* sizeof(struct nlattr
));
826 (nla_total_size(sizeof(struct ifla_vf_mac
)) +
827 nla_total_size(sizeof(struct ifla_vf_vlan
)) +
828 nla_total_size(sizeof(struct ifla_vf_spoofchk
)) +
829 nla_total_size(sizeof(struct ifla_vf_rate
)) +
830 nla_total_size(sizeof(struct ifla_vf_link_state
)) +
831 nla_total_size(sizeof(struct ifla_vf_rss_query_en
)) +
832 /* IFLA_VF_STATS_RX_PACKETS */
833 nla_total_size(sizeof(__u64
)) +
834 /* IFLA_VF_STATS_TX_PACKETS */
835 nla_total_size(sizeof(__u64
)) +
836 /* IFLA_VF_STATS_RX_BYTES */
837 nla_total_size(sizeof(__u64
)) +
838 /* IFLA_VF_STATS_TX_BYTES */
839 nla_total_size(sizeof(__u64
)) +
840 /* IFLA_VF_STATS_BROADCAST */
841 nla_total_size(sizeof(__u64
)) +
842 /* IFLA_VF_STATS_MULTICAST */
843 nla_total_size(sizeof(__u64
)) +
844 nla_total_size(sizeof(struct ifla_vf_trust
)));
850 static size_t rtnl_port_size(const struct net_device
*dev
,
853 size_t port_size
= nla_total_size(4) /* PORT_VF */
854 + nla_total_size(PORT_PROFILE_MAX
) /* PORT_PROFILE */
855 + nla_total_size(sizeof(struct ifla_port_vsi
))
857 + nla_total_size(PORT_UUID_MAX
) /* PORT_INSTANCE_UUID */
858 + nla_total_size(PORT_UUID_MAX
) /* PORT_HOST_UUID */
859 + nla_total_size(1) /* PROT_VDP_REQUEST */
860 + nla_total_size(2); /* PORT_VDP_RESPONSE */
861 size_t vf_ports_size
= nla_total_size(sizeof(struct nlattr
));
862 size_t vf_port_size
= nla_total_size(sizeof(struct nlattr
))
864 size_t port_self_size
= nla_total_size(sizeof(struct nlattr
))
867 if (!dev
->netdev_ops
->ndo_get_vf_port
|| !dev
->dev
.parent
||
868 !(ext_filter_mask
& RTEXT_FILTER_VF
))
870 if (dev_num_vf(dev
->dev
.parent
))
871 return port_self_size
+ vf_ports_size
+
872 vf_port_size
* dev_num_vf(dev
->dev
.parent
);
874 return port_self_size
;
877 static noinline
size_t if_nlmsg_size(const struct net_device
*dev
,
880 return NLMSG_ALIGN(sizeof(struct ifinfomsg
))
881 + nla_total_size(IFNAMSIZ
) /* IFLA_IFNAME */
882 + nla_total_size(IFALIASZ
) /* IFLA_IFALIAS */
883 + nla_total_size(IFNAMSIZ
) /* IFLA_QDISC */
884 + nla_total_size(sizeof(struct rtnl_link_ifmap
))
885 + nla_total_size(sizeof(struct rtnl_link_stats
))
886 + nla_total_size(sizeof(struct rtnl_link_stats64
))
887 + nla_total_size(MAX_ADDR_LEN
) /* IFLA_ADDRESS */
888 + nla_total_size(MAX_ADDR_LEN
) /* IFLA_BROADCAST */
889 + nla_total_size(4) /* IFLA_TXQLEN */
890 + nla_total_size(4) /* IFLA_WEIGHT */
891 + nla_total_size(4) /* IFLA_MTU */
892 + nla_total_size(4) /* IFLA_LINK */
893 + nla_total_size(4) /* IFLA_MASTER */
894 + nla_total_size(1) /* IFLA_CARRIER */
895 + nla_total_size(4) /* IFLA_PROMISCUITY */
896 + nla_total_size(4) /* IFLA_NUM_TX_QUEUES */
897 + nla_total_size(4) /* IFLA_NUM_RX_QUEUES */
898 + nla_total_size(4) /* IFLA_MAX_GSO_SEGS */
899 + nla_total_size(4) /* IFLA_MAX_GSO_SIZE */
900 + nla_total_size(1) /* IFLA_OPERSTATE */
901 + nla_total_size(1) /* IFLA_LINKMODE */
902 + nla_total_size(4) /* IFLA_CARRIER_CHANGES */
903 + nla_total_size(4) /* IFLA_LINK_NETNSID */
904 + nla_total_size(ext_filter_mask
905 & RTEXT_FILTER_VF
? 4 : 0) /* IFLA_NUM_VF */
906 + rtnl_vfinfo_size(dev
, ext_filter_mask
) /* IFLA_VFINFO_LIST */
907 + rtnl_port_size(dev
, ext_filter_mask
) /* IFLA_VF_PORTS + IFLA_PORT_SELF */
908 + rtnl_link_get_size(dev
) /* IFLA_LINKINFO */
909 + rtnl_link_get_af_size(dev
, ext_filter_mask
) /* IFLA_AF_SPEC */
910 + nla_total_size(MAX_PHYS_ITEM_ID_LEN
) /* IFLA_PHYS_PORT_ID */
911 + nla_total_size(MAX_PHYS_ITEM_ID_LEN
) /* IFLA_PHYS_SWITCH_ID */
912 + nla_total_size(IFNAMSIZ
) /* IFLA_PHYS_PORT_NAME */
913 + nla_total_size(1); /* IFLA_PROTO_DOWN */
917 static int rtnl_vf_ports_fill(struct sk_buff
*skb
, struct net_device
*dev
)
919 struct nlattr
*vf_ports
;
920 struct nlattr
*vf_port
;
924 vf_ports
= nla_nest_start(skb
, IFLA_VF_PORTS
);
928 for (vf
= 0; vf
< dev_num_vf(dev
->dev
.parent
); vf
++) {
929 vf_port
= nla_nest_start(skb
, IFLA_VF_PORT
);
931 goto nla_put_failure
;
932 if (nla_put_u32(skb
, IFLA_PORT_VF
, vf
))
933 goto nla_put_failure
;
934 err
= dev
->netdev_ops
->ndo_get_vf_port(dev
, vf
, skb
);
935 if (err
== -EMSGSIZE
)
936 goto nla_put_failure
;
938 nla_nest_cancel(skb
, vf_port
);
941 nla_nest_end(skb
, vf_port
);
944 nla_nest_end(skb
, vf_ports
);
949 nla_nest_cancel(skb
, vf_ports
);
953 static int rtnl_port_self_fill(struct sk_buff
*skb
, struct net_device
*dev
)
955 struct nlattr
*port_self
;
958 port_self
= nla_nest_start(skb
, IFLA_PORT_SELF
);
962 err
= dev
->netdev_ops
->ndo_get_vf_port(dev
, PORT_SELF_VF
, skb
);
964 nla_nest_cancel(skb
, port_self
);
965 return (err
== -EMSGSIZE
) ? err
: 0;
968 nla_nest_end(skb
, port_self
);
973 static int rtnl_port_fill(struct sk_buff
*skb
, struct net_device
*dev
,
978 if (!dev
->netdev_ops
->ndo_get_vf_port
|| !dev
->dev
.parent
||
979 !(ext_filter_mask
& RTEXT_FILTER_VF
))
982 err
= rtnl_port_self_fill(skb
, dev
);
986 if (dev_num_vf(dev
->dev
.parent
)) {
987 err
= rtnl_vf_ports_fill(skb
, dev
);
995 static int rtnl_phys_port_id_fill(struct sk_buff
*skb
, struct net_device
*dev
)
998 struct netdev_phys_item_id ppid
;
1000 err
= dev_get_phys_port_id(dev
, &ppid
);
1002 if (err
== -EOPNOTSUPP
)
1007 if (nla_put(skb
, IFLA_PHYS_PORT_ID
, ppid
.id_len
, ppid
.id
))
1013 static int rtnl_phys_port_name_fill(struct sk_buff
*skb
, struct net_device
*dev
)
1015 char name
[IFNAMSIZ
];
1018 err
= dev_get_phys_port_name(dev
, name
, sizeof(name
));
1020 if (err
== -EOPNOTSUPP
)
1025 if (nla_put(skb
, IFLA_PHYS_PORT_NAME
, strlen(name
), name
))
1031 static int rtnl_phys_switch_id_fill(struct sk_buff
*skb
, struct net_device
*dev
)
1034 struct switchdev_attr attr
= {
1036 .id
= SWITCHDEV_ATTR_ID_PORT_PARENT_ID
,
1037 .flags
= SWITCHDEV_F_NO_RECURSE
,
1040 err
= switchdev_port_attr_get(dev
, &attr
);
1042 if (err
== -EOPNOTSUPP
)
1047 if (nla_put(skb
, IFLA_PHYS_SWITCH_ID
, attr
.u
.ppid
.id_len
,
1054 static noinline_for_stack
int rtnl_fill_stats(struct sk_buff
*skb
,
1055 struct net_device
*dev
)
1057 const struct rtnl_link_stats64
*stats
;
1058 struct rtnl_link_stats64 temp
;
1059 struct nlattr
*attr
;
1061 stats
= dev_get_stats(dev
, &temp
);
1063 attr
= nla_reserve(skb
, IFLA_STATS
,
1064 sizeof(struct rtnl_link_stats
));
1068 copy_rtnl_link_stats(nla_data(attr
), stats
);
1070 attr
= nla_reserve(skb
, IFLA_STATS64
,
1071 sizeof(struct rtnl_link_stats64
));
1075 copy_rtnl_link_stats64(nla_data(attr
), stats
);
1080 static noinline_for_stack
int rtnl_fill_vfinfo(struct sk_buff
*skb
,
1081 struct net_device
*dev
,
1083 struct nlattr
*vfinfo
)
1085 struct ifla_vf_rss_query_en vf_rss_query_en
;
1086 struct ifla_vf_link_state vf_linkstate
;
1087 struct ifla_vf_spoofchk vf_spoofchk
;
1088 struct ifla_vf_tx_rate vf_tx_rate
;
1089 struct ifla_vf_stats vf_stats
;
1090 struct ifla_vf_trust vf_trust
;
1091 struct ifla_vf_vlan vf_vlan
;
1092 struct ifla_vf_rate vf_rate
;
1093 struct nlattr
*vf
, *vfstats
;
1094 struct ifla_vf_mac vf_mac
;
1095 struct ifla_vf_info ivi
;
1097 /* Not all SR-IOV capable drivers support the
1098 * spoofcheck and "RSS query enable" query. Preset to
1099 * -1 so the user space tool can detect that the driver
1100 * didn't report anything.
1103 ivi
.rss_query_en
= -1;
1105 memset(ivi
.mac
, 0, sizeof(ivi
.mac
));
1106 /* The default value for VF link state is "auto"
1107 * IFLA_VF_LINK_STATE_AUTO which equals zero
1110 if (dev
->netdev_ops
->ndo_get_vf_config(dev
, vfs_num
, &ivi
))
1119 vf_rss_query_en
.vf
=
1120 vf_trust
.vf
= ivi
.vf
;
1122 memcpy(vf_mac
.mac
, ivi
.mac
, sizeof(ivi
.mac
));
1123 vf_vlan
.vlan
= ivi
.vlan
;
1124 vf_vlan
.qos
= ivi
.qos
;
1125 vf_tx_rate
.rate
= ivi
.max_tx_rate
;
1126 vf_rate
.min_tx_rate
= ivi
.min_tx_rate
;
1127 vf_rate
.max_tx_rate
= ivi
.max_tx_rate
;
1128 vf_spoofchk
.setting
= ivi
.spoofchk
;
1129 vf_linkstate
.link_state
= ivi
.linkstate
;
1130 vf_rss_query_en
.setting
= ivi
.rss_query_en
;
1131 vf_trust
.setting
= ivi
.trusted
;
1132 vf
= nla_nest_start(skb
, IFLA_VF_INFO
);
1134 nla_nest_cancel(skb
, vfinfo
);
1137 if (nla_put(skb
, IFLA_VF_MAC
, sizeof(vf_mac
), &vf_mac
) ||
1138 nla_put(skb
, IFLA_VF_VLAN
, sizeof(vf_vlan
), &vf_vlan
) ||
1139 nla_put(skb
, IFLA_VF_RATE
, sizeof(vf_rate
),
1141 nla_put(skb
, IFLA_VF_TX_RATE
, sizeof(vf_tx_rate
),
1143 nla_put(skb
, IFLA_VF_SPOOFCHK
, sizeof(vf_spoofchk
),
1145 nla_put(skb
, IFLA_VF_LINK_STATE
, sizeof(vf_linkstate
),
1147 nla_put(skb
, IFLA_VF_RSS_QUERY_EN
,
1148 sizeof(vf_rss_query_en
),
1149 &vf_rss_query_en
) ||
1150 nla_put(skb
, IFLA_VF_TRUST
,
1151 sizeof(vf_trust
), &vf_trust
))
1153 memset(&vf_stats
, 0, sizeof(vf_stats
));
1154 if (dev
->netdev_ops
->ndo_get_vf_stats
)
1155 dev
->netdev_ops
->ndo_get_vf_stats(dev
, vfs_num
,
1157 vfstats
= nla_nest_start(skb
, IFLA_VF_STATS
);
1159 nla_nest_cancel(skb
, vf
);
1160 nla_nest_cancel(skb
, vfinfo
);
1163 if (nla_put_u64(skb
, IFLA_VF_STATS_RX_PACKETS
,
1164 vf_stats
.rx_packets
) ||
1165 nla_put_u64(skb
, IFLA_VF_STATS_TX_PACKETS
,
1166 vf_stats
.tx_packets
) ||
1167 nla_put_u64(skb
, IFLA_VF_STATS_RX_BYTES
,
1168 vf_stats
.rx_bytes
) ||
1169 nla_put_u64(skb
, IFLA_VF_STATS_TX_BYTES
,
1170 vf_stats
.tx_bytes
) ||
1171 nla_put_u64(skb
, IFLA_VF_STATS_BROADCAST
,
1172 vf_stats
.broadcast
) ||
1173 nla_put_u64(skb
, IFLA_VF_STATS_MULTICAST
,
1174 vf_stats
.multicast
))
1176 nla_nest_end(skb
, vfstats
);
1177 nla_nest_end(skb
, vf
);
1181 static int rtnl_fill_link_ifmap(struct sk_buff
*skb
, struct net_device
*dev
)
1183 struct rtnl_link_ifmap map
;
1185 memset(&map
, 0, sizeof(map
));
1186 map
.mem_start
= dev
->mem_start
;
1187 map
.mem_end
= dev
->mem_end
;
1188 map
.base_addr
= dev
->base_addr
;
1191 map
.port
= dev
->if_port
;
1193 if (nla_put(skb
, IFLA_MAP
, sizeof(map
), &map
))
1199 static int rtnl_fill_ifinfo(struct sk_buff
*skb
, struct net_device
*dev
,
1200 int type
, u32 pid
, u32 seq
, u32 change
,
1201 unsigned int flags
, u32 ext_filter_mask
)
1203 struct ifinfomsg
*ifm
;
1204 struct nlmsghdr
*nlh
;
1205 struct nlattr
*af_spec
;
1206 struct rtnl_af_ops
*af_ops
;
1207 struct net_device
*upper_dev
= netdev_master_upper_dev_get(dev
);
1210 nlh
= nlmsg_put(skb
, pid
, seq
, type
, sizeof(*ifm
), flags
);
1214 ifm
= nlmsg_data(nlh
);
1215 ifm
->ifi_family
= AF_UNSPEC
;
1217 ifm
->ifi_type
= dev
->type
;
1218 ifm
->ifi_index
= dev
->ifindex
;
1219 ifm
->ifi_flags
= dev_get_flags(dev
);
1220 ifm
->ifi_change
= change
;
1222 if (nla_put_string(skb
, IFLA_IFNAME
, dev
->name
) ||
1223 nla_put_u32(skb
, IFLA_TXQLEN
, dev
->tx_queue_len
) ||
1224 nla_put_u8(skb
, IFLA_OPERSTATE
,
1225 netif_running(dev
) ? dev
->operstate
: IF_OPER_DOWN
) ||
1226 nla_put_u8(skb
, IFLA_LINKMODE
, dev
->link_mode
) ||
1227 nla_put_u32(skb
, IFLA_MTU
, dev
->mtu
) ||
1228 nla_put_u32(skb
, IFLA_GROUP
, dev
->group
) ||
1229 nla_put_u32(skb
, IFLA_PROMISCUITY
, dev
->promiscuity
) ||
1230 nla_put_u32(skb
, IFLA_NUM_TX_QUEUES
, dev
->num_tx_queues
) ||
1231 nla_put_u32(skb
, IFLA_GSO_MAX_SEGS
, dev
->gso_max_segs
) ||
1232 nla_put_u32(skb
, IFLA_GSO_MAX_SIZE
, dev
->gso_max_size
) ||
1234 nla_put_u32(skb
, IFLA_NUM_RX_QUEUES
, dev
->num_rx_queues
) ||
1236 (dev
->ifindex
!= dev_get_iflink(dev
) &&
1237 nla_put_u32(skb
, IFLA_LINK
, dev_get_iflink(dev
))) ||
1239 nla_put_u32(skb
, IFLA_MASTER
, upper_dev
->ifindex
)) ||
1240 nla_put_u8(skb
, IFLA_CARRIER
, netif_carrier_ok(dev
)) ||
1242 nla_put_string(skb
, IFLA_QDISC
, dev
->qdisc
->ops
->id
)) ||
1244 nla_put_string(skb
, IFLA_IFALIAS
, dev
->ifalias
)) ||
1245 nla_put_u32(skb
, IFLA_CARRIER_CHANGES
,
1246 atomic_read(&dev
->carrier_changes
)) ||
1247 nla_put_u8(skb
, IFLA_PROTO_DOWN
, dev
->proto_down
))
1248 goto nla_put_failure
;
1250 if (rtnl_fill_link_ifmap(skb
, dev
))
1251 goto nla_put_failure
;
1253 if (dev
->addr_len
) {
1254 if (nla_put(skb
, IFLA_ADDRESS
, dev
->addr_len
, dev
->dev_addr
) ||
1255 nla_put(skb
, IFLA_BROADCAST
, dev
->addr_len
, dev
->broadcast
))
1256 goto nla_put_failure
;
1259 if (rtnl_phys_port_id_fill(skb
, dev
))
1260 goto nla_put_failure
;
1262 if (rtnl_phys_port_name_fill(skb
, dev
))
1263 goto nla_put_failure
;
1265 if (rtnl_phys_switch_id_fill(skb
, dev
))
1266 goto nla_put_failure
;
1268 if (rtnl_fill_stats(skb
, dev
))
1269 goto nla_put_failure
;
1271 if (dev
->dev
.parent
&& (ext_filter_mask
& RTEXT_FILTER_VF
) &&
1272 nla_put_u32(skb
, IFLA_NUM_VF
, dev_num_vf(dev
->dev
.parent
)))
1273 goto nla_put_failure
;
1275 if (dev
->netdev_ops
->ndo_get_vf_config
&& dev
->dev
.parent
&&
1276 ext_filter_mask
& RTEXT_FILTER_VF
) {
1278 struct nlattr
*vfinfo
;
1279 int num_vfs
= dev_num_vf(dev
->dev
.parent
);
1281 vfinfo
= nla_nest_start(skb
, IFLA_VFINFO_LIST
);
1283 goto nla_put_failure
;
1284 for (i
= 0; i
< num_vfs
; i
++) {
1285 if (rtnl_fill_vfinfo(skb
, dev
, i
, vfinfo
))
1286 goto nla_put_failure
;
1289 nla_nest_end(skb
, vfinfo
);
1292 if (rtnl_port_fill(skb
, dev
, ext_filter_mask
))
1293 goto nla_put_failure
;
1295 if (dev
->rtnl_link_ops
|| rtnl_have_link_slave_info(dev
)) {
1296 if (rtnl_link_fill(skb
, dev
) < 0)
1297 goto nla_put_failure
;
1300 if (dev
->rtnl_link_ops
&&
1301 dev
->rtnl_link_ops
->get_link_net
) {
1302 struct net
*link_net
= dev
->rtnl_link_ops
->get_link_net(dev
);
1304 if (!net_eq(dev_net(dev
), link_net
)) {
1305 int id
= peernet2id_alloc(dev_net(dev
), link_net
);
1307 if (nla_put_s32(skb
, IFLA_LINK_NETNSID
, id
))
1308 goto nla_put_failure
;
1312 if (!(af_spec
= nla_nest_start(skb
, IFLA_AF_SPEC
)))
1313 goto nla_put_failure
;
1315 list_for_each_entry(af_ops
, &rtnl_af_ops
, list
) {
1316 if (af_ops
->fill_link_af
) {
1320 if (!(af
= nla_nest_start(skb
, af_ops
->family
)))
1321 goto nla_put_failure
;
1323 err
= af_ops
->fill_link_af(skb
, dev
, ext_filter_mask
);
1326 * Caller may return ENODATA to indicate that there
1327 * was no data to be dumped. This is not an error, it
1328 * means we should trim the attribute header and
1331 if (err
== -ENODATA
)
1332 nla_nest_cancel(skb
, af
);
1334 goto nla_put_failure
;
1336 nla_nest_end(skb
, af
);
1340 nla_nest_end(skb
, af_spec
);
1342 nlmsg_end(skb
, nlh
);
1346 nlmsg_cancel(skb
, nlh
);
1350 static const struct nla_policy ifla_policy
[IFLA_MAX
+1] = {
1351 [IFLA_IFNAME
] = { .type
= NLA_STRING
, .len
= IFNAMSIZ
-1 },
1352 [IFLA_ADDRESS
] = { .type
= NLA_BINARY
, .len
= MAX_ADDR_LEN
},
1353 [IFLA_BROADCAST
] = { .type
= NLA_BINARY
, .len
= MAX_ADDR_LEN
},
1354 [IFLA_MAP
] = { .len
= sizeof(struct rtnl_link_ifmap
) },
1355 [IFLA_MTU
] = { .type
= NLA_U32
},
1356 [IFLA_LINK
] = { .type
= NLA_U32
},
1357 [IFLA_MASTER
] = { .type
= NLA_U32
},
1358 [IFLA_CARRIER
] = { .type
= NLA_U8
},
1359 [IFLA_TXQLEN
] = { .type
= NLA_U32
},
1360 [IFLA_WEIGHT
] = { .type
= NLA_U32
},
1361 [IFLA_OPERSTATE
] = { .type
= NLA_U8
},
1362 [IFLA_LINKMODE
] = { .type
= NLA_U8
},
1363 [IFLA_LINKINFO
] = { .type
= NLA_NESTED
},
1364 [IFLA_NET_NS_PID
] = { .type
= NLA_U32
},
1365 [IFLA_NET_NS_FD
] = { .type
= NLA_U32
},
1366 [IFLA_IFALIAS
] = { .type
= NLA_STRING
, .len
= IFALIASZ
-1 },
1367 [IFLA_VFINFO_LIST
] = {. type
= NLA_NESTED
},
1368 [IFLA_VF_PORTS
] = { .type
= NLA_NESTED
},
1369 [IFLA_PORT_SELF
] = { .type
= NLA_NESTED
},
1370 [IFLA_AF_SPEC
] = { .type
= NLA_NESTED
},
1371 [IFLA_EXT_MASK
] = { .type
= NLA_U32
},
1372 [IFLA_PROMISCUITY
] = { .type
= NLA_U32
},
1373 [IFLA_NUM_TX_QUEUES
] = { .type
= NLA_U32
},
1374 [IFLA_NUM_RX_QUEUES
] = { .type
= NLA_U32
},
1375 [IFLA_PHYS_PORT_ID
] = { .type
= NLA_BINARY
, .len
= MAX_PHYS_ITEM_ID_LEN
},
1376 [IFLA_CARRIER_CHANGES
] = { .type
= NLA_U32
}, /* ignored */
1377 [IFLA_PHYS_SWITCH_ID
] = { .type
= NLA_BINARY
, .len
= MAX_PHYS_ITEM_ID_LEN
},
1378 [IFLA_LINK_NETNSID
] = { .type
= NLA_S32
},
1379 [IFLA_PROTO_DOWN
] = { .type
= NLA_U8
},
1382 static const struct nla_policy ifla_info_policy
[IFLA_INFO_MAX
+1] = {
1383 [IFLA_INFO_KIND
] = { .type
= NLA_STRING
},
1384 [IFLA_INFO_DATA
] = { .type
= NLA_NESTED
},
1385 [IFLA_INFO_SLAVE_KIND
] = { .type
= NLA_STRING
},
1386 [IFLA_INFO_SLAVE_DATA
] = { .type
= NLA_NESTED
},
1389 static const struct nla_policy ifla_vf_policy
[IFLA_VF_MAX
+1] = {
1390 [IFLA_VF_MAC
] = { .len
= sizeof(struct ifla_vf_mac
) },
1391 [IFLA_VF_VLAN
] = { .len
= sizeof(struct ifla_vf_vlan
) },
1392 [IFLA_VF_TX_RATE
] = { .len
= sizeof(struct ifla_vf_tx_rate
) },
1393 [IFLA_VF_SPOOFCHK
] = { .len
= sizeof(struct ifla_vf_spoofchk
) },
1394 [IFLA_VF_RATE
] = { .len
= sizeof(struct ifla_vf_rate
) },
1395 [IFLA_VF_LINK_STATE
] = { .len
= sizeof(struct ifla_vf_link_state
) },
1396 [IFLA_VF_RSS_QUERY_EN
] = { .len
= sizeof(struct ifla_vf_rss_query_en
) },
1397 [IFLA_VF_STATS
] = { .type
= NLA_NESTED
},
1398 [IFLA_VF_TRUST
] = { .len
= sizeof(struct ifla_vf_trust
) },
1399 [IFLA_VF_IB_NODE_GUID
] = { .len
= sizeof(struct ifla_vf_guid
) },
1400 [IFLA_VF_IB_PORT_GUID
] = { .len
= sizeof(struct ifla_vf_guid
) },
1403 static const struct nla_policy ifla_port_policy
[IFLA_PORT_MAX
+1] = {
1404 [IFLA_PORT_VF
] = { .type
= NLA_U32
},
1405 [IFLA_PORT_PROFILE
] = { .type
= NLA_STRING
,
1406 .len
= PORT_PROFILE_MAX
},
1407 [IFLA_PORT_VSI_TYPE
] = { .type
= NLA_BINARY
,
1408 .len
= sizeof(struct ifla_port_vsi
)},
1409 [IFLA_PORT_INSTANCE_UUID
] = { .type
= NLA_BINARY
,
1410 .len
= PORT_UUID_MAX
},
1411 [IFLA_PORT_HOST_UUID
] = { .type
= NLA_STRING
,
1412 .len
= PORT_UUID_MAX
},
1413 [IFLA_PORT_REQUEST
] = { .type
= NLA_U8
, },
1414 [IFLA_PORT_RESPONSE
] = { .type
= NLA_U16
, },
1417 static const struct rtnl_link_ops
*linkinfo_to_kind_ops(const struct nlattr
*nla
)
1419 const struct rtnl_link_ops
*ops
= NULL
;
1420 struct nlattr
*linfo
[IFLA_INFO_MAX
+ 1];
1422 if (nla_parse_nested(linfo
, IFLA_INFO_MAX
, nla
, ifla_info_policy
) < 0)
1425 if (linfo
[IFLA_INFO_KIND
]) {
1426 char kind
[MODULE_NAME_LEN
];
1428 nla_strlcpy(kind
, linfo
[IFLA_INFO_KIND
], sizeof(kind
));
1429 ops
= rtnl_link_ops_get(kind
);
1435 static bool link_master_filtered(struct net_device
*dev
, int master_idx
)
1437 struct net_device
*master
;
1442 master
= netdev_master_upper_dev_get(dev
);
1443 if (!master
|| master
->ifindex
!= master_idx
)
1449 static bool link_kind_filtered(const struct net_device
*dev
,
1450 const struct rtnl_link_ops
*kind_ops
)
1452 if (kind_ops
&& dev
->rtnl_link_ops
!= kind_ops
)
1458 static bool link_dump_filtered(struct net_device
*dev
,
1460 const struct rtnl_link_ops
*kind_ops
)
1462 if (link_master_filtered(dev
, master_idx
) ||
1463 link_kind_filtered(dev
, kind_ops
))
1469 static int rtnl_dump_ifinfo(struct sk_buff
*skb
, struct netlink_callback
*cb
)
1471 struct net
*net
= sock_net(skb
->sk
);
1474 struct net_device
*dev
;
1475 struct hlist_head
*head
;
1476 struct nlattr
*tb
[IFLA_MAX
+1];
1477 u32 ext_filter_mask
= 0;
1478 const struct rtnl_link_ops
*kind_ops
= NULL
;
1479 unsigned int flags
= NLM_F_MULTI
;
1485 s_idx
= cb
->args
[1];
1487 cb
->seq
= net
->dev_base_seq
;
1489 /* A hack to preserve kernel<->userspace interface.
1490 * The correct header is ifinfomsg. It is consistent with rtnl_getlink.
1491 * However, before Linux v3.9 the code here assumed rtgenmsg and that's
1492 * what iproute2 < v3.9.0 used.
1493 * We can detect the old iproute2. Even including the IFLA_EXT_MASK
1494 * attribute, its netlink message is shorter than struct ifinfomsg.
1496 hdrlen
= nlmsg_len(cb
->nlh
) < sizeof(struct ifinfomsg
) ?
1497 sizeof(struct rtgenmsg
) : sizeof(struct ifinfomsg
);
1499 if (nlmsg_parse(cb
->nlh
, hdrlen
, tb
, IFLA_MAX
, ifla_policy
) >= 0) {
1501 if (tb
[IFLA_EXT_MASK
])
1502 ext_filter_mask
= nla_get_u32(tb
[IFLA_EXT_MASK
]);
1504 if (tb
[IFLA_MASTER
])
1505 master_idx
= nla_get_u32(tb
[IFLA_MASTER
]);
1507 if (tb
[IFLA_LINKINFO
])
1508 kind_ops
= linkinfo_to_kind_ops(tb
[IFLA_LINKINFO
]);
1510 if (master_idx
|| kind_ops
)
1511 flags
|= NLM_F_DUMP_FILTERED
;
1514 for (h
= s_h
; h
< NETDEV_HASHENTRIES
; h
++, s_idx
= 0) {
1516 head
= &net
->dev_index_head
[h
];
1517 hlist_for_each_entry(dev
, head
, index_hlist
) {
1518 if (link_dump_filtered(dev
, master_idx
, kind_ops
))
1522 err
= rtnl_fill_ifinfo(skb
, dev
, RTM_NEWLINK
,
1523 NETLINK_CB(cb
->skb
).portid
,
1524 cb
->nlh
->nlmsg_seq
, 0,
1527 /* If we ran out of room on the first message,
1530 WARN_ON((err
== -EMSGSIZE
) && (skb
->len
== 0));
1535 nl_dump_check_consistent(cb
, nlmsg_hdr(skb
));
1547 int rtnl_nla_parse_ifla(struct nlattr
**tb
, const struct nlattr
*head
, int len
)
1549 return nla_parse(tb
, IFLA_MAX
, head
, len
, ifla_policy
);
1551 EXPORT_SYMBOL(rtnl_nla_parse_ifla
);
1553 struct net
*rtnl_link_get_net(struct net
*src_net
, struct nlattr
*tb
[])
1556 /* Examine the link attributes and figure out which
1557 * network namespace we are talking about.
1559 if (tb
[IFLA_NET_NS_PID
])
1560 net
= get_net_ns_by_pid(nla_get_u32(tb
[IFLA_NET_NS_PID
]));
1561 else if (tb
[IFLA_NET_NS_FD
])
1562 net
= get_net_ns_by_fd(nla_get_u32(tb
[IFLA_NET_NS_FD
]));
1564 net
= get_net(src_net
);
1567 EXPORT_SYMBOL(rtnl_link_get_net
);
1569 static int validate_linkmsg(struct net_device
*dev
, struct nlattr
*tb
[])
1572 if (tb
[IFLA_ADDRESS
] &&
1573 nla_len(tb
[IFLA_ADDRESS
]) < dev
->addr_len
)
1576 if (tb
[IFLA_BROADCAST
] &&
1577 nla_len(tb
[IFLA_BROADCAST
]) < dev
->addr_len
)
1581 if (tb
[IFLA_AF_SPEC
]) {
1585 nla_for_each_nested(af
, tb
[IFLA_AF_SPEC
], rem
) {
1586 const struct rtnl_af_ops
*af_ops
;
1588 if (!(af_ops
= rtnl_af_lookup(nla_type(af
))))
1589 return -EAFNOSUPPORT
;
1591 if (!af_ops
->set_link_af
)
1594 if (af_ops
->validate_link_af
) {
1595 err
= af_ops
->validate_link_af(dev
, af
);
1605 static int handle_infiniband_guid(struct net_device
*dev
, struct ifla_vf_guid
*ivt
,
1608 const struct net_device_ops
*ops
= dev
->netdev_ops
;
1610 return ops
->ndo_set_vf_guid(dev
, ivt
->vf
, ivt
->guid
, guid_type
);
1613 static int handle_vf_guid(struct net_device
*dev
, struct ifla_vf_guid
*ivt
, int guid_type
)
1615 if (dev
->type
!= ARPHRD_INFINIBAND
)
1618 return handle_infiniband_guid(dev
, ivt
, guid_type
);
1621 static int do_setvfinfo(struct net_device
*dev
, struct nlattr
**tb
)
1623 const struct net_device_ops
*ops
= dev
->netdev_ops
;
1626 if (tb
[IFLA_VF_MAC
]) {
1627 struct ifla_vf_mac
*ivm
= nla_data(tb
[IFLA_VF_MAC
]);
1630 if (ops
->ndo_set_vf_mac
)
1631 err
= ops
->ndo_set_vf_mac(dev
, ivm
->vf
,
1637 if (tb
[IFLA_VF_VLAN
]) {
1638 struct ifla_vf_vlan
*ivv
= nla_data(tb
[IFLA_VF_VLAN
]);
1641 if (ops
->ndo_set_vf_vlan
)
1642 err
= ops
->ndo_set_vf_vlan(dev
, ivv
->vf
, ivv
->vlan
,
1648 if (tb
[IFLA_VF_TX_RATE
]) {
1649 struct ifla_vf_tx_rate
*ivt
= nla_data(tb
[IFLA_VF_TX_RATE
]);
1650 struct ifla_vf_info ivf
;
1653 if (ops
->ndo_get_vf_config
)
1654 err
= ops
->ndo_get_vf_config(dev
, ivt
->vf
, &ivf
);
1659 if (ops
->ndo_set_vf_rate
)
1660 err
= ops
->ndo_set_vf_rate(dev
, ivt
->vf
,
1667 if (tb
[IFLA_VF_RATE
]) {
1668 struct ifla_vf_rate
*ivt
= nla_data(tb
[IFLA_VF_RATE
]);
1671 if (ops
->ndo_set_vf_rate
)
1672 err
= ops
->ndo_set_vf_rate(dev
, ivt
->vf
,
1679 if (tb
[IFLA_VF_SPOOFCHK
]) {
1680 struct ifla_vf_spoofchk
*ivs
= nla_data(tb
[IFLA_VF_SPOOFCHK
]);
1683 if (ops
->ndo_set_vf_spoofchk
)
1684 err
= ops
->ndo_set_vf_spoofchk(dev
, ivs
->vf
,
1690 if (tb
[IFLA_VF_LINK_STATE
]) {
1691 struct ifla_vf_link_state
*ivl
= nla_data(tb
[IFLA_VF_LINK_STATE
]);
1694 if (ops
->ndo_set_vf_link_state
)
1695 err
= ops
->ndo_set_vf_link_state(dev
, ivl
->vf
,
1701 if (tb
[IFLA_VF_RSS_QUERY_EN
]) {
1702 struct ifla_vf_rss_query_en
*ivrssq_en
;
1705 ivrssq_en
= nla_data(tb
[IFLA_VF_RSS_QUERY_EN
]);
1706 if (ops
->ndo_set_vf_rss_query_en
)
1707 err
= ops
->ndo_set_vf_rss_query_en(dev
, ivrssq_en
->vf
,
1708 ivrssq_en
->setting
);
1713 if (tb
[IFLA_VF_TRUST
]) {
1714 struct ifla_vf_trust
*ivt
= nla_data(tb
[IFLA_VF_TRUST
]);
1717 if (ops
->ndo_set_vf_trust
)
1718 err
= ops
->ndo_set_vf_trust(dev
, ivt
->vf
, ivt
->setting
);
1723 if (tb
[IFLA_VF_IB_NODE_GUID
]) {
1724 struct ifla_vf_guid
*ivt
= nla_data(tb
[IFLA_VF_IB_NODE_GUID
]);
1726 if (!ops
->ndo_set_vf_guid
)
1729 return handle_vf_guid(dev
, ivt
, IFLA_VF_IB_NODE_GUID
);
1732 if (tb
[IFLA_VF_IB_PORT_GUID
]) {
1733 struct ifla_vf_guid
*ivt
= nla_data(tb
[IFLA_VF_IB_PORT_GUID
]);
1735 if (!ops
->ndo_set_vf_guid
)
1738 return handle_vf_guid(dev
, ivt
, IFLA_VF_IB_PORT_GUID
);
1744 static int do_set_master(struct net_device
*dev
, int ifindex
)
1746 struct net_device
*upper_dev
= netdev_master_upper_dev_get(dev
);
1747 const struct net_device_ops
*ops
;
1751 if (upper_dev
->ifindex
== ifindex
)
1753 ops
= upper_dev
->netdev_ops
;
1754 if (ops
->ndo_del_slave
) {
1755 err
= ops
->ndo_del_slave(upper_dev
, dev
);
1764 upper_dev
= __dev_get_by_index(dev_net(dev
), ifindex
);
1767 ops
= upper_dev
->netdev_ops
;
1768 if (ops
->ndo_add_slave
) {
1769 err
= ops
->ndo_add_slave(upper_dev
, dev
);
1779 #define DO_SETLINK_MODIFIED 0x01
1780 /* notify flag means notify + modified. */
1781 #define DO_SETLINK_NOTIFY 0x03
1782 static int do_setlink(const struct sk_buff
*skb
,
1783 struct net_device
*dev
, struct ifinfomsg
*ifm
,
1784 struct nlattr
**tb
, char *ifname
, int status
)
1786 const struct net_device_ops
*ops
= dev
->netdev_ops
;
1789 if (tb
[IFLA_NET_NS_PID
] || tb
[IFLA_NET_NS_FD
]) {
1790 struct net
*net
= rtnl_link_get_net(dev_net(dev
), tb
);
1795 if (!netlink_ns_capable(skb
, net
->user_ns
, CAP_NET_ADMIN
)) {
1800 err
= dev_change_net_namespace(dev
, net
, ifname
);
1804 status
|= DO_SETLINK_MODIFIED
;
1808 struct rtnl_link_ifmap
*u_map
;
1811 if (!ops
->ndo_set_config
) {
1816 if (!netif_device_present(dev
)) {
1821 u_map
= nla_data(tb
[IFLA_MAP
]);
1822 k_map
.mem_start
= (unsigned long) u_map
->mem_start
;
1823 k_map
.mem_end
= (unsigned long) u_map
->mem_end
;
1824 k_map
.base_addr
= (unsigned short) u_map
->base_addr
;
1825 k_map
.irq
= (unsigned char) u_map
->irq
;
1826 k_map
.dma
= (unsigned char) u_map
->dma
;
1827 k_map
.port
= (unsigned char) u_map
->port
;
1829 err
= ops
->ndo_set_config(dev
, &k_map
);
1833 status
|= DO_SETLINK_NOTIFY
;
1836 if (tb
[IFLA_ADDRESS
]) {
1837 struct sockaddr
*sa
;
1840 len
= sizeof(sa_family_t
) + dev
->addr_len
;
1841 sa
= kmalloc(len
, GFP_KERNEL
);
1846 sa
->sa_family
= dev
->type
;
1847 memcpy(sa
->sa_data
, nla_data(tb
[IFLA_ADDRESS
]),
1849 err
= dev_set_mac_address(dev
, sa
);
1853 status
|= DO_SETLINK_MODIFIED
;
1857 err
= dev_set_mtu(dev
, nla_get_u32(tb
[IFLA_MTU
]));
1860 status
|= DO_SETLINK_MODIFIED
;
1863 if (tb
[IFLA_GROUP
]) {
1864 dev_set_group(dev
, nla_get_u32(tb
[IFLA_GROUP
]));
1865 status
|= DO_SETLINK_NOTIFY
;
1869 * Interface selected by interface index but interface
1870 * name provided implies that a name change has been
1873 if (ifm
->ifi_index
> 0 && ifname
[0]) {
1874 err
= dev_change_name(dev
, ifname
);
1877 status
|= DO_SETLINK_MODIFIED
;
1880 if (tb
[IFLA_IFALIAS
]) {
1881 err
= dev_set_alias(dev
, nla_data(tb
[IFLA_IFALIAS
]),
1882 nla_len(tb
[IFLA_IFALIAS
]));
1885 status
|= DO_SETLINK_NOTIFY
;
1888 if (tb
[IFLA_BROADCAST
]) {
1889 nla_memcpy(dev
->broadcast
, tb
[IFLA_BROADCAST
], dev
->addr_len
);
1890 call_netdevice_notifiers(NETDEV_CHANGEADDR
, dev
);
1893 if (ifm
->ifi_flags
|| ifm
->ifi_change
) {
1894 err
= dev_change_flags(dev
, rtnl_dev_combine_flags(dev
, ifm
));
1899 if (tb
[IFLA_MASTER
]) {
1900 err
= do_set_master(dev
, nla_get_u32(tb
[IFLA_MASTER
]));
1903 status
|= DO_SETLINK_MODIFIED
;
1906 if (tb
[IFLA_CARRIER
]) {
1907 err
= dev_change_carrier(dev
, nla_get_u8(tb
[IFLA_CARRIER
]));
1910 status
|= DO_SETLINK_MODIFIED
;
1913 if (tb
[IFLA_TXQLEN
]) {
1914 unsigned long value
= nla_get_u32(tb
[IFLA_TXQLEN
]);
1916 if (dev
->tx_queue_len
^ value
)
1917 status
|= DO_SETLINK_NOTIFY
;
1919 dev
->tx_queue_len
= value
;
1922 if (tb
[IFLA_OPERSTATE
])
1923 set_operstate(dev
, nla_get_u8(tb
[IFLA_OPERSTATE
]));
1925 if (tb
[IFLA_LINKMODE
]) {
1926 unsigned char value
= nla_get_u8(tb
[IFLA_LINKMODE
]);
1928 write_lock_bh(&dev_base_lock
);
1929 if (dev
->link_mode
^ value
)
1930 status
|= DO_SETLINK_NOTIFY
;
1931 dev
->link_mode
= value
;
1932 write_unlock_bh(&dev_base_lock
);
1935 if (tb
[IFLA_VFINFO_LIST
]) {
1936 struct nlattr
*vfinfo
[IFLA_VF_MAX
+ 1];
1937 struct nlattr
*attr
;
1940 nla_for_each_nested(attr
, tb
[IFLA_VFINFO_LIST
], rem
) {
1941 if (nla_type(attr
) != IFLA_VF_INFO
||
1942 nla_len(attr
) < NLA_HDRLEN
) {
1946 err
= nla_parse_nested(vfinfo
, IFLA_VF_MAX
, attr
,
1950 err
= do_setvfinfo(dev
, vfinfo
);
1953 status
|= DO_SETLINK_NOTIFY
;
1958 if (tb
[IFLA_VF_PORTS
]) {
1959 struct nlattr
*port
[IFLA_PORT_MAX
+1];
1960 struct nlattr
*attr
;
1965 if (!ops
->ndo_set_vf_port
)
1968 nla_for_each_nested(attr
, tb
[IFLA_VF_PORTS
], rem
) {
1969 if (nla_type(attr
) != IFLA_VF_PORT
||
1970 nla_len(attr
) < NLA_HDRLEN
) {
1974 err
= nla_parse_nested(port
, IFLA_PORT_MAX
, attr
,
1978 if (!port
[IFLA_PORT_VF
]) {
1982 vf
= nla_get_u32(port
[IFLA_PORT_VF
]);
1983 err
= ops
->ndo_set_vf_port(dev
, vf
, port
);
1986 status
|= DO_SETLINK_NOTIFY
;
1991 if (tb
[IFLA_PORT_SELF
]) {
1992 struct nlattr
*port
[IFLA_PORT_MAX
+1];
1994 err
= nla_parse_nested(port
, IFLA_PORT_MAX
,
1995 tb
[IFLA_PORT_SELF
], ifla_port_policy
);
2000 if (ops
->ndo_set_vf_port
)
2001 err
= ops
->ndo_set_vf_port(dev
, PORT_SELF_VF
, port
);
2004 status
|= DO_SETLINK_NOTIFY
;
2007 if (tb
[IFLA_AF_SPEC
]) {
2011 nla_for_each_nested(af
, tb
[IFLA_AF_SPEC
], rem
) {
2012 const struct rtnl_af_ops
*af_ops
;
2014 if (!(af_ops
= rtnl_af_lookup(nla_type(af
))))
2017 err
= af_ops
->set_link_af(dev
, af
);
2021 status
|= DO_SETLINK_NOTIFY
;
2026 if (tb
[IFLA_PROTO_DOWN
]) {
2027 err
= dev_change_proto_down(dev
,
2028 nla_get_u8(tb
[IFLA_PROTO_DOWN
]));
2031 status
|= DO_SETLINK_NOTIFY
;
2035 if (status
& DO_SETLINK_MODIFIED
) {
2036 if (status
& DO_SETLINK_NOTIFY
)
2037 netdev_state_change(dev
);
2040 net_warn_ratelimited("A link change request failed with some changes committed already. Interface %s may have been left with an inconsistent configuration, please check.\n",
2047 static int rtnl_setlink(struct sk_buff
*skb
, struct nlmsghdr
*nlh
)
2049 struct net
*net
= sock_net(skb
->sk
);
2050 struct ifinfomsg
*ifm
;
2051 struct net_device
*dev
;
2053 struct nlattr
*tb
[IFLA_MAX
+1];
2054 char ifname
[IFNAMSIZ
];
2056 err
= nlmsg_parse(nlh
, sizeof(*ifm
), tb
, IFLA_MAX
, ifla_policy
);
2060 if (tb
[IFLA_IFNAME
])
2061 nla_strlcpy(ifname
, tb
[IFLA_IFNAME
], IFNAMSIZ
);
2066 ifm
= nlmsg_data(nlh
);
2067 if (ifm
->ifi_index
> 0)
2068 dev
= __dev_get_by_index(net
, ifm
->ifi_index
);
2069 else if (tb
[IFLA_IFNAME
])
2070 dev
= __dev_get_by_name(net
, ifname
);
2079 err
= validate_linkmsg(dev
, tb
);
2083 err
= do_setlink(skb
, dev
, ifm
, tb
, ifname
, 0);
2088 static int rtnl_group_dellink(const struct net
*net
, int group
)
2090 struct net_device
*dev
, *aux
;
2091 LIST_HEAD(list_kill
);
2097 for_each_netdev(net
, dev
) {
2098 if (dev
->group
== group
) {
2099 const struct rtnl_link_ops
*ops
;
2102 ops
= dev
->rtnl_link_ops
;
2103 if (!ops
|| !ops
->dellink
)
2111 for_each_netdev_safe(net
, dev
, aux
) {
2112 if (dev
->group
== group
) {
2113 const struct rtnl_link_ops
*ops
;
2115 ops
= dev
->rtnl_link_ops
;
2116 ops
->dellink(dev
, &list_kill
);
2119 unregister_netdevice_many(&list_kill
);
2124 int rtnl_delete_link(struct net_device
*dev
)
2126 const struct rtnl_link_ops
*ops
;
2127 LIST_HEAD(list_kill
);
2129 ops
= dev
->rtnl_link_ops
;
2130 if (!ops
|| !ops
->dellink
)
2133 ops
->dellink(dev
, &list_kill
);
2134 unregister_netdevice_many(&list_kill
);
2138 EXPORT_SYMBOL_GPL(rtnl_delete_link
);
2140 static int rtnl_dellink(struct sk_buff
*skb
, struct nlmsghdr
*nlh
)
2142 struct net
*net
= sock_net(skb
->sk
);
2143 struct net_device
*dev
;
2144 struct ifinfomsg
*ifm
;
2145 char ifname
[IFNAMSIZ
];
2146 struct nlattr
*tb
[IFLA_MAX
+1];
2149 err
= nlmsg_parse(nlh
, sizeof(*ifm
), tb
, IFLA_MAX
, ifla_policy
);
2153 if (tb
[IFLA_IFNAME
])
2154 nla_strlcpy(ifname
, tb
[IFLA_IFNAME
], IFNAMSIZ
);
2156 ifm
= nlmsg_data(nlh
);
2157 if (ifm
->ifi_index
> 0)
2158 dev
= __dev_get_by_index(net
, ifm
->ifi_index
);
2159 else if (tb
[IFLA_IFNAME
])
2160 dev
= __dev_get_by_name(net
, ifname
);
2161 else if (tb
[IFLA_GROUP
])
2162 return rtnl_group_dellink(net
, nla_get_u32(tb
[IFLA_GROUP
]));
2169 return rtnl_delete_link(dev
);
2172 int rtnl_configure_link(struct net_device
*dev
, const struct ifinfomsg
*ifm
)
2174 unsigned int old_flags
;
2177 old_flags
= dev
->flags
;
2178 if (ifm
&& (ifm
->ifi_flags
|| ifm
->ifi_change
)) {
2179 err
= __dev_change_flags(dev
, rtnl_dev_combine_flags(dev
, ifm
));
2184 dev
->rtnl_link_state
= RTNL_LINK_INITIALIZED
;
2186 __dev_notify_flags(dev
, old_flags
, ~0U);
2189 EXPORT_SYMBOL(rtnl_configure_link
);
2191 struct net_device
*rtnl_create_link(struct net
*net
,
2192 const char *ifname
, unsigned char name_assign_type
,
2193 const struct rtnl_link_ops
*ops
, struct nlattr
*tb
[])
2196 struct net_device
*dev
;
2197 unsigned int num_tx_queues
= 1;
2198 unsigned int num_rx_queues
= 1;
2200 if (tb
[IFLA_NUM_TX_QUEUES
])
2201 num_tx_queues
= nla_get_u32(tb
[IFLA_NUM_TX_QUEUES
]);
2202 else if (ops
->get_num_tx_queues
)
2203 num_tx_queues
= ops
->get_num_tx_queues();
2205 if (tb
[IFLA_NUM_RX_QUEUES
])
2206 num_rx_queues
= nla_get_u32(tb
[IFLA_NUM_RX_QUEUES
]);
2207 else if (ops
->get_num_rx_queues
)
2208 num_rx_queues
= ops
->get_num_rx_queues();
2211 dev
= alloc_netdev_mqs(ops
->priv_size
, ifname
, name_assign_type
,
2212 ops
->setup
, num_tx_queues
, num_rx_queues
);
2216 dev_net_set(dev
, net
);
2217 dev
->rtnl_link_ops
= ops
;
2218 dev
->rtnl_link_state
= RTNL_LINK_INITIALIZING
;
2221 dev
->mtu
= nla_get_u32(tb
[IFLA_MTU
]);
2222 if (tb
[IFLA_ADDRESS
]) {
2223 memcpy(dev
->dev_addr
, nla_data(tb
[IFLA_ADDRESS
]),
2224 nla_len(tb
[IFLA_ADDRESS
]));
2225 dev
->addr_assign_type
= NET_ADDR_SET
;
2227 if (tb
[IFLA_BROADCAST
])
2228 memcpy(dev
->broadcast
, nla_data(tb
[IFLA_BROADCAST
]),
2229 nla_len(tb
[IFLA_BROADCAST
]));
2230 if (tb
[IFLA_TXQLEN
])
2231 dev
->tx_queue_len
= nla_get_u32(tb
[IFLA_TXQLEN
]);
2232 if (tb
[IFLA_OPERSTATE
])
2233 set_operstate(dev
, nla_get_u8(tb
[IFLA_OPERSTATE
]));
2234 if (tb
[IFLA_LINKMODE
])
2235 dev
->link_mode
= nla_get_u8(tb
[IFLA_LINKMODE
]);
2237 dev_set_group(dev
, nla_get_u32(tb
[IFLA_GROUP
]));
2242 return ERR_PTR(err
);
2244 EXPORT_SYMBOL(rtnl_create_link
);
2246 static int rtnl_group_changelink(const struct sk_buff
*skb
,
2247 struct net
*net
, int group
,
2248 struct ifinfomsg
*ifm
,
2251 struct net_device
*dev
, *aux
;
2254 for_each_netdev_safe(net
, dev
, aux
) {
2255 if (dev
->group
== group
) {
2256 err
= do_setlink(skb
, dev
, ifm
, tb
, NULL
, 0);
2265 static int rtnl_newlink(struct sk_buff
*skb
, struct nlmsghdr
*nlh
)
2267 struct net
*net
= sock_net(skb
->sk
);
2268 const struct rtnl_link_ops
*ops
;
2269 const struct rtnl_link_ops
*m_ops
= NULL
;
2270 struct net_device
*dev
;
2271 struct net_device
*master_dev
= NULL
;
2272 struct ifinfomsg
*ifm
;
2273 char kind
[MODULE_NAME_LEN
];
2274 char ifname
[IFNAMSIZ
];
2275 struct nlattr
*tb
[IFLA_MAX
+1];
2276 struct nlattr
*linkinfo
[IFLA_INFO_MAX
+1];
2277 unsigned char name_assign_type
= NET_NAME_USER
;
2280 #ifdef CONFIG_MODULES
2283 err
= nlmsg_parse(nlh
, sizeof(*ifm
), tb
, IFLA_MAX
, ifla_policy
);
2287 if (tb
[IFLA_IFNAME
])
2288 nla_strlcpy(ifname
, tb
[IFLA_IFNAME
], IFNAMSIZ
);
2292 ifm
= nlmsg_data(nlh
);
2293 if (ifm
->ifi_index
> 0)
2294 dev
= __dev_get_by_index(net
, ifm
->ifi_index
);
2297 dev
= __dev_get_by_name(net
, ifname
);
2303 master_dev
= netdev_master_upper_dev_get(dev
);
2305 m_ops
= master_dev
->rtnl_link_ops
;
2308 err
= validate_linkmsg(dev
, tb
);
2312 if (tb
[IFLA_LINKINFO
]) {
2313 err
= nla_parse_nested(linkinfo
, IFLA_INFO_MAX
,
2314 tb
[IFLA_LINKINFO
], ifla_info_policy
);
2318 memset(linkinfo
, 0, sizeof(linkinfo
));
2320 if (linkinfo
[IFLA_INFO_KIND
]) {
2321 nla_strlcpy(kind
, linkinfo
[IFLA_INFO_KIND
], sizeof(kind
));
2322 ops
= rtnl_link_ops_get(kind
);
2329 struct nlattr
*attr
[ops
? ops
->maxtype
+ 1 : 1];
2330 struct nlattr
*slave_attr
[m_ops
? m_ops
->slave_maxtype
+ 1 : 1];
2331 struct nlattr
**data
= NULL
;
2332 struct nlattr
**slave_data
= NULL
;
2333 struct net
*dest_net
, *link_net
= NULL
;
2336 if (ops
->maxtype
&& linkinfo
[IFLA_INFO_DATA
]) {
2337 err
= nla_parse_nested(attr
, ops
->maxtype
,
2338 linkinfo
[IFLA_INFO_DATA
],
2344 if (ops
->validate
) {
2345 err
= ops
->validate(tb
, data
);
2352 if (m_ops
->slave_maxtype
&&
2353 linkinfo
[IFLA_INFO_SLAVE_DATA
]) {
2354 err
= nla_parse_nested(slave_attr
,
2355 m_ops
->slave_maxtype
,
2356 linkinfo
[IFLA_INFO_SLAVE_DATA
],
2357 m_ops
->slave_policy
);
2360 slave_data
= slave_attr
;
2362 if (m_ops
->slave_validate
) {
2363 err
= m_ops
->slave_validate(tb
, slave_data
);
2372 if (nlh
->nlmsg_flags
& NLM_F_EXCL
)
2374 if (nlh
->nlmsg_flags
& NLM_F_REPLACE
)
2377 if (linkinfo
[IFLA_INFO_DATA
]) {
2378 if (!ops
|| ops
!= dev
->rtnl_link_ops
||
2382 err
= ops
->changelink(dev
, tb
, data
);
2385 status
|= DO_SETLINK_NOTIFY
;
2388 if (linkinfo
[IFLA_INFO_SLAVE_DATA
]) {
2389 if (!m_ops
|| !m_ops
->slave_changelink
)
2392 err
= m_ops
->slave_changelink(master_dev
, dev
,
2396 status
|= DO_SETLINK_NOTIFY
;
2399 return do_setlink(skb
, dev
, ifm
, tb
, ifname
, status
);
2402 if (!(nlh
->nlmsg_flags
& NLM_F_CREATE
)) {
2403 if (ifm
->ifi_index
== 0 && tb
[IFLA_GROUP
])
2404 return rtnl_group_changelink(skb
, net
,
2405 nla_get_u32(tb
[IFLA_GROUP
]),
2410 if (tb
[IFLA_MAP
] || tb
[IFLA_MASTER
] || tb
[IFLA_PROTINFO
])
2414 #ifdef CONFIG_MODULES
2417 request_module("rtnl-link-%s", kind
);
2419 ops
= rtnl_link_ops_get(kind
);
2431 snprintf(ifname
, IFNAMSIZ
, "%s%%d", ops
->kind
);
2432 name_assign_type
= NET_NAME_ENUM
;
2435 dest_net
= rtnl_link_get_net(net
, tb
);
2436 if (IS_ERR(dest_net
))
2437 return PTR_ERR(dest_net
);
2440 if (!netlink_ns_capable(skb
, dest_net
->user_ns
, CAP_NET_ADMIN
))
2443 if (tb
[IFLA_LINK_NETNSID
]) {
2444 int id
= nla_get_s32(tb
[IFLA_LINK_NETNSID
]);
2446 link_net
= get_net_ns_by_id(dest_net
, id
);
2452 if (!netlink_ns_capable(skb
, link_net
->user_ns
, CAP_NET_ADMIN
))
2456 dev
= rtnl_create_link(link_net
? : dest_net
, ifname
,
2457 name_assign_type
, ops
, tb
);
2463 dev
->ifindex
= ifm
->ifi_index
;
2466 err
= ops
->newlink(link_net
? : net
, dev
, tb
, data
);
2467 /* Drivers should call free_netdev() in ->destructor
2468 * and unregister it on failure after registration
2469 * so that device could be finally freed in rtnl_unlock.
2472 /* If device is not registered at all, free it now */
2473 if (dev
->reg_state
== NETREG_UNINITIALIZED
)
2478 err
= register_netdevice(dev
);
2484 err
= rtnl_configure_link(dev
, ifm
);
2486 goto out_unregister
;
2488 err
= dev_change_net_namespace(dev
, dest_net
, ifname
);
2490 goto out_unregister
;
2499 LIST_HEAD(list_kill
);
2501 ops
->dellink(dev
, &list_kill
);
2502 unregister_netdevice_many(&list_kill
);
2504 unregister_netdevice(dev
);
2510 static int rtnl_getlink(struct sk_buff
*skb
, struct nlmsghdr
* nlh
)
2512 struct net
*net
= sock_net(skb
->sk
);
2513 struct ifinfomsg
*ifm
;
2514 char ifname
[IFNAMSIZ
];
2515 struct nlattr
*tb
[IFLA_MAX
+1];
2516 struct net_device
*dev
= NULL
;
2517 struct sk_buff
*nskb
;
2519 u32 ext_filter_mask
= 0;
2521 err
= nlmsg_parse(nlh
, sizeof(*ifm
), tb
, IFLA_MAX
, ifla_policy
);
2525 if (tb
[IFLA_IFNAME
])
2526 nla_strlcpy(ifname
, tb
[IFLA_IFNAME
], IFNAMSIZ
);
2528 if (tb
[IFLA_EXT_MASK
])
2529 ext_filter_mask
= nla_get_u32(tb
[IFLA_EXT_MASK
]);
2531 ifm
= nlmsg_data(nlh
);
2532 if (ifm
->ifi_index
> 0)
2533 dev
= __dev_get_by_index(net
, ifm
->ifi_index
);
2534 else if (tb
[IFLA_IFNAME
])
2535 dev
= __dev_get_by_name(net
, ifname
);
2542 nskb
= nlmsg_new(if_nlmsg_size(dev
, ext_filter_mask
), GFP_KERNEL
);
2546 err
= rtnl_fill_ifinfo(nskb
, dev
, RTM_NEWLINK
, NETLINK_CB(skb
).portid
,
2547 nlh
->nlmsg_seq
, 0, 0, ext_filter_mask
);
2549 /* -EMSGSIZE implies BUG in if_nlmsg_size */
2550 WARN_ON(err
== -EMSGSIZE
);
2553 err
= rtnl_unicast(nskb
, net
, NETLINK_CB(skb
).portid
);
2558 static u16
rtnl_calcit(struct sk_buff
*skb
, struct nlmsghdr
*nlh
)
2560 struct net
*net
= sock_net(skb
->sk
);
2561 struct net_device
*dev
;
2562 struct nlattr
*tb
[IFLA_MAX
+1];
2563 u32 ext_filter_mask
= 0;
2564 u16 min_ifinfo_dump_size
= 0;
2567 /* Same kernel<->userspace interface hack as in rtnl_dump_ifinfo. */
2568 hdrlen
= nlmsg_len(nlh
) < sizeof(struct ifinfomsg
) ?
2569 sizeof(struct rtgenmsg
) : sizeof(struct ifinfomsg
);
2571 if (nlmsg_parse(nlh
, hdrlen
, tb
, IFLA_MAX
, ifla_policy
) >= 0) {
2572 if (tb
[IFLA_EXT_MASK
])
2573 ext_filter_mask
= nla_get_u32(tb
[IFLA_EXT_MASK
]);
2576 if (!ext_filter_mask
)
2577 return NLMSG_GOODSIZE
;
2579 * traverse the list of net devices and compute the minimum
2580 * buffer size based upon the filter mask.
2582 list_for_each_entry(dev
, &net
->dev_base_head
, dev_list
) {
2583 min_ifinfo_dump_size
= max_t(u16
, min_ifinfo_dump_size
,
2588 return min_ifinfo_dump_size
;
2591 static int rtnl_dump_all(struct sk_buff
*skb
, struct netlink_callback
*cb
)
2594 int s_idx
= cb
->family
;
2598 for (idx
= 1; idx
<= RTNL_FAMILY_MAX
; idx
++) {
2599 int type
= cb
->nlh
->nlmsg_type
-RTM_BASE
;
2600 if (idx
< s_idx
|| idx
== PF_PACKET
)
2602 if (rtnl_msg_handlers
[idx
] == NULL
||
2603 rtnl_msg_handlers
[idx
][type
].dumpit
== NULL
)
2606 memset(&cb
->args
[0], 0, sizeof(cb
->args
));
2610 if (rtnl_msg_handlers
[idx
][type
].dumpit(skb
, cb
))
2618 struct sk_buff
*rtmsg_ifinfo_build_skb(int type
, struct net_device
*dev
,
2619 unsigned int change
, gfp_t flags
)
2621 struct net
*net
= dev_net(dev
);
2622 struct sk_buff
*skb
;
2624 size_t if_info_size
;
2626 skb
= nlmsg_new((if_info_size
= if_nlmsg_size(dev
, 0)), flags
);
2630 err
= rtnl_fill_ifinfo(skb
, dev
, type
, 0, 0, change
, 0, 0);
2632 /* -EMSGSIZE implies BUG in if_nlmsg_size() */
2633 WARN_ON(err
== -EMSGSIZE
);
2640 rtnl_set_sk_err(net
, RTNLGRP_LINK
, err
);
2644 void rtmsg_ifinfo_send(struct sk_buff
*skb
, struct net_device
*dev
, gfp_t flags
)
2646 struct net
*net
= dev_net(dev
);
2648 rtnl_notify(skb
, net
, 0, RTNLGRP_LINK
, NULL
, flags
);
2651 void rtmsg_ifinfo(int type
, struct net_device
*dev
, unsigned int change
,
2654 struct sk_buff
*skb
;
2656 if (dev
->reg_state
!= NETREG_REGISTERED
)
2659 skb
= rtmsg_ifinfo_build_skb(type
, dev
, change
, flags
);
2661 rtmsg_ifinfo_send(skb
, dev
, flags
);
2663 EXPORT_SYMBOL(rtmsg_ifinfo
);
2665 static int nlmsg_populate_fdb_fill(struct sk_buff
*skb
,
2666 struct net_device
*dev
,
2667 u8
*addr
, u16 vid
, u32 pid
, u32 seq
,
2668 int type
, unsigned int flags
,
2669 int nlflags
, u16 ndm_state
)
2671 struct nlmsghdr
*nlh
;
2674 nlh
= nlmsg_put(skb
, pid
, seq
, type
, sizeof(*ndm
), nlflags
);
2678 ndm
= nlmsg_data(nlh
);
2679 ndm
->ndm_family
= AF_BRIDGE
;
2682 ndm
->ndm_flags
= flags
;
2684 ndm
->ndm_ifindex
= dev
->ifindex
;
2685 ndm
->ndm_state
= ndm_state
;
2687 if (nla_put(skb
, NDA_LLADDR
, ETH_ALEN
, addr
))
2688 goto nla_put_failure
;
2690 if (nla_put(skb
, NDA_VLAN
, sizeof(u16
), &vid
))
2691 goto nla_put_failure
;
2693 nlmsg_end(skb
, nlh
);
2697 nlmsg_cancel(skb
, nlh
);
2701 static inline size_t rtnl_fdb_nlmsg_size(void)
2703 return NLMSG_ALIGN(sizeof(struct ndmsg
)) + nla_total_size(ETH_ALEN
);
2706 static void rtnl_fdb_notify(struct net_device
*dev
, u8
*addr
, u16 vid
, int type
,
2709 struct net
*net
= dev_net(dev
);
2710 struct sk_buff
*skb
;
2713 skb
= nlmsg_new(rtnl_fdb_nlmsg_size(), GFP_ATOMIC
);
2717 err
= nlmsg_populate_fdb_fill(skb
, dev
, addr
, vid
,
2718 0, 0, type
, NTF_SELF
, 0, ndm_state
);
2724 rtnl_notify(skb
, net
, 0, RTNLGRP_NEIGH
, NULL
, GFP_ATOMIC
);
2727 rtnl_set_sk_err(net
, RTNLGRP_NEIGH
, err
);
2731 * ndo_dflt_fdb_add - default netdevice operation to add an FDB entry
2733 int ndo_dflt_fdb_add(struct ndmsg
*ndm
,
2734 struct nlattr
*tb
[],
2735 struct net_device
*dev
,
2736 const unsigned char *addr
, u16 vid
,
2741 /* If aging addresses are supported device will need to
2742 * implement its own handler for this.
2744 if (ndm
->ndm_state
&& !(ndm
->ndm_state
& NUD_PERMANENT
)) {
2745 pr_info("%s: FDB only supports static addresses\n", dev
->name
);
2750 pr_info("%s: vlans aren't supported yet for dev_uc|mc_add()\n", dev
->name
);
2754 if (is_unicast_ether_addr(addr
) || is_link_local_ether_addr(addr
))
2755 err
= dev_uc_add_excl(dev
, addr
);
2756 else if (is_multicast_ether_addr(addr
))
2757 err
= dev_mc_add_excl(dev
, addr
);
2759 /* Only return duplicate errors if NLM_F_EXCL is set */
2760 if (err
== -EEXIST
&& !(flags
& NLM_F_EXCL
))
2765 EXPORT_SYMBOL(ndo_dflt_fdb_add
);
2767 static int fdb_vid_parse(struct nlattr
*vlan_attr
, u16
*p_vid
)
2772 if (nla_len(vlan_attr
) != sizeof(u16
)) {
2773 pr_info("PF_BRIDGE: RTM_NEWNEIGH with invalid vlan\n");
2777 vid
= nla_get_u16(vlan_attr
);
2779 if (!vid
|| vid
>= VLAN_VID_MASK
) {
2780 pr_info("PF_BRIDGE: RTM_NEWNEIGH with invalid vlan id %d\n",
/*
 * rtnl_fdb_add - PF_BRIDGE RTM_NEWNEIGH handler (see the rtnl_register()
 * calls in rtnetlink_init()).
 *
 * Visible steps, in order:
 *   1. parse the request attributes into tb[] with nlmsg_parse();
 *   2. log a message for ndm_ifindex == 0, look the device up with
 *      __dev_get_by_index(), and log "unknown ifindex" on the failure path;
 *   3. require NDA_LLADDR to be present and exactly ETH_ALEN bytes long;
 *   4. parse tb[NDA_VLAN] through fdb_vid_parse();
 *   5. master path: when ndm_flags is 0 or has NTF_MASTER and the device is
 *      a bridge port, call the master's ndo_fdb_add and clear NTF_MASTER;
 *   6. self path: when NTF_SELF is set, use the device's own ndo_fdb_add if
 *      it has one (ndo_dflt_fdb_add() also appears in this branch), call
 *      rtnl_fdb_notify(RTM_NEWNEIGH) and clear NTF_SELF.
 *
 * NOTE(review): error returns, the else/if (!err) glue between the visible
 * statements, and some declarations are on lines missing from this listing.
 */
2789 static int rtnl_fdb_add(struct sk_buff
*skb
, struct nlmsghdr
*nlh
)
2791 struct net
*net
= sock_net(skb
->sk
);
2793 struct nlattr
*tb
[NDA_MAX
+1];
2794 struct net_device
*dev
;
2799 err
= nlmsg_parse(nlh
, sizeof(*ndm
), tb
, NDA_MAX
, NULL
);
2803 ndm
= nlmsg_data(nlh
);
2804 if (ndm
->ndm_ifindex
== 0) {
2805 pr_info("PF_BRIDGE: RTM_NEWNEIGH with invalid ifindex\n");
2809 dev
= __dev_get_by_index(net
, ndm
->ndm_ifindex
);
2811 pr_info("PF_BRIDGE: RTM_NEWNEIGH with unknown ifindex\n");
2815 if (!tb
[NDA_LLADDR
] || nla_len(tb
[NDA_LLADDR
]) != ETH_ALEN
) {
2816 pr_info("PF_BRIDGE: RTM_NEWNEIGH with invalid address\n");
2820 addr
= nla_data(tb
[NDA_LLADDR
]);
2822 err
= fdb_vid_parse(tb
[NDA_VLAN
], &vid
);
2828 /* Support fdb on master device the net/bridge default case */
2829 if ((!ndm
->ndm_flags
|| ndm
->ndm_flags
& NTF_MASTER
) &&
2830 (dev
->priv_flags
& IFF_BRIDGE_PORT
)) {
/* NOTE(review): br_dev is dereferenced with no visible NULL check; this
 * presumably relies on IFF_BRIDGE_PORT implying a master - confirm.
 */
2831 struct net_device
*br_dev
= netdev_master_upper_dev_get(dev
);
2832 const struct net_device_ops
*ops
= br_dev
->netdev_ops
;
/* NOTE(review): unlike rtnl_fdb_del(), no "if (ops->ndo_fdb_add)" test is
 * visible before this call - confirm the master always implements it.
 */
2834 err
= ops
->ndo_fdb_add(ndm
, tb
, dev
, addr
, vid
,
2839 ndm
->ndm_flags
&= ~NTF_MASTER
;
2842 /* Embedded bridge, macvlan, and any other device support */
2843 if ((ndm
->ndm_flags
& NTF_SELF
)) {
2844 if (dev
->netdev_ops
->ndo_fdb_add
)
2845 err
= dev
->netdev_ops
->ndo_fdb_add(ndm
, tb
, dev
, addr
,
2849 err
= ndo_dflt_fdb_add(ndm
, tb
, dev
, addr
, vid
,
2853 rtnl_fdb_notify(dev
, addr
, vid
, RTM_NEWNEIGH
,
2855 ndm
->ndm_flags
&= ~NTF_SELF
;
2863 * ndo_dflt_fdb_del - default netdevice operation to delete an FDB entry
/*
 * ndo_dflt_fdb_del - fallback FDB "delete" handler backed by the device's
 * unicast/multicast address lists.
 *
 * Visible behaviour: a request whose ndm_state lacks NUD_PERMANENT is
 * reported with "FDB only supports static addresses". Unicast or link-local
 * addresses are removed with dev_uc_del(), multicast ones with dev_mc_del().
 *
 * Note the state test differs from ndo_dflt_fdb_add(): here ndm_state == 0
 * also trips the NUD_PERMANENT check, whereas the add path only complains
 * when ndm_state is non-zero.
 *
 * NOTE(review): the return statements are on lines missing from this listing.
 */
2865 int ndo_dflt_fdb_del(struct ndmsg
*ndm
,
2866 struct nlattr
*tb
[],
2867 struct net_device
*dev
,
2868 const unsigned char *addr
, u16 vid
)
2872 /* If aging addresses are supported device will need to
2873 * implement its own handler for this.
2875 if (!(ndm
->ndm_state
& NUD_PERMANENT
)) {
2876 pr_info("%s: FDB only supports static addresses\n", dev
->name
);
2880 if (is_unicast_ether_addr(addr
) || is_link_local_ether_addr(addr
))
2881 err
= dev_uc_del(dev
, addr
);
2882 else if (is_multicast_ether_addr(addr
))
2883 err
= dev_mc_del(dev
, addr
);
2887 EXPORT_SYMBOL(ndo_dflt_fdb_del
);
/*
 * rtnl_fdb_del - PF_BRIDGE RTM_DELNEIGH handler (see the rtnl_register()
 * calls in rtnetlink_init()).
 *
 * Mirrors rtnl_fdb_add() with these visible differences:
 *   - the sender is checked with netlink_capable(skb, CAP_NET_ADMIN) first;
 *   - on the master path the master's ndo_fdb_del pointer is tested before
 *     it is called;
 *   - the self path uses ndo_fdb_del / ndo_dflt_fdb_del() and notifies with
 *     RTM_DELNEIGH.
 * Request validation (ifindex, NDA_LLADDR length == ETH_ALEN, NDA_VLAN via
 * fdb_vid_parse()) and the clearing of NTF_MASTER / NTF_SELF after each path
 * follow the same pattern as the add handler.
 *
 * NOTE(review): error returns and the glue between the visible statements
 * are on lines missing from this listing.
 */
2889 static int rtnl_fdb_del(struct sk_buff
*skb
, struct nlmsghdr
*nlh
)
2891 struct net
*net
= sock_net(skb
->sk
);
2893 struct nlattr
*tb
[NDA_MAX
+1];
2894 struct net_device
*dev
;
2899 if (!netlink_capable(skb
, CAP_NET_ADMIN
))
2902 err
= nlmsg_parse(nlh
, sizeof(*ndm
), tb
, NDA_MAX
, NULL
);
2906 ndm
= nlmsg_data(nlh
);
2907 if (ndm
->ndm_ifindex
== 0) {
2908 pr_info("PF_BRIDGE: RTM_DELNEIGH with invalid ifindex\n");
2912 dev
= __dev_get_by_index(net
, ndm
->ndm_ifindex
);
2914 pr_info("PF_BRIDGE: RTM_DELNEIGH with unknown ifindex\n");
2918 if (!tb
[NDA_LLADDR
] || nla_len(tb
[NDA_LLADDR
]) != ETH_ALEN
) {
2919 pr_info("PF_BRIDGE: RTM_DELNEIGH with invalid address\n");
2923 addr
= nla_data(tb
[NDA_LLADDR
]);
2925 err
= fdb_vid_parse(tb
[NDA_VLAN
], &vid
);
2931 /* Support fdb on master device the net/bridge default case */
2932 if ((!ndm
->ndm_flags
|| ndm
->ndm_flags
& NTF_MASTER
) &&
2933 (dev
->priv_flags
& IFF_BRIDGE_PORT
)) {
2934 struct net_device
*br_dev
= netdev_master_upper_dev_get(dev
);
2935 const struct net_device_ops
*ops
= br_dev
->netdev_ops
;
2937 if (ops
->ndo_fdb_del
)
2938 err
= ops
->ndo_fdb_del(ndm
, tb
, dev
, addr
, vid
);
2943 ndm
->ndm_flags
&= ~NTF_MASTER
;
2946 /* Embedded bridge, macvlan, and any other device support */
2947 if (ndm
->ndm_flags
& NTF_SELF
) {
2948 if (dev
->netdev_ops
->ndo_fdb_del
)
2949 err
= dev
->netdev_ops
->ndo_fdb_del(ndm
, tb
, dev
, addr
,
2952 err
= ndo_dflt_fdb_del(ndm
, tb
, dev
, addr
, vid
);
2955 rtnl_fdb_notify(dev
, addr
, vid
, RTM_DELNEIGH
,
2957 ndm
->ndm_flags
&= ~NTF_SELF
;
/*
 * nlmsg_populate_fdb - write one FDB record per entry of a hardware address
 * list into a dump reply.
 *
 * portid and seq are taken from the dump request (cb->skb, cb->nlh). Each
 * list entry is compared against the resume position in cb->args[0] through
 * *idx, and entries are emitted with nlmsg_populate_fdb_fill() as
 * RTM_NEWNEIGH / NTF_SELF / NLM_F_MULTI / NUD_PERMANENT records with vid 0.
 *
 * NOTE(review): the body of the "*idx < cb->args[0]" branch, the idx
 * increment and the return statements are on lines missing from this
 * listing; presumably already-dumped entries are skipped - confirm.
 */
2964 static int nlmsg_populate_fdb(struct sk_buff
*skb
,
2965 struct netlink_callback
*cb
,
2966 struct net_device
*dev
,
2968 struct netdev_hw_addr_list
*list
)
2970 struct netdev_hw_addr
*ha
;
2974 portid
= NETLINK_CB(cb
->skb
).portid
;
2975 seq
= cb
->nlh
->nlmsg_seq
;
2977 list_for_each_entry(ha
, &list
->list
, list
) {
2978 if (*idx
< cb
->args
[0])
2981 err
= nlmsg_populate_fdb_fill(skb
, dev
, ha
->addr
, 0,
2983 RTM_NEWNEIGH
, NTF_SELF
,
2984 NLM_F_MULTI
, NUD_PERMANENT
);
2994 * ndo_dflt_fdb_dump - default netdevice operation to dump an FDB table.
2995 * @skb: netlink message buffer the entries are written into
2998 * Default netdevice operation to dump the existing unicast and multicast address lists.
2999 * Returns number of addresses from list put in skb.
/*
 * ndo_dflt_fdb_dump - fallback FDB dump handler.
 *
 * With the device address lock held (netif_addr_lock_bh/unlock_bh), feeds
 * first dev->uc and then dev->mc through nlmsg_populate_fdb(), sharing one
 * running index (&idx) between the two walks. The result of the unicast walk
 * is stored in err; the multicast call's result is not stored on the visible
 * line.
 *
 * NOTE(review): the remaining parameters, the check on err between the two
 * walks and the return statement are on lines missing from this listing.
 */
3001 int ndo_dflt_fdb_dump(struct sk_buff
*skb
,
3002 struct netlink_callback
*cb
,
3003 struct net_device
*dev
,
3004 struct net_device
*filter_dev
,
3009 netif_addr_lock_bh(dev
);
3010 err
= nlmsg_populate_fdb(skb
, cb
, dev
, &idx
, &dev
->uc
);
3013 nlmsg_populate_fdb(skb
, cb
, dev
, &idx
, &dev
->mc
);
3015 netif_addr_unlock_bh(dev
);
3019 EXPORT_SYMBOL(ndo_dflt_fdb_dump
);
/*
 * rtnl_fdb_dump - PF_BRIDGE RTM_GETNEIGH dump callback (see the
 * rtnl_register() calls in rtnetlink_init()).
 *
 * Optional filters are read from the request when it parses as an ifinfomsg
 * with ifla_policy: IFLA_MASTER selects a bridge (br_idx) and ifi_index
 * selects a single port (brport_idx). When a bridge index is in play the
 * bridge device is looked up and its netdev_ops cached in ops.
 *
 * Every device in the namespace is then visited:
 *   - devices not matching brport_idx are filtered;
 *   - with no bridge selected, a bridge port's master and its ops (cops) are
 *     resolved per device; with a bridge selected, devices unrelated to that
 *     bridge are filtered;
 *   - bridge ports are dumped through the master's ndo_fdb_dump;
 *   - the device's own ndo_fdb_dump, or ndo_dflt_fdb_dump(), is used for the
 *     device itself;
 *   - cb->args[1] == -EMSGSIZE is tested after each dump step.
 *
 * NOTE(review): the continue/break/goto statements, the cops assignment for
 * the "bridge selected" case and the final bookkeeping are on lines missing
 * from this listing.
 */
3021 static int rtnl_fdb_dump(struct sk_buff
*skb
, struct netlink_callback
*cb
)
3023 struct net_device
*dev
;
3024 struct nlattr
*tb
[IFLA_MAX
+1];
3025 struct net_device
*br_dev
= NULL
;
3026 const struct net_device_ops
*ops
= NULL
;
3027 const struct net_device_ops
*cops
= NULL
;
3028 struct ifinfomsg
*ifm
= nlmsg_data(cb
->nlh
);
3029 struct net
*net
= sock_net(skb
->sk
);
3034 if (nlmsg_parse(cb
->nlh
, sizeof(struct ifinfomsg
), tb
, IFLA_MAX
,
3035 ifla_policy
) == 0) {
3036 if (tb
[IFLA_MASTER
])
3037 br_idx
= nla_get_u32(tb
[IFLA_MASTER
]);
3040 brport_idx
= ifm
->ifi_index
;
3043 br_dev
= __dev_get_by_index(net
, br_idx
);
3047 ops
= br_dev
->netdev_ops
;
3051 for_each_netdev(net
, dev
) {
3052 if (brport_idx
&& (dev
->ifindex
!= brport_idx
))
3055 if (!br_idx
) { /* user did not specify a specific bridge */
3056 if (dev
->priv_flags
& IFF_BRIDGE_PORT
) {
3057 br_dev
= netdev_master_upper_dev_get(dev
);
3058 cops
= br_dev
->netdev_ops
;
3062 if (dev
!= br_dev
&&
3063 !(dev
->priv_flags
& IFF_BRIDGE_PORT
))
3066 if (br_dev
!= netdev_master_upper_dev_get(dev
) &&
3067 !(dev
->priv_flags
& IFF_EBRIDGE
))
3073 if (dev
->priv_flags
& IFF_BRIDGE_PORT
) {
3074 if (cops
&& cops
->ndo_fdb_dump
)
3075 idx
= cops
->ndo_fdb_dump(skb
, cb
, br_dev
, dev
,
3078 if (cb
->args
[1] == -EMSGSIZE
)
3081 if (dev
->netdev_ops
->ndo_fdb_dump
)
3082 idx
= dev
->netdev_ops
->ndo_fdb_dump(skb
, cb
, dev
, NULL
,
3085 idx
= ndo_dflt_fdb_dump(skb
, cb
, dev
, NULL
, idx
);
3086 if (cb
->args
[1] == -EMSGSIZE
)
/*
 * brport_nla_put_flag - emit one bridge-port flag as a u8 boolean attribute.
 * @skb: message being built
 * @flags: current flag word
 * @mask: not referenced on the visible lines
 * @attrnum: attribute type to write
 * @flag: bit to test in @flags
 *
 * The attribute value is 1 when @flag is set in @flags and 0 otherwise
 * (the !! normalises the masked value).
 *
 * NOTE(review): @mask presumably gates whether the attribute is written at
 * all; that statement is on a line missing from this listing - confirm.
 */
3096 static int brport_nla_put_flag(struct sk_buff
*skb
, u32 flags
, u32 mask
,
3097 unsigned int attrnum
, unsigned int flag
)
3100 return nla_put_u8(skb
, attrnum
, !!(flags
& flag
));
/*
 * ndo_dflt_bridge_getlink - build an AF_BRIDGE RTM_NEWLINK message that
 * describes @dev.
 *
 * Message layout, as written by the visible code:
 *   - struct ifinfomsg header: family AF_BRIDGE, the device type, ifindex and
 *     flags, ifi_change 0;
 *   - IFLA_IFNAME, IFLA_MTU and IFLA_OPERSTATE (a u8; IF_OPER_DOWN is
 *     reported when the device is not running);
 *   - IFLA_MASTER and IFLA_ADDRESS (their guarding conditions are on lines
 *     missing from this listing);
 *   - IFLA_LINK, only when dev_get_iflink() differs from the ifindex;
 *   - an IFLA_AF_SPEC nest holding IFLA_BRIDGE_FLAGS = BRIDGE_FLAGS_SELF,
 *     IFLA_BRIDGE_MODE unless @mode is BRIDGE_MODE_UNDEF, and whatever the
 *     @vlan_fill callback adds;
 *   - an IFLA_PROTINFO nest with one u8 per bridge-port flag, written through
 *     brport_nla_put_flag().
 *
 * Failure handling: a nest that is still open is cancelled before jumping to
 * nla_put_failure; the failure path cancels the whole message and returns
 * err, or -EMSGSIZE when err is 0.
 */
3104 int ndo_dflt_bridge_getlink(struct sk_buff
*skb
, u32 pid
, u32 seq
,
3105 struct net_device
*dev
, u16 mode
,
3106 u32 flags
, u32 mask
, int nlflags
,
3108 int (*vlan_fill
)(struct sk_buff
*skb
,
3109 struct net_device
*dev
,
3112 struct nlmsghdr
*nlh
;
3113 struct ifinfomsg
*ifm
;
3114 struct nlattr
*br_afspec
;
3115 struct nlattr
*protinfo
;
3116 u8 operstate
= netif_running(dev
) ? dev
->operstate
: IF_OPER_DOWN
;
3117 struct net_device
*br_dev
= netdev_master_upper_dev_get(dev
);
3120 nlh
= nlmsg_put(skb
, pid
, seq
, RTM_NEWLINK
, sizeof(*ifm
), nlflags
);
3124 ifm
= nlmsg_data(nlh
);
3125 ifm
->ifi_family
= AF_BRIDGE
;
3127 ifm
->ifi_type
= dev
->type
;
3128 ifm
->ifi_index
= dev
->ifindex
;
3129 ifm
->ifi_flags
= dev_get_flags(dev
);
3130 ifm
->ifi_change
= 0;
3133 if (nla_put_string(skb
, IFLA_IFNAME
, dev
->name
) ||
3134 nla_put_u32(skb
, IFLA_MTU
, dev
->mtu
) ||
3135 nla_put_u8(skb
, IFLA_OPERSTATE
, operstate
) ||
3137 nla_put_u32(skb
, IFLA_MASTER
, br_dev
->ifindex
)) ||
3139 nla_put(skb
, IFLA_ADDRESS
, dev
->addr_len
, dev
->dev_addr
)) ||
3140 (dev
->ifindex
!= dev_get_iflink(dev
) &&
3141 nla_put_u32(skb
, IFLA_LINK
, dev_get_iflink(dev
))))
3142 goto nla_put_failure
;
3144 br_afspec
= nla_nest_start(skb
, IFLA_AF_SPEC
);
3146 goto nla_put_failure
;
3148 if (nla_put_u16(skb
, IFLA_BRIDGE_FLAGS
, BRIDGE_FLAGS_SELF
)) {
3149 nla_nest_cancel(skb
, br_afspec
);
3150 goto nla_put_failure
;
3153 if (mode
!= BRIDGE_MODE_UNDEF
) {
3154 if (nla_put_u16(skb
, IFLA_BRIDGE_MODE
, mode
)) {
3155 nla_nest_cancel(skb
, br_afspec
);
3156 goto nla_put_failure
;
3160 err
= vlan_fill(skb
, dev
, filter_mask
);
3162 nla_nest_cancel(skb
, br_afspec
);
3163 goto nla_put_failure
;
3166 nla_nest_end(skb
, br_afspec
);
3168 protinfo
= nla_nest_start(skb
, IFLA_PROTINFO
| NLA_F_NESTED
);
3170 goto nla_put_failure
;
3172 if (brport_nla_put_flag(skb
, flags
, mask
,
3173 IFLA_BRPORT_MODE
, BR_HAIRPIN_MODE
) ||
3174 brport_nla_put_flag(skb
, flags
, mask
,
3175 IFLA_BRPORT_GUARD
, BR_BPDU_GUARD
) ||
3176 brport_nla_put_flag(skb
, flags
, mask
,
3177 IFLA_BRPORT_FAST_LEAVE
,
3178 BR_MULTICAST_FAST_LEAVE
) ||
3179 brport_nla_put_flag(skb
, flags
, mask
,
3180 IFLA_BRPORT_PROTECT
, BR_ROOT_BLOCK
) ||
3181 brport_nla_put_flag(skb
, flags
, mask
,
3182 IFLA_BRPORT_LEARNING
, BR_LEARNING
) ||
3183 brport_nla_put_flag(skb
, flags
, mask
,
3184 IFLA_BRPORT_LEARNING_SYNC
, BR_LEARNING_SYNC
) ||
3185 brport_nla_put_flag(skb
, flags
, mask
,
3186 IFLA_BRPORT_UNICAST_FLOOD
, BR_FLOOD
) ||
3187 brport_nla_put_flag(skb
, flags
, mask
,
3188 IFLA_BRPORT_PROXYARP
, BR_PROXYARP
)) {
3189 nla_nest_cancel(skb
, protinfo
);
3190 goto nla_put_failure
;
3193 nla_nest_end(skb
, protinfo
);
3195 nlmsg_end(skb
, nlh
);
3198 nlmsg_cancel(skb
, nlh
);
3199 return err
? err
: -EMSGSIZE
;
3201 EXPORT_SYMBOL_GPL(ndo_dflt_bridge_getlink
);
/*
 * rtnl_bridge_getlink - PF_BRIDGE RTM_GETLINK dump callback (see the
 * rtnl_register() calls in rtnetlink_init()).
 *
 * When the request carries data beyond struct ifinfomsg, an attribute is
 * looked up with nlmsg_find_attr() and, if at least sizeof(u32) long, read
 * into filter_mask (the attribute type is on a line missing from this
 * listing).
 *
 * Devices are walked with for_each_netdev_rcu(). For each device, up to two
 * entries are produced: one through the master's ndo_bridge_getlink (when
 * the device has a master that implements it) and one through the device's
 * own ndo_bridge_getlink. Each entry is emitted with NLM_F_MULTI, and only
 * when the running idx has reached the resume position in cb->args[0]. A
 * negative result other than -EOPNOTSUPP is tested after each call.
 *
 * NOTE(review): the RCU lock/unlock, idx increments, loop exits and the
 * return value are on lines missing from this listing.
 */
3203 static int rtnl_bridge_getlink(struct sk_buff
*skb
, struct netlink_callback
*cb
)
3205 struct net
*net
= sock_net(skb
->sk
);
3206 struct net_device
*dev
;
3208 u32 portid
= NETLINK_CB(cb
->skb
).portid
;
3209 u32 seq
= cb
->nlh
->nlmsg_seq
;
3210 u32 filter_mask
= 0;
3213 if (nlmsg_len(cb
->nlh
) > sizeof(struct ifinfomsg
)) {
3214 struct nlattr
*extfilt
;
3216 extfilt
= nlmsg_find_attr(cb
->nlh
, sizeof(struct ifinfomsg
),
/* NOTE(review): no NULL test on extfilt is visible before nla_len();
 * confirm the full source guards the attribute lookup result.
 */
3219 if (nla_len(extfilt
) < sizeof(filter_mask
))
3222 filter_mask
= nla_get_u32(extfilt
);
3227 for_each_netdev_rcu(net
, dev
) {
3228 const struct net_device_ops
*ops
= dev
->netdev_ops
;
3229 struct net_device
*br_dev
= netdev_master_upper_dev_get(dev
);
3231 if (br_dev
&& br_dev
->netdev_ops
->ndo_bridge_getlink
) {
3232 if (idx
>= cb
->args
[0]) {
3233 err
= br_dev
->netdev_ops
->ndo_bridge_getlink(
3234 skb
, portid
, seq
, dev
,
3235 filter_mask
, NLM_F_MULTI
);
3236 if (err
< 0 && err
!= -EOPNOTSUPP
)
3242 if (ops
->ndo_bridge_getlink
) {
3243 if (idx
>= cb
->args
[0]) {
3244 err
= ops
->ndo_bridge_getlink(skb
, portid
,
3248 if (err
< 0 && err
!= -EOPNOTSUPP
)
/*
 * bridge_nlmsg_size - payload size estimate for the bridge link notification
 * allocated in rtnl_bridge_notify().
 *
 * The sum is one aligned struct ifinfomsg plus one nla_total_size() term per
 * attribute listed below.
 *
 * NOTE(review): two terms do not match what ndo_dflt_bridge_getlink() writes:
 * IFLA_OPERSTATE is reserved as a u32 but written with nla_put_u8(), and
 * IFLA_PROTINFO is reserved as a single u8 although it is a nest that can
 * carry one u8 attribute per bridge-port flag. Nothing here reserves room
 * for data added by a vlan_fill callback either. rtnl_bridge_notify() has a
 * WARN_ON for -EMSGSIZE, so confirm the estimate is large enough in practice.
 */
3260 static inline size_t bridge_nlmsg_size(void)
3262 return NLMSG_ALIGN(sizeof(struct ifinfomsg
))
3263 + nla_total_size(IFNAMSIZ
) /* IFLA_IFNAME */
3264 + nla_total_size(MAX_ADDR_LEN
) /* IFLA_ADDRESS */
3265 + nla_total_size(sizeof(u32
)) /* IFLA_MASTER */
3266 + nla_total_size(sizeof(u32
)) /* IFLA_MTU */
3267 + nla_total_size(sizeof(u32
)) /* IFLA_LINK */
3268 + nla_total_size(sizeof(u32
)) /* IFLA_OPERSTATE (reserved as u32; written as u8) */
3269 + nla_total_size(sizeof(u8
)) /* IFLA_PROTINFO (nest; reserved as one u8 only) */
3270 + nla_total_size(sizeof(struct nlattr
)) /* IFLA_AF_SPEC */
3271 + nla_total_size(sizeof(u16
)) /* IFLA_BRIDGE_FLAGS */
3272 + nla_total_size(sizeof(u16
)); /* IFLA_BRIDGE_MODE */
/*
 * rtnl_bridge_notify - multicast the current bridge link state of @dev to
 * RTNLGRP_LINK listeners.
 *
 * err starts as -EOPNOTSUPP and the device's ndo_bridge_getlink pointer is
 * tested first. A message of bridge_nlmsg_size() bytes is allocated with
 * GFP_ATOMIC, filled by the device's ndo_bridge_getlink (portid, seq, filter
 * mask and nlflags all 0) and handed to rtnl_notify(). On the failure path
 * -EMSGSIZE triggers a WARN_ON, which flags an undersized
 * bridge_nlmsg_size(), and rtnl_set_sk_err() records the error on the group.
 *
 * NOTE(review): the goto/label structure, the skb free and the return
 * statements are on lines missing from this listing.
 */
3275 static int rtnl_bridge_notify(struct net_device
*dev
)
3277 struct net
*net
= dev_net(dev
);
3278 struct sk_buff
*skb
;
3279 int err
= -EOPNOTSUPP
;
3281 if (!dev
->netdev_ops
->ndo_bridge_getlink
)
3284 skb
= nlmsg_new(bridge_nlmsg_size(), GFP_ATOMIC
);
3290 err
= dev
->netdev_ops
->ndo_bridge_getlink(skb
, 0, 0, dev
, 0, 0);
3297 rtnl_notify(skb
, net
, 0, RTNLGRP_LINK
, NULL
, GFP_ATOMIC
);
3300 WARN_ON(err
== -EMSGSIZE
);
3303 rtnl_set_sk_err(net
, RTNLGRP_LINK
, err
);
/*
 * rtnl_bridge_setlink - PF_BRIDGE RTM_SETLINK handler (see the
 * rtnl_register() calls in rtnetlink_init()).
 *
 * Visible steps:
 *   1. the message must be at least sizeof(struct ifinfomsg) and carry
 *      ifi_family == AF_BRIDGE (otherwise -EPFNOSUPPORT);
 *   2. the device is looked up by ifi_index;
 *   3. IFLA_AF_SPEC is scanned for an IFLA_BRIDGE_FLAGS attribute of at least
 *      sizeof(flags) bytes, which is read as a u16;
 *   4. master path: when flags is 0 or has BRIDGE_FLAGS_MASTER, the master's
 *      ndo_bridge_setlink is called (master and callback are both tested)
 *      and BRIDGE_FLAGS_MASTER is cleared;
 *   5. self path: when BRIDGE_FLAGS_SELF is set, the device's own
 *      ndo_bridge_setlink is called, BRIDGE_FLAGS_SELF is cleared and
 *      rtnl_bridge_notify() is invoked;
 *   6. the remaining flags are copied back into the request attribute with
 *      memcpy(), so the attribute shows which flags were not handled.
 *
 * NOTE(review): error returns, the have_flags bookkeeping and the glue
 * between the visible statements are on lines missing from this listing.
 */
3307 static int rtnl_bridge_setlink(struct sk_buff
*skb
, struct nlmsghdr
*nlh
)
3309 struct net
*net
= sock_net(skb
->sk
);
3310 struct ifinfomsg
*ifm
;
3311 struct net_device
*dev
;
3312 struct nlattr
*br_spec
, *attr
= NULL
;
3313 int rem
, err
= -EOPNOTSUPP
;
3315 bool have_flags
= false;
3317 if (nlmsg_len(nlh
) < sizeof(*ifm
))
3320 ifm
= nlmsg_data(nlh
);
3321 if (ifm
->ifi_family
!= AF_BRIDGE
)
3322 return -EPFNOSUPPORT
;
3324 dev
= __dev_get_by_index(net
, ifm
->ifi_index
);
3326 pr_info("PF_BRIDGE: RTM_SETLINK with unknown ifindex\n");
3330 br_spec
= nlmsg_find_attr(nlh
, sizeof(struct ifinfomsg
), IFLA_AF_SPEC
);
3332 nla_for_each_nested(attr
, br_spec
, rem
) {
3333 if (nla_type(attr
) == IFLA_BRIDGE_FLAGS
) {
3334 if (nla_len(attr
) < sizeof(flags
))
3338 flags
= nla_get_u16(attr
);
3344 if (!flags
|| (flags
& BRIDGE_FLAGS_MASTER
)) {
3345 struct net_device
*br_dev
= netdev_master_upper_dev_get(dev
);
3347 if (!br_dev
|| !br_dev
->netdev_ops
->ndo_bridge_setlink
) {
3352 err
= br_dev
->netdev_ops
->ndo_bridge_setlink(dev
, nlh
, flags
);
3356 flags
&= ~BRIDGE_FLAGS_MASTER
;
3359 if ((flags
& BRIDGE_FLAGS_SELF
)) {
3360 if (!dev
->netdev_ops
->ndo_bridge_setlink
)
3363 err
= dev
->netdev_ops
->ndo_bridge_setlink(dev
, nlh
,
3366 flags
&= ~BRIDGE_FLAGS_SELF
;
3368 /* Generate event to notify upper layer of bridge
3371 err
= rtnl_bridge_notify(dev
);
3376 memcpy(nla_data(attr
), &flags
, sizeof(flags
));
/*
 * rtnl_bridge_dellink - PF_BRIDGE RTM_DELLINK handler (see the
 * rtnl_register() calls in rtnetlink_init()).
 *
 * Same shape as rtnl_bridge_setlink(), but dispatching to
 * ndo_bridge_dellink:
 *   1. the message must be at least sizeof(struct ifinfomsg) and carry
 *      ifi_family == AF_BRIDGE (otherwise -EPFNOSUPPORT);
 *   2. the device is looked up by ifi_index; the failure message names
 *      RTM_DELLINK so that logs identify the request that was rejected
 *      (it previously said RTM_SETLINK, copied from the setlink handler);
 *   3. IFLA_AF_SPEC is scanned for an IFLA_BRIDGE_FLAGS attribute of at least
 *      sizeof(flags) bytes, which is read as a u16;
 *   4. master path: when flags is 0 or has BRIDGE_FLAGS_MASTER, the master's
 *      ndo_bridge_dellink is called and BRIDGE_FLAGS_MASTER is cleared;
 *   5. self path: when BRIDGE_FLAGS_SELF is set, the device's own
 *      ndo_bridge_dellink is called, BRIDGE_FLAGS_SELF is cleared and
 *      rtnl_bridge_notify() is invoked;
 *   6. the remaining flags are copied back into the request attribute.
 *
 * NOTE(review): error returns, the have_flags bookkeeping and the glue
 * between the visible statements are on lines missing from this listing.
 */
3381 static int rtnl_bridge_dellink(struct sk_buff
*skb
, struct nlmsghdr
*nlh
)
3383 struct net
*net
= sock_net(skb
->sk
);
3384 struct ifinfomsg
*ifm
;
3385 struct net_device
*dev
;
3386 struct nlattr
*br_spec
, *attr
= NULL
;
3387 int rem
, err
= -EOPNOTSUPP
;
3389 bool have_flags
= false;
3391 if (nlmsg_len(nlh
) < sizeof(*ifm
))
3394 ifm
= nlmsg_data(nlh
);
3395 if (ifm
->ifi_family
!= AF_BRIDGE
)
3396 return -EPFNOSUPPORT
;
3398 dev
= __dev_get_by_index(net
, ifm
->ifi_index
);
3400 pr_info("PF_BRIDGE: RTM_DELLINK with unknown ifindex\n");
3404 br_spec
= nlmsg_find_attr(nlh
, sizeof(struct ifinfomsg
), IFLA_AF_SPEC
);
3406 nla_for_each_nested(attr
, br_spec
, rem
) {
3407 if (nla_type(attr
) == IFLA_BRIDGE_FLAGS
) {
3408 if (nla_len(attr
) < sizeof(flags
))
3412 flags
= nla_get_u16(attr
);
3418 if (!flags
|| (flags
& BRIDGE_FLAGS_MASTER
)) {
3419 struct net_device
*br_dev
= netdev_master_upper_dev_get(dev
);
3421 if (!br_dev
|| !br_dev
->netdev_ops
->ndo_bridge_dellink
) {
3426 err
= br_dev
->netdev_ops
->ndo_bridge_dellink(dev
, nlh
, flags
);
3430 flags
&= ~BRIDGE_FLAGS_MASTER
;
3433 if ((flags
& BRIDGE_FLAGS_SELF
)) {
3434 if (!dev
->netdev_ops
->ndo_bridge_dellink
)
3437 err
= dev
->netdev_ops
->ndo_bridge_dellink(dev
, nlh
,
3441 flags
&= ~BRIDGE_FLAGS_SELF
;
3443 /* Generate event to notify upper layer of bridge
3446 err
= rtnl_bridge_notify(dev
);
3451 memcpy(nla_data(attr
), &flags
, sizeof(flags
));
3456 /* Process one rtnetlink message. */
/*
 * rtnetlink_rcv_msg - dispatch a single rtnetlink request to its registered
 * handler.
 *
 * Visible steps:
 *   - the message type is read from nlh->nlmsg_type and the payload must be
 *     at least sizeof(struct rtgenmsg), from which the family is read;
 *   - every request whose kind is not 2 requires CAP_NET_ADMIN, checked with
 *     netlink_net_capable();
 *   - kind == 2 combined with NLM_F_DUMP takes the dump path: the dumpit and
 *     optional calcit callbacks are looked up for (family, type), calcit
 *     supplies min_dump_alloc, and netlink_dump_start() runs the dump;
 *   - everything else is handed to the doit callback found by
 *     rtnl_get_doit().
 *
 * NOTE(review): the computation of "kind" (presumably the low bits of the
 * message type, with 2 meaning a GET request), the range checks on type and
 * the error returns are on lines missing from this listing - confirm.
 */
3458 static int rtnetlink_rcv_msg(struct sk_buff
*skb
, struct nlmsghdr
*nlh
)
3460 struct net
*net
= sock_net(skb
->sk
);
3461 rtnl_doit_func doit
;
3467 type
= nlh
->nlmsg_type
;
3473 /* All the messages must have at least 1 byte length */
3474 if (nlmsg_len(nlh
) < sizeof(struct rtgenmsg
))
3477 family
= ((struct rtgenmsg
*)nlmsg_data(nlh
))->rtgen_family
;
3480 if (kind
!= 2 && !netlink_net_capable(skb
, CAP_NET_ADMIN
))
3483 if (kind
== 2 && nlh
->nlmsg_flags
&NLM_F_DUMP
) {
3485 rtnl_dumpit_func dumpit
;
3486 rtnl_calcit_func calcit
;
3487 u16 min_dump_alloc
= 0;
3489 dumpit
= rtnl_get_dumpit(family
, type
);
3492 calcit
= rtnl_get_calcit(family
, type
);
3494 min_dump_alloc
= calcit(skb
, nlh
);
3499 struct netlink_dump_control c
= {
3501 .min_dump_alloc
= min_dump_alloc
,
3503 err
= netlink_dump_start(rtnl
, skb
, nlh
, &c
);
3509 doit
= rtnl_get_doit(family
, type
);
3513 return doit(skb
, nlh
);
/*
 * rtnetlink_rcv - input callback of the rtnetlink kernel socket (installed
 * as cfg.input in rtnetlink_net_init()).
 *
 * Hands the received buffer to netlink_rcv_skb(), which calls
 * rtnetlink_rcv_msg() for the messages it contains.
 *
 * NOTE(review): any locking around this call is on lines missing from this
 * listing.
 */
3516 static void rtnetlink_rcv(struct sk_buff
*skb
)
3519 netlink_rcv_skb(skb
, &rtnetlink_rcv_msg
);
/*
 * rtnetlink_event - netdevice notifier callback (installed through
 * rtnetlink_dev_notifier).
 *
 * The device is recovered from the notifier payload with
 * netdev_notifier_info_to_dev(). The listed NETDEV_* events share one switch
 * arm, and rtmsg_ifinfo(RTM_NEWLINK, dev, 0, GFP_KERNEL) announces a link
 * update.
 *
 * NOTE(review): the switch statement, several case labels, the break and
 * default lines and the return value are missing from this listing;
 * presumably the listed events are the ones that do NOT trigger the
 * RTM_NEWLINK message - confirm.
 */
3523 static int rtnetlink_event(struct notifier_block
*this, unsigned long event
, void *ptr
)
3525 struct net_device
*dev
= netdev_notifier_info_to_dev(ptr
);
3531 case NETDEV_POST_INIT
:
3532 case NETDEV_REGISTER
:
3534 case NETDEV_PRE_TYPE_CHANGE
:
3535 case NETDEV_GOING_DOWN
:
3536 case NETDEV_UNREGISTER
:
3537 case NETDEV_UNREGISTER_FINAL
:
3538 case NETDEV_RELEASE
:
3540 case NETDEV_BONDING_INFO
:
3543 rtmsg_ifinfo(RTM_NEWLINK
, dev
, 0, GFP_KERNEL
);
/*
 * Notifier block that routes netdevice events to rtnetlink_event(); it is
 * registered in rtnetlink_init() via register_netdevice_notifier().
 */
3549 static struct notifier_block rtnetlink_dev_notifier
= {
3550 .notifier_call
= rtnetlink_event
,
/*
 * rtnetlink_net_init - per-namespace setup: create the NETLINK_ROUTE kernel
 * socket for @net.
 *
 * Socket configuration:
 *   .groups   - RTNLGRP_MAX multicast groups;
 *   .input    - rtnetlink_rcv() receives incoming buffers;
 *   .cb_mutex - the rtnl mutex itself, so netlink's callback mutex is the
 *               same lock that rtnl_lock() takes;
 *   .flags    - NL_CFG_F_NONROOT_RECV.
 *
 * NOTE(review): the check of the netlink_kernel_create() result, the store
 * into net->rtnl and the return value are on lines missing from this
 * listing.
 */
3554 static int __net_init
rtnetlink_net_init(struct net
*net
)
3557 struct netlink_kernel_cfg cfg
= {
3558 .groups
= RTNLGRP_MAX
,
3559 .input
= rtnetlink_rcv
,
3560 .cb_mutex
= &rtnl_mutex
,
3561 .flags
= NL_CFG_F_NONROOT_RECV
,
3564 sk
= netlink_kernel_create(net
, NETLINK_ROUTE
, &cfg
);
/*
 * rtnetlink_net_exit - per-namespace teardown: release the rtnetlink kernel
 * socket stored in net->rtnl.
 */
3571 static void __net_exit
rtnetlink_net_exit(struct net
*net
)
3573 netlink_kernel_release(net
->rtnl
);
/*
 * Per-network-namespace hooks for rtnetlink: rtnetlink_net_init() and
 * rtnetlink_net_exit(). Registered in rtnetlink_init() via
 * register_pernet_subsys().
 */
3577 static struct pernet_operations rtnetlink_net_ops
= {
3578 .init
= rtnetlink_net_init
,
3579 .exit
= rtnetlink_net_exit
,
3582 void __init
rtnetlink_init(void)
3584 if (register_pernet_subsys(&rtnetlink_net_ops
))
3585 panic("rtnetlink_init: cannot initialize rtnetlink\n");
3587 register_netdevice_notifier(&rtnetlink_dev_notifier
);
3589 rtnl_register(PF_UNSPEC
, RTM_GETLINK
, rtnl_getlink
,
3590 rtnl_dump_ifinfo
, rtnl_calcit
);
3591 rtnl_register(PF_UNSPEC
, RTM_SETLINK
, rtnl_setlink
, NULL
, NULL
);
3592 rtnl_register(PF_UNSPEC
, RTM_NEWLINK
, rtnl_newlink
, NULL
, NULL
);
3593 rtnl_register(PF_UNSPEC
, RTM_DELLINK
, rtnl_dellink
, NULL
, NULL
);
3595 rtnl_register(PF_UNSPEC
, RTM_GETADDR
, NULL
, rtnl_dump_all
, NULL
);
3596 rtnl_register(PF_UNSPEC
, RTM_GETROUTE
, NULL
, rtnl_dump_all
, NULL
);
3598 rtnl_register(PF_BRIDGE
, RTM_NEWNEIGH
, rtnl_fdb_add
, NULL
, NULL
);
3599 rtnl_register(PF_BRIDGE
, RTM_DELNEIGH
, rtnl_fdb_del
, NULL
, NULL
);
3600 rtnl_register(PF_BRIDGE
, RTM_GETNEIGH
, NULL
, rtnl_fdb_dump
, NULL
);
3602 rtnl_register(PF_BRIDGE
, RTM_GETLINK
, NULL
, rtnl_bridge_getlink
, NULL
);
3603 rtnl_register(PF_BRIDGE
, RTM_DELLINK
, rtnl_bridge_dellink
, NULL
, NULL
);
3604 rtnl_register(PF_BRIDGE
, RTM_SETLINK
, rtnl_bridge_setlink
, NULL
, NULL
);