2 * INET An implementation of the TCP/IP protocol suite for the LINUX
3 * operating system. INET is implemented using the BSD Socket
4 * interface as the means of communication with the user level.
6 * Routing netlink socket interface: protocol independent part.
8 * Authors: Alexey Kuznetsov, <kuznet@ms2.inr.ac.ru>
10 * This program is free software; you can redistribute it and/or
11 * modify it under the terms of the GNU General Public License
12 * as published by the Free Software Foundation; either version
13 * 2 of the License, or (at your option) any later version.
16 * Vitaly E. Lavrov RTA_OK arithmetics was wrong.
19 #include <linux/errno.h>
20 #include <linux/module.h>
21 #include <linux/types.h>
22 #include <linux/socket.h>
23 #include <linux/kernel.h>
24 #include <linux/timer.h>
25 #include <linux/string.h>
26 #include <linux/sockios.h>
27 #include <linux/net.h>
28 #include <linux/fcntl.h>
30 #include <linux/slab.h>
31 #include <linux/interrupt.h>
32 #include <linux/capability.h>
33 #include <linux/skbuff.h>
34 #include <linux/init.h>
35 #include <linux/security.h>
36 #include <linux/mutex.h>
37 #include <linux/if_addr.h>
38 #include <linux/if_bridge.h>
39 #include <linux/pci.h>
40 #include <linux/etherdevice.h>
42 #include <asm/uaccess.h>
44 #include <linux/inet.h>
45 #include <linux/netdevice.h>
47 #include <net/protocol.h>
49 #include <net/route.h>
52 #include <net/pkt_sched.h>
53 #include <net/fib_rules.h>
54 #include <net/rtnetlink.h>
55 #include <net/net_namespace.h>
59 rtnl_dumpit_func dumpit
;
60 rtnl_calcit_func calcit
;
63 static DEFINE_MUTEX(rtnl_mutex
);
67 mutex_lock(&rtnl_mutex
);
69 EXPORT_SYMBOL(rtnl_lock
);
71 void __rtnl_unlock(void)
73 mutex_unlock(&rtnl_mutex
);
76 void rtnl_unlock(void)
78 /* This fellow will unlock it for us. */
81 EXPORT_SYMBOL(rtnl_unlock
);
83 int rtnl_trylock(void)
85 return mutex_trylock(&rtnl_mutex
);
87 EXPORT_SYMBOL(rtnl_trylock
);
89 int rtnl_is_locked(void)
91 return mutex_is_locked(&rtnl_mutex
);
93 EXPORT_SYMBOL(rtnl_is_locked
);
95 #ifdef CONFIG_PROVE_LOCKING
96 int lockdep_rtnl_is_held(void)
98 return lockdep_is_held(&rtnl_mutex
);
100 EXPORT_SYMBOL(lockdep_rtnl_is_held
);
101 #endif /* #ifdef CONFIG_PROVE_LOCKING */
103 static struct rtnl_link
*rtnl_msg_handlers
[RTNL_FAMILY_MAX
+ 1];
105 static inline int rtm_msgindex(int msgtype
)
107 int msgindex
= msgtype
- RTM_BASE
;
110 * msgindex < 0 implies someone tried to register a netlink
111 * control code. msgindex >= RTM_NR_MSGTYPES may indicate that
112 * the message type has not been added to linux/rtnetlink.h
114 BUG_ON(msgindex
< 0 || msgindex
>= RTM_NR_MSGTYPES
);
119 static rtnl_doit_func
rtnl_get_doit(int protocol
, int msgindex
)
121 struct rtnl_link
*tab
;
123 if (protocol
<= RTNL_FAMILY_MAX
)
124 tab
= rtnl_msg_handlers
[protocol
];
128 if (tab
== NULL
|| tab
[msgindex
].doit
== NULL
)
129 tab
= rtnl_msg_handlers
[PF_UNSPEC
];
131 return tab
[msgindex
].doit
;
134 static rtnl_dumpit_func
rtnl_get_dumpit(int protocol
, int msgindex
)
136 struct rtnl_link
*tab
;
138 if (protocol
<= RTNL_FAMILY_MAX
)
139 tab
= rtnl_msg_handlers
[protocol
];
143 if (tab
== NULL
|| tab
[msgindex
].dumpit
== NULL
)
144 tab
= rtnl_msg_handlers
[PF_UNSPEC
];
146 return tab
[msgindex
].dumpit
;
149 static rtnl_calcit_func
rtnl_get_calcit(int protocol
, int msgindex
)
151 struct rtnl_link
*tab
;
153 if (protocol
<= RTNL_FAMILY_MAX
)
154 tab
= rtnl_msg_handlers
[protocol
];
158 if (tab
== NULL
|| tab
[msgindex
].calcit
== NULL
)
159 tab
= rtnl_msg_handlers
[PF_UNSPEC
];
161 return tab
[msgindex
].calcit
;
165 * __rtnl_register - Register a rtnetlink message type
166 * @protocol: Protocol family or PF_UNSPEC
167 * @msgtype: rtnetlink message type
168 * @doit: Function pointer called for each request message
169 * @dumpit: Function pointer called for each dump request (NLM_F_DUMP) message
170 * @calcit: Function pointer to calc size of dump message
172 * Registers the specified function pointers (at least one of them has
173 * to be non-NULL) to be called whenever a request message for the
174 * specified protocol family and message type is received.
176 * The special protocol family PF_UNSPEC may be used to define fallback
177 * function pointers for the case when no entry for the specific protocol
180 * Returns 0 on success or a negative error code.
182 int __rtnl_register(int protocol
, int msgtype
,
183 rtnl_doit_func doit
, rtnl_dumpit_func dumpit
,
184 rtnl_calcit_func calcit
)
186 struct rtnl_link
*tab
;
189 BUG_ON(protocol
< 0 || protocol
> RTNL_FAMILY_MAX
);
190 msgindex
= rtm_msgindex(msgtype
);
192 tab
= rtnl_msg_handlers
[protocol
];
194 tab
= kcalloc(RTM_NR_MSGTYPES
, sizeof(*tab
), GFP_KERNEL
);
198 rtnl_msg_handlers
[protocol
] = tab
;
202 tab
[msgindex
].doit
= doit
;
205 tab
[msgindex
].dumpit
= dumpit
;
208 tab
[msgindex
].calcit
= calcit
;
212 EXPORT_SYMBOL_GPL(__rtnl_register
);
215 * rtnl_register - Register a rtnetlink message type
217 * Identical to __rtnl_register() but panics on failure. This is useful
218 * as failure of this function is very unlikely, it can only happen due
219 * to lack of memory when allocating the chain to store all message
220 * handlers for a protocol. Meant for use in init functions where lack
221 * of memory implies no sense in continuing.
223 void rtnl_register(int protocol
, int msgtype
,
224 rtnl_doit_func doit
, rtnl_dumpit_func dumpit
,
225 rtnl_calcit_func calcit
)
227 if (__rtnl_register(protocol
, msgtype
, doit
, dumpit
, calcit
) < 0)
228 panic("Unable to register rtnetlink message handler, "
229 "protocol = %d, message type = %d\n",
232 EXPORT_SYMBOL_GPL(rtnl_register
);
235 * rtnl_unregister - Unregister a rtnetlink message type
236 * @protocol: Protocol family or PF_UNSPEC
237 * @msgtype: rtnetlink message type
239 * Returns 0 on success or a negative error code.
241 int rtnl_unregister(int protocol
, int msgtype
)
245 BUG_ON(protocol
< 0 || protocol
> RTNL_FAMILY_MAX
);
246 msgindex
= rtm_msgindex(msgtype
);
248 if (rtnl_msg_handlers
[protocol
] == NULL
)
251 rtnl_msg_handlers
[protocol
][msgindex
].doit
= NULL
;
252 rtnl_msg_handlers
[protocol
][msgindex
].dumpit
= NULL
;
256 EXPORT_SYMBOL_GPL(rtnl_unregister
);
259 * rtnl_unregister_all - Unregister all rtnetlink message type of a protocol
260 * @protocol : Protocol family or PF_UNSPEC
262 * Identical to calling rtnl_unregster() for all registered message types
263 * of a certain protocol family.
265 void rtnl_unregister_all(int protocol
)
267 BUG_ON(protocol
< 0 || protocol
> RTNL_FAMILY_MAX
);
269 kfree(rtnl_msg_handlers
[protocol
]);
270 rtnl_msg_handlers
[protocol
] = NULL
;
272 EXPORT_SYMBOL_GPL(rtnl_unregister_all
);
274 static LIST_HEAD(link_ops
);
276 static const struct rtnl_link_ops
*rtnl_link_ops_get(const char *kind
)
278 const struct rtnl_link_ops
*ops
;
280 list_for_each_entry(ops
, &link_ops
, list
) {
281 if (!strcmp(ops
->kind
, kind
))
288 * __rtnl_link_register - Register rtnl_link_ops with rtnetlink.
289 * @ops: struct rtnl_link_ops * to register
291 * The caller must hold the rtnl_mutex. This function should be used
292 * by drivers that create devices during module initialization. It
293 * must be called before registering the devices.
295 * Returns 0 on success or a negative error code.
297 int __rtnl_link_register(struct rtnl_link_ops
*ops
)
299 if (rtnl_link_ops_get(ops
->kind
))
302 /* The check for setup is here because if ops
303 * does not have that filled up, it is not possible
304 * to use the ops for creating device. So do not
305 * fill up dellink as well. That disables rtnl_dellink.
307 if (ops
->setup
&& !ops
->dellink
)
308 ops
->dellink
= unregister_netdevice_queue
;
310 list_add_tail(&ops
->list
, &link_ops
);
313 EXPORT_SYMBOL_GPL(__rtnl_link_register
);
316 * rtnl_link_register - Register rtnl_link_ops with rtnetlink.
317 * @ops: struct rtnl_link_ops * to register
319 * Returns 0 on success or a negative error code.
321 int rtnl_link_register(struct rtnl_link_ops
*ops
)
326 err
= __rtnl_link_register(ops
);
330 EXPORT_SYMBOL_GPL(rtnl_link_register
);
332 static void __rtnl_kill_links(struct net
*net
, struct rtnl_link_ops
*ops
)
334 struct net_device
*dev
;
335 LIST_HEAD(list_kill
);
337 for_each_netdev(net
, dev
) {
338 if (dev
->rtnl_link_ops
== ops
)
339 ops
->dellink(dev
, &list_kill
);
341 unregister_netdevice_many(&list_kill
);
345 * __rtnl_link_unregister - Unregister rtnl_link_ops from rtnetlink.
346 * @ops: struct rtnl_link_ops * to unregister
348 * The caller must hold the rtnl_mutex.
350 void __rtnl_link_unregister(struct rtnl_link_ops
*ops
)
355 __rtnl_kill_links(net
, ops
);
357 list_del(&ops
->list
);
359 EXPORT_SYMBOL_GPL(__rtnl_link_unregister
);
361 /* Return with the rtnl_lock held when there are no network
362 * devices unregistering in any network namespace.
364 static void rtnl_lock_unregistering_all(void)
371 prepare_to_wait(&netdev_unregistering_wq
, &wait
,
372 TASK_UNINTERRUPTIBLE
);
373 unregistering
= false;
376 if (net
->dev_unreg_count
> 0) {
377 unregistering
= true;
386 finish_wait(&netdev_unregistering_wq
, &wait
);
390 * rtnl_link_unregister - Unregister rtnl_link_ops from rtnetlink.
391 * @ops: struct rtnl_link_ops * to unregister
393 void rtnl_link_unregister(struct rtnl_link_ops
*ops
)
395 /* Close the race with cleanup_net() */
396 mutex_lock(&net_mutex
);
397 rtnl_lock_unregistering_all();
398 __rtnl_link_unregister(ops
);
400 mutex_unlock(&net_mutex
);
402 EXPORT_SYMBOL_GPL(rtnl_link_unregister
);
404 static size_t rtnl_link_get_slave_info_data_size(const struct net_device
*dev
)
406 struct net_device
*master_dev
;
407 const struct rtnl_link_ops
*ops
;
409 master_dev
= netdev_master_upper_dev_get((struct net_device
*) dev
);
412 ops
= master_dev
->rtnl_link_ops
;
413 if (!ops
|| !ops
->get_slave_size
)
415 /* IFLA_INFO_SLAVE_DATA + nested data */
416 return nla_total_size(sizeof(struct nlattr
)) +
417 ops
->get_slave_size(master_dev
, dev
);
420 static size_t rtnl_link_get_size(const struct net_device
*dev
)
422 const struct rtnl_link_ops
*ops
= dev
->rtnl_link_ops
;
428 size
= nla_total_size(sizeof(struct nlattr
)) + /* IFLA_LINKINFO */
429 nla_total_size(strlen(ops
->kind
) + 1); /* IFLA_INFO_KIND */
432 /* IFLA_INFO_DATA + nested data */
433 size
+= nla_total_size(sizeof(struct nlattr
)) +
436 if (ops
->get_xstats_size
)
437 /* IFLA_INFO_XSTATS */
438 size
+= nla_total_size(ops
->get_xstats_size(dev
));
440 size
+= rtnl_link_get_slave_info_data_size(dev
);
445 static LIST_HEAD(rtnl_af_ops
);
447 static const struct rtnl_af_ops
*rtnl_af_lookup(const int family
)
449 const struct rtnl_af_ops
*ops
;
451 list_for_each_entry(ops
, &rtnl_af_ops
, list
) {
452 if (ops
->family
== family
)
460 * rtnl_af_register - Register rtnl_af_ops with rtnetlink.
461 * @ops: struct rtnl_af_ops * to register
463 * Returns 0 on success or a negative error code.
465 void rtnl_af_register(struct rtnl_af_ops
*ops
)
468 list_add_tail(&ops
->list
, &rtnl_af_ops
);
471 EXPORT_SYMBOL_GPL(rtnl_af_register
);
474 * __rtnl_af_unregister - Unregister rtnl_af_ops from rtnetlink.
475 * @ops: struct rtnl_af_ops * to unregister
477 * The caller must hold the rtnl_mutex.
479 void __rtnl_af_unregister(struct rtnl_af_ops
*ops
)
481 list_del(&ops
->list
);
483 EXPORT_SYMBOL_GPL(__rtnl_af_unregister
);
486 * rtnl_af_unregister - Unregister rtnl_af_ops from rtnetlink.
487 * @ops: struct rtnl_af_ops * to unregister
489 void rtnl_af_unregister(struct rtnl_af_ops
*ops
)
492 __rtnl_af_unregister(ops
);
495 EXPORT_SYMBOL_GPL(rtnl_af_unregister
);
497 static size_t rtnl_link_get_af_size(const struct net_device
*dev
)
499 struct rtnl_af_ops
*af_ops
;
503 size
= nla_total_size(sizeof(struct nlattr
));
505 list_for_each_entry(af_ops
, &rtnl_af_ops
, list
) {
506 if (af_ops
->get_link_af_size
) {
507 /* AF_* + nested data */
508 size
+= nla_total_size(sizeof(struct nlattr
)) +
509 af_ops
->get_link_af_size(dev
);
516 static bool rtnl_have_link_slave_info(const struct net_device
*dev
)
518 struct net_device
*master_dev
;
520 master_dev
= netdev_master_upper_dev_get((struct net_device
*) dev
);
521 if (master_dev
&& master_dev
->rtnl_link_ops
)
526 static int rtnl_link_slave_info_fill(struct sk_buff
*skb
,
527 const struct net_device
*dev
)
529 struct net_device
*master_dev
;
530 const struct rtnl_link_ops
*ops
;
531 struct nlattr
*slave_data
;
534 master_dev
= netdev_master_upper_dev_get((struct net_device
*) dev
);
537 ops
= master_dev
->rtnl_link_ops
;
540 if (nla_put_string(skb
, IFLA_INFO_SLAVE_KIND
, ops
->kind
) < 0)
542 if (ops
->fill_slave_info
) {
543 slave_data
= nla_nest_start(skb
, IFLA_INFO_SLAVE_DATA
);
546 err
= ops
->fill_slave_info(skb
, master_dev
, dev
);
548 goto err_cancel_slave_data
;
549 nla_nest_end(skb
, slave_data
);
553 err_cancel_slave_data
:
554 nla_nest_cancel(skb
, slave_data
);
558 static int rtnl_link_info_fill(struct sk_buff
*skb
,
559 const struct net_device
*dev
)
561 const struct rtnl_link_ops
*ops
= dev
->rtnl_link_ops
;
567 if (nla_put_string(skb
, IFLA_INFO_KIND
, ops
->kind
) < 0)
569 if (ops
->fill_xstats
) {
570 err
= ops
->fill_xstats(skb
, dev
);
574 if (ops
->fill_info
) {
575 data
= nla_nest_start(skb
, IFLA_INFO_DATA
);
578 err
= ops
->fill_info(skb
, dev
);
580 goto err_cancel_data
;
581 nla_nest_end(skb
, data
);
586 nla_nest_cancel(skb
, data
);
590 static int rtnl_link_fill(struct sk_buff
*skb
, const struct net_device
*dev
)
592 struct nlattr
*linkinfo
;
595 linkinfo
= nla_nest_start(skb
, IFLA_LINKINFO
);
596 if (linkinfo
== NULL
)
599 err
= rtnl_link_info_fill(skb
, dev
);
601 goto err_cancel_link
;
603 err
= rtnl_link_slave_info_fill(skb
, dev
);
605 goto err_cancel_link
;
607 nla_nest_end(skb
, linkinfo
);
611 nla_nest_cancel(skb
, linkinfo
);
616 int rtnetlink_send(struct sk_buff
*skb
, struct net
*net
, u32 pid
, unsigned int group
, int echo
)
618 struct sock
*rtnl
= net
->rtnl
;
621 NETLINK_CB(skb
).dst_group
= group
;
623 atomic_inc(&skb
->users
);
624 netlink_broadcast(rtnl
, skb
, pid
, group
, GFP_KERNEL
);
626 err
= netlink_unicast(rtnl
, skb
, pid
, MSG_DONTWAIT
);
630 int rtnl_unicast(struct sk_buff
*skb
, struct net
*net
, u32 pid
)
632 struct sock
*rtnl
= net
->rtnl
;
634 return nlmsg_unicast(rtnl
, skb
, pid
);
636 EXPORT_SYMBOL(rtnl_unicast
);
638 void rtnl_notify(struct sk_buff
*skb
, struct net
*net
, u32 pid
, u32 group
,
639 struct nlmsghdr
*nlh
, gfp_t flags
)
641 struct sock
*rtnl
= net
->rtnl
;
645 report
= nlmsg_report(nlh
);
647 nlmsg_notify(rtnl
, skb
, pid
, group
, report
, flags
);
649 EXPORT_SYMBOL(rtnl_notify
);
651 void rtnl_set_sk_err(struct net
*net
, u32 group
, int error
)
653 struct sock
*rtnl
= net
->rtnl
;
655 netlink_set_err(rtnl
, 0, group
, error
);
657 EXPORT_SYMBOL(rtnl_set_sk_err
);
659 int rtnetlink_put_metrics(struct sk_buff
*skb
, u32
*metrics
)
664 mx
= nla_nest_start(skb
, RTA_METRICS
);
668 for (i
= 0; i
< RTAX_MAX
; i
++) {
671 if (nla_put_u32(skb
, i
+1, metrics
[i
]))
672 goto nla_put_failure
;
677 nla_nest_cancel(skb
, mx
);
681 return nla_nest_end(skb
, mx
);
684 nla_nest_cancel(skb
, mx
);
687 EXPORT_SYMBOL(rtnetlink_put_metrics
);
689 int rtnl_put_cacheinfo(struct sk_buff
*skb
, struct dst_entry
*dst
, u32 id
,
690 long expires
, u32 error
)
692 struct rta_cacheinfo ci
= {
693 .rta_lastuse
= jiffies_delta_to_clock_t(jiffies
- dst
->lastuse
),
694 .rta_used
= dst
->__use
,
695 .rta_clntref
= atomic_read(&(dst
->__refcnt
)),
703 clock
= jiffies_to_clock_t(abs(expires
));
704 clock
= min_t(unsigned long, clock
, INT_MAX
);
705 ci
.rta_expires
= (expires
> 0) ? clock
: -clock
;
707 return nla_put(skb
, RTA_CACHEINFO
, sizeof(ci
), &ci
);
709 EXPORT_SYMBOL_GPL(rtnl_put_cacheinfo
);
711 static void set_operstate(struct net_device
*dev
, unsigned char transition
)
713 unsigned char operstate
= dev
->operstate
;
715 switch (transition
) {
717 if ((operstate
== IF_OPER_DORMANT
||
718 operstate
== IF_OPER_UNKNOWN
) &&
720 operstate
= IF_OPER_UP
;
723 case IF_OPER_DORMANT
:
724 if (operstate
== IF_OPER_UP
||
725 operstate
== IF_OPER_UNKNOWN
)
726 operstate
= IF_OPER_DORMANT
;
730 if (dev
->operstate
!= operstate
) {
731 write_lock_bh(&dev_base_lock
);
732 dev
->operstate
= operstate
;
733 write_unlock_bh(&dev_base_lock
);
734 netdev_state_change(dev
);
738 static unsigned int rtnl_dev_get_flags(const struct net_device
*dev
)
740 return (dev
->flags
& ~(IFF_PROMISC
| IFF_ALLMULTI
)) |
741 (dev
->gflags
& (IFF_PROMISC
| IFF_ALLMULTI
));
744 static unsigned int rtnl_dev_combine_flags(const struct net_device
*dev
,
745 const struct ifinfomsg
*ifm
)
747 unsigned int flags
= ifm
->ifi_flags
;
749 /* bugwards compatibility: ifi_change == 0 is treated as ~0 */
751 flags
= (flags
& ifm
->ifi_change
) |
752 (rtnl_dev_get_flags(dev
) & ~ifm
->ifi_change
);
757 static void copy_rtnl_link_stats(struct rtnl_link_stats
*a
,
758 const struct rtnl_link_stats64
*b
)
760 a
->rx_packets
= b
->rx_packets
;
761 a
->tx_packets
= b
->tx_packets
;
762 a
->rx_bytes
= b
->rx_bytes
;
763 a
->tx_bytes
= b
->tx_bytes
;
764 a
->rx_errors
= b
->rx_errors
;
765 a
->tx_errors
= b
->tx_errors
;
766 a
->rx_dropped
= b
->rx_dropped
;
767 a
->tx_dropped
= b
->tx_dropped
;
769 a
->multicast
= b
->multicast
;
770 a
->collisions
= b
->collisions
;
772 a
->rx_length_errors
= b
->rx_length_errors
;
773 a
->rx_over_errors
= b
->rx_over_errors
;
774 a
->rx_crc_errors
= b
->rx_crc_errors
;
775 a
->rx_frame_errors
= b
->rx_frame_errors
;
776 a
->rx_fifo_errors
= b
->rx_fifo_errors
;
777 a
->rx_missed_errors
= b
->rx_missed_errors
;
779 a
->tx_aborted_errors
= b
->tx_aborted_errors
;
780 a
->tx_carrier_errors
= b
->tx_carrier_errors
;
781 a
->tx_fifo_errors
= b
->tx_fifo_errors
;
782 a
->tx_heartbeat_errors
= b
->tx_heartbeat_errors
;
783 a
->tx_window_errors
= b
->tx_window_errors
;
785 a
->rx_compressed
= b
->rx_compressed
;
786 a
->tx_compressed
= b
->tx_compressed
;
789 static void copy_rtnl_link_stats64(void *v
, const struct rtnl_link_stats64
*b
)
791 memcpy(v
, b
, sizeof(*b
));
795 static inline int rtnl_vfinfo_size(const struct net_device
*dev
,
798 if (dev
->dev
.parent
&& dev_is_pci(dev
->dev
.parent
) &&
799 (ext_filter_mask
& RTEXT_FILTER_VF
)) {
800 int num_vfs
= dev_num_vf(dev
->dev
.parent
);
801 size_t size
= nla_total_size(sizeof(struct nlattr
));
802 size
+= nla_total_size(num_vfs
* sizeof(struct nlattr
));
804 (nla_total_size(sizeof(struct ifla_vf_mac
)) +
805 nla_total_size(sizeof(struct ifla_vf_vlan
)) +
806 nla_total_size(sizeof(struct ifla_vf_spoofchk
)) +
807 nla_total_size(sizeof(struct ifla_vf_rate
)));
813 static size_t rtnl_port_size(const struct net_device
*dev
,
816 size_t port_size
= nla_total_size(4) /* PORT_VF */
817 + nla_total_size(PORT_PROFILE_MAX
) /* PORT_PROFILE */
818 + nla_total_size(sizeof(struct ifla_port_vsi
))
820 + nla_total_size(PORT_UUID_MAX
) /* PORT_INSTANCE_UUID */
821 + nla_total_size(PORT_UUID_MAX
) /* PORT_HOST_UUID */
822 + nla_total_size(1) /* PROT_VDP_REQUEST */
823 + nla_total_size(2); /* PORT_VDP_RESPONSE */
824 size_t vf_ports_size
= nla_total_size(sizeof(struct nlattr
));
825 size_t vf_port_size
= nla_total_size(sizeof(struct nlattr
))
827 size_t port_self_size
= nla_total_size(sizeof(struct nlattr
))
830 if (!dev
->netdev_ops
->ndo_get_vf_port
|| !dev
->dev
.parent
||
831 !(ext_filter_mask
& RTEXT_FILTER_VF
))
833 if (dev_num_vf(dev
->dev
.parent
))
834 return port_self_size
+ vf_ports_size
+
835 vf_port_size
* dev_num_vf(dev
->dev
.parent
);
837 return port_self_size
;
840 static noinline
size_t if_nlmsg_size(const struct net_device
*dev
,
843 return NLMSG_ALIGN(sizeof(struct ifinfomsg
))
844 + nla_total_size(IFNAMSIZ
) /* IFLA_IFNAME */
845 + nla_total_size(IFALIASZ
) /* IFLA_IFALIAS */
846 + nla_total_size(IFNAMSIZ
) /* IFLA_QDISC */
847 + nla_total_size(sizeof(struct rtnl_link_ifmap
))
848 + nla_total_size(sizeof(struct rtnl_link_stats
))
849 + nla_total_size(sizeof(struct rtnl_link_stats64
))
850 + nla_total_size(MAX_ADDR_LEN
) /* IFLA_ADDRESS */
851 + nla_total_size(MAX_ADDR_LEN
) /* IFLA_BROADCAST */
852 + nla_total_size(4) /* IFLA_TXQLEN */
853 + nla_total_size(4) /* IFLA_WEIGHT */
854 + nla_total_size(4) /* IFLA_MTU */
855 + nla_total_size(4) /* IFLA_LINK */
856 + nla_total_size(4) /* IFLA_MASTER */
857 + nla_total_size(1) /* IFLA_CARRIER */
858 + nla_total_size(4) /* IFLA_PROMISCUITY */
859 + nla_total_size(4) /* IFLA_NUM_TX_QUEUES */
860 + nla_total_size(4) /* IFLA_NUM_RX_QUEUES */
861 + nla_total_size(1) /* IFLA_OPERSTATE */
862 + nla_total_size(1) /* IFLA_LINKMODE */
863 + nla_total_size(4) /* IFLA_CARRIER_CHANGES */
864 + nla_total_size(ext_filter_mask
865 & RTEXT_FILTER_VF
? 4 : 0) /* IFLA_NUM_VF */
866 + rtnl_vfinfo_size(dev
, ext_filter_mask
) /* IFLA_VFINFO_LIST */
867 + rtnl_port_size(dev
, ext_filter_mask
) /* IFLA_VF_PORTS + IFLA_PORT_SELF */
868 + rtnl_link_get_size(dev
) /* IFLA_LINKINFO */
869 + rtnl_link_get_af_size(dev
) /* IFLA_AF_SPEC */
870 + nla_total_size(MAX_PHYS_PORT_ID_LEN
); /* IFLA_PHYS_PORT_ID */
873 static int rtnl_vf_ports_fill(struct sk_buff
*skb
, struct net_device
*dev
)
875 struct nlattr
*vf_ports
;
876 struct nlattr
*vf_port
;
880 vf_ports
= nla_nest_start(skb
, IFLA_VF_PORTS
);
884 for (vf
= 0; vf
< dev_num_vf(dev
->dev
.parent
); vf
++) {
885 vf_port
= nla_nest_start(skb
, IFLA_VF_PORT
);
887 goto nla_put_failure
;
888 if (nla_put_u32(skb
, IFLA_PORT_VF
, vf
))
889 goto nla_put_failure
;
890 err
= dev
->netdev_ops
->ndo_get_vf_port(dev
, vf
, skb
);
891 if (err
== -EMSGSIZE
)
892 goto nla_put_failure
;
894 nla_nest_cancel(skb
, vf_port
);
897 nla_nest_end(skb
, vf_port
);
900 nla_nest_end(skb
, vf_ports
);
905 nla_nest_cancel(skb
, vf_ports
);
909 static int rtnl_port_self_fill(struct sk_buff
*skb
, struct net_device
*dev
)
911 struct nlattr
*port_self
;
914 port_self
= nla_nest_start(skb
, IFLA_PORT_SELF
);
918 err
= dev
->netdev_ops
->ndo_get_vf_port(dev
, PORT_SELF_VF
, skb
);
920 nla_nest_cancel(skb
, port_self
);
921 return (err
== -EMSGSIZE
) ? err
: 0;
924 nla_nest_end(skb
, port_self
);
929 static int rtnl_port_fill(struct sk_buff
*skb
, struct net_device
*dev
,
934 if (!dev
->netdev_ops
->ndo_get_vf_port
|| !dev
->dev
.parent
||
935 !(ext_filter_mask
& RTEXT_FILTER_VF
))
938 err
= rtnl_port_self_fill(skb
, dev
);
942 if (dev_num_vf(dev
->dev
.parent
)) {
943 err
= rtnl_vf_ports_fill(skb
, dev
);
951 static int rtnl_phys_port_id_fill(struct sk_buff
*skb
, struct net_device
*dev
)
954 struct netdev_phys_port_id ppid
;
956 err
= dev_get_phys_port_id(dev
, &ppid
);
958 if (err
== -EOPNOTSUPP
)
963 if (nla_put(skb
, IFLA_PHYS_PORT_ID
, ppid
.id_len
, ppid
.id
))
969 static int rtnl_fill_ifinfo(struct sk_buff
*skb
, struct net_device
*dev
,
970 int type
, u32 pid
, u32 seq
, u32 change
,
971 unsigned int flags
, u32 ext_filter_mask
)
973 struct ifinfomsg
*ifm
;
974 struct nlmsghdr
*nlh
;
975 struct rtnl_link_stats64 temp
;
976 const struct rtnl_link_stats64
*stats
;
977 struct nlattr
*attr
, *af_spec
;
978 struct rtnl_af_ops
*af_ops
;
979 struct net_device
*upper_dev
= netdev_master_upper_dev_get(dev
);
982 nlh
= nlmsg_put(skb
, pid
, seq
, type
, sizeof(*ifm
), flags
);
986 ifm
= nlmsg_data(nlh
);
987 ifm
->ifi_family
= AF_UNSPEC
;
989 ifm
->ifi_type
= dev
->type
;
990 ifm
->ifi_index
= dev
->ifindex
;
991 ifm
->ifi_flags
= dev_get_flags(dev
);
992 ifm
->ifi_change
= change
;
994 if (nla_put_string(skb
, IFLA_IFNAME
, dev
->name
) ||
995 nla_put_u32(skb
, IFLA_TXQLEN
, dev
->tx_queue_len
) ||
996 nla_put_u8(skb
, IFLA_OPERSTATE
,
997 netif_running(dev
) ? dev
->operstate
: IF_OPER_DOWN
) ||
998 nla_put_u8(skb
, IFLA_LINKMODE
, dev
->link_mode
) ||
999 nla_put_u32(skb
, IFLA_MTU
, dev
->mtu
) ||
1000 nla_put_u32(skb
, IFLA_GROUP
, dev
->group
) ||
1001 nla_put_u32(skb
, IFLA_PROMISCUITY
, dev
->promiscuity
) ||
1002 nla_put_u32(skb
, IFLA_NUM_TX_QUEUES
, dev
->num_tx_queues
) ||
1004 nla_put_u32(skb
, IFLA_NUM_RX_QUEUES
, dev
->num_rx_queues
) ||
1006 (dev
->ifindex
!= dev
->iflink
&&
1007 nla_put_u32(skb
, IFLA_LINK
, dev
->iflink
)) ||
1009 nla_put_u32(skb
, IFLA_MASTER
, upper_dev
->ifindex
)) ||
1010 nla_put_u8(skb
, IFLA_CARRIER
, netif_carrier_ok(dev
)) ||
1012 nla_put_string(skb
, IFLA_QDISC
, dev
->qdisc
->ops
->id
)) ||
1014 nla_put_string(skb
, IFLA_IFALIAS
, dev
->ifalias
)) ||
1015 nla_put_u32(skb
, IFLA_CARRIER_CHANGES
,
1016 atomic_read(&dev
->carrier_changes
)))
1017 goto nla_put_failure
;
1020 struct rtnl_link_ifmap map
= {
1021 .mem_start
= dev
->mem_start
,
1022 .mem_end
= dev
->mem_end
,
1023 .base_addr
= dev
->base_addr
,
1026 .port
= dev
->if_port
,
1028 if (nla_put(skb
, IFLA_MAP
, sizeof(map
), &map
))
1029 goto nla_put_failure
;
1032 if (dev
->addr_len
) {
1033 if (nla_put(skb
, IFLA_ADDRESS
, dev
->addr_len
, dev
->dev_addr
) ||
1034 nla_put(skb
, IFLA_BROADCAST
, dev
->addr_len
, dev
->broadcast
))
1035 goto nla_put_failure
;
1038 if (rtnl_phys_port_id_fill(skb
, dev
))
1039 goto nla_put_failure
;
1041 attr
= nla_reserve(skb
, IFLA_STATS
,
1042 sizeof(struct rtnl_link_stats
));
1044 goto nla_put_failure
;
1046 stats
= dev_get_stats(dev
, &temp
);
1047 copy_rtnl_link_stats(nla_data(attr
), stats
);
1049 attr
= nla_reserve(skb
, IFLA_STATS64
,
1050 sizeof(struct rtnl_link_stats64
));
1052 goto nla_put_failure
;
1053 copy_rtnl_link_stats64(nla_data(attr
), stats
);
1055 if (dev
->dev
.parent
&& (ext_filter_mask
& RTEXT_FILTER_VF
) &&
1056 nla_put_u32(skb
, IFLA_NUM_VF
, dev_num_vf(dev
->dev
.parent
)))
1057 goto nla_put_failure
;
1059 if (dev
->netdev_ops
->ndo_get_vf_config
&& dev
->dev
.parent
1060 && (ext_filter_mask
& RTEXT_FILTER_VF
)) {
1063 struct nlattr
*vfinfo
, *vf
;
1064 int num_vfs
= dev_num_vf(dev
->dev
.parent
);
1066 vfinfo
= nla_nest_start(skb
, IFLA_VFINFO_LIST
);
1068 goto nla_put_failure
;
1069 for (i
= 0; i
< num_vfs
; i
++) {
1070 struct ifla_vf_info ivi
;
1071 struct ifla_vf_mac vf_mac
;
1072 struct ifla_vf_vlan vf_vlan
;
1073 struct ifla_vf_rate vf_rate
;
1074 struct ifla_vf_tx_rate vf_tx_rate
;
1075 struct ifla_vf_spoofchk vf_spoofchk
;
1076 struct ifla_vf_link_state vf_linkstate
;
1079 * Not all SR-IOV capable drivers support the
1080 * spoofcheck query. Preset to -1 so the user
1081 * space tool can detect that the driver didn't
1085 memset(ivi
.mac
, 0, sizeof(ivi
.mac
));
1086 /* The default value for VF link state is "auto"
1087 * IFLA_VF_LINK_STATE_AUTO which equals zero
1090 if (dev
->netdev_ops
->ndo_get_vf_config(dev
, i
, &ivi
))
1097 vf_linkstate
.vf
= ivi
.vf
;
1099 memcpy(vf_mac
.mac
, ivi
.mac
, sizeof(ivi
.mac
));
1100 vf_vlan
.vlan
= ivi
.vlan
;
1101 vf_vlan
.qos
= ivi
.qos
;
1102 vf_tx_rate
.rate
= ivi
.max_tx_rate
;
1103 vf_rate
.min_tx_rate
= ivi
.min_tx_rate
;
1104 vf_rate
.max_tx_rate
= ivi
.max_tx_rate
;
1105 vf_spoofchk
.setting
= ivi
.spoofchk
;
1106 vf_linkstate
.link_state
= ivi
.linkstate
;
1107 vf
= nla_nest_start(skb
, IFLA_VF_INFO
);
1109 nla_nest_cancel(skb
, vfinfo
);
1110 goto nla_put_failure
;
1112 if (nla_put(skb
, IFLA_VF_MAC
, sizeof(vf_mac
), &vf_mac
) ||
1113 nla_put(skb
, IFLA_VF_VLAN
, sizeof(vf_vlan
), &vf_vlan
) ||
1114 nla_put(skb
, IFLA_VF_RATE
, sizeof(vf_rate
),
1116 nla_put(skb
, IFLA_VF_TX_RATE
, sizeof(vf_tx_rate
),
1118 nla_put(skb
, IFLA_VF_SPOOFCHK
, sizeof(vf_spoofchk
),
1120 nla_put(skb
, IFLA_VF_LINK_STATE
, sizeof(vf_linkstate
),
1122 goto nla_put_failure
;
1123 nla_nest_end(skb
, vf
);
1125 nla_nest_end(skb
, vfinfo
);
1128 if (rtnl_port_fill(skb
, dev
, ext_filter_mask
))
1129 goto nla_put_failure
;
1131 if (dev
->rtnl_link_ops
|| rtnl_have_link_slave_info(dev
)) {
1132 if (rtnl_link_fill(skb
, dev
) < 0)
1133 goto nla_put_failure
;
1136 if (!(af_spec
= nla_nest_start(skb
, IFLA_AF_SPEC
)))
1137 goto nla_put_failure
;
1139 list_for_each_entry(af_ops
, &rtnl_af_ops
, list
) {
1140 if (af_ops
->fill_link_af
) {
1144 if (!(af
= nla_nest_start(skb
, af_ops
->family
)))
1145 goto nla_put_failure
;
1147 err
= af_ops
->fill_link_af(skb
, dev
);
1150 * Caller may return ENODATA to indicate that there
1151 * was no data to be dumped. This is not an error, it
1152 * means we should trim the attribute header and
1155 if (err
== -ENODATA
)
1156 nla_nest_cancel(skb
, af
);
1158 goto nla_put_failure
;
1160 nla_nest_end(skb
, af
);
1164 nla_nest_end(skb
, af_spec
);
1166 return nlmsg_end(skb
, nlh
);
1169 nlmsg_cancel(skb
, nlh
);
1173 static const struct nla_policy ifla_policy
[IFLA_MAX
+1] = {
1174 [IFLA_IFNAME
] = { .type
= NLA_STRING
, .len
= IFNAMSIZ
-1 },
1175 [IFLA_ADDRESS
] = { .type
= NLA_BINARY
, .len
= MAX_ADDR_LEN
},
1176 [IFLA_BROADCAST
] = { .type
= NLA_BINARY
, .len
= MAX_ADDR_LEN
},
1177 [IFLA_MAP
] = { .len
= sizeof(struct rtnl_link_ifmap
) },
1178 [IFLA_MTU
] = { .type
= NLA_U32
},
1179 [IFLA_LINK
] = { .type
= NLA_U32
},
1180 [IFLA_MASTER
] = { .type
= NLA_U32
},
1181 [IFLA_CARRIER
] = { .type
= NLA_U8
},
1182 [IFLA_TXQLEN
] = { .type
= NLA_U32
},
1183 [IFLA_WEIGHT
] = { .type
= NLA_U32
},
1184 [IFLA_OPERSTATE
] = { .type
= NLA_U8
},
1185 [IFLA_LINKMODE
] = { .type
= NLA_U8
},
1186 [IFLA_LINKINFO
] = { .type
= NLA_NESTED
},
1187 [IFLA_NET_NS_PID
] = { .type
= NLA_U32
},
1188 [IFLA_NET_NS_FD
] = { .type
= NLA_U32
},
1189 [IFLA_IFALIAS
] = { .type
= NLA_STRING
, .len
= IFALIASZ
-1 },
1190 [IFLA_VFINFO_LIST
] = {. type
= NLA_NESTED
},
1191 [IFLA_VF_PORTS
] = { .type
= NLA_NESTED
},
1192 [IFLA_PORT_SELF
] = { .type
= NLA_NESTED
},
1193 [IFLA_AF_SPEC
] = { .type
= NLA_NESTED
},
1194 [IFLA_EXT_MASK
] = { .type
= NLA_U32
},
1195 [IFLA_PROMISCUITY
] = { .type
= NLA_U32
},
1196 [IFLA_NUM_TX_QUEUES
] = { .type
= NLA_U32
},
1197 [IFLA_NUM_RX_QUEUES
] = { .type
= NLA_U32
},
1198 [IFLA_PHYS_PORT_ID
] = { .type
= NLA_BINARY
, .len
= MAX_PHYS_PORT_ID_LEN
},
1199 [IFLA_CARRIER_CHANGES
] = { .type
= NLA_U32
}, /* ignored */
1202 static const struct nla_policy ifla_info_policy
[IFLA_INFO_MAX
+1] = {
1203 [IFLA_INFO_KIND
] = { .type
= NLA_STRING
},
1204 [IFLA_INFO_DATA
] = { .type
= NLA_NESTED
},
1205 [IFLA_INFO_SLAVE_KIND
] = { .type
= NLA_STRING
},
1206 [IFLA_INFO_SLAVE_DATA
] = { .type
= NLA_NESTED
},
1209 static const struct nla_policy ifla_vfinfo_policy
[IFLA_VF_INFO_MAX
+1] = {
1210 [IFLA_VF_INFO
] = { .type
= NLA_NESTED
},
1213 static const struct nla_policy ifla_vf_policy
[IFLA_VF_MAX
+1] = {
1214 [IFLA_VF_MAC
] = { .type
= NLA_BINARY
,
1215 .len
= sizeof(struct ifla_vf_mac
) },
1216 [IFLA_VF_VLAN
] = { .type
= NLA_BINARY
,
1217 .len
= sizeof(struct ifla_vf_vlan
) },
1218 [IFLA_VF_TX_RATE
] = { .type
= NLA_BINARY
,
1219 .len
= sizeof(struct ifla_vf_tx_rate
) },
1220 [IFLA_VF_SPOOFCHK
] = { .type
= NLA_BINARY
,
1221 .len
= sizeof(struct ifla_vf_spoofchk
) },
1222 [IFLA_VF_RATE
] = { .type
= NLA_BINARY
,
1223 .len
= sizeof(struct ifla_vf_rate
) },
1224 [IFLA_VF_LINK_STATE
] = { .type
= NLA_BINARY
,
1225 .len
= sizeof(struct ifla_vf_link_state
) },
1228 static const struct nla_policy ifla_port_policy
[IFLA_PORT_MAX
+1] = {
1229 [IFLA_PORT_VF
] = { .type
= NLA_U32
},
1230 [IFLA_PORT_PROFILE
] = { .type
= NLA_STRING
,
1231 .len
= PORT_PROFILE_MAX
},
1232 [IFLA_PORT_VSI_TYPE
] = { .type
= NLA_BINARY
,
1233 .len
= sizeof(struct ifla_port_vsi
)},
1234 [IFLA_PORT_INSTANCE_UUID
] = { .type
= NLA_BINARY
,
1235 .len
= PORT_UUID_MAX
},
1236 [IFLA_PORT_HOST_UUID
] = { .type
= NLA_STRING
,
1237 .len
= PORT_UUID_MAX
},
1238 [IFLA_PORT_REQUEST
] = { .type
= NLA_U8
, },
1239 [IFLA_PORT_RESPONSE
] = { .type
= NLA_U16
, },
1242 static int rtnl_dump_ifinfo(struct sk_buff
*skb
, struct netlink_callback
*cb
)
1244 struct net
*net
= sock_net(skb
->sk
);
1247 struct net_device
*dev
;
1248 struct hlist_head
*head
;
1249 struct nlattr
*tb
[IFLA_MAX
+1];
1250 u32 ext_filter_mask
= 0;
1255 s_idx
= cb
->args
[1];
1258 cb
->seq
= net
->dev_base_seq
;
1260 /* A hack to preserve kernel<->userspace interface.
1261 * The correct header is ifinfomsg. It is consistent with rtnl_getlink.
1262 * However, before Linux v3.9 the code here assumed rtgenmsg and that's
1263 * what iproute2 < v3.9.0 used.
1264 * We can detect the old iproute2. Even including the IFLA_EXT_MASK
1265 * attribute, its netlink message is shorter than struct ifinfomsg.
1267 hdrlen
= nlmsg_len(cb
->nlh
) < sizeof(struct ifinfomsg
) ?
1268 sizeof(struct rtgenmsg
) : sizeof(struct ifinfomsg
);
1270 if (nlmsg_parse(cb
->nlh
, hdrlen
, tb
, IFLA_MAX
, ifla_policy
) >= 0) {
1272 if (tb
[IFLA_EXT_MASK
])
1273 ext_filter_mask
= nla_get_u32(tb
[IFLA_EXT_MASK
]);
1276 for (h
= s_h
; h
< NETDEV_HASHENTRIES
; h
++, s_idx
= 0) {
1278 head
= &net
->dev_index_head
[h
];
1279 hlist_for_each_entry_rcu(dev
, head
, index_hlist
) {
1282 err
= rtnl_fill_ifinfo(skb
, dev
, RTM_NEWLINK
,
1283 NETLINK_CB(cb
->skb
).portid
,
1284 cb
->nlh
->nlmsg_seq
, 0,
1287 /* If we ran out of room on the first message,
1290 WARN_ON((err
== -EMSGSIZE
) && (skb
->len
== 0));
1295 nl_dump_check_consistent(cb
, nlmsg_hdr(skb
));
1308 int rtnl_nla_parse_ifla(struct nlattr
**tb
, const struct nlattr
*head
, int len
)
1310 return nla_parse(tb
, IFLA_MAX
, head
, len
, ifla_policy
);
1312 EXPORT_SYMBOL(rtnl_nla_parse_ifla
);
1314 struct net
*rtnl_link_get_net(struct net
*src_net
, struct nlattr
*tb
[])
1317 /* Examine the link attributes and figure out which
1318 * network namespace we are talking about.
1320 if (tb
[IFLA_NET_NS_PID
])
1321 net
= get_net_ns_by_pid(nla_get_u32(tb
[IFLA_NET_NS_PID
]));
1322 else if (tb
[IFLA_NET_NS_FD
])
1323 net
= get_net_ns_by_fd(nla_get_u32(tb
[IFLA_NET_NS_FD
]));
1325 net
= get_net(src_net
);
1328 EXPORT_SYMBOL(rtnl_link_get_net
);
1330 static int validate_linkmsg(struct net_device
*dev
, struct nlattr
*tb
[])
1333 if (tb
[IFLA_ADDRESS
] &&
1334 nla_len(tb
[IFLA_ADDRESS
]) < dev
->addr_len
)
1337 if (tb
[IFLA_BROADCAST
] &&
1338 nla_len(tb
[IFLA_BROADCAST
]) < dev
->addr_len
)
1342 if (tb
[IFLA_AF_SPEC
]) {
1346 nla_for_each_nested(af
, tb
[IFLA_AF_SPEC
], rem
) {
1347 const struct rtnl_af_ops
*af_ops
;
1349 if (!(af_ops
= rtnl_af_lookup(nla_type(af
))))
1350 return -EAFNOSUPPORT
;
1352 if (!af_ops
->set_link_af
)
1355 if (af_ops
->validate_link_af
) {
1356 err
= af_ops
->validate_link_af(dev
, af
);
1366 static int do_setvfinfo(struct net_device
*dev
, struct nlattr
*attr
)
1368 int rem
, err
= -EINVAL
;
1370 const struct net_device_ops
*ops
= dev
->netdev_ops
;
1372 nla_for_each_nested(vf
, attr
, rem
) {
1373 switch (nla_type(vf
)) {
1375 struct ifla_vf_mac
*ivm
;
1378 if (ops
->ndo_set_vf_mac
)
1379 err
= ops
->ndo_set_vf_mac(dev
, ivm
->vf
,
1383 case IFLA_VF_VLAN
: {
1384 struct ifla_vf_vlan
*ivv
;
1387 if (ops
->ndo_set_vf_vlan
)
1388 err
= ops
->ndo_set_vf_vlan(dev
, ivv
->vf
,
1393 case IFLA_VF_TX_RATE
: {
1394 struct ifla_vf_tx_rate
*ivt
;
1395 struct ifla_vf_info ivf
;
1398 if (ops
->ndo_get_vf_config
)
1399 err
= ops
->ndo_get_vf_config(dev
, ivt
->vf
,
1404 if (ops
->ndo_set_vf_rate
)
1405 err
= ops
->ndo_set_vf_rate(dev
, ivt
->vf
,
1410 case IFLA_VF_RATE
: {
1411 struct ifla_vf_rate
*ivt
;
1414 if (ops
->ndo_set_vf_rate
)
1415 err
= ops
->ndo_set_vf_rate(dev
, ivt
->vf
,
1420 case IFLA_VF_SPOOFCHK
: {
1421 struct ifla_vf_spoofchk
*ivs
;
1424 if (ops
->ndo_set_vf_spoofchk
)
1425 err
= ops
->ndo_set_vf_spoofchk(dev
, ivs
->vf
,
1429 case IFLA_VF_LINK_STATE
: {
1430 struct ifla_vf_link_state
*ivl
;
1433 if (ops
->ndo_set_vf_link_state
)
1434 err
= ops
->ndo_set_vf_link_state(dev
, ivl
->vf
,
1448 static int do_set_master(struct net_device
*dev
, int ifindex
)
1450 struct net_device
*upper_dev
= netdev_master_upper_dev_get(dev
);
1451 const struct net_device_ops
*ops
;
1455 if (upper_dev
->ifindex
== ifindex
)
1457 ops
= upper_dev
->netdev_ops
;
1458 if (ops
->ndo_del_slave
) {
1459 err
= ops
->ndo_del_slave(upper_dev
, dev
);
1468 upper_dev
= __dev_get_by_index(dev_net(dev
), ifindex
);
1471 ops
= upper_dev
->netdev_ops
;
1472 if (ops
->ndo_add_slave
) {
1473 err
= ops
->ndo_add_slave(upper_dev
, dev
);
1483 static int do_setlink(const struct sk_buff
*skb
,
1484 struct net_device
*dev
, struct ifinfomsg
*ifm
,
1485 struct nlattr
**tb
, char *ifname
, int modified
)
1487 const struct net_device_ops
*ops
= dev
->netdev_ops
;
1490 if (tb
[IFLA_NET_NS_PID
] || tb
[IFLA_NET_NS_FD
]) {
1491 struct net
*net
= rtnl_link_get_net(dev_net(dev
), tb
);
1496 if (!netlink_ns_capable(skb
, net
->user_ns
, CAP_NET_ADMIN
)) {
1500 err
= dev_change_net_namespace(dev
, net
, ifname
);
1508 struct rtnl_link_ifmap
*u_map
;
1511 if (!ops
->ndo_set_config
) {
1516 if (!netif_device_present(dev
)) {
1521 u_map
= nla_data(tb
[IFLA_MAP
]);
1522 k_map
.mem_start
= (unsigned long) u_map
->mem_start
;
1523 k_map
.mem_end
= (unsigned long) u_map
->mem_end
;
1524 k_map
.base_addr
= (unsigned short) u_map
->base_addr
;
1525 k_map
.irq
= (unsigned char) u_map
->irq
;
1526 k_map
.dma
= (unsigned char) u_map
->dma
;
1527 k_map
.port
= (unsigned char) u_map
->port
;
1529 err
= ops
->ndo_set_config(dev
, &k_map
);
1536 if (tb
[IFLA_ADDRESS
]) {
1537 struct sockaddr
*sa
;
1540 len
= sizeof(sa_family_t
) + dev
->addr_len
;
1541 sa
= kmalloc(len
, GFP_KERNEL
);
1546 sa
->sa_family
= dev
->type
;
1547 memcpy(sa
->sa_data
, nla_data(tb
[IFLA_ADDRESS
]),
1549 err
= dev_set_mac_address(dev
, sa
);
1557 err
= dev_set_mtu(dev
, nla_get_u32(tb
[IFLA_MTU
]));
1563 if (tb
[IFLA_GROUP
]) {
1564 dev_set_group(dev
, nla_get_u32(tb
[IFLA_GROUP
]));
1569 * Interface selected by interface index but interface
1570 * name provided implies that a name change has been
1573 if (ifm
->ifi_index
> 0 && ifname
[0]) {
1574 err
= dev_change_name(dev
, ifname
);
1580 if (tb
[IFLA_IFALIAS
]) {
1581 err
= dev_set_alias(dev
, nla_data(tb
[IFLA_IFALIAS
]),
1582 nla_len(tb
[IFLA_IFALIAS
]));
1588 if (tb
[IFLA_BROADCAST
]) {
1589 nla_memcpy(dev
->broadcast
, tb
[IFLA_BROADCAST
], dev
->addr_len
);
1590 call_netdevice_notifiers(NETDEV_CHANGEADDR
, dev
);
1593 if (ifm
->ifi_flags
|| ifm
->ifi_change
) {
1594 err
= dev_change_flags(dev
, rtnl_dev_combine_flags(dev
, ifm
));
1599 if (tb
[IFLA_MASTER
]) {
1600 err
= do_set_master(dev
, nla_get_u32(tb
[IFLA_MASTER
]));
1606 if (tb
[IFLA_CARRIER
]) {
1607 err
= dev_change_carrier(dev
, nla_get_u8(tb
[IFLA_CARRIER
]));
1613 if (tb
[IFLA_TXQLEN
])
1614 dev
->tx_queue_len
= nla_get_u32(tb
[IFLA_TXQLEN
]);
1616 if (tb
[IFLA_OPERSTATE
])
1617 set_operstate(dev
, nla_get_u8(tb
[IFLA_OPERSTATE
]));
1619 if (tb
[IFLA_LINKMODE
]) {
1620 write_lock_bh(&dev_base_lock
);
1621 dev
->link_mode
= nla_get_u8(tb
[IFLA_LINKMODE
]);
1622 write_unlock_bh(&dev_base_lock
);
1625 if (tb
[IFLA_VFINFO_LIST
]) {
1626 struct nlattr
*attr
;
1628 nla_for_each_nested(attr
, tb
[IFLA_VFINFO_LIST
], rem
) {
1629 if (nla_type(attr
) != IFLA_VF_INFO
) {
1633 err
= do_setvfinfo(dev
, attr
);
1641 if (tb
[IFLA_VF_PORTS
]) {
1642 struct nlattr
*port
[IFLA_PORT_MAX
+1];
1643 struct nlattr
*attr
;
1648 if (!ops
->ndo_set_vf_port
)
1651 nla_for_each_nested(attr
, tb
[IFLA_VF_PORTS
], rem
) {
1652 if (nla_type(attr
) != IFLA_VF_PORT
)
1654 err
= nla_parse_nested(port
, IFLA_PORT_MAX
,
1655 attr
, ifla_port_policy
);
1658 if (!port
[IFLA_PORT_VF
]) {
1662 vf
= nla_get_u32(port
[IFLA_PORT_VF
]);
1663 err
= ops
->ndo_set_vf_port(dev
, vf
, port
);
1671 if (tb
[IFLA_PORT_SELF
]) {
1672 struct nlattr
*port
[IFLA_PORT_MAX
+1];
1674 err
= nla_parse_nested(port
, IFLA_PORT_MAX
,
1675 tb
[IFLA_PORT_SELF
], ifla_port_policy
);
1680 if (ops
->ndo_set_vf_port
)
1681 err
= ops
->ndo_set_vf_port(dev
, PORT_SELF_VF
, port
);
1687 if (tb
[IFLA_AF_SPEC
]) {
1691 nla_for_each_nested(af
, tb
[IFLA_AF_SPEC
], rem
) {
1692 const struct rtnl_af_ops
*af_ops
;
1694 if (!(af_ops
= rtnl_af_lookup(nla_type(af
))))
1697 err
= af_ops
->set_link_af(dev
, af
);
1707 if (err
< 0 && modified
)
1708 net_warn_ratelimited("A link change request failed with some changes committed already. Interface %s may have been left with an inconsistent configuration, please check.\n",
1714 static int rtnl_setlink(struct sk_buff
*skb
, struct nlmsghdr
*nlh
)
1716 struct net
*net
= sock_net(skb
->sk
);
1717 struct ifinfomsg
*ifm
;
1718 struct net_device
*dev
;
1720 struct nlattr
*tb
[IFLA_MAX
+1];
1721 char ifname
[IFNAMSIZ
];
1723 err
= nlmsg_parse(nlh
, sizeof(*ifm
), tb
, IFLA_MAX
, ifla_policy
);
1727 if (tb
[IFLA_IFNAME
])
1728 nla_strlcpy(ifname
, tb
[IFLA_IFNAME
], IFNAMSIZ
);
1733 ifm
= nlmsg_data(nlh
);
1734 if (ifm
->ifi_index
> 0)
1735 dev
= __dev_get_by_index(net
, ifm
->ifi_index
);
1736 else if (tb
[IFLA_IFNAME
])
1737 dev
= __dev_get_by_name(net
, ifname
);
1746 err
= validate_linkmsg(dev
, tb
);
1750 err
= do_setlink(skb
, dev
, ifm
, tb
, ifname
, 0);
1755 static int rtnl_dellink(struct sk_buff
*skb
, struct nlmsghdr
*nlh
)
1757 struct net
*net
= sock_net(skb
->sk
);
1758 const struct rtnl_link_ops
*ops
;
1759 struct net_device
*dev
;
1760 struct ifinfomsg
*ifm
;
1761 char ifname
[IFNAMSIZ
];
1762 struct nlattr
*tb
[IFLA_MAX
+1];
1764 LIST_HEAD(list_kill
);
1766 err
= nlmsg_parse(nlh
, sizeof(*ifm
), tb
, IFLA_MAX
, ifla_policy
);
1770 if (tb
[IFLA_IFNAME
])
1771 nla_strlcpy(ifname
, tb
[IFLA_IFNAME
], IFNAMSIZ
);
1773 ifm
= nlmsg_data(nlh
);
1774 if (ifm
->ifi_index
> 0)
1775 dev
= __dev_get_by_index(net
, ifm
->ifi_index
);
1776 else if (tb
[IFLA_IFNAME
])
1777 dev
= __dev_get_by_name(net
, ifname
);
1784 ops
= dev
->rtnl_link_ops
;
1785 if (!ops
|| !ops
->dellink
)
1788 ops
->dellink(dev
, &list_kill
);
1789 unregister_netdevice_many(&list_kill
);
1793 int rtnl_configure_link(struct net_device
*dev
, const struct ifinfomsg
*ifm
)
1795 unsigned int old_flags
;
1798 old_flags
= dev
->flags
;
1799 if (ifm
&& (ifm
->ifi_flags
|| ifm
->ifi_change
)) {
1800 err
= __dev_change_flags(dev
, rtnl_dev_combine_flags(dev
, ifm
));
1805 dev
->rtnl_link_state
= RTNL_LINK_INITIALIZED
;
1807 __dev_notify_flags(dev
, old_flags
, ~0U);
1810 EXPORT_SYMBOL(rtnl_configure_link
);
1812 struct net_device
*rtnl_create_link(struct net
*net
,
1813 char *ifname
, const struct rtnl_link_ops
*ops
, struct nlattr
*tb
[])
1816 struct net_device
*dev
;
1817 unsigned int num_tx_queues
= 1;
1818 unsigned int num_rx_queues
= 1;
1820 if (tb
[IFLA_NUM_TX_QUEUES
])
1821 num_tx_queues
= nla_get_u32(tb
[IFLA_NUM_TX_QUEUES
]);
1822 else if (ops
->get_num_tx_queues
)
1823 num_tx_queues
= ops
->get_num_tx_queues();
1825 if (tb
[IFLA_NUM_RX_QUEUES
])
1826 num_rx_queues
= nla_get_u32(tb
[IFLA_NUM_RX_QUEUES
]);
1827 else if (ops
->get_num_rx_queues
)
1828 num_rx_queues
= ops
->get_num_rx_queues();
1831 dev
= alloc_netdev_mqs(ops
->priv_size
, ifname
, ops
->setup
,
1832 num_tx_queues
, num_rx_queues
);
1836 dev_net_set(dev
, net
);
1837 dev
->rtnl_link_ops
= ops
;
1838 dev
->rtnl_link_state
= RTNL_LINK_INITIALIZING
;
1841 dev
->mtu
= nla_get_u32(tb
[IFLA_MTU
]);
1842 if (tb
[IFLA_ADDRESS
]) {
1843 memcpy(dev
->dev_addr
, nla_data(tb
[IFLA_ADDRESS
]),
1844 nla_len(tb
[IFLA_ADDRESS
]));
1845 dev
->addr_assign_type
= NET_ADDR_SET
;
1847 if (tb
[IFLA_BROADCAST
])
1848 memcpy(dev
->broadcast
, nla_data(tb
[IFLA_BROADCAST
]),
1849 nla_len(tb
[IFLA_BROADCAST
]));
1850 if (tb
[IFLA_TXQLEN
])
1851 dev
->tx_queue_len
= nla_get_u32(tb
[IFLA_TXQLEN
]);
1852 if (tb
[IFLA_OPERSTATE
])
1853 set_operstate(dev
, nla_get_u8(tb
[IFLA_OPERSTATE
]));
1854 if (tb
[IFLA_LINKMODE
])
1855 dev
->link_mode
= nla_get_u8(tb
[IFLA_LINKMODE
]);
1857 dev_set_group(dev
, nla_get_u32(tb
[IFLA_GROUP
]));
1862 return ERR_PTR(err
);
1864 EXPORT_SYMBOL(rtnl_create_link
);
1866 static int rtnl_group_changelink(const struct sk_buff
*skb
,
1867 struct net
*net
, int group
,
1868 struct ifinfomsg
*ifm
,
1871 struct net_device
*dev
;
1874 for_each_netdev(net
, dev
) {
1875 if (dev
->group
== group
) {
1876 err
= do_setlink(skb
, dev
, ifm
, tb
, NULL
, 0);
1885 static int rtnl_newlink(struct sk_buff
*skb
, struct nlmsghdr
*nlh
)
1887 struct net
*net
= sock_net(skb
->sk
);
1888 const struct rtnl_link_ops
*ops
;
1889 const struct rtnl_link_ops
*m_ops
= NULL
;
1890 struct net_device
*dev
;
1891 struct net_device
*master_dev
= NULL
;
1892 struct ifinfomsg
*ifm
;
1893 char kind
[MODULE_NAME_LEN
];
1894 char ifname
[IFNAMSIZ
];
1895 struct nlattr
*tb
[IFLA_MAX
+1];
1896 struct nlattr
*linkinfo
[IFLA_INFO_MAX
+1];
1899 #ifdef CONFIG_MODULES
1902 err
= nlmsg_parse(nlh
, sizeof(*ifm
), tb
, IFLA_MAX
, ifla_policy
);
1906 if (tb
[IFLA_IFNAME
])
1907 nla_strlcpy(ifname
, tb
[IFLA_IFNAME
], IFNAMSIZ
);
1911 ifm
= nlmsg_data(nlh
);
1912 if (ifm
->ifi_index
> 0)
1913 dev
= __dev_get_by_index(net
, ifm
->ifi_index
);
1916 dev
= __dev_get_by_name(net
, ifname
);
1922 master_dev
= netdev_master_upper_dev_get(dev
);
1924 m_ops
= master_dev
->rtnl_link_ops
;
1927 err
= validate_linkmsg(dev
, tb
);
1931 if (tb
[IFLA_LINKINFO
]) {
1932 err
= nla_parse_nested(linkinfo
, IFLA_INFO_MAX
,
1933 tb
[IFLA_LINKINFO
], ifla_info_policy
);
1937 memset(linkinfo
, 0, sizeof(linkinfo
));
1939 if (linkinfo
[IFLA_INFO_KIND
]) {
1940 nla_strlcpy(kind
, linkinfo
[IFLA_INFO_KIND
], sizeof(kind
));
1941 ops
= rtnl_link_ops_get(kind
);
1948 struct nlattr
*attr
[ops
? ops
->maxtype
+ 1 : 0];
1949 struct nlattr
*slave_attr
[m_ops
? m_ops
->slave_maxtype
+ 1 : 0];
1950 struct nlattr
**data
= NULL
;
1951 struct nlattr
**slave_data
= NULL
;
1952 struct net
*dest_net
;
1955 if (ops
->maxtype
&& linkinfo
[IFLA_INFO_DATA
]) {
1956 err
= nla_parse_nested(attr
, ops
->maxtype
,
1957 linkinfo
[IFLA_INFO_DATA
],
1963 if (ops
->validate
) {
1964 err
= ops
->validate(tb
, data
);
1971 if (m_ops
->slave_maxtype
&&
1972 linkinfo
[IFLA_INFO_SLAVE_DATA
]) {
1973 err
= nla_parse_nested(slave_attr
,
1974 m_ops
->slave_maxtype
,
1975 linkinfo
[IFLA_INFO_SLAVE_DATA
],
1976 m_ops
->slave_policy
);
1979 slave_data
= slave_attr
;
1981 if (m_ops
->slave_validate
) {
1982 err
= m_ops
->slave_validate(tb
, slave_data
);
1991 if (nlh
->nlmsg_flags
& NLM_F_EXCL
)
1993 if (nlh
->nlmsg_flags
& NLM_F_REPLACE
)
1996 if (linkinfo
[IFLA_INFO_DATA
]) {
1997 if (!ops
|| ops
!= dev
->rtnl_link_ops
||
2001 err
= ops
->changelink(dev
, tb
, data
);
2007 if (linkinfo
[IFLA_INFO_SLAVE_DATA
]) {
2008 if (!m_ops
|| !m_ops
->slave_changelink
)
2011 err
= m_ops
->slave_changelink(master_dev
, dev
,
2018 return do_setlink(skb
, dev
, ifm
, tb
, ifname
, modified
);
2021 if (!(nlh
->nlmsg_flags
& NLM_F_CREATE
)) {
2022 if (ifm
->ifi_index
== 0 && tb
[IFLA_GROUP
])
2023 return rtnl_group_changelink(skb
, net
,
2024 nla_get_u32(tb
[IFLA_GROUP
]),
2029 if (tb
[IFLA_MAP
] || tb
[IFLA_MASTER
] || tb
[IFLA_PROTINFO
])
2033 #ifdef CONFIG_MODULES
2036 request_module("rtnl-link-%s", kind
);
2038 ops
= rtnl_link_ops_get(kind
);
2050 snprintf(ifname
, IFNAMSIZ
, "%s%%d", ops
->kind
);
2052 dest_net
= rtnl_link_get_net(net
, tb
);
2053 if (IS_ERR(dest_net
))
2054 return PTR_ERR(dest_net
);
2056 dev
= rtnl_create_link(dest_net
, ifname
, ops
, tb
);
2062 dev
->ifindex
= ifm
->ifi_index
;
2065 err
= ops
->newlink(net
, dev
, tb
, data
);
2066 /* Drivers should call free_netdev() in ->destructor
2067 * and unregister it on failure after registration
2068 * so that device could be finally freed in rtnl_unlock.
2071 /* If device is not registered at all, free it now */
2072 if (dev
->reg_state
== NETREG_UNINITIALIZED
)
2077 err
= register_netdevice(dev
);
2083 err
= rtnl_configure_link(dev
, ifm
);
2085 unregister_netdevice(dev
);
2092 static int rtnl_getlink(struct sk_buff
*skb
, struct nlmsghdr
* nlh
)
2094 struct net
*net
= sock_net(skb
->sk
);
2095 struct ifinfomsg
*ifm
;
2096 char ifname
[IFNAMSIZ
];
2097 struct nlattr
*tb
[IFLA_MAX
+1];
2098 struct net_device
*dev
= NULL
;
2099 struct sk_buff
*nskb
;
2101 u32 ext_filter_mask
= 0;
2103 err
= nlmsg_parse(nlh
, sizeof(*ifm
), tb
, IFLA_MAX
, ifla_policy
);
2107 if (tb
[IFLA_IFNAME
])
2108 nla_strlcpy(ifname
, tb
[IFLA_IFNAME
], IFNAMSIZ
);
2110 if (tb
[IFLA_EXT_MASK
])
2111 ext_filter_mask
= nla_get_u32(tb
[IFLA_EXT_MASK
]);
2113 ifm
= nlmsg_data(nlh
);
2114 if (ifm
->ifi_index
> 0)
2115 dev
= __dev_get_by_index(net
, ifm
->ifi_index
);
2116 else if (tb
[IFLA_IFNAME
])
2117 dev
= __dev_get_by_name(net
, ifname
);
2124 nskb
= nlmsg_new(if_nlmsg_size(dev
, ext_filter_mask
), GFP_KERNEL
);
2128 err
= rtnl_fill_ifinfo(nskb
, dev
, RTM_NEWLINK
, NETLINK_CB(skb
).portid
,
2129 nlh
->nlmsg_seq
, 0, 0, ext_filter_mask
);
2131 /* -EMSGSIZE implies BUG in if_nlmsg_size */
2132 WARN_ON(err
== -EMSGSIZE
);
2135 err
= rtnl_unicast(nskb
, net
, NETLINK_CB(skb
).portid
);
2140 static u16
rtnl_calcit(struct sk_buff
*skb
, struct nlmsghdr
*nlh
)
2142 struct net
*net
= sock_net(skb
->sk
);
2143 struct net_device
*dev
;
2144 struct nlattr
*tb
[IFLA_MAX
+1];
2145 u32 ext_filter_mask
= 0;
2146 u16 min_ifinfo_dump_size
= 0;
2149 /* Same kernel<->userspace interface hack as in rtnl_dump_ifinfo. */
2150 hdrlen
= nlmsg_len(nlh
) < sizeof(struct ifinfomsg
) ?
2151 sizeof(struct rtgenmsg
) : sizeof(struct ifinfomsg
);
2153 if (nlmsg_parse(nlh
, hdrlen
, tb
, IFLA_MAX
, ifla_policy
) >= 0) {
2154 if (tb
[IFLA_EXT_MASK
])
2155 ext_filter_mask
= nla_get_u32(tb
[IFLA_EXT_MASK
]);
2158 if (!ext_filter_mask
)
2159 return NLMSG_GOODSIZE
;
2161 * traverse the list of net devices and compute the minimum
2162 * buffer size based upon the filter mask.
2164 list_for_each_entry(dev
, &net
->dev_base_head
, dev_list
) {
2165 min_ifinfo_dump_size
= max_t(u16
, min_ifinfo_dump_size
,
2170 return min_ifinfo_dump_size
;
2173 static int rtnl_dump_all(struct sk_buff
*skb
, struct netlink_callback
*cb
)
2176 int s_idx
= cb
->family
;
2180 for (idx
= 1; idx
<= RTNL_FAMILY_MAX
; idx
++) {
2181 int type
= cb
->nlh
->nlmsg_type
-RTM_BASE
;
2182 if (idx
< s_idx
|| idx
== PF_PACKET
)
2184 if (rtnl_msg_handlers
[idx
] == NULL
||
2185 rtnl_msg_handlers
[idx
][type
].dumpit
== NULL
)
2188 memset(&cb
->args
[0], 0, sizeof(cb
->args
));
2192 if (rtnl_msg_handlers
[idx
][type
].dumpit(skb
, cb
))
2200 void rtmsg_ifinfo(int type
, struct net_device
*dev
, unsigned int change
,
2203 struct net
*net
= dev_net(dev
);
2204 struct sk_buff
*skb
;
2206 size_t if_info_size
;
2208 skb
= nlmsg_new((if_info_size
= if_nlmsg_size(dev
, 0)), flags
);
2212 err
= rtnl_fill_ifinfo(skb
, dev
, type
, 0, 0, change
, 0, 0);
2214 /* -EMSGSIZE implies BUG in if_nlmsg_size() */
2215 WARN_ON(err
== -EMSGSIZE
);
2219 rtnl_notify(skb
, net
, 0, RTNLGRP_LINK
, NULL
, flags
);
2223 rtnl_set_sk_err(net
, RTNLGRP_LINK
, err
);
2225 EXPORT_SYMBOL(rtmsg_ifinfo
);
2227 static int nlmsg_populate_fdb_fill(struct sk_buff
*skb
,
2228 struct net_device
*dev
,
2229 u8
*addr
, u32 pid
, u32 seq
,
2230 int type
, unsigned int flags
,
2233 struct nlmsghdr
*nlh
;
2236 nlh
= nlmsg_put(skb
, pid
, seq
, type
, sizeof(*ndm
), nlflags
);
2240 ndm
= nlmsg_data(nlh
);
2241 ndm
->ndm_family
= AF_BRIDGE
;
2244 ndm
->ndm_flags
= flags
;
2246 ndm
->ndm_ifindex
= dev
->ifindex
;
2247 ndm
->ndm_state
= NUD_PERMANENT
;
2249 if (nla_put(skb
, NDA_LLADDR
, ETH_ALEN
, addr
))
2250 goto nla_put_failure
;
2252 return nlmsg_end(skb
, nlh
);
2255 nlmsg_cancel(skb
, nlh
);
2259 static inline size_t rtnl_fdb_nlmsg_size(void)
2261 return NLMSG_ALIGN(sizeof(struct ndmsg
)) + nla_total_size(ETH_ALEN
);
2264 static void rtnl_fdb_notify(struct net_device
*dev
, u8
*addr
, int type
)
2266 struct net
*net
= dev_net(dev
);
2267 struct sk_buff
*skb
;
2270 skb
= nlmsg_new(rtnl_fdb_nlmsg_size(), GFP_ATOMIC
);
2274 err
= nlmsg_populate_fdb_fill(skb
, dev
, addr
, 0, 0, type
, NTF_SELF
, 0);
2280 rtnl_notify(skb
, net
, 0, RTNLGRP_NEIGH
, NULL
, GFP_ATOMIC
);
2283 rtnl_set_sk_err(net
, RTNLGRP_NEIGH
, err
);
2287 * ndo_dflt_fdb_add - default netdevice operation to add an FDB entry
2289 int ndo_dflt_fdb_add(struct ndmsg
*ndm
,
2290 struct nlattr
*tb
[],
2291 struct net_device
*dev
,
2292 const unsigned char *addr
,
2297 /* If aging addresses are supported device will need to
2298 * implement its own handler for this.
2300 if (ndm
->ndm_state
&& !(ndm
->ndm_state
& NUD_PERMANENT
)) {
2301 pr_info("%s: FDB only supports static addresses\n", dev
->name
);
2305 if (is_unicast_ether_addr(addr
) || is_link_local_ether_addr(addr
))
2306 err
= dev_uc_add_excl(dev
, addr
);
2307 else if (is_multicast_ether_addr(addr
))
2308 err
= dev_mc_add_excl(dev
, addr
);
2310 /* Only return duplicate errors if NLM_F_EXCL is set */
2311 if (err
== -EEXIST
&& !(flags
& NLM_F_EXCL
))
2316 EXPORT_SYMBOL(ndo_dflt_fdb_add
);
2318 static int rtnl_fdb_add(struct sk_buff
*skb
, struct nlmsghdr
*nlh
)
2320 struct net
*net
= sock_net(skb
->sk
);
2322 struct nlattr
*tb
[NDA_MAX
+1];
2323 struct net_device
*dev
;
2327 err
= nlmsg_parse(nlh
, sizeof(*ndm
), tb
, NDA_MAX
, NULL
);
2331 ndm
= nlmsg_data(nlh
);
2332 if (ndm
->ndm_ifindex
== 0) {
2333 pr_info("PF_BRIDGE: RTM_NEWNEIGH with invalid ifindex\n");
2337 dev
= __dev_get_by_index(net
, ndm
->ndm_ifindex
);
2339 pr_info("PF_BRIDGE: RTM_NEWNEIGH with unknown ifindex\n");
2343 if (!tb
[NDA_LLADDR
] || nla_len(tb
[NDA_LLADDR
]) != ETH_ALEN
) {
2344 pr_info("PF_BRIDGE: RTM_NEWNEIGH with invalid address\n");
2348 addr
= nla_data(tb
[NDA_LLADDR
]);
2352 /* Support fdb on master device the net/bridge default case */
2353 if ((!ndm
->ndm_flags
|| ndm
->ndm_flags
& NTF_MASTER
) &&
2354 (dev
->priv_flags
& IFF_BRIDGE_PORT
)) {
2355 struct net_device
*br_dev
= netdev_master_upper_dev_get(dev
);
2356 const struct net_device_ops
*ops
= br_dev
->netdev_ops
;
2358 err
= ops
->ndo_fdb_add(ndm
, tb
, dev
, addr
, nlh
->nlmsg_flags
);
2362 ndm
->ndm_flags
&= ~NTF_MASTER
;
2365 /* Embedded bridge, macvlan, and any other device support */
2366 if ((ndm
->ndm_flags
& NTF_SELF
)) {
2367 if (dev
->netdev_ops
->ndo_fdb_add
)
2368 err
= dev
->netdev_ops
->ndo_fdb_add(ndm
, tb
, dev
, addr
,
2371 err
= ndo_dflt_fdb_add(ndm
, tb
, dev
, addr
,
2375 rtnl_fdb_notify(dev
, addr
, RTM_NEWNEIGH
);
2376 ndm
->ndm_flags
&= ~NTF_SELF
;
2384 * ndo_dflt_fdb_del - default netdevice operation to delete an FDB entry
2386 int ndo_dflt_fdb_del(struct ndmsg
*ndm
,
2387 struct nlattr
*tb
[],
2388 struct net_device
*dev
,
2389 const unsigned char *addr
)
2391 int err
= -EOPNOTSUPP
;
2393 /* If aging addresses are supported device will need to
2394 * implement its own handler for this.
2396 if (!(ndm
->ndm_state
& NUD_PERMANENT
)) {
2397 pr_info("%s: FDB only supports static addresses\n", dev
->name
);
2401 if (is_unicast_ether_addr(addr
) || is_link_local_ether_addr(addr
))
2402 err
= dev_uc_del(dev
, addr
);
2403 else if (is_multicast_ether_addr(addr
))
2404 err
= dev_mc_del(dev
, addr
);
2410 EXPORT_SYMBOL(ndo_dflt_fdb_del
);
2412 static int rtnl_fdb_del(struct sk_buff
*skb
, struct nlmsghdr
*nlh
)
2414 struct net
*net
= sock_net(skb
->sk
);
2416 struct nlattr
*tb
[NDA_MAX
+1];
2417 struct net_device
*dev
;
2421 if (!netlink_capable(skb
, CAP_NET_ADMIN
))
2424 err
= nlmsg_parse(nlh
, sizeof(*ndm
), tb
, NDA_MAX
, NULL
);
2428 ndm
= nlmsg_data(nlh
);
2429 if (ndm
->ndm_ifindex
== 0) {
2430 pr_info("PF_BRIDGE: RTM_DELNEIGH with invalid ifindex\n");
2434 dev
= __dev_get_by_index(net
, ndm
->ndm_ifindex
);
2436 pr_info("PF_BRIDGE: RTM_DELNEIGH with unknown ifindex\n");
2440 if (!tb
[NDA_LLADDR
] || nla_len(tb
[NDA_LLADDR
]) != ETH_ALEN
) {
2441 pr_info("PF_BRIDGE: RTM_DELNEIGH with invalid address\n");
2445 addr
= nla_data(tb
[NDA_LLADDR
]);
2449 /* Support fdb on master device the net/bridge default case */
2450 if ((!ndm
->ndm_flags
|| ndm
->ndm_flags
& NTF_MASTER
) &&
2451 (dev
->priv_flags
& IFF_BRIDGE_PORT
)) {
2452 struct net_device
*br_dev
= netdev_master_upper_dev_get(dev
);
2453 const struct net_device_ops
*ops
= br_dev
->netdev_ops
;
2455 if (ops
->ndo_fdb_del
)
2456 err
= ops
->ndo_fdb_del(ndm
, tb
, dev
, addr
);
2461 ndm
->ndm_flags
&= ~NTF_MASTER
;
2464 /* Embedded bridge, macvlan, and any other device support */
2465 if (ndm
->ndm_flags
& NTF_SELF
) {
2466 if (dev
->netdev_ops
->ndo_fdb_del
)
2467 err
= dev
->netdev_ops
->ndo_fdb_del(ndm
, tb
, dev
, addr
);
2469 err
= ndo_dflt_fdb_del(ndm
, tb
, dev
, addr
);
2472 rtnl_fdb_notify(dev
, addr
, RTM_DELNEIGH
);
2473 ndm
->ndm_flags
&= ~NTF_SELF
;
2480 static int nlmsg_populate_fdb(struct sk_buff
*skb
,
2481 struct netlink_callback
*cb
,
2482 struct net_device
*dev
,
2484 struct netdev_hw_addr_list
*list
)
2486 struct netdev_hw_addr
*ha
;
2490 portid
= NETLINK_CB(cb
->skb
).portid
;
2491 seq
= cb
->nlh
->nlmsg_seq
;
2493 list_for_each_entry(ha
, &list
->list
, list
) {
2494 if (*idx
< cb
->args
[0])
2497 err
= nlmsg_populate_fdb_fill(skb
, dev
, ha
->addr
,
2499 RTM_NEWNEIGH
, NTF_SELF
,
2510 * ndo_dflt_fdb_dump - default netdevice operation to dump an FDB table.
2511 * @nlh: netlink message header
2514 * Default netdevice operation to dump the existing unicast address list.
2515 * Returns number of addresses from list put in skb.
2517 int ndo_dflt_fdb_dump(struct sk_buff
*skb
,
2518 struct netlink_callback
*cb
,
2519 struct net_device
*dev
,
2520 struct net_device
*filter_dev
,
2525 netif_addr_lock_bh(dev
);
2526 err
= nlmsg_populate_fdb(skb
, cb
, dev
, &idx
, &dev
->uc
);
2529 nlmsg_populate_fdb(skb
, cb
, dev
, &idx
, &dev
->mc
);
2531 netif_addr_unlock_bh(dev
);
2534 EXPORT_SYMBOL(ndo_dflt_fdb_dump
);
2536 static int rtnl_fdb_dump(struct sk_buff
*skb
, struct netlink_callback
*cb
)
2539 struct net
*net
= sock_net(skb
->sk
);
2540 struct net_device
*dev
;
2543 for_each_netdev_rcu(net
, dev
) {
2544 if (dev
->priv_flags
& IFF_BRIDGE_PORT
) {
2545 struct net_device
*br_dev
;
2546 const struct net_device_ops
*ops
;
2548 br_dev
= netdev_master_upper_dev_get(dev
);
2549 ops
= br_dev
->netdev_ops
;
2550 if (ops
->ndo_fdb_dump
)
2551 idx
= ops
->ndo_fdb_dump(skb
, cb
, dev
, NULL
,
2555 if (dev
->netdev_ops
->ndo_fdb_dump
)
2556 idx
= dev
->netdev_ops
->ndo_fdb_dump(skb
, cb
, dev
, NULL
,
2559 idx
= ndo_dflt_fdb_dump(skb
, cb
, dev
, NULL
, idx
);
2567 int ndo_dflt_bridge_getlink(struct sk_buff
*skb
, u32 pid
, u32 seq
,
2568 struct net_device
*dev
, u16 mode
)
2570 struct nlmsghdr
*nlh
;
2571 struct ifinfomsg
*ifm
;
2572 struct nlattr
*br_afspec
;
2573 u8 operstate
= netif_running(dev
) ? dev
->operstate
: IF_OPER_DOWN
;
2574 struct net_device
*br_dev
= netdev_master_upper_dev_get(dev
);
2576 nlh
= nlmsg_put(skb
, pid
, seq
, RTM_NEWLINK
, sizeof(*ifm
), NLM_F_MULTI
);
2580 ifm
= nlmsg_data(nlh
);
2581 ifm
->ifi_family
= AF_BRIDGE
;
2583 ifm
->ifi_type
= dev
->type
;
2584 ifm
->ifi_index
= dev
->ifindex
;
2585 ifm
->ifi_flags
= dev_get_flags(dev
);
2586 ifm
->ifi_change
= 0;
2589 if (nla_put_string(skb
, IFLA_IFNAME
, dev
->name
) ||
2590 nla_put_u32(skb
, IFLA_MTU
, dev
->mtu
) ||
2591 nla_put_u8(skb
, IFLA_OPERSTATE
, operstate
) ||
2593 nla_put_u32(skb
, IFLA_MASTER
, br_dev
->ifindex
)) ||
2595 nla_put(skb
, IFLA_ADDRESS
, dev
->addr_len
, dev
->dev_addr
)) ||
2596 (dev
->ifindex
!= dev
->iflink
&&
2597 nla_put_u32(skb
, IFLA_LINK
, dev
->iflink
)))
2598 goto nla_put_failure
;
2600 br_afspec
= nla_nest_start(skb
, IFLA_AF_SPEC
);
2602 goto nla_put_failure
;
2604 if (nla_put_u16(skb
, IFLA_BRIDGE_FLAGS
, BRIDGE_FLAGS_SELF
) ||
2605 nla_put_u16(skb
, IFLA_BRIDGE_MODE
, mode
)) {
2606 nla_nest_cancel(skb
, br_afspec
);
2607 goto nla_put_failure
;
2609 nla_nest_end(skb
, br_afspec
);
2611 return nlmsg_end(skb
, nlh
);
2613 nlmsg_cancel(skb
, nlh
);
2616 EXPORT_SYMBOL(ndo_dflt_bridge_getlink
);
2618 static int rtnl_bridge_getlink(struct sk_buff
*skb
, struct netlink_callback
*cb
)
2620 struct net
*net
= sock_net(skb
->sk
);
2621 struct net_device
*dev
;
2623 u32 portid
= NETLINK_CB(cb
->skb
).portid
;
2624 u32 seq
= cb
->nlh
->nlmsg_seq
;
2625 struct nlattr
*extfilt
;
2626 u32 filter_mask
= 0;
2628 extfilt
= nlmsg_find_attr(cb
->nlh
, sizeof(struct ifinfomsg
),
2631 filter_mask
= nla_get_u32(extfilt
);
2634 for_each_netdev_rcu(net
, dev
) {
2635 const struct net_device_ops
*ops
= dev
->netdev_ops
;
2636 struct net_device
*br_dev
= netdev_master_upper_dev_get(dev
);
2638 if (br_dev
&& br_dev
->netdev_ops
->ndo_bridge_getlink
) {
2639 if (idx
>= cb
->args
[0] &&
2640 br_dev
->netdev_ops
->ndo_bridge_getlink(
2641 skb
, portid
, seq
, dev
, filter_mask
) < 0)
2646 if (ops
->ndo_bridge_getlink
) {
2647 if (idx
>= cb
->args
[0] &&
2648 ops
->ndo_bridge_getlink(skb
, portid
, seq
, dev
,
2660 static inline size_t bridge_nlmsg_size(void)
2662 return NLMSG_ALIGN(sizeof(struct ifinfomsg
))
2663 + nla_total_size(IFNAMSIZ
) /* IFLA_IFNAME */
2664 + nla_total_size(MAX_ADDR_LEN
) /* IFLA_ADDRESS */
2665 + nla_total_size(sizeof(u32
)) /* IFLA_MASTER */
2666 + nla_total_size(sizeof(u32
)) /* IFLA_MTU */
2667 + nla_total_size(sizeof(u32
)) /* IFLA_LINK */
2668 + nla_total_size(sizeof(u32
)) /* IFLA_OPERSTATE */
2669 + nla_total_size(sizeof(u8
)) /* IFLA_PROTINFO */
2670 + nla_total_size(sizeof(struct nlattr
)) /* IFLA_AF_SPEC */
2671 + nla_total_size(sizeof(u16
)) /* IFLA_BRIDGE_FLAGS */
2672 + nla_total_size(sizeof(u16
)); /* IFLA_BRIDGE_MODE */
2675 static int rtnl_bridge_notify(struct net_device
*dev
, u16 flags
)
2677 struct net
*net
= dev_net(dev
);
2678 struct net_device
*br_dev
= netdev_master_upper_dev_get(dev
);
2679 struct sk_buff
*skb
;
2680 int err
= -EOPNOTSUPP
;
2682 skb
= nlmsg_new(bridge_nlmsg_size(), GFP_ATOMIC
);
2688 if ((!flags
|| (flags
& BRIDGE_FLAGS_MASTER
)) &&
2689 br_dev
&& br_dev
->netdev_ops
->ndo_bridge_getlink
) {
2690 err
= br_dev
->netdev_ops
->ndo_bridge_getlink(skb
, 0, 0, dev
, 0);
2695 if ((flags
& BRIDGE_FLAGS_SELF
) &&
2696 dev
->netdev_ops
->ndo_bridge_getlink
) {
2697 err
= dev
->netdev_ops
->ndo_bridge_getlink(skb
, 0, 0, dev
, 0);
2702 rtnl_notify(skb
, net
, 0, RTNLGRP_LINK
, NULL
, GFP_ATOMIC
);
2705 WARN_ON(err
== -EMSGSIZE
);
2707 rtnl_set_sk_err(net
, RTNLGRP_LINK
, err
);
2711 static int rtnl_bridge_setlink(struct sk_buff
*skb
, struct nlmsghdr
*nlh
)
2713 struct net
*net
= sock_net(skb
->sk
);
2714 struct ifinfomsg
*ifm
;
2715 struct net_device
*dev
;
2716 struct nlattr
*br_spec
, *attr
= NULL
;
2717 int rem
, err
= -EOPNOTSUPP
;
2718 u16 oflags
, flags
= 0;
2719 bool have_flags
= false;
2721 if (nlmsg_len(nlh
) < sizeof(*ifm
))
2724 ifm
= nlmsg_data(nlh
);
2725 if (ifm
->ifi_family
!= AF_BRIDGE
)
2726 return -EPFNOSUPPORT
;
2728 dev
= __dev_get_by_index(net
, ifm
->ifi_index
);
2730 pr_info("PF_BRIDGE: RTM_SETLINK with unknown ifindex\n");
2734 br_spec
= nlmsg_find_attr(nlh
, sizeof(struct ifinfomsg
), IFLA_AF_SPEC
);
2736 nla_for_each_nested(attr
, br_spec
, rem
) {
2737 if (nla_type(attr
) == IFLA_BRIDGE_FLAGS
) {
2739 flags
= nla_get_u16(attr
);
2747 if (!flags
|| (flags
& BRIDGE_FLAGS_MASTER
)) {
2748 struct net_device
*br_dev
= netdev_master_upper_dev_get(dev
);
2750 if (!br_dev
|| !br_dev
->netdev_ops
->ndo_bridge_setlink
) {
2755 err
= br_dev
->netdev_ops
->ndo_bridge_setlink(dev
, nlh
);
2759 flags
&= ~BRIDGE_FLAGS_MASTER
;
2762 if ((flags
& BRIDGE_FLAGS_SELF
)) {
2763 if (!dev
->netdev_ops
->ndo_bridge_setlink
)
2766 err
= dev
->netdev_ops
->ndo_bridge_setlink(dev
, nlh
);
2769 flags
&= ~BRIDGE_FLAGS_SELF
;
2773 memcpy(nla_data(attr
), &flags
, sizeof(flags
));
2774 /* Generate event to notify upper layer of bridge change */
2776 err
= rtnl_bridge_notify(dev
, oflags
);
2781 static int rtnl_bridge_dellink(struct sk_buff
*skb
, struct nlmsghdr
*nlh
)
2783 struct net
*net
= sock_net(skb
->sk
);
2784 struct ifinfomsg
*ifm
;
2785 struct net_device
*dev
;
2786 struct nlattr
*br_spec
, *attr
= NULL
;
2787 int rem
, err
= -EOPNOTSUPP
;
2788 u16 oflags
, flags
= 0;
2789 bool have_flags
= false;
2791 if (nlmsg_len(nlh
) < sizeof(*ifm
))
2794 ifm
= nlmsg_data(nlh
);
2795 if (ifm
->ifi_family
!= AF_BRIDGE
)
2796 return -EPFNOSUPPORT
;
2798 dev
= __dev_get_by_index(net
, ifm
->ifi_index
);
2800 pr_info("PF_BRIDGE: RTM_SETLINK with unknown ifindex\n");
2804 br_spec
= nlmsg_find_attr(nlh
, sizeof(struct ifinfomsg
), IFLA_AF_SPEC
);
2806 nla_for_each_nested(attr
, br_spec
, rem
) {
2807 if (nla_type(attr
) == IFLA_BRIDGE_FLAGS
) {
2809 flags
= nla_get_u16(attr
);
2817 if (!flags
|| (flags
& BRIDGE_FLAGS_MASTER
)) {
2818 struct net_device
*br_dev
= netdev_master_upper_dev_get(dev
);
2820 if (!br_dev
|| !br_dev
->netdev_ops
->ndo_bridge_dellink
) {
2825 err
= br_dev
->netdev_ops
->ndo_bridge_dellink(dev
, nlh
);
2829 flags
&= ~BRIDGE_FLAGS_MASTER
;
2832 if ((flags
& BRIDGE_FLAGS_SELF
)) {
2833 if (!dev
->netdev_ops
->ndo_bridge_dellink
)
2836 err
= dev
->netdev_ops
->ndo_bridge_dellink(dev
, nlh
);
2839 flags
&= ~BRIDGE_FLAGS_SELF
;
2843 memcpy(nla_data(attr
), &flags
, sizeof(flags
));
2844 /* Generate event to notify upper layer of bridge change */
2846 err
= rtnl_bridge_notify(dev
, oflags
);
2851 /* Process one rtnetlink message. */
2853 static int rtnetlink_rcv_msg(struct sk_buff
*skb
, struct nlmsghdr
*nlh
)
2855 struct net
*net
= sock_net(skb
->sk
);
2856 rtnl_doit_func doit
;
2862 type
= nlh
->nlmsg_type
;
2868 /* All the messages must have at least 1 byte length */
2869 if (nlmsg_len(nlh
) < sizeof(struct rtgenmsg
))
2872 family
= ((struct rtgenmsg
*)nlmsg_data(nlh
))->rtgen_family
;
2876 if (kind
!= 2 && !netlink_net_capable(skb
, CAP_NET_ADMIN
))
2879 if (kind
== 2 && nlh
->nlmsg_flags
&NLM_F_DUMP
) {
2881 rtnl_dumpit_func dumpit
;
2882 rtnl_calcit_func calcit
;
2883 u16 min_dump_alloc
= 0;
2885 dumpit
= rtnl_get_dumpit(family
, type
);
2888 calcit
= rtnl_get_calcit(family
, type
);
2890 min_dump_alloc
= calcit(skb
, nlh
);
2895 struct netlink_dump_control c
= {
2897 .min_dump_alloc
= min_dump_alloc
,
2899 err
= netlink_dump_start(rtnl
, skb
, nlh
, &c
);
2905 doit
= rtnl_get_doit(family
, type
);
2909 return doit(skb
, nlh
);
2912 static void rtnetlink_rcv(struct sk_buff
*skb
)
2915 netlink_rcv_skb(skb
, &rtnetlink_rcv_msg
);
2919 static int rtnetlink_event(struct notifier_block
*this, unsigned long event
, void *ptr
)
2921 struct net_device
*dev
= netdev_notifier_info_to_dev(ptr
);
2927 case NETDEV_POST_INIT
:
2928 case NETDEV_REGISTER
:
2930 case NETDEV_PRE_TYPE_CHANGE
:
2931 case NETDEV_GOING_DOWN
:
2932 case NETDEV_UNREGISTER
:
2933 case NETDEV_UNREGISTER_FINAL
:
2934 case NETDEV_RELEASE
:
2938 rtmsg_ifinfo(RTM_NEWLINK
, dev
, 0, GFP_KERNEL
);
2944 static struct notifier_block rtnetlink_dev_notifier
= {
2945 .notifier_call
= rtnetlink_event
,
2949 static int __net_init
rtnetlink_net_init(struct net
*net
)
2952 struct netlink_kernel_cfg cfg
= {
2953 .groups
= RTNLGRP_MAX
,
2954 .input
= rtnetlink_rcv
,
2955 .cb_mutex
= &rtnl_mutex
,
2956 .flags
= NL_CFG_F_NONROOT_RECV
,
2959 sk
= netlink_kernel_create(net
, NETLINK_ROUTE
, &cfg
);
2966 static void __net_exit
rtnetlink_net_exit(struct net
*net
)
2968 netlink_kernel_release(net
->rtnl
);
2972 static struct pernet_operations rtnetlink_net_ops
= {
2973 .init
= rtnetlink_net_init
,
2974 .exit
= rtnetlink_net_exit
,
2977 void __init
rtnetlink_init(void)
2979 if (register_pernet_subsys(&rtnetlink_net_ops
))
2980 panic("rtnetlink_init: cannot initialize rtnetlink\n");
2982 register_netdevice_notifier(&rtnetlink_dev_notifier
);
2984 rtnl_register(PF_UNSPEC
, RTM_GETLINK
, rtnl_getlink
,
2985 rtnl_dump_ifinfo
, rtnl_calcit
);
2986 rtnl_register(PF_UNSPEC
, RTM_SETLINK
, rtnl_setlink
, NULL
, NULL
);
2987 rtnl_register(PF_UNSPEC
, RTM_NEWLINK
, rtnl_newlink
, NULL
, NULL
);
2988 rtnl_register(PF_UNSPEC
, RTM_DELLINK
, rtnl_dellink
, NULL
, NULL
);
2990 rtnl_register(PF_UNSPEC
, RTM_GETADDR
, NULL
, rtnl_dump_all
, NULL
);
2991 rtnl_register(PF_UNSPEC
, RTM_GETROUTE
, NULL
, rtnl_dump_all
, NULL
);
2993 rtnl_register(PF_BRIDGE
, RTM_NEWNEIGH
, rtnl_fdb_add
, NULL
, NULL
);
2994 rtnl_register(PF_BRIDGE
, RTM_DELNEIGH
, rtnl_fdb_del
, NULL
, NULL
);
2995 rtnl_register(PF_BRIDGE
, RTM_GETNEIGH
, NULL
, rtnl_fdb_dump
, NULL
);
2997 rtnl_register(PF_BRIDGE
, RTM_GETLINK
, NULL
, rtnl_bridge_getlink
, NULL
);
2998 rtnl_register(PF_BRIDGE
, RTM_DELLINK
, rtnl_bridge_dellink
, NULL
, NULL
);
2999 rtnl_register(PF_BRIDGE
, RTM_SETLINK
, rtnl_bridge_setlink
, NULL
, NULL
);