]>
Commit | Line | Data |
---|---|---|
b863ceb7 PM |
1 | /* |
2 | * Copyright (c) 2007 Patrick McHardy <kaber@trash.net> | |
3 | * | |
4 | * This program is free software; you can redistribute it and/or | |
5 | * modify it under the terms of the GNU General Public License as | |
6 | * published by the Free Software Foundation; either version 2 of | |
7 | * the License, or (at your option) any later version. | |
8 | * | |
9 | * The code this is based on carried the following copyright notice: | |
10 | * --- | |
11 | * (C) Copyright 2001-2006 | |
12 | * Alex Zeffertt, Cambridge Broadband Ltd, ajz@cambridgebroadband.com | |
13 | * Re-worked by Ben Greear <greearb@candelatech.com> | |
14 | * --- | |
15 | */ | |
16 | #include <linux/kernel.h> | |
17 | #include <linux/types.h> | |
18 | #include <linux/module.h> | |
19 | #include <linux/init.h> | |
20 | #include <linux/errno.h> | |
21 | #include <linux/slab.h> | |
22 | #include <linux/string.h> | |
23 | #include <linux/list.h> | |
24 | #include <linux/notifier.h> | |
25 | #include <linux/netdevice.h> | |
26 | #include <linux/etherdevice.h> | |
27 | #include <linux/ethtool.h> | |
28 | #include <linux/if_arp.h> | |
29 | #include <linux/if_link.h> | |
30 | #include <linux/if_macvlan.h> | |
31 | #include <net/rtnetlink.h> | |
32 | ||
/* Number of buckets in a port's vlan_hash table (one per value of a byte). */
#define MACVLAN_HASH_SIZE (1 << BITS_PER_BYTE)
34 | ||
35 | struct macvlan_port { | |
36 | struct net_device *dev; | |
37 | struct hlist_head vlan_hash[MACVLAN_HASH_SIZE]; | |
38 | struct list_head vlans; | |
39 | }; | |
40 | ||
41 | struct macvlan_dev { | |
42 | struct net_device *dev; | |
43 | struct list_head list; | |
44 | struct hlist_node hlist; | |
45 | struct macvlan_port *port; | |
46 | struct net_device *lowerdev; | |
47 | }; | |
48 | ||
49 | ||
50 | static struct macvlan_dev *macvlan_hash_lookup(const struct macvlan_port *port, | |
51 | const unsigned char *addr) | |
52 | { | |
53 | struct macvlan_dev *vlan; | |
54 | struct hlist_node *n; | |
55 | ||
56 | hlist_for_each_entry_rcu(vlan, n, &port->vlan_hash[addr[5]], hlist) { | |
57 | if (!compare_ether_addr(vlan->dev->dev_addr, addr)) | |
58 | return vlan; | |
59 | } | |
60 | return NULL; | |
61 | } | |
62 | ||
63 | static void macvlan_broadcast(struct sk_buff *skb, | |
64 | const struct macvlan_port *port) | |
65 | { | |
66 | const struct ethhdr *eth = eth_hdr(skb); | |
67 | const struct macvlan_dev *vlan; | |
68 | struct hlist_node *n; | |
69 | struct net_device *dev; | |
70 | struct sk_buff *nskb; | |
71 | unsigned int i; | |
72 | ||
73 | for (i = 0; i < MACVLAN_HASH_SIZE; i++) { | |
74 | hlist_for_each_entry_rcu(vlan, n, &port->vlan_hash[i], hlist) { | |
75 | dev = vlan->dev; | |
b863ceb7 PM |
76 | |
77 | nskb = skb_clone(skb, GFP_ATOMIC); | |
78 | if (nskb == NULL) { | |
79 | dev->stats.rx_errors++; | |
80 | dev->stats.rx_dropped++; | |
81 | continue; | |
82 | } | |
83 | ||
84 | dev->stats.rx_bytes += skb->len + ETH_HLEN; | |
85 | dev->stats.rx_packets++; | |
86 | dev->stats.multicast++; | |
87 | dev->last_rx = jiffies; | |
88 | ||
89 | nskb->dev = dev; | |
90 | if (!compare_ether_addr(eth->h_dest, dev->broadcast)) | |
91 | nskb->pkt_type = PACKET_BROADCAST; | |
92 | else | |
93 | nskb->pkt_type = PACKET_MULTICAST; | |
94 | ||
95 | netif_rx(nskb); | |
96 | } | |
97 | } | |
98 | } | |
99 | ||
100 | /* called under rcu_read_lock() from netif_receive_skb */ | |
101 | static struct sk_buff *macvlan_handle_frame(struct sk_buff *skb) | |
102 | { | |
103 | const struct ethhdr *eth = eth_hdr(skb); | |
104 | const struct macvlan_port *port; | |
105 | const struct macvlan_dev *vlan; | |
106 | struct net_device *dev; | |
107 | ||
108 | port = rcu_dereference(skb->dev->macvlan_port); | |
109 | if (port == NULL) | |
110 | return skb; | |
111 | ||
112 | if (is_multicast_ether_addr(eth->h_dest)) { | |
113 | macvlan_broadcast(skb, port); | |
114 | return skb; | |
115 | } | |
116 | ||
117 | vlan = macvlan_hash_lookup(port, eth->h_dest); | |
118 | if (vlan == NULL) | |
119 | return skb; | |
120 | ||
121 | dev = vlan->dev; | |
122 | if (unlikely(!(dev->flags & IFF_UP))) { | |
123 | kfree_skb(skb); | |
124 | return NULL; | |
125 | } | |
126 | ||
127 | skb = skb_share_check(skb, GFP_ATOMIC); | |
128 | if (skb == NULL) { | |
129 | dev->stats.rx_errors++; | |
130 | dev->stats.rx_dropped++; | |
131 | return NULL; | |
132 | } | |
133 | ||
134 | dev->stats.rx_bytes += skb->len + ETH_HLEN; | |
135 | dev->stats.rx_packets++; | |
136 | dev->last_rx = jiffies; | |
137 | ||
138 | skb->dev = dev; | |
139 | skb->pkt_type = PACKET_HOST; | |
140 | ||
141 | netif_rx(skb); | |
142 | return NULL; | |
143 | } | |
144 | ||
145 | static int macvlan_hard_start_xmit(struct sk_buff *skb, struct net_device *dev) | |
146 | { | |
147 | const struct macvlan_dev *vlan = netdev_priv(dev); | |
148 | unsigned int len = skb->len; | |
149 | int ret; | |
150 | ||
151 | skb->dev = vlan->lowerdev; | |
152 | ret = dev_queue_xmit(skb); | |
153 | ||
154 | if (likely(ret == NET_XMIT_SUCCESS)) { | |
155 | dev->stats.tx_packets++; | |
156 | dev->stats.tx_bytes += len; | |
157 | } else { | |
158 | dev->stats.tx_errors++; | |
159 | dev->stats.tx_aborted_errors++; | |
160 | } | |
161 | return NETDEV_TX_OK; | |
162 | } | |
163 | ||
164 | static int macvlan_hard_header(struct sk_buff *skb, struct net_device *dev, | |
3b04ddde SH |
165 | unsigned short type, const void *daddr, |
166 | const void *saddr, unsigned len) | |
b863ceb7 PM |
167 | { |
168 | const struct macvlan_dev *vlan = netdev_priv(dev); | |
169 | struct net_device *lowerdev = vlan->lowerdev; | |
170 | ||
0c4e8581 SH |
171 | return dev_hard_header(skb, lowerdev, type, daddr, |
172 | saddr ? : dev->dev_addr, len); | |
b863ceb7 PM |
173 | } |
174 | ||
3b04ddde SH |
175 | static const struct header_ops macvlan_hard_header_ops = { |
176 | .create = macvlan_hard_header, | |
177 | .rebuild = eth_rebuild_header, | |
178 | .parse = eth_header_parse, | |
3b04ddde SH |
179 | .cache = eth_header_cache, |
180 | .cache_update = eth_header_cache_update, | |
181 | }; | |
182 | ||
b863ceb7 PM |
183 | static int macvlan_open(struct net_device *dev) |
184 | { | |
185 | struct macvlan_dev *vlan = netdev_priv(dev); | |
186 | struct macvlan_port *port = vlan->port; | |
187 | struct net_device *lowerdev = vlan->lowerdev; | |
188 | int err; | |
189 | ||
190 | err = dev_unicast_add(lowerdev, dev->dev_addr, ETH_ALEN); | |
191 | if (err < 0) | |
b89fb7da WC |
192 | goto out; |
193 | if (dev->flags & IFF_ALLMULTI) { | |
194 | err = dev_set_allmulti(lowerdev, 1); | |
195 | if (err < 0) | |
196 | goto del_unicast; | |
197 | } | |
b863ceb7 PM |
198 | |
199 | hlist_add_head_rcu(&vlan->hlist, &port->vlan_hash[dev->dev_addr[5]]); | |
200 | return 0; | |
b89fb7da WC |
201 | |
202 | del_unicast: | |
203 | dev_unicast_delete(lowerdev, dev->dev_addr, ETH_ALEN); | |
204 | out: | |
205 | return err; | |
b863ceb7 PM |
206 | } |
207 | ||
208 | static int macvlan_stop(struct net_device *dev) | |
209 | { | |
210 | struct macvlan_dev *vlan = netdev_priv(dev); | |
211 | struct net_device *lowerdev = vlan->lowerdev; | |
212 | ||
213 | dev_mc_unsync(lowerdev, dev); | |
214 | if (dev->flags & IFF_ALLMULTI) | |
215 | dev_set_allmulti(lowerdev, -1); | |
216 | ||
217 | dev_unicast_delete(lowerdev, dev->dev_addr, ETH_ALEN); | |
218 | ||
219 | hlist_del_rcu(&vlan->hlist); | |
220 | synchronize_rcu(); | |
221 | return 0; | |
222 | } | |
223 | ||
ad5d20a6 PM |
224 | static int macvlan_set_mac_address(struct net_device *dev, void *p) |
225 | { | |
226 | struct macvlan_dev *vlan = netdev_priv(dev); | |
227 | struct net_device *lowerdev = vlan->lowerdev; | |
228 | struct sockaddr *addr = p; | |
229 | int err; | |
230 | ||
231 | if (!is_valid_ether_addr(addr->sa_data)) | |
232 | return -EADDRNOTAVAIL; | |
233 | ||
234 | if (!(dev->flags & IFF_UP)) | |
235 | goto out; | |
236 | ||
237 | err = dev_unicast_add(lowerdev, addr->sa_data, ETH_ALEN); | |
238 | if (err < 0) | |
239 | return err; | |
240 | dev_unicast_delete(lowerdev, dev->dev_addr, ETH_ALEN); | |
241 | ||
242 | out: | |
243 | memcpy(dev->dev_addr, addr->sa_data, ETH_ALEN); | |
244 | return 0; | |
245 | } | |
246 | ||
b863ceb7 PM |
247 | static void macvlan_change_rx_flags(struct net_device *dev, int change) |
248 | { | |
249 | struct macvlan_dev *vlan = netdev_priv(dev); | |
250 | struct net_device *lowerdev = vlan->lowerdev; | |
251 | ||
252 | if (change & IFF_ALLMULTI) | |
253 | dev_set_allmulti(lowerdev, dev->flags & IFF_ALLMULTI ? 1 : -1); | |
254 | } | |
255 | ||
256 | static void macvlan_set_multicast_list(struct net_device *dev) | |
257 | { | |
258 | struct macvlan_dev *vlan = netdev_priv(dev); | |
259 | ||
260 | dev_mc_sync(vlan->lowerdev, dev); | |
261 | } | |
262 | ||
263 | static int macvlan_change_mtu(struct net_device *dev, int new_mtu) | |
264 | { | |
265 | struct macvlan_dev *vlan = netdev_priv(dev); | |
266 | ||
267 | if (new_mtu < 68 || vlan->lowerdev->mtu < new_mtu) | |
268 | return -EINVAL; | |
269 | dev->mtu = new_mtu; | |
270 | return 0; | |
271 | } | |
272 | ||
/*
 * macvlan network devices have devices nesting below them and are a special
 * "super class" of normal network devices; split their locks off into a
 * separate class since they always nest.
 */
static struct lock_class_key macvlan_netdev_xmit_lock_key;

/* Feature bits a macvlan takes over from its lower device. */
#define MACVLAN_FEATURES \
	(NETIF_F_SG | NETIF_F_ALL_CSUM | NETIF_F_HIGHDMA | NETIF_F_FRAGLIST | \
	NETIF_F_GSO | NETIF_F_TSO | NETIF_F_UFO | NETIF_F_GSO_ROBUST | \
	NETIF_F_TSO_ECN | NETIF_F_TSO6)

/* Link-state bits copied from the lower device when a macvlan is set up. */
#define MACVLAN_STATE_MASK \
	((1<<__LINK_STATE_NOCARRIER) | (1<<__LINK_STATE_DORMANT))
287 | ||
c773e847 DM |
288 | static void macvlan_set_lockdep_class_one(struct netdev_queue *txq) |
289 | { | |
290 | lockdep_set_class(&txq->_xmit_lock, | |
291 | &macvlan_netdev_xmit_lock_key); | |
292 | } | |
293 | ||
294 | static void macvlan_set_lockdep_class(struct net_device *dev) | |
295 | { | |
296 | macvlan_set_lockdep_class_one(&dev->tx_queue); | |
297 | } | |
298 | ||
b863ceb7 PM |
299 | static int macvlan_init(struct net_device *dev) |
300 | { | |
301 | struct macvlan_dev *vlan = netdev_priv(dev); | |
302 | const struct net_device *lowerdev = vlan->lowerdev; | |
303 | ||
304 | dev->state = (dev->state & ~MACVLAN_STATE_MASK) | | |
305 | (lowerdev->state & MACVLAN_STATE_MASK); | |
306 | dev->features = lowerdev->features & MACVLAN_FEATURES; | |
307 | dev->iflink = lowerdev->ifindex; | |
308 | ||
c773e847 DM |
309 | macvlan_set_lockdep_class(dev); |
310 | ||
b863ceb7 PM |
311 | return 0; |
312 | } | |
313 | ||
314 | static void macvlan_ethtool_get_drvinfo(struct net_device *dev, | |
315 | struct ethtool_drvinfo *drvinfo) | |
316 | { | |
317 | snprintf(drvinfo->driver, 32, "macvlan"); | |
318 | snprintf(drvinfo->version, 32, "0.1"); | |
319 | } | |
320 | ||
321 | static u32 macvlan_ethtool_get_rx_csum(struct net_device *dev) | |
322 | { | |
323 | const struct macvlan_dev *vlan = netdev_priv(dev); | |
324 | struct net_device *lowerdev = vlan->lowerdev; | |
325 | ||
326 | if (lowerdev->ethtool_ops->get_rx_csum == NULL) | |
327 | return 0; | |
328 | return lowerdev->ethtool_ops->get_rx_csum(lowerdev); | |
329 | } | |
330 | ||
331 | static const struct ethtool_ops macvlan_ethtool_ops = { | |
332 | .get_link = ethtool_op_get_link, | |
333 | .get_rx_csum = macvlan_ethtool_get_rx_csum, | |
b863ceb7 PM |
334 | .get_drvinfo = macvlan_ethtool_get_drvinfo, |
335 | }; | |
336 | ||
337 | static void macvlan_setup(struct net_device *dev) | |
338 | { | |
339 | ether_setup(dev); | |
340 | ||
341 | dev->init = macvlan_init; | |
342 | dev->open = macvlan_open; | |
343 | dev->stop = macvlan_stop; | |
344 | dev->change_mtu = macvlan_change_mtu; | |
345 | dev->change_rx_flags = macvlan_change_rx_flags; | |
ad5d20a6 | 346 | dev->set_mac_address = macvlan_set_mac_address; |
b863ceb7 | 347 | dev->set_multicast_list = macvlan_set_multicast_list; |
b863ceb7 PM |
348 | dev->hard_start_xmit = macvlan_hard_start_xmit; |
349 | dev->destructor = free_netdev; | |
3b04ddde | 350 | dev->header_ops = &macvlan_hard_header_ops, |
b863ceb7 PM |
351 | dev->ethtool_ops = &macvlan_ethtool_ops; |
352 | dev->tx_queue_len = 0; | |
353 | } | |
354 | ||
355 | static int macvlan_port_create(struct net_device *dev) | |
356 | { | |
357 | struct macvlan_port *port; | |
358 | unsigned int i; | |
359 | ||
360 | if (dev->type != ARPHRD_ETHER || dev->flags & IFF_LOOPBACK) | |
361 | return -EINVAL; | |
362 | ||
363 | port = kzalloc(sizeof(*port), GFP_KERNEL); | |
364 | if (port == NULL) | |
365 | return -ENOMEM; | |
366 | ||
367 | port->dev = dev; | |
368 | INIT_LIST_HEAD(&port->vlans); | |
369 | for (i = 0; i < MACVLAN_HASH_SIZE; i++) | |
370 | INIT_HLIST_HEAD(&port->vlan_hash[i]); | |
371 | rcu_assign_pointer(dev->macvlan_port, port); | |
372 | return 0; | |
373 | } | |
374 | ||
375 | static void macvlan_port_destroy(struct net_device *dev) | |
376 | { | |
377 | struct macvlan_port *port = dev->macvlan_port; | |
378 | ||
379 | rcu_assign_pointer(dev->macvlan_port, NULL); | |
380 | synchronize_rcu(); | |
381 | kfree(port); | |
382 | } | |
383 | ||
384 | static void macvlan_transfer_operstate(struct net_device *dev) | |
385 | { | |
386 | struct macvlan_dev *vlan = netdev_priv(dev); | |
387 | const struct net_device *lowerdev = vlan->lowerdev; | |
388 | ||
389 | if (lowerdev->operstate == IF_OPER_DORMANT) | |
390 | netif_dormant_on(dev); | |
391 | else | |
392 | netif_dormant_off(dev); | |
393 | ||
394 | if (netif_carrier_ok(lowerdev)) { | |
395 | if (!netif_carrier_ok(dev)) | |
396 | netif_carrier_on(dev); | |
397 | } else { | |
f12ca5f9 | 398 | if (netif_carrier_ok(dev)) |
b863ceb7 PM |
399 | netif_carrier_off(dev); |
400 | } | |
401 | } | |
402 | ||
403 | static int macvlan_validate(struct nlattr *tb[], struct nlattr *data[]) | |
404 | { | |
405 | if (tb[IFLA_ADDRESS]) { | |
406 | if (nla_len(tb[IFLA_ADDRESS]) != ETH_ALEN) | |
407 | return -EINVAL; | |
408 | if (!is_valid_ether_addr(nla_data(tb[IFLA_ADDRESS]))) | |
409 | return -EADDRNOTAVAIL; | |
410 | } | |
411 | return 0; | |
412 | } | |
413 | ||
414 | static int macvlan_newlink(struct net_device *dev, | |
415 | struct nlattr *tb[], struct nlattr *data[]) | |
416 | { | |
417 | struct macvlan_dev *vlan = netdev_priv(dev); | |
418 | struct macvlan_port *port; | |
419 | struct net_device *lowerdev; | |
420 | int err; | |
421 | ||
422 | if (!tb[IFLA_LINK]) | |
423 | return -EINVAL; | |
424 | ||
c346dca1 | 425 | lowerdev = __dev_get_by_index(dev_net(dev), nla_get_u32(tb[IFLA_LINK])); |
b863ceb7 PM |
426 | if (lowerdev == NULL) |
427 | return -ENODEV; | |
428 | ||
a6ca5f1d PM |
429 | /* Don't allow macvlans on top of other macvlans - its not really |
430 | * wrong, but lockdep can't handle it and its not useful for anything | |
431 | * you couldn't do directly on top of the real device. | |
432 | */ | |
433 | if (lowerdev->rtnl_link_ops == dev->rtnl_link_ops) | |
434 | return -ENODEV; | |
435 | ||
b863ceb7 PM |
436 | if (!tb[IFLA_MTU]) |
437 | dev->mtu = lowerdev->mtu; | |
438 | else if (dev->mtu > lowerdev->mtu) | |
439 | return -EINVAL; | |
440 | ||
441 | if (!tb[IFLA_ADDRESS]) | |
442 | random_ether_addr(dev->dev_addr); | |
443 | ||
444 | if (lowerdev->macvlan_port == NULL) { | |
445 | err = macvlan_port_create(lowerdev); | |
446 | if (err < 0) | |
447 | return err; | |
448 | } | |
449 | port = lowerdev->macvlan_port; | |
450 | ||
451 | vlan->lowerdev = lowerdev; | |
452 | vlan->dev = dev; | |
453 | vlan->port = port; | |
454 | ||
455 | err = register_netdevice(dev); | |
456 | if (err < 0) | |
457 | return err; | |
458 | ||
459 | list_add_tail(&vlan->list, &port->vlans); | |
460 | macvlan_transfer_operstate(dev); | |
461 | return 0; | |
462 | } | |
463 | ||
464 | static void macvlan_dellink(struct net_device *dev) | |
465 | { | |
466 | struct macvlan_dev *vlan = netdev_priv(dev); | |
467 | struct macvlan_port *port = vlan->port; | |
468 | ||
469 | list_del(&vlan->list); | |
470 | unregister_netdevice(dev); | |
471 | ||
472 | if (list_empty(&port->vlans)) | |
73120964 | 473 | macvlan_port_destroy(port->dev); |
b863ceb7 PM |
474 | } |
475 | ||
476 | static struct rtnl_link_ops macvlan_link_ops __read_mostly = { | |
477 | .kind = "macvlan", | |
478 | .priv_size = sizeof(struct macvlan_dev), | |
479 | .setup = macvlan_setup, | |
480 | .validate = macvlan_validate, | |
481 | .newlink = macvlan_newlink, | |
482 | .dellink = macvlan_dellink, | |
483 | }; | |
484 | ||
485 | static int macvlan_device_event(struct notifier_block *unused, | |
486 | unsigned long event, void *ptr) | |
487 | { | |
488 | struct net_device *dev = ptr; | |
489 | struct macvlan_dev *vlan, *next; | |
490 | struct macvlan_port *port; | |
491 | ||
492 | port = dev->macvlan_port; | |
493 | if (port == NULL) | |
494 | return NOTIFY_DONE; | |
495 | ||
496 | switch (event) { | |
497 | case NETDEV_CHANGE: | |
498 | list_for_each_entry(vlan, &port->vlans, list) | |
499 | macvlan_transfer_operstate(vlan->dev); | |
500 | break; | |
501 | case NETDEV_FEAT_CHANGE: | |
502 | list_for_each_entry(vlan, &port->vlans, list) { | |
503 | vlan->dev->features = dev->features & MACVLAN_FEATURES; | |
504 | netdev_features_change(vlan->dev); | |
505 | } | |
506 | break; | |
507 | case NETDEV_UNREGISTER: | |
508 | list_for_each_entry_safe(vlan, next, &port->vlans, list) | |
509 | macvlan_dellink(vlan->dev); | |
510 | break; | |
511 | } | |
512 | return NOTIFY_DONE; | |
513 | } | |
514 | ||
515 | static struct notifier_block macvlan_notifier_block __read_mostly = { | |
516 | .notifier_call = macvlan_device_event, | |
517 | }; | |
518 | ||
519 | static int __init macvlan_init_module(void) | |
520 | { | |
521 | int err; | |
522 | ||
523 | register_netdevice_notifier(&macvlan_notifier_block); | |
524 | macvlan_handle_frame_hook = macvlan_handle_frame; | |
525 | ||
526 | err = rtnl_link_register(&macvlan_link_ops); | |
527 | if (err < 0) | |
528 | goto err1; | |
529 | return 0; | |
530 | err1: | |
52913246 | 531 | macvlan_handle_frame_hook = NULL; |
b863ceb7 PM |
532 | unregister_netdevice_notifier(&macvlan_notifier_block); |
533 | return err; | |
534 | } | |
535 | ||
536 | static void __exit macvlan_cleanup_module(void) | |
537 | { | |
538 | rtnl_link_unregister(&macvlan_link_ops); | |
539 | macvlan_handle_frame_hook = NULL; | |
540 | unregister_netdevice_notifier(&macvlan_notifier_block); | |
541 | } | |
542 | ||
/* Module entry and exit points. */
module_init(macvlan_init_module);
module_exit(macvlan_cleanup_module);

/* Module metadata; the alias matches the "macvlan" rtnl link kind. */
MODULE_LICENSE("GPL");
MODULE_AUTHOR("Patrick McHardy <kaber@trash.net>");
MODULE_DESCRIPTION("Driver for MAC address based VLANs");
MODULE_ALIAS_RTNL_LINK("macvlan");