/* git.proxmox.com Git - mirror_ovs.git/blob - datapath/vport-internal_dev.c
 * datapath: Improve kernel hash table
 * [mirror_ovs.git] / datapath / vport-internal_dev.c */
1 /*
2 * Copyright (c) 2009, 2010, 2011 Nicira Networks.
3 * Distributed under the terms of the GNU GPL version 2.
4 *
5 * Significant portions of this file may be copied from parts of the Linux
6 * kernel, by Linus Torvalds and others.
7 */
8
9 #include <linux/hardirq.h>
10 #include <linux/if_vlan.h>
11 #include <linux/kernel.h>
12 #include <linux/netdevice.h>
13 #include <linux/etherdevice.h>
14 #include <linux/ethtool.h>
15 #include <linux/skbuff.h>
16 #include <linux/version.h>
17
18 #include "checksum.h"
19 #include "datapath.h"
20 #include "vlan.h"
21 #include "vport-generic.h"
22 #include "vport-internal_dev.h"
23 #include "vport-netdev.h"
24
25 struct internal_dev {
26 struct vport *vport;
27 struct net_device_stats stats;
28 };
29
/* Returns the struct internal_dev held in the private area of 'netdev'. */
static inline struct internal_dev *internal_dev_priv(struct net_device *netdev)
{
	struct internal_dev *priv = netdev_priv(netdev);

	return priv;
}
34
35 /* This function is only called by the kernel network layer. It is not a vport
36 * get_stats() function. If a vport get_stats() function is defined that
37 * results in this being called it will cause infinite recursion. */
38 static struct net_device_stats *internal_dev_sys_stats(struct net_device *netdev)
39 {
40 struct vport *vport = internal_dev_get_vport(netdev);
41 struct net_device_stats *stats = &internal_dev_priv(netdev)->stats;
42
43 if (vport) {
44 struct rtnl_link_stats64 vport_stats;
45
46 vport_get_stats(vport, &vport_stats);
47
48 /* The tx and rx stats need to be swapped because the switch
49 * and host OS have opposite perspectives. */
50 stats->rx_packets = vport_stats.tx_packets;
51 stats->tx_packets = vport_stats.rx_packets;
52 stats->rx_bytes = vport_stats.tx_bytes;
53 stats->tx_bytes = vport_stats.rx_bytes;
54 stats->rx_errors = vport_stats.tx_errors;
55 stats->tx_errors = vport_stats.rx_errors;
56 stats->rx_dropped = vport_stats.tx_dropped;
57 stats->tx_dropped = vport_stats.rx_dropped;
58 stats->collisions = vport_stats.collisions;
59 }
60
61 return stats;
62 }
63
64 static int internal_dev_mac_addr(struct net_device *dev, void *p)
65 {
66 struct sockaddr *addr = p;
67
68 if (!is_valid_ether_addr(addr->sa_data))
69 return -EADDRNOTAVAIL;
70 memcpy(dev->dev_addr, addr->sa_data, dev->addr_len);
71 return 0;
72 }
73
74 /* Called with rcu_read_lock and bottom-halves disabled. */
75 static int internal_dev_xmit(struct sk_buff *skb, struct net_device *netdev)
76 {
77 if (unlikely(compute_ip_summed(skb, true))) {
78 kfree_skb(skb);
79 return 0;
80 }
81
82 vlan_copy_skb_tci(skb);
83 OVS_CB(skb)->flow = NULL;
84
85 vport_receive(internal_dev_priv(netdev)->vport, skb);
86 return 0;
87 }
88
/* Open callback: starts the device's transmit queue.  Always returns 0. */
static int internal_dev_open(struct net_device *netdev)
{
	netif_start_queue(netdev);

	return 0;
}
94
/* Stop callback: stops the device's transmit queue.  Always returns 0. */
static int internal_dev_stop(struct net_device *netdev)
{
	netif_stop_queue(netdev);

	return 0;
}
100
101 static void internal_dev_getinfo(struct net_device *netdev,
102 struct ethtool_drvinfo *info)
103 {
104 strcpy(info->driver, "openvswitch");
105 }
106
107 static const struct ethtool_ops internal_dev_ethtool_ops = {
108 .get_drvinfo = internal_dev_getinfo,
109 .get_link = ethtool_op_get_link,
110 .get_sg = ethtool_op_get_sg,
111 .set_sg = ethtool_op_set_sg,
112 .get_tx_csum = ethtool_op_get_tx_csum,
113 .set_tx_csum = ethtool_op_set_tx_hw_csum,
114 .get_tso = ethtool_op_get_tso,
115 .set_tso = ethtool_op_set_tso,
116 };
117
118 static int internal_dev_change_mtu(struct net_device *netdev, int new_mtu)
119 {
120 struct vport *vport = internal_dev_get_vport(netdev);
121
122 if (new_mtu < 68)
123 return -EINVAL;
124
125 if (new_mtu > dp_min_mtu(vport->dp))
126 return -EINVAL;
127
128 netdev->mtu = new_mtu;
129 return 0;
130 }
131
132 static int internal_dev_do_ioctl(struct net_device *dev, struct ifreq *ifr, int cmd)
133 {
134 if (dp_ioctl_hook)
135 return dp_ioctl_hook(dev, ifr, cmd);
136
137 return -EOPNOTSUPP;
138 }
139
/* net_device destructor (installed by do_setup()): frees the vport attached
 * to 'dev' and then the net_device itself. */
static void internal_dev_destructor(struct net_device *dev)
{
	/* Look the vport up before 'dev' is freed. */
	struct vport *owner = internal_dev_get_vport(dev);

	vport_free(owner);
	free_netdev(dev);
}
147
#ifdef HAVE_NET_DEVICE_OPS
/* Device operations for internal devices on kernels that provide
 * struct net_device_ops.  The address of this table is also what
 * is_internal_dev() compares against to recognize an internal device. */
static const struct net_device_ops internal_dev_netdev_ops = {
	.ndo_open		= internal_dev_open,
	.ndo_stop		= internal_dev_stop,
	.ndo_start_xmit		= internal_dev_xmit,
	.ndo_set_mac_address	= internal_dev_mac_addr,
	.ndo_do_ioctl		= internal_dev_do_ioctl,
	.ndo_change_mtu		= internal_dev_change_mtu,
	.ndo_get_stats		= internal_dev_sys_stats,
};
#endif
159
160 static void do_setup(struct net_device *netdev)
161 {
162 ether_setup(netdev);
163
164 #ifdef HAVE_NET_DEVICE_OPS
165 netdev->netdev_ops = &internal_dev_netdev_ops;
166 #else
167 netdev->do_ioctl = internal_dev_do_ioctl;
168 netdev->get_stats = internal_dev_sys_stats;
169 netdev->hard_start_xmit = internal_dev_xmit;
170 netdev->open = internal_dev_open;
171 netdev->stop = internal_dev_stop;
172 netdev->set_mac_address = internal_dev_mac_addr;
173 netdev->change_mtu = internal_dev_change_mtu;
174 #endif
175
176 netdev->destructor = internal_dev_destructor;
177 SET_ETHTOOL_OPS(netdev, &internal_dev_ethtool_ops);
178 netdev->tx_queue_len = 0;
179
180 netdev->flags = IFF_BROADCAST | IFF_MULTICAST;
181 netdev->features = NETIF_F_LLTX | NETIF_F_SG | NETIF_F_FRAGLIST |
182 NETIF_F_HIGHDMA | NETIF_F_HW_CSUM | NETIF_F_TSO;
183
184 #if LINUX_VERSION_CODE >= KERNEL_VERSION(2,6,27)
185 netdev->vlan_features = netdev->features;
186 netdev->features |= NETIF_F_HW_VLAN_TX;
187 #endif
188
189 vport_gen_rand_ether_addr(netdev->dev_addr);
190 }
191
192 static struct vport *internal_dev_create(const struct vport_parms *parms)
193 {
194 struct vport *vport;
195 struct netdev_vport *netdev_vport;
196 struct internal_dev *internal_dev;
197 int err;
198
199 vport = vport_alloc(sizeof(struct netdev_vport), &internal_vport_ops, parms);
200 if (IS_ERR(vport)) {
201 err = PTR_ERR(vport);
202 goto error;
203 }
204
205 netdev_vport = netdev_vport_priv(vport);
206
207 netdev_vport->dev = alloc_netdev(sizeof(struct internal_dev), parms->name, do_setup);
208 if (!netdev_vport->dev) {
209 err = -ENOMEM;
210 goto error_free_vport;
211 }
212
213 internal_dev = internal_dev_priv(netdev_vport->dev);
214 internal_dev->vport = vport;
215
216 err = register_netdevice(netdev_vport->dev);
217 if (err)
218 goto error_free_netdev;
219
220 dev_set_promiscuity(netdev_vport->dev, 1);
221 netif_start_queue(netdev_vport->dev);
222
223 return vport;
224
225 error_free_netdev:
226 free_netdev(netdev_vport->dev);
227 error_free_vport:
228 vport_free(vport);
229 error:
230 return ERR_PTR(err);
231 }
232
233 static void internal_dev_destroy(struct vport *vport)
234 {
235 struct netdev_vport *netdev_vport = netdev_vport_priv(vport);
236
237 netif_stop_queue(netdev_vport->dev);
238 dev_set_promiscuity(netdev_vport->dev, -1);
239
240 /* unregister_netdevice() waits for an RCU grace period. */
241 unregister_netdevice(netdev_vport->dev);
242 }
243
244 static int internal_dev_recv(struct vport *vport, struct sk_buff *skb)
245 {
246 struct net_device *netdev = netdev_vport_priv(vport)->dev;
247 int len;
248
249 #if LINUX_VERSION_CODE < KERNEL_VERSION(2,6,37)
250 if (unlikely(vlan_deaccel_tag(skb)))
251 return 0;
252 #endif
253
254 len = skb->len;
255 skb->dev = netdev;
256 skb->pkt_type = PACKET_HOST;
257 skb->protocol = eth_type_trans(skb, netdev);
258 forward_ip_summed(skb, false);
259
260 if (in_interrupt())
261 netif_rx(skb);
262 else
263 netif_rx_ni(skb);
264
265 #if LINUX_VERSION_CODE < KERNEL_VERSION(2,6,29)
266 netdev->last_rx = jiffies;
267 #endif
268
269 return len;
270 }
271
272 const struct vport_ops internal_vport_ops = {
273 .type = OVS_VPORT_TYPE_INTERNAL,
274 .flags = VPORT_F_REQUIRED | VPORT_F_GEN_STATS | VPORT_F_FLOW,
275 .create = internal_dev_create,
276 .destroy = internal_dev_destroy,
277 .set_mtu = netdev_set_mtu,
278 .set_addr = netdev_set_addr,
279 .get_name = netdev_get_name,
280 .get_addr = netdev_get_addr,
281 .get_kobj = netdev_get_kobj,
282 .get_dev_flags = netdev_get_dev_flags,
283 .is_running = netdev_is_running,
284 .get_operstate = netdev_get_operstate,
285 .get_ifindex = netdev_get_ifindex,
286 .get_mtu = netdev_get_mtu,
287 .send = internal_dev_recv,
288 };
289
290 int is_internal_dev(const struct net_device *netdev)
291 {
292 #ifdef HAVE_NET_DEVICE_OPS
293 return netdev->netdev_ops == &internal_dev_netdev_ops;
294 #else
295 return netdev->open == internal_dev_open;
296 #endif
297 }
298
299 int is_internal_vport(const struct vport *vport)
300 {
301 return vport->ops == &internal_vport_ops;
302 }
303
304 struct vport *internal_dev_get_vport(struct net_device *netdev)
305 {
306 if (!is_internal_dev(netdev))
307 return NULL;
308
309 return internal_dev_priv(netdev)->vport;
310 }