git.proxmox.com Git - mirror_ovs.git/blob - datapath/vport-internal_dev.c
datapath: Don't free vport until all references are gone.
[mirror_ovs.git] / datapath / vport-internal_dev.c
1 /*
2 * Copyright (c) 2009, 2010, 2011 Nicira Networks.
3 * Distributed under the terms of the GNU GPL version 2.
4 *
5 * Significant portions of this file may be copied from parts of the Linux
6 * kernel, by Linus Torvalds and others.
7 */
8
9 #include <linux/if_vlan.h>
10 #include <linux/kernel.h>
11 #include <linux/netdevice.h>
12 #include <linux/etherdevice.h>
13 #include <linux/ethtool.h>
14 #include <linux/skbuff.h>
15 #include <linux/version.h>
16
17 #include "checksum.h"
18 #include "datapath.h"
19 #include "vlan.h"
20 #include "vport-generic.h"
21 #include "vport-internal_dev.h"
22 #include "vport-netdev.h"
23
24 struct internal_dev {
25 struct vport *vport;
26 struct net_device_stats stats;
27 };
28
/* Returns the 'struct internal_dev' stored in the private area of 'netdev'. */
static inline struct internal_dev *internal_dev_priv(struct net_device *netdev)
{
	struct internal_dev *priv = netdev_priv(netdev);

	return priv;
}
33
34 /* This function is only called by the kernel network layer. It is not a vport
35 * get_stats() function. If a vport get_stats() function is defined that
36 * results in this being called it will cause infinite recursion. */
37 static struct net_device_stats *internal_dev_sys_stats(struct net_device *netdev)
38 {
39 struct vport *vport = internal_dev_get_vport(netdev);
40 struct net_device_stats *stats = &internal_dev_priv(netdev)->stats;
41
42 if (vport) {
43 struct rtnl_link_stats64 vport_stats;
44
45 vport_get_stats(vport, &vport_stats);
46
47 /* The tx and rx stats need to be swapped because the switch
48 * and host OS have opposite perspectives. */
49 stats->rx_packets = vport_stats.tx_packets;
50 stats->tx_packets = vport_stats.rx_packets;
51 stats->rx_bytes = vport_stats.tx_bytes;
52 stats->tx_bytes = vport_stats.rx_bytes;
53 stats->rx_errors = vport_stats.tx_errors;
54 stats->tx_errors = vport_stats.rx_errors;
55 stats->rx_dropped = vport_stats.tx_dropped;
56 stats->tx_dropped = vport_stats.rx_dropped;
57 stats->collisions = vport_stats.collisions;
58 }
59
60 return stats;
61 }
62
63 static int internal_dev_mac_addr(struct net_device *dev, void *p)
64 {
65 struct sockaddr *addr = p;
66
67 if (!is_valid_ether_addr(addr->sa_data))
68 return -EADDRNOTAVAIL;
69 memcpy(dev->dev_addr, addr->sa_data, dev->addr_len);
70 return 0;
71 }
72
73 /* Called with rcu_read_lock and bottom-halves disabled. */
74 static int internal_dev_xmit(struct sk_buff *skb, struct net_device *netdev)
75 {
76 compute_ip_summed(skb, true);
77 vlan_copy_skb_tci(skb);
78 OVS_CB(skb)->flow = NULL;
79
80 vport_receive(internal_dev_priv(netdev)->vport, skb);
81 return 0;
82 }
83
/* Open handler: starts the transmit queue of 'netdev'.  Always returns 0. */
static int internal_dev_open(struct net_device *netdev)
{
	netif_start_queue(netdev);

	return 0;
}
89
/* Stop handler: stops the transmit queue of 'netdev'.  Always returns 0. */
static int internal_dev_stop(struct net_device *netdev)
{
	netif_stop_queue(netdev);

	return 0;
}
95
96 static void internal_dev_getinfo(struct net_device *netdev,
97 struct ethtool_drvinfo *info)
98 {
99 strcpy(info->driver, "openvswitch");
100 }
101
102 static const struct ethtool_ops internal_dev_ethtool_ops = {
103 .get_drvinfo = internal_dev_getinfo,
104 .get_link = ethtool_op_get_link,
105 .get_sg = ethtool_op_get_sg,
106 .set_sg = ethtool_op_set_sg,
107 .get_tx_csum = ethtool_op_get_tx_csum,
108 .set_tx_csum = ethtool_op_set_tx_hw_csum,
109 .get_tso = ethtool_op_get_tso,
110 .set_tso = ethtool_op_set_tso,
111 };
112
113 static int internal_dev_change_mtu(struct net_device *netdev, int new_mtu)
114 {
115 struct vport *vport = internal_dev_get_vport(netdev);
116
117 if (new_mtu < 68)
118 return -EINVAL;
119
120 if (new_mtu > dp_min_mtu(vport->dp))
121 return -EINVAL;
122
123 netdev->mtu = new_mtu;
124 return 0;
125 }
126
127 static int internal_dev_do_ioctl(struct net_device *dev, struct ifreq *ifr, int cmd)
128 {
129 if (dp_ioctl_hook)
130 return dp_ioctl_hook(dev, ifr, cmd);
131
132 return -EOPNOTSUPP;
133 }
134
/* Destructor installed on every internal device by do_setup().  Frees the
 * vport attached to 'dev' and then the net_device itself. */
static void internal_dev_destructor(struct net_device *dev)
{
	/* The vport pointer is read out of the device's private area, so it
	 * has to be fetched before the device is freed. */
	vport_free(internal_dev_get_vport(dev));
	free_netdev(dev);
}
142
#ifdef HAVE_NET_DEVICE_OPS
/* net_device operations of an internal device, used when the kernel provides
 * 'struct net_device_ops'.  do_setup() installs the same handlers one by one
 * when it does not.  is_internal_dev() recognises internal devices by the
 * address of this table. */
static const struct net_device_ops internal_dev_netdev_ops = {
	/* Bring-up and tear-down. */
	.ndo_open		= internal_dev_open,
	.ndo_stop		= internal_dev_stop,

	/* Data path. */
	.ndo_start_xmit		= internal_dev_xmit,

	/* Configuration. */
	.ndo_set_mac_address	= internal_dev_mac_addr,
	.ndo_do_ioctl		= internal_dev_do_ioctl,
	.ndo_change_mtu		= internal_dev_change_mtu,

	/* Statistics. */
	.ndo_get_stats		= internal_dev_sys_stats,
};
#endif
154
155 static void do_setup(struct net_device *netdev)
156 {
157 ether_setup(netdev);
158
159 #ifdef HAVE_NET_DEVICE_OPS
160 netdev->netdev_ops = &internal_dev_netdev_ops;
161 #else
162 netdev->do_ioctl = internal_dev_do_ioctl;
163 netdev->get_stats = internal_dev_sys_stats;
164 netdev->hard_start_xmit = internal_dev_xmit;
165 netdev->open = internal_dev_open;
166 netdev->stop = internal_dev_stop;
167 netdev->set_mac_address = internal_dev_mac_addr;
168 netdev->change_mtu = internal_dev_change_mtu;
169 #endif
170
171 netdev->destructor = internal_dev_destructor;
172 SET_ETHTOOL_OPS(netdev, &internal_dev_ethtool_ops);
173 netdev->tx_queue_len = 0;
174
175 netdev->flags = IFF_BROADCAST | IFF_MULTICAST;
176 netdev->features = NETIF_F_LLTX | NETIF_F_SG | NETIF_F_FRAGLIST |
177 NETIF_F_HIGHDMA | NETIF_F_HW_CSUM | NETIF_F_TSO;
178
179 vport_gen_rand_ether_addr(netdev->dev_addr);
180 }
181
182 static struct vport *internal_dev_create(const struct vport_parms *parms)
183 {
184 struct vport *vport;
185 struct netdev_vport *netdev_vport;
186 struct internal_dev *internal_dev;
187 int err;
188
189 vport = vport_alloc(sizeof(struct netdev_vport), &internal_vport_ops, parms);
190 if (IS_ERR(vport)) {
191 err = PTR_ERR(vport);
192 goto error;
193 }
194
195 netdev_vport = netdev_vport_priv(vport);
196
197 netdev_vport->dev = alloc_netdev(sizeof(struct internal_dev), parms->name, do_setup);
198 if (!netdev_vport->dev) {
199 err = -ENOMEM;
200 goto error_free_vport;
201 }
202
203 internal_dev = internal_dev_priv(netdev_vport->dev);
204 internal_dev->vport = vport;
205
206 err = register_netdevice(netdev_vport->dev);
207 if (err)
208 goto error_free_netdev;
209
210 dev_set_promiscuity(netdev_vport->dev, 1);
211 netif_start_queue(netdev_vport->dev);
212
213 return vport;
214
215 error_free_netdev:
216 free_netdev(netdev_vport->dev);
217 error_free_vport:
218 vport_free(vport);
219 error:
220 return ERR_PTR(err);
221 }
222
223 static int internal_dev_destroy(struct vport *vport)
224 {
225 struct netdev_vport *netdev_vport = netdev_vport_priv(vport);
226
227 netif_stop_queue(netdev_vport->dev);
228 dev_set_promiscuity(netdev_vport->dev, -1);
229
230 /* unregister_netdevice() waits for an RCU grace period. */
231 unregister_netdevice(netdev_vport->dev);
232
233 return 0;
234 }
235
236 static int internal_dev_recv(struct vport *vport, struct sk_buff *skb)
237 {
238 struct net_device *netdev = netdev_vport_priv(vport)->dev;
239 int len;
240
241 #if LINUX_VERSION_CODE < KERNEL_VERSION(2,6,37)
242 if (unlikely(vlan_deaccel_tag(skb)))
243 return 0;
244 #endif
245
246 len = skb->len;
247 skb->dev = netdev;
248 skb->pkt_type = PACKET_HOST;
249 skb->protocol = eth_type_trans(skb, netdev);
250
251 if (in_interrupt())
252 netif_rx(skb);
253 else
254 netif_rx_ni(skb);
255
256 #if LINUX_VERSION_CODE < KERNEL_VERSION(2,6,29)
257 netdev->last_rx = jiffies;
258 #endif
259
260 return len;
261 }
262
263 const struct vport_ops internal_vport_ops = {
264 .type = ODP_VPORT_TYPE_INTERNAL,
265 .flags = VPORT_F_REQUIRED | VPORT_F_GEN_STATS | VPORT_F_FLOW,
266 .create = internal_dev_create,
267 .destroy = internal_dev_destroy,
268 .set_mtu = netdev_set_mtu,
269 .set_addr = netdev_set_addr,
270 .get_name = netdev_get_name,
271 .get_addr = netdev_get_addr,
272 .get_kobj = netdev_get_kobj,
273 .get_dev_flags = netdev_get_dev_flags,
274 .is_running = netdev_is_running,
275 .get_operstate = netdev_get_operstate,
276 .get_ifindex = netdev_get_ifindex,
277 .get_iflink = netdev_get_iflink,
278 .get_mtu = netdev_get_mtu,
279 .send = internal_dev_recv,
280 };
281
282 int is_internal_dev(const struct net_device *netdev)
283 {
284 #ifdef HAVE_NET_DEVICE_OPS
285 return netdev->netdev_ops == &internal_dev_netdev_ops;
286 #else
287 return netdev->open == internal_dev_open;
288 #endif
289 }
290
291 int is_internal_vport(const struct vport *vport)
292 {
293 return vport->ops == &internal_vport_ops;
294 }
295
296 struct vport *internal_dev_get_vport(struct net_device *netdev)
297 {
298 if (!is_internal_dev(netdev))
299 return NULL;
300
301 return internal_dev_priv(netdev)->vport;
302 }