]> git.proxmox.com Git - mirror_ovs.git/blame - datapath/vport-internal_dev.c
datapath: Add missing #include to datapath/flow.h.
[mirror_ovs.git] / datapath / vport-internal_dev.c
CommitLineData
f2459fe7
JG
1/*
2 * Copyright (c) 2009, 2010 Nicira Networks.
3 * Distributed under the terms of the GNU GPL version 2.
4 *
5 * Significant portions of this file may be copied from parts of the Linux
6 * kernel, by Linus Torvalds and others.
7 */
8
9#include <linux/kernel.h>
10#include <linux/netdevice.h>
11#include <linux/etherdevice.h>
12#include <linux/ethtool.h>
13#include <linux/percpu.h>
f2459fe7
JG
14#include <linux/rcupdate.h>
15#include <linux/skbuff.h>
f2459fe7
JG
16
17#include "datapath.h"
8722022c 18#include "openvswitch/internal_dev.h"
b19e8815 19#include "vport-generic.h"
f2459fe7
JG
20#include "vport-internal_dev.h"
21#include "vport-netdev.h"
22
/* Receive/transmit packet and byte counters.  This file keeps one instance
 * per CPU for each internal device ('lstats') plus one plain instance for
 * the offsets supplied by userspace ('extra_stats'). */
struct pcpu_lstats {
	unsigned long rx_packets;	/* Packets counted on the receive side. */
	unsigned long rx_bytes;		/* Bytes counted on the receive side. */
	unsigned long tx_packets;	/* Packets counted on the transmit side. */
	unsigned long tx_bytes;		/* Bytes counted on the transmit side. */
};
29
30struct internal_dev {
31 struct vport *vport;
32
33 struct net_device_stats stats;
34 struct pcpu_lstats *lstats;
8722022c
BP
35
36 /* This is warty support for XAPI, which does not support summing bond
37 * device statistics itself. 'extra_stats' can be set by userspace via
38 * the DP_DEV_SET_STATS ioctl and, if they are, then they are added to
39 * the real device stats. */
40 struct pcpu_lstats extra_stats;
f2459fe7
JG
41};
42
43struct vport_ops internal_vport_ops;
44
/* Returns the struct internal_dev stored in the private area of 'netdev'. */
static inline struct internal_dev *internal_dev_priv(struct net_device *netdev)
{
	struct internal_dev *priv = netdev_priv(netdev);

	return priv;
}
49
50static struct net_device_stats *internal_dev_get_stats(struct net_device *netdev)
51{
52 struct internal_dev *internal_dev = internal_dev_priv(netdev);
53 struct net_device_stats *stats;
54 int i;
55
56 stats = &internal_dev->stats;
8722022c
BP
57 stats->rx_bytes = internal_dev->extra_stats.rx_bytes;
58 stats->rx_packets = internal_dev->extra_stats.rx_packets;
59 stats->tx_bytes = internal_dev->extra_stats.tx_bytes;
60 stats->tx_packets = internal_dev->extra_stats.tx_packets;
f2459fe7
JG
61 for_each_possible_cpu(i) {
62 const struct pcpu_lstats *lb_stats;
63
64 lb_stats = per_cpu_ptr(internal_dev->lstats, i);
65 stats->rx_bytes += lb_stats->rx_bytes;
66 stats->rx_packets += lb_stats->rx_packets;
67 stats->tx_bytes += lb_stats->tx_bytes;
68 stats->tx_packets += lb_stats->tx_packets;
69 }
70 return stats;
71}
72
73static int internal_dev_mac_addr(struct net_device *dev, void *p)
74{
75 struct sockaddr *addr = p;
76
77 if (!is_valid_ether_addr(addr->sa_data))
78 return -EADDRNOTAVAIL;
79 memcpy(dev->dev_addr, addr->sa_data, dev->addr_len);
80 return 0;
81}
82
1c075d0a 83/* Called with rcu_read_lock and bottom-halves disabled. */
f2459fe7
JG
84static int internal_dev_xmit(struct sk_buff *skb, struct net_device *netdev)
85{
86 struct internal_dev *internal_dev = internal_dev_priv(netdev);
87 struct vport *vport = internal_dev_get_vport(netdev);
88 struct pcpu_lstats *lb_stats;
89
90 /* We need our own clone. */
91 skb = skb_share_check(skb, GFP_ATOMIC);
92 if (!skb)
93 return 0;
94
95 lb_stats = per_cpu_ptr(internal_dev->lstats, smp_processor_id());
96 lb_stats->tx_packets++;
97 lb_stats->tx_bytes += skb->len;
98
99 skb_reset_mac_header(skb);
f4267e34
JG
100 compute_ip_summed(skb, true);
101
f2459fe7 102 vport_receive(vport, skb);
f2459fe7
JG
103
104 return 0;
105}
106
/* Open hook: starts the transmit queue of 'netdev'.  Always returns 0. */
static int internal_dev_open(struct net_device *netdev)
{
	netif_start_queue(netdev);

	return 0;
}
112
/* Stop hook: stops the transmit queue of 'netdev'.  Always returns 0. */
static int internal_dev_stop(struct net_device *netdev)
{
	netif_stop_queue(netdev);

	return 0;
}
118
119static void internal_dev_getinfo(struct net_device *netdev,
120 struct ethtool_drvinfo *info)
121{
122 struct dp_port *dp_port = vport_get_dp_port(internal_dev_get_vport(netdev));
123
124 strcpy(info->driver, "openvswitch");
125 if (dp_port)
126 sprintf(info->bus_info, "%d.%d", dp_port->dp->dp_idx, dp_port->port_no);
127}
128
129static struct ethtool_ops internal_dev_ethtool_ops = {
f4267e34
JG
130 .get_drvinfo = internal_dev_getinfo,
131 .get_link = ethtool_op_get_link,
132 .get_sg = ethtool_op_get_sg,
133 .set_sg = ethtool_op_set_sg,
134 .get_tx_csum = ethtool_op_get_tx_csum,
135 .set_tx_csum = ethtool_op_set_tx_hw_csum,
136 .get_tso = ethtool_op_get_tso,
137 .set_tso = ethtool_op_set_tso,
f2459fe7
JG
138};
139
140static int internal_dev_change_mtu(struct net_device *netdev, int new_mtu)
141{
142 struct dp_port *dp_port = vport_get_dp_port(internal_dev_get_vport(netdev));
143
144 if (new_mtu < 68)
145 return -EINVAL;
146
147 if (dp_port) {
d8b5d43a 148 if (new_mtu > dp_min_mtu(dp_port->dp))
f2459fe7
JG
149 return -EINVAL;
150 }
151
152 netdev->mtu = new_mtu;
153 return 0;
154}
155
156static int internal_dev_init(struct net_device *netdev)
157{
158 struct internal_dev *internal_dev = internal_dev_priv(netdev);
159
160 internal_dev->lstats = alloc_percpu(struct pcpu_lstats);
161 if (!internal_dev->lstats)
162 return -ENOMEM;
163
164 return 0;
165}
166
167static void internal_dev_free(struct net_device *netdev)
168{
169 struct internal_dev *internal_dev = internal_dev_priv(netdev);
170
171 free_percpu(internal_dev->lstats);
172 free_netdev(netdev);
173}
174
175static int internal_dev_do_ioctl(struct net_device *dev, struct ifreq *ifr, int cmd)
176{
8722022c
BP
177 struct internal_dev *internal_dev = internal_dev_priv(dev);
178
179 if (cmd == INTERNAL_DEV_SET_STATS) {
180 struct internal_dev_stats stats;
181
182 if (copy_from_user(&stats, ifr->ifr_data, sizeof(stats)))
183 return -EFAULT;
184
185 internal_dev->extra_stats.rx_bytes = stats.rx_bytes;
186 internal_dev->extra_stats.rx_packets = stats.rx_packets;
187 internal_dev->extra_stats.tx_bytes = stats.tx_bytes;
188 internal_dev->extra_stats.tx_packets = stats.tx_packets;
189
190 return 0;
191 }
192
f2459fe7
JG
193 if (dp_ioctl_hook)
194 return dp_ioctl_hook(dev, ifr, cmd);
195 return -EOPNOTSUPP;
196}
197
#ifdef HAVE_NET_DEVICE_OPS
/* Device operations table, used when the kernel provides struct
 * net_device_ops.  do_setup() assigns the same handlers field by field
 * when it does not. */
static const struct net_device_ops internal_dev_netdev_ops = {
	/* Lifecycle. */
	.ndo_init		= internal_dev_init,
	.ndo_open		= internal_dev_open,
	.ndo_stop		= internal_dev_stop,

	/* Data path. */
	.ndo_start_xmit		= internal_dev_xmit,

	/* Configuration and statistics. */
	.ndo_set_mac_address	= internal_dev_mac_addr,
	.ndo_change_mtu		= internal_dev_change_mtu,
	.ndo_do_ioctl		= internal_dev_do_ioctl,
	.ndo_get_stats		= internal_dev_get_stats,
};
#endif
210
211static void
212do_setup(struct net_device *netdev)
213{
214 ether_setup(netdev);
215
216#ifdef HAVE_NET_DEVICE_OPS
217 netdev->netdev_ops = &internal_dev_netdev_ops;
218#else
219 netdev->do_ioctl = internal_dev_do_ioctl;
220 netdev->get_stats = internal_dev_get_stats;
221 netdev->hard_start_xmit = internal_dev_xmit;
222 netdev->open = internal_dev_open;
223 netdev->stop = internal_dev_stop;
224 netdev->set_mac_address = internal_dev_mac_addr;
225 netdev->change_mtu = internal_dev_change_mtu;
226 netdev->init = internal_dev_init;
227#endif
228
229 netdev->destructor = internal_dev_free;
230 SET_ETHTOOL_OPS(netdev, &internal_dev_ethtool_ops);
231 netdev->tx_queue_len = 0;
232
233 netdev->flags = IFF_BROADCAST | IFF_MULTICAST;
f4267e34
JG
234 netdev->features = NETIF_F_LLTX | NETIF_F_SG | NETIF_F_HIGHDMA
235 | NETIF_F_HW_CSUM | NETIF_F_TSO;
f2459fe7 236
b19e8815 237 vport_gen_rand_ether_addr(netdev->dev_addr);
f2459fe7
JG
238}
239
240static struct vport *
241internal_dev_create(const char *name, const void __user *config)
242{
243 struct vport *vport;
244 struct netdev_vport *netdev_vport;
245 struct internal_dev *internal_dev;
246 int err;
247
248 vport = vport_alloc(sizeof(struct netdev_vport), &internal_vport_ops);
249 if (IS_ERR(vport)) {
250 err = PTR_ERR(vport);
251 goto error;
252 }
253
254 netdev_vport = netdev_vport_priv(vport);
255
256 netdev_vport->dev = alloc_netdev(sizeof(struct internal_dev), name, do_setup);
257 if (!netdev_vport->dev) {
258 err = -ENOMEM;
259 goto error_free_vport;
260 }
261
262 internal_dev = internal_dev_priv(netdev_vport->dev);
263 internal_dev->vport = vport;
264
265 err = register_netdevice(netdev_vport->dev);
266 if (err)
267 goto error_free_netdev;
268
269 return vport;
270
271error_free_netdev:
272 free_netdev(netdev_vport->dev);
273error_free_vport:
274 vport_free(vport);
275error:
276 return ERR_PTR(err);
277}
278
279static int
280internal_dev_destroy(struct vport *vport)
281{
282 struct netdev_vport *netdev_vport = netdev_vport_priv(vport);
283
284 unregister_netdevice(netdev_vport->dev);
285 vport_free(vport);
286
287 return 0;
288}
289
290static int
291internal_dev_attach(struct vport *vport)
292{
293 struct netdev_vport *netdev_vport = netdev_vport_priv(vport);
294
295 dev_set_promiscuity(netdev_vport->dev, 1);
296
297 /* It would make sense to assign dev->br_port here too, but
298 * that causes packets received on internal ports to get caught
299 * in netdev_frame_hook(). In turn netdev_frame_hook() can reject them
300 * back to the network stack, but that's a waste of time. */
301
302 return 0;
303}
304
305static int
306internal_dev_detach(struct vport *vport)
307{
308 struct netdev_vport *netdev_vport = netdev_vport_priv(vport);
309
310 dev_set_promiscuity(netdev_vport->dev, -1);
311
312 /* Make sure that no packets arrive from now on, since
313 * internal_dev_xmit() will try to find itself through
314 * p->dp->ports[], and we're about to set that to null. */
315 netif_tx_disable(netdev_vport->dev);
316
317 return 0;
318}
319
320static int
321internal_dev_recv(struct vport *vport, struct sk_buff *skb)
322{
323 struct net_device *netdev = netdev_vport_priv(vport)->dev;
324 struct internal_dev *internal_dev = internal_dev_priv(netdev);
325 struct pcpu_lstats *lb_stats;
326 int len;
327
328 skb->dev = netdev;
329 len = skb->len;
330 skb->pkt_type = PACKET_HOST;
331 skb->protocol = eth_type_trans(skb, netdev);
332
333 if (in_interrupt())
334 netif_rx(skb);
335 else
336 netif_rx_ni(skb);
337 netdev->last_rx = jiffies;
338
1c075d0a 339 local_bh_disable();
f2459fe7
JG
340 lb_stats = per_cpu_ptr(internal_dev->lstats, smp_processor_id());
341 lb_stats->rx_packets++;
342 lb_stats->rx_bytes += len;
1c075d0a 343 local_bh_enable();
f2459fe7
JG
344
345 return len;
346}
347
348struct vport_ops internal_vport_ops = {
349 .type = "internal",
350 .flags = VPORT_F_REQUIRED,
351 .create = internal_dev_create,
352 .destroy = internal_dev_destroy,
353 .attach = internal_dev_attach,
354 .detach = internal_dev_detach,
355 .set_mtu = netdev_set_mtu,
356 .set_addr = netdev_set_addr,
357 .get_name = netdev_get_name,
358 .get_addr = netdev_get_addr,
359 .get_kobj = netdev_get_kobj,
360 .get_stats = netdev_get_stats,
361 .get_dev_flags = netdev_get_dev_flags,
362 .is_running = netdev_is_running,
363 .get_operstate = netdev_get_operstate,
364 .get_ifindex = netdev_get_ifindex,
365 .get_iflink = netdev_get_iflink,
366 .get_mtu = netdev_get_mtu,
367 .send = internal_dev_recv,
368};
369
370int is_internal_dev(const struct net_device *netdev)
371{
372#ifdef HAVE_NET_DEVICE_OPS
373 return netdev->netdev_ops == &internal_dev_netdev_ops;
374#else
375 return netdev->open == internal_dev_open;
376#endif
377}
378
379int
380is_internal_vport(const struct vport *vport)
381{
382 return vport->ops == &internal_vport_ops;
383}
384
385struct vport *
386internal_dev_get_vport(struct net_device *netdev)
387{
388 struct internal_dev *internal_dev = internal_dev_priv(netdev);
389 return rcu_dereference(internal_dev->vport);
390}