]>
Commit | Line | Data |
---|---|---|
1da177e4 | 1 | /* |
e905a9ed | 2 | * Linux NET3: IP/IP protocol decoder. |
1da177e4 | 3 | * |
1da177e4 LT |
4 | * Authors: |
5 | * Sam Lantinga (slouken@cs.ucdavis.edu) 02/01/95 | |
6 | * | |
7 | * Fixes: | |
8 | * Alan Cox : Merged and made usable non modular (its so tiny its silly as | |
9 | * a module taking up 2 pages). | |
10 | * Alan Cox : Fixed bug with 1.3.18 and IPIP not working (now needs to set skb->h.iph) | |
11 | * to keep ip_forward happy. | |
12 | * Alan Cox : More fixes for 1.3.21, and firewall fix. Maybe this will work soon 8). | |
13 | * Kai Schulte : Fixed #defines for IP_FIREWALL->FIREWALL | |
14 | * David Woodhouse : Perform some basic ICMP handling. | |
15 | * IPIP Routing without decapsulation. | |
16 | * Carlos Picoto : GRE over IP support | |
17 | * Alexey Kuznetsov: Reworked. Really, now it is truncated version of ipv4/ip_gre.c. | |
18 | * I do not want to merge them together. | |
19 | * | |
20 | * This program is free software; you can redistribute it and/or | |
21 | * modify it under the terms of the GNU General Public License | |
22 | * as published by the Free Software Foundation; either version | |
23 | * 2 of the License, or (at your option) any later version. | |
24 | * | |
25 | */ | |
26 | ||
27 | /* tunnel.c: an IP tunnel driver | |
28 | ||
29 | The purpose of this driver is to provide an IP tunnel through | |
30 | which you can tunnel network traffic transparently across subnets. | |
31 | ||
32 | This was written by looking at Nick Holloway's dummy driver | |
33 | Thanks for the great code! | |
34 | ||
35 | -Sam Lantinga (slouken@cs.ucdavis.edu) 02/01/95 | |
e905a9ed | 36 | |
1da177e4 LT |
37 | Minor tweaks: |
38 | Cleaned up the code a little and added some pre-1.3.0 tweaks. | |
39 | dev->hard_header/hard_header_len changed to use no headers. | |
40 | Comments/bracketing tweaked. | |
41 | Made the tunnels use dev->name not tunnel: when error reporting. | |
42 | Added tx_dropped stat | |
e905a9ed | 43 | |
113aa838 | 44 | -Alan Cox (alan@lxorguk.ukuu.org.uk) 21 March 95 |
1da177e4 LT |
45 | |
46 | Reworked: | |
47 | Changed to tunnel to destination gateway in addition to the | |
48 | tunnel's pointopoint address | |
49 | Almost completely rewritten | |
50 | Note: There is currently no firewall or ICMP handling done. | |
51 | ||
52 | -Sam Lantinga (slouken@cs.ucdavis.edu) 02/13/96 | |
e905a9ed | 53 | |
1da177e4 LT |
54 | */ |
55 | ||
56 | /* Things I wish I had known when writing the tunnel driver: | |
57 | ||
58 | When the tunnel_xmit() function is called, the skb contains the | |
59 | packet to be sent (plus a great deal of extra info), and dev | |
60 | contains the tunnel device that _we_ are. | |
61 | ||
62 | When we are passed a packet, we are expected to fill in the | |
63 | source address with our source IP address. | |
64 | ||
65 | What is the proper way to allocate, copy and free a buffer? | |
66 | After you allocate it, it is a "0 length" chunk of memory | |
67 | starting at zero. If you want to add headers to the buffer | |
68 | later, you'll have to call "skb_reserve(skb, amount)" with | |
69 | the amount of memory you want reserved. Then, you call | |
70 | "skb_put(skb, amount)" with the amount of space you want in | |
71 | the buffer. skb_put() returns a pointer to the top (#0) of | |
72 | that buffer. skb->len is set to the amount of space you have | |
73 | "allocated" with skb_put(). You can then write up to skb->len | |
74 | bytes to that buffer. If you need more, you can call skb_put() | |
75 | again with the additional amount of space you need. You can | |
e905a9ed | 76 | find out how much more space you can allocate by calling |
1da177e4 LT |
77 | "skb_tailroom(skb)". |
78 | Now, to add header space, call "skb_push(skb, header_len)". | |
79 | This creates space at the beginning of the buffer and returns | |
80 | a pointer to this new space. If later you need to strip a | |
81 | header from a buffer, call "skb_pull(skb, header_len)". | |
82 | skb_headroom() will return how much space is left at the top | |
83 | of the buffer (before the main data). Remember, this headroom | |
84 | space must be reserved before the skb_put() function is called. | |
85 | */ | |
86 | ||
87 | /* | |
88 | This version of net/ipv4/ipip.c is cloned of net/ipv4/ip_gre.c | |
89 | ||
90 | For comments look at net/ipv4/ip_gre.c --ANK | |
91 | */ | |
92 | ||
e905a9ed | 93 | |
4fc268d2 | 94 | #include <linux/capability.h> |
1da177e4 LT |
95 | #include <linux/module.h> |
96 | #include <linux/types.h> | |
1da177e4 | 97 | #include <linux/kernel.h> |
5a0e3ad6 | 98 | #include <linux/slab.h> |
7c0f6ba6 | 99 | #include <linux/uaccess.h> |
1da177e4 LT |
100 | #include <linux/skbuff.h> |
101 | #include <linux/netdevice.h> | |
102 | #include <linux/in.h> | |
103 | #include <linux/tcp.h> | |
104 | #include <linux/udp.h> | |
105 | #include <linux/if_arp.h> | |
1da177e4 LT |
106 | #include <linux/init.h> |
107 | #include <linux/netfilter_ipv4.h> | |
46f25dff | 108 | #include <linux/if_ether.h> |
1da177e4 LT |
109 | |
110 | #include <net/sock.h> | |
111 | #include <net/ip.h> | |
112 | #include <net/icmp.h> | |
c5441932 | 113 | #include <net/ip_tunnels.h> |
1da177e4 LT |
114 | #include <net/inet_ecn.h> |
115 | #include <net/xfrm.h> | |
10dc4c7b PE |
116 | #include <net/net_namespace.h> |
117 | #include <net/netns/generic.h> | |
cfc7381b | 118 | #include <net/dst_metadata.h> |
1da177e4 | 119 | |
eccc1bb8 | 120 | static bool log_ecn_error = true; |
121 | module_param(log_ecn_error, bool, 0644); | |
122 | MODULE_PARM_DESC(log_ecn_error, "Log packets received with corrupted ECN"); | |
123 | ||
c7d03a00 | 124 | static unsigned int ipip_net_id __read_mostly; |
10dc4c7b | 125 | |
3c97af99 | 126 | static int ipip_tunnel_init(struct net_device *dev); |
0974658d | 127 | static struct rtnl_link_ops ipip_link_ops __read_mostly; |
1da177e4 | 128 | |
d2acc347 | 129 | static int ipip_err(struct sk_buff *skb, u32 info) |
1da177e4 | 130 | { |
f3594f0a XL |
131 | /* All the routers (except for Linux) return only |
132 | * 8 bytes of packet payload. It means, that precise relaying of | |
133 | * ICMP in the real Internet is absolutely infeasible. | |
134 | */ | |
fd58156e PS |
135 | struct net *net = dev_net(skb->dev); |
136 | struct ip_tunnel_net *itn = net_generic(net, ipip_net_id); | |
b71d1d42 | 137 | const struct iphdr *iph = (const struct iphdr *)skb->data; |
fd58156e PS |
138 | const int type = icmp_hdr(skb)->type; |
139 | const int code = icmp_hdr(skb)->code; | |
f3594f0a XL |
140 | struct ip_tunnel *t; |
141 | int err = 0; | |
142 | ||
143 | switch (type) { | |
144 | case ICMP_DEST_UNREACH: | |
145 | switch (code) { | |
146 | case ICMP_SR_FAILED: | |
147 | /* Impossible event. */ | |
148 | goto out; | |
149 | default: | |
150 | /* All others are translated to HOST_UNREACH. | |
151 | * rfc2003 contains "deep thoughts" about NET_UNREACH, | |
152 | * I believe they are just ether pollution. --ANK | |
153 | */ | |
154 | break; | |
155 | } | |
156 | break; | |
157 | ||
158 | case ICMP_TIME_EXCEEDED: | |
159 | if (code != ICMP_EXC_TTL) | |
160 | goto out; | |
161 | break; | |
162 | ||
163 | case ICMP_REDIRECT: | |
164 | break; | |
165 | ||
166 | default: | |
167 | goto out; | |
168 | } | |
1da177e4 | 169 | |
fd58156e PS |
170 | t = ip_tunnel_lookup(itn, skb->dev->ifindex, TUNNEL_NO_KEY, |
171 | iph->daddr, iph->saddr, 0); | |
f3594f0a XL |
172 | if (!t) { |
173 | err = -ENOENT; | |
36393395 | 174 | goto out; |
f3594f0a | 175 | } |
36393395 DM |
176 | |
177 | if (type == ICMP_DEST_UNREACH && code == ICMP_FRAG_NEEDED) { | |
f3594f0a XL |
178 | ipv4_update_pmtu(skb, net, info, t->parms.link, 0, |
179 | iph->protocol, 0); | |
36393395 DM |
180 | goto out; |
181 | } | |
182 | ||
55be7a9c | 183 | if (type == ICMP_REDIRECT) { |
f3594f0a | 184 | ipv4_redirect(skb, net, t->parms.link, 0, iph->protocol, 0); |
55be7a9c DM |
185 | goto out; |
186 | } | |
187 | ||
f3594f0a XL |
188 | if (t->parms.iph.daddr == 0) { |
189 | err = -ENOENT; | |
1da177e4 | 190 | goto out; |
f3594f0a | 191 | } |
d2acc347 | 192 | |
1da177e4 LT |
193 | if (t->parms.iph.ttl == 0 && type == ICMP_TIME_EXCEEDED) |
194 | goto out; | |
195 | ||
26d94b46 | 196 | if (time_before(jiffies, t->err_time + IPTUNNEL_ERR_TIMEO)) |
1da177e4 LT |
197 | t->err_count++; |
198 | else | |
199 | t->err_count = 1; | |
200 | t->err_time = jiffies; | |
b0558ef2 | 201 | |
fd58156e | 202 | out: |
d2acc347 | 203 | return err; |
1da177e4 LT |
204 | } |
205 | ||
1b69e7e6 | 206 | static const struct tnl_ptk_info ipip_tpi = { |
fd58156e PS |
207 | /* no tunnel info required for ipip. */ |
208 | .proto = htons(ETH_P_IP), | |
209 | }; | |
210 | ||
1b69e7e6 SH |
211 | #if IS_ENABLED(CONFIG_MPLS) |
212 | static const struct tnl_ptk_info mplsip_tpi = { | |
213 | /* no tunnel info required for mplsip. */ | |
214 | .proto = htons(ETH_P_MPLS_UC), | |
215 | }; | |
216 | #endif | |
217 | ||
218 | static int ipip_tunnel_rcv(struct sk_buff *skb, u8 ipproto) | |
1da177e4 | 219 | { |
fd58156e PS |
220 | struct net *net = dev_net(skb->dev); |
221 | struct ip_tunnel_net *itn = net_generic(net, ipip_net_id); | |
cfc7381b | 222 | struct metadata_dst *tun_dst = NULL; |
1da177e4 | 223 | struct ip_tunnel *tunnel; |
3d7b46cd | 224 | const struct iphdr *iph; |
3c97af99 | 225 | |
3d7b46cd | 226 | iph = ip_hdr(skb); |
fd58156e PS |
227 | tunnel = ip_tunnel_lookup(itn, skb->dev->ifindex, TUNNEL_NO_KEY, |
228 | iph->saddr, iph->daddr, 0); | |
229 | if (tunnel) { | |
1b69e7e6 SH |
230 | const struct tnl_ptk_info *tpi; |
231 | ||
232 | if (tunnel->parms.iph.protocol != ipproto && | |
233 | tunnel->parms.iph.protocol != 0) | |
234 | goto drop; | |
235 | ||
eccc1bb8 | 236 | if (!xfrm4_policy_check(NULL, XFRM_POLICY_IN, skb)) |
237 | goto drop; | |
1b69e7e6 SH |
238 | #if IS_ENABLED(CONFIG_MPLS) |
239 | if (ipproto == IPPROTO_MPLS) | |
240 | tpi = &mplsip_tpi; | |
241 | else | |
242 | #endif | |
243 | tpi = &ipip_tpi; | |
244 | if (iptunnel_pull_header(skb, 0, tpi->proto, false)) | |
737e828b | 245 | goto drop; |
cfc7381b AS |
246 | if (tunnel->collect_md) { |
247 | tun_dst = ip_tun_rx_dst(skb, 0, 0, 0); | |
248 | if (!tun_dst) | |
249 | return 0; | |
250 | } | |
251 | return ip_tunnel_rcv(tunnel, skb, tpi, tun_dst, log_ecn_error); | |
1da177e4 | 252 | } |
1da177e4 | 253 | |
1da177e4 | 254 | return -1; |
eccc1bb8 | 255 | |
256 | drop: | |
257 | kfree_skb(skb); | |
258 | return 0; | |
1da177e4 LT |
259 | } |
260 | ||
1b69e7e6 SH |
261 | static int ipip_rcv(struct sk_buff *skb) |
262 | { | |
263 | return ipip_tunnel_rcv(skb, IPPROTO_IPIP); | |
264 | } | |
265 | ||
266 | #if IS_ENABLED(CONFIG_MPLS) | |
267 | static int mplsip_rcv(struct sk_buff *skb) | |
268 | { | |
269 | return ipip_tunnel_rcv(skb, IPPROTO_MPLS); | |
270 | } | |
271 | #endif | |
272 | ||
1da177e4 LT |
273 | /* |
274 | * This function assumes it is being called from dev_queue_xmit() | |
275 | * and that skb is filled properly by that function. | |
276 | */ | |
1b69e7e6 SH |
277 | static netdev_tx_t ipip_tunnel_xmit(struct sk_buff *skb, |
278 | struct net_device *dev) | |
1da177e4 | 279 | { |
2941a486 | 280 | struct ip_tunnel *tunnel = netdev_priv(dev); |
b71d1d42 | 281 | const struct iphdr *tiph = &tunnel->parms.iph; |
1b69e7e6 SH |
282 | u8 ipproto; |
283 | ||
284 | switch (skb->protocol) { | |
285 | case htons(ETH_P_IP): | |
286 | ipproto = IPPROTO_IPIP; | |
287 | break; | |
288 | #if IS_ENABLED(CONFIG_MPLS) | |
289 | case htons(ETH_P_MPLS_UC): | |
290 | ipproto = IPPROTO_MPLS; | |
291 | break; | |
292 | #endif | |
293 | default: | |
294 | goto tx_error; | |
295 | } | |
1da177e4 | 296 | |
1b69e7e6 | 297 | if (tiph->protocol != ipproto && tiph->protocol != 0) |
1da177e4 | 298 | goto tx_error; |
1da177e4 | 299 | |
7e13318d | 300 | if (iptunnel_handle_offloads(skb, SKB_GSO_IPXIP4)) |
aed069df | 301 | goto tx_error; |
8344bfc6 | 302 | |
1b69e7e6 | 303 | skb_set_inner_ipproto(skb, ipproto); |
077c5a09 | 304 | |
cfc7381b AS |
305 | if (tunnel->collect_md) |
306 | ip_md_tunnel_xmit(skb, dev, ipproto); | |
307 | else | |
308 | ip_tunnel_xmit(skb, dev, tiph, ipproto); | |
6ed10654 | 309 | return NETDEV_TX_OK; |
1da177e4 | 310 | |
1da177e4 | 311 | tx_error: |
3acfa1e7 | 312 | kfree_skb(skb); |
aed069df | 313 | |
cb32f511 | 314 | dev->stats.tx_errors++; |
6ed10654 | 315 | return NETDEV_TX_OK; |
1da177e4 LT |
316 | } |
317 | ||
1b69e7e6 SH |
318 | static bool ipip_tunnel_ioctl_verify_protocol(u8 ipproto) |
319 | { | |
320 | switch (ipproto) { | |
321 | case 0: | |
322 | case IPPROTO_IPIP: | |
323 | #if IS_ENABLED(CONFIG_MPLS) | |
324 | case IPPROTO_MPLS: | |
325 | #endif | |
326 | return true; | |
327 | } | |
328 | ||
329 | return false; | |
330 | } | |
331 | ||
1da177e4 | 332 | static int |
fd58156e | 333 | ipip_tunnel_ioctl(struct net_device *dev, struct ifreq *ifr, int cmd) |
1da177e4 LT |
334 | { |
335 | int err = 0; | |
336 | struct ip_tunnel_parm p; | |
1da177e4 | 337 | |
fd58156e PS |
338 | if (copy_from_user(&p, ifr->ifr_ifru.ifru_data, sizeof(p))) |
339 | return -EFAULT; | |
1da177e4 | 340 | |
3b7b514f | 341 | if (cmd == SIOCADDTUNNEL || cmd == SIOCCHGTUNNEL) { |
1b69e7e6 SH |
342 | if (p.iph.version != 4 || |
343 | !ipip_tunnel_ioctl_verify_protocol(p.iph.protocol) || | |
3b7b514f CW |
344 | p.iph.ihl != 5 || (p.iph.frag_off&htons(~IP_DF))) |
345 | return -EINVAL; | |
346 | } | |
347 | ||
252a8fbe ED |
348 | p.i_key = p.o_key = 0; |
349 | p.i_flags = p.o_flags = 0; | |
fd58156e PS |
350 | err = ip_tunnel_ioctl(dev, &p, cmd); |
351 | if (err) | |
352 | return err; | |
353 | ||
354 | if (copy_to_user(ifr->ifr_ifru.ifru_data, &p, sizeof(p))) | |
355 | return -EFAULT; | |
356 | ||
1da177e4 LT |
357 | return 0; |
358 | } | |
359 | ||
23a12b14 | 360 | static const struct net_device_ops ipip_netdev_ops = { |
fd58156e PS |
361 | .ndo_init = ipip_tunnel_init, |
362 | .ndo_uninit = ip_tunnel_uninit, | |
23a12b14 SH |
363 | .ndo_start_xmit = ipip_tunnel_xmit, |
364 | .ndo_do_ioctl = ipip_tunnel_ioctl, | |
fd58156e PS |
365 | .ndo_change_mtu = ip_tunnel_change_mtu, |
366 | .ndo_get_stats64 = ip_tunnel_get_stats64, | |
1e99584b | 367 | .ndo_get_iflink = ip_tunnel_get_iflink, |
23a12b14 SH |
368 | }; |
369 | ||
c3b89fbb ED |
/* Feature bits set in both dev->features and dev->hw_features at setup. */
#define IPIP_FEATURES (NETIF_F_SG |		\
		       NETIF_F_FRAGLIST |	\
		       NETIF_F_HIGHDMA |	\
		       NETIF_F_GSO_SOFTWARE |	\
		       NETIF_F_HW_CSUM)
375 | ||
1da177e4 LT |
376 | static void ipip_tunnel_setup(struct net_device *dev) |
377 | { | |
23a12b14 | 378 | dev->netdev_ops = &ipip_netdev_ops; |
1da177e4 LT |
379 | |
380 | dev->type = ARPHRD_TUNNEL; | |
1da177e4 | 381 | dev->flags = IFF_NOARP; |
1da177e4 | 382 | dev->addr_len = 4; |
153f0943 | 383 | dev->features |= NETIF_F_LLTX; |
02875878 | 384 | netif_keep_dst(dev); |
c3b89fbb ED |
385 | |
386 | dev->features |= IPIP_FEATURES; | |
387 | dev->hw_features |= IPIP_FEATURES; | |
fd58156e | 388 | ip_tunnel_setup(dev, ipip_net_id); |
1da177e4 LT |
389 | } |
390 | ||
3c97af99 | 391 | static int ipip_tunnel_init(struct net_device *dev) |
1da177e4 | 392 | { |
23a12b14 | 393 | struct ip_tunnel *tunnel = netdev_priv(dev); |
1da177e4 | 394 | |
1da177e4 LT |
395 | memcpy(dev->dev_addr, &tunnel->parms.iph.saddr, 4); |
396 | memcpy(dev->broadcast, &tunnel->parms.iph.daddr, 4); | |
397 | ||
473ab820 TH |
398 | tunnel->tun_hlen = 0; |
399 | tunnel->hlen = tunnel->tun_hlen + tunnel->encap_hlen; | |
fd58156e | 400 | return ip_tunnel_init(dev); |
1da177e4 LT |
401 | } |
402 | ||
a8b8a889 MS |
403 | static int ipip_tunnel_validate(struct nlattr *tb[], struct nlattr *data[], |
404 | struct netlink_ext_ack *extack) | |
1b69e7e6 SH |
405 | { |
406 | u8 proto; | |
407 | ||
408 | if (!data || !data[IFLA_IPTUN_PROTO]) | |
409 | return 0; | |
410 | ||
411 | proto = nla_get_u8(data[IFLA_IPTUN_PROTO]); | |
412 | if (proto != IPPROTO_IPIP && proto != IPPROTO_MPLS && proto != 0) | |
413 | return -EINVAL; | |
414 | ||
415 | return 0; | |
416 | } | |
417 | ||
be42da0e | 418 | static void ipip_netlink_parms(struct nlattr *data[], |
9830ad4c CG |
419 | struct ip_tunnel_parm *parms, bool *collect_md, |
420 | __u32 *fwmark) | |
be42da0e ND |
421 | { |
422 | memset(parms, 0, sizeof(*parms)); | |
423 | ||
424 | parms->iph.version = 4; | |
425 | parms->iph.protocol = IPPROTO_IPIP; | |
426 | parms->iph.ihl = 5; | |
cfc7381b | 427 | *collect_md = false; |
be42da0e ND |
428 | |
429 | if (!data) | |
430 | return; | |
431 | ||
432 | if (data[IFLA_IPTUN_LINK]) | |
433 | parms->link = nla_get_u32(data[IFLA_IPTUN_LINK]); | |
434 | ||
435 | if (data[IFLA_IPTUN_LOCAL]) | |
67b61f6c | 436 | parms->iph.saddr = nla_get_in_addr(data[IFLA_IPTUN_LOCAL]); |
be42da0e ND |
437 | |
438 | if (data[IFLA_IPTUN_REMOTE]) | |
67b61f6c | 439 | parms->iph.daddr = nla_get_in_addr(data[IFLA_IPTUN_REMOTE]); |
be42da0e ND |
440 | |
441 | if (data[IFLA_IPTUN_TTL]) { | |
442 | parms->iph.ttl = nla_get_u8(data[IFLA_IPTUN_TTL]); | |
443 | if (parms->iph.ttl) | |
444 | parms->iph.frag_off = htons(IP_DF); | |
445 | } | |
446 | ||
447 | if (data[IFLA_IPTUN_TOS]) | |
448 | parms->iph.tos = nla_get_u8(data[IFLA_IPTUN_TOS]); | |
449 | ||
1b69e7e6 SH |
450 | if (data[IFLA_IPTUN_PROTO]) |
451 | parms->iph.protocol = nla_get_u8(data[IFLA_IPTUN_PROTO]); | |
452 | ||
be42da0e ND |
453 | if (!data[IFLA_IPTUN_PMTUDISC] || nla_get_u8(data[IFLA_IPTUN_PMTUDISC])) |
454 | parms->iph.frag_off = htons(IP_DF); | |
cfc7381b AS |
455 | |
456 | if (data[IFLA_IPTUN_COLLECT_METADATA]) | |
457 | *collect_md = true; | |
9830ad4c CG |
458 | |
459 | if (data[IFLA_IPTUN_FWMARK]) | |
460 | *fwmark = nla_get_u32(data[IFLA_IPTUN_FWMARK]); | |
be42da0e ND |
461 | } |
462 | ||
473ab820 TH |
463 | /* This function returns true when ENCAP attributes are present in the nl msg */ |
464 | static bool ipip_netlink_encap_parms(struct nlattr *data[], | |
465 | struct ip_tunnel_encap *ipencap) | |
466 | { | |
467 | bool ret = false; | |
468 | ||
469 | memset(ipencap, 0, sizeof(*ipencap)); | |
470 | ||
471 | if (!data) | |
472 | return ret; | |
473 | ||
474 | if (data[IFLA_IPTUN_ENCAP_TYPE]) { | |
475 | ret = true; | |
476 | ipencap->type = nla_get_u16(data[IFLA_IPTUN_ENCAP_TYPE]); | |
477 | } | |
478 | ||
479 | if (data[IFLA_IPTUN_ENCAP_FLAGS]) { | |
480 | ret = true; | |
481 | ipencap->flags = nla_get_u16(data[IFLA_IPTUN_ENCAP_FLAGS]); | |
482 | } | |
483 | ||
484 | if (data[IFLA_IPTUN_ENCAP_SPORT]) { | |
485 | ret = true; | |
3e97fa70 | 486 | ipencap->sport = nla_get_be16(data[IFLA_IPTUN_ENCAP_SPORT]); |
473ab820 TH |
487 | } |
488 | ||
489 | if (data[IFLA_IPTUN_ENCAP_DPORT]) { | |
490 | ret = true; | |
3e97fa70 | 491 | ipencap->dport = nla_get_be16(data[IFLA_IPTUN_ENCAP_DPORT]); |
473ab820 TH |
492 | } |
493 | ||
494 | return ret; | |
495 | } | |
496 | ||
be42da0e | 497 | static int ipip_newlink(struct net *src_net, struct net_device *dev, |
7a3f4a18 MS |
498 | struct nlattr *tb[], struct nlattr *data[], |
499 | struct netlink_ext_ack *extack) | |
be42da0e | 500 | { |
cfc7381b | 501 | struct ip_tunnel *t = netdev_priv(dev); |
fd58156e | 502 | struct ip_tunnel_parm p; |
473ab820 | 503 | struct ip_tunnel_encap ipencap; |
9830ad4c | 504 | __u32 fwmark = 0; |
473ab820 TH |
505 | |
506 | if (ipip_netlink_encap_parms(data, &ipencap)) { | |
473ab820 TH |
507 | int err = ip_tunnel_encap_setup(t, &ipencap); |
508 | ||
509 | if (err < 0) | |
510 | return err; | |
511 | } | |
be42da0e | 512 | |
9830ad4c CG |
513 | ipip_netlink_parms(data, &p, &t->collect_md, &fwmark); |
514 | return ip_tunnel_newlink(dev, tb, &p, fwmark); | |
be42da0e ND |
515 | } |
516 | ||
517 | static int ipip_changelink(struct net_device *dev, struct nlattr *tb[], | |
ad744b22 MS |
518 | struct nlattr *data[], |
519 | struct netlink_ext_ack *extack) | |
be42da0e | 520 | { |
9830ad4c | 521 | struct ip_tunnel *t = netdev_priv(dev); |
be42da0e | 522 | struct ip_tunnel_parm p; |
473ab820 | 523 | struct ip_tunnel_encap ipencap; |
cfc7381b | 524 | bool collect_md; |
9830ad4c | 525 | __u32 fwmark = t->fwmark; |
473ab820 TH |
526 | |
527 | if (ipip_netlink_encap_parms(data, &ipencap)) { | |
473ab820 TH |
528 | int err = ip_tunnel_encap_setup(t, &ipencap); |
529 | ||
530 | if (err < 0) | |
531 | return err; | |
532 | } | |
be42da0e | 533 | |
9830ad4c | 534 | ipip_netlink_parms(data, &p, &collect_md, &fwmark); |
cfc7381b AS |
535 | if (collect_md) |
536 | return -EINVAL; | |
be42da0e ND |
537 | |
538 | if (((dev->flags & IFF_POINTOPOINT) && !p.iph.daddr) || | |
539 | (!(dev->flags & IFF_POINTOPOINT) && p.iph.daddr)) | |
540 | return -EINVAL; | |
541 | ||
9830ad4c | 542 | return ip_tunnel_changelink(dev, tb, &p, fwmark); |
be42da0e ND |
543 | } |
544 | ||
0974658d ND |
545 | static size_t ipip_get_size(const struct net_device *dev) |
546 | { | |
547 | return | |
548 | /* IFLA_IPTUN_LINK */ | |
549 | nla_total_size(4) + | |
550 | /* IFLA_IPTUN_LOCAL */ | |
551 | nla_total_size(4) + | |
552 | /* IFLA_IPTUN_REMOTE */ | |
553 | nla_total_size(4) + | |
554 | /* IFLA_IPTUN_TTL */ | |
555 | nla_total_size(1) + | |
556 | /* IFLA_IPTUN_TOS */ | |
557 | nla_total_size(1) + | |
1b69e7e6 SH |
558 | /* IFLA_IPTUN_PROTO */ |
559 | nla_total_size(1) + | |
befe2aa1 ND |
560 | /* IFLA_IPTUN_PMTUDISC */ |
561 | nla_total_size(1) + | |
473ab820 TH |
562 | /* IFLA_IPTUN_ENCAP_TYPE */ |
563 | nla_total_size(2) + | |
564 | /* IFLA_IPTUN_ENCAP_FLAGS */ | |
565 | nla_total_size(2) + | |
566 | /* IFLA_IPTUN_ENCAP_SPORT */ | |
567 | nla_total_size(2) + | |
568 | /* IFLA_IPTUN_ENCAP_DPORT */ | |
569 | nla_total_size(2) + | |
cfc7381b AS |
570 | /* IFLA_IPTUN_COLLECT_METADATA */ |
571 | nla_total_size(0) + | |
9830ad4c CG |
572 | /* IFLA_IPTUN_FWMARK */ |
573 | nla_total_size(4) + | |
0974658d ND |
574 | 0; |
575 | } | |
576 | ||
577 | static int ipip_fill_info(struct sk_buff *skb, const struct net_device *dev) | |
578 | { | |
579 | struct ip_tunnel *tunnel = netdev_priv(dev); | |
580 | struct ip_tunnel_parm *parm = &tunnel->parms; | |
581 | ||
582 | if (nla_put_u32(skb, IFLA_IPTUN_LINK, parm->link) || | |
930345ea JB |
583 | nla_put_in_addr(skb, IFLA_IPTUN_LOCAL, parm->iph.saddr) || |
584 | nla_put_in_addr(skb, IFLA_IPTUN_REMOTE, parm->iph.daddr) || | |
0974658d | 585 | nla_put_u8(skb, IFLA_IPTUN_TTL, parm->iph.ttl) || |
befe2aa1 | 586 | nla_put_u8(skb, IFLA_IPTUN_TOS, parm->iph.tos) || |
1b69e7e6 | 587 | nla_put_u8(skb, IFLA_IPTUN_PROTO, parm->iph.protocol) || |
befe2aa1 | 588 | nla_put_u8(skb, IFLA_IPTUN_PMTUDISC, |
9830ad4c CG |
589 | !!(parm->iph.frag_off & htons(IP_DF))) || |
590 | nla_put_u32(skb, IFLA_IPTUN_FWMARK, tunnel->fwmark)) | |
0974658d | 591 | goto nla_put_failure; |
473ab820 TH |
592 | |
593 | if (nla_put_u16(skb, IFLA_IPTUN_ENCAP_TYPE, | |
594 | tunnel->encap.type) || | |
3e97fa70 SD |
595 | nla_put_be16(skb, IFLA_IPTUN_ENCAP_SPORT, |
596 | tunnel->encap.sport) || | |
597 | nla_put_be16(skb, IFLA_IPTUN_ENCAP_DPORT, | |
598 | tunnel->encap.dport) || | |
473ab820 | 599 | nla_put_u16(skb, IFLA_IPTUN_ENCAP_FLAGS, |
e1b2cb65 | 600 | tunnel->encap.flags)) |
473ab820 TH |
601 | goto nla_put_failure; |
602 | ||
cfc7381b AS |
603 | if (tunnel->collect_md) |
604 | if (nla_put_flag(skb, IFLA_IPTUN_COLLECT_METADATA)) | |
605 | goto nla_put_failure; | |
0974658d ND |
606 | return 0; |
607 | ||
608 | nla_put_failure: | |
609 | return -EMSGSIZE; | |
610 | } | |
611 | ||
be42da0e ND |
612 | static const struct nla_policy ipip_policy[IFLA_IPTUN_MAX + 1] = { |
613 | [IFLA_IPTUN_LINK] = { .type = NLA_U32 }, | |
614 | [IFLA_IPTUN_LOCAL] = { .type = NLA_U32 }, | |
615 | [IFLA_IPTUN_REMOTE] = { .type = NLA_U32 }, | |
616 | [IFLA_IPTUN_TTL] = { .type = NLA_U8 }, | |
617 | [IFLA_IPTUN_TOS] = { .type = NLA_U8 }, | |
1b69e7e6 | 618 | [IFLA_IPTUN_PROTO] = { .type = NLA_U8 }, |
be42da0e | 619 | [IFLA_IPTUN_PMTUDISC] = { .type = NLA_U8 }, |
473ab820 TH |
620 | [IFLA_IPTUN_ENCAP_TYPE] = { .type = NLA_U16 }, |
621 | [IFLA_IPTUN_ENCAP_FLAGS] = { .type = NLA_U16 }, | |
622 | [IFLA_IPTUN_ENCAP_SPORT] = { .type = NLA_U16 }, | |
623 | [IFLA_IPTUN_ENCAP_DPORT] = { .type = NLA_U16 }, | |
cfc7381b | 624 | [IFLA_IPTUN_COLLECT_METADATA] = { .type = NLA_FLAG }, |
9830ad4c | 625 | [IFLA_IPTUN_FWMARK] = { .type = NLA_U32 }, |
be42da0e ND |
626 | }; |
627 | ||
0974658d ND |
628 | static struct rtnl_link_ops ipip_link_ops __read_mostly = { |
629 | .kind = "ipip", | |
630 | .maxtype = IFLA_IPTUN_MAX, | |
be42da0e | 631 | .policy = ipip_policy, |
0974658d | 632 | .priv_size = sizeof(struct ip_tunnel), |
be42da0e | 633 | .setup = ipip_tunnel_setup, |
1b69e7e6 | 634 | .validate = ipip_tunnel_validate, |
be42da0e ND |
635 | .newlink = ipip_newlink, |
636 | .changelink = ipip_changelink, | |
fd58156e | 637 | .dellink = ip_tunnel_dellink, |
0974658d ND |
638 | .get_size = ipip_get_size, |
639 | .fill_info = ipip_fill_info, | |
1728d4fa | 640 | .get_link_net = ip_tunnel_get_link_net, |
0974658d ND |
641 | }; |
642 | ||
6dcd814b | 643 | static struct xfrm_tunnel ipip_handler __read_mostly = { |
1da177e4 LT |
644 | .handler = ipip_rcv, |
645 | .err_handler = ipip_err, | |
d2acc347 | 646 | .priority = 1, |
1da177e4 LT |
647 | }; |
648 | ||
1b69e7e6 SH |
649 | #if IS_ENABLED(CONFIG_MPLS) |
650 | static struct xfrm_tunnel mplsip_handler __read_mostly = { | |
651 | .handler = mplsip_rcv, | |
652 | .err_handler = ipip_err, | |
653 | .priority = 1, | |
654 | }; | |
655 | #endif | |
656 | ||
2c8c1e72 | 657 | static int __net_init ipip_init_net(struct net *net) |
10dc4c7b | 658 | { |
fd58156e | 659 | return ip_tunnel_init_net(net, ipip_net_id, &ipip_link_ops, "tunl0"); |
10dc4c7b PE |
660 | } |
661 | ||
64bc1781 | 662 | static void __net_exit ipip_exit_batch_net(struct list_head *list_net) |
10dc4c7b | 663 | { |
64bc1781 | 664 | ip_tunnel_delete_nets(list_net, ipip_net_id, &ipip_link_ops); |
10dc4c7b PE |
665 | } |
666 | ||
667 | static struct pernet_operations ipip_net_ops = { | |
668 | .init = ipip_init_net, | |
64bc1781 | 669 | .exit_batch = ipip_exit_batch_net, |
86de8a63 | 670 | .id = &ipip_net_id, |
fd58156e | 671 | .size = sizeof(struct ip_tunnel_net), |
10dc4c7b PE |
672 | }; |
673 | ||
1da177e4 LT |
674 | static int __init ipip_init(void) |
675 | { | |
676 | int err; | |
677 | ||
1b69e7e6 | 678 | pr_info("ipip: IPv4 and MPLS over IPv4 tunneling driver\n"); |
1da177e4 | 679 | |
d5aa407f AD |
680 | err = register_pernet_device(&ipip_net_ops); |
681 | if (err < 0) | |
682 | return err; | |
683 | err = xfrm4_tunnel_register(&ipip_handler, AF_INET); | |
684 | if (err < 0) { | |
058bd4d2 | 685 | pr_info("%s: can't register tunnel\n", __func__); |
1b69e7e6 SH |
686 | goto xfrm_tunnel_ipip_failed; |
687 | } | |
688 | #if IS_ENABLED(CONFIG_MPLS) | |
689 | err = xfrm4_tunnel_register(&mplsip_handler, AF_MPLS); | |
690 | if (err < 0) { | |
691 | pr_info("%s: can't register tunnel\n", __func__); | |
692 | goto xfrm_tunnel_mplsip_failed; | |
1da177e4 | 693 | } |
1b69e7e6 | 694 | #endif |
0974658d ND |
695 | err = rtnl_link_register(&ipip_link_ops); |
696 | if (err < 0) | |
697 | goto rtnl_link_failed; | |
698 | ||
699 | out: | |
1da177e4 | 700 | return err; |
0974658d ND |
701 | |
702 | rtnl_link_failed: | |
1b69e7e6 SH |
703 | #if IS_ENABLED(CONFIG_MPLS) |
704 | xfrm4_tunnel_deregister(&mplsip_handler, AF_INET); | |
705 | xfrm_tunnel_mplsip_failed: | |
706 | ||
707 | #endif | |
0974658d | 708 | xfrm4_tunnel_deregister(&ipip_handler, AF_INET); |
1b69e7e6 | 709 | xfrm_tunnel_ipip_failed: |
0974658d ND |
710 | unregister_pernet_device(&ipip_net_ops); |
711 | goto out; | |
1da177e4 LT |
712 | } |
713 | ||
714 | static void __exit ipip_fini(void) | |
715 | { | |
0974658d | 716 | rtnl_link_unregister(&ipip_link_ops); |
c0d56408 | 717 | if (xfrm4_tunnel_deregister(&ipip_handler, AF_INET)) |
058bd4d2 | 718 | pr_info("%s: can't deregister tunnel\n", __func__); |
1b69e7e6 SH |
719 | #if IS_ENABLED(CONFIG_MPLS) |
720 | if (xfrm4_tunnel_deregister(&mplsip_handler, AF_MPLS)) | |
721 | pr_info("%s: can't deregister tunnel\n", __func__); | |
722 | #endif | |
86de8a63 | 723 | unregister_pernet_device(&ipip_net_ops); |
1da177e4 LT |
724 | } |
725 | ||
726 | module_init(ipip_init); | |
727 | module_exit(ipip_fini); | |
728 | MODULE_LICENSE("GPL"); | |
f98f89a0 | 729 | MODULE_ALIAS_RTNL_LINK("ipip"); |
8909c9ad | 730 | MODULE_ALIAS_NETDEV("tunl0"); |