]> git.proxmox.com Git - mirror_ubuntu-jammy-kernel.git/blame - net/ipv4/ip_gre.c
tools headers UAPI: Sync linux/prctl.h with the kernel sources
[mirror_ubuntu-jammy-kernel.git] / net / ipv4 / ip_gre.c
CommitLineData
2874c5fd 1// SPDX-License-Identifier: GPL-2.0-or-later
1da177e4 2/*
e905a9ed 3 * Linux NET3: GRE over IP protocol decoder.
1da177e4
LT
4 *
5 * Authors: Alexey Kuznetsov (kuznet@ms2.inr.ac.ru)
1da177e4
LT
6 */
7
afd46503
JP
8#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
9
4fc268d2 10#include <linux/capability.h>
1da177e4
LT
11#include <linux/module.h>
12#include <linux/types.h>
1da177e4 13#include <linux/kernel.h>
5a0e3ad6 14#include <linux/slab.h>
7c0f6ba6 15#include <linux/uaccess.h>
1da177e4
LT
16#include <linux/skbuff.h>
17#include <linux/netdevice.h>
18#include <linux/in.h>
19#include <linux/tcp.h>
20#include <linux/udp.h>
21#include <linux/if_arp.h>
2e15ea39 22#include <linux/if_vlan.h>
1da177e4
LT
23#include <linux/init.h>
24#include <linux/in6.h>
25#include <linux/inetdevice.h>
26#include <linux/igmp.h>
27#include <linux/netfilter_ipv4.h>
e1a80002 28#include <linux/etherdevice.h>
46f25dff 29#include <linux/if_ether.h>
1da177e4
LT
30
31#include <net/sock.h>
32#include <net/ip.h>
33#include <net/icmp.h>
34#include <net/protocol.h>
c5441932 35#include <net/ip_tunnels.h>
1da177e4
LT
36#include <net/arp.h>
37#include <net/checksum.h>
38#include <net/dsfield.h>
39#include <net/inet_ecn.h>
40#include <net/xfrm.h>
59a4c759
PE
41#include <net/net_namespace.h>
42#include <net/netns/generic.h>
c19e654d 43#include <net/rtnetlink.h>
00959ade 44#include <net/gre.h>
2e15ea39 45#include <net/dst_metadata.h>
84e54fe0 46#include <net/erspan.h>
1da177e4 47
1da177e4
LT
48/*
49 Problems & solutions
50 --------------------
51
52 1. The most important issue is detecting local dead loops.
53 They would cause complete host lockup in transmit, which
54 would be "resolved" by stack overflow or, if queueing is enabled,
55 with infinite looping in net_bh.
56
57 We cannot track such dead loops during route installation,
58 it is infeasible task. The most general solutions would be
59 to keep skb->encapsulation counter (sort of local ttl),
6d0722a2 60 and silently drop packet when it expires. It is a good
bff52857 61 solution, but it supposes maintaining new variable in ALL
1da177e4
LT
62 skb, even if no tunneling is used.
63
6d0722a2
ED
64 Current solution: xmit_recursion breaks dead loops. This is a percpu
65 counter, since when we enter the first ndo_xmit(), cpu migration is
66 forbidden. We force an exit if this counter reaches RECURSION_LIMIT
1da177e4
LT
67
68 2. Networking dead loops would not kill routers, but would really
69 kill network. IP hop limit plays role of "t->recursion" in this case,
70 if we copy it from packet being encapsulated to upper header.
71 It is very good solution, but it introduces two problems:
72
73 - Routing protocols, using packets with ttl=1 (OSPF, RIP2),
74 do not work over tunnels.
75 - traceroute does not work. I planned to relay ICMP from tunnel,
76 so that this problem would be solved and traceroute output
77 would be even more informative. This idea appeared to be wrong:
78 only Linux complies to rfc1812 now (yes, guys, Linux is the only
79 true router now :-)), all routers (at least, in neighbourhood of mine)
80 return only 8 bytes of payload. It is the end.
81
82 Hence, if we want that OSPF worked or traceroute said something reasonable,
83 we should search for another solution.
84
85 One of them is to parse packet trying to detect inner encapsulation
86 made by our node. It is difficult or even impossible, especially,
bff52857 87 taking into account fragmentation. To be short, ttl is not solution at all.
1da177e4
LT
88
89 Current solution: The solution was UNEXPECTEDLY SIMPLE.
90 We force DF flag on tunnels with preconfigured hop limit,
91 that is ALL. :-) Well, it does not remove the problem completely,
92 but exponential growth of network traffic is changed to linear
93 (branches, that exceed pmtu are pruned) and tunnel mtu
bff52857 94 rapidly degrades to value <68, where looping stops.
1da177e4
LT
95 Yes, it is not good if there exists a router in the loop,
96 which does not force DF, even when encapsulating packets have DF set.
97 But it is not our problem! Nobody could accuse us, we made
98 all that we could make. Even if it is your gated who injected
99 fatal route to network, even if it were you who configured
100 fatal static route: you are innocent. :-)
101
1da177e4
LT
102 Alexey Kuznetsov.
103 */
104
eccc1bb8 105static bool log_ecn_error = true;
106module_param(log_ecn_error, bool, 0644);
107MODULE_PARM_DESC(log_ecn_error, "Log packets received with corrupted ECN");
108
c19e654d 109static struct rtnl_link_ops ipgre_link_ops __read_mostly;
aab1e898
GN
110static const struct header_ops ipgre_header_ops;
111
1da177e4 112static int ipgre_tunnel_init(struct net_device *dev);
1a66a836 113static void erspan_build_header(struct sk_buff *skb,
c69de58b 114 u32 id, u32 index,
a3222dc9 115 bool truncate, bool is_ipv4);
eb8ce741 116
c7d03a00
AD
117static unsigned int ipgre_net_id __read_mostly;
118static unsigned int gre_tap_net_id __read_mostly;
84e54fe0 119static unsigned int erspan_net_id __read_mostly;
1da177e4 120
32bbd879
SB
121static int ipgre_err(struct sk_buff *skb, u32 info,
122 const struct tnl_ptk_info *tpi)
1da177e4 123{
1da177e4 124
c5441932
PS
125 /* All the routers (except for Linux) return only
126 8 bytes of packet payload. It means, that precise relaying of
127 ICMP in the real Internet is absolutely infeasible.
1da177e4 128
c5441932
PS
129 Moreover, Cisco "wise men" put GRE key to the third word
130 in GRE header. It makes impossible maintaining even soft
131 state for keyed GRE tunnels with enabled checksum. Tell
132 them "thank you".
1da177e4 133
c5441932
PS
134 Well, I wonder, rfc1812 was written by Cisco employee,
135 what the hell these idiots break standards established
136 by themselves???
137 */
138 struct net *net = dev_net(skb->dev);
139 struct ip_tunnel_net *itn;
96f5a846 140 const struct iphdr *iph;
88c7664f
ACM
141 const int type = icmp_hdr(skb)->type;
142 const int code = icmp_hdr(skb)->code;
20e1954f 143 unsigned int data_len = 0;
1da177e4 144 struct ip_tunnel *t;
1da177e4 145
32bbd879
SB
146 if (tpi->proto == htons(ETH_P_TEB))
147 itn = net_generic(net, gre_tap_net_id);
148 else if (tpi->proto == htons(ETH_P_ERSPAN) ||
149 tpi->proto == htons(ETH_P_ERSPAN2))
150 itn = net_generic(net, erspan_net_id);
151 else
152 itn = net_generic(net, ipgre_net_id);
153
154 iph = (const struct iphdr *)(icmp_hdr(skb) + 1);
155 t = ip_tunnel_lookup(itn, skb->dev->ifindex, tpi->flags,
156 iph->daddr, iph->saddr, tpi->key);
157
158 if (!t)
159 return -ENOENT;
160
1da177e4
LT
161 switch (type) {
162 default:
163 case ICMP_PARAMETERPROB:
32bbd879 164 return 0;
1da177e4
LT
165
166 case ICMP_DEST_UNREACH:
167 switch (code) {
168 case ICMP_SR_FAILED:
169 case ICMP_PORT_UNREACH:
170 /* Impossible event. */
32bbd879 171 return 0;
1da177e4
LT
172 default:
173 /* All others are translated to HOST_UNREACH.
174 rfc2003 contains "deep thoughts" about NET_UNREACH,
175 I believe they are just ether pollution. --ANK
176 */
177 break;
178 }
179 break;
9f57c67c 180
1da177e4
LT
181 case ICMP_TIME_EXCEEDED:
182 if (code != ICMP_EXC_TTL)
32bbd879 183 return 0;
20e1954f 184 data_len = icmp_hdr(skb)->un.reserved[1] * 4; /* RFC 4884 4.1 */
1da177e4 185 break;
55be7a9c
DM
186
187 case ICMP_REDIRECT:
188 break;
1da177e4
LT
189 }
190
9b8c6d7b
ED
191#if IS_ENABLED(CONFIG_IPV6)
192 if (tpi->proto == htons(ETH_P_IPV6) &&
20e1954f
ED
193 !ip6_err_gen_icmpv6_unreach(skb, iph->ihl * 4 + tpi->hdr_len,
194 type, data_len))
32bbd879 195 return 0;
9b8c6d7b
ED
196#endif
197
36393395 198 if (t->parms.iph.daddr == 0 ||
f97c1e0c 199 ipv4_is_multicast(t->parms.iph.daddr))
32bbd879 200 return 0;
1da177e4
LT
201
202 if (t->parms.iph.ttl == 0 && type == ICMP_TIME_EXCEEDED)
32bbd879 203 return 0;
1da177e4 204
da6185d8 205 if (time_before(jiffies, t->err_time + IPTUNNEL_ERR_TIMEO))
1da177e4
LT
206 t->err_count++;
207 else
208 t->err_count = 1;
209 t->err_time = jiffies;
32bbd879
SB
210
211 return 0;
9f57c67c
PS
212}
213
214static void gre_err(struct sk_buff *skb, u32 info)
215{
216 /* All the routers (except for Linux) return only
217 * 8 bytes of packet payload. It means, that precise relaying of
218 * ICMP in the real Internet is absolutely infeasible.
219 *
220 * Moreover, Cisco "wise men" put GRE key to the third word
221 * in GRE header. It makes impossible maintaining even soft
222 * state for keyed
223 * GRE tunnels with enabled checksum. Tell them "thank you".
224 *
225 * Well, I wonder, rfc1812 was written by Cisco employee,
226 * what the hell these idiots break standards established
227 * by themselves???
228 */
229
e582615a 230 const struct iphdr *iph = (struct iphdr *)skb->data;
9f57c67c
PS
231 const int type = icmp_hdr(skb)->type;
232 const int code = icmp_hdr(skb)->code;
233 struct tnl_ptk_info tpi;
9f57c67c 234
b0350d51
HY
235 if (gre_parse_header(skb, &tpi, NULL, htons(ETH_P_IP),
236 iph->ihl * 4) < 0)
237 return;
9f57c67c
PS
238
239 if (type == ICMP_DEST_UNREACH && code == ICMP_FRAG_NEEDED) {
240 ipv4_update_pmtu(skb, dev_net(skb->dev), info,
d888f396 241 skb->dev->ifindex, IPPROTO_GRE);
9f57c67c
PS
242 return;
243 }
244 if (type == ICMP_REDIRECT) {
1042caa7
MÅ»
245 ipv4_redirect(skb, dev_net(skb->dev), skb->dev->ifindex,
246 IPPROTO_GRE);
9f57c67c
PS
247 return;
248 }
249
250 ipgre_err(skb, info, &tpi);
1da177e4
LT
251}
252
f989d546
WT
/*
 * ERSPAN type I (version 0) and type II (version 1) share protocol
 * 0x88BE; they are told apart by GRE header size: type I uses a 4-byte
 * GRE header, type II an 8-byte one.
 *
 * Returns true when @gre_hdr_len identifies a type I packet.
 */
static bool is_erspan_type1(int gre_hdr_len)
{
	enum { ERSPAN_TYPE1_GRE_HDR_LEN = 4 };

	if (gre_hdr_len != ERSPAN_TYPE1_GRE_HDR_LEN)
		return false;
	return true;
}
261
84e54fe0
WT
262static int erspan_rcv(struct sk_buff *skb, struct tnl_ptk_info *tpi,
263 int gre_hdr_len)
264{
265 struct net *net = dev_net(skb->dev);
266 struct metadata_dst *tun_dst = NULL;
1d7e2ed2 267 struct erspan_base_hdr *ershdr;
84e54fe0
WT
268 struct ip_tunnel_net *itn;
269 struct ip_tunnel *tunnel;
84e54fe0 270 const struct iphdr *iph;
3df19283 271 struct erspan_md2 *md2;
1d7e2ed2 272 int ver;
84e54fe0
WT
273 int len;
274
275 itn = net_generic(net, erspan_net_id);
84e54fe0 276 iph = ip_hdr(skb);
f989d546
WT
277 if (is_erspan_type1(gre_hdr_len)) {
278 ver = 0;
279 tunnel = ip_tunnel_lookup(itn, skb->dev->ifindex,
280 tpi->flags | TUNNEL_NO_KEY,
281 iph->saddr, iph->daddr, 0);
282 } else {
283 ershdr = (struct erspan_base_hdr *)(skb->data + gre_hdr_len);
284 ver = ershdr->ver;
285 tunnel = ip_tunnel_lookup(itn, skb->dev->ifindex,
286 tpi->flags | TUNNEL_KEY,
287 iph->saddr, iph->daddr, tpi->key);
288 }
84e54fe0
WT
289
290 if (tunnel) {
f989d546
WT
291 if (is_erspan_type1(gre_hdr_len))
292 len = gre_hdr_len;
293 else
294 len = gre_hdr_len + erspan_hdr_len(ver);
295
1d7e2ed2 296 if (unlikely(!pskb_may_pull(skb, len)))
ae3e1337 297 return PACKET_REJECT;
1d7e2ed2 298
84e54fe0 299 if (__iptunnel_pull_header(skb,
1d7e2ed2 300 len,
84e54fe0
WT
301 htons(ETH_P_TEB),
302 false, false) < 0)
303 goto drop;
304
1a66a836 305 if (tunnel->collect_md) {
492b67e2 306 struct erspan_metadata *pkt_md, *md;
1a66a836 307 struct ip_tunnel_info *info;
492b67e2 308 unsigned char *gh;
1a66a836
WT
309 __be64 tun_id;
310 __be16 flags;
311
312 tpi->flags |= TUNNEL_KEY;
313 flags = tpi->flags;
314 tun_id = key32_to_tunnel_id(tpi->key);
315
316 tun_dst = ip_tun_rx_dst(skb, flags,
317 tun_id, sizeof(*md));
318 if (!tun_dst)
319 return PACKET_REJECT;
320
492b67e2
LB
321 /* skb can be uncloned in __iptunnel_pull_header, so
322 * old pkt_md is no longer valid and we need to reset
323 * it
324 */
325 gh = skb_network_header(skb) +
326 skb_network_header_len(skb);
327 pkt_md = (struct erspan_metadata *)(gh + gre_hdr_len +
328 sizeof(*ershdr));
1a66a836 329 md = ip_tunnel_info_opts(&tun_dst->u.tun_info);
f551c91d 330 md->version = ver;
3df19283
WT
331 md2 = &md->u.md2;
332 memcpy(md2, pkt_md, ver == 1 ? ERSPAN_V1_MDSIZE :
333 ERSPAN_V2_MDSIZE);
f551c91d 334
1a66a836
WT
335 info = &tun_dst->u.tun_info;
336 info->key.tun_flags |= TUNNEL_ERSPAN_OPT;
337 info->options_len = sizeof(*md);
1a66a836
WT
338 }
339
84e54fe0
WT
340 skb_reset_mac_header(skb);
341 ip_tunnel_rcv(tunnel, skb, tpi, tun_dst, log_ecn_error);
342 return PACKET_RCVD;
343 }
5a64506b
HY
344 return PACKET_REJECT;
345
84e54fe0
WT
346drop:
347 kfree_skb(skb);
348 return PACKET_RCVD;
349}
350
125372fa
JB
351static int __ipgre_rcv(struct sk_buff *skb, const struct tnl_ptk_info *tpi,
352 struct ip_tunnel_net *itn, int hdr_len, bool raw_proto)
1da177e4 353{
2e15ea39 354 struct metadata_dst *tun_dst = NULL;
b71d1d42 355 const struct iphdr *iph;
1da177e4 356 struct ip_tunnel *tunnel;
1da177e4 357
c5441932 358 iph = ip_hdr(skb);
bda7bb46
PS
359 tunnel = ip_tunnel_lookup(itn, skb->dev->ifindex, tpi->flags,
360 iph->saddr, iph->daddr, tpi->key);
e1a80002 361
d2083287 362 if (tunnel) {
c0d59da7 363 const struct iphdr *tnl_params;
364
125372fa
JB
365 if (__iptunnel_pull_header(skb, hdr_len, tpi->proto,
366 raw_proto, false) < 0)
244a797b
JB
367 goto drop;
368
aab1e898
GN
369 /* Special case for ipgre_header_parse(), which expects the
370 * mac_header to point to the outer IP header.
371 */
372 if (tunnel->dev->header_ops == &ipgre_header_ops)
e271c7b4
JB
373 skb_pop_mac_header(skb);
374 else
375 skb_reset_mac_header(skb);
c0d59da7 376
377 tnl_params = &tunnel->parms.iph;
378 if (tunnel->collect_md || tnl_params->daddr == 0) {
c29a70d2
PS
379 __be16 flags;
380 __be64 tun_id;
2e15ea39 381
c29a70d2 382 flags = tpi->flags & (TUNNEL_CSUM | TUNNEL_KEY);
d817f432 383 tun_id = key32_to_tunnel_id(tpi->key);
c29a70d2 384 tun_dst = ip_tun_rx_dst(skb, flags, tun_id, 0);
2e15ea39
PS
385 if (!tun_dst)
386 return PACKET_REJECT;
2e15ea39
PS
387 }
388
389 ip_tunnel_rcv(tunnel, skb, tpi, tun_dst, log_ecn_error);
bda7bb46 390 return PACKET_RCVD;
1da177e4 391 }
125372fa 392 return PACKET_NEXT;
244a797b
JB
393
394drop:
395 kfree_skb(skb);
396 return PACKET_RCVD;
1da177e4
LT
397}
398
125372fa
JB
399static int ipgre_rcv(struct sk_buff *skb, const struct tnl_ptk_info *tpi,
400 int hdr_len)
401{
402 struct net *net = dev_net(skb->dev);
403 struct ip_tunnel_net *itn;
404 int res;
405
406 if (tpi->proto == htons(ETH_P_TEB))
407 itn = net_generic(net, gre_tap_net_id);
408 else
409 itn = net_generic(net, ipgre_net_id);
410
411 res = __ipgre_rcv(skb, tpi, itn, hdr_len, false);
412 if (res == PACKET_NEXT && tpi->proto == htons(ETH_P_TEB)) {
413 /* ipgre tunnels in collect metadata mode should receive
414 * also ETH_P_TEB traffic.
415 */
416 itn = net_generic(net, ipgre_net_id);
417 res = __ipgre_rcv(skb, tpi, itn, hdr_len, true);
418 }
419 return res;
420}
421
9f57c67c
PS
422static int gre_rcv(struct sk_buff *skb)
423{
424 struct tnl_ptk_info tpi;
425 bool csum_err = false;
95f5c64c 426 int hdr_len;
9f57c67c
PS
427
428#ifdef CONFIG_NET_IPGRE_BROADCAST
429 if (ipv4_is_multicast(ip_hdr(skb)->daddr)) {
430 /* Looped back packet, drop it! */
431 if (rt_is_output_route(skb_rtable(skb)))
432 goto drop;
433 }
434#endif
435
e582615a 436 hdr_len = gre_parse_header(skb, &tpi, &csum_err, htons(ETH_P_IP), 0);
f132ae7c 437 if (hdr_len < 0)
95f5c64c
TH
438 goto drop;
439
f551c91d
WT
440 if (unlikely(tpi.proto == htons(ETH_P_ERSPAN) ||
441 tpi.proto == htons(ETH_P_ERSPAN2))) {
84e54fe0
WT
442 if (erspan_rcv(skb, &tpi, hdr_len) == PACKET_RCVD)
443 return 0;
dd8d5b8c 444 goto out;
84e54fe0
WT
445 }
446
244a797b 447 if (ipgre_rcv(skb, &tpi, hdr_len) == PACKET_RCVD)
9f57c67c
PS
448 return 0;
449
dd8d5b8c 450out:
9f57c67c
PS
451 icmp_send(skb, ICMP_DEST_UNREACH, ICMP_PORT_UNREACH, 0);
452drop:
453 kfree_skb(skb);
454 return 0;
455}
456
c5441932
PS
457static void __gre_xmit(struct sk_buff *skb, struct net_device *dev,
458 const struct iphdr *tnl_params,
459 __be16 proto)
460{
461 struct ip_tunnel *tunnel = netdev_priv(dev);
1da177e4 462
c5441932
PS
463 if (tunnel->parms.o_flags & TUNNEL_SEQ)
464 tunnel->o_seqno++;
1da177e4 465
c5441932 466 /* Push GRE header. */
182a352d
TH
467 gre_build_header(skb, tunnel->tun_hlen,
468 tunnel->parms.o_flags, proto, tunnel->parms.o_key,
469 htonl(tunnel->o_seqno));
54bc9bac 470
bf3d6a8f 471 ip_tunnel_xmit(skb, dev, tnl_params, tnl_params->protocol);
c5441932 472}
1da177e4 473
aed069df 474static int gre_handle_offloads(struct sk_buff *skb, bool csum)
b2acd1dc 475{
6fa79666 476 return iptunnel_handle_offloads(skb, csum ? SKB_GSO_GRE_CSUM : SKB_GSO_GRE);
b2acd1dc
PS
477}
478
862a03c3
WT
479static void gre_fb_xmit(struct sk_buff *skb, struct net_device *dev,
480 __be16 proto)
481{
77a5196a 482 struct ip_tunnel *tunnel = netdev_priv(dev);
862a03c3
WT
483 struct ip_tunnel_info *tun_info;
484 const struct ip_tunnel_key *key;
862a03c3 485 int tunnel_hlen;
962924fa 486 __be16 flags;
862a03c3
WT
487
488 tun_info = skb_tunnel_info(skb);
489 if (unlikely(!tun_info || !(tun_info->mode & IP_TUNNEL_INFO_TX) ||
490 ip_tunnel_info_af(tun_info) != AF_INET))
491 goto err_free_skb;
492
493 key = &tun_info->key;
494 tunnel_hlen = gre_calc_hlen(key->tun_flags);
495
962924fa 496 if (skb_cow_head(skb, dev->needed_headroom))
497 goto err_free_skb;
2e15ea39
PS
498
499 /* Push Tunnel header. */
aed069df 500 if (gre_handle_offloads(skb, !!(tun_info->key.tun_flags & TUNNEL_CSUM)))
962924fa 501 goto err_free_skb;
2e15ea39 502
77a5196a
WT
503 flags = tun_info->key.tun_flags &
504 (TUNNEL_CSUM | TUNNEL_KEY | TUNNEL_SEQ);
cba65321 505 gre_build_header(skb, tunnel_hlen, flags, proto,
77a5196a 506 tunnel_id_to_key32(tun_info->key.tun_id),
15746394 507 (flags & TUNNEL_SEQ) ? htonl(tunnel->o_seqno++) : 0);
2e15ea39 508
962924fa 509 ip_md_tunnel_xmit(skb, dev, IPPROTO_GRE, tunnel_hlen);
039f5062 510
2e15ea39
PS
511 return;
512
2e15ea39
PS
513err_free_skb:
514 kfree_skb(skb);
515 dev->stats.tx_dropped++;
516}
517
20704bd1 518static void erspan_fb_xmit(struct sk_buff *skb, struct net_device *dev)
1a66a836
WT
519{
520 struct ip_tunnel *tunnel = netdev_priv(dev);
521 struct ip_tunnel_info *tun_info;
522 const struct ip_tunnel_key *key;
523 struct erspan_metadata *md;
1a66a836 524 bool truncate = false;
962924fa 525 __be16 proto;
1a66a836 526 int tunnel_hlen;
f551c91d 527 int version;
1baf5ebf 528 int nhoff;
d5db21a3 529 int thoff;
1a66a836
WT
530
531 tun_info = skb_tunnel_info(skb);
532 if (unlikely(!tun_info || !(tun_info->mode & IP_TUNNEL_INFO_TX) ||
533 ip_tunnel_info_af(tun_info) != AF_INET))
534 goto err_free_skb;
535
536 key = &tun_info->key;
256c87c1 537 if (!(tun_info->key.tun_flags & TUNNEL_ERSPAN_OPT))
962924fa 538 goto err_free_skb;
2eb8d6d2 539 if (tun_info->options_len < sizeof(*md))
962924fa 540 goto err_free_skb;
2eb8d6d2 541 md = ip_tunnel_info_opts(tun_info);
1a66a836
WT
542
543 /* ERSPAN has fixed 8 byte GRE header */
f551c91d
WT
544 version = md->version;
545 tunnel_hlen = 8 + erspan_hdr_len(version);
1a66a836 546
962924fa 547 if (skb_cow_head(skb, dev->needed_headroom))
548 goto err_free_skb;
1a66a836
WT
549
550 if (gre_handle_offloads(skb, false))
962924fa 551 goto err_free_skb;
1a66a836 552
f192970d
WT
553 if (skb->len > dev->mtu + dev->hard_header_len) {
554 pskb_trim(skb, dev->mtu + dev->hard_header_len);
1a66a836
WT
555 truncate = true;
556 }
557
1baf5ebf
WT
558 nhoff = skb_network_header(skb) - skb_mac_header(skb);
559 if (skb->protocol == htons(ETH_P_IP) &&
560 (ntohs(ip_hdr(skb)->tot_len) > skb->len - nhoff))
561 truncate = true;
d5db21a3
WT
562
563 thoff = skb_transport_header(skb) - skb_mac_header(skb);
564 if (skb->protocol == htons(ETH_P_IPV6) &&
565 (ntohs(ipv6_hdr(skb)->payload_len) > skb->len - thoff))
566 truncate = true;
1baf5ebf 567
f551c91d 568 if (version == 1) {
c69de58b 569 erspan_build_header(skb, ntohl(tunnel_id_to_key32(key->tun_id)),
f551c91d 570 ntohl(md->u.index), truncate, true);
20704bd1 571 proto = htons(ETH_P_ERSPAN);
f551c91d 572 } else if (version == 2) {
c69de58b
WT
573 erspan_build_header_v2(skb,
574 ntohl(tunnel_id_to_key32(key->tun_id)),
575 md->u.md2.dir,
576 get_hwid(&md->u.md2),
577 truncate, true);
20704bd1 578 proto = htons(ETH_P_ERSPAN2);
f551c91d 579 } else {
962924fa 580 goto err_free_skb;
f551c91d 581 }
1a66a836
WT
582
583 gre_build_header(skb, 8, TUNNEL_SEQ,
20704bd1 584 proto, 0, htonl(tunnel->o_seqno++));
1a66a836 585
962924fa 586 ip_md_tunnel_xmit(skb, dev, IPPROTO_GRE, tunnel_hlen);
1a66a836 587
1a66a836
WT
588 return;
589
1a66a836
WT
590err_free_skb:
591 kfree_skb(skb);
592 dev->stats.tx_dropped++;
593}
594
fc4099f1
PS
595static int gre_fill_metadata_dst(struct net_device *dev, struct sk_buff *skb)
596{
597 struct ip_tunnel_info *info = skb_tunnel_info(skb);
962924fa 598 const struct ip_tunnel_key *key;
fc4099f1
PS
599 struct rtable *rt;
600 struct flowi4 fl4;
601
602 if (ip_tunnel_info_af(info) != AF_INET)
603 return -EINVAL;
604
962924fa 605 key = &info->key;
606 ip_tunnel_init_flow(&fl4, IPPROTO_GRE, key->u.ipv4.dst, key->u.ipv4.src,
607 tunnel_id_to_key32(key->tun_id), key->tos, 0,
24ba1440 608 skb->mark, skb_get_hash(skb));
962924fa 609 rt = ip_route_output_key(dev_net(dev), &fl4);
fc4099f1
PS
610 if (IS_ERR(rt))
611 return PTR_ERR(rt);
612
613 ip_rt_put(rt);
614 info->key.u.ipv4.src = fl4.saddr;
615 return 0;
616}
617
c5441932
PS
618static netdev_tx_t ipgre_xmit(struct sk_buff *skb,
619 struct net_device *dev)
620{
621 struct ip_tunnel *tunnel = netdev_priv(dev);
622 const struct iphdr *tnl_params;
1da177e4 623
cb9f1b78
WB
624 if (!pskb_inet_may_pull(skb))
625 goto free_skb;
626
2e15ea39 627 if (tunnel->collect_md) {
2090714e 628 gre_fb_xmit(skb, dev, skb->protocol);
2e15ea39
PS
629 return NETDEV_TX_OK;
630 }
631
c5441932 632 if (dev->header_ops) {
8a0ed250
WB
633 const int pull_len = tunnel->hlen + sizeof(struct iphdr);
634
fdafed45 635 if (skb_cow_head(skb, 0))
c5441932 636 goto free_skb;
1da177e4 637
c5441932 638 tnl_params = (const struct iphdr *)skb->data;
1da177e4 639
8a0ed250
WB
640 if (pull_len > skb_transport_offset(skb))
641 goto free_skb;
642
c5441932
PS
643 /* Pull skb since ip_tunnel_xmit() needs skb->data pointing
644 * to gre header.
645 */
8a0ed250 646 skb_pull(skb, pull_len);
8a0033a9 647 skb_reset_mac_header(skb);
c5441932
PS
648 } else {
649 if (skb_cow_head(skb, dev->needed_headroom))
650 goto free_skb;
1da177e4 651
c5441932 652 tnl_params = &tunnel->parms.iph;
1da177e4
LT
653 }
654
aed069df
AD
655 if (gre_handle_offloads(skb, !!(tunnel->parms.o_flags & TUNNEL_CSUM)))
656 goto free_skb;
8a0033a9 657
c5441932 658 __gre_xmit(skb, dev, tnl_params, skb->protocol);
6ed10654 659 return NETDEV_TX_OK;
1da177e4 660
c5441932 661free_skb:
3acfa1e7 662 kfree_skb(skb);
c5441932 663 dev->stats.tx_dropped++;
6ed10654 664 return NETDEV_TX_OK;
1da177e4
LT
665}
666
84e54fe0
WT
667static netdev_tx_t erspan_xmit(struct sk_buff *skb,
668 struct net_device *dev)
669{
670 struct ip_tunnel *tunnel = netdev_priv(dev);
671 bool truncate = false;
20704bd1 672 __be16 proto;
84e54fe0 673
cb9f1b78
WB
674 if (!pskb_inet_may_pull(skb))
675 goto free_skb;
676
1a66a836 677 if (tunnel->collect_md) {
20704bd1 678 erspan_fb_xmit(skb, dev);
1a66a836
WT
679 return NETDEV_TX_OK;
680 }
681
84e54fe0
WT
682 if (gre_handle_offloads(skb, false))
683 goto free_skb;
684
685 if (skb_cow_head(skb, dev->needed_headroom))
686 goto free_skb;
687
f192970d
WT
688 if (skb->len > dev->mtu + dev->hard_header_len) {
689 pskb_trim(skb, dev->mtu + dev->hard_header_len);
84e54fe0
WT
690 truncate = true;
691 }
692
693 /* Push ERSPAN header */
f989d546
WT
694 if (tunnel->erspan_ver == 0) {
695 proto = htons(ETH_P_ERSPAN);
696 tunnel->parms.o_flags &= ~TUNNEL_SEQ;
697 } else if (tunnel->erspan_ver == 1) {
c69de58b
WT
698 erspan_build_header(skb, ntohl(tunnel->parms.o_key),
699 tunnel->index,
f551c91d 700 truncate, true);
20704bd1
XL
701 proto = htons(ETH_P_ERSPAN);
702 } else if (tunnel->erspan_ver == 2) {
c69de58b 703 erspan_build_header_v2(skb, ntohl(tunnel->parms.o_key),
f551c91d
WT
704 tunnel->dir, tunnel->hwid,
705 truncate, true);
20704bd1
XL
706 proto = htons(ETH_P_ERSPAN2);
707 } else {
02f99df1 708 goto free_skb;
20704bd1 709 }
f551c91d 710
84e54fe0 711 tunnel->parms.o_flags &= ~TUNNEL_KEY;
20704bd1 712 __gre_xmit(skb, dev, &tunnel->parms.iph, proto);
84e54fe0
WT
713 return NETDEV_TX_OK;
714
715free_skb:
716 kfree_skb(skb);
717 dev->stats.tx_dropped++;
718 return NETDEV_TX_OK;
719}
720
c5441932
PS
721static netdev_tx_t gre_tap_xmit(struct sk_buff *skb,
722 struct net_device *dev)
ee34c1eb 723{
c5441932 724 struct ip_tunnel *tunnel = netdev_priv(dev);
ee34c1eb 725
cb9f1b78
WB
726 if (!pskb_inet_may_pull(skb))
727 goto free_skb;
728
2e15ea39 729 if (tunnel->collect_md) {
2090714e 730 gre_fb_xmit(skb, dev, htons(ETH_P_TEB));
2e15ea39
PS
731 return NETDEV_TX_OK;
732 }
733
aed069df
AD
734 if (gre_handle_offloads(skb, !!(tunnel->parms.o_flags & TUNNEL_CSUM)))
735 goto free_skb;
ee34c1eb 736
c5441932
PS
737 if (skb_cow_head(skb, dev->needed_headroom))
738 goto free_skb;
42aa9162 739
c5441932 740 __gre_xmit(skb, dev, &tunnel->parms.iph, htons(ETH_P_TEB));
c5441932 741 return NETDEV_TX_OK;
ee34c1eb 742
c5441932 743free_skb:
3acfa1e7 744 kfree_skb(skb);
c5441932
PS
745 dev->stats.tx_dropped++;
746 return NETDEV_TX_OK;
ee34c1eb
MS
747}
748
dd9d598c
XL
749static void ipgre_link_update(struct net_device *dev, bool set_mtu)
750{
751 struct ip_tunnel *tunnel = netdev_priv(dev);
752 int len;
753
754 len = tunnel->tun_hlen;
755 tunnel->tun_hlen = gre_calc_hlen(tunnel->parms.o_flags);
756 len = tunnel->tun_hlen - len;
757 tunnel->hlen = tunnel->hlen + len;
758
fdafed45
CW
759 if (dev->header_ops)
760 dev->hard_header_len += len;
761 else
762 dev->needed_headroom += len;
763
dd9d598c
XL
764 if (set_mtu)
765 dev->mtu = max_t(int, dev->mtu - len, 68);
766
767 if (!(tunnel->parms.o_flags & TUNNEL_SEQ)) {
768 if (!(tunnel->parms.o_flags & TUNNEL_CSUM) ||
769 tunnel->encap.type == TUNNEL_ENCAP_NONE) {
770 dev->features |= NETIF_F_GSO_SOFTWARE;
771 dev->hw_features |= NETIF_F_GSO_SOFTWARE;
1cc5954f
SD
772 } else {
773 dev->features &= ~NETIF_F_GSO_SOFTWARE;
774 dev->hw_features &= ~NETIF_F_GSO_SOFTWARE;
dd9d598c
XL
775 }
776 dev->features |= NETIF_F_LLTX;
1cc5954f
SD
777 } else {
778 dev->hw_features &= ~NETIF_F_GSO_SOFTWARE;
779 dev->features &= ~(NETIF_F_LLTX | NETIF_F_GSO_SOFTWARE);
dd9d598c
XL
780 }
781}
782
607259a6
CH
783static int ipgre_tunnel_ctl(struct net_device *dev, struct ip_tunnel_parm *p,
784 int cmd)
1da177e4 785{
a0efab67 786 int err;
1da177e4 787
6c734fb8 788 if (cmd == SIOCADDTUNNEL || cmd == SIOCCHGTUNNEL) {
607259a6
CH
789 if (p->iph.version != 4 || p->iph.protocol != IPPROTO_GRE ||
790 p->iph.ihl != 5 || (p->iph.frag_off & htons(~IP_DF)) ||
791 ((p->i_flags | p->o_flags) & (GRE_VERSION | GRE_ROUTING)))
6c734fb8 792 return -EINVAL;
1da177e4 793 }
a0efab67 794
607259a6
CH
795 p->i_flags = gre_flags_to_tnl_flags(p->i_flags);
796 p->o_flags = gre_flags_to_tnl_flags(p->o_flags);
1da177e4 797
607259a6 798 err = ip_tunnel_ctl(dev, p, cmd);
c5441932
PS
799 if (err)
800 return err;
1da177e4 801
a0efab67
XL
802 if (cmd == SIOCCHGTUNNEL) {
803 struct ip_tunnel *t = netdev_priv(dev);
804
607259a6
CH
805 t->parms.i_flags = p->i_flags;
806 t->parms.o_flags = p->o_flags;
a0efab67
XL
807
808 if (strcmp(dev->rtnl_link_ops->kind, "erspan"))
809 ipgre_link_update(dev, true);
810 }
811
607259a6
CH
812 p->i_flags = gre_tnl_flags_to_gre_flags(p->i_flags);
813 p->o_flags = gre_tnl_flags_to_gre_flags(p->o_flags);
1da177e4
LT
814 return 0;
815}
816
1da177e4
LT
817/* Nice toy. Unfortunately, useless in real life :-)
818 It allows to construct virtual multiprotocol broadcast "LAN"
819 over the Internet, provided multicast routing is tuned.
820
821
822 I have no idea was this bicycle invented before me,
823 so that I had to set ARPHRD_IPGRE to a random value.
824 I have an impression, that Cisco could make something similar,
825 but this feature is apparently missing in IOS<=11.2(8).
e905a9ed 826
1da177e4
LT
827 I set up 10.66.66/24 and fec0:6666:6666::0/96 as virtual networks
828 with broadcast 224.66.66.66. If you have access to mbone, play with me :-)
829
830 ping -t 255 224.66.66.66
831
832 If nobody answers, mbone does not work.
833
834 ip tunnel add Universe mode gre remote 224.66.66.66 local <Your_real_addr> ttl 255
835 ip addr add 10.66.66.<somewhat>/24 dev Universe
836 ifconfig Universe up
837 ifconfig Universe add fe80::<Your_real_addr>/10
838 ifconfig Universe add fec0:6666:6666::<Your_real_addr>/96
839 ftp 10.66.66.66
840 ...
841 ftp fec0:6666:6666::193.233.7.65
842 ...
1da177e4 843 */
3b04ddde
SH
844static int ipgre_header(struct sk_buff *skb, struct net_device *dev,
845 unsigned short type,
1507850b 846 const void *daddr, const void *saddr, unsigned int len)
1da177e4 847{
2941a486 848 struct ip_tunnel *t = netdev_priv(dev);
c5441932
PS
849 struct iphdr *iph;
850 struct gre_base_hdr *greh;
1da177e4 851
d58ff351 852 iph = skb_push(skb, t->hlen + sizeof(*iph));
c5441932 853 greh = (struct gre_base_hdr *)(iph+1);
95f5c64c 854 greh->flags = gre_tnl_flags_to_gre_flags(t->parms.o_flags);
c5441932 855 greh->protocol = htons(type);
1da177e4 856
c5441932 857 memcpy(iph, &t->parms.iph, sizeof(struct iphdr));
e905a9ed 858
c5441932 859 /* Set the source hardware address. */
1da177e4
LT
860 if (saddr)
861 memcpy(&iph->saddr, saddr, 4);
6d55cb91 862 if (daddr)
1da177e4 863 memcpy(&iph->daddr, daddr, 4);
6d55cb91 864 if (iph->daddr)
77a482bd 865 return t->hlen + sizeof(*iph);
e905a9ed 866
c5441932 867 return -(t->hlen + sizeof(*iph));
1da177e4
LT
868}
869
6a5f44d7
TT
870static int ipgre_header_parse(const struct sk_buff *skb, unsigned char *haddr)
871{
b71d1d42 872 const struct iphdr *iph = (const struct iphdr *) skb_mac_header(skb);
6a5f44d7
TT
873 memcpy(haddr, &iph->saddr, 4);
874 return 4;
875}
876
3b04ddde
SH
877static const struct header_ops ipgre_header_ops = {
878 .create = ipgre_header,
6a5f44d7 879 .parse = ipgre_header_parse,
3b04ddde
SH
880};
881
6a5f44d7 882#ifdef CONFIG_NET_IPGRE_BROADCAST
1da177e4
LT
883static int ipgre_open(struct net_device *dev)
884{
2941a486 885 struct ip_tunnel *t = netdev_priv(dev);
1da177e4 886
f97c1e0c 887 if (ipv4_is_multicast(t->parms.iph.daddr)) {
cbb1e85f
DM
888 struct flowi4 fl4;
889 struct rtable *rt;
890
b57708ad 891 rt = ip_route_output_gre(t->net, &fl4,
cbb1e85f
DM
892 t->parms.iph.daddr,
893 t->parms.iph.saddr,
894 t->parms.o_key,
895 RT_TOS(t->parms.iph.tos),
896 t->parms.link);
b23dd4fe 897 if (IS_ERR(rt))
1da177e4 898 return -EADDRNOTAVAIL;
d8d1f30b 899 dev = rt->dst.dev;
1da177e4 900 ip_rt_put(rt);
51456b29 901 if (!__in_dev_get_rtnl(dev))
1da177e4
LT
902 return -EADDRNOTAVAIL;
903 t->mlink = dev->ifindex;
e5ed6399 904 ip_mc_inc_group(__in_dev_get_rtnl(dev), t->parms.iph.daddr);
1da177e4
LT
905 }
906 return 0;
907}
908
909static int ipgre_close(struct net_device *dev)
910{
2941a486 911 struct ip_tunnel *t = netdev_priv(dev);
b8c26a33 912
f97c1e0c 913 if (ipv4_is_multicast(t->parms.iph.daddr) && t->mlink) {
7fee0ca2 914 struct in_device *in_dev;
b57708ad 915 in_dev = inetdev_by_index(t->net, t->mlink);
8723e1b4 916 if (in_dev)
1da177e4 917 ip_mc_dec_group(in_dev, t->parms.iph.daddr);
1da177e4
LT
918 }
919 return 0;
920}
1da177e4
LT
921#endif
922
b8c26a33
SH
923static const struct net_device_ops ipgre_netdev_ops = {
924 .ndo_init = ipgre_tunnel_init,
c5441932 925 .ndo_uninit = ip_tunnel_uninit,
b8c26a33
SH
926#ifdef CONFIG_NET_IPGRE_BROADCAST
927 .ndo_open = ipgre_open,
928 .ndo_stop = ipgre_close,
929#endif
c5441932 930 .ndo_start_xmit = ipgre_xmit,
3e7a1c7c 931 .ndo_siocdevprivate = ip_tunnel_siocdevprivate,
c5441932 932 .ndo_change_mtu = ip_tunnel_change_mtu,
98d7fc46 933 .ndo_get_stats64 = dev_get_tstats64,
1e99584b 934 .ndo_get_iflink = ip_tunnel_get_iflink,
607259a6 935 .ndo_tunnel_ctl = ipgre_tunnel_ctl,
b8c26a33
SH
936};
937
6b78f16e
ED
/* Features OR-ed into features and hw_features by __gre_tunnel_init(). */
#define GRE_FEATURES \
	(NETIF_F_SG | NETIF_F_FRAGLIST | NETIF_F_HIGHDMA | NETIF_F_HW_CSUM)
942
1da177e4
LT
943static void ipgre_tunnel_setup(struct net_device *dev)
944{
b8c26a33 945 dev->netdev_ops = &ipgre_netdev_ops;
5a455275 946 dev->type = ARPHRD_IPGRE;
c5441932
PS
947 ip_tunnel_setup(dev, ipgre_net_id);
948}
1da177e4 949
c5441932
PS
950static void __gre_tunnel_init(struct net_device *dev)
951{
952 struct ip_tunnel *tunnel;
953
954 tunnel = netdev_priv(dev);
95f5c64c 955 tunnel->tun_hlen = gre_calc_hlen(tunnel->parms.o_flags);
c5441932
PS
956 tunnel->parms.iph.protocol = IPPROTO_GRE;
957
4565e991 958 tunnel->hlen = tunnel->tun_hlen + tunnel->encap_hlen;
fdafed45 959 dev->needed_headroom = tunnel->hlen + sizeof(tunnel->parms.iph);
4565e991 960
b57708ad 961 dev->features |= GRE_FEATURES;
6b78f16e 962 dev->hw_features |= GRE_FEATURES;
c5441932
PS
963
964 if (!(tunnel->parms.o_flags & TUNNEL_SEQ)) {
a0ca153f
AD
965 /* TCP offload with GRE SEQ is not supported, nor
966 * can we support 2 levels of outer headers requiring
967 * an update.
968 */
969 if (!(tunnel->parms.o_flags & TUNNEL_CSUM) ||
970 (tunnel->encap.type == TUNNEL_ENCAP_NONE)) {
971 dev->features |= NETIF_F_GSO_SOFTWARE;
972 dev->hw_features |= NETIF_F_GSO_SOFTWARE;
973 }
974
c5441932
PS
975 /* Can use a lockless transmit, unless we generate
976 * output sequences
977 */
978 dev->features |= NETIF_F_LLTX;
979 }
1da177e4
LT
980}
981
982static int ipgre_tunnel_init(struct net_device *dev)
983{
c5441932
PS
984 struct ip_tunnel *tunnel = netdev_priv(dev);
985 struct iphdr *iph = &tunnel->parms.iph;
1da177e4 986
c5441932 987 __gre_tunnel_init(dev);
1da177e4 988
c5441932
PS
989 memcpy(dev->dev_addr, &iph->saddr, 4);
990 memcpy(dev->broadcast, &iph->daddr, 4);
1da177e4 991
c5441932 992 dev->flags = IFF_NOARP;
02875878 993 netif_keep_dst(dev);
c5441932 994 dev->addr_len = 4;
1da177e4 995
a64b04d8 996 if (iph->daddr && !tunnel->collect_md) {
1da177e4 997#ifdef CONFIG_NET_IPGRE_BROADCAST
f97c1e0c 998 if (ipv4_is_multicast(iph->daddr)) {
1da177e4
LT
999 if (!iph->saddr)
1000 return -EINVAL;
1001 dev->flags = IFF_BROADCAST;
3b04ddde 1002 dev->header_ops = &ipgre_header_ops;
fdafed45
CW
1003 dev->hard_header_len = tunnel->hlen + sizeof(*iph);
1004 dev->needed_headroom = 0;
1da177e4
LT
1005 }
1006#endif
a64b04d8 1007 } else if (!tunnel->collect_md) {
6a5f44d7 1008 dev->header_ops = &ipgre_header_ops;
fdafed45
CW
1009 dev->hard_header_len = tunnel->hlen + sizeof(*iph);
1010 dev->needed_headroom = 0;
a64b04d8 1011 }
1da177e4 1012
c5441932 1013 return ip_tunnel_init(dev);
1da177e4
LT
1014}
1015
9f57c67c
PS
1016static const struct gre_protocol ipgre_protocol = {
1017 .handler = gre_rcv,
1018 .err_handler = gre_err,
1da177e4
LT
1019};
1020
2c8c1e72 1021static int __net_init ipgre_init_net(struct net *net)
59a4c759 1022{
c5441932 1023 return ip_tunnel_init_net(net, ipgre_net_id, &ipgre_link_ops, NULL);
59a4c759
PE
1024}
1025
64bc1781 1026static void __net_exit ipgre_exit_batch_net(struct list_head *list_net)
59a4c759 1027{
64bc1781 1028 ip_tunnel_delete_nets(list_net, ipgre_net_id, &ipgre_link_ops);
59a4c759
PE
1029}
1030
1031static struct pernet_operations ipgre_net_ops = {
1032 .init = ipgre_init_net,
64bc1781 1033 .exit_batch = ipgre_exit_batch_net,
cfb8fbf2 1034 .id = &ipgre_net_id,
c5441932 1035 .size = sizeof(struct ip_tunnel_net),
59a4c759 1036};
1da177e4 1037
a8b8a889
MS
1038static int ipgre_tunnel_validate(struct nlattr *tb[], struct nlattr *data[],
1039 struct netlink_ext_ack *extack)
c19e654d
HX
1040{
1041 __be16 flags;
1042
1043 if (!data)
1044 return 0;
1045
1046 flags = 0;
1047 if (data[IFLA_GRE_IFLAGS])
1048 flags |= nla_get_be16(data[IFLA_GRE_IFLAGS]);
1049 if (data[IFLA_GRE_OFLAGS])
1050 flags |= nla_get_be16(data[IFLA_GRE_OFLAGS]);
1051 if (flags & (GRE_VERSION|GRE_ROUTING))
1052 return -EINVAL;
1053
946b636f
JB
1054 if (data[IFLA_GRE_COLLECT_METADATA] &&
1055 data[IFLA_GRE_ENCAP_TYPE] &&
1056 nla_get_u16(data[IFLA_GRE_ENCAP_TYPE]) != TUNNEL_ENCAP_NONE)
1057 return -EINVAL;
1058
c19e654d
HX
1059 return 0;
1060}
1061
a8b8a889
MS
1062static int ipgre_tap_validate(struct nlattr *tb[], struct nlattr *data[],
1063 struct netlink_ext_ack *extack)
e1a80002
HX
1064{
1065 __be32 daddr;
1066
1067 if (tb[IFLA_ADDRESS]) {
1068 if (nla_len(tb[IFLA_ADDRESS]) != ETH_ALEN)
1069 return -EINVAL;
1070 if (!is_valid_ether_addr(nla_data(tb[IFLA_ADDRESS])))
1071 return -EADDRNOTAVAIL;
1072 }
1073
1074 if (!data)
1075 goto out;
1076
1077 if (data[IFLA_GRE_REMOTE]) {
1078 memcpy(&daddr, nla_data(data[IFLA_GRE_REMOTE]), 4);
1079 if (!daddr)
1080 return -EINVAL;
1081 }
1082
1083out:
a8b8a889 1084 return ipgre_tunnel_validate(tb, data, extack);
e1a80002
HX
1085}
1086
84e54fe0
WT
1087static int erspan_validate(struct nlattr *tb[], struct nlattr *data[],
1088 struct netlink_ext_ack *extack)
1089{
1090 __be16 flags = 0;
1091 int ret;
1092
1093 if (!data)
1094 return 0;
1095
1096 ret = ipgre_tap_validate(tb, data, extack);
1097 if (ret)
1098 return ret;
1099
51fa960d
WT
1100 if (data[IFLA_GRE_ERSPAN_VER] &&
1101 nla_get_u8(data[IFLA_GRE_ERSPAN_VER]) == 0)
f989d546
WT
1102 return 0;
1103
1104 /* ERSPAN type II/III should only have GRE sequence and key flag */
1a66a836
WT
1105 if (data[IFLA_GRE_OFLAGS])
1106 flags |= nla_get_be16(data[IFLA_GRE_OFLAGS]);
1107 if (data[IFLA_GRE_IFLAGS])
1108 flags |= nla_get_be16(data[IFLA_GRE_IFLAGS]);
1109 if (!data[IFLA_GRE_COLLECT_METADATA] &&
1110 flags != (GRE_SEQ | GRE_KEY))
84e54fe0
WT
1111 return -EINVAL;
1112
1113 /* ERSPAN Session ID only has 10-bit. Since we reuse
1114 * 32-bit key field as ID, check it's range.
1115 */
1116 if (data[IFLA_GRE_IKEY] &&
1117 (ntohl(nla_get_be32(data[IFLA_GRE_IKEY])) & ~ID_MASK))
1118 return -EINVAL;
1119
1120 if (data[IFLA_GRE_OKEY] &&
1121 (ntohl(nla_get_be32(data[IFLA_GRE_OKEY])) & ~ID_MASK))
1122 return -EINVAL;
1123
1124 return 0;
1125}
1126
22a59be8 1127static int ipgre_netlink_parms(struct net_device *dev,
2e15ea39
PS
1128 struct nlattr *data[],
1129 struct nlattr *tb[],
9830ad4c
CG
1130 struct ip_tunnel_parm *parms,
1131 __u32 *fwmark)
c19e654d 1132{
22a59be8
PP
1133 struct ip_tunnel *t = netdev_priv(dev);
1134
7bb82d92 1135 memset(parms, 0, sizeof(*parms));
c19e654d
HX
1136
1137 parms->iph.protocol = IPPROTO_GRE;
1138
1139 if (!data)
22a59be8 1140 return 0;
c19e654d
HX
1141
1142 if (data[IFLA_GRE_LINK])
1143 parms->link = nla_get_u32(data[IFLA_GRE_LINK]);
1144
1145 if (data[IFLA_GRE_IFLAGS])
c5441932 1146 parms->i_flags = gre_flags_to_tnl_flags(nla_get_be16(data[IFLA_GRE_IFLAGS]));
c19e654d
HX
1147
1148 if (data[IFLA_GRE_OFLAGS])
c5441932 1149 parms->o_flags = gre_flags_to_tnl_flags(nla_get_be16(data[IFLA_GRE_OFLAGS]));
c19e654d
HX
1150
1151 if (data[IFLA_GRE_IKEY])
1152 parms->i_key = nla_get_be32(data[IFLA_GRE_IKEY]);
1153
1154 if (data[IFLA_GRE_OKEY])
1155 parms->o_key = nla_get_be32(data[IFLA_GRE_OKEY]);
1156
1157 if (data[IFLA_GRE_LOCAL])
67b61f6c 1158 parms->iph.saddr = nla_get_in_addr(data[IFLA_GRE_LOCAL]);
c19e654d
HX
1159
1160 if (data[IFLA_GRE_REMOTE])
67b61f6c 1161 parms->iph.daddr = nla_get_in_addr(data[IFLA_GRE_REMOTE]);
c19e654d
HX
1162
1163 if (data[IFLA_GRE_TTL])
1164 parms->iph.ttl = nla_get_u8(data[IFLA_GRE_TTL]);
1165
1166 if (data[IFLA_GRE_TOS])
1167 parms->iph.tos = nla_get_u8(data[IFLA_GRE_TOS]);
1168
22a59be8
PP
1169 if (!data[IFLA_GRE_PMTUDISC] || nla_get_u8(data[IFLA_GRE_PMTUDISC])) {
1170 if (t->ignore_df)
1171 return -EINVAL;
c19e654d 1172 parms->iph.frag_off = htons(IP_DF);
22a59be8 1173 }
2e15ea39
PS
1174
1175 if (data[IFLA_GRE_COLLECT_METADATA]) {
2e15ea39 1176 t->collect_md = true;
e271c7b4
JB
1177 if (dev->type == ARPHRD_IPGRE)
1178 dev->type = ARPHRD_NONE;
2e15ea39 1179 }
22a59be8
PP
1180
1181 if (data[IFLA_GRE_IGNORE_DF]) {
1182 if (nla_get_u8(data[IFLA_GRE_IGNORE_DF])
1183 && (parms->iph.frag_off & htons(IP_DF)))
1184 return -EINVAL;
1185 t->ignore_df = !!nla_get_u8(data[IFLA_GRE_IGNORE_DF]);
1186 }
1187
9830ad4c
CG
1188 if (data[IFLA_GRE_FWMARK])
1189 *fwmark = nla_get_u32(data[IFLA_GRE_FWMARK]);
1190
e1f8f78f
PM
1191 return 0;
1192}
1193
1194static int erspan_netlink_parms(struct net_device *dev,
1195 struct nlattr *data[],
1196 struct nlattr *tb[],
1197 struct ip_tunnel_parm *parms,
1198 __u32 *fwmark)
1199{
1200 struct ip_tunnel *t = netdev_priv(dev);
1201 int err;
1202
1203 err = ipgre_netlink_parms(dev, data, tb, parms, fwmark);
1204 if (err)
1205 return err;
32ca98fe
PM
1206 if (!data)
1207 return 0;
e1f8f78f 1208
f551c91d
WT
1209 if (data[IFLA_GRE_ERSPAN_VER]) {
1210 t->erspan_ver = nla_get_u8(data[IFLA_GRE_ERSPAN_VER]);
84e54fe0 1211
f989d546 1212 if (t->erspan_ver > 2)
84e54fe0
WT
1213 return -EINVAL;
1214 }
1215
f551c91d
WT
1216 if (t->erspan_ver == 1) {
1217 if (data[IFLA_GRE_ERSPAN_INDEX]) {
1218 t->index = nla_get_u32(data[IFLA_GRE_ERSPAN_INDEX]);
1219 if (t->index & ~INDEX_MASK)
1220 return -EINVAL;
1221 }
1222 } else if (t->erspan_ver == 2) {
1223 if (data[IFLA_GRE_ERSPAN_DIR]) {
1224 t->dir = nla_get_u8(data[IFLA_GRE_ERSPAN_DIR]);
1225 if (t->dir & ~(DIR_MASK >> DIR_OFFSET))
1226 return -EINVAL;
1227 }
1228 if (data[IFLA_GRE_ERSPAN_HWID]) {
1229 t->hwid = nla_get_u16(data[IFLA_GRE_ERSPAN_HWID]);
1230 if (t->hwid & ~(HWID_MASK >> HWID_OFFSET))
1231 return -EINVAL;
1232 }
1233 }
1234
22a59be8 1235 return 0;
c19e654d
HX
1236}
1237
4565e991
TH
1238/* This function returns true when ENCAP attributes are present in the nl msg */
1239static bool ipgre_netlink_encap_parms(struct nlattr *data[],
1240 struct ip_tunnel_encap *ipencap)
1241{
1242 bool ret = false;
1243
1244 memset(ipencap, 0, sizeof(*ipencap));
1245
1246 if (!data)
1247 return ret;
1248
1249 if (data[IFLA_GRE_ENCAP_TYPE]) {
1250 ret = true;
1251 ipencap->type = nla_get_u16(data[IFLA_GRE_ENCAP_TYPE]);
1252 }
1253
1254 if (data[IFLA_GRE_ENCAP_FLAGS]) {
1255 ret = true;
1256 ipencap->flags = nla_get_u16(data[IFLA_GRE_ENCAP_FLAGS]);
1257 }
1258
1259 if (data[IFLA_GRE_ENCAP_SPORT]) {
1260 ret = true;
3e97fa70 1261 ipencap->sport = nla_get_be16(data[IFLA_GRE_ENCAP_SPORT]);
4565e991
TH
1262 }
1263
1264 if (data[IFLA_GRE_ENCAP_DPORT]) {
1265 ret = true;
3e97fa70 1266 ipencap->dport = nla_get_be16(data[IFLA_GRE_ENCAP_DPORT]);
4565e991
TH
1267 }
1268
1269 return ret;
1270}
1271
c5441932 1272static int gre_tap_init(struct net_device *dev)
e1a80002 1273{
c5441932 1274 __gre_tunnel_init(dev);
bec94d43 1275 dev->priv_flags |= IFF_LIVE_ADDR_CHANGE;
d51711c0 1276 netif_keep_dst(dev);
e1a80002 1277
c5441932 1278 return ip_tunnel_init(dev);
e1a80002
HX
1279}
1280
c5441932
PS
1281static const struct net_device_ops gre_tap_netdev_ops = {
1282 .ndo_init = gre_tap_init,
1283 .ndo_uninit = ip_tunnel_uninit,
1284 .ndo_start_xmit = gre_tap_xmit,
b8c26a33
SH
1285 .ndo_set_mac_address = eth_mac_addr,
1286 .ndo_validate_addr = eth_validate_addr,
c5441932 1287 .ndo_change_mtu = ip_tunnel_change_mtu,
98d7fc46 1288 .ndo_get_stats64 = dev_get_tstats64,
1e99584b 1289 .ndo_get_iflink = ip_tunnel_get_iflink,
fc4099f1 1290 .ndo_fill_metadata_dst = gre_fill_metadata_dst,
b8c26a33
SH
1291};
1292
84e54fe0
WT
1293static int erspan_tunnel_init(struct net_device *dev)
1294{
1295 struct ip_tunnel *tunnel = netdev_priv(dev);
84e54fe0 1296
f989d546
WT
1297 if (tunnel->erspan_ver == 0)
1298 tunnel->tun_hlen = 4; /* 4-byte GRE hdr. */
1299 else
1300 tunnel->tun_hlen = 8; /* 8-byte GRE hdr. */
1301
84e54fe0 1302 tunnel->parms.iph.protocol = IPPROTO_GRE;
c122fda2 1303 tunnel->hlen = tunnel->tun_hlen + tunnel->encap_hlen +
f551c91d 1304 erspan_hdr_len(tunnel->erspan_ver);
84e54fe0 1305
84e54fe0
WT
1306 dev->features |= GRE_FEATURES;
1307 dev->hw_features |= GRE_FEATURES;
1308 dev->priv_flags |= IFF_LIVE_ADDR_CHANGE;
c84bed44 1309 netif_keep_dst(dev);
84e54fe0
WT
1310
1311 return ip_tunnel_init(dev);
1312}
1313
1314static const struct net_device_ops erspan_netdev_ops = {
1315 .ndo_init = erspan_tunnel_init,
1316 .ndo_uninit = ip_tunnel_uninit,
1317 .ndo_start_xmit = erspan_xmit,
1318 .ndo_set_mac_address = eth_mac_addr,
1319 .ndo_validate_addr = eth_validate_addr,
1320 .ndo_change_mtu = ip_tunnel_change_mtu,
98d7fc46 1321 .ndo_get_stats64 = dev_get_tstats64,
84e54fe0
WT
1322 .ndo_get_iflink = ip_tunnel_get_iflink,
1323 .ndo_fill_metadata_dst = gre_fill_metadata_dst,
1324};
1325
e1a80002
HX
1326static void ipgre_tap_setup(struct net_device *dev)
1327{
e1a80002 1328 ether_setup(dev);
cfddd4c3 1329 dev->max_mtu = 0;
d13b161c
JB
1330 dev->netdev_ops = &gre_tap_netdev_ops;
1331 dev->priv_flags &= ~IFF_TX_SKB_SHARING;
1332 dev->priv_flags |= IFF_LIVE_ADDR_CHANGE;
c5441932 1333 ip_tunnel_setup(dev, gre_tap_net_id);
e1a80002
HX
1334}
1335
e1f8f78f
PM
1336static int
1337ipgre_newlink_encap_setup(struct net_device *dev, struct nlattr *data[])
c19e654d 1338{
4565e991
TH
1339 struct ip_tunnel_encap ipencap;
1340
1341 if (ipgre_netlink_encap_parms(data, &ipencap)) {
1342 struct ip_tunnel *t = netdev_priv(dev);
e1f8f78f 1343 int err = ip_tunnel_encap_setup(t, &ipencap);
4565e991
TH
1344
1345 if (err < 0)
1346 return err;
1347 }
c19e654d 1348
e1f8f78f
PM
1349 return 0;
1350}
1351
1352static int ipgre_newlink(struct net *src_net, struct net_device *dev,
1353 struct nlattr *tb[], struct nlattr *data[],
1354 struct netlink_ext_ack *extack)
1355{
1356 struct ip_tunnel_parm p;
1357 __u32 fwmark = 0;
1358 int err;
1359
1360 err = ipgre_newlink_encap_setup(dev, data);
1361 if (err)
1362 return err;
1363
9830ad4c 1364 err = ipgre_netlink_parms(dev, data, tb, &p, &fwmark);
22a59be8
PP
1365 if (err < 0)
1366 return err;
9830ad4c 1367 return ip_tunnel_newlink(dev, tb, &p, fwmark);
c19e654d
HX
1368}
1369
e1f8f78f
PM
1370static int erspan_newlink(struct net *src_net, struct net_device *dev,
1371 struct nlattr *tb[], struct nlattr *data[],
1372 struct netlink_ext_ack *extack)
1373{
1374 struct ip_tunnel_parm p;
1375 __u32 fwmark = 0;
1376 int err;
1377
1378 err = ipgre_newlink_encap_setup(dev, data);
1379 if (err)
1380 return err;
1381
1382 err = erspan_netlink_parms(dev, data, tb, &p, &fwmark);
1383 if (err)
1384 return err;
1385 return ip_tunnel_newlink(dev, tb, &p, fwmark);
1386}
1387
c19e654d 1388static int ipgre_changelink(struct net_device *dev, struct nlattr *tb[],
ad744b22
MS
1389 struct nlattr *data[],
1390 struct netlink_ext_ack *extack)
c19e654d 1391{
9830ad4c 1392 struct ip_tunnel *t = netdev_priv(dev);
9830ad4c 1393 __u32 fwmark = t->fwmark;
dd9d598c 1394 struct ip_tunnel_parm p;
22a59be8 1395 int err;
4565e991 1396
e1f8f78f
PM
1397 err = ipgre_newlink_encap_setup(dev, data);
1398 if (err)
1399 return err;
c19e654d 1400
9830ad4c 1401 err = ipgre_netlink_parms(dev, data, tb, &p, &fwmark);
22a59be8
PP
1402 if (err < 0)
1403 return err;
dd9d598c
XL
1404
1405 err = ip_tunnel_changelink(dev, tb, &p, fwmark);
1406 if (err < 0)
1407 return err;
1408
1409 t->parms.i_flags = p.i_flags;
1410 t->parms.o_flags = p.o_flags;
1411
e1f8f78f
PM
1412 ipgre_link_update(dev, !tb[IFLA_MTU]);
1413
1414 return 0;
1415}
1416
1417static int erspan_changelink(struct net_device *dev, struct nlattr *tb[],
1418 struct nlattr *data[],
1419 struct netlink_ext_ack *extack)
1420{
1421 struct ip_tunnel *t = netdev_priv(dev);
1422 __u32 fwmark = t->fwmark;
1423 struct ip_tunnel_parm p;
1424 int err;
1425
1426 err = ipgre_newlink_encap_setup(dev, data);
1427 if (err)
1428 return err;
1429
1430 err = erspan_netlink_parms(dev, data, tb, &p, &fwmark);
1431 if (err < 0)
1432 return err;
1433
1434 err = ip_tunnel_changelink(dev, tb, &p, fwmark);
1435 if (err < 0)
1436 return err;
1437
1438 t->parms.i_flags = p.i_flags;
1439 t->parms.o_flags = p.o_flags;
dd9d598c
XL
1440
1441 return 0;
c19e654d
HX
1442}
1443
1444static size_t ipgre_get_size(const struct net_device *dev)
1445{
1446 return
1447 /* IFLA_GRE_LINK */
1448 nla_total_size(4) +
1449 /* IFLA_GRE_IFLAGS */
1450 nla_total_size(2) +
1451 /* IFLA_GRE_OFLAGS */
1452 nla_total_size(2) +
1453 /* IFLA_GRE_IKEY */
1454 nla_total_size(4) +
1455 /* IFLA_GRE_OKEY */
1456 nla_total_size(4) +
1457 /* IFLA_GRE_LOCAL */
1458 nla_total_size(4) +
1459 /* IFLA_GRE_REMOTE */
1460 nla_total_size(4) +
1461 /* IFLA_GRE_TTL */
1462 nla_total_size(1) +
1463 /* IFLA_GRE_TOS */
1464 nla_total_size(1) +
1465 /* IFLA_GRE_PMTUDISC */
1466 nla_total_size(1) +
4565e991
TH
1467 /* IFLA_GRE_ENCAP_TYPE */
1468 nla_total_size(2) +
1469 /* IFLA_GRE_ENCAP_FLAGS */
1470 nla_total_size(2) +
1471 /* IFLA_GRE_ENCAP_SPORT */
1472 nla_total_size(2) +
1473 /* IFLA_GRE_ENCAP_DPORT */
1474 nla_total_size(2) +
2e15ea39
PS
1475 /* IFLA_GRE_COLLECT_METADATA */
1476 nla_total_size(0) +
22a59be8
PP
1477 /* IFLA_GRE_IGNORE_DF */
1478 nla_total_size(1) +
9830ad4c
CG
1479 /* IFLA_GRE_FWMARK */
1480 nla_total_size(4) +
84e54fe0
WT
1481 /* IFLA_GRE_ERSPAN_INDEX */
1482 nla_total_size(4) +
f551c91d
WT
1483 /* IFLA_GRE_ERSPAN_VER */
1484 nla_total_size(1) +
1485 /* IFLA_GRE_ERSPAN_DIR */
1486 nla_total_size(1) +
1487 /* IFLA_GRE_ERSPAN_HWID */
1488 nla_total_size(2) +
c19e654d
HX
1489 0;
1490}
1491
1492static int ipgre_fill_info(struct sk_buff *skb, const struct net_device *dev)
1493{
1494 struct ip_tunnel *t = netdev_priv(dev);
1495 struct ip_tunnel_parm *p = &t->parms;
feaf5c79
LB
1496 __be16 o_flags = p->o_flags;
1497
f989d546
WT
1498 if (t->erspan_ver <= 2) {
1499 if (t->erspan_ver != 0 && !t->collect_md)
2bdf700e
LB
1500 o_flags |= TUNNEL_KEY;
1501
1502 if (nla_put_u8(skb, IFLA_GRE_ERSPAN_VER, t->erspan_ver))
1503 goto nla_put_failure;
1504
1505 if (t->erspan_ver == 1) {
1506 if (nla_put_u32(skb, IFLA_GRE_ERSPAN_INDEX, t->index))
1507 goto nla_put_failure;
f989d546 1508 } else if (t->erspan_ver == 2) {
2bdf700e
LB
1509 if (nla_put_u8(skb, IFLA_GRE_ERSPAN_DIR, t->dir))
1510 goto nla_put_failure;
1511 if (nla_put_u16(skb, IFLA_GRE_ERSPAN_HWID, t->hwid))
1512 goto nla_put_failure;
1513 }
1514 }
c19e654d 1515
f3756b79 1516 if (nla_put_u32(skb, IFLA_GRE_LINK, p->link) ||
95f5c64c
TH
1517 nla_put_be16(skb, IFLA_GRE_IFLAGS,
1518 gre_tnl_flags_to_gre_flags(p->i_flags)) ||
1519 nla_put_be16(skb, IFLA_GRE_OFLAGS,
feaf5c79 1520 gre_tnl_flags_to_gre_flags(o_flags)) ||
f3756b79
DM
1521 nla_put_be32(skb, IFLA_GRE_IKEY, p->i_key) ||
1522 nla_put_be32(skb, IFLA_GRE_OKEY, p->o_key) ||
930345ea
JB
1523 nla_put_in_addr(skb, IFLA_GRE_LOCAL, p->iph.saddr) ||
1524 nla_put_in_addr(skb, IFLA_GRE_REMOTE, p->iph.daddr) ||
f3756b79
DM
1525 nla_put_u8(skb, IFLA_GRE_TTL, p->iph.ttl) ||
1526 nla_put_u8(skb, IFLA_GRE_TOS, p->iph.tos) ||
1527 nla_put_u8(skb, IFLA_GRE_PMTUDISC,
9830ad4c
CG
1528 !!(p->iph.frag_off & htons(IP_DF))) ||
1529 nla_put_u32(skb, IFLA_GRE_FWMARK, t->fwmark))
f3756b79 1530 goto nla_put_failure;
4565e991
TH
1531
1532 if (nla_put_u16(skb, IFLA_GRE_ENCAP_TYPE,
1533 t->encap.type) ||
3e97fa70
SD
1534 nla_put_be16(skb, IFLA_GRE_ENCAP_SPORT,
1535 t->encap.sport) ||
1536 nla_put_be16(skb, IFLA_GRE_ENCAP_DPORT,
1537 t->encap.dport) ||
4565e991 1538 nla_put_u16(skb, IFLA_GRE_ENCAP_FLAGS,
e1b2cb65 1539 t->encap.flags))
4565e991
TH
1540 goto nla_put_failure;
1541
22a59be8
PP
1542 if (nla_put_u8(skb, IFLA_GRE_IGNORE_DF, t->ignore_df))
1543 goto nla_put_failure;
1544
2e15ea39
PS
1545 if (t->collect_md) {
1546 if (nla_put_flag(skb, IFLA_GRE_COLLECT_METADATA))
1547 goto nla_put_failure;
1548 }
1549
c19e654d
HX
1550 return 0;
1551
1552nla_put_failure:
1553 return -EMSGSIZE;
1554}
1555
84e54fe0
WT
1556static void erspan_setup(struct net_device *dev)
1557{
84581bda
XL
1558 struct ip_tunnel *t = netdev_priv(dev);
1559
84e54fe0 1560 ether_setup(dev);
0e141f75 1561 dev->max_mtu = 0;
84e54fe0
WT
1562 dev->netdev_ops = &erspan_netdev_ops;
1563 dev->priv_flags &= ~IFF_TX_SKB_SHARING;
1564 dev->priv_flags |= IFF_LIVE_ADDR_CHANGE;
1565 ip_tunnel_setup(dev, erspan_net_id);
84581bda 1566 t->erspan_ver = 1;
84e54fe0
WT
1567}
1568
c19e654d
HX
1569static const struct nla_policy ipgre_policy[IFLA_GRE_MAX + 1] = {
1570 [IFLA_GRE_LINK] = { .type = NLA_U32 },
1571 [IFLA_GRE_IFLAGS] = { .type = NLA_U16 },
1572 [IFLA_GRE_OFLAGS] = { .type = NLA_U16 },
1573 [IFLA_GRE_IKEY] = { .type = NLA_U32 },
1574 [IFLA_GRE_OKEY] = { .type = NLA_U32 },
c593642c
PB
1575 [IFLA_GRE_LOCAL] = { .len = sizeof_field(struct iphdr, saddr) },
1576 [IFLA_GRE_REMOTE] = { .len = sizeof_field(struct iphdr, daddr) },
c19e654d
HX
1577 [IFLA_GRE_TTL] = { .type = NLA_U8 },
1578 [IFLA_GRE_TOS] = { .type = NLA_U8 },
1579 [IFLA_GRE_PMTUDISC] = { .type = NLA_U8 },
4565e991
TH
1580 [IFLA_GRE_ENCAP_TYPE] = { .type = NLA_U16 },
1581 [IFLA_GRE_ENCAP_FLAGS] = { .type = NLA_U16 },
1582 [IFLA_GRE_ENCAP_SPORT] = { .type = NLA_U16 },
1583 [IFLA_GRE_ENCAP_DPORT] = { .type = NLA_U16 },
2e15ea39 1584 [IFLA_GRE_COLLECT_METADATA] = { .type = NLA_FLAG },
22a59be8 1585 [IFLA_GRE_IGNORE_DF] = { .type = NLA_U8 },
9830ad4c 1586 [IFLA_GRE_FWMARK] = { .type = NLA_U32 },
84e54fe0 1587 [IFLA_GRE_ERSPAN_INDEX] = { .type = NLA_U32 },
f551c91d
WT
1588 [IFLA_GRE_ERSPAN_VER] = { .type = NLA_U8 },
1589 [IFLA_GRE_ERSPAN_DIR] = { .type = NLA_U8 },
1590 [IFLA_GRE_ERSPAN_HWID] = { .type = NLA_U16 },
c19e654d
HX
1591};
1592
1593static struct rtnl_link_ops ipgre_link_ops __read_mostly = {
1594 .kind = "gre",
1595 .maxtype = IFLA_GRE_MAX,
1596 .policy = ipgre_policy,
1597 .priv_size = sizeof(struct ip_tunnel),
1598 .setup = ipgre_tunnel_setup,
1599 .validate = ipgre_tunnel_validate,
1600 .newlink = ipgre_newlink,
1601 .changelink = ipgre_changelink,
c5441932 1602 .dellink = ip_tunnel_dellink,
c19e654d
HX
1603 .get_size = ipgre_get_size,
1604 .fill_info = ipgre_fill_info,
1728d4fa 1605 .get_link_net = ip_tunnel_get_link_net,
c19e654d
HX
1606};
1607
e1a80002
HX
1608static struct rtnl_link_ops ipgre_tap_ops __read_mostly = {
1609 .kind = "gretap",
1610 .maxtype = IFLA_GRE_MAX,
1611 .policy = ipgre_policy,
1612 .priv_size = sizeof(struct ip_tunnel),
1613 .setup = ipgre_tap_setup,
1614 .validate = ipgre_tap_validate,
1615 .newlink = ipgre_newlink,
1616 .changelink = ipgre_changelink,
c5441932 1617 .dellink = ip_tunnel_dellink,
e1a80002
HX
1618 .get_size = ipgre_get_size,
1619 .fill_info = ipgre_fill_info,
1728d4fa 1620 .get_link_net = ip_tunnel_get_link_net,
e1a80002
HX
1621};
1622
84e54fe0
WT
1623static struct rtnl_link_ops erspan_link_ops __read_mostly = {
1624 .kind = "erspan",
1625 .maxtype = IFLA_GRE_MAX,
1626 .policy = ipgre_policy,
1627 .priv_size = sizeof(struct ip_tunnel),
1628 .setup = erspan_setup,
1629 .validate = erspan_validate,
e1f8f78f
PM
1630 .newlink = erspan_newlink,
1631 .changelink = erspan_changelink,
84e54fe0
WT
1632 .dellink = ip_tunnel_dellink,
1633 .get_size = ipgre_get_size,
1634 .fill_info = ipgre_fill_info,
1635 .get_link_net = ip_tunnel_get_link_net,
1636};
1637
b2acd1dc
PS
1638struct net_device *gretap_fb_dev_create(struct net *net, const char *name,
1639 u8 name_assign_type)
1640{
1641 struct nlattr *tb[IFLA_MAX + 1];
1642 struct net_device *dev;
106da663 1643 LIST_HEAD(list_kill);
b2acd1dc
PS
1644 struct ip_tunnel *t;
1645 int err;
1646
1647 memset(&tb, 0, sizeof(tb));
1648
1649 dev = rtnl_create_link(net, name, name_assign_type,
d0522f1c 1650 &ipgre_tap_ops, tb, NULL);
b2acd1dc
PS
1651 if (IS_ERR(dev))
1652 return dev;
1653
1654 /* Configure flow based GRE device. */
1655 t = netdev_priv(dev);
1656 t->collect_md = true;
1657
7a3f4a18 1658 err = ipgre_newlink(net, dev, tb, NULL, NULL);
106da663
ND
1659 if (err < 0) {
1660 free_netdev(dev);
1661 return ERR_PTR(err);
1662 }
7e059158
DW
1663
1664 /* openvswitch users expect packet sizes to be unrestricted,
1665 * so set the largest MTU we can.
1666 */
1667 err = __ip_tunnel_change_mtu(dev, IP_MAX_MTU, false);
1668 if (err)
1669 goto out;
1670
da6f1da8
ND
1671 err = rtnl_configure_link(dev, NULL);
1672 if (err < 0)
1673 goto out;
1674
b2acd1dc
PS
1675 return dev;
1676out:
106da663
ND
1677 ip_tunnel_dellink(dev, &list_kill);
1678 unregister_netdevice_many(&list_kill);
b2acd1dc
PS
1679 return ERR_PTR(err);
1680}
1681EXPORT_SYMBOL_GPL(gretap_fb_dev_create);
1682
c5441932
PS
1683static int __net_init ipgre_tap_init_net(struct net *net)
1684{
2e15ea39 1685 return ip_tunnel_init_net(net, gre_tap_net_id, &ipgre_tap_ops, "gretap0");
c5441932
PS
1686}
1687
64bc1781 1688static void __net_exit ipgre_tap_exit_batch_net(struct list_head *list_net)
c5441932 1689{
64bc1781 1690 ip_tunnel_delete_nets(list_net, gre_tap_net_id, &ipgre_tap_ops);
c5441932
PS
1691}
1692
1693static struct pernet_operations ipgre_tap_net_ops = {
1694 .init = ipgre_tap_init_net,
64bc1781 1695 .exit_batch = ipgre_tap_exit_batch_net,
c5441932
PS
1696 .id = &gre_tap_net_id,
1697 .size = sizeof(struct ip_tunnel_net),
1698};
1da177e4 1699
84e54fe0
WT
1700static int __net_init erspan_init_net(struct net *net)
1701{
1702 return ip_tunnel_init_net(net, erspan_net_id,
1703 &erspan_link_ops, "erspan0");
1704}
1705
64bc1781 1706static void __net_exit erspan_exit_batch_net(struct list_head *net_list)
84e54fe0 1707{
64bc1781 1708 ip_tunnel_delete_nets(net_list, erspan_net_id, &erspan_link_ops);
84e54fe0
WT
1709}
1710
1711static struct pernet_operations erspan_net_ops = {
1712 .init = erspan_init_net,
64bc1781 1713 .exit_batch = erspan_exit_batch_net,
84e54fe0
WT
1714 .id = &erspan_net_id,
1715 .size = sizeof(struct ip_tunnel_net),
1716};
1717
1da177e4
LT
1718static int __init ipgre_init(void)
1719{
1720 int err;
1721
058bd4d2 1722 pr_info("GRE over IPv4 tunneling driver\n");
1da177e4 1723
cfb8fbf2 1724 err = register_pernet_device(&ipgre_net_ops);
59a4c759 1725 if (err < 0)
c2892f02
AD
1726 return err;
1727
c5441932
PS
1728 err = register_pernet_device(&ipgre_tap_net_ops);
1729 if (err < 0)
e3d0328c 1730 goto pnet_tap_failed;
c5441932 1731
84e54fe0
WT
1732 err = register_pernet_device(&erspan_net_ops);
1733 if (err < 0)
1734 goto pnet_erspan_failed;
1735
9f57c67c 1736 err = gre_add_protocol(&ipgre_protocol, GREPROTO_CISCO);
c2892f02 1737 if (err < 0) {
058bd4d2 1738 pr_info("%s: can't add protocol\n", __func__);
c2892f02
AD
1739 goto add_proto_failed;
1740 }
7daa0004 1741
c19e654d
HX
1742 err = rtnl_link_register(&ipgre_link_ops);
1743 if (err < 0)
1744 goto rtnl_link_failed;
1745
e1a80002
HX
1746 err = rtnl_link_register(&ipgre_tap_ops);
1747 if (err < 0)
1748 goto tap_ops_failed;
1749
84e54fe0
WT
1750 err = rtnl_link_register(&erspan_link_ops);
1751 if (err < 0)
1752 goto erspan_link_failed;
1753
c5441932 1754 return 0;
c19e654d 1755
84e54fe0
WT
1756erspan_link_failed:
1757 rtnl_link_unregister(&ipgre_tap_ops);
e1a80002
HX
1758tap_ops_failed:
1759 rtnl_link_unregister(&ipgre_link_ops);
c19e654d 1760rtnl_link_failed:
9f57c67c 1761 gre_del_protocol(&ipgre_protocol, GREPROTO_CISCO);
c2892f02 1762add_proto_failed:
84e54fe0
WT
1763 unregister_pernet_device(&erspan_net_ops);
1764pnet_erspan_failed:
c5441932 1765 unregister_pernet_device(&ipgre_tap_net_ops);
e3d0328c 1766pnet_tap_failed:
c2892f02 1767 unregister_pernet_device(&ipgre_net_ops);
c5441932 1768 return err;
1da177e4
LT
1769}
1770
db44575f 1771static void __exit ipgre_fini(void)
1da177e4 1772{
e1a80002 1773 rtnl_link_unregister(&ipgre_tap_ops);
c19e654d 1774 rtnl_link_unregister(&ipgre_link_ops);
84e54fe0 1775 rtnl_link_unregister(&erspan_link_ops);
9f57c67c 1776 gre_del_protocol(&ipgre_protocol, GREPROTO_CISCO);
c5441932 1777 unregister_pernet_device(&ipgre_tap_net_ops);
c2892f02 1778 unregister_pernet_device(&ipgre_net_ops);
84e54fe0 1779 unregister_pernet_device(&erspan_net_ops);
1da177e4
LT
1780}
1781
1782module_init(ipgre_init);
1783module_exit(ipgre_fini);
1784MODULE_LICENSE("GPL");
4d74f8ba
PM
1785MODULE_ALIAS_RTNL_LINK("gre");
1786MODULE_ALIAS_RTNL_LINK("gretap");
84e54fe0 1787MODULE_ALIAS_RTNL_LINK("erspan");
8909c9ad 1788MODULE_ALIAS_NETDEV("gre0");
c5441932 1789MODULE_ALIAS_NETDEV("gretap0");
84e54fe0 1790MODULE_ALIAS_NETDEV("erspan0");