]>
Commit | Line | Data |
---|---|---|
b2441318 | 1 | // SPDX-License-Identifier: GPL-2.0 |
1da177e4 LT |
2 | /* |
3 | * INET An implementation of the TCP/IP protocol suite for the LINUX | |
4 | * operating system. INET is implemented using the BSD Socket | |
5 | * interface as the means of communication with the user level. | |
6 | * | |
7 | * The IP to API glue. | |
e905a9ed | 8 | * |
1da177e4 LT |
9 | * Authors: see ip.c |
10 | * | |
11 | * Fixes: | |
12 | * Many : Split from ip.c , see ip.c for history. | |
13 | * Martin Mares : TOS setting fixed. | |
e905a9ed | 14 | * Alan Cox : Fixed a couple of oopses in Martin's |
1da177e4 LT |
15 | * TOS tweaks. |
16 | * Mike McLagan : Routing by source | |
17 | */ | |
18 | ||
1da177e4 LT |
19 | #include <linux/module.h> |
20 | #include <linux/types.h> | |
21 | #include <linux/mm.h> | |
1da177e4 LT |
22 | #include <linux/skbuff.h> |
23 | #include <linux/ip.h> | |
24 | #include <linux/icmp.h> | |
14c85021 | 25 | #include <linux/inetdevice.h> |
1da177e4 | 26 | #include <linux/netdevice.h> |
5a0e3ad6 | 27 | #include <linux/slab.h> |
1da177e4 LT |
28 | #include <net/sock.h> |
29 | #include <net/ip.h> | |
30 | #include <net/icmp.h> | |
d83d8461 | 31 | #include <net/tcp_states.h> |
1da177e4 LT |
32 | #include <linux/udp.h> |
33 | #include <linux/igmp.h> | |
34 | #include <linux/netfilter.h> | |
35 | #include <linux/route.h> | |
36 | #include <linux/mroute.h> | |
2c67e9ac | 37 | #include <net/inet_ecn.h> |
1da177e4 LT |
38 | #include <net/route.h> |
39 | #include <net/xfrm.h> | |
dae50295 | 40 | #include <net/compat.h> |
ad6f939a | 41 | #include <net/checksum.h> |
dfd56b8b | 42 | #if IS_ENABLED(CONFIG_IPV6) |
1da177e4 LT |
43 | #include <net/transp_v6.h> |
44 | #endif | |
35ebf65e | 45 | #include <net/ip_fib.h> |
1da177e4 LT |
46 | |
47 | #include <linux/errqueue.h> | |
7c0f6ba6 | 48 | #include <linux/uaccess.h> |
1da177e4 | 49 | |
d2ba09c1 AS |
50 | #include <linux/bpfilter.h> |
51 | ||
1da177e4 LT |
52 | /* |
53 | * SOL_IP control messages. | |
54 | */ | |
55 | ||
56 | static void ip_cmsg_recv_pktinfo(struct msghdr *msg, struct sk_buff *skb) | |
57 | { | |
d826eb14 | 58 | struct in_pktinfo info = *PKTINFO_SKB_CB(skb); |
1da177e4 | 59 | |
eddc9ec5 | 60 | info.ipi_addr.s_addr = ip_hdr(skb)->daddr; |
1da177e4 LT |
61 | |
62 | put_cmsg(msg, SOL_IP, IP_PKTINFO, sizeof(info), &info); | |
63 | } | |
64 | ||
65 | static void ip_cmsg_recv_ttl(struct msghdr *msg, struct sk_buff *skb) | |
66 | { | |
eddc9ec5 | 67 | int ttl = ip_hdr(skb)->ttl; |
1da177e4 LT |
68 | put_cmsg(msg, SOL_IP, IP_TTL, sizeof(int), &ttl); |
69 | } | |
70 | ||
71 | static void ip_cmsg_recv_tos(struct msghdr *msg, struct sk_buff *skb) | |
72 | { | |
eddc9ec5 | 73 | put_cmsg(msg, SOL_IP, IP_TOS, 1, &ip_hdr(skb)->tos); |
1da177e4 LT |
74 | } |
75 | ||
76 | static void ip_cmsg_recv_opts(struct msghdr *msg, struct sk_buff *skb) | |
77 | { | |
78 | if (IPCB(skb)->opt.optlen == 0) | |
79 | return; | |
80 | ||
eddc9ec5 ACM |
81 | put_cmsg(msg, SOL_IP, IP_RECVOPTS, IPCB(skb)->opt.optlen, |
82 | ip_hdr(skb) + 1); | |
1da177e4 LT |
83 | } |
84 | ||
85 | ||
91ed1e66 PA |
86 | static void ip_cmsg_recv_retopts(struct net *net, struct msghdr *msg, |
87 | struct sk_buff *skb) | |
1da177e4 LT |
88 | { |
89 | unsigned char optbuf[sizeof(struct ip_options) + 40]; | |
5e73ea1a | 90 | struct ip_options *opt = (struct ip_options *)optbuf; |
1da177e4 LT |
91 | |
92 | if (IPCB(skb)->opt.optlen == 0) | |
93 | return; | |
94 | ||
91ed1e66 | 95 | if (ip_options_echo(net, opt, skb)) { |
1da177e4 LT |
96 | msg->msg_flags |= MSG_CTRUNC; |
97 | return; | |
98 | } | |
99 | ip_options_undo(opt); | |
100 | ||
101 | put_cmsg(msg, SOL_IP, IP_RETOPTS, opt->optlen, opt->__data); | |
102 | } | |
103 | ||
70ecc248 WB |
104 | static void ip_cmsg_recv_fragsize(struct msghdr *msg, struct sk_buff *skb) |
105 | { | |
106 | int val; | |
107 | ||
108 | if (IPCB(skb)->frag_max_size == 0) | |
109 | return; | |
110 | ||
111 | val = IPCB(skb)->frag_max_size; | |
112 | put_cmsg(msg, SOL_IP, IP_RECVFRAGSIZE, sizeof(val), &val); | |
113 | } | |
114 | ||
ad6f939a | 115 | static void ip_cmsg_recv_checksum(struct msghdr *msg, struct sk_buff *skb, |
10df8e61 | 116 | int tlen, int offset) |
ad6f939a TH |
117 | { |
118 | __wsum csum = skb->csum; | |
119 | ||
120 | if (skb->ip_summed != CHECKSUM_COMPLETE) | |
121 | return; | |
122 | ||
ca4ef457 PA |
123 | if (offset != 0) { |
124 | int tend_off = skb_transport_offset(skb) + tlen; | |
125 | csum = csum_sub(csum, skb_checksum(skb, tend_off, offset, 0)); | |
126 | } | |
ad6f939a TH |
127 | |
128 | put_cmsg(msg, SOL_IP, IP_CHECKSUM, sizeof(__wsum), &csum); | |
129 | } | |
130 | ||
2c7946a7 CZ |
131 | static void ip_cmsg_recv_security(struct msghdr *msg, struct sk_buff *skb) |
132 | { | |
3d328ede | 133 | struct lsmblob lb; |
2c7946a7 | 134 | char *secdata; |
3d328ede | 135 | u32 seclen; |
2c7946a7 CZ |
136 | int err; |
137 | ||
3d328ede | 138 | err = security_socket_getpeersec_dgram(NULL, skb, &lb); |
dc49c1f9 CZ |
139 | if (err) |
140 | return; | |
141 | ||
3d328ede CS |
142 | /* Scaffolding - it has to be element 0 */ |
143 | err = security_secid_to_secctx(lb.secid[0], &secdata, &seclen); | |
2c7946a7 CZ |
144 | if (err) |
145 | return; | |
146 | ||
147 | put_cmsg(msg, SOL_IP, SCM_SECURITY, seclen, secdata); | |
dc49c1f9 | 148 | security_release_secctx(secdata, seclen); |
2c7946a7 CZ |
149 | } |
150 | ||
21d1a161 | 151 | static void ip_cmsg_recv_dstaddr(struct msghdr *msg, struct sk_buff *skb) |
e8b2dfe9 | 152 | { |
4a06fa67 | 153 | __be16 _ports[2], *ports; |
e8b2dfe9 | 154 | struct sockaddr_in sin; |
e8b2dfe9 BS |
155 | |
156 | /* All current transport protocols have the port numbers in the | |
157 | * first four bytes of the transport header and this function is | |
158 | * written with this assumption in mind. | |
159 | */ | |
4a06fa67 WB |
160 | ports = skb_header_pointer(skb, skb_transport_offset(skb), |
161 | sizeof(_ports), &_ports); | |
162 | if (!ports) | |
163 | return; | |
e8b2dfe9 BS |
164 | |
165 | sin.sin_family = AF_INET; | |
64199fc0 | 166 | sin.sin_addr.s_addr = ip_hdr(skb)->daddr; |
e8b2dfe9 BS |
167 | sin.sin_port = ports[1]; |
168 | memset(sin.sin_zero, 0, sizeof(sin.sin_zero)); | |
169 | ||
170 | put_cmsg(msg, SOL_IP, IP_ORIGDSTADDR, sizeof(sin), &sin); | |
171 | } | |
1da177e4 | 172 | |
ad959036 PA |
173 | void ip_cmsg_recv_offset(struct msghdr *msg, struct sock *sk, |
174 | struct sk_buff *skb, int tlen, int offset) | |
1da177e4 | 175 | { |
ad959036 | 176 | struct inet_sock *inet = inet_sk(sk); |
95c96174 | 177 | unsigned int flags = inet->cmsg_flags; |
1da177e4 LT |
178 | |
179 | /* Ordered by supposed usage frequency */ | |
c44d13d6 | 180 | if (flags & IP_CMSG_PKTINFO) { |
1da177e4 | 181 | ip_cmsg_recv_pktinfo(msg, skb); |
1da177e4 | 182 | |
c44d13d6 TH |
183 | flags &= ~IP_CMSG_PKTINFO; |
184 | if (!flags) | |
185 | return; | |
186 | } | |
187 | ||
188 | if (flags & IP_CMSG_TTL) { | |
1da177e4 | 189 | ip_cmsg_recv_ttl(msg, skb); |
1da177e4 | 190 | |
c44d13d6 TH |
191 | flags &= ~IP_CMSG_TTL; |
192 | if (!flags) | |
193 | return; | |
194 | } | |
195 | ||
196 | if (flags & IP_CMSG_TOS) { | |
1da177e4 | 197 | ip_cmsg_recv_tos(msg, skb); |
1da177e4 | 198 | |
c44d13d6 TH |
199 | flags &= ~IP_CMSG_TOS; |
200 | if (!flags) | |
201 | return; | |
202 | } | |
203 | ||
204 | if (flags & IP_CMSG_RECVOPTS) { | |
1da177e4 | 205 | ip_cmsg_recv_opts(msg, skb); |
1da177e4 | 206 | |
c44d13d6 TH |
207 | flags &= ~IP_CMSG_RECVOPTS; |
208 | if (!flags) | |
209 | return; | |
210 | } | |
211 | ||
212 | if (flags & IP_CMSG_RETOPTS) { | |
91ed1e66 | 213 | ip_cmsg_recv_retopts(sock_net(sk), msg, skb); |
2c7946a7 | 214 | |
c44d13d6 TH |
215 | flags &= ~IP_CMSG_RETOPTS; |
216 | if (!flags) | |
217 | return; | |
218 | } | |
219 | ||
220 | if (flags & IP_CMSG_PASSSEC) { | |
2c7946a7 | 221 | ip_cmsg_recv_security(msg, skb); |
e8b2dfe9 | 222 | |
c44d13d6 TH |
223 | flags &= ~IP_CMSG_PASSSEC; |
224 | if (!flags) | |
225 | return; | |
226 | } | |
227 | ||
ad6f939a | 228 | if (flags & IP_CMSG_ORIGDSTADDR) { |
e8b2dfe9 BS |
229 | ip_cmsg_recv_dstaddr(msg, skb); |
230 | ||
ad6f939a TH |
231 | flags &= ~IP_CMSG_ORIGDSTADDR; |
232 | if (!flags) | |
233 | return; | |
234 | } | |
235 | ||
236 | if (flags & IP_CMSG_CHECKSUM) | |
10df8e61 | 237 | ip_cmsg_recv_checksum(msg, skb, tlen, offset); |
70ecc248 WB |
238 | |
239 | if (flags & IP_CMSG_RECVFRAGSIZE) | |
240 | ip_cmsg_recv_fragsize(msg, skb); | |
1da177e4 | 241 | } |
5961de9f | 242 | EXPORT_SYMBOL(ip_cmsg_recv_offset); |
1da177e4 | 243 | |
/*
 * Parse the ancillary data attached to an outgoing message and record the
 * results in @ipc.
 *
 * @sk:         sending socket (supplies the netns and is passed to
 *              __sock_cmsg_send())
 * @msg:        message whose control buffer is walked
 * @ipc:        cookie updated with oif, addr, opt, ttl, tos, priority and
 *              sockc as the corresponding cmsgs are found
 * @allow_ipv6: when true (and CONFIG_IPV6 is enabled) an IPV6_PKTINFO
 *              cmsg carrying a v4-mapped address is accepted as well
 *
 * Control messages whose level is neither SOL_SOCKET nor SOL_IP (nor the
 * IPv6 case above) are skipped.  An unknown SOL_IP type, a malformed
 * header or a bad length/value yields -EINVAL; errors from
 * __sock_cmsg_send() and ip_options_get() are returned unchanged.
 * Returns 0 on success.
 */
int ip_cmsg_send(struct sock *sk, struct msghdr *msg, struct ipcm_cookie *ipc,
		 bool allow_ipv6)
{
	int err, val;
	struct cmsghdr *cmsg;
	struct net *net = sock_net(sk);

	for_each_cmsghdr(cmsg, msg) {
		if (!CMSG_OK(msg, cmsg))
			return -EINVAL;
#if IS_ENABLED(CONFIG_IPV6)
		/* IPV6_PKTINFO on an IPv4 send: only v4-mapped sources */
		if (allow_ipv6 &&
		    cmsg->cmsg_level == SOL_IPV6 &&
		    cmsg->cmsg_type == IPV6_PKTINFO) {
			struct in6_pktinfo *src_info;

			if (cmsg->cmsg_len < CMSG_LEN(sizeof(*src_info)))
				return -EINVAL;
			src_info = (struct in6_pktinfo *)CMSG_DATA(cmsg);
			if (!ipv6_addr_v4mapped(&src_info->ipi6_addr))
				return -EINVAL;
			/* a zero ifindex leaves ipc->oif untouched */
			if (src_info->ipi6_ifindex)
				ipc->oif = src_info->ipi6_ifindex;
			/* last 32 bits of the v4-mapped address */
			ipc->addr = src_info->ipi6_addr.s6_addr32[3];
			continue;
		}
#endif
		if (cmsg->cmsg_level == SOL_SOCKET) {
			err = __sock_cmsg_send(sk, msg, cmsg, &ipc->sockc);
			if (err)
				return err;
			continue;
		}

		if (cmsg->cmsg_level != SOL_IP)
			continue;
		switch (cmsg->cmsg_type) {
		case IP_RETOPTS:
			/* err temporarily holds the option payload length */
			err = cmsg->cmsg_len - sizeof(struct cmsghdr);

			/* Our caller is responsible for freeing ipc->opt */
			/* at most 40 bytes of options are passed on */
			err = ip_options_get(net, &ipc->opt,
					     KERNEL_SOCKPTR(CMSG_DATA(cmsg)),
					     err < 40 ? err : 40);
			if (err)
				return err;
			break;
		case IP_PKTINFO:
		{
			struct in_pktinfo *info;
			if (cmsg->cmsg_len != CMSG_LEN(sizeof(struct in_pktinfo)))
				return -EINVAL;
			info = (struct in_pktinfo *)CMSG_DATA(cmsg);
			/* a zero ifindex leaves ipc->oif untouched */
			if (info->ipi_ifindex)
				ipc->oif = info->ipi_ifindex;
			ipc->addr = info->ipi_spec_dst.s_addr;
			break;
		}
		case IP_TTL:
			if (cmsg->cmsg_len != CMSG_LEN(sizeof(int)))
				return -EINVAL;
			val = *(int *)CMSG_DATA(cmsg);
			if (val < 1 || val > 255)
				return -EINVAL;
			ipc->ttl = val;
			break;
		case IP_TOS:
			/* both an int-sized and a byte-sized payload are accepted */
			if (cmsg->cmsg_len == CMSG_LEN(sizeof(int)))
				val = *(int *)CMSG_DATA(cmsg);
			else if (cmsg->cmsg_len == CMSG_LEN(sizeof(u8)))
				val = *(u8 *)CMSG_DATA(cmsg);
			else
				return -EINVAL;
			if (val < 0 || val > 255)
				return -EINVAL;
			ipc->tos = val;
			ipc->priority = rt_tos2priority(ipc->tos);
			break;

		default:
			return -EINVAL;
		}
	}
	return 0;
}
329 | ||
592fcb9d | 330 | static void ip_ra_destroy_rcu(struct rcu_head *head) |
66018506 | 331 | { |
592fcb9d ED |
332 | struct ip_ra_chain *ra = container_of(head, struct ip_ra_chain, rcu); |
333 | ||
334 | sock_put(ra->saved_sk); | |
335 | kfree(ra); | |
66018506 | 336 | } |
1da177e4 | 337 | |
4d52cfbe ED |
/*
 * Add @sk to (on != 0) or remove it from (on == 0) the per-netns router
 * alert chain net->ipv4.ra_chain.
 *
 * @sk:         socket; must be SOCK_RAW and must not have
 *              inet_num == IPPROTO_RAW
 * @on:         non-zero to register, zero to unregister
 * @destructor: stored in the new entry on registration and invoked with
 *              @sk when that entry is later removed (may be NULL)
 *
 * The chain is modified under net->ipv4.ra_mutex.
 *
 * Returns 0 on success, -EINVAL for an unsuitable socket, -ENOMEM if the
 * new entry cannot be allocated, -EADDRINUSE when registering a socket
 * that is already on the chain, and -ENOBUFS when unregistering a socket
 * that is not on the chain.
 */
int ip_ra_control(struct sock *sk, unsigned char on,
		  void (*destructor)(struct sock *))
{
	struct ip_ra_chain *ra, *new_ra;
	struct ip_ra_chain __rcu **rap;
	struct net *net = sock_net(sk);

	if (sk->sk_type != SOCK_RAW || inet_sk(sk)->inet_num == IPPROTO_RAW)
		return -EINVAL;

	/* allocate before taking the mutex; only needed when registering */
	new_ra = on ? kmalloc(sizeof(*new_ra), GFP_KERNEL) : NULL;
	if (on && !new_ra)
		return -ENOMEM;

	mutex_lock(&net->ipv4.ra_mutex);
	for (rap = &net->ipv4.ra_chain;
	     (ra = rcu_dereference_protected(*rap,
			lockdep_is_held(&net->ipv4.ra_mutex))) != NULL;
	     rap = &ra->next) {
		if (ra->sk == sk) {
			if (on) {
				/* already registered: discard the new entry */
				mutex_unlock(&net->ipv4.ra_mutex);
				kfree(new_ra);
				return -EADDRINUSE;
			}
			/* don't let ip_call_ra_chain() use sk again */
			ra->sk = NULL;
			/* unlink the entry from the chain */
			RCU_INIT_POINTER(*rap, ra->next);
			mutex_unlock(&net->ipv4.ra_mutex);

			if (ra->destructor)
				ra->destructor(sk);
			/*
			 * Delay sock_put(sk) and kfree(ra) until after one RCU
			 * grace period. This guarantees that ip_call_ra_chain()
			 * doesn't need to mess with socket refcounts.
			 */
			ra->saved_sk = sk;
			call_rcu(&ra->rcu, ip_ra_destroy_rcu);
			return 0;
		}
	}
	/* sk was not found; new_ra is NULL only for an unregister request */
	if (!new_ra) {
		mutex_unlock(&net->ipv4.ra_mutex);
		return -ENOBUFS;
	}
	new_ra->sk = sk;
	new_ra->destructor = destructor;

	/* the loop ended with ra == NULL and rap at the tail link: append */
	RCU_INIT_POINTER(new_ra->next, ra);
	rcu_assign_pointer(*rap, new_ra);
	sock_hold(sk);
	mutex_unlock(&net->ipv4.ra_mutex);

	return 0;
}
394 | ||
178c49d9 WB |
395 | static void ipv4_icmp_error_rfc4884(const struct sk_buff *skb, |
396 | struct sock_ee_data_rfc4884 *out) | |
397 | { | |
398 | switch (icmp_hdr(skb)->type) { | |
399 | case ICMP_DEST_UNREACH: | |
400 | case ICMP_TIME_EXCEEDED: | |
401 | case ICMP_PARAMETERPROB: | |
402 | ip_icmp_error_rfc4884(skb, out, sizeof(struct icmphdr), | |
403 | icmp_hdr(skb)->un.reserved[1] * 4); | |
404 | } | |
405 | } | |
406 | ||
e905a9ed | 407 | void ip_icmp_error(struct sock *sk, struct sk_buff *skb, int err, |
35986b32 | 408 | __be16 port, u32 info, u8 *payload) |
1da177e4 | 409 | { |
1da177e4 LT |
410 | struct sock_exterr_skb *serr; |
411 | ||
1da177e4 LT |
412 | skb = skb_clone(skb, GFP_ATOMIC); |
413 | if (!skb) | |
414 | return; | |
415 | ||
e905a9ed | 416 | serr = SKB_EXT_ERR(skb); |
1da177e4 LT |
417 | serr->ee.ee_errno = err; |
418 | serr->ee.ee_origin = SO_EE_ORIGIN_ICMP; | |
88c7664f ACM |
419 | serr->ee.ee_type = icmp_hdr(skb)->type; |
420 | serr->ee.ee_code = icmp_hdr(skb)->code; | |
1da177e4 LT |
421 | serr->ee.ee_pad = 0; |
422 | serr->ee.ee_info = info; | |
423 | serr->ee.ee_data = 0; | |
88c7664f | 424 | serr->addr_offset = (u8 *)&(((struct iphdr *)(icmp_hdr(skb) + 1))->daddr) - |
d56f90a7 | 425 | skb_network_header(skb); |
1da177e4 LT |
426 | serr->port = port; |
427 | ||
00db4124 | 428 | if (skb_pull(skb, payload - skb->data)) { |
eba75c58 | 429 | if (inet_sk(sk)->recverr_rfc4884) |
178c49d9 | 430 | ipv4_icmp_error_rfc4884(skb, &serr->ee.ee_rfc4884); |
eba75c58 | 431 | |
bd82393c ACM |
432 | skb_reset_transport_header(skb); |
433 | if (sock_queue_err_skb(sk, skb) == 0) | |
434 | return; | |
435 | } | |
436 | kfree_skb(skb); | |
1da177e4 LT |
437 | } |
438 | ||
0579016e | 439 | void ip_local_error(struct sock *sk, int err, __be32 daddr, __be16 port, u32 info) |
1da177e4 LT |
440 | { |
441 | struct inet_sock *inet = inet_sk(sk); | |
442 | struct sock_exterr_skb *serr; | |
443 | struct iphdr *iph; | |
444 | struct sk_buff *skb; | |
445 | ||
446 | if (!inet->recverr) | |
447 | return; | |
448 | ||
449 | skb = alloc_skb(sizeof(struct iphdr), GFP_ATOMIC); | |
450 | if (!skb) | |
451 | return; | |
452 | ||
2ca9e6f2 ACM |
453 | skb_put(skb, sizeof(struct iphdr)); |
454 | skb_reset_network_header(skb); | |
eddc9ec5 | 455 | iph = ip_hdr(skb); |
1da177e4 LT |
456 | iph->daddr = daddr; |
457 | ||
e905a9ed | 458 | serr = SKB_EXT_ERR(skb); |
1da177e4 LT |
459 | serr->ee.ee_errno = err; |
460 | serr->ee.ee_origin = SO_EE_ORIGIN_LOCAL; | |
e905a9ed | 461 | serr->ee.ee_type = 0; |
1da177e4 LT |
462 | serr->ee.ee_code = 0; |
463 | serr->ee.ee_pad = 0; | |
464 | serr->ee.ee_info = info; | |
465 | serr->ee.ee_data = 0; | |
d56f90a7 | 466 | serr->addr_offset = (u8 *)&iph->daddr - skb_network_header(skb); |
1da177e4 LT |
467 | serr->port = port; |
468 | ||
27a884dc | 469 | __skb_pull(skb, skb_tail_pointer(skb) - skb->data); |
bd82393c | 470 | skb_reset_transport_header(skb); |
1da177e4 LT |
471 | |
472 | if (sock_queue_err_skb(sk, skb)) | |
473 | kfree_skb(skb); | |
474 | } | |
475 | ||
34b99df4 JA |
476 | /* For some errors we have valid addr_offset even with zero payload and |
477 | * zero port. Also, addr_offset should be supported if port is set. | |
478 | */ | |
479 | static inline bool ipv4_datagram_support_addr(struct sock_exterr_skb *serr) | |
480 | { | |
481 | return serr->ee.ee_origin == SO_EE_ORIGIN_ICMP || | |
482 | serr->ee.ee_origin == SO_EE_ORIGIN_LOCAL || serr->port; | |
483 | } | |
484 | ||
c247f053 WB |
485 | /* IPv4 supports cmsg on all imcp errors and some timestamps |
486 | * | |
487 | * Timestamp code paths do not initialize the fields expected by cmsg: | |
488 | * the PKTINFO fields in skb->cb[]. Fill those in here. | |
489 | */ | |
490 | static bool ipv4_datagram_support_cmsg(const struct sock *sk, | |
491 | struct sk_buff *skb, | |
492 | int ee_origin) | |
829ae9d6 | 493 | { |
c247f053 WB |
494 | struct in_pktinfo *info; |
495 | ||
496 | if (ee_origin == SO_EE_ORIGIN_ICMP) | |
497 | return true; | |
829ae9d6 | 498 | |
c247f053 WB |
499 | if (ee_origin == SO_EE_ORIGIN_LOCAL) |
500 | return false; | |
501 | ||
502 | /* Support IP_PKTINFO on tstamp packets if requested, to correlate | |
1862d620 | 503 | * timestamp with egress dev. Not possible for packets without iif |
c247f053 WB |
504 | * or without payload (SOF_TIMESTAMPING_OPT_TSONLY). |
505 | */ | |
1862d620 WB |
506 | info = PKTINFO_SKB_CB(skb); |
507 | if (!(sk->sk_tsflags & SOF_TIMESTAMPING_OPT_CMSG) || | |
508 | !info->ipi_ifindex) | |
829ae9d6 WB |
509 | return false; |
510 | ||
511 | info->ipi_spec_dst.s_addr = ip_hdr(skb)->saddr; | |
829ae9d6 WB |
512 | return true; |
513 | } | |
514 | ||
/*
 * Handle MSG_ERRQUEUE
 *
 * Dequeue one skb from the error queue of @sk, copy up to @len bytes of
 * its data into @msg and attach an IP_RECVERR control message holding
 * the extended error plus the offender's address.
 *
 * Returns the number of bytes copied, -EAGAIN if the error queue is
 * empty, or the error reported by skb_copy_datagram_msg().
 * *@addr_len is written only when msg->msg_name is filled in.
 */
int ip_recv_error(struct sock *sk, struct msghdr *msg, int len, int *addr_len)
{
	struct sock_exterr_skb *serr;
	struct sk_buff *skb;
	DECLARE_SOCKADDR(struct sockaddr_in *, sin, msg->msg_name);
	struct {
		struct sock_extended_err ee;
		struct sockaddr_in offender;
	} errhdr;
	int err;
	int copied;

	err = -EAGAIN;
	skb = sock_dequeue_err_skb(sk);
	if (!skb)
		goto out;

	/* truncate to the caller's buffer and say so via MSG_TRUNC */
	copied = skb->len;
	if (copied > len) {
		msg->msg_flags |= MSG_TRUNC;
		copied = len;
	}
	err = skb_copy_datagram_msg(skb, 0, msg, copied);
	if (unlikely(err)) {
		kfree_skb(skb);
		return err;
	}
	sock_recv_timestamp(msg, sk, skb);

	serr = SKB_EXT_ERR(skb);

	/* fill msg_name with the address found at serr->addr_offset */
	if (sin && ipv4_datagram_support_addr(serr)) {
		sin->sin_family = AF_INET;
		sin->sin_addr.s_addr = *(__be32 *)(skb_network_header(skb) +
						   serr->addr_offset);
		sin->sin_port = serr->port;
		memset(&sin->sin_zero, 0, sizeof(sin->sin_zero));
		*addr_len = sizeof(*sin);
	}

	memcpy(&errhdr.ee, &serr->ee, sizeof(struct sock_extended_err));
	/* from here on sin refers to the offender field of the cmsg payload */
	sin = &errhdr.offender;
	memset(sin, 0, sizeof(*sin));

	/* offender stays all-zero when cmsg is not supported for this skb */
	if (ipv4_datagram_support_cmsg(sk, skb, serr->ee.ee_origin)) {
		sin->sin_family = AF_INET;
		sin->sin_addr.s_addr = ip_hdr(skb)->saddr;
		if (inet_sk(sk)->cmsg_flags)
			ip_cmsg_recv(msg, skb);
	}

	put_cmsg(msg, SOL_IP, IP_RECVERR, sizeof(errhdr), &errhdr);

	/* Now we could try to dump offended packet options */

	msg->msg_flags |= MSG_ERRQUEUE;
	err = copied;

	consume_skb(skb);
out:
	return err;
}
580 | ||
6ebf71ba CH |
581 | static void __ip_sock_set_tos(struct sock *sk, int val) |
582 | { | |
583 | if (sk->sk_type == SOCK_STREAM) { | |
584 | val &= ~INET_ECN_MASK; | |
585 | val |= inet_sk(sk)->tos & INET_ECN_MASK; | |
586 | } | |
587 | if (inet_sk(sk)->tos != val) { | |
588 | inet_sk(sk)->tos = val; | |
589 | sk->sk_priority = rt_tos2priority(val); | |
590 | sk_dst_reset(sk); | |
591 | } | |
592 | } | |
593 | ||
/*
 * Set the TOS of @sk to @val: runs __ip_sock_set_tos() with the socket
 * lock held.
 */
void ip_sock_set_tos(struct sock *sk, int val)
{
	lock_sock(sk);
	__ip_sock_set_tos(sk, val);
	release_sock(sk);
}
EXPORT_SYMBOL(ip_sock_set_tos);
1da177e4 | 601 | |
c4e446bf CH |
602 | void ip_sock_set_freebind(struct sock *sk) |
603 | { | |
604 | lock_sock(sk); | |
605 | inet_sk(sk)->freebind = true; | |
606 | release_sock(sk); | |
607 | } | |
608 | EXPORT_SYMBOL(ip_sock_set_freebind); | |
609 | ||
db45c0ef CH |
610 | void ip_sock_set_recverr(struct sock *sk) |
611 | { | |
612 | lock_sock(sk); | |
613 | inet_sk(sk)->recverr = true; | |
614 | release_sock(sk); | |
615 | } | |
616 | EXPORT_SYMBOL(ip_sock_set_recverr); | |
617 | ||
2de569bd CH |
618 | int ip_sock_set_mtu_discover(struct sock *sk, int val) |
619 | { | |
620 | if (val < IP_PMTUDISC_DONT || val > IP_PMTUDISC_OMIT) | |
621 | return -EINVAL; | |
622 | lock_sock(sk); | |
623 | inet_sk(sk)->pmtudisc = val; | |
624 | release_sock(sk); | |
625 | return 0; | |
626 | } | |
627 | EXPORT_SYMBOL(ip_sock_set_mtu_discover); | |
628 | ||
c1f9ec57 CH |
629 | void ip_sock_set_pktinfo(struct sock *sk) |
630 | { | |
631 | lock_sock(sk); | |
632 | inet_sk(sk)->cmsg_flags |= IP_CMSG_PKTINFO; | |
633 | release_sock(sk); | |
634 | } | |
635 | EXPORT_SYMBOL(ip_sock_set_pktinfo); | |
636 | ||
1da177e4 | 637 | /* |
4d52cfbe ED |
638 | * Socket option code for IP. This is the end of the line after any |
639 | * TCP,UDP etc options on an IP socket. | |
1da177e4 | 640 | */ |
baf606d9 MRL |
/*
 * Return true for the multicast membership and source-filter options
 * listed below, false for every other option name.
 */
static bool setsockopt_needs_rtnl(int optname)
{
	bool rtnl;

	switch (optname) {
	case IP_ADD_MEMBERSHIP:
	case IP_ADD_SOURCE_MEMBERSHIP:
	case IP_BLOCK_SOURCE:
	case IP_DROP_MEMBERSHIP:
	case IP_DROP_SOURCE_MEMBERSHIP:
	case IP_MSFILTER:
	case IP_UNBLOCK_SOURCE:
	case MCAST_BLOCK_SOURCE:
	case MCAST_MSFILTER:
	case MCAST_JOIN_GROUP:
	case MCAST_JOIN_SOURCE_GROUP:
	case MCAST_LEAVE_GROUP:
	case MCAST_LEAVE_SOURCE_GROUP:
	case MCAST_UNBLOCK_SOURCE:
		rtnl = true;
		break;
	default:
		rtnl = false;
		break;
	}

	return rtnl;
}
1da177e4 | 662 | |
e986d4da AV |
663 | static int set_mcast_msfilter(struct sock *sk, int ifindex, |
664 | int numsrc, int fmode, | |
665 | struct sockaddr_storage *group, | |
666 | struct sockaddr_storage *list) | |
667 | { | |
e986d4da AV |
668 | struct ip_msfilter *msf; |
669 | struct sockaddr_in *psin; | |
670 | int err, i; | |
671 | ||
4167a960 | 672 | msf = kmalloc(IP_MSFILTER_SIZE(numsrc), GFP_KERNEL); |
e986d4da AV |
673 | if (!msf) |
674 | return -ENOBUFS; | |
675 | ||
676 | psin = (struct sockaddr_in *)group; | |
677 | if (psin->sin_family != AF_INET) | |
678 | goto Eaddrnotavail; | |
679 | msf->imsf_multiaddr = psin->sin_addr.s_addr; | |
680 | msf->imsf_interface = 0; | |
681 | msf->imsf_fmode = fmode; | |
682 | msf->imsf_numsrc = numsrc; | |
683 | for (i = 0; i < numsrc; ++i) { | |
684 | psin = (struct sockaddr_in *)&list[i]; | |
685 | ||
686 | if (psin->sin_family != AF_INET) | |
687 | goto Eaddrnotavail; | |
2d3e5caf | 688 | msf->imsf_slist_flex[i] = psin->sin_addr.s_addr; |
e986d4da AV |
689 | } |
690 | err = ip_mc_msfilter(sk, msf, ifindex); | |
691 | kfree(msf); | |
692 | return err; | |
693 | ||
694 | Eaddrnotavail: | |
695 | kfree(msf); | |
696 | return -EADDRNOTAVAIL; | |
697 | } | |
698 | ||
89654c5f CH |
699 | static int copy_group_source_from_sockptr(struct group_source_req *greqs, |
700 | sockptr_t optval, int optlen) | |
b6238c04 CH |
701 | { |
702 | if (in_compat_syscall()) { | |
703 | struct compat_group_source_req gr32; | |
704 | ||
705 | if (optlen != sizeof(gr32)) | |
706 | return -EINVAL; | |
89654c5f | 707 | if (copy_from_sockptr(&gr32, optval, sizeof(gr32))) |
b6238c04 CH |
708 | return -EFAULT; |
709 | greqs->gsr_interface = gr32.gsr_interface; | |
710 | greqs->gsr_group = gr32.gsr_group; | |
711 | greqs->gsr_source = gr32.gsr_source; | |
712 | } else { | |
713 | if (optlen != sizeof(*greqs)) | |
714 | return -EINVAL; | |
89654c5f | 715 | if (copy_from_sockptr(greqs, optval, sizeof(*greqs))) |
b6238c04 CH |
716 | return -EFAULT; |
717 | } | |
718 | ||
719 | return 0; | |
720 | } | |
721 | ||
2bbf8c1e | 722 | static int do_mcast_group_source(struct sock *sk, int optname, |
89654c5f | 723 | sockptr_t optval, int optlen) |
2bbf8c1e | 724 | { |
b6238c04 | 725 | struct group_source_req greqs; |
2bbf8c1e AV |
726 | struct ip_mreq_source mreqs; |
727 | struct sockaddr_in *psin; | |
728 | int omode, add, err; | |
729 | ||
89654c5f | 730 | err = copy_group_source_from_sockptr(&greqs, optval, optlen); |
b6238c04 CH |
731 | if (err) |
732 | return err; | |
733 | ||
734 | if (greqs.gsr_group.ss_family != AF_INET || | |
735 | greqs.gsr_source.ss_family != AF_INET) | |
2bbf8c1e AV |
736 | return -EADDRNOTAVAIL; |
737 | ||
b6238c04 | 738 | psin = (struct sockaddr_in *)&greqs.gsr_group; |
2bbf8c1e | 739 | mreqs.imr_multiaddr = psin->sin_addr.s_addr; |
b6238c04 | 740 | psin = (struct sockaddr_in *)&greqs.gsr_source; |
2bbf8c1e AV |
741 | mreqs.imr_sourceaddr = psin->sin_addr.s_addr; |
742 | mreqs.imr_interface = 0; /* use index for mc_source */ | |
743 | ||
744 | if (optname == MCAST_BLOCK_SOURCE) { | |
745 | omode = MCAST_EXCLUDE; | |
746 | add = 1; | |
747 | } else if (optname == MCAST_UNBLOCK_SOURCE) { | |
748 | omode = MCAST_EXCLUDE; | |
749 | add = 0; | |
750 | } else if (optname == MCAST_JOIN_SOURCE_GROUP) { | |
751 | struct ip_mreqn mreq; | |
752 | ||
b6238c04 | 753 | psin = (struct sockaddr_in *)&greqs.gsr_group; |
2bbf8c1e AV |
754 | mreq.imr_multiaddr = psin->sin_addr; |
755 | mreq.imr_address.s_addr = 0; | |
b6238c04 | 756 | mreq.imr_ifindex = greqs.gsr_interface; |
2bbf8c1e AV |
757 | err = ip_mc_join_group_ssm(sk, &mreq, MCAST_INCLUDE); |
758 | if (err && err != -EADDRINUSE) | |
759 | return err; | |
b6238c04 | 760 | greqs.gsr_interface = mreq.imr_ifindex; |
2bbf8c1e AV |
761 | omode = MCAST_INCLUDE; |
762 | add = 1; | |
763 | } else /* MCAST_LEAVE_SOURCE_GROUP */ { | |
764 | omode = MCAST_INCLUDE; | |
765 | add = 0; | |
766 | } | |
b6238c04 | 767 | return ip_mc_source(add, omode, sk, &mreqs, greqs.gsr_interface); |
2bbf8c1e AV |
768 | } |
769 | ||
89654c5f | 770 | static int ip_set_mcast_msfilter(struct sock *sk, sockptr_t optval, int optlen) |
d62c38f6 CH |
771 | { |
772 | struct group_filter *gsf = NULL; | |
773 | int err; | |
774 | ||
775 | if (optlen < GROUP_FILTER_SIZE(0)) | |
776 | return -EINVAL; | |
777 | if (optlen > sysctl_optmem_max) | |
778 | return -ENOBUFS; | |
779 | ||
89654c5f | 780 | gsf = memdup_sockptr(optval, optlen); |
d62c38f6 CH |
781 | if (IS_ERR(gsf)) |
782 | return PTR_ERR(gsf); | |
783 | ||
784 | /* numsrc >= (4G-140)/128 overflow in 32 bits */ | |
785 | err = -ENOBUFS; | |
786 | if (gsf->gf_numsrc >= 0x1ffffff || | |
787 | gsf->gf_numsrc > sock_net(sk)->ipv4.sysctl_igmp_max_msf) | |
788 | goto out_free_gsf; | |
789 | ||
790 | err = -EINVAL; | |
791 | if (GROUP_FILTER_SIZE(gsf->gf_numsrc) > optlen) | |
792 | goto out_free_gsf; | |
793 | ||
794 | err = set_mcast_msfilter(sk, gsf->gf_interface, gsf->gf_numsrc, | |
db243b79 GS |
795 | gsf->gf_fmode, &gsf->gf_group, |
796 | gsf->gf_slist_flex); | |
d62c38f6 CH |
797 | out_free_gsf: |
798 | kfree(gsf); | |
799 | return err; | |
800 | } | |
801 | ||
89654c5f | 802 | static int compat_ip_set_mcast_msfilter(struct sock *sk, sockptr_t optval, |
d62c38f6 CH |
803 | int optlen) |
804 | { | |
db243b79 | 805 | const int size0 = offsetof(struct compat_group_filter, gf_slist_flex); |
d62c38f6 CH |
806 | struct compat_group_filter *gf32; |
807 | unsigned int n; | |
808 | void *p; | |
809 | int err; | |
810 | ||
811 | if (optlen < size0) | |
812 | return -EINVAL; | |
813 | if (optlen > sysctl_optmem_max - 4) | |
814 | return -ENOBUFS; | |
815 | ||
816 | p = kmalloc(optlen + 4, GFP_KERNEL); | |
817 | if (!p) | |
818 | return -ENOMEM; | |
db243b79 | 819 | gf32 = p + 4; /* we want ->gf_group and ->gf_slist_flex aligned */ |
d62c38f6 CH |
820 | |
821 | err = -EFAULT; | |
89654c5f | 822 | if (copy_from_sockptr(gf32, optval, optlen)) |
d62c38f6 CH |
823 | goto out_free_gsf; |
824 | ||
825 | /* numsrc >= (4G-140)/128 overflow in 32 bits */ | |
826 | n = gf32->gf_numsrc; | |
827 | err = -ENOBUFS; | |
828 | if (n >= 0x1ffffff) | |
829 | goto out_free_gsf; | |
830 | ||
831 | err = -EINVAL; | |
db243b79 | 832 | if (offsetof(struct compat_group_filter, gf_slist_flex[n]) > optlen) |
d62c38f6 CH |
833 | goto out_free_gsf; |
834 | ||
d62c38f6 CH |
835 | /* numsrc >= (4G-140)/128 overflow in 32 bits */ |
836 | err = -ENOBUFS; | |
837 | if (n > sock_net(sk)->ipv4.sysctl_igmp_max_msf) | |
b6238c04 | 838 | goto out_free_gsf; |
d62c38f6 | 839 | err = set_mcast_msfilter(sk, gf32->gf_interface, n, gf32->gf_fmode, |
db243b79 | 840 | &gf32->gf_group, gf32->gf_slist_flex); |
d62c38f6 CH |
841 | out_free_gsf: |
842 | kfree(p); | |
843 | return err; | |
844 | } | |
d62c38f6 | 845 | |
02caad7c | 846 | static int ip_mcast_join_leave(struct sock *sk, int optname, |
89654c5f | 847 | sockptr_t optval, int optlen) |
02caad7c CH |
848 | { |
849 | struct ip_mreqn mreq = { }; | |
850 | struct sockaddr_in *psin; | |
851 | struct group_req greq; | |
852 | ||
853 | if (optlen < sizeof(struct group_req)) | |
854 | return -EINVAL; | |
89654c5f | 855 | if (copy_from_sockptr(&greq, optval, sizeof(greq))) |
02caad7c CH |
856 | return -EFAULT; |
857 | ||
858 | psin = (struct sockaddr_in *)&greq.gr_group; | |
859 | if (psin->sin_family != AF_INET) | |
860 | return -EINVAL; | |
861 | mreq.imr_multiaddr = psin->sin_addr; | |
862 | mreq.imr_ifindex = greq.gr_interface; | |
863 | if (optname == MCAST_JOIN_GROUP) | |
864 | return ip_mc_join_group(sk, &mreq); | |
865 | return ip_mc_leave_group(sk, &mreq); | |
866 | } | |
867 | ||
02caad7c | 868 | static int compat_ip_mcast_join_leave(struct sock *sk, int optname, |
89654c5f | 869 | sockptr_t optval, int optlen) |
02caad7c CH |
870 | { |
871 | struct compat_group_req greq; | |
872 | struct ip_mreqn mreq = { }; | |
873 | struct sockaddr_in *psin; | |
02caad7c CH |
874 | |
875 | if (optlen < sizeof(struct compat_group_req)) | |
876 | return -EINVAL; | |
89654c5f | 877 | if (copy_from_sockptr(&greq, optval, sizeof(greq))) |
02caad7c CH |
878 | return -EFAULT; |
879 | ||
880 | psin = (struct sockaddr_in *)&greq.gr_group; | |
881 | if (psin->sin_family != AF_INET) | |
882 | return -EINVAL; | |
883 | mreq.imr_multiaddr = psin->sin_addr; | |
884 | mreq.imr_ifindex = greq.gr_interface; | |
885 | ||
02caad7c | 886 | if (optname == MCAST_JOIN_GROUP) |
b6238c04 CH |
887 | return ip_mc_join_group(sk, &mreq); |
888 | return ip_mc_leave_group(sk, &mreq); | |
02caad7c | 889 | } |
02caad7c | 890 | |
89654c5f CH |
891 | static int do_ip_setsockopt(struct sock *sk, int level, int optname, |
892 | sockptr_t optval, unsigned int optlen) | |
1da177e4 LT |
893 | { |
894 | struct inet_sock *inet = inet_sk(sk); | |
166b6b2d | 895 | struct net *net = sock_net(sk); |
09cb105e | 896 | int val = 0, err; |
baf606d9 | 897 | bool needs_rtnl = setsockopt_needs_rtnl(optname); |
1da177e4 | 898 | |
0c9f79be XW |
899 | switch (optname) { |
900 | case IP_PKTINFO: | |
901 | case IP_RECVTTL: | |
902 | case IP_RECVOPTS: | |
903 | case IP_RECVTOS: | |
904 | case IP_RETOPTS: | |
905 | case IP_TOS: | |
906 | case IP_TTL: | |
907 | case IP_HDRINCL: | |
908 | case IP_MTU_DISCOVER: | |
909 | case IP_RECVERR: | |
910 | case IP_ROUTER_ALERT: | |
911 | case IP_FREEBIND: | |
912 | case IP_PASSSEC: | |
913 | case IP_TRANSPARENT: | |
914 | case IP_MINTTL: | |
915 | case IP_NODEFRAG: | |
90c337da | 916 | case IP_BIND_ADDRESS_NO_PORT: |
0c9f79be XW |
917 | case IP_UNICAST_IF: |
918 | case IP_MULTICAST_TTL: | |
919 | case IP_MULTICAST_ALL: | |
920 | case IP_MULTICAST_LOOP: | |
921 | case IP_RECVORIGDSTADDR: | |
ad6f939a | 922 | case IP_CHECKSUM: |
70ecc248 | 923 | case IP_RECVFRAGSIZE: |
eba75c58 | 924 | case IP_RECVERR_RFC4884: |
1da177e4 | 925 | if (optlen >= sizeof(int)) { |
89654c5f | 926 | if (copy_from_sockptr(&val, optval, sizeof(val))) |
1da177e4 LT |
927 | return -EFAULT; |
928 | } else if (optlen >= sizeof(char)) { | |
929 | unsigned char ucval; | |
930 | ||
89654c5f | 931 | if (copy_from_sockptr(&ucval, optval, sizeof(ucval))) |
1da177e4 LT |
932 | return -EFAULT; |
933 | val = (int) ucval; | |
934 | } | |
935 | } | |
936 | ||
937 | /* If optlen==0, it is equivalent to val == 0 */ | |
938 | ||
0526947f KT |
939 | if (optname == IP_ROUTER_ALERT) |
940 | return ip_ra_control(sk, val ? 1 : 0, NULL); | |
6a9fb947 | 941 | if (ip_mroute_opt(optname)) |
89654c5f | 942 | return ip_mroute_setsockopt(sk, optname, optval, optlen); |
1da177e4 LT |
943 | |
944 | err = 0; | |
baf606d9 MRL |
945 | if (needs_rtnl) |
946 | rtnl_lock(); | |
1da177e4 LT |
947 | lock_sock(sk); |
948 | ||
949 | switch (optname) { | |
132adf54 SH |
950 | case IP_OPTIONS: |
951 | { | |
f6d8bd05 ED |
952 | struct ip_options_rcu *old, *opt = NULL; |
953 | ||
65a1c4ff | 954 | if (optlen > 40) |
132adf54 | 955 | goto e_inval; |
89654c5f | 956 | err = ip_options_get(sock_net(sk), &opt, optval, optlen); |
132adf54 SH |
957 | if (err) |
958 | break; | |
f6d8bd05 | 959 | old = rcu_dereference_protected(inet->inet_opt, |
1e1d04e6 | 960 | lockdep_sock_is_held(sk)); |
132adf54 SH |
961 | if (inet->is_icsk) { |
962 | struct inet_connection_sock *icsk = inet_csk(sk); | |
dfd56b8b | 963 | #if IS_ENABLED(CONFIG_IPV6) |
132adf54 SH |
964 | if (sk->sk_family == PF_INET || |
965 | (!((1 << sk->sk_state) & | |
966 | (TCPF_LISTEN | TCPF_CLOSE)) && | |
c720c7e8 | 967 | inet->inet_daddr != LOOPBACK4_IPV6)) { |
1da177e4 | 968 | #endif |
f6d8bd05 ED |
969 | if (old) |
970 | icsk->icsk_ext_hdr_len -= old->opt.optlen; | |
132adf54 | 971 | if (opt) |
f6d8bd05 | 972 | icsk->icsk_ext_hdr_len += opt->opt.optlen; |
132adf54 | 973 | icsk->icsk_sync_mss(sk, icsk->icsk_pmtu_cookie); |
dfd56b8b | 974 | #if IS_ENABLED(CONFIG_IPV6) |
1da177e4 | 975 | } |
132adf54 | 976 | #endif |
1da177e4 | 977 | } |
f6d8bd05 ED |
978 | rcu_assign_pointer(inet->inet_opt, opt); |
979 | if (old) | |
605b4afe | 980 | kfree_rcu(old, rcu); |
132adf54 SH |
981 | break; |
982 | } | |
983 | case IP_PKTINFO: | |
984 | if (val) | |
985 | inet->cmsg_flags |= IP_CMSG_PKTINFO; | |
986 | else | |
987 | inet->cmsg_flags &= ~IP_CMSG_PKTINFO; | |
988 | break; | |
989 | case IP_RECVTTL: | |
990 | if (val) | |
991 | inet->cmsg_flags |= IP_CMSG_TTL; | |
992 | else | |
993 | inet->cmsg_flags &= ~IP_CMSG_TTL; | |
994 | break; | |
995 | case IP_RECVTOS: | |
996 | if (val) | |
997 | inet->cmsg_flags |= IP_CMSG_TOS; | |
998 | else | |
999 | inet->cmsg_flags &= ~IP_CMSG_TOS; | |
1000 | break; | |
1001 | case IP_RECVOPTS: | |
1002 | if (val) | |
1003 | inet->cmsg_flags |= IP_CMSG_RECVOPTS; | |
1004 | else | |
1005 | inet->cmsg_flags &= ~IP_CMSG_RECVOPTS; | |
1006 | break; | |
1007 | case IP_RETOPTS: | |
1008 | if (val) | |
1009 | inet->cmsg_flags |= IP_CMSG_RETOPTS; | |
1010 | else | |
1011 | inet->cmsg_flags &= ~IP_CMSG_RETOPTS; | |
1012 | break; | |
1013 | case IP_PASSSEC: | |
1014 | if (val) | |
1015 | inet->cmsg_flags |= IP_CMSG_PASSSEC; | |
1016 | else | |
1017 | inet->cmsg_flags &= ~IP_CMSG_PASSSEC; | |
1018 | break; | |
e8b2dfe9 BS |
1019 | case IP_RECVORIGDSTADDR: |
1020 | if (val) | |
1021 | inet->cmsg_flags |= IP_CMSG_ORIGDSTADDR; | |
1022 | else | |
1023 | inet->cmsg_flags &= ~IP_CMSG_ORIGDSTADDR; | |
1024 | break; | |
ad6f939a TH |
1025 | case IP_CHECKSUM: |
1026 | if (val) { | |
1027 | if (!(inet->cmsg_flags & IP_CMSG_CHECKSUM)) { | |
1028 | inet_inc_convert_csum(sk); | |
1029 | inet->cmsg_flags |= IP_CMSG_CHECKSUM; | |
1030 | } | |
1031 | } else { | |
1032 | if (inet->cmsg_flags & IP_CMSG_CHECKSUM) { | |
1033 | inet_dec_convert_csum(sk); | |
1034 | inet->cmsg_flags &= ~IP_CMSG_CHECKSUM; | |
1035 | } | |
1036 | } | |
1037 | break; | |
70ecc248 WB |
1038 | case IP_RECVFRAGSIZE: |
1039 | if (sk->sk_type != SOCK_RAW && sk->sk_type != SOCK_DGRAM) | |
1040 | goto e_inval; | |
1041 | if (val) | |
1042 | inet->cmsg_flags |= IP_CMSG_RECVFRAGSIZE; | |
1043 | else | |
1044 | inet->cmsg_flags &= ~IP_CMSG_RECVFRAGSIZE; | |
1045 | break; | |
132adf54 | 1046 | case IP_TOS: /* This sets both TOS and Precedence */ |
6ebf71ba | 1047 | __ip_sock_set_tos(sk, val); |
132adf54 SH |
1048 | break; |
1049 | case IP_TTL: | |
4d52cfbe | 1050 | if (optlen < 1) |
132adf54 | 1051 | goto e_inval; |
c9be4a5c | 1052 | if (val != -1 && (val < 1 || val > 255)) |
132adf54 SH |
1053 | goto e_inval; |
1054 | inet->uc_ttl = val; | |
1055 | break; | |
1056 | case IP_HDRINCL: | |
1057 | if (sk->sk_type != SOCK_RAW) { | |
1058 | err = -ENOPROTOOPT; | |
2c7946a7 | 1059 | break; |
132adf54 SH |
1060 | } |
1061 | inet->hdrincl = val ? 1 : 0; | |
1062 | break; | |
7b2ff18e JO |
1063 | case IP_NODEFRAG: |
1064 | if (sk->sk_type != SOCK_RAW) { | |
1065 | err = -ENOPROTOOPT; | |
1066 | break; | |
1067 | } | |
1068 | inet->nodefrag = val ? 1 : 0; | |
1069 | break; | |
90c337da ED |
1070 | case IP_BIND_ADDRESS_NO_PORT: |
1071 | inet->bind_address_no_port = val ? 1 : 0; | |
1072 | break; | |
132adf54 | 1073 | case IP_MTU_DISCOVER: |
1b346576 | 1074 | if (val < IP_PMTUDISC_DONT || val > IP_PMTUDISC_OMIT) |
132adf54 SH |
1075 | goto e_inval; |
1076 | inet->pmtudisc = val; | |
1077 | break; | |
1078 | case IP_RECVERR: | |
1079 | inet->recverr = !!val; | |
1080 | if (!val) | |
1081 | skb_queue_purge(&sk->sk_error_queue); | |
1082 | break; | |
eba75c58 WB |
1083 | case IP_RECVERR_RFC4884: |
1084 | if (val < 0 || val > 1) | |
1085 | goto e_inval; | |
1086 | inet->recverr_rfc4884 = !!val; | |
1087 | break; | |
132adf54 SH |
1088 | case IP_MULTICAST_TTL: |
1089 | if (sk->sk_type == SOCK_STREAM) | |
1090 | goto e_inval; | |
4d52cfbe | 1091 | if (optlen < 1) |
132adf54 | 1092 | goto e_inval; |
09cb105e | 1093 | if (val == -1) |
132adf54 SH |
1094 | val = 1; |
1095 | if (val < 0 || val > 255) | |
1096 | goto e_inval; | |
1097 | inet->mc_ttl = val; | |
1098 | break; | |
1099 | case IP_MULTICAST_LOOP: | |
4d52cfbe | 1100 | if (optlen < 1) |
132adf54 SH |
1101 | goto e_inval; |
1102 | inet->mc_loop = !!val; | |
1103 | break; | |
76e21053 EH |
1104 | case IP_UNICAST_IF: |
1105 | { | |
1106 | struct net_device *dev = NULL; | |
1107 | int ifindex; | |
9515a2e0 | 1108 | int midx; |
76e21053 EH |
1109 | |
1110 | if (optlen != sizeof(int)) | |
1111 | goto e_inval; | |
1112 | ||
1113 | ifindex = (__force int)ntohl((__force __be32)val); | |
1114 | if (ifindex == 0) { | |
1115 | inet->uc_index = 0; | |
1116 | err = 0; | |
1117 | break; | |
1118 | } | |
1119 | ||
1120 | dev = dev_get_by_index(sock_net(sk), ifindex); | |
1121 | err = -EADDRNOTAVAIL; | |
1122 | if (!dev) | |
1123 | break; | |
9515a2e0 DA |
1124 | |
1125 | midx = l3mdev_master_ifindex(dev); | |
76e21053 EH |
1126 | dev_put(dev); |
1127 | ||
1128 | err = -EINVAL; | |
fdf1923b | 1129 | if (sk->sk_bound_dev_if && midx != sk->sk_bound_dev_if) |
76e21053 EH |
1130 | break; |
1131 | ||
1132 | inet->uc_index = ifindex; | |
1133 | err = 0; | |
1134 | break; | |
1135 | } | |
132adf54 SH |
1136 | case IP_MULTICAST_IF: |
1137 | { | |
1138 | struct ip_mreqn mreq; | |
1139 | struct net_device *dev = NULL; | |
7bb387c5 | 1140 | int midx; |
132adf54 SH |
1141 | |
1142 | if (sk->sk_type == SOCK_STREAM) | |
1143 | goto e_inval; | |
1144 | /* | |
1145 | * Check the arguments are allowable | |
1146 | */ | |
1147 | ||
0915921b SW |
1148 | if (optlen < sizeof(struct in_addr)) |
1149 | goto e_inval; | |
1150 | ||
132adf54 SH |
1151 | err = -EFAULT; |
1152 | if (optlen >= sizeof(struct ip_mreqn)) { | |
89654c5f | 1153 | if (copy_from_sockptr(&mreq, optval, sizeof(mreq))) |
1da177e4 | 1154 | break; |
132adf54 SH |
1155 | } else { |
1156 | memset(&mreq, 0, sizeof(mreq)); | |
3a084ddb | 1157 | if (optlen >= sizeof(struct ip_mreq)) { |
89654c5f CH |
1158 | if (copy_from_sockptr(&mreq, optval, |
1159 | sizeof(struct ip_mreq))) | |
3a084ddb JP |
1160 | break; |
1161 | } else if (optlen >= sizeof(struct in_addr)) { | |
89654c5f CH |
1162 | if (copy_from_sockptr(&mreq.imr_address, optval, |
1163 | sizeof(struct in_addr))) | |
3a084ddb JP |
1164 | break; |
1165 | } | |
132adf54 SH |
1166 | } |
1167 | ||
1168 | if (!mreq.imr_ifindex) { | |
e6f1cebf | 1169 | if (mreq.imr_address.s_addr == htonl(INADDR_ANY)) { |
132adf54 SH |
1170 | inet->mc_index = 0; |
1171 | inet->mc_addr = 0; | |
1172 | err = 0; | |
1da177e4 LT |
1173 | break; |
1174 | } | |
3b1e0a65 | 1175 | dev = ip_dev_find(sock_net(sk), mreq.imr_address.s_addr); |
55b80503 | 1176 | if (dev) |
132adf54 | 1177 | mreq.imr_ifindex = dev->ifindex; |
132adf54 | 1178 | } else |
55b80503 | 1179 | dev = dev_get_by_index(sock_net(sk), mreq.imr_ifindex); |
1da177e4 | 1180 | |
1da177e4 | 1181 | |
132adf54 SH |
1182 | err = -EADDRNOTAVAIL; |
1183 | if (!dev) | |
1184 | break; | |
7bb387c5 DA |
1185 | |
1186 | midx = l3mdev_master_ifindex(dev); | |
1187 | ||
55b80503 | 1188 | dev_put(dev); |
132adf54 SH |
1189 | |
1190 | err = -EINVAL; | |
1191 | if (sk->sk_bound_dev_if && | |
7bb387c5 | 1192 | mreq.imr_ifindex != sk->sk_bound_dev_if && |
fdf1923b | 1193 | midx != sk->sk_bound_dev_if) |
132adf54 | 1194 | break; |
1da177e4 | 1195 | |
132adf54 SH |
1196 | inet->mc_index = mreq.imr_ifindex; |
1197 | inet->mc_addr = mreq.imr_address.s_addr; | |
1198 | err = 0; | |
1199 | break; | |
1200 | } | |
1da177e4 | 1201 | |
132adf54 SH |
1202 | case IP_ADD_MEMBERSHIP: |
1203 | case IP_DROP_MEMBERSHIP: | |
1204 | { | |
1205 | struct ip_mreqn mreq; | |
1da177e4 | 1206 | |
a96fb49b FL |
1207 | err = -EPROTO; |
1208 | if (inet_sk(sk)->is_icsk) | |
1209 | break; | |
1210 | ||
132adf54 SH |
1211 | if (optlen < sizeof(struct ip_mreq)) |
1212 | goto e_inval; | |
1213 | err = -EFAULT; | |
1214 | if (optlen >= sizeof(struct ip_mreqn)) { | |
89654c5f | 1215 | if (copy_from_sockptr(&mreq, optval, sizeof(mreq))) |
1da177e4 | 1216 | break; |
132adf54 SH |
1217 | } else { |
1218 | memset(&mreq, 0, sizeof(mreq)); | |
89654c5f CH |
1219 | if (copy_from_sockptr(&mreq, optval, |
1220 | sizeof(struct ip_mreq))) | |
1da177e4 | 1221 | break; |
132adf54 | 1222 | } |
1da177e4 | 1223 | |
132adf54 | 1224 | if (optname == IP_ADD_MEMBERSHIP) |
54ff9ef3 | 1225 | err = ip_mc_join_group(sk, &mreq); |
132adf54 | 1226 | else |
54ff9ef3 | 1227 | err = ip_mc_leave_group(sk, &mreq); |
132adf54 SH |
1228 | break; |
1229 | } | |
1230 | case IP_MSFILTER: | |
1231 | { | |
132adf54 SH |
1232 | struct ip_msfilter *msf; |
1233 | ||
4167a960 | 1234 | if (optlen < IP_MSFILTER_SIZE(0)) |
132adf54 SH |
1235 | goto e_inval; |
1236 | if (optlen > sysctl_optmem_max) { | |
1237 | err = -ENOBUFS; | |
1da177e4 LT |
1238 | break; |
1239 | } | |
89654c5f | 1240 | msf = memdup_sockptr(optval, optlen); |
a2c841d9 AV |
1241 | if (IS_ERR(msf)) { |
1242 | err = PTR_ERR(msf); | |
132adf54 SH |
1243 | break; |
1244 | } | |
1245 | /* numsrc >= (1G-4) overflow in 32 bits */ | |
1246 | if (msf->imsf_numsrc >= 0x3ffffffcU || | |
166b6b2d | 1247 | msf->imsf_numsrc > net->ipv4.sysctl_igmp_max_msf) { |
132adf54 SH |
1248 | kfree(msf); |
1249 | err = -ENOBUFS; | |
1250 | break; | |
1251 | } | |
4167a960 | 1252 | if (IP_MSFILTER_SIZE(msf->imsf_numsrc) > optlen) { |
132adf54 SH |
1253 | kfree(msf); |
1254 | err = -EINVAL; | |
1255 | break; | |
1256 | } | |
1257 | err = ip_mc_msfilter(sk, msf, 0); | |
1258 | kfree(msf); | |
1259 | break; | |
1260 | } | |
1261 | case IP_BLOCK_SOURCE: | |
1262 | case IP_UNBLOCK_SOURCE: | |
1263 | case IP_ADD_SOURCE_MEMBERSHIP: | |
1264 | case IP_DROP_SOURCE_MEMBERSHIP: | |
1265 | { | |
1266 | struct ip_mreq_source mreqs; | |
1267 | int omode, add; | |
1da177e4 | 1268 | |
132adf54 SH |
1269 | if (optlen != sizeof(struct ip_mreq_source)) |
1270 | goto e_inval; | |
89654c5f | 1271 | if (copy_from_sockptr(&mreqs, optval, sizeof(mreqs))) { |
1da177e4 | 1272 | err = -EFAULT; |
1da177e4 LT |
1273 | break; |
1274 | } | |
132adf54 SH |
1275 | if (optname == IP_BLOCK_SOURCE) { |
1276 | omode = MCAST_EXCLUDE; | |
1277 | add = 1; | |
1278 | } else if (optname == IP_UNBLOCK_SOURCE) { | |
1279 | omode = MCAST_EXCLUDE; | |
1280 | add = 0; | |
1281 | } else if (optname == IP_ADD_SOURCE_MEMBERSHIP) { | |
1282 | struct ip_mreqn mreq; | |
1da177e4 | 1283 | |
132adf54 SH |
1284 | mreq.imr_multiaddr.s_addr = mreqs.imr_multiaddr; |
1285 | mreq.imr_address.s_addr = mreqs.imr_interface; | |
1286 | mreq.imr_ifindex = 0; | |
6e2059b5 | 1287 | err = ip_mc_join_group_ssm(sk, &mreq, MCAST_INCLUDE); |
132adf54 | 1288 | if (err && err != -EADDRINUSE) |
1da177e4 | 1289 | break; |
132adf54 SH |
1290 | omode = MCAST_INCLUDE; |
1291 | add = 1; | |
1292 | } else /* IP_DROP_SOURCE_MEMBERSHIP */ { | |
1293 | omode = MCAST_INCLUDE; | |
1294 | add = 0; | |
1295 | } | |
1296 | err = ip_mc_source(add, omode, sk, &mreqs, 0); | |
1297 | break; | |
1298 | } | |
1299 | case MCAST_JOIN_GROUP: | |
1300 | case MCAST_LEAVE_GROUP: | |
b6238c04 CH |
1301 | if (in_compat_syscall()) |
1302 | err = compat_ip_mcast_join_leave(sk, optname, optval, | |
1303 | optlen); | |
1304 | else | |
1305 | err = ip_mcast_join_leave(sk, optname, optval, optlen); | |
132adf54 | 1306 | break; |
132adf54 SH |
1307 | case MCAST_JOIN_SOURCE_GROUP: |
1308 | case MCAST_LEAVE_SOURCE_GROUP: | |
1309 | case MCAST_BLOCK_SOURCE: | |
1310 | case MCAST_UNBLOCK_SOURCE: | |
b6238c04 | 1311 | err = do_mcast_group_source(sk, optname, optval, optlen); |
132adf54 | 1312 | break; |
132adf54 | 1313 | case MCAST_MSFILTER: |
b6238c04 CH |
1314 | if (in_compat_syscall()) |
1315 | err = compat_ip_set_mcast_msfilter(sk, optval, optlen); | |
1316 | else | |
1317 | err = ip_set_mcast_msfilter(sk, optval, optlen); | |
132adf54 | 1318 | break; |
f771bef9 NS |
1319 | case IP_MULTICAST_ALL: |
1320 | if (optlen < 1) | |
1321 | goto e_inval; | |
1322 | if (val != 0 && val != 1) | |
1323 | goto e_inval; | |
1324 | inet->mc_all = val; | |
1325 | break; | |
132adf54 SH |
1326 | |
1327 | case IP_FREEBIND: | |
4d52cfbe | 1328 | if (optlen < 1) |
132adf54 SH |
1329 | goto e_inval; |
1330 | inet->freebind = !!val; | |
1331 | break; | |
1332 | ||
1333 | case IP_IPSEC_POLICY: | |
1334 | case IP_XFRM_POLICY: | |
1335 | err = -EPERM; | |
52e804c6 | 1336 | if (!ns_capable(sock_net(sk)->user_ns, CAP_NET_ADMIN)) |
1da177e4 | 1337 | break; |
89654c5f | 1338 | err = xfrm_user_policy(sk, optname, optval, optlen); |
132adf54 | 1339 | break; |
1da177e4 | 1340 | |
f5715aea | 1341 | case IP_TRANSPARENT: |
52e804c6 EB |
1342 | if (!!val && !ns_capable(sock_net(sk)->user_ns, CAP_NET_RAW) && |
1343 | !ns_capable(sock_net(sk)->user_ns, CAP_NET_ADMIN)) { | |
f5715aea KK |
1344 | err = -EPERM; |
1345 | break; | |
1346 | } | |
1347 | if (optlen < 1) | |
1348 | goto e_inval; | |
1349 | inet->transparent = !!val; | |
1350 | break; | |
1351 | ||
d218d111 SH |
1352 | case IP_MINTTL: |
1353 | if (optlen < 1) | |
1354 | goto e_inval; | |
1355 | if (val < 0 || val > 255) | |
1356 | goto e_inval; | |
1357 | inet->min_ttl = val; | |
1358 | break; | |
1359 | ||
132adf54 SH |
1360 | default: |
1361 | err = -ENOPROTOOPT; | |
1362 | break; | |
1da177e4 LT |
1363 | } |
1364 | release_sock(sk); | |
baf606d9 MRL |
1365 | if (needs_rtnl) |
1366 | rtnl_unlock(); | |
1da177e4 LT |
1367 | return err; |
1368 | ||
1369 | e_inval: | |
1370 | release_sock(sk); | |
baf606d9 MRL |
1371 | if (needs_rtnl) |
1372 | rtnl_unlock(); | |
1da177e4 LT |
1373 | return -EINVAL; |
1374 | } | |
1375 | ||
f84af32c | 1376 | /** |
829ae9d6 | 1377 | * ipv4_pktinfo_prepare - transfer some info from rtable to skb |
f84af32c ED |
1378 | * @sk: socket |
1379 | * @skb: buffer | |
1380 | * | |
35ebf65e DM |
1381 | * To support IP_CMSG_PKTINFO option, we store rt_iif and specific |
1382 | * destination in skb->cb[] before dst drop. | |
8e3bff96 | 1383 | * This way, receiver doesn't make cache line misses to read rtable. |
f84af32c | 1384 | */ |
fbf8866d | 1385 | void ipv4_pktinfo_prepare(const struct sock *sk, struct sk_buff *skb) |
f84af32c | 1386 | { |
d826eb14 | 1387 | struct in_pktinfo *pktinfo = PKTINFO_SKB_CB(skb); |
4b261c75 HFS |
1388 | bool prepare = (inet_sk(sk)->cmsg_flags & IP_CMSG_PKTINFO) || |
1389 | ipv6_sk_rxinfo(sk); | |
d826eb14 | 1390 | |
4b261c75 | 1391 | if (prepare && skb_rtable(skb)) { |
0b922b7a DA |
1392 | /* skb->cb is overloaded: prior to this point it is IP{6}CB |
1393 | * which has interface index (iif) as the first member of the | |
1394 | * underlying inet{6}_skb_parm struct. This code then overlays | |
1395 | * PKTINFO_SKB_CB and in_pktinfo also has iif as the first | |
f0c16ba8 WZ |
1396 | * element so the iif is picked up from the prior IPCB. If iif |
1397 | * is the loopback interface, then return the sending interface | |
1398 | * (e.g., process binds socket to eth0 for Tx which is | |
1399 | * redirected to loopback in the rtable/dst). | |
0b922b7a | 1400 | */ |
cbea8f02 DA |
1401 | struct rtable *rt = skb_rtable(skb); |
1402 | bool l3slave = ipv4_l3mdev_skb(IPCB(skb)->flags); | |
1403 | ||
1404 | if (pktinfo->ipi_ifindex == LOOPBACK_IFINDEX) | |
f0c16ba8 | 1405 | pktinfo->ipi_ifindex = inet_iif(skb); |
cbea8f02 DA |
1406 | else if (l3slave && rt && rt->rt_iif) |
1407 | pktinfo->ipi_ifindex = rt->rt_iif; | |
f0c16ba8 | 1408 | |
35ebf65e | 1409 | pktinfo->ipi_spec_dst.s_addr = fib_compute_spec_dst(skb); |
d826eb14 ED |
1410 | } else { |
1411 | pktinfo->ipi_ifindex = 0; | |
1412 | pktinfo->ipi_spec_dst.s_addr = 0; | |
1413 | } | |
61a1030b | 1414 | skb_dst_drop(skb); |
f84af32c | 1415 | } |
f84af32c | 1416 | |
a7b75c5a CH |
1417 | int ip_setsockopt(struct sock *sk, int level, int optname, sockptr_t optval, |
1418 | unsigned int optlen) | |
3fdadf7d DM |
1419 | { |
1420 | int err; | |
1421 | ||
1422 | if (level != SOL_IP) | |
1423 | return -ENOPROTOOPT; | |
1424 | ||
a7b75c5a | 1425 | err = do_ip_setsockopt(sk, level, optname, optval, optlen); |
97adadda | 1426 | #if IS_ENABLED(CONFIG_BPFILTER_UMH) |
d2ba09c1 AS |
1427 | if (optname >= BPFILTER_IPT_SO_SET_REPLACE && |
1428 | optname < BPFILTER_IPT_SET_MAX) | |
a7b75c5a | 1429 | err = bpfilter_ip_set_sockopt(sk, optname, optval, optlen); |
d2ba09c1 | 1430 | #endif |
3fdadf7d DM |
1431 | #ifdef CONFIG_NETFILTER |
1432 | /* we need to exclude all possible ENOPROTOOPTs except default case */ | |
1433 | if (err == -ENOPROTOOPT && optname != IP_HDRINCL && | |
6a9fb947 PE |
1434 | optname != IP_IPSEC_POLICY && |
1435 | optname != IP_XFRM_POLICY && | |
3f34cfae | 1436 | !ip_mroute_opt(optname)) |
a7b75c5a | 1437 | err = nf_setsockopt(sk, PF_INET, optname, optval, optlen); |
3fdadf7d DM |
1438 | #endif |
1439 | return err; | |
1440 | } | |
4d52cfbe | 1441 | EXPORT_SYMBOL(ip_setsockopt); |
3fdadf7d | 1442 | |
1da177e4 | 1443 | /* |
4d52cfbe ED |
1444 | * Get the options. Note for future reference. The GET of IP options gets |
1445 | * the _received_ ones. The set sets the _sent_ ones. | |
1da177e4 LT |
1446 | */ |
1447 | ||
87e9f031 WC |
1448 | static bool getsockopt_needs_rtnl(int optname) |
1449 | { | |
1450 | switch (optname) { | |
1451 | case IP_MSFILTER: | |
1452 | case MCAST_MSFILTER: | |
1453 | return true; | |
1454 | } | |
1455 | return false; | |
1456 | } | |
1457 | ||
49e74c24 CH |
1458 | static int ip_get_mcast_msfilter(struct sock *sk, void __user *optval, |
1459 | int __user *optlen, int len) | |
1460 | { | |
db243b79 | 1461 | const int size0 = offsetof(struct group_filter, gf_slist_flex); |
49e74c24 CH |
1462 | struct group_filter __user *p = optval; |
1463 | struct group_filter gsf; | |
1464 | int num; | |
1465 | int err; | |
1466 | ||
1467 | if (len < size0) | |
1468 | return -EINVAL; | |
1469 | if (copy_from_user(&gsf, p, size0)) | |
1470 | return -EFAULT; | |
1471 | ||
1472 | num = gsf.gf_numsrc; | |
db243b79 | 1473 | err = ip_mc_gsfget(sk, &gsf, p->gf_slist_flex); |
49e74c24 CH |
1474 | if (err) |
1475 | return err; | |
1476 | if (gsf.gf_numsrc < num) | |
1477 | num = gsf.gf_numsrc; | |
1478 | if (put_user(GROUP_FILTER_SIZE(num), optlen) || | |
1479 | copy_to_user(p, &gsf, size0)) | |
1480 | return -EFAULT; | |
1481 | return 0; | |
1482 | } | |
1483 | ||
49e74c24 | 1484 | static int compat_ip_get_mcast_msfilter(struct sock *sk, void __user *optval, |
b6238c04 | 1485 | int __user *optlen, int len) |
49e74c24 | 1486 | { |
db243b79 | 1487 | const int size0 = offsetof(struct compat_group_filter, gf_slist_flex); |
49e74c24 CH |
1488 | struct compat_group_filter __user *p = optval; |
1489 | struct compat_group_filter gf32; | |
1490 | struct group_filter gf; | |
49e74c24 | 1491 | int num; |
b6238c04 | 1492 | int err; |
49e74c24 | 1493 | |
49e74c24 CH |
1494 | if (len < size0) |
1495 | return -EINVAL; | |
49e74c24 CH |
1496 | if (copy_from_user(&gf32, p, size0)) |
1497 | return -EFAULT; | |
1498 | ||
1499 | gf.gf_interface = gf32.gf_interface; | |
1500 | gf.gf_fmode = gf32.gf_fmode; | |
1501 | num = gf.gf_numsrc = gf32.gf_numsrc; | |
1502 | gf.gf_group = gf32.gf_group; | |
1503 | ||
db243b79 | 1504 | err = ip_mc_gsfget(sk, &gf, p->gf_slist_flex); |
49e74c24 CH |
1505 | if (err) |
1506 | return err; | |
1507 | if (gf.gf_numsrc < num) | |
1508 | num = gf.gf_numsrc; | |
1509 | len = GROUP_FILTER_SIZE(num) - (sizeof(gf) - sizeof(gf32)); | |
1510 | if (put_user(len, optlen) || | |
1511 | put_user(gf.gf_fmode, &p->gf_fmode) || | |
1512 | put_user(gf.gf_numsrc, &p->gf_numsrc)) | |
1513 | return -EFAULT; | |
1514 | return 0; | |
1515 | } | |
49e74c24 | 1516 | |
3fdadf7d | 1517 | static int do_ip_getsockopt(struct sock *sk, int level, int optname, |
b6238c04 | 1518 | char __user *optval, int __user *optlen) |
1da177e4 LT |
1519 | { |
1520 | struct inet_sock *inet = inet_sk(sk); | |
87e9f031 WC |
1521 | bool needs_rtnl = getsockopt_needs_rtnl(optname); |
1522 | int val, err = 0; | |
1da177e4 | 1523 | int len; |
e905a9ed | 1524 | |
132adf54 | 1525 | if (level != SOL_IP) |
1da177e4 LT |
1526 | return -EOPNOTSUPP; |
1527 | ||
6a9fb947 | 1528 | if (ip_mroute_opt(optname)) |
09cb105e | 1529 | return ip_mroute_getsockopt(sk, optname, optval, optlen); |
1da177e4 | 1530 | |
09cb105e | 1531 | if (get_user(len, optlen)) |
1da177e4 | 1532 | return -EFAULT; |
132adf54 | 1533 | if (len < 0) |
1da177e4 | 1534 | return -EINVAL; |
e905a9ed | 1535 | |
87e9f031 WC |
1536 | if (needs_rtnl) |
1537 | rtnl_lock(); | |
1da177e4 LT |
1538 | lock_sock(sk); |
1539 | ||
132adf54 SH |
1540 | switch (optname) { |
1541 | case IP_OPTIONS: | |
1542 | { | |
1543 | unsigned char optbuf[sizeof(struct ip_options)+40]; | |
f6d8bd05 ED |
1544 | struct ip_options *opt = (struct ip_options *)optbuf; |
1545 | struct ip_options_rcu *inet_opt; | |
1546 | ||
1547 | inet_opt = rcu_dereference_protected(inet->inet_opt, | |
1e1d04e6 | 1548 | lockdep_sock_is_held(sk)); |
132adf54 | 1549 | opt->optlen = 0; |
f6d8bd05 ED |
1550 | if (inet_opt) |
1551 | memcpy(optbuf, &inet_opt->opt, | |
1552 | sizeof(struct ip_options) + | |
1553 | inet_opt->opt.optlen); | |
132adf54 SH |
1554 | release_sock(sk); |
1555 | ||
1556 | if (opt->optlen == 0) | |
1557 | return put_user(0, optlen); | |
1558 | ||
1559 | ip_options_undo(opt); | |
1560 | ||
1561 | len = min_t(unsigned int, len, opt->optlen); | |
1562 | if (put_user(len, optlen)) | |
1563 | return -EFAULT; | |
1564 | if (copy_to_user(optval, opt->__data, len)) | |
1565 | return -EFAULT; | |
1566 | return 0; | |
1567 | } | |
1568 | case IP_PKTINFO: | |
1569 | val = (inet->cmsg_flags & IP_CMSG_PKTINFO) != 0; | |
1570 | break; | |
1571 | case IP_RECVTTL: | |
1572 | val = (inet->cmsg_flags & IP_CMSG_TTL) != 0; | |
1573 | break; | |
1574 | case IP_RECVTOS: | |
1575 | val = (inet->cmsg_flags & IP_CMSG_TOS) != 0; | |
1576 | break; | |
1577 | case IP_RECVOPTS: | |
1578 | val = (inet->cmsg_flags & IP_CMSG_RECVOPTS) != 0; | |
1579 | break; | |
1580 | case IP_RETOPTS: | |
1581 | val = (inet->cmsg_flags & IP_CMSG_RETOPTS) != 0; | |
1582 | break; | |
1583 | case IP_PASSSEC: | |
1584 | val = (inet->cmsg_flags & IP_CMSG_PASSSEC) != 0; | |
1585 | break; | |
e8b2dfe9 BS |
1586 | case IP_RECVORIGDSTADDR: |
1587 | val = (inet->cmsg_flags & IP_CMSG_ORIGDSTADDR) != 0; | |
1588 | break; | |
ad6f939a TH |
1589 | case IP_CHECKSUM: |
1590 | val = (inet->cmsg_flags & IP_CMSG_CHECKSUM) != 0; | |
1591 | break; | |
70ecc248 WB |
1592 | case IP_RECVFRAGSIZE: |
1593 | val = (inet->cmsg_flags & IP_CMSG_RECVFRAGSIZE) != 0; | |
1594 | break; | |
132adf54 SH |
1595 | case IP_TOS: |
1596 | val = inet->tos; | |
1597 | break; | |
1598 | case IP_TTL: | |
fa50d974 NB |
1599 | { |
1600 | struct net *net = sock_net(sk); | |
132adf54 | 1601 | val = (inet->uc_ttl == -1 ? |
fa50d974 | 1602 | net->ipv4.sysctl_ip_default_ttl : |
132adf54 SH |
1603 | inet->uc_ttl); |
1604 | break; | |
fa50d974 | 1605 | } |
132adf54 SH |
1606 | case IP_HDRINCL: |
1607 | val = inet->hdrincl; | |
1608 | break; | |
a89b4763 MK |
1609 | case IP_NODEFRAG: |
1610 | val = inet->nodefrag; | |
1611 | break; | |
90c337da ED |
1612 | case IP_BIND_ADDRESS_NO_PORT: |
1613 | val = inet->bind_address_no_port; | |
1614 | break; | |
132adf54 SH |
1615 | case IP_MTU_DISCOVER: |
1616 | val = inet->pmtudisc; | |
1617 | break; | |
1618 | case IP_MTU: | |
1619 | { | |
1620 | struct dst_entry *dst; | |
1621 | val = 0; | |
1622 | dst = sk_dst_get(sk); | |
1623 | if (dst) { | |
1624 | val = dst_mtu(dst); | |
1625 | dst_release(dst); | |
1da177e4 | 1626 | } |
132adf54 | 1627 | if (!val) { |
1da177e4 | 1628 | release_sock(sk); |
132adf54 | 1629 | return -ENOTCONN; |
1da177e4 | 1630 | } |
132adf54 SH |
1631 | break; |
1632 | } | |
1633 | case IP_RECVERR: | |
1634 | val = inet->recverr; | |
1635 | break; | |
eba75c58 WB |
1636 | case IP_RECVERR_RFC4884: |
1637 | val = inet->recverr_rfc4884; | |
1638 | break; | |
132adf54 SH |
1639 | case IP_MULTICAST_TTL: |
1640 | val = inet->mc_ttl; | |
1641 | break; | |
1642 | case IP_MULTICAST_LOOP: | |
1643 | val = inet->mc_loop; | |
1644 | break; | |
76e21053 EH |
1645 | case IP_UNICAST_IF: |
1646 | val = (__force int)htonl((__u32) inet->uc_index); | |
1647 | break; | |
132adf54 SH |
1648 | case IP_MULTICAST_IF: |
1649 | { | |
1650 | struct in_addr addr; | |
1651 | len = min_t(unsigned int, len, sizeof(struct in_addr)); | |
1652 | addr.s_addr = inet->mc_addr; | |
1653 | release_sock(sk); | |
1da177e4 | 1654 | |
132adf54 SH |
1655 | if (put_user(len, optlen)) |
1656 | return -EFAULT; | |
1657 | if (copy_to_user(optval, &addr, len)) | |
1658 | return -EFAULT; | |
1659 | return 0; | |
1660 | } | |
1661 | case IP_MSFILTER: | |
1662 | { | |
1663 | struct ip_msfilter msf; | |
132adf54 | 1664 | |
4167a960 | 1665 | if (len < IP_MSFILTER_SIZE(0)) { |
87e9f031 WC |
1666 | err = -EINVAL; |
1667 | goto out; | |
1da177e4 | 1668 | } |
4167a960 | 1669 | if (copy_from_user(&msf, optval, IP_MSFILTER_SIZE(0))) { |
87e9f031 WC |
1670 | err = -EFAULT; |
1671 | goto out; | |
1da177e4 | 1672 | } |
132adf54 SH |
1673 | err = ip_mc_msfget(sk, &msf, |
1674 | (struct ip_msfilter __user *)optval, optlen); | |
87e9f031 | 1675 | goto out; |
132adf54 SH |
1676 | } |
1677 | case MCAST_MSFILTER: | |
b6238c04 CH |
1678 | if (in_compat_syscall()) |
1679 | err = compat_ip_get_mcast_msfilter(sk, optval, optlen, | |
1680 | len); | |
1681 | else | |
1682 | err = ip_get_mcast_msfilter(sk, optval, optlen, len); | |
87e9f031 | 1683 | goto out; |
f771bef9 NS |
1684 | case IP_MULTICAST_ALL: |
1685 | val = inet->mc_all; | |
1686 | break; | |
132adf54 SH |
1687 | case IP_PKTOPTIONS: |
1688 | { | |
1689 | struct msghdr msg; | |
1da177e4 | 1690 | |
132adf54 | 1691 | release_sock(sk); |
1da177e4 | 1692 | |
132adf54 SH |
1693 | if (sk->sk_type != SOCK_STREAM) |
1694 | return -ENOPROTOOPT; | |
1da177e4 | 1695 | |
1f466e1f CH |
1696 | msg.msg_control_is_user = true; |
1697 | msg.msg_control_user = optval; | |
132adf54 | 1698 | msg.msg_controllen = len; |
b6238c04 | 1699 | msg.msg_flags = in_compat_syscall() ? MSG_CMSG_COMPAT : 0; |
1da177e4 | 1700 | |
132adf54 SH |
1701 | if (inet->cmsg_flags & IP_CMSG_PKTINFO) { |
1702 | struct in_pktinfo info; | |
1703 | ||
c720c7e8 ED |
1704 | info.ipi_addr.s_addr = inet->inet_rcv_saddr; |
1705 | info.ipi_spec_dst.s_addr = inet->inet_rcv_saddr; | |
132adf54 SH |
1706 | info.ipi_ifindex = inet->mc_index; |
1707 | put_cmsg(&msg, SOL_IP, IP_PKTINFO, sizeof(info), &info); | |
1da177e4 | 1708 | } |
132adf54 SH |
1709 | if (inet->cmsg_flags & IP_CMSG_TTL) { |
1710 | int hlim = inet->mc_ttl; | |
1711 | put_cmsg(&msg, SOL_IP, IP_TTL, sizeof(hlim), &hlim); | |
1712 | } | |
4c507d28 JB |
1713 | if (inet->cmsg_flags & IP_CMSG_TOS) { |
1714 | int tos = inet->rcv_tos; | |
1715 | put_cmsg(&msg, SOL_IP, IP_TOS, sizeof(tos), &tos); | |
1716 | } | |
132adf54 SH |
1717 | len -= msg.msg_controllen; |
1718 | return put_user(len, optlen); | |
1719 | } | |
1720 | case IP_FREEBIND: | |
1721 | val = inet->freebind; | |
1722 | break; | |
f5715aea KK |
1723 | case IP_TRANSPARENT: |
1724 | val = inet->transparent; | |
1725 | break; | |
d218d111 SH |
1726 | case IP_MINTTL: |
1727 | val = inet->min_ttl; | |
1728 | break; | |
132adf54 SH |
1729 | default: |
1730 | release_sock(sk); | |
1731 | return -ENOPROTOOPT; | |
1da177e4 LT |
1732 | } |
1733 | release_sock(sk); | |
e905a9ed | 1734 | |
4d52cfbe | 1735 | if (len < sizeof(int) && len > 0 && val >= 0 && val <= 255) { |
1da177e4 LT |
1736 | unsigned char ucval = (unsigned char)val; |
1737 | len = 1; | |
132adf54 | 1738 | if (put_user(len, optlen)) |
1da177e4 | 1739 | return -EFAULT; |
09cb105e | 1740 | if (copy_to_user(optval, &ucval, 1)) |
1da177e4 LT |
1741 | return -EFAULT; |
1742 | } else { | |
1743 | len = min_t(unsigned int, sizeof(int), len); | |
132adf54 | 1744 | if (put_user(len, optlen)) |
1da177e4 | 1745 | return -EFAULT; |
09cb105e | 1746 | if (copy_to_user(optval, &val, len)) |
1da177e4 LT |
1747 | return -EFAULT; |
1748 | } | |
1749 | return 0; | |
87e9f031 WC |
1750 | |
1751 | out: | |
1752 | release_sock(sk); | |
1753 | if (needs_rtnl) | |
1754 | rtnl_unlock(); | |
1755 | return err; | |
1da177e4 LT |
1756 | } |
1757 | ||
3fdadf7d | 1758 | int ip_getsockopt(struct sock *sk, int level, |
132adf54 | 1759 | int optname, char __user *optval, int __user *optlen) |
3fdadf7d DM |
1760 | { |
1761 | int err; | |
1762 | ||
b6238c04 | 1763 | err = do_ip_getsockopt(sk, level, optname, optval, optlen); |
42908c69 | 1764 | |
97adadda | 1765 | #if IS_ENABLED(CONFIG_BPFILTER_UMH) |
d2ba09c1 AS |
1766 | if (optname >= BPFILTER_IPT_SO_GET_INFO && |
1767 | optname < BPFILTER_IPT_GET_MAX) | |
1768 | err = bpfilter_ip_get_sockopt(sk, optname, optval, optlen); | |
1769 | #endif | |
3fdadf7d DM |
1770 | #ifdef CONFIG_NETFILTER |
1771 | /* we need to exclude all possible ENOPROTOOPTs except default case */ | |
6a9fb947 PE |
1772 | if (err == -ENOPROTOOPT && optname != IP_PKTOPTIONS && |
1773 | !ip_mroute_opt(optname)) { | |
e905a9ed | 1774 | int len; |
3fdadf7d | 1775 | |
543d9cfe | 1776 | if (get_user(len, optlen)) |
3fdadf7d DM |
1777 | return -EFAULT; |
1778 | ||
77d4df41 | 1779 | err = nf_getsockopt(sk, PF_INET, optname, optval, &len); |
3fdadf7d DM |
1780 | if (err >= 0) |
1781 | err = put_user(len, optlen); | |
1782 | return err; | |
1783 | } | |
1784 | #endif | |
1785 | return err; | |
1786 | } | |
b6238c04 | 1787 | EXPORT_SYMBOL(ip_getsockopt); |