]> git.proxmox.com Git - mirror_ubuntu-artful-kernel.git/blame - net/ipv4/sysctl_net_ipv4.c
Merge tag 'mlx5-updates-2017-04-22' of git://git.kernel.org/pub/scm/linux/kernel...
[mirror_ubuntu-artful-kernel.git] / net / ipv4 / sysctl_net_ipv4.c
CommitLineData
1da177e4
LT
1/*
2 * sysctl_net_ipv4.c: sysctl interface to net IPV4 subsystem.
3 *
1da177e4
LT
4 * Begun April 1, 1996, Mike Shaver.
5 * Added /proc/sys/net/ipv4 directory entry (empty =) ). [MS]
6 */
7
8#include <linux/mm.h>
9#include <linux/module.h>
10#include <linux/sysctl.h>
20380731 11#include <linux/igmp.h>
14c85021 12#include <linux/inetdevice.h>
227b60f5 13#include <linux/seqlock.h>
3e37c3f9 14#include <linux/init.h>
5a0e3ad6 15#include <linux/slab.h>
c319b4d7 16#include <linux/nsproxy.h>
3dc43e3e 17#include <linux/swap.h>
1da177e4 18#include <net/snmp.h>
20380731 19#include <net/icmp.h>
1da177e4
LT
20#include <net/ip.h>
21#include <net/route.h>
22#include <net/tcp.h>
95766fff 23#include <net/udp.h>
446fda4f 24#include <net/cipso_ipv4.h>
04128f23 25#include <net/inet_frag.h>
c319b4d7 26#include <net/ping.h>
dddb64bc 27#include <net/protocol.h>
1da177e4 28
89cee8b1 29static int zero;
cdda8891 30static int one = 1;
6ba8a3b1 31static int four = 4;
43e122b0 32static int thousand = 1000;
95bd09eb 33static int gso_max_segs = GSO_MAX_SEGS;
e905a9ed 34static int tcp_retr1_max = 255;
1da177e4
LT
35static int ip_local_port_range_min[] = { 1, 1 };
36static int ip_local_port_range_max[] = { 65535, 65535 };
0147fc05
AD
37static int tcp_adv_win_scale_min = -31;
38static int tcp_adv_win_scale_max = 31;
4548b683
KJ
39static int ip_privileged_port_min;
40static int ip_privileged_port_max = 65535;
249fab77
ED
41static int ip_ttl_min = 1;
42static int ip_ttl_max = 255;
651e9271
MT
43static int tcp_syn_retries_min = 1;
44static int tcp_syn_retries_max = MAX_TCP_SYNCNT;
c319b4d7
VK
45static int ip_ping_group_range_min[] = { 0, 0 };
46static int ip_ping_group_range_max[] = { GID_T_MAX, GID_T_MAX };
1da177e4 47
227b60f5 48/* Update system visible IP port range */
0bbf87d8 49static void set_local_port_range(struct net *net, int range[2])
227b60f5 50{
ed2dfd90
ED
51 bool same_parity = !((range[0] ^ range[1]) & 1);
52
4ee3bd4a 53 write_seqlock_bh(&net->ipv4.ip_local_ports.lock);
ed2dfd90
ED
54 if (same_parity && !net->ipv4.ip_local_ports.warned) {
55 net->ipv4.ip_local_ports.warned = true;
56 pr_err_ratelimited("ip_local_port_range: prefer different parity for start/end values.\n");
57 }
c9d8f1a6
CW
58 net->ipv4.ip_local_ports.range[0] = range[0];
59 net->ipv4.ip_local_ports.range[1] = range[1];
4ee3bd4a 60 write_sequnlock_bh(&net->ipv4.ip_local_ports.lock);
227b60f5
SH
61}
62
63/* Validate changes from /proc interface. */
fe2c6338 64static int ipv4_local_port_range(struct ctl_table *table, int write,
227b60f5
SH
65 void __user *buffer,
66 size_t *lenp, loff_t *ppos)
67{
0bbf87d8 68 struct net *net =
c9d8f1a6 69 container_of(table->data, struct net, ipv4.ip_local_ports.range);
227b60f5 70 int ret;
3c689b73 71 int range[2];
fe2c6338 72 struct ctl_table tmp = {
227b60f5
SH
73 .data = &range,
74 .maxlen = sizeof(range),
75 .mode = table->mode,
76 .extra1 = &ip_local_port_range_min,
77 .extra2 = &ip_local_port_range_max,
78 };
79
0bbf87d8
EB
80 inet_get_local_port_range(net, &range[0], &range[1]);
81
8d65af78 82 ret = proc_dointvec_minmax(&tmp, write, buffer, lenp, ppos);
227b60f5
SH
83
84 if (write && ret == 0) {
4548b683
KJ
85 /* Ensure that the upper limit is not smaller than the lower,
86 * and that the lower does not encroach upon the privileged
87 * port limit.
88 */
89 if ((range[1] < range[0]) ||
90 (range[0] < net->ipv4.sysctl_ip_prot_sock))
227b60f5
SH
91 ret = -EINVAL;
92 else
0bbf87d8 93 set_local_port_range(net, range);
227b60f5
SH
94 }
95
96 return ret;
97}
98
4548b683
KJ
99/* Validate changes from /proc interface. */
100static int ipv4_privileged_ports(struct ctl_table *table, int write,
101 void __user *buffer, size_t *lenp, loff_t *ppos)
102{
103 struct net *net = container_of(table->data, struct net,
104 ipv4.sysctl_ip_prot_sock);
105 int ret;
106 int pports;
107 int range[2];
108 struct ctl_table tmp = {
109 .data = &pports,
110 .maxlen = sizeof(pports),
111 .mode = table->mode,
112 .extra1 = &ip_privileged_port_min,
113 .extra2 = &ip_privileged_port_max,
114 };
115
116 pports = net->ipv4.sysctl_ip_prot_sock;
117
118 ret = proc_dointvec_minmax(&tmp, write, buffer, lenp, ppos);
119
120 if (write && ret == 0) {
121 inet_get_local_port_range(net, &range[0], &range[1]);
122 /* Ensure that the local port range doesn't overlap with the
123 * privileged port range.
124 */
125 if (range[0] < pports)
126 ret = -EINVAL;
127 else
128 net->ipv4.sysctl_ip_prot_sock = pports;
129 }
130
131 return ret;
132}
c319b4d7 133
7064d16e 134static void inet_get_ping_group_range_table(struct ctl_table *table, kgid_t *low, kgid_t *high)
c319b4d7 135{
7064d16e 136 kgid_t *data = table->data;
0bbf87d8 137 struct net *net =
ba6b918a 138 container_of(table->data, struct net, ipv4.ping_group_range.range);
95c96174 139 unsigned int seq;
c319b4d7 140 do {
396a30cc 141 seq = read_seqbegin(&net->ipv4.ping_group_range.lock);
c319b4d7
VK
142
143 *low = data[0];
144 *high = data[1];
396a30cc 145 } while (read_seqretry(&net->ipv4.ping_group_range.lock, seq));
c319b4d7
VK
146}
147
148/* Update system visible IP port range */
7064d16e 149static void set_ping_group_range(struct ctl_table *table, kgid_t low, kgid_t high)
c319b4d7 150{
7064d16e 151 kgid_t *data = table->data;
0bbf87d8 152 struct net *net =
ba6b918a 153 container_of(table->data, struct net, ipv4.ping_group_range.range);
396a30cc 154 write_seqlock(&net->ipv4.ping_group_range.lock);
7064d16e
EB
155 data[0] = low;
156 data[1] = high;
396a30cc 157 write_sequnlock(&net->ipv4.ping_group_range.lock);
c319b4d7
VK
158}
159
160/* Validate changes from /proc interface. */
fe2c6338 161static int ipv4_ping_group_range(struct ctl_table *table, int write,
c319b4d7
VK
162 void __user *buffer,
163 size_t *lenp, loff_t *ppos)
164{
7064d16e 165 struct user_namespace *user_ns = current_user_ns();
c319b4d7 166 int ret;
7064d16e
EB
167 gid_t urange[2];
168 kgid_t low, high;
fe2c6338 169 struct ctl_table tmp = {
7064d16e
EB
170 .data = &urange,
171 .maxlen = sizeof(urange),
c319b4d7
VK
172 .mode = table->mode,
173 .extra1 = &ip_ping_group_range_min,
174 .extra2 = &ip_ping_group_range_max,
175 };
176
7064d16e
EB
177 inet_get_ping_group_range_table(table, &low, &high);
178 urange[0] = from_kgid_munged(user_ns, low);
179 urange[1] = from_kgid_munged(user_ns, high);
c319b4d7
VK
180 ret = proc_dointvec_minmax(&tmp, write, buffer, lenp, ppos);
181
7064d16e
EB
182 if (write && ret == 0) {
183 low = make_kgid(user_ns, urange[0]);
184 high = make_kgid(user_ns, urange[1]);
185 if (!gid_valid(low) || !gid_valid(high) ||
186 (urange[1] < urange[0]) || gid_lt(high, low)) {
187 low = make_kgid(&init_user_ns, 1);
188 high = make_kgid(&init_user_ns, 0);
189 }
190 set_ping_group_range(table, low, high);
191 }
c319b4d7
VK
192
193 return ret;
194}
195
fe2c6338 196static int proc_tcp_congestion_control(struct ctl_table *ctl, int write,
317a76f9
SH
197 void __user *buffer, size_t *lenp, loff_t *ppos)
198{
199 char val[TCP_CA_NAME_MAX];
fe2c6338 200 struct ctl_table tbl = {
317a76f9
SH
201 .data = val,
202 .maxlen = TCP_CA_NAME_MAX,
203 };
204 int ret;
205
206 tcp_get_default_congestion_control(val);
207
8d65af78 208 ret = proc_dostring(&tbl, write, buffer, lenp, ppos);
317a76f9
SH
209 if (write && ret == 0)
210 ret = tcp_set_default_congestion_control(val);
211 return ret;
212}
213
fe2c6338 214static int proc_tcp_available_congestion_control(struct ctl_table *ctl,
8d65af78 215 int write,
3ff825b2
SH
216 void __user *buffer, size_t *lenp,
217 loff_t *ppos)
218{
fe2c6338 219 struct ctl_table tbl = { .maxlen = TCP_CA_BUF_MAX, };
3ff825b2
SH
220 int ret;
221
222 tbl.data = kmalloc(tbl.maxlen, GFP_USER);
223 if (!tbl.data)
224 return -ENOMEM;
225 tcp_get_available_congestion_control(tbl.data, TCP_CA_BUF_MAX);
8d65af78 226 ret = proc_dostring(&tbl, write, buffer, lenp, ppos);
3ff825b2
SH
227 kfree(tbl.data);
228 return ret;
229}
230
fe2c6338 231static int proc_allowed_congestion_control(struct ctl_table *ctl,
8d65af78 232 int write,
ce7bc3bf
SH
233 void __user *buffer, size_t *lenp,
234 loff_t *ppos)
235{
fe2c6338 236 struct ctl_table tbl = { .maxlen = TCP_CA_BUF_MAX };
ce7bc3bf
SH
237 int ret;
238
239 tbl.data = kmalloc(tbl.maxlen, GFP_USER);
240 if (!tbl.data)
241 return -ENOMEM;
242
243 tcp_get_allowed_congestion_control(tbl.data, tbl.maxlen);
8d65af78 244 ret = proc_dostring(&tbl, write, buffer, lenp, ppos);
ce7bc3bf
SH
245 if (write && ret == 0)
246 ret = tcp_set_allowed_congestion_control(tbl.data);
247 kfree(tbl.data);
248 return ret;
249}
250
fe2c6338
JP
251static int proc_tcp_fastopen_key(struct ctl_table *ctl, int write,
252 void __user *buffer, size_t *lenp,
253 loff_t *ppos)
10467163 254{
fe2c6338 255 struct ctl_table tbl = { .maxlen = (TCP_FASTOPEN_KEY_LENGTH * 2 + 10) };
10467163
JC
256 struct tcp_fastopen_context *ctxt;
257 int ret;
258 u32 user_key[4]; /* 16 bytes, matching TCP_FASTOPEN_KEY_LENGTH */
259
260 tbl.data = kmalloc(tbl.maxlen, GFP_KERNEL);
261 if (!tbl.data)
262 return -ENOMEM;
263
264 rcu_read_lock();
265 ctxt = rcu_dereference(tcp_fastopen_ctx);
266 if (ctxt)
267 memcpy(user_key, ctxt->key, TCP_FASTOPEN_KEY_LENGTH);
0e24c4fc
AC
268 else
269 memset(user_key, 0, sizeof(user_key));
10467163
JC
270 rcu_read_unlock();
271
272 snprintf(tbl.data, tbl.maxlen, "%08x-%08x-%08x-%08x",
273 user_key[0], user_key[1], user_key[2], user_key[3]);
274 ret = proc_dostring(&tbl, write, buffer, lenp, ppos);
275
276 if (write && ret == 0) {
277 if (sscanf(tbl.data, "%x-%x-%x-%x", user_key, user_key + 1,
278 user_key + 2, user_key + 3) != 4) {
279 ret = -EINVAL;
280 goto bad_key;
281 }
222e83d2
HFS
282 /* Generate a dummy secret but don't publish it. This
283 * is needed so we don't regenerate a new key on the
284 * first invocation of tcp_fastopen_cookie_gen
285 */
286 tcp_fastopen_init_key_once(false);
10467163
JC
287 tcp_fastopen_reset_cipher(user_key, TCP_FASTOPEN_KEY_LENGTH);
288 }
289
290bad_key:
291 pr_debug("proc FO key set 0x%x-%x-%x-%x <- 0x%s: %u\n",
292 user_key[0], user_key[1], user_key[2], user_key[3],
293 (char *)tbl.data, ret);
294 kfree(tbl.data);
295 return ret;
296}
297
dddb64bc
SAK
298static void proc_configure_early_demux(int enabled, int protocol)
299{
300 struct net_protocol *ipprot;
301#if IS_ENABLED(CONFIG_IPV6)
302 struct inet6_protocol *ip6prot;
303#endif
304
58c4c6a3
DA
305 rcu_read_lock();
306
dddb64bc
SAK
307 ipprot = rcu_dereference(inet_protos[protocol]);
308 if (ipprot)
309 ipprot->early_demux = enabled ? ipprot->early_demux_handler :
310 NULL;
311
312#if IS_ENABLED(CONFIG_IPV6)
313 ip6prot = rcu_dereference(inet6_protos[protocol]);
314 if (ip6prot)
315 ip6prot->early_demux = enabled ? ip6prot->early_demux_handler :
316 NULL;
317#endif
58c4c6a3 318 rcu_read_unlock();
dddb64bc
SAK
319}
320
321static int proc_tcp_early_demux(struct ctl_table *table, int write,
322 void __user *buffer, size_t *lenp, loff_t *ppos)
323{
324 int ret = 0;
325
326 ret = proc_dointvec(table, write, buffer, lenp, ppos);
327
328 if (write && !ret) {
329 int enabled = init_net.ipv4.sysctl_tcp_early_demux;
330
331 proc_configure_early_demux(enabled, IPPROTO_TCP);
332 }
333
334 return ret;
335}
336
337static int proc_udp_early_demux(struct ctl_table *table, int write,
338 void __user *buffer, size_t *lenp, loff_t *ppos)
339{
340 int ret = 0;
341
342 ret = proc_dointvec(table, write, buffer, lenp, ppos);
343
344 if (write && !ret) {
345 int enabled = init_net.ipv4.sysctl_udp_early_demux;
346
347 proc_configure_early_demux(enabled, IPPROTO_UDP);
348 }
349
350 return ret;
351}
352
3e37c3f9 353static struct ctl_table ipv4_table[] = {
e905a9ed 354 {
1da177e4
LT
355 .procname = "tcp_timestamps",
356 .data = &sysctl_tcp_timestamps,
357 .maxlen = sizeof(int),
358 .mode = 0644,
6d9f239a 359 .proc_handler = proc_dointvec
1da177e4 360 },
e905a9ed 361 {
1da177e4
LT
362 .procname = "tcp_window_scaling",
363 .data = &sysctl_tcp_window_scaling,
364 .maxlen = sizeof(int),
365 .mode = 0644,
6d9f239a 366 .proc_handler = proc_dointvec
1da177e4 367 },
e905a9ed 368 {
1da177e4
LT
369 .procname = "tcp_sack",
370 .data = &sysctl_tcp_sack,
371 .maxlen = sizeof(int),
372 .mode = 0644,
6d9f239a 373 .proc_handler = proc_dointvec
1da177e4 374 },
e905a9ed 375 {
1da177e4
LT
376 .procname = "tcp_retrans_collapse",
377 .data = &sysctl_tcp_retrans_collapse,
378 .maxlen = sizeof(int),
379 .mode = 0644,
6d9f239a 380 .proc_handler = proc_dointvec
1da177e4 381 },
1da177e4 382 {
1da177e4
LT
383 .procname = "tcp_max_orphans",
384 .data = &sysctl_tcp_max_orphans,
385 .maxlen = sizeof(int),
386 .mode = 0644,
6d9f239a 387 .proc_handler = proc_dointvec
1da177e4 388 },
2100c8d2
YC
389 {
390 .procname = "tcp_fastopen",
391 .data = &sysctl_tcp_fastopen,
392 .maxlen = sizeof(int),
393 .mode = 0644,
394 .proc_handler = proc_dointvec,
395 },
10467163
JC
396 {
397 .procname = "tcp_fastopen_key",
398 .mode = 0600,
399 .maxlen = ((TCP_FASTOPEN_KEY_LENGTH * 2) + 10),
400 .proc_handler = proc_tcp_fastopen_key,
401 },
1da177e4 402 {
1da177e4
LT
403 .procname = "tcp_abort_on_overflow",
404 .data = &sysctl_tcp_abort_on_overflow,
405 .maxlen = sizeof(int),
406 .mode = 0644,
6d9f239a 407 .proc_handler = proc_dointvec
1da177e4
LT
408 },
409 {
1da177e4
LT
410 .procname = "tcp_stdurg",
411 .data = &sysctl_tcp_stdurg,
412 .maxlen = sizeof(int),
413 .mode = 0644,
6d9f239a 414 .proc_handler = proc_dointvec
1da177e4
LT
415 },
416 {
1da177e4
LT
417 .procname = "tcp_rfc1337",
418 .data = &sysctl_tcp_rfc1337,
419 .maxlen = sizeof(int),
420 .mode = 0644,
6d9f239a 421 .proc_handler = proc_dointvec
1da177e4 422 },
1da177e4 423 {
1da177e4
LT
424 .procname = "inet_peer_threshold",
425 .data = &inet_peer_threshold,
426 .maxlen = sizeof(int),
427 .mode = 0644,
6d9f239a 428 .proc_handler = proc_dointvec
1da177e4
LT
429 },
430 {
1da177e4
LT
431 .procname = "inet_peer_minttl",
432 .data = &inet_peer_minttl,
433 .maxlen = sizeof(int),
434 .mode = 0644,
6d9f239a 435 .proc_handler = proc_dointvec_jiffies,
1da177e4
LT
436 },
437 {
1da177e4
LT
438 .procname = "inet_peer_maxttl",
439 .data = &inet_peer_maxttl,
440 .maxlen = sizeof(int),
441 .mode = 0644,
6d9f239a 442 .proc_handler = proc_dointvec_jiffies,
1da177e4 443 },
1da177e4 444 {
1da177e4
LT
445 .procname = "tcp_fack",
446 .data = &sysctl_tcp_fack,
447 .maxlen = sizeof(int),
448 .mode = 0644,
6d9f239a 449 .proc_handler = proc_dointvec
1da177e4 450 },
4f41b1c5
YC
451 {
452 .procname = "tcp_recovery",
453 .data = &sysctl_tcp_recovery,
454 .maxlen = sizeof(int),
455 .mode = 0644,
456 .proc_handler = proc_dointvec,
457 },
dca145ff
ED
458 {
459 .procname = "tcp_max_reordering",
460 .data = &sysctl_tcp_max_reordering,
461 .maxlen = sizeof(int),
462 .mode = 0644,
463 .proc_handler = proc_dointvec
464 },
1da177e4 465 {
1da177e4
LT
466 .procname = "tcp_dsack",
467 .data = &sysctl_tcp_dsack,
468 .maxlen = sizeof(int),
469 .mode = 0644,
6d9f239a 470 .proc_handler = proc_dointvec
1da177e4 471 },
a4fe34bf
EB
472 {
473 .procname = "tcp_mem",
474 .maxlen = sizeof(sysctl_tcp_mem),
475 .data = &sysctl_tcp_mem,
476 .mode = 0644,
477 .proc_handler = proc_doulongvec_minmax,
478 },
1da177e4 479 {
1da177e4
LT
480 .procname = "tcp_wmem",
481 .data = &sysctl_tcp_wmem,
482 .maxlen = sizeof(sysctl_tcp_wmem),
483 .mode = 0644,
cdda8891 484 .proc_handler = proc_dointvec_minmax,
5d37852b 485 .extra1 = &one,
1da177e4
LT
486 },
487 {
1da177e4
LT
488 .procname = "tcp_rmem",
489 .data = &sysctl_tcp_rmem,
490 .maxlen = sizeof(sysctl_tcp_rmem),
491 .mode = 0644,
cdda8891 492 .proc_handler = proc_dointvec_minmax,
5d37852b 493 .extra1 = &one,
1da177e4
LT
494 },
495 {
1da177e4
LT
496 .procname = "tcp_app_win",
497 .data = &sysctl_tcp_app_win,
498 .maxlen = sizeof(int),
499 .mode = 0644,
6d9f239a 500 .proc_handler = proc_dointvec
1da177e4
LT
501 },
502 {
1da177e4
LT
503 .procname = "tcp_adv_win_scale",
504 .data = &sysctl_tcp_adv_win_scale,
505 .maxlen = sizeof(int),
506 .mode = 0644,
0147fc05
AD
507 .proc_handler = proc_dointvec_minmax,
508 .extra1 = &tcp_adv_win_scale_min,
509 .extra2 = &tcp_adv_win_scale_max,
1da177e4 510 },
1da177e4 511 {
1da177e4
LT
512 .procname = "tcp_frto",
513 .data = &sysctl_tcp_frto,
514 .maxlen = sizeof(int),
f6722583
YC
515 .mode = 0644,
516 .proc_handler = proc_dointvec
517 },
518 {
519 .procname = "tcp_min_rtt_wlen",
520 .data = &sysctl_tcp_min_rtt_wlen,
521 .maxlen = sizeof(int),
1da177e4 522 .mode = 0644,
6d9f239a 523 .proc_handler = proc_dointvec
1da177e4
LT
524 },
525 {
1da177e4
LT
526 .procname = "tcp_low_latency",
527 .data = &sysctl_tcp_low_latency,
528 .maxlen = sizeof(int),
529 .mode = 0644,
6d9f239a 530 .proc_handler = proc_dointvec
1da177e4 531 },
1da177e4 532 {
1da177e4
LT
533 .procname = "tcp_no_metrics_save",
534 .data = &sysctl_tcp_nometrics_save,
535 .maxlen = sizeof(int),
536 .mode = 0644,
6d9f239a 537 .proc_handler = proc_dointvec,
1da177e4 538 },
1da177e4 539 {
1da177e4
LT
540 .procname = "tcp_moderate_rcvbuf",
541 .data = &sysctl_tcp_moderate_rcvbuf,
542 .maxlen = sizeof(int),
543 .mode = 0644,
6d9f239a 544 .proc_handler = proc_dointvec,
1da177e4
LT
545 },
546 {
1da177e4
LT
547 .procname = "tcp_tso_win_divisor",
548 .data = &sysctl_tcp_tso_win_divisor,
549 .maxlen = sizeof(int),
550 .mode = 0644,
6d9f239a 551 .proc_handler = proc_dointvec,
1da177e4
LT
552 },
553 {
317a76f9 554 .procname = "tcp_congestion_control",
1da177e4 555 .mode = 0644,
317a76f9 556 .maxlen = TCP_CA_NAME_MAX,
6d9f239a 557 .proc_handler = proc_tcp_congestion_control,
1da177e4 558 },
e905a9ed 559 {
15d99e02
RJ
560 .procname = "tcp_workaround_signed_windows",
561 .data = &sysctl_tcp_workaround_signed_windows,
562 .maxlen = sizeof(int),
563 .mode = 0644,
6d9f239a 564 .proc_handler = proc_dointvec
15d99e02 565 },
46d3ceab
ED
566 {
567 .procname = "tcp_limit_output_bytes",
568 .data = &sysctl_tcp_limit_output_bytes,
569 .maxlen = sizeof(int),
570 .mode = 0644,
571 .proc_handler = proc_dointvec
572 },
282f23c6
ED
573 {
574 .procname = "tcp_challenge_ack_limit",
575 .data = &sysctl_tcp_challenge_ack_limit,
576 .maxlen = sizeof(int),
577 .mode = 0644,
578 .proc_handler = proc_dointvec
579 },
35089bb2 580 {
35089bb2
DM
581 .procname = "tcp_slow_start_after_idle",
582 .data = &sysctl_tcp_slow_start_after_idle,
583 .maxlen = sizeof(int),
584 .mode = 0644,
6d9f239a 585 .proc_handler = proc_dointvec
35089bb2 586 },
446fda4f
PM
587#ifdef CONFIG_NETLABEL
588 {
446fda4f
PM
589 .procname = "cipso_cache_enable",
590 .data = &cipso_v4_cache_enabled,
591 .maxlen = sizeof(int),
592 .mode = 0644,
6d9f239a 593 .proc_handler = proc_dointvec,
446fda4f
PM
594 },
595 {
446fda4f
PM
596 .procname = "cipso_cache_bucket_size",
597 .data = &cipso_v4_cache_bucketsize,
598 .maxlen = sizeof(int),
599 .mode = 0644,
6d9f239a 600 .proc_handler = proc_dointvec,
446fda4f
PM
601 },
602 {
446fda4f
PM
603 .procname = "cipso_rbm_optfmt",
604 .data = &cipso_v4_rbm_optfmt,
605 .maxlen = sizeof(int),
606 .mode = 0644,
6d9f239a 607 .proc_handler = proc_dointvec,
446fda4f
PM
608 },
609 {
446fda4f
PM
610 .procname = "cipso_rbm_strictvalid",
611 .data = &cipso_v4_rbm_strictvalid,
612 .maxlen = sizeof(int),
613 .mode = 0644,
6d9f239a 614 .proc_handler = proc_dointvec,
446fda4f
PM
615 },
616#endif /* CONFIG_NETLABEL */
3ff825b2 617 {
3ff825b2
SH
618 .procname = "tcp_available_congestion_control",
619 .maxlen = TCP_CA_BUF_MAX,
620 .mode = 0444,
6d9f239a 621 .proc_handler = proc_tcp_available_congestion_control,
3ff825b2 622 },
ce7bc3bf 623 {
ce7bc3bf
SH
624 .procname = "tcp_allowed_congestion_control",
625 .maxlen = TCP_CA_BUF_MAX,
626 .mode = 0644,
6d9f239a 627 .proc_handler = proc_allowed_congestion_control,
ce7bc3bf 628 },
36e31b0a
AP
629 {
630 .procname = "tcp_thin_linear_timeouts",
631 .data = &sysctl_tcp_thin_linear_timeouts,
632 .maxlen = sizeof(int),
633 .mode = 0644,
634 .proc_handler = proc_dointvec
635 },
eed530b6
YC
636 {
637 .procname = "tcp_early_retrans",
638 .data = &sysctl_tcp_early_retrans,
639 .maxlen = sizeof(int),
640 .mode = 0644,
641 .proc_handler = proc_dointvec_minmax,
642 .extra1 = &zero,
6ba8a3b1 643 .extra2 = &four,
eed530b6 644 },
95bd09eb
ED
645 {
646 .procname = "tcp_min_tso_segs",
647 .data = &sysctl_tcp_min_tso_segs,
648 .maxlen = sizeof(int),
649 .mode = 0644,
650 .proc_handler = proc_dointvec_minmax,
d6a4e26a 651 .extra1 = &one,
95bd09eb
ED
652 .extra2 = &gso_max_segs,
653 },
43e122b0
ED
654 {
655 .procname = "tcp_pacing_ss_ratio",
656 .data = &sysctl_tcp_pacing_ss_ratio,
657 .maxlen = sizeof(int),
658 .mode = 0644,
659 .proc_handler = proc_dointvec_minmax,
660 .extra1 = &zero,
661 .extra2 = &thousand,
662 },
663 {
664 .procname = "tcp_pacing_ca_ratio",
665 .data = &sysctl_tcp_pacing_ca_ratio,
666 .maxlen = sizeof(int),
667 .mode = 0644,
668 .proc_handler = proc_dointvec_minmax,
669 .extra1 = &zero,
670 .extra2 = &thousand,
671 },
f54b3111
ED
672 {
673 .procname = "tcp_autocorking",
674 .data = &sysctl_tcp_autocorking,
675 .maxlen = sizeof(int),
676 .mode = 0644,
677 .proc_handler = proc_dointvec_minmax,
678 .extra1 = &zero,
679 .extra2 = &one,
680 },
032ee423
NC
681 {
682 .procname = "tcp_invalid_ratelimit",
683 .data = &sysctl_tcp_invalid_ratelimit,
684 .maxlen = sizeof(int),
685 .mode = 0644,
686 .proc_handler = proc_dointvec_ms_jiffies,
687 },
4cdf507d
ED
688 {
689 .procname = "icmp_msgs_per_sec",
690 .data = &sysctl_icmp_msgs_per_sec,
691 .maxlen = sizeof(int),
692 .mode = 0644,
693 .proc_handler = proc_dointvec_minmax,
694 .extra1 = &zero,
695 },
696 {
697 .procname = "icmp_msgs_burst",
698 .data = &sysctl_icmp_msgs_burst,
699 .maxlen = sizeof(int),
700 .mode = 0644,
701 .proc_handler = proc_dointvec_minmax,
702 .extra1 = &zero,
703 },
95766fff 704 {
95766fff
HA
705 .procname = "udp_mem",
706 .data = &sysctl_udp_mem,
707 .maxlen = sizeof(sysctl_udp_mem),
708 .mode = 0644,
8d987e5c 709 .proc_handler = proc_doulongvec_minmax,
95766fff
HA
710 },
711 {
95766fff
HA
712 .procname = "udp_rmem_min",
713 .data = &sysctl_udp_rmem_min,
714 .maxlen = sizeof(sysctl_udp_rmem_min),
715 .mode = 0644,
6d9f239a 716 .proc_handler = proc_dointvec_minmax,
5d37852b 717 .extra1 = &one
95766fff
HA
718 },
719 {
95766fff
HA
720 .procname = "udp_wmem_min",
721 .data = &sysctl_udp_wmem_min,
722 .maxlen = sizeof(sysctl_udp_wmem_min),
723 .mode = 0644,
6d9f239a 724 .proc_handler = proc_dointvec_minmax,
5d37852b 725 .extra1 = &one
95766fff 726 },
f8572d8f 727 { }
1da177e4 728};
3e37c3f9 729
68528f09
PE
730static struct ctl_table ipv4_net_table[] = {
731 {
68528f09
PE
732 .procname = "icmp_echo_ignore_all",
733 .data = &init_net.ipv4.sysctl_icmp_echo_ignore_all,
734 .maxlen = sizeof(int),
735 .mode = 0644,
6d9f239a 736 .proc_handler = proc_dointvec
68528f09
PE
737 },
738 {
68528f09
PE
739 .procname = "icmp_echo_ignore_broadcasts",
740 .data = &init_net.ipv4.sysctl_icmp_echo_ignore_broadcasts,
741 .maxlen = sizeof(int),
742 .mode = 0644,
6d9f239a 743 .proc_handler = proc_dointvec
68528f09
PE
744 },
745 {
68528f09
PE
746 .procname = "icmp_ignore_bogus_error_responses",
747 .data = &init_net.ipv4.sysctl_icmp_ignore_bogus_error_responses,
748 .maxlen = sizeof(int),
749 .mode = 0644,
6d9f239a 750 .proc_handler = proc_dointvec
68528f09
PE
751 },
752 {
68528f09
PE
753 .procname = "icmp_errors_use_inbound_ifaddr",
754 .data = &init_net.ipv4.sysctl_icmp_errors_use_inbound_ifaddr,
755 .maxlen = sizeof(int),
756 .mode = 0644,
6d9f239a 757 .proc_handler = proc_dointvec
68528f09
PE
758 },
759 {
68528f09
PE
760 .procname = "icmp_ratelimit",
761 .data = &init_net.ipv4.sysctl_icmp_ratelimit,
762 .maxlen = sizeof(int),
763 .mode = 0644,
6d9f239a 764 .proc_handler = proc_dointvec_ms_jiffies,
68528f09
PE
765 },
766 {
68528f09
PE
767 .procname = "icmp_ratemask",
768 .data = &init_net.ipv4.sysctl_icmp_ratemask,
769 .maxlen = sizeof(int),
770 .mode = 0644,
6d9f239a 771 .proc_handler = proc_dointvec
68528f09 772 },
c319b4d7
VK
773 {
774 .procname = "ping_group_range",
ba6b918a 775 .data = &init_net.ipv4.ping_group_range.range,
7064d16e 776 .maxlen = sizeof(gid_t)*2,
c319b4d7
VK
777 .mode = 0644,
778 .proc_handler = ipv4_ping_group_range,
779 },
5d134f1c
HFS
780 {
781 .procname = "tcp_ecn",
782 .data = &init_net.ipv4.sysctl_tcp_ecn,
783 .maxlen = sizeof(int),
784 .mode = 0644,
785 .proc_handler = proc_dointvec
786 },
49213555
DB
787 {
788 .procname = "tcp_ecn_fallback",
789 .data = &init_net.ipv4.sysctl_tcp_ecn_fallback,
790 .maxlen = sizeof(int),
791 .mode = 0644,
792 .proc_handler = proc_dointvec
793 },
287b7f38
NB
794 {
795 .procname = "ip_dynaddr",
796 .data = &init_net.ipv4.sysctl_ip_dynaddr,
797 .maxlen = sizeof(int),
798 .mode = 0644,
799 .proc_handler = proc_dointvec
800 },
e21145a9
NB
801 {
802 .procname = "ip_early_demux",
803 .data = &init_net.ipv4.sysctl_ip_early_demux,
804 .maxlen = sizeof(int),
805 .mode = 0644,
806 .proc_handler = proc_dointvec
807 },
dddb64bc
SAK
808 {
809 .procname = "udp_early_demux",
810 .data = &init_net.ipv4.sysctl_udp_early_demux,
811 .maxlen = sizeof(int),
812 .mode = 0644,
813 .proc_handler = proc_udp_early_demux
814 },
815 {
816 .procname = "tcp_early_demux",
817 .data = &init_net.ipv4.sysctl_tcp_early_demux,
818 .maxlen = sizeof(int),
819 .mode = 0644,
820 .proc_handler = proc_tcp_early_demux
821 },
fa50d974
NB
822 {
823 .procname = "ip_default_ttl",
824 .data = &init_net.ipv4.sysctl_ip_default_ttl,
825 .maxlen = sizeof(int),
826 .mode = 0644,
827 .proc_handler = proc_dointvec_minmax,
828 .extra1 = &ip_ttl_min,
829 .extra2 = &ip_ttl_max,
830 },
0bbf87d8
EB
831 {
832 .procname = "ip_local_port_range",
c9d8f1a6
CW
833 .maxlen = sizeof(init_net.ipv4.ip_local_ports.range),
834 .data = &init_net.ipv4.ip_local_ports.range,
0bbf87d8
EB
835 .mode = 0644,
836 .proc_handler = ipv4_local_port_range,
837 },
122ff243
WC
838 {
839 .procname = "ip_local_reserved_ports",
840 .data = &init_net.ipv4.sysctl_local_reserved_ports,
841 .maxlen = 65536,
842 .mode = 0644,
843 .proc_handler = proc_do_large_bitmap,
844 },
974eda11
HFS
845 {
846 .procname = "ip_no_pmtu_disc",
847 .data = &init_net.ipv4.sysctl_ip_no_pmtu_disc,
848 .maxlen = sizeof(int),
849 .mode = 0644,
850 .proc_handler = proc_dointvec
851 },
f87c10a8
HFS
852 {
853 .procname = "ip_forward_use_pmtu",
854 .data = &init_net.ipv4.sysctl_ip_fwd_use_pmtu,
855 .maxlen = sizeof(int),
856 .mode = 0644,
857 .proc_handler = proc_dointvec,
858 },
49a60158
VB
859 {
860 .procname = "ip_nonlocal_bind",
861 .data = &init_net.ipv4.sysctl_ip_nonlocal_bind,
862 .maxlen = sizeof(int),
863 .mode = 0644,
864 .proc_handler = proc_dointvec
865 },
e110861f
LC
866 {
867 .procname = "fwmark_reflect",
868 .data = &init_net.ipv4.sysctl_fwmark_reflect,
869 .maxlen = sizeof(int),
870 .mode = 0644,
871 .proc_handler = proc_dointvec,
872 },
84f39b08
LC
873 {
874 .procname = "tcp_fwmark_accept",
875 .data = &init_net.ipv4.sysctl_tcp_fwmark_accept,
876 .maxlen = sizeof(int),
877 .mode = 0644,
878 .proc_handler = proc_dointvec,
879 },
6dd9a14e
DA
880#ifdef CONFIG_NET_L3_MASTER_DEV
881 {
882 .procname = "tcp_l3mdev_accept",
883 .data = &init_net.ipv4.sysctl_tcp_l3mdev_accept,
884 .maxlen = sizeof(int),
885 .mode = 0644,
886 .proc_handler = proc_dointvec_minmax,
887 .extra1 = &zero,
888 .extra2 = &one,
889 },
890#endif
b0f9ca53
FD
891 {
892 .procname = "tcp_mtu_probing",
893 .data = &init_net.ipv4.sysctl_tcp_mtu_probing,
894 .maxlen = sizeof(int),
895 .mode = 0644,
896 .proc_handler = proc_dointvec,
897 },
898 {
899 .procname = "tcp_base_mss",
900 .data = &init_net.ipv4.sysctl_tcp_base_mss,
901 .maxlen = sizeof(int),
902 .mode = 0644,
903 .proc_handler = proc_dointvec,
904 },
6b58e0a5
FD
905 {
906 .procname = "tcp_probe_threshold",
907 .data = &init_net.ipv4.sysctl_tcp_probe_threshold,
908 .maxlen = sizeof(int),
909 .mode = 0644,
910 .proc_handler = proc_dointvec,
911 },
05cbc0db
FD
912 {
913 .procname = "tcp_probe_interval",
914 .data = &init_net.ipv4.sysctl_tcp_probe_interval,
915 .maxlen = sizeof(int),
916 .mode = 0644,
917 .proc_handler = proc_dointvec,
918 },
df2cf4a7
PD
919 {
920 .procname = "igmp_link_local_mcast_reports",
87a8a2ae 921 .data = &init_net.ipv4.sysctl_igmp_llm_reports,
df2cf4a7
PD
922 .maxlen = sizeof(int),
923 .mode = 0644,
924 .proc_handler = proc_dointvec
925 },
815c5270
NB
926 {
927 .procname = "igmp_max_memberships",
928 .data = &init_net.ipv4.sysctl_igmp_max_memberships,
929 .maxlen = sizeof(int),
930 .mode = 0644,
931 .proc_handler = proc_dointvec
932 },
166b6b2d
NB
933 {
934 .procname = "igmp_max_msf",
935 .data = &init_net.ipv4.sysctl_igmp_max_msf,
936 .maxlen = sizeof(int),
937 .mode = 0644,
938 .proc_handler = proc_dointvec
939 },
165094af
NB
940#ifdef CONFIG_IP_MULTICAST
941 {
942 .procname = "igmp_qrv",
943 .data = &init_net.ipv4.sysctl_igmp_qrv,
944 .maxlen = sizeof(int),
945 .mode = 0644,
946 .proc_handler = proc_dointvec_minmax,
947 .extra1 = &one
948 },
949#endif
13b287e8
NB
950 {
951 .procname = "tcp_keepalive_time",
952 .data = &init_net.ipv4.sysctl_tcp_keepalive_time,
953 .maxlen = sizeof(int),
954 .mode = 0644,
955 .proc_handler = proc_dointvec_jiffies,
956 },
9bd6861b
NB
957 {
958 .procname = "tcp_keepalive_probes",
959 .data = &init_net.ipv4.sysctl_tcp_keepalive_probes,
960 .maxlen = sizeof(int),
961 .mode = 0644,
962 .proc_handler = proc_dointvec
963 },
b840d15d
NB
964 {
965 .procname = "tcp_keepalive_intvl",
966 .data = &init_net.ipv4.sysctl_tcp_keepalive_intvl,
967 .maxlen = sizeof(int),
968 .mode = 0644,
969 .proc_handler = proc_dointvec_jiffies,
970 },
6fa25166
NB
971 {
972 .procname = "tcp_syn_retries",
973 .data = &init_net.ipv4.sysctl_tcp_syn_retries,
974 .maxlen = sizeof(int),
975 .mode = 0644,
976 .proc_handler = proc_dointvec_minmax,
977 .extra1 = &tcp_syn_retries_min,
978 .extra2 = &tcp_syn_retries_max
979 },
7c083ecb
NB
980 {
981 .procname = "tcp_synack_retries",
982 .data = &init_net.ipv4.sysctl_tcp_synack_retries,
983 .maxlen = sizeof(int),
984 .mode = 0644,
985 .proc_handler = proc_dointvec
986 },
12ed8244
NB
987#ifdef CONFIG_SYN_COOKIES
988 {
989 .procname = "tcp_syncookies",
990 .data = &init_net.ipv4.sysctl_tcp_syncookies,
991 .maxlen = sizeof(int),
992 .mode = 0644,
993 .proc_handler = proc_dointvec
994 },
995#endif
1043e25f
NB
996 {
997 .procname = "tcp_reordering",
998 .data = &init_net.ipv4.sysctl_tcp_reordering,
999 .maxlen = sizeof(int),
1000 .mode = 0644,
1001 .proc_handler = proc_dointvec
1002 },
ae5c3f40
NB
1003 {
1004 .procname = "tcp_retries1",
1005 .data = &init_net.ipv4.sysctl_tcp_retries1,
1006 .maxlen = sizeof(int),
1007 .mode = 0644,
1008 .proc_handler = proc_dointvec_minmax,
1009 .extra2 = &tcp_retr1_max
1010 },
c6214a97
NB
1011 {
1012 .procname = "tcp_retries2",
1013 .data = &init_net.ipv4.sysctl_tcp_retries2,
1014 .maxlen = sizeof(int),
1015 .mode = 0644,
1016 .proc_handler = proc_dointvec
1017 },
c402d9be
NB
1018 {
1019 .procname = "tcp_orphan_retries",
1020 .data = &init_net.ipv4.sysctl_tcp_orphan_retries,
1021 .maxlen = sizeof(int),
1022 .mode = 0644,
1023 .proc_handler = proc_dointvec
1024 },
1e579caa
NB
1025 {
1026 .procname = "tcp_fin_timeout",
1027 .data = &init_net.ipv4.sysctl_tcp_fin_timeout,
1028 .maxlen = sizeof(int),
1029 .mode = 0644,
1030 .proc_handler = proc_dointvec_jiffies,
1031 },
4979f2d9
NB
1032 {
1033 .procname = "tcp_notsent_lowat",
1034 .data = &init_net.ipv4.sysctl_tcp_notsent_lowat,
1035 .maxlen = sizeof(unsigned int),
1036 .mode = 0644,
b007f090 1037 .proc_handler = proc_douintvec,
4979f2d9 1038 },
56ab6b93
HY
1039 {
1040 .procname = "tcp_tw_reuse",
1041 .data = &init_net.ipv4.sysctl_tcp_tw_reuse,
1042 .maxlen = sizeof(int),
1043 .mode = 0644,
1044 .proc_handler = proc_dointvec
1045 },
1946e672
HY
1046 {
1047 .procname = "tcp_max_tw_buckets",
1048 .data = &init_net.ipv4.tcp_death_row.sysctl_max_tw_buckets,
1049 .maxlen = sizeof(int),
1050 .mode = 0644,
1051 .proc_handler = proc_dointvec
1052 },
fee83d09
HY
1053 {
1054 .procname = "tcp_max_syn_backlog",
1055 .data = &init_net.ipv4.sysctl_max_syn_backlog,
1056 .maxlen = sizeof(int),
1057 .mode = 0644,
1058 .proc_handler = proc_dointvec
1059 },
a6db4494
DA
1060#ifdef CONFIG_IP_ROUTE_MULTIPATH
1061 {
1062 .procname = "fib_multipath_use_neigh",
1063 .data = &init_net.ipv4.sysctl_fib_multipath_use_neigh,
1064 .maxlen = sizeof(int),
1065 .mode = 0644,
1066 .proc_handler = proc_dointvec_minmax,
bf4e0a3d
NA
1067 .extra1 = &zero,
1068 .extra2 = &one,
1069 },
1070 {
1071 .procname = "fib_multipath_hash_policy",
1072 .data = &init_net.ipv4.sysctl_fib_multipath_hash_policy,
1073 .maxlen = sizeof(int),
1074 .mode = 0644,
1075 .proc_handler = proc_dointvec_minmax,
a6db4494
DA
1076 .extra1 = &zero,
1077 .extra2 = &one,
1078 },
1079#endif
4548b683
KJ
1080 {
1081 .procname = "ip_unprivileged_port_start",
1082 .maxlen = sizeof(int),
1083 .data = &init_net.ipv4.sysctl_ip_prot_sock,
1084 .mode = 0644,
1085 .proc_handler = ipv4_privileged_ports,
1086 },
63a6fff3
RS
1087#ifdef CONFIG_NET_L3_MASTER_DEV
1088 {
1089 .procname = "udp_l3mdev_accept",
1090 .data = &init_net.ipv4.sysctl_udp_l3mdev_accept,
1091 .maxlen = sizeof(int),
1092 .mode = 0644,
1093 .proc_handler = proc_dointvec_minmax,
1094 .extra1 = &zero,
1095 .extra2 = &one,
1096 },
1097#endif
68528f09
PE
1098 { }
1099};
1100
1577519d
PE
1101static __net_init int ipv4_sysctl_init_net(struct net *net)
1102{
68528f09
PE
1103 struct ctl_table *table;
1104
1105 table = ipv4_net_table;
09ad9bc7 1106 if (!net_eq(net, &init_net)) {
0a6fa23d
EB
1107 int i;
1108
68528f09 1109 table = kmemdup(table, sizeof(ipv4_net_table), GFP_KERNEL);
51456b29 1110 if (!table)
68528f09
PE
1111 goto err_alloc;
1112
0a6fa23d
EB
1113 /* Update the variables to point into the current struct net */
1114 for (i = 0; i < ARRAY_SIZE(ipv4_net_table) - 1; i++)
1115 table[i].data += (void *)net - (void *)&init_net;
68528f09
PE
1116 }
1117
ec8f23ce 1118 net->ipv4.ipv4_hdr = register_net_sysctl(net, "net/ipv4", table);
51456b29 1119 if (!net->ipv4.ipv4_hdr)
68528f09
PE
1120 goto err_reg;
1121
122ff243
WC
1122 net->ipv4.sysctl_local_reserved_ports = kzalloc(65536 / 8, GFP_KERNEL);
1123 if (!net->ipv4.sysctl_local_reserved_ports)
1124 goto err_ports;
1125
1577519d 1126 return 0;
68528f09 1127
122ff243
WC
1128err_ports:
1129 unregister_net_sysctl_table(net->ipv4.ipv4_hdr);
68528f09 1130err_reg:
09ad9bc7 1131 if (!net_eq(net, &init_net))
68528f09
PE
1132 kfree(table);
1133err_alloc:
1134 return -ENOMEM;
1577519d
PE
1135}
1136
1137static __net_exit void ipv4_sysctl_exit_net(struct net *net)
1138{
68528f09
PE
1139 struct ctl_table *table;
1140
122ff243 1141 kfree(net->ipv4.sysctl_local_reserved_ports);
68528f09
PE
1142 table = net->ipv4.ipv4_hdr->ctl_table_arg;
1143 unregister_net_sysctl_table(net->ipv4.ipv4_hdr);
1144 kfree(table);
1577519d
PE
1145}
1146
1147static __net_initdata struct pernet_operations ipv4_sysctl_ops = {
1148 .init = ipv4_sysctl_init_net,
1149 .exit = ipv4_sysctl_exit_net,
1150};
1151
3e37c3f9
PE
1152static __init int sysctl_ipv4_init(void)
1153{
1154 struct ctl_table_header *hdr;
1155
ec8f23ce 1156 hdr = register_net_sysctl(&init_net, "net/ipv4", ipv4_table);
51456b29 1157 if (!hdr)
1577519d
PE
1158 return -ENOMEM;
1159
1160 if (register_pernet_subsys(&ipv4_sysctl_ops)) {
5dd3df10 1161 unregister_net_sysctl_table(hdr);
1577519d
PE
1162 return -ENOMEM;
1163 }
1164
1165 return 0;
3e37c3f9
PE
1166}
1167
1168__initcall(sysctl_ipv4_init);