2 * sysctl_net_ipv4.c: sysctl interface to net IPV4 subsystem.
4 * Begun April 1, 1996, Mike Shaver.
5 * Added /proc/sys/net/ipv4 directory entry (empty =) ). [MS]
9 #include <linux/module.h>
10 #include <linux/sysctl.h>
11 #include <linux/igmp.h>
12 #include <linux/inetdevice.h>
13 #include <linux/seqlock.h>
14 #include <linux/init.h>
15 #include <linux/slab.h>
16 #include <linux/nsproxy.h>
20 #include <net/route.h>
23 #include <net/cipso_ipv4.h>
24 #include <net/inet_frag.h>
/*
 * Limits referenced through the .extra1 / .extra2 fields of the sysctl
 * entries and scratch tables in this file; they are consumed by
 * proc_dointvec_minmax().
 */
/* .extra2 of the "tcp_retries1" entry. */
28 static int tcp_retr1_max
= 255;
/* Per-element bounds for the two-value range used by ipv4_local_port_range(). */
29 static int ip_local_port_range_min
[] = { 1, 1 };
30 static int ip_local_port_range_max
[] = { 65535, 65535 };
/* .extra1 / .extra2 of the "tcp_adv_win_scale" entry. */
31 static int tcp_adv_win_scale_min
= -31;
32 static int tcp_adv_win_scale_max
= 31;
/* .extra1 / .extra2 of the "ip_default_ttl" entry. */
33 static int ip_ttl_min
= 1;
34 static int ip_ttl_max
= 255;
/* Per-element bounds for the two-value range used by ipv4_ping_group_range(). */
35 static int ip_ping_group_range_min
[] = { 0, 0 };
36 static int ip_ping_group_range_max
[] = { GID_T_MAX
, GID_T_MAX
};
38 /* Update system visible IP port range */
/*
 * Copies range[0] and range[1] into sysctl_local_ports.range.  Both stores
 * are made between write_seqlock() and write_sequnlock() on
 * sysctl_local_ports.lock, so readers using the matching seqlock read side
 * retry instead of observing a half-updated pair.
 */
39 static void set_local_port_range(int range
[2])
/* Begin the seqlock write section. */
41 write_seqlock(&sysctl_local_ports
.lock
);
42 sysctl_local_ports
.range
[0] = range
[0];
43 sysctl_local_ports
.range
[1] = range
[1];
/* End the seqlock write section. */
44 write_sequnlock(&sysctl_local_ports
.lock
);
47 /* Validate changes from /proc interface. */
/*
 * proc handler for the "ip_local_port_range" entry.
 *
 * Parsing is done by proc_dointvec_minmax() on a scratch table (tmp) whose
 * size is that of the local range[] pair and whose bounds are
 * ip_local_port_range_min / ip_local_port_range_max.  After a successful
 * write the pair is additionally checked for ordering before being
 * published with set_local_port_range().
 *
 * NOTE(review): this extract omits several lines of the function (the
 * buffer parameter, the local declarations, braces and the return
 * statement); the comments below cover only the statements that are visible.
 */
48 static int ipv4_local_port_range(ctl_table
*table
, int write
,
50 size_t *lenp
, loff_t
*ppos
)
/* Scratch table fields: room for both values, each bounded per element. */
56 .maxlen
= sizeof(range
),
58 .extra1
= &ip_local_port_range_min
,
59 .extra2
= &ip_local_port_range_max
,
/* Seed range[0] / range[1] with the current values before parsing. */
62 inet_get_local_port_range(range
, range
+ 1);
63 ret
= proc_dointvec_minmax(&tmp
, write
, buffer
, lenp
, ppos
);
/* Only a successful write may change the published range. */
65 if (write
&& ret
== 0) {
/*
 * Second value below the first: the statement executed for this case is
 * not present in this extract (presumably an error return, TODO confirm).
 */
66 if (range
[1] < range
[0])
69 set_local_port_range(range
);
/*
 * Reads the ping group range stored behind table->data (viewed as a gid_t
 * array) on behalf of the caller.
 *
 * The read is wrapped in a read_seqbegin() / read_seqretry() loop on
 * sysctl_local_ports.lock, i.e. the same seqlock that
 * set_local_port_range() takes for the local port range.
 *
 * NOTE(review): the loop body is not present in this extract; presumably it
 * copies data[0] / data[1] into *low / *high, TODO confirm.
 */
76 void inet_get_ping_group_range_table(struct ctl_table
*table
, gid_t
*low
, gid_t
*high
)
78 gid_t
*data
= table
->data
;
/* Snapshot the sequence counter; the loop repeats if a writer intervened. */
81 seq
= read_seqbegin(&sysctl_local_ports
.lock
);
85 } while (read_seqretry(&sysctl_local_ports
.lock
, seq
));
88 /*
 * Update the ping group range kept behind table->data (viewed as a gid_t
 * array).  The update is bracketed by write_seqlock() / write_sequnlock() on
 * sysctl_local_ports.lock, the seqlock that inet_get_ping_group_range_table()
 * reads under.
 *
 * NOTE(review): the stores performed inside the write section are not
 * present in this extract; presumably range[0] / range[1] are written to
 * data[0] / data[1], TODO confirm.
 */
89 static void set_ping_group_range(struct ctl_table
*table
, int range
[2])
91 gid_t
*data
= table
->data
;
/* Begin the seqlock write section. */
92 write_seqlock(&sysctl_local_ports
.lock
);
/* End the seqlock write section. */
95 write_sequnlock(&sysctl_local_ports
.lock
);
98 /* Validate changes from /proc interface. */
/*
 * proc handler for the "ping_group_range" entry.
 *
 * Parsing is done by proc_dointvec_minmax() on a scratch table (tmp) sized
 * for the local range[] pair and bounded by ip_ping_group_range_min /
 * ip_ping_group_range_max.  After a successful write the pair is stored
 * through set_ping_group_range().
 *
 * NOTE(review): this extract omits several lines of the function (the
 * buffer parameter, the local declarations, braces and the return
 * statement); the comments below cover only the statements that are visible.
 */
99 static int ipv4_ping_group_range(ctl_table
*table
, int write
,
101 size_t *lenp
, loff_t
*ppos
)
/* Scratch table fields: room for both values, each bounded per element. */
107 .maxlen
= sizeof(range
),
109 .extra1
= &ip_ping_group_range_min
,
110 .extra2
= &ip_ping_group_range_max
,
/* Seed range[0] / range[1] from the table's current values before parsing. */
113 inet_get_ping_group_range_table(table
, range
, range
+ 1);
114 ret
= proc_dointvec_minmax(&tmp
, write
, buffer
, lenp
, ppos
);
/* Only a successful write updates the stored range. */
116 if (write
&& ret
== 0)
117 set_ping_group_range(table
, range
);
/*
 * proc handler for the "tcp_congestion_control" entry.
 *
 * The current default algorithm name is fetched into the on-stack buffer
 * val (TCP_CA_NAME_MAX bytes), proc_dostring() then reads or writes that
 * buffer through a scratch table (tbl), and after a successful write the
 * new name is passed to tcp_set_default_congestion_control(), whose result
 * is stored in ret.
 *
 * NOTE(review): the declaration of tbl, the braces and the return statement
 * are not present in this extract.
 */
122 static int proc_tcp_congestion_control(ctl_table
*ctl
, int write
,
123 void __user
*buffer
, size_t *lenp
, loff_t
*ppos
)
125 char val
[TCP_CA_NAME_MAX
];
128 .maxlen
= TCP_CA_NAME_MAX
,
/* Load the current default into val before handing it to proc_dostring(). */
132 tcp_get_default_congestion_control(val
);
134 ret
= proc_dostring(&tbl
, write
, buffer
, lenp
, ppos
);
/* A successfully parsed write selects the new default. */
135 if (write
&& ret
== 0)
136 ret
= tcp_set_default_congestion_control(val
);
/*
 * proc handler for the "tcp_available_congestion_control" entry.
 *
 * A TCP_CA_BUF_MAX-byte buffer is allocated with kmalloc(GFP_USER), filled
 * by tcp_get_available_congestion_control() and then handed to
 * proc_dostring() through the scratch table tbl.
 *
 * NOTE(review): parts of the parameter list, the allocation-failure check,
 * the release of tbl.data and the return statement are not present in this
 * extract; confirm against the full file that the buffer is checked and
 * freed.
 */
140 static int proc_tcp_available_congestion_control(ctl_table
*ctl
,
142 void __user
*buffer
, size_t *lenp
,
145 ctl_table tbl
= { .maxlen
= TCP_CA_BUF_MAX
, };
/* Temporary buffer that backs the scratch table. */
148 tbl
.data
= kmalloc(tbl
.maxlen
, GFP_USER
);
/* Fill the buffer before it is handed to proc_dostring(). */
151 tcp_get_available_congestion_control(tbl
.data
, TCP_CA_BUF_MAX
);
152 ret
= proc_dostring(&tbl
, write
, buffer
, lenp
, ppos
);
/*
 * proc handler for the "tcp_allowed_congestion_control" entry.
 *
 * A TCP_CA_BUF_MAX-byte buffer is allocated with kmalloc(GFP_USER), filled
 * by tcp_get_allowed_congestion_control() and then read or written by
 * proc_dostring() through the scratch table tbl.  After a successful write
 * the buffer contents are passed to tcp_set_allowed_congestion_control(),
 * whose result is stored in ret.
 *
 * NOTE(review): parts of the parameter list, the allocation-failure check,
 * the release of tbl.data and the return statement are not present in this
 * extract; confirm against the full file that the buffer is checked and
 * freed.
 */
157 static int proc_allowed_congestion_control(ctl_table
*ctl
,
159 void __user
*buffer
, size_t *lenp
,
162 ctl_table tbl
= { .maxlen
= TCP_CA_BUF_MAX
};
/* Temporary buffer that backs the scratch table. */
165 tbl
.data
= kmalloc(tbl
.maxlen
, GFP_USER
);
/* Fill the buffer with the current allowed list before proc_dostring(). */
169 tcp_get_allowed_congestion_control(tbl
.data
, tbl
.maxlen
);
170 ret
= proc_dostring(&tbl
, write
, buffer
, lenp
, ppos
);
/* A successfully parsed write replaces the allowed list. */
171 if (write
&& ret
== 0)
172 ret
= tcp_set_allowed_congestion_control(tbl
.data
);
/*
 * Global IPv4 sysctl entries.  sysctl_ipv4_init() registers this table under
 * net_ipv4_ctl_path ("net" / "ipv4") with register_sysctl_paths().
 *
 * Each entry gives the file name (.procname), the variable it exposes
 * (.data and its size in .maxlen) and the routine that parses and formats
 * it (.proc_handler).  Entries handled by proc_dointvec_minmax may carry
 * bounds in .extra1 / .extra2.
 *
 * NOTE(review): some lines of every entry (for example the enclosing
 * braces) are not present in this extract.
 */
177 static struct ctl_table ipv4_table
[] = {
179 .procname
= "tcp_timestamps",
180 .data
= &sysctl_tcp_timestamps
,
181 .maxlen
= sizeof(int),
183 .proc_handler
= proc_dointvec
186 .procname
= "tcp_window_scaling",
187 .data
= &sysctl_tcp_window_scaling
,
188 .maxlen
= sizeof(int),
190 .proc_handler
= proc_dointvec
193 .procname
= "tcp_sack",
194 .data
= &sysctl_tcp_sack
,
195 .maxlen
= sizeof(int),
197 .proc_handler
= proc_dointvec
200 .procname
= "tcp_retrans_collapse",
201 .data
= &sysctl_tcp_retrans_collapse
,
202 .maxlen
= sizeof(int),
204 .proc_handler
= proc_dointvec
207 .procname
= "ip_default_ttl",
208 .data
= &sysctl_ip_default_ttl
,
209 .maxlen
= sizeof(int),
211 .proc_handler
= proc_dointvec_minmax
,
/* Bounded by ip_ttl_min (1) and ip_ttl_max (255). */
212 .extra1
= &ip_ttl_min
,
213 .extra2
= &ip_ttl_max
,
216 .procname
= "ip_no_pmtu_disc",
217 .data
= &ipv4_config
.no_pmtu_disc
,
218 .maxlen
= sizeof(int),
220 .proc_handler
= proc_dointvec
223 .procname
= "ip_nonlocal_bind",
224 .data
= &sysctl_ip_nonlocal_bind
,
225 .maxlen
= sizeof(int),
227 .proc_handler
= proc_dointvec
230 .procname
= "tcp_syn_retries",
231 .data
= &sysctl_tcp_syn_retries
,
232 .maxlen
= sizeof(int),
234 .proc_handler
= proc_dointvec
237 .procname
= "tcp_synack_retries",
238 .data
= &sysctl_tcp_synack_retries
,
239 .maxlen
= sizeof(int),
241 .proc_handler
= proc_dointvec
244 .procname
= "tcp_max_orphans",
245 .data
= &sysctl_tcp_max_orphans
,
246 .maxlen
= sizeof(int),
248 .proc_handler
= proc_dointvec
251 .procname
= "tcp_max_tw_buckets",
252 .data
= &tcp_death_row
.sysctl_max_tw_buckets
,
253 .maxlen
= sizeof(int),
255 .proc_handler
= proc_dointvec
258 .procname
= "ip_dynaddr",
259 .data
= &sysctl_ip_dynaddr
,
260 .maxlen
= sizeof(int),
262 .proc_handler
= proc_dointvec
265 .procname
= "tcp_keepalive_time",
266 .data
= &sysctl_tcp_keepalive_time
,
267 .maxlen
= sizeof(int),
269 .proc_handler
= proc_dointvec_jiffies
,
272 .procname
= "tcp_keepalive_probes",
273 .data
= &sysctl_tcp_keepalive_probes
,
274 .maxlen
= sizeof(int),
276 .proc_handler
= proc_dointvec
279 .procname
= "tcp_keepalive_intvl",
280 .data
= &sysctl_tcp_keepalive_intvl
,
281 .maxlen
= sizeof(int),
283 .proc_handler
= proc_dointvec_jiffies
,
286 .procname
= "tcp_retries1",
287 .data
= &sysctl_tcp_retries1
,
288 .maxlen
= sizeof(int),
290 .proc_handler
= proc_dointvec_minmax
,
/* Capped at tcp_retr1_max (255). */
291 .extra2
= &tcp_retr1_max
294 .procname
= "tcp_retries2",
295 .data
= &sysctl_tcp_retries2
,
296 .maxlen
= sizeof(int),
298 .proc_handler
= proc_dointvec
301 .procname
= "tcp_fin_timeout",
302 .data
= &sysctl_tcp_fin_timeout
,
303 .maxlen
= sizeof(int),
305 .proc_handler
= proc_dointvec_jiffies
,
307 #ifdef CONFIG_SYN_COOKIES
309 .procname
= "tcp_syncookies",
310 .data
= &sysctl_tcp_syncookies
,
311 .maxlen
= sizeof(int),
313 .proc_handler
= proc_dointvec
317 .procname
= "tcp_tw_recycle",
318 .data
= &tcp_death_row
.sysctl_tw_recycle
,
319 .maxlen
= sizeof(int),
321 .proc_handler
= proc_dointvec
324 .procname
= "tcp_abort_on_overflow",
325 .data
= &sysctl_tcp_abort_on_overflow
,
326 .maxlen
= sizeof(int),
328 .proc_handler
= proc_dointvec
331 .procname
= "tcp_stdurg",
332 .data
= &sysctl_tcp_stdurg
,
333 .maxlen
= sizeof(int),
335 .proc_handler
= proc_dointvec
338 .procname
= "tcp_rfc1337",
339 .data
= &sysctl_tcp_rfc1337
,
340 .maxlen
= sizeof(int),
342 .proc_handler
= proc_dointvec
345 .procname
= "tcp_max_syn_backlog",
346 .data
= &sysctl_max_syn_backlog
,
347 .maxlen
= sizeof(int),
349 .proc_handler
= proc_dointvec
/* Uses the file-local handler ipv4_local_port_range(). */
352 .procname
= "ip_local_port_range",
353 .data
= &sysctl_local_ports
.range
,
354 .maxlen
= sizeof(sysctl_local_ports
.range
),
356 .proc_handler
= ipv4_local_port_range
,
359 .procname
= "ip_local_reserved_ports",
360 .data
= NULL
, /* initialized in sysctl_ipv4_init */
363 .proc_handler
= proc_do_large_bitmap
,
366 .procname
= "igmp_max_memberships",
367 .data
= &sysctl_igmp_max_memberships
,
368 .maxlen
= sizeof(int),
370 .proc_handler
= proc_dointvec
373 .procname
= "igmp_max_msf",
374 .data
= &sysctl_igmp_max_msf
,
375 .maxlen
= sizeof(int),
377 .proc_handler
= proc_dointvec
380 .procname
= "inet_peer_threshold",
381 .data
= &inet_peer_threshold
,
382 .maxlen
= sizeof(int),
384 .proc_handler
= proc_dointvec
387 .procname
= "inet_peer_minttl",
388 .data
= &inet_peer_minttl
,
389 .maxlen
= sizeof(int),
391 .proc_handler
= proc_dointvec_jiffies
,
394 .procname
= "inet_peer_maxttl",
395 .data
= &inet_peer_maxttl
,
396 .maxlen
= sizeof(int),
398 .proc_handler
= proc_dointvec_jiffies
,
401 .procname
= "tcp_orphan_retries",
402 .data
= &sysctl_tcp_orphan_retries
,
403 .maxlen
= sizeof(int),
405 .proc_handler
= proc_dointvec
408 .procname
= "tcp_fack",
409 .data
= &sysctl_tcp_fack
,
410 .maxlen
= sizeof(int),
412 .proc_handler
= proc_dointvec
415 .procname
= "tcp_reordering",
416 .data
= &sysctl_tcp_reordering
,
417 .maxlen
= sizeof(int),
419 .proc_handler
= proc_dointvec
422 .procname
= "tcp_ecn",
423 .data
= &sysctl_tcp_ecn
,
424 .maxlen
= sizeof(int),
426 .proc_handler
= proc_dointvec
429 .procname
= "tcp_dsack",
430 .data
= &sysctl_tcp_dsack
,
431 .maxlen
= sizeof(int),
433 .proc_handler
= proc_dointvec
436 .procname
= "tcp_mem",
437 .data
= &sysctl_tcp_mem
,
438 .maxlen
= sizeof(sysctl_tcp_mem
),
440 .proc_handler
= proc_doulongvec_minmax
443 .procname
= "tcp_wmem",
444 .data
= &sysctl_tcp_wmem
,
445 .maxlen
= sizeof(sysctl_tcp_wmem
),
447 .proc_handler
= proc_dointvec
450 .procname
= "tcp_rmem",
451 .data
= &sysctl_tcp_rmem
,
452 .maxlen
= sizeof(sysctl_tcp_rmem
),
454 .proc_handler
= proc_dointvec
457 .procname
= "tcp_app_win",
458 .data
= &sysctl_tcp_app_win
,
459 .maxlen
= sizeof(int),
461 .proc_handler
= proc_dointvec
464 .procname
= "tcp_adv_win_scale",
465 .data
= &sysctl_tcp_adv_win_scale
,
466 .maxlen
= sizeof(int),
468 .proc_handler
= proc_dointvec_minmax
,
/* Bounded by tcp_adv_win_scale_min (-31) and tcp_adv_win_scale_max (31). */
469 .extra1
= &tcp_adv_win_scale_min
,
470 .extra2
= &tcp_adv_win_scale_max
,
473 .procname
= "tcp_tw_reuse",
474 .data
= &sysctl_tcp_tw_reuse
,
475 .maxlen
= sizeof(int),
477 .proc_handler
= proc_dointvec
480 .procname
= "tcp_frto",
481 .data
= &sysctl_tcp_frto
,
482 .maxlen
= sizeof(int),
484 .proc_handler
= proc_dointvec
487 .procname
= "tcp_frto_response",
488 .data
= &sysctl_tcp_frto_response
,
489 .maxlen
= sizeof(int),
491 .proc_handler
= proc_dointvec
494 .procname
= "tcp_low_latency",
495 .data
= &sysctl_tcp_low_latency
,
496 .maxlen
= sizeof(int),
498 .proc_handler
= proc_dointvec
501 .procname
= "tcp_no_metrics_save",
502 .data
= &sysctl_tcp_nometrics_save
,
503 .maxlen
= sizeof(int),
505 .proc_handler
= proc_dointvec
,
508 .procname
= "tcp_moderate_rcvbuf",
509 .data
= &sysctl_tcp_moderate_rcvbuf
,
510 .maxlen
= sizeof(int),
512 .proc_handler
= proc_dointvec
,
515 .procname
= "tcp_tso_win_divisor",
516 .data
= &sysctl_tcp_tso_win_divisor
,
517 .maxlen
= sizeof(int),
519 .proc_handler
= proc_dointvec
,
/* Uses the file-local handler proc_tcp_congestion_control(). */
522 .procname
= "tcp_congestion_control",
524 .maxlen
= TCP_CA_NAME_MAX
,
525 .proc_handler
= proc_tcp_congestion_control
,
528 .procname
= "tcp_abc",
529 .data
= &sysctl_tcp_abc
,
530 .maxlen
= sizeof(int),
532 .proc_handler
= proc_dointvec
,
535 .procname
= "tcp_mtu_probing",
536 .data
= &sysctl_tcp_mtu_probing
,
537 .maxlen
= sizeof(int),
539 .proc_handler
= proc_dointvec
,
542 .procname
= "tcp_base_mss",
543 .data
= &sysctl_tcp_base_mss
,
544 .maxlen
= sizeof(int),
546 .proc_handler
= proc_dointvec
,
549 .procname
= "tcp_workaround_signed_windows",
550 .data
= &sysctl_tcp_workaround_signed_windows
,
551 .maxlen
= sizeof(int),
553 .proc_handler
= proc_dointvec
555 #ifdef CONFIG_NET_DMA
557 .procname
= "tcp_dma_copybreak",
558 .data
= &sysctl_tcp_dma_copybreak
,
559 .maxlen
= sizeof(int),
561 .proc_handler
= proc_dointvec
565 .procname
= "tcp_slow_start_after_idle",
566 .data
= &sysctl_tcp_slow_start_after_idle
,
567 .maxlen
= sizeof(int),
569 .proc_handler
= proc_dointvec
571 #ifdef CONFIG_NETLABEL
573 .procname
= "cipso_cache_enable",
574 .data
= &cipso_v4_cache_enabled
,
575 .maxlen
= sizeof(int),
577 .proc_handler
= proc_dointvec
,
580 .procname
= "cipso_cache_bucket_size",
581 .data
= &cipso_v4_cache_bucketsize
,
582 .maxlen
= sizeof(int),
584 .proc_handler
= proc_dointvec
,
587 .procname
= "cipso_rbm_optfmt",
588 .data
= &cipso_v4_rbm_optfmt
,
589 .maxlen
= sizeof(int),
591 .proc_handler
= proc_dointvec
,
594 .procname
= "cipso_rbm_strictvalid",
595 .data
= &cipso_v4_rbm_strictvalid
,
596 .maxlen
= sizeof(int),
598 .proc_handler
= proc_dointvec
,
600 #endif /* CONFIG_NETLABEL */
/* Uses the file-local handler proc_tcp_available_congestion_control(). */
602 .procname
= "tcp_available_congestion_control",
603 .maxlen
= TCP_CA_BUF_MAX
,
605 .proc_handler
= proc_tcp_available_congestion_control
,
/* Uses the file-local handler proc_allowed_congestion_control(). */
608 .procname
= "tcp_allowed_congestion_control",
609 .maxlen
= TCP_CA_BUF_MAX
,
611 .proc_handler
= proc_allowed_congestion_control
,
614 .procname
= "tcp_max_ssthresh",
615 .data
= &sysctl_tcp_max_ssthresh
,
616 .maxlen
= sizeof(int),
618 .proc_handler
= proc_dointvec
,
621 .procname
= "tcp_cookie_size",
622 .data
= &sysctl_tcp_cookie_size
,
623 .maxlen
= sizeof(int),
625 .proc_handler
= proc_dointvec
628 .procname
= "tcp_thin_linear_timeouts",
629 .data
= &sysctl_tcp_thin_linear_timeouts
,
630 .maxlen
= sizeof(int),
632 .proc_handler
= proc_dointvec
635 .procname
= "tcp_thin_dupack",
636 .data
= &sysctl_tcp_thin_dupack
,
637 .maxlen
= sizeof(int),
639 .proc_handler
= proc_dointvec
642 .procname
= "udp_mem",
643 .data
= &sysctl_udp_mem
,
644 .maxlen
= sizeof(sysctl_udp_mem
),
646 .proc_handler
= proc_doulongvec_minmax
,
649 .procname
= "udp_rmem_min",
650 .data
= &sysctl_udp_rmem_min
,
651 .maxlen
= sizeof(sysctl_udp_rmem_min
),
653 .proc_handler
= proc_dointvec_minmax
,
657 .procname
= "udp_wmem_min",
658 .data
= &sysctl_udp_wmem_min
,
659 .maxlen
= sizeof(sysctl_udp_wmem_min
),
661 .proc_handler
= proc_dointvec_minmax
,
/*
 * Per-network-namespace IPv4 sysctl entries.  As written here every .data
 * pointer refers to a field of init_net.ipv4; ipv4_sysctl_init_net() uses
 * this table directly for init_net and a kmemdup() copy of it for any other
 * namespace.
 *
 * NOTE(review): some lines of every entry (for example the enclosing
 * braces) are not present in this extract.
 */
667 static struct ctl_table ipv4_net_table
[] = {
669 .procname
= "icmp_echo_ignore_all",
670 .data
= &init_net
.ipv4
.sysctl_icmp_echo_ignore_all
,
671 .maxlen
= sizeof(int),
673 .proc_handler
= proc_dointvec
676 .procname
= "icmp_echo_ignore_broadcasts",
677 .data
= &init_net
.ipv4
.sysctl_icmp_echo_ignore_broadcasts
,
678 .maxlen
= sizeof(int),
680 .proc_handler
= proc_dointvec
683 .procname
= "icmp_ignore_bogus_error_responses",
684 .data
= &init_net
.ipv4
.sysctl_icmp_ignore_bogus_error_responses
,
685 .maxlen
= sizeof(int),
687 .proc_handler
= proc_dointvec
690 .procname
= "icmp_errors_use_inbound_ifaddr",
691 .data
= &init_net
.ipv4
.sysctl_icmp_errors_use_inbound_ifaddr
,
692 .maxlen
= sizeof(int),
694 .proc_handler
= proc_dointvec
697 .procname
= "icmp_ratelimit",
698 .data
= &init_net
.ipv4
.sysctl_icmp_ratelimit
,
699 .maxlen
= sizeof(int),
701 .proc_handler
= proc_dointvec_ms_jiffies
,
704 .procname
= "icmp_ratemask",
705 .data
= &init_net
.ipv4
.sysctl_icmp_ratemask
,
706 .maxlen
= sizeof(int),
708 .proc_handler
= proc_dointvec
711 .procname
= "rt_cache_rebuild_count",
712 .data
= &init_net
.ipv4
.sysctl_rt_cache_rebuild_count
,
713 .maxlen
= sizeof(int),
715 .proc_handler
= proc_dointvec
/* Uses the file-local handler ipv4_ping_group_range(). */
718 .procname
= "ping_group_range",
719 .data
= &init_net
.ipv4
.sysctl_ping_group_range
,
720 .maxlen
= sizeof(init_net
.ipv4
.sysctl_ping_group_range
),
722 .proc_handler
= ipv4_ping_group_range
,
/*
 * sysctl path with the components "net" and "ipv4".  It is the path under
 * which both ipv4_table and the per-namespace table are registered in this
 * file, and it is exported with EXPORT_SYMBOL_GPL.
 */
727 struct ctl_path net_ipv4_ctl_path
[] = {
728 { .procname
= "net", },
729 { .procname
= "ipv4", },
732 EXPORT_SYMBOL_GPL(net_ipv4_ctl_path
);
/*
 * Per-namespace setup of the IPv4 sysctl entries (the .init hook of
 * ipv4_sysctl_ops).
 *
 * init_net uses ipv4_net_table as is; any other namespace works on a
 * kmemdup() copy.  The function then sets the namespace defaults for
 * sysctl_ping_group_range and sysctl_rt_cache_rebuild_count, registers the
 * table under net_ipv4_ctl_path and keeps the returned header in
 * net->ipv4.ipv4_hdr.
 *
 * NOTE(review): the allocation check, the left-hand sides of the per-entry
 * assignments, the error labels and the return statements are not present
 * in this extract; the comments below cover only what is visible.
 */
734 static __net_init
int ipv4_sysctl_init_net(struct net
*net
)
736 struct ctl_table
*table
;
738 table
= ipv4_net_table
;
/* Namespaces other than init_net get their own copy of the table. */
739 if (!net_eq(net
, &init_net
)) {
740 table
= kmemdup(table
, sizeof(ipv4_net_table
), GFP_KERNEL
);
/*
 * Addresses of this namespace's own fields, listed in the same order as the
 * entries of ipv4_net_table; presumably each is stored in the matching
 * copied entry's .data (assignment targets not visible, TODO confirm).
 */
745 &net
->ipv4
.sysctl_icmp_echo_ignore_all
;
747 &net
->ipv4
.sysctl_icmp_echo_ignore_broadcasts
;
749 &net
->ipv4
.sysctl_icmp_ignore_bogus_error_responses
;
751 &net
->ipv4
.sysctl_icmp_errors_use_inbound_ifaddr
;
753 &net
->ipv4
.sysctl_icmp_ratelimit
;
755 &net
->ipv4
.sysctl_icmp_ratemask
;
757 &net
->ipv4
.sysctl_rt_cache_rebuild_count
;
759 &net
->ipv4
.sysctl_ping_group_range
;
764 * Sane defaults - nobody may create ping sockets.
765 * Boot scripts should set this to distro-specific group.
/* Default pair is { 1, 0 }: the first value is above the second. */
767 net
->ipv4
.sysctl_ping_group_range
[0] = 1;
768 net
->ipv4
.sysctl_ping_group_range
[1] = 0;
770 net
->ipv4
.sysctl_rt_cache_rebuild_count
= 4;
/* Register the table and remember the header for ipv4_sysctl_exit_net(). */
772 net
->ipv4
.ipv4_hdr
= register_net_sysctl_table(net
,
773 net_ipv4_ctl_path
, table
);
/* Registration failure: the statement taken here is not visible. */
774 if (net
->ipv4
.ipv4_hdr
== NULL
)
/*
 * Guard for non-init_net namespaces; presumably it protects the release of
 * the kmemdup() copy on the error path (guarded statement not visible,
 * TODO confirm).
 */
780 if (!net_eq(net
, &init_net
))
/*
 * Per-namespace teardown (the .exit hook of ipv4_sysctl_ops): unregisters
 * the sysctl header stored in net->ipv4.ipv4_hdr.
 *
 * NOTE(review): what is done with the saved table pointer afterwards is not
 * present in this extract; presumably the table is freed, TODO confirm.
 */
786 static __net_exit
void ipv4_sysctl_exit_net(struct net
*net
)
788 struct ctl_table
*table
;
/* Fetch the table pointer from the header before the header is unregistered. */
790 table
= net
->ipv4
.ipv4_hdr
->ctl_table_arg
;
791 unregister_net_sysctl_table(net
->ipv4
.ipv4_hdr
);
/*
 * Per-namespace hooks for the IPv4 sysctl entries; handed to
 * register_pernet_subsys() by sysctl_ipv4_init().
 */
795 static __net_initdata
struct pernet_operations ipv4_sysctl_ops
= {
796 .init
= ipv4_sysctl_init_net
,
797 .exit
= ipv4_sysctl_exit_net
,
/*
 * Boot-time setup, run through __initcall().
 *
 * Steps visible here: point the "ip_local_reserved_ports" entry of
 * ipv4_table at sysctl_local_reserved_ports, register ipv4_table under
 * net_ipv4_ctl_path, then register ipv4_sysctl_ops as a pernet subsystem.
 * If that last registration fails, the table registered just before is
 * unregistered again.
 *
 * NOTE(review): the declaration of i, the failure check on hdr, braces and
 * the return statements are not present in this extract.
 */
800 static __init
int sysctl_ipv4_init(void)
802 struct ctl_table_header
*hdr
;
/* Walk the entries until one with a NULL .procname is reached. */
805 for (i
= ipv4_table
; i
->procname
; i
++) {
806 if (strcmp(i
->procname
, "ip_local_reserved_ports") == 0) {
/* This entry's .data is NULL in the static initializer of ipv4_table. */
807 i
->data
= sysctl_local_reserved_ports
;
814 hdr
= register_sysctl_paths(net_ipv4_ctl_path
, ipv4_table
);
/* Undo the table registration if the pernet hooks cannot be registered. */
818 if (register_pernet_subsys(&ipv4_sysctl_ops
)) {
819 unregister_sysctl_table(hdr
);
826 __initcall(sysctl_ipv4_init
);