1 /* 2 * sysctl_net_ipv4.c: sysctl interface to net IPV4 subsystem. 3 * 4 * Begun April 1, 1996, Mike Shaver. 5 * Added /proc/sys/net/ipv4 directory entry (empty =) ). [MS] 6 */ 7 8 #include <linux/mm.h> 9 #include <linux/module.h> 10 #include <linux/sysctl.h> 11 #include <linux/igmp.h> 12 #include <linux/inetdevice.h> 13 #include <linux/seqlock.h> 14 #include <linux/init.h> 15 #include <linux/slab.h> 16 #include <linux/nsproxy.h> 17 #include <linux/swap.h> 18 #include <net/snmp.h> 19 #include <net/icmp.h> 20 #include <net/ip.h> 21 #include <net/route.h> 22 #include <net/tcp.h> 23 #include <net/udp.h> 24 #include <net/cipso_ipv4.h> 25 #include <net/inet_frag.h> 26 #include <net/ping.h> 27 #include <net/tcp_memcontrol.h> 28 29 static int zero; 30 static int one = 1; 31 static int four = 4; 32 static int gso_max_segs = GSO_MAX_SEGS; 33 static int tcp_retr1_max = 255; 34 static int ip_local_port_range_min[] = { 1, 1 }; 35 static int ip_local_port_range_max[] = { 65535, 65535 }; 36 static int tcp_adv_win_scale_min = -31; 37 static int tcp_adv_win_scale_max = 31; 38 static int ip_ttl_min = 1; 39 static int ip_ttl_max = 255; 40 static int tcp_syn_retries_min = 1; 41 static int tcp_syn_retries_max = MAX_TCP_SYNCNT; 42 static int ip_ping_group_range_min[] = { 0, 0 }; 43 static int ip_ping_group_range_max[] = { GID_T_MAX, GID_T_MAX }; 44 45 /* Update system visible IP port range */ 46 static void set_local_port_range(struct net *net, int range[2]) 47 { 48 write_seqlock(&net->ipv4.sysctl_local_ports.lock); 49 net->ipv4.sysctl_local_ports.range[0] = range[0]; 50 net->ipv4.sysctl_local_ports.range[1] = range[1]; 51 write_sequnlock(&net->ipv4.sysctl_local_ports.lock); 52 } 53 54 /* Validate changes from /proc interface. */ 55 static int ipv4_local_port_range(struct ctl_table *table, int write, 56 void __user *buffer, 57 size_t *lenp, loff_t *ppos) 58 { 59 struct net *net = 60 container_of(table->data, struct net, ipv4.sysctl_local_ports.range); 61 int ret; 62 int range[2]; 63 struct ctl_table tmp = { 64 .data = &range, 65 .maxlen = sizeof(range), 66 .mode = table->mode, 67 .extra1 = &ip_local_port_range_min, 68 .extra2 = &ip_local_port_range_max, 69 }; 70 71 inet_get_local_port_range(net, &range[0], &range[1]); 72 73 ret = proc_dointvec_minmax(&tmp, write, buffer, lenp, ppos); 74 75 if (write && ret == 0) { 76 if (range[1] < range[0]) 77 ret = -EINVAL; 78 else 79 set_local_port_range(net, range); 80 } 81 82 return ret; 83 } 84 85 86 static void inet_get_ping_group_range_table(struct ctl_table *table, kgid_t *low, kgid_t *high) 87 { 88 kgid_t *data = table->data; 89 struct net *net = 90 container_of(table->data, struct net, ipv4.sysctl_ping_group_range); 91 unsigned int seq; 92 do { 93 seq = read_seqbegin(&net->ipv4.sysctl_local_ports.lock); 94 95 *low = data[0]; 96 *high = data[1]; 97 } while (read_seqretry(&net->ipv4.sysctl_local_ports.lock, seq)); 98 } 99 100 /* Update system visible IP port range */ 101 static void set_ping_group_range(struct ctl_table *table, kgid_t low, kgid_t high) 102 { 103 kgid_t *data = table->data; 104 struct net *net = 105 container_of(table->data, struct net, ipv4.sysctl_ping_group_range); 106 write_seqlock(&net->ipv4.sysctl_local_ports.lock); 107 data[0] = low; 108 data[1] = high; 109 write_sequnlock(&net->ipv4.sysctl_local_ports.lock); 110 } 111 112 /* Validate changes from /proc interface. */ 113 static int ipv4_ping_group_range(struct ctl_table *table, int write, 114 void __user *buffer, 115 size_t *lenp, loff_t *ppos) 116 { 117 struct user_namespace *user_ns = current_user_ns(); 118 int ret; 119 gid_t urange[2]; 120 kgid_t low, high; 121 struct ctl_table tmp = { 122 .data = &urange, 123 .maxlen = sizeof(urange), 124 .mode = table->mode, 125 .extra1 = &ip_ping_group_range_min, 126 .extra2 = &ip_ping_group_range_max, 127 }; 128 129 inet_get_ping_group_range_table(table, &low, &high); 130 urange[0] = from_kgid_munged(user_ns, low); 131 urange[1] = from_kgid_munged(user_ns, high); 132 ret = proc_dointvec_minmax(&tmp, write, buffer, lenp, ppos); 133 134 if (write && ret == 0) { 135 low = make_kgid(user_ns, urange[0]); 136 high = make_kgid(user_ns, urange[1]); 137 if (!gid_valid(low) || !gid_valid(high) || 138 (urange[1] < urange[0]) || gid_lt(high, low)) { 139 low = make_kgid(&init_user_ns, 1); 140 high = make_kgid(&init_user_ns, 0); 141 } 142 set_ping_group_range(table, low, high); 143 } 144 145 return ret; 146 } 147 148 static int proc_tcp_congestion_control(struct ctl_table *ctl, int write, 149 void __user *buffer, size_t *lenp, loff_t *ppos) 150 { 151 char val[TCP_CA_NAME_MAX]; 152 struct ctl_table tbl = { 153 .data = val, 154 .maxlen = TCP_CA_NAME_MAX, 155 }; 156 int ret; 157 158 tcp_get_default_congestion_control(val); 159 160 ret = proc_dostring(&tbl, write, buffer, lenp, ppos); 161 if (write && ret == 0) 162 ret = tcp_set_default_congestion_control(val); 163 return ret; 164 } 165 166 static int proc_tcp_available_congestion_control(struct ctl_table *ctl, 167 int write, 168 void __user *buffer, size_t *lenp, 169 loff_t *ppos) 170 { 171 struct ctl_table tbl = { .maxlen = TCP_CA_BUF_MAX, }; 172 int ret; 173 174 tbl.data = kmalloc(tbl.maxlen, GFP_USER); 175 if (!tbl.data) 176 return -ENOMEM; 177 tcp_get_available_congestion_control(tbl.data, TCP_CA_BUF_MAX); 178 ret = proc_dostring(&tbl, write, buffer, lenp, ppos); 179 kfree(tbl.data); 180 return ret; 181 } 182 183 static int proc_allowed_congestion_control(struct ctl_table *ctl, 184 int write, 185 void __user *buffer, size_t *lenp, 186 loff_t *ppos) 187 { 188 struct ctl_table tbl = { .maxlen = TCP_CA_BUF_MAX }; 189 int ret; 190 191 tbl.data = kmalloc(tbl.maxlen, GFP_USER); 192 if (!tbl.data) 193 return -ENOMEM; 194 195 tcp_get_allowed_congestion_control(tbl.data, tbl.maxlen); 196 ret = proc_dostring(&tbl, write, buffer, lenp, ppos); 197 if (write && ret == 0) 198 ret = tcp_set_allowed_congestion_control(tbl.data); 199 kfree(tbl.data); 200 return ret; 201 } 202 203 static int ipv4_tcp_mem(struct ctl_table *ctl, int write, 204 void __user *buffer, size_t *lenp, 205 loff_t *ppos) 206 { 207 int ret; 208 unsigned long vec[3]; 209 struct net *net = current->nsproxy->net_ns; 210 #ifdef CONFIG_MEMCG_KMEM 211 struct mem_cgroup *memcg; 212 #endif 213 214 struct ctl_table tmp = { 215 .data = &vec, 216 .maxlen = sizeof(vec), 217 .mode = ctl->mode, 218 }; 219 220 if (!write) { 221 ctl->data = &net->ipv4.sysctl_tcp_mem; 222 return proc_doulongvec_minmax(ctl, write, buffer, lenp, ppos); 223 } 224 225 ret = proc_doulongvec_minmax(&tmp, write, buffer, lenp, ppos); 226 if (ret) 227 return ret; 228 229 #ifdef CONFIG_MEMCG_KMEM 230 rcu_read_lock(); 231 memcg = mem_cgroup_from_task(current); 232 233 tcp_prot_mem(memcg, vec[0], 0); 234 tcp_prot_mem(memcg, vec[1], 1); 235 tcp_prot_mem(memcg, vec[2], 2); 236 rcu_read_unlock(); 237 #endif 238 239 net->ipv4.sysctl_tcp_mem[0] = vec[0]; 240 net->ipv4.sysctl_tcp_mem[1] = vec[1]; 241 net->ipv4.sysctl_tcp_mem[2] = vec[2]; 242 243 return 0; 244 } 245 246 static int proc_tcp_fastopen_key(struct ctl_table *ctl, int write, 247 void __user *buffer, size_t *lenp, 248 loff_t *ppos) 249 { 250 struct ctl_table tbl = { .maxlen = (TCP_FASTOPEN_KEY_LENGTH * 2 + 10) }; 251 struct tcp_fastopen_context *ctxt; 252 int ret; 253 u32 user_key[4]; /* 16 bytes, matching TCP_FASTOPEN_KEY_LENGTH */ 254 255 tbl.data = kmalloc(tbl.maxlen, GFP_KERNEL); 256 if (!tbl.data) 257 return -ENOMEM; 258 259 rcu_read_lock(); 260 ctxt = rcu_dereference(tcp_fastopen_ctx); 261 if (ctxt) 262 memcpy(user_key, ctxt->key, TCP_FASTOPEN_KEY_LENGTH); 263 else 264 memset(user_key, 0, sizeof(user_key)); 265 rcu_read_unlock(); 266 267 snprintf(tbl.data, tbl.maxlen, "%08x-%08x-%08x-%08x", 268 user_key[0], user_key[1], user_key[2], user_key[3]); 269 ret = proc_dostring(&tbl, write, buffer, lenp, ppos); 270 271 if (write && ret == 0) { 272 if (sscanf(tbl.data, "%x-%x-%x-%x", user_key, user_key + 1, 273 user_key + 2, user_key + 3) != 4) { 274 ret = -EINVAL; 275 goto bad_key; 276 } 277 tcp_fastopen_reset_cipher(user_key, TCP_FASTOPEN_KEY_LENGTH); 278 } 279 280 bad_key: 281 pr_debug("proc FO key set 0x%x-%x-%x-%x <- 0x%s: %u\n", 282 user_key[0], user_key[1], user_key[2], user_key[3], 283 (char *)tbl.data, ret); 284 kfree(tbl.data); 285 return ret; 286 } 287 288 static struct ctl_table ipv4_table[] = { 289 { 290 .procname = "tcp_timestamps", 291 .data = &sysctl_tcp_timestamps, 292 .maxlen = sizeof(int), 293 .mode = 0644, 294 .proc_handler = proc_dointvec 295 }, 296 { 297 .procname = "tcp_window_scaling", 298 .data = &sysctl_tcp_window_scaling, 299 .maxlen = sizeof(int), 300 .mode = 0644, 301 .proc_handler = proc_dointvec 302 }, 303 { 304 .procname = "tcp_sack", 305 .data = &sysctl_tcp_sack, 306 .maxlen = sizeof(int), 307 .mode = 0644, 308 .proc_handler = proc_dointvec 309 }, 310 { 311 .procname = "tcp_retrans_collapse", 312 .data = &sysctl_tcp_retrans_collapse, 313 .maxlen = sizeof(int), 314 .mode = 0644, 315 .proc_handler = proc_dointvec 316 }, 317 { 318 .procname = "ip_default_ttl", 319 .data = &sysctl_ip_default_ttl, 320 .maxlen = sizeof(int), 321 .mode = 0644, 322 .proc_handler = proc_dointvec_minmax, 323 .extra1 = &ip_ttl_min, 324 .extra2 = &ip_ttl_max, 325 }, 326 { 327 .procname = "ip_no_pmtu_disc", 328 .data = &ipv4_config.no_pmtu_disc, 329 .maxlen = sizeof(int), 330 .mode = 0644, 331 .proc_handler = proc_dointvec 332 }, 333 { 334 .procname = "ip_nonlocal_bind", 335 .data = &sysctl_ip_nonlocal_bind, 336 .maxlen = sizeof(int), 337 .mode = 0644, 338 .proc_handler = proc_dointvec 339 }, 340 { 341 .procname = "tcp_syn_retries", 342 .data = &sysctl_tcp_syn_retries, 343 .maxlen = sizeof(int), 344 .mode = 0644, 345 .proc_handler = proc_dointvec_minmax, 346 .extra1 = &tcp_syn_retries_min, 347 .extra2 = &tcp_syn_retries_max 348 }, 349 { 350 .procname = "tcp_synack_retries", 351 .data = &sysctl_tcp_synack_retries, 352 .maxlen = sizeof(int), 353 .mode = 0644, 354 .proc_handler = proc_dointvec 355 }, 356 { 357 .procname = "tcp_max_orphans", 358 .data = &sysctl_tcp_max_orphans, 359 .maxlen = sizeof(int), 360 .mode = 0644, 361 .proc_handler = proc_dointvec 362 }, 363 { 364 .procname = "tcp_max_tw_buckets", 365 .data = &tcp_death_row.sysctl_max_tw_buckets, 366 .maxlen = sizeof(int), 367 .mode = 0644, 368 .proc_handler = proc_dointvec 369 }, 370 { 371 .procname = "ip_early_demux", 372 .data = &sysctl_ip_early_demux, 373 .maxlen = sizeof(int), 374 .mode = 0644, 375 .proc_handler = proc_dointvec 376 }, 377 { 378 .procname = "ip_dynaddr", 379 .data = &sysctl_ip_dynaddr, 380 .maxlen = sizeof(int), 381 .mode = 0644, 382 .proc_handler = proc_dointvec 383 }, 384 { 385 .procname = "tcp_keepalive_time", 386 .data = &sysctl_tcp_keepalive_time, 387 .maxlen = sizeof(int), 388 .mode = 0644, 389 .proc_handler = proc_dointvec_jiffies, 390 }, 391 { 392 .procname = "tcp_keepalive_probes", 393 .data = &sysctl_tcp_keepalive_probes, 394 .maxlen = sizeof(int), 395 .mode = 0644, 396 .proc_handler = proc_dointvec 397 }, 398 { 399 .procname = "tcp_keepalive_intvl", 400 .data = &sysctl_tcp_keepalive_intvl, 401 .maxlen = sizeof(int), 402 .mode = 0644, 403 .proc_handler = proc_dointvec_jiffies, 404 }, 405 { 406 .procname = "tcp_retries1", 407 .data = &sysctl_tcp_retries1, 408 .maxlen = sizeof(int), 409 .mode = 0644, 410 .proc_handler = proc_dointvec_minmax, 411 .extra2 = &tcp_retr1_max 412 }, 413 { 414 .procname = "tcp_retries2", 415 .data = &sysctl_tcp_retries2, 416 .maxlen = sizeof(int), 417 .mode = 0644, 418 .proc_handler = proc_dointvec 419 }, 420 { 421 .procname = "tcp_fin_timeout", 422 .data = &sysctl_tcp_fin_timeout, 423 .maxlen = sizeof(int), 424 .mode = 0644, 425 .proc_handler = proc_dointvec_jiffies, 426 }, 427 #ifdef CONFIG_SYN_COOKIES 428 { 429 .procname = "tcp_syncookies", 430 .data = &sysctl_tcp_syncookies, 431 .maxlen = sizeof(int), 432 .mode = 0644, 433 .proc_handler = proc_dointvec 434 }, 435 #endif 436 { 437 .procname = "tcp_fastopen", 438 .data = &sysctl_tcp_fastopen, 439 .maxlen = sizeof(int), 440 .mode = 0644, 441 .proc_handler = proc_dointvec, 442 }, 443 { 444 .procname = "tcp_fastopen_key", 445 .mode = 0600, 446 .maxlen = ((TCP_FASTOPEN_KEY_LENGTH * 2) + 10), 447 .proc_handler = proc_tcp_fastopen_key, 448 }, 449 { 450 .procname = "tcp_tw_recycle", 451 .data = &tcp_death_row.sysctl_tw_recycle, 452 .maxlen = sizeof(int), 453 .mode = 0644, 454 .proc_handler = proc_dointvec 455 }, 456 { 457 .procname = "tcp_abort_on_overflow", 458 .data = &sysctl_tcp_abort_on_overflow, 459 .maxlen = sizeof(int), 460 .mode = 0644, 461 .proc_handler = proc_dointvec 462 }, 463 { 464 .procname = "tcp_stdurg", 465 .data = &sysctl_tcp_stdurg, 466 .maxlen = sizeof(int), 467 .mode = 0644, 468 .proc_handler = proc_dointvec 469 }, 470 { 471 .procname = "tcp_rfc1337", 472 .data = &sysctl_tcp_rfc1337, 473 .maxlen = sizeof(int), 474 .mode = 0644, 475 .proc_handler = proc_dointvec 476 }, 477 { 478 .procname = "tcp_max_syn_backlog", 479 .data = &sysctl_max_syn_backlog, 480 .maxlen = sizeof(int), 481 .mode = 0644, 482 .proc_handler = proc_dointvec 483 }, 484 { 485 .procname = "ip_local_reserved_ports", 486 .data = NULL, /* initialized in sysctl_ipv4_init */ 487 .maxlen = 65536, 488 .mode = 0644, 489 .proc_handler = proc_do_large_bitmap, 490 }, 491 { 492 .procname = "igmp_max_memberships", 493 .data = &sysctl_igmp_max_memberships, 494 .maxlen = sizeof(int), 495 .mode = 0644, 496 .proc_handler = proc_dointvec 497 }, 498 { 499 .procname = "igmp_max_msf", 500 .data = &sysctl_igmp_max_msf, 501 .maxlen = sizeof(int), 502 .mode = 0644, 503 .proc_handler = proc_dointvec 504 }, 505 { 506 .procname = "inet_peer_threshold", 507 .data = &inet_peer_threshold, 508 .maxlen = sizeof(int), 509 .mode = 0644, 510 .proc_handler = proc_dointvec 511 }, 512 { 513 .procname = "inet_peer_minttl", 514 .data = &inet_peer_minttl, 515 .maxlen = sizeof(int), 516 .mode = 0644, 517 .proc_handler = proc_dointvec_jiffies, 518 }, 519 { 520 .procname = "inet_peer_maxttl", 521 .data = &inet_peer_maxttl, 522 .maxlen = sizeof(int), 523 .mode = 0644, 524 .proc_handler = proc_dointvec_jiffies, 525 }, 526 { 527 .procname = "tcp_orphan_retries", 528 .data = &sysctl_tcp_orphan_retries, 529 .maxlen = sizeof(int), 530 .mode = 0644, 531 .proc_handler = proc_dointvec 532 }, 533 { 534 .procname = "tcp_fack", 535 .data = &sysctl_tcp_fack, 536 .maxlen = sizeof(int), 537 .mode = 0644, 538 .proc_handler = proc_dointvec 539 }, 540 { 541 .procname = "tcp_reordering", 542 .data = &sysctl_tcp_reordering, 543 .maxlen = sizeof(int), 544 .mode = 0644, 545 .proc_handler = proc_dointvec 546 }, 547 { 548 .procname = "tcp_dsack", 549 .data = &sysctl_tcp_dsack, 550 .maxlen = sizeof(int), 551 .mode = 0644, 552 .proc_handler = proc_dointvec 553 }, 554 { 555 .procname = "tcp_wmem", 556 .data = &sysctl_tcp_wmem, 557 .maxlen = sizeof(sysctl_tcp_wmem), 558 .mode = 0644, 559 .proc_handler = proc_dointvec_minmax, 560 .extra1 = &one, 561 }, 562 { 563 .procname = "tcp_notsent_lowat", 564 .data = &sysctl_tcp_notsent_lowat, 565 .maxlen = sizeof(sysctl_tcp_notsent_lowat), 566 .mode = 0644, 567 .proc_handler = proc_dointvec, 568 }, 569 { 570 .procname = "tcp_rmem", 571 .data = &sysctl_tcp_rmem, 572 .maxlen = sizeof(sysctl_tcp_rmem), 573 .mode = 0644, 574 .proc_handler = proc_dointvec_minmax, 575 .extra1 = &one, 576 }, 577 { 578 .procname = "tcp_app_win", 579 .data = &sysctl_tcp_app_win, 580 .maxlen = sizeof(int), 581 .mode = 0644, 582 .proc_handler = proc_dointvec 583 }, 584 { 585 .procname = "tcp_adv_win_scale", 586 .data = &sysctl_tcp_adv_win_scale, 587 .maxlen = sizeof(int), 588 .mode = 0644, 589 .proc_handler = proc_dointvec_minmax, 590 .extra1 = &tcp_adv_win_scale_min, 591 .extra2 = &tcp_adv_win_scale_max, 592 }, 593 { 594 .procname = "tcp_tw_reuse", 595 .data = &sysctl_tcp_tw_reuse, 596 .maxlen = sizeof(int), 597 .mode = 0644, 598 .proc_handler = proc_dointvec 599 }, 600 { 601 .procname = "tcp_frto", 602 .data = &sysctl_tcp_frto, 603 .maxlen = sizeof(int), 604 .mode = 0644, 605 .proc_handler = proc_dointvec 606 }, 607 { 608 .procname = "tcp_low_latency", 609 .data = &sysctl_tcp_low_latency, 610 .maxlen = sizeof(int), 611 .mode = 0644, 612 .proc_handler = proc_dointvec 613 }, 614 { 615 .procname = "tcp_no_metrics_save", 616 .data = &sysctl_tcp_nometrics_save, 617 .maxlen = sizeof(int), 618 .mode = 0644, 619 .proc_handler = proc_dointvec, 620 }, 621 { 622 .procname = "tcp_moderate_rcvbuf", 623 .data = &sysctl_tcp_moderate_rcvbuf, 624 .maxlen = sizeof(int), 625 .mode = 0644, 626 .proc_handler = proc_dointvec, 627 }, 628 { 629 .procname = "tcp_tso_win_divisor", 630 .data = &sysctl_tcp_tso_win_divisor, 631 .maxlen = sizeof(int), 632 .mode = 0644, 633 .proc_handler = proc_dointvec, 634 }, 635 { 636 .procname = "tcp_congestion_control", 637 .mode = 0644, 638 .maxlen = TCP_CA_NAME_MAX, 639 .proc_handler = proc_tcp_congestion_control, 640 }, 641 { 642 .procname = "tcp_mtu_probing", 643 .data = &sysctl_tcp_mtu_probing, 644 .maxlen = sizeof(int), 645 .mode = 0644, 646 .proc_handler = proc_dointvec, 647 }, 648 { 649 .procname = "tcp_base_mss", 650 .data = &sysctl_tcp_base_mss, 651 .maxlen = sizeof(int), 652 .mode = 0644, 653 .proc_handler = proc_dointvec, 654 }, 655 { 656 .procname = "tcp_workaround_signed_windows", 657 .data = &sysctl_tcp_workaround_signed_windows, 658 .maxlen = sizeof(int), 659 .mode = 0644, 660 .proc_handler = proc_dointvec 661 }, 662 { 663 .procname = "tcp_limit_output_bytes", 664 .data = &sysctl_tcp_limit_output_bytes, 665 .maxlen = sizeof(int), 666 .mode = 0644, 667 .proc_handler = proc_dointvec 668 }, 669 { 670 .procname = "tcp_challenge_ack_limit", 671 .data = &sysctl_tcp_challenge_ack_limit, 672 .maxlen = sizeof(int), 673 .mode = 0644, 674 .proc_handler = proc_dointvec 675 }, 676 #ifdef CONFIG_NET_DMA 677 { 678 .procname = "tcp_dma_copybreak", 679 .data = &sysctl_tcp_dma_copybreak, 680 .maxlen = sizeof(int), 681 .mode = 0644, 682 .proc_handler = proc_dointvec 683 }, 684 #endif 685 { 686 .procname = "tcp_slow_start_after_idle", 687 .data = &sysctl_tcp_slow_start_after_idle, 688 .maxlen = sizeof(int), 689 .mode = 0644, 690 .proc_handler = proc_dointvec 691 }, 692 #ifdef CONFIG_NETLABEL 693 { 694 .procname = "cipso_cache_enable", 695 .data = &cipso_v4_cache_enabled, 696 .maxlen = sizeof(int), 697 .mode = 0644, 698 .proc_handler = proc_dointvec, 699 }, 700 { 701 .procname = "cipso_cache_bucket_size", 702 .data = &cipso_v4_cache_bucketsize, 703 .maxlen = sizeof(int), 704 .mode = 0644, 705 .proc_handler = proc_dointvec, 706 }, 707 { 708 .procname = "cipso_rbm_optfmt", 709 .data = &cipso_v4_rbm_optfmt, 710 .maxlen = sizeof(int), 711 .mode = 0644, 712 .proc_handler = proc_dointvec, 713 }, 714 { 715 .procname = "cipso_rbm_strictvalid", 716 .data = &cipso_v4_rbm_strictvalid, 717 .maxlen = sizeof(int), 718 .mode = 0644, 719 .proc_handler = proc_dointvec, 720 }, 721 #endif /* CONFIG_NETLABEL */ 722 { 723 .procname = "tcp_available_congestion_control", 724 .maxlen = TCP_CA_BUF_MAX, 725 .mode = 0444, 726 .proc_handler = proc_tcp_available_congestion_control, 727 }, 728 { 729 .procname = "tcp_allowed_congestion_control", 730 .maxlen = TCP_CA_BUF_MAX, 731 .mode = 0644, 732 .proc_handler = proc_allowed_congestion_control, 733 }, 734 { 735 .procname = "tcp_max_ssthresh", 736 .data = &sysctl_tcp_max_ssthresh, 737 .maxlen = sizeof(int), 738 .mode = 0644, 739 .proc_handler = proc_dointvec, 740 }, 741 { 742 .procname = "tcp_thin_linear_timeouts", 743 .data = &sysctl_tcp_thin_linear_timeouts, 744 .maxlen = sizeof(int), 745 .mode = 0644, 746 .proc_handler = proc_dointvec 747 }, 748 { 749 .procname = "tcp_thin_dupack", 750 .data = &sysctl_tcp_thin_dupack, 751 .maxlen = sizeof(int), 752 .mode = 0644, 753 .proc_handler = proc_dointvec 754 }, 755 { 756 .procname = "tcp_early_retrans", 757 .data = &sysctl_tcp_early_retrans, 758 .maxlen = sizeof(int), 759 .mode = 0644, 760 .proc_handler = proc_dointvec_minmax, 761 .extra1 = &zero, 762 .extra2 = &four, 763 }, 764 { 765 .procname = "tcp_min_tso_segs", 766 .data = &sysctl_tcp_min_tso_segs, 767 .maxlen = sizeof(int), 768 .mode = 0644, 769 .proc_handler = proc_dointvec_minmax, 770 .extra1 = &zero, 771 .extra2 = &gso_max_segs, 772 }, 773 { 774 .procname = "udp_mem", 775 .data = &sysctl_udp_mem, 776 .maxlen = sizeof(sysctl_udp_mem), 777 .mode = 0644, 778 .proc_handler = proc_doulongvec_minmax, 779 }, 780 { 781 .procname = "udp_rmem_min", 782 .data = &sysctl_udp_rmem_min, 783 .maxlen = sizeof(sysctl_udp_rmem_min), 784 .mode = 0644, 785 .proc_handler = proc_dointvec_minmax, 786 .extra1 = &one 787 }, 788 { 789 .procname = "udp_wmem_min", 790 .data = &sysctl_udp_wmem_min, 791 .maxlen = sizeof(sysctl_udp_wmem_min), 792 .mode = 0644, 793 .proc_handler = proc_dointvec_minmax, 794 .extra1 = &one 795 }, 796 { } 797 }; 798 799 static struct ctl_table ipv4_net_table[] = { 800 { 801 .procname = "icmp_echo_ignore_all", 802 .data = &init_net.ipv4.sysctl_icmp_echo_ignore_all, 803 .maxlen = sizeof(int), 804 .mode = 0644, 805 .proc_handler = proc_dointvec 806 }, 807 { 808 .procname = "icmp_echo_ignore_broadcasts", 809 .data = &init_net.ipv4.sysctl_icmp_echo_ignore_broadcasts, 810 .maxlen = sizeof(int), 811 .mode = 0644, 812 .proc_handler = proc_dointvec 813 }, 814 { 815 .procname = "icmp_ignore_bogus_error_responses", 816 .data = &init_net.ipv4.sysctl_icmp_ignore_bogus_error_responses, 817 .maxlen = sizeof(int), 818 .mode = 0644, 819 .proc_handler = proc_dointvec 820 }, 821 { 822 .procname = "icmp_errors_use_inbound_ifaddr", 823 .data = &init_net.ipv4.sysctl_icmp_errors_use_inbound_ifaddr, 824 .maxlen = sizeof(int), 825 .mode = 0644, 826 .proc_handler = proc_dointvec 827 }, 828 { 829 .procname = "icmp_ratelimit", 830 .data = &init_net.ipv4.sysctl_icmp_ratelimit, 831 .maxlen = sizeof(int), 832 .mode = 0644, 833 .proc_handler = proc_dointvec_ms_jiffies, 834 }, 835 { 836 .procname = "icmp_ratemask", 837 .data = &init_net.ipv4.sysctl_icmp_ratemask, 838 .maxlen = sizeof(int), 839 .mode = 0644, 840 .proc_handler = proc_dointvec 841 }, 842 { 843 .procname = "ping_group_range", 844 .data = &init_net.ipv4.sysctl_ping_group_range, 845 .maxlen = sizeof(gid_t)*2, 846 .mode = 0644, 847 .proc_handler = ipv4_ping_group_range, 848 }, 849 { 850 .procname = "tcp_ecn", 851 .data = &init_net.ipv4.sysctl_tcp_ecn, 852 .maxlen = sizeof(int), 853 .mode = 0644, 854 .proc_handler = proc_dointvec 855 }, 856 { 857 .procname = "ip_local_port_range", 858 .maxlen = sizeof(init_net.ipv4.sysctl_local_ports.range), 859 .data = &init_net.ipv4.sysctl_local_ports.range, 860 .mode = 0644, 861 .proc_handler = ipv4_local_port_range, 862 }, 863 { 864 .procname = "tcp_mem", 865 .maxlen = sizeof(init_net.ipv4.sysctl_tcp_mem), 866 .mode = 0644, 867 .proc_handler = ipv4_tcp_mem, 868 }, 869 { } 870 }; 871 872 static __net_init int ipv4_sysctl_init_net(struct net *net) 873 { 874 struct ctl_table *table; 875 876 table = ipv4_net_table; 877 if (!net_eq(net, &init_net)) { 878 table = kmemdup(table, sizeof(ipv4_net_table), GFP_KERNEL); 879 if (table == NULL) 880 goto err_alloc; 881 882 table[0].data = 883 &net->ipv4.sysctl_icmp_echo_ignore_all; 884 table[1].data = 885 &net->ipv4.sysctl_icmp_echo_ignore_broadcasts; 886 table[2].data = 887 &net->ipv4.sysctl_icmp_ignore_bogus_error_responses; 888 table[3].data = 889 &net->ipv4.sysctl_icmp_errors_use_inbound_ifaddr; 890 table[4].data = 891 &net->ipv4.sysctl_icmp_ratelimit; 892 table[5].data = 893 &net->ipv4.sysctl_icmp_ratemask; 894 table[6].data = 895 &net->ipv4.sysctl_ping_group_range; 896 table[7].data = 897 &net->ipv4.sysctl_tcp_ecn; 898 table[8].data = 899 &net->ipv4.sysctl_local_ports.range; 900 901 /* Don't export sysctls to unprivileged users */ 902 if (net->user_ns != &init_user_ns) 903 table[0].procname = NULL; 904 } 905 906 /* 907 * Sane defaults - nobody may create ping sockets. 908 * Boot scripts should set this to distro-specific group. 909 */ 910 net->ipv4.sysctl_ping_group_range[0] = make_kgid(&init_user_ns, 1); 911 net->ipv4.sysctl_ping_group_range[1] = make_kgid(&init_user_ns, 0); 912 913 /* 914 * Set defaults for local port range 915 */ 916 seqlock_init(&net->ipv4.sysctl_local_ports.lock); 917 net->ipv4.sysctl_local_ports.range[0] = 32768; 918 net->ipv4.sysctl_local_ports.range[1] = 61000; 919 920 tcp_init_mem(net); 921 922 net->ipv4.ipv4_hdr = register_net_sysctl(net, "net/ipv4", table); 923 if (net->ipv4.ipv4_hdr == NULL) 924 goto err_reg; 925 926 return 0; 927 928 err_reg: 929 if (!net_eq(net, &init_net)) 930 kfree(table); 931 err_alloc: 932 return -ENOMEM; 933 } 934 935 static __net_exit void ipv4_sysctl_exit_net(struct net *net) 936 { 937 struct ctl_table *table; 938 939 table = net->ipv4.ipv4_hdr->ctl_table_arg; 940 unregister_net_sysctl_table(net->ipv4.ipv4_hdr); 941 kfree(table); 942 } 943 944 static __net_initdata struct pernet_operations ipv4_sysctl_ops = { 945 .init = ipv4_sysctl_init_net, 946 .exit = ipv4_sysctl_exit_net, 947 }; 948 949 static __init int sysctl_ipv4_init(void) 950 { 951 struct ctl_table_header *hdr; 952 struct ctl_table *i; 953 954 for (i = ipv4_table; i->procname; i++) { 955 if (strcmp(i->procname, "ip_local_reserved_ports") == 0) { 956 i->data = sysctl_local_reserved_ports; 957 break; 958 } 959 } 960 if (!i->procname) 961 return -EINVAL; 962 963 hdr = register_net_sysctl(&init_net, "net/ipv4", ipv4_table); 964 if (hdr == NULL) 965 return -ENOMEM; 966 967 if (register_pernet_subsys(&ipv4_sysctl_ops)) { 968 unregister_net_sysctl_table(hdr); 969 return -ENOMEM; 970 } 971 972 return 0; 973 } 974 975 __initcall(sysctl_ipv4_init); 976