sysctl_net_ipv4.c 22 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938
  1. /*
  2. * sysctl_net_ipv4.c: sysctl interface to net IPV4 subsystem.
  3. *
  4. * Begun April 1, 1996, Mike Shaver.
  5. * Added /proc/sys/net/ipv4 directory entry (empty =) ). [MS]
  6. */
  7. #include <linux/mm.h>
  8. #include <linux/module.h>
  9. #include <linux/sysctl.h>
  10. #include <linux/igmp.h>
  11. #include <linux/inetdevice.h>
  12. #include <linux/seqlock.h>
  13. #include <linux/init.h>
  14. #include <linux/slab.h>
  15. #include <linux/nsproxy.h>
  16. #include <linux/swap.h>
  17. #include <net/snmp.h>
  18. #include <net/icmp.h>
  19. #include <net/ip.h>
  20. #include <net/route.h>
  21. #include <net/tcp.h>
  22. #include <net/udp.h>
  23. #include <net/cipso_ipv4.h>
  24. #include <net/inet_frag.h>
  25. #include <net/ping.h>
  26. #include <net/tcp_memcontrol.h>
  27. static int zero;
  28. static int one = 1;
  29. static int four = 4;
  30. static int tcp_retr1_max = 255;
  31. static int ip_local_port_range_min[] = { 1, 1 };
  32. static int ip_local_port_range_max[] = { 65535, 65535 };
  33. static int tcp_adv_win_scale_min = -31;
  34. static int tcp_adv_win_scale_max = 31;
  35. static int ip_ttl_min = 1;
  36. static int ip_ttl_max = 255;
  37. static int ip_ping_group_range_min[] = { 0, 0 };
  38. static int ip_ping_group_range_max[] = { GID_T_MAX, GID_T_MAX };
  39. /* Update system visible IP port range */
  40. static void set_local_port_range(int range[2])
  41. {
  42. write_seqlock(&sysctl_local_ports.lock);
  43. sysctl_local_ports.range[0] = range[0];
  44. sysctl_local_ports.range[1] = range[1];
  45. write_sequnlock(&sysctl_local_ports.lock);
  46. }
  47. /* Validate changes from /proc interface. */
  48. static int ipv4_local_port_range(struct ctl_table *table, int write,
  49. void __user *buffer,
  50. size_t *lenp, loff_t *ppos)
  51. {
  52. int ret;
  53. int range[2];
  54. struct ctl_table tmp = {
  55. .data = &range,
  56. .maxlen = sizeof(range),
  57. .mode = table->mode,
  58. .extra1 = &ip_local_port_range_min,
  59. .extra2 = &ip_local_port_range_max,
  60. };
  61. inet_get_local_port_range(range, range + 1);
  62. ret = proc_dointvec_minmax(&tmp, write, buffer, lenp, ppos);
  63. if (write && ret == 0) {
  64. if (range[1] < range[0])
  65. ret = -EINVAL;
  66. else
  67. set_local_port_range(range);
  68. }
  69. return ret;
  70. }
  71. static void inet_get_ping_group_range_table(struct ctl_table *table, kgid_t *low, kgid_t *high)
  72. {
  73. kgid_t *data = table->data;
  74. unsigned int seq;
  75. do {
  76. seq = read_seqbegin(&sysctl_local_ports.lock);
  77. *low = data[0];
  78. *high = data[1];
  79. } while (read_seqretry(&sysctl_local_ports.lock, seq));
  80. }
  81. /* Update system visible IP port range */
  82. static void set_ping_group_range(struct ctl_table *table, kgid_t low, kgid_t high)
  83. {
  84. kgid_t *data = table->data;
  85. write_seqlock(&sysctl_local_ports.lock);
  86. data[0] = low;
  87. data[1] = high;
  88. write_sequnlock(&sysctl_local_ports.lock);
  89. }
  90. /* Validate changes from /proc interface. */
  91. static int ipv4_ping_group_range(struct ctl_table *table, int write,
  92. void __user *buffer,
  93. size_t *lenp, loff_t *ppos)
  94. {
  95. struct user_namespace *user_ns = current_user_ns();
  96. int ret;
  97. gid_t urange[2];
  98. kgid_t low, high;
  99. struct ctl_table tmp = {
  100. .data = &urange,
  101. .maxlen = sizeof(urange),
  102. .mode = table->mode,
  103. .extra1 = &ip_ping_group_range_min,
  104. .extra2 = &ip_ping_group_range_max,
  105. };
  106. inet_get_ping_group_range_table(table, &low, &high);
  107. urange[0] = from_kgid_munged(user_ns, low);
  108. urange[1] = from_kgid_munged(user_ns, high);
  109. ret = proc_dointvec_minmax(&tmp, write, buffer, lenp, ppos);
  110. if (write && ret == 0) {
  111. low = make_kgid(user_ns, urange[0]);
  112. high = make_kgid(user_ns, urange[1]);
  113. if (!gid_valid(low) || !gid_valid(high) ||
  114. (urange[1] < urange[0]) || gid_lt(high, low)) {
  115. low = make_kgid(&init_user_ns, 1);
  116. high = make_kgid(&init_user_ns, 0);
  117. }
  118. set_ping_group_range(table, low, high);
  119. }
  120. return ret;
  121. }
  122. static int proc_tcp_congestion_control(struct ctl_table *ctl, int write,
  123. void __user *buffer, size_t *lenp, loff_t *ppos)
  124. {
  125. char val[TCP_CA_NAME_MAX];
  126. struct ctl_table tbl = {
  127. .data = val,
  128. .maxlen = TCP_CA_NAME_MAX,
  129. };
  130. int ret;
  131. tcp_get_default_congestion_control(val);
  132. ret = proc_dostring(&tbl, write, buffer, lenp, ppos);
  133. if (write && ret == 0)
  134. ret = tcp_set_default_congestion_control(val);
  135. return ret;
  136. }
  137. static int proc_tcp_available_congestion_control(struct ctl_table *ctl,
  138. int write,
  139. void __user *buffer, size_t *lenp,
  140. loff_t *ppos)
  141. {
  142. struct ctl_table tbl = { .maxlen = TCP_CA_BUF_MAX, };
  143. int ret;
  144. tbl.data = kmalloc(tbl.maxlen, GFP_USER);
  145. if (!tbl.data)
  146. return -ENOMEM;
  147. tcp_get_available_congestion_control(tbl.data, TCP_CA_BUF_MAX);
  148. ret = proc_dostring(&tbl, write, buffer, lenp, ppos);
  149. kfree(tbl.data);
  150. return ret;
  151. }
  152. static int proc_allowed_congestion_control(struct ctl_table *ctl,
  153. int write,
  154. void __user *buffer, size_t *lenp,
  155. loff_t *ppos)
  156. {
  157. struct ctl_table tbl = { .maxlen = TCP_CA_BUF_MAX };
  158. int ret;
  159. tbl.data = kmalloc(tbl.maxlen, GFP_USER);
  160. if (!tbl.data)
  161. return -ENOMEM;
  162. tcp_get_allowed_congestion_control(tbl.data, tbl.maxlen);
  163. ret = proc_dostring(&tbl, write, buffer, lenp, ppos);
  164. if (write && ret == 0)
  165. ret = tcp_set_allowed_congestion_control(tbl.data);
  166. kfree(tbl.data);
  167. return ret;
  168. }
  169. static int ipv4_tcp_mem(struct ctl_table *ctl, int write,
  170. void __user *buffer, size_t *lenp,
  171. loff_t *ppos)
  172. {
  173. int ret;
  174. unsigned long vec[3];
  175. struct net *net = current->nsproxy->net_ns;
  176. #ifdef CONFIG_MEMCG_KMEM
  177. struct mem_cgroup *memcg;
  178. #endif
  179. struct ctl_table tmp = {
  180. .data = &vec,
  181. .maxlen = sizeof(vec),
  182. .mode = ctl->mode,
  183. };
  184. if (!write) {
  185. ctl->data = &net->ipv4.sysctl_tcp_mem;
  186. return proc_doulongvec_minmax(ctl, write, buffer, lenp, ppos);
  187. }
  188. ret = proc_doulongvec_minmax(&tmp, write, buffer, lenp, ppos);
  189. if (ret)
  190. return ret;
  191. #ifdef CONFIG_MEMCG_KMEM
  192. rcu_read_lock();
  193. memcg = mem_cgroup_from_task(current);
  194. tcp_prot_mem(memcg, vec[0], 0);
  195. tcp_prot_mem(memcg, vec[1], 1);
  196. tcp_prot_mem(memcg, vec[2], 2);
  197. rcu_read_unlock();
  198. #endif
  199. net->ipv4.sysctl_tcp_mem[0] = vec[0];
  200. net->ipv4.sysctl_tcp_mem[1] = vec[1];
  201. net->ipv4.sysctl_tcp_mem[2] = vec[2];
  202. return 0;
  203. }
  204. static int proc_tcp_fastopen_key(struct ctl_table *ctl, int write,
  205. void __user *buffer, size_t *lenp,
  206. loff_t *ppos)
  207. {
  208. struct ctl_table tbl = { .maxlen = (TCP_FASTOPEN_KEY_LENGTH * 2 + 10) };
  209. struct tcp_fastopen_context *ctxt;
  210. int ret;
  211. u32 user_key[4]; /* 16 bytes, matching TCP_FASTOPEN_KEY_LENGTH */
  212. tbl.data = kmalloc(tbl.maxlen, GFP_KERNEL);
  213. if (!tbl.data)
  214. return -ENOMEM;
  215. rcu_read_lock();
  216. ctxt = rcu_dereference(tcp_fastopen_ctx);
  217. if (ctxt)
  218. memcpy(user_key, ctxt->key, TCP_FASTOPEN_KEY_LENGTH);
  219. else
  220. memset(user_key, 0, sizeof(user_key));
  221. rcu_read_unlock();
  222. snprintf(tbl.data, tbl.maxlen, "%08x-%08x-%08x-%08x",
  223. user_key[0], user_key[1], user_key[2], user_key[3]);
  224. ret = proc_dostring(&tbl, write, buffer, lenp, ppos);
  225. if (write && ret == 0) {
  226. if (sscanf(tbl.data, "%x-%x-%x-%x", user_key, user_key + 1,
  227. user_key + 2, user_key + 3) != 4) {
  228. ret = -EINVAL;
  229. goto bad_key;
  230. }
  231. tcp_fastopen_reset_cipher(user_key, TCP_FASTOPEN_KEY_LENGTH);
  232. }
  233. bad_key:
  234. pr_debug("proc FO key set 0x%x-%x-%x-%x <- 0x%s: %u\n",
  235. user_key[0], user_key[1], user_key[2], user_key[3],
  236. (char *)tbl.data, ret);
  237. kfree(tbl.data);
  238. return ret;
  239. }
  240. static struct ctl_table ipv4_table[] = {
  241. {
  242. .procname = "tcp_timestamps",
  243. .data = &sysctl_tcp_timestamps,
  244. .maxlen = sizeof(int),
  245. .mode = 0644,
  246. .proc_handler = proc_dointvec
  247. },
  248. {
  249. .procname = "tcp_window_scaling",
  250. .data = &sysctl_tcp_window_scaling,
  251. .maxlen = sizeof(int),
  252. .mode = 0644,
  253. .proc_handler = proc_dointvec
  254. },
  255. {
  256. .procname = "tcp_sack",
  257. .data = &sysctl_tcp_sack,
  258. .maxlen = sizeof(int),
  259. .mode = 0644,
  260. .proc_handler = proc_dointvec
  261. },
  262. {
  263. .procname = "tcp_retrans_collapse",
  264. .data = &sysctl_tcp_retrans_collapse,
  265. .maxlen = sizeof(int),
  266. .mode = 0644,
  267. .proc_handler = proc_dointvec
  268. },
  269. {
  270. .procname = "ip_default_ttl",
  271. .data = &sysctl_ip_default_ttl,
  272. .maxlen = sizeof(int),
  273. .mode = 0644,
  274. .proc_handler = proc_dointvec_minmax,
  275. .extra1 = &ip_ttl_min,
  276. .extra2 = &ip_ttl_max,
  277. },
  278. {
  279. .procname = "ip_no_pmtu_disc",
  280. .data = &ipv4_config.no_pmtu_disc,
  281. .maxlen = sizeof(int),
  282. .mode = 0644,
  283. .proc_handler = proc_dointvec
  284. },
  285. {
  286. .procname = "ip_nonlocal_bind",
  287. .data = &sysctl_ip_nonlocal_bind,
  288. .maxlen = sizeof(int),
  289. .mode = 0644,
  290. .proc_handler = proc_dointvec
  291. },
  292. {
  293. .procname = "tcp_syn_retries",
  294. .data = &sysctl_tcp_syn_retries,
  295. .maxlen = sizeof(int),
  296. .mode = 0644,
  297. .proc_handler = proc_dointvec
  298. },
  299. {
  300. .procname = "tcp_synack_retries",
  301. .data = &sysctl_tcp_synack_retries,
  302. .maxlen = sizeof(int),
  303. .mode = 0644,
  304. .proc_handler = proc_dointvec
  305. },
  306. {
  307. .procname = "tcp_max_orphans",
  308. .data = &sysctl_tcp_max_orphans,
  309. .maxlen = sizeof(int),
  310. .mode = 0644,
  311. .proc_handler = proc_dointvec
  312. },
  313. {
  314. .procname = "tcp_max_tw_buckets",
  315. .data = &tcp_death_row.sysctl_max_tw_buckets,
  316. .maxlen = sizeof(int),
  317. .mode = 0644,
  318. .proc_handler = proc_dointvec
  319. },
  320. {
  321. .procname = "ip_early_demux",
  322. .data = &sysctl_ip_early_demux,
  323. .maxlen = sizeof(int),
  324. .mode = 0644,
  325. .proc_handler = proc_dointvec
  326. },
  327. {
  328. .procname = "ip_dynaddr",
  329. .data = &sysctl_ip_dynaddr,
  330. .maxlen = sizeof(int),
  331. .mode = 0644,
  332. .proc_handler = proc_dointvec
  333. },
  334. {
  335. .procname = "tcp_keepalive_time",
  336. .data = &sysctl_tcp_keepalive_time,
  337. .maxlen = sizeof(int),
  338. .mode = 0644,
  339. .proc_handler = proc_dointvec_jiffies,
  340. },
  341. {
  342. .procname = "tcp_keepalive_probes",
  343. .data = &sysctl_tcp_keepalive_probes,
  344. .maxlen = sizeof(int),
  345. .mode = 0644,
  346. .proc_handler = proc_dointvec
  347. },
  348. {
  349. .procname = "tcp_keepalive_intvl",
  350. .data = &sysctl_tcp_keepalive_intvl,
  351. .maxlen = sizeof(int),
  352. .mode = 0644,
  353. .proc_handler = proc_dointvec_jiffies,
  354. },
  355. {
  356. .procname = "tcp_retries1",
  357. .data = &sysctl_tcp_retries1,
  358. .maxlen = sizeof(int),
  359. .mode = 0644,
  360. .proc_handler = proc_dointvec_minmax,
  361. .extra2 = &tcp_retr1_max
  362. },
  363. {
  364. .procname = "tcp_retries2",
  365. .data = &sysctl_tcp_retries2,
  366. .maxlen = sizeof(int),
  367. .mode = 0644,
  368. .proc_handler = proc_dointvec
  369. },
  370. {
  371. .procname = "tcp_fin_timeout",
  372. .data = &sysctl_tcp_fin_timeout,
  373. .maxlen = sizeof(int),
  374. .mode = 0644,
  375. .proc_handler = proc_dointvec_jiffies,
  376. },
  377. #ifdef CONFIG_SYN_COOKIES
  378. {
  379. .procname = "tcp_syncookies",
  380. .data = &sysctl_tcp_syncookies,
  381. .maxlen = sizeof(int),
  382. .mode = 0644,
  383. .proc_handler = proc_dointvec
  384. },
  385. #endif
  386. {
  387. .procname = "tcp_fastopen",
  388. .data = &sysctl_tcp_fastopen,
  389. .maxlen = sizeof(int),
  390. .mode = 0644,
  391. .proc_handler = proc_dointvec,
  392. },
  393. {
  394. .procname = "tcp_fastopen_key",
  395. .mode = 0600,
  396. .maxlen = ((TCP_FASTOPEN_KEY_LENGTH * 2) + 10),
  397. .proc_handler = proc_tcp_fastopen_key,
  398. },
  399. {
  400. .procname = "tcp_tw_recycle",
  401. .data = &tcp_death_row.sysctl_tw_recycle,
  402. .maxlen = sizeof(int),
  403. .mode = 0644,
  404. .proc_handler = proc_dointvec
  405. },
  406. {
  407. .procname = "tcp_abort_on_overflow",
  408. .data = &sysctl_tcp_abort_on_overflow,
  409. .maxlen = sizeof(int),
  410. .mode = 0644,
  411. .proc_handler = proc_dointvec
  412. },
  413. {
  414. .procname = "tcp_stdurg",
  415. .data = &sysctl_tcp_stdurg,
  416. .maxlen = sizeof(int),
  417. .mode = 0644,
  418. .proc_handler = proc_dointvec
  419. },
  420. {
  421. .procname = "tcp_rfc1337",
  422. .data = &sysctl_tcp_rfc1337,
  423. .maxlen = sizeof(int),
  424. .mode = 0644,
  425. .proc_handler = proc_dointvec
  426. },
  427. {
  428. .procname = "tcp_max_syn_backlog",
  429. .data = &sysctl_max_syn_backlog,
  430. .maxlen = sizeof(int),
  431. .mode = 0644,
  432. .proc_handler = proc_dointvec
  433. },
  434. {
  435. .procname = "ip_local_port_range",
  436. .data = &sysctl_local_ports.range,
  437. .maxlen = sizeof(sysctl_local_ports.range),
  438. .mode = 0644,
  439. .proc_handler = ipv4_local_port_range,
  440. },
  441. {
  442. .procname = "ip_local_reserved_ports",
  443. .data = NULL, /* initialized in sysctl_ipv4_init */
  444. .maxlen = 65536,
  445. .mode = 0644,
  446. .proc_handler = proc_do_large_bitmap,
  447. },
  448. {
  449. .procname = "igmp_max_memberships",
  450. .data = &sysctl_igmp_max_memberships,
  451. .maxlen = sizeof(int),
  452. .mode = 0644,
  453. .proc_handler = proc_dointvec
  454. },
  455. {
  456. .procname = "igmp_max_msf",
  457. .data = &sysctl_igmp_max_msf,
  458. .maxlen = sizeof(int),
  459. .mode = 0644,
  460. .proc_handler = proc_dointvec
  461. },
  462. {
  463. .procname = "inet_peer_threshold",
  464. .data = &inet_peer_threshold,
  465. .maxlen = sizeof(int),
  466. .mode = 0644,
  467. .proc_handler = proc_dointvec
  468. },
  469. {
  470. .procname = "inet_peer_minttl",
  471. .data = &inet_peer_minttl,
  472. .maxlen = sizeof(int),
  473. .mode = 0644,
  474. .proc_handler = proc_dointvec_jiffies,
  475. },
  476. {
  477. .procname = "inet_peer_maxttl",
  478. .data = &inet_peer_maxttl,
  479. .maxlen = sizeof(int),
  480. .mode = 0644,
  481. .proc_handler = proc_dointvec_jiffies,
  482. },
  483. {
  484. .procname = "tcp_orphan_retries",
  485. .data = &sysctl_tcp_orphan_retries,
  486. .maxlen = sizeof(int),
  487. .mode = 0644,
  488. .proc_handler = proc_dointvec
  489. },
  490. {
  491. .procname = "tcp_fack",
  492. .data = &sysctl_tcp_fack,
  493. .maxlen = sizeof(int),
  494. .mode = 0644,
  495. .proc_handler = proc_dointvec
  496. },
  497. {
  498. .procname = "tcp_reordering",
  499. .data = &sysctl_tcp_reordering,
  500. .maxlen = sizeof(int),
  501. .mode = 0644,
  502. .proc_handler = proc_dointvec
  503. },
  504. {
  505. .procname = "tcp_dsack",
  506. .data = &sysctl_tcp_dsack,
  507. .maxlen = sizeof(int),
  508. .mode = 0644,
  509. .proc_handler = proc_dointvec
  510. },
  511. {
  512. .procname = "tcp_wmem",
  513. .data = &sysctl_tcp_wmem,
  514. .maxlen = sizeof(sysctl_tcp_wmem),
  515. .mode = 0644,
  516. .proc_handler = proc_dointvec_minmax,
  517. .extra1 = &one,
  518. },
  519. {
  520. .procname = "tcp_rmem",
  521. .data = &sysctl_tcp_rmem,
  522. .maxlen = sizeof(sysctl_tcp_rmem),
  523. .mode = 0644,
  524. .proc_handler = proc_dointvec_minmax,
  525. .extra1 = &one,
  526. },
  527. {
  528. .procname = "tcp_app_win",
  529. .data = &sysctl_tcp_app_win,
  530. .maxlen = sizeof(int),
  531. .mode = 0644,
  532. .proc_handler = proc_dointvec
  533. },
  534. {
  535. .procname = "tcp_adv_win_scale",
  536. .data = &sysctl_tcp_adv_win_scale,
  537. .maxlen = sizeof(int),
  538. .mode = 0644,
  539. .proc_handler = proc_dointvec_minmax,
  540. .extra1 = &tcp_adv_win_scale_min,
  541. .extra2 = &tcp_adv_win_scale_max,
  542. },
  543. {
  544. .procname = "tcp_tw_reuse",
  545. .data = &sysctl_tcp_tw_reuse,
  546. .maxlen = sizeof(int),
  547. .mode = 0644,
  548. .proc_handler = proc_dointvec
  549. },
  550. {
  551. .procname = "tcp_frto",
  552. .data = &sysctl_tcp_frto,
  553. .maxlen = sizeof(int),
  554. .mode = 0644,
  555. .proc_handler = proc_dointvec
  556. },
  557. {
  558. .procname = "tcp_low_latency",
  559. .data = &sysctl_tcp_low_latency,
  560. .maxlen = sizeof(int),
  561. .mode = 0644,
  562. .proc_handler = proc_dointvec
  563. },
  564. {
  565. .procname = "tcp_no_metrics_save",
  566. .data = &sysctl_tcp_nometrics_save,
  567. .maxlen = sizeof(int),
  568. .mode = 0644,
  569. .proc_handler = proc_dointvec,
  570. },
  571. {
  572. .procname = "tcp_moderate_rcvbuf",
  573. .data = &sysctl_tcp_moderate_rcvbuf,
  574. .maxlen = sizeof(int),
  575. .mode = 0644,
  576. .proc_handler = proc_dointvec,
  577. },
  578. {
  579. .procname = "tcp_tso_win_divisor",
  580. .data = &sysctl_tcp_tso_win_divisor,
  581. .maxlen = sizeof(int),
  582. .mode = 0644,
  583. .proc_handler = proc_dointvec,
  584. },
  585. {
  586. .procname = "tcp_congestion_control",
  587. .mode = 0644,
  588. .maxlen = TCP_CA_NAME_MAX,
  589. .proc_handler = proc_tcp_congestion_control,
  590. },
  591. {
  592. .procname = "tcp_mtu_probing",
  593. .data = &sysctl_tcp_mtu_probing,
  594. .maxlen = sizeof(int),
  595. .mode = 0644,
  596. .proc_handler = proc_dointvec,
  597. },
  598. {
  599. .procname = "tcp_base_mss",
  600. .data = &sysctl_tcp_base_mss,
  601. .maxlen = sizeof(int),
  602. .mode = 0644,
  603. .proc_handler = proc_dointvec,
  604. },
  605. {
  606. .procname = "tcp_workaround_signed_windows",
  607. .data = &sysctl_tcp_workaround_signed_windows,
  608. .maxlen = sizeof(int),
  609. .mode = 0644,
  610. .proc_handler = proc_dointvec
  611. },
  612. {
  613. .procname = "tcp_limit_output_bytes",
  614. .data = &sysctl_tcp_limit_output_bytes,
  615. .maxlen = sizeof(int),
  616. .mode = 0644,
  617. .proc_handler = proc_dointvec
  618. },
  619. {
  620. .procname = "tcp_challenge_ack_limit",
  621. .data = &sysctl_tcp_challenge_ack_limit,
  622. .maxlen = sizeof(int),
  623. .mode = 0644,
  624. .proc_handler = proc_dointvec
  625. },
  626. #ifdef CONFIG_NET_DMA
  627. {
  628. .procname = "tcp_dma_copybreak",
  629. .data = &sysctl_tcp_dma_copybreak,
  630. .maxlen = sizeof(int),
  631. .mode = 0644,
  632. .proc_handler = proc_dointvec
  633. },
  634. #endif
  635. {
  636. .procname = "tcp_slow_start_after_idle",
  637. .data = &sysctl_tcp_slow_start_after_idle,
  638. .maxlen = sizeof(int),
  639. .mode = 0644,
  640. .proc_handler = proc_dointvec
  641. },
  642. #ifdef CONFIG_NETLABEL
  643. {
  644. .procname = "cipso_cache_enable",
  645. .data = &cipso_v4_cache_enabled,
  646. .maxlen = sizeof(int),
  647. .mode = 0644,
  648. .proc_handler = proc_dointvec,
  649. },
  650. {
  651. .procname = "cipso_cache_bucket_size",
  652. .data = &cipso_v4_cache_bucketsize,
  653. .maxlen = sizeof(int),
  654. .mode = 0644,
  655. .proc_handler = proc_dointvec,
  656. },
  657. {
  658. .procname = "cipso_rbm_optfmt",
  659. .data = &cipso_v4_rbm_optfmt,
  660. .maxlen = sizeof(int),
  661. .mode = 0644,
  662. .proc_handler = proc_dointvec,
  663. },
  664. {
  665. .procname = "cipso_rbm_strictvalid",
  666. .data = &cipso_v4_rbm_strictvalid,
  667. .maxlen = sizeof(int),
  668. .mode = 0644,
  669. .proc_handler = proc_dointvec,
  670. },
  671. #endif /* CONFIG_NETLABEL */
  672. {
  673. .procname = "tcp_available_congestion_control",
  674. .maxlen = TCP_CA_BUF_MAX,
  675. .mode = 0444,
  676. .proc_handler = proc_tcp_available_congestion_control,
  677. },
  678. {
  679. .procname = "tcp_allowed_congestion_control",
  680. .maxlen = TCP_CA_BUF_MAX,
  681. .mode = 0644,
  682. .proc_handler = proc_allowed_congestion_control,
  683. },
  684. {
  685. .procname = "tcp_max_ssthresh",
  686. .data = &sysctl_tcp_max_ssthresh,
  687. .maxlen = sizeof(int),
  688. .mode = 0644,
  689. .proc_handler = proc_dointvec,
  690. },
  691. {
  692. .procname = "tcp_thin_linear_timeouts",
  693. .data = &sysctl_tcp_thin_linear_timeouts,
  694. .maxlen = sizeof(int),
  695. .mode = 0644,
  696. .proc_handler = proc_dointvec
  697. },
  698. {
  699. .procname = "tcp_thin_dupack",
  700. .data = &sysctl_tcp_thin_dupack,
  701. .maxlen = sizeof(int),
  702. .mode = 0644,
  703. .proc_handler = proc_dointvec
  704. },
  705. {
  706. .procname = "tcp_early_retrans",
  707. .data = &sysctl_tcp_early_retrans,
  708. .maxlen = sizeof(int),
  709. .mode = 0644,
  710. .proc_handler = proc_dointvec_minmax,
  711. .extra1 = &zero,
  712. .extra2 = &four,
  713. },
  714. {
  715. .procname = "udp_mem",
  716. .data = &sysctl_udp_mem,
  717. .maxlen = sizeof(sysctl_udp_mem),
  718. .mode = 0644,
  719. .proc_handler = proc_doulongvec_minmax,
  720. },
  721. {
  722. .procname = "udp_rmem_min",
  723. .data = &sysctl_udp_rmem_min,
  724. .maxlen = sizeof(sysctl_udp_rmem_min),
  725. .mode = 0644,
  726. .proc_handler = proc_dointvec_minmax,
  727. .extra1 = &one
  728. },
  729. {
  730. .procname = "udp_wmem_min",
  731. .data = &sysctl_udp_wmem_min,
  732. .maxlen = sizeof(sysctl_udp_wmem_min),
  733. .mode = 0644,
  734. .proc_handler = proc_dointvec_minmax,
  735. .extra1 = &one
  736. },
  737. { }
  738. };
  739. static struct ctl_table ipv4_net_table[] = {
  740. {
  741. .procname = "icmp_echo_ignore_all",
  742. .data = &init_net.ipv4.sysctl_icmp_echo_ignore_all,
  743. .maxlen = sizeof(int),
  744. .mode = 0644,
  745. .proc_handler = proc_dointvec
  746. },
  747. {
  748. .procname = "icmp_echo_ignore_broadcasts",
  749. .data = &init_net.ipv4.sysctl_icmp_echo_ignore_broadcasts,
  750. .maxlen = sizeof(int),
  751. .mode = 0644,
  752. .proc_handler = proc_dointvec
  753. },
  754. {
  755. .procname = "icmp_ignore_bogus_error_responses",
  756. .data = &init_net.ipv4.sysctl_icmp_ignore_bogus_error_responses,
  757. .maxlen = sizeof(int),
  758. .mode = 0644,
  759. .proc_handler = proc_dointvec
  760. },
  761. {
  762. .procname = "icmp_errors_use_inbound_ifaddr",
  763. .data = &init_net.ipv4.sysctl_icmp_errors_use_inbound_ifaddr,
  764. .maxlen = sizeof(int),
  765. .mode = 0644,
  766. .proc_handler = proc_dointvec
  767. },
  768. {
  769. .procname = "icmp_ratelimit",
  770. .data = &init_net.ipv4.sysctl_icmp_ratelimit,
  771. .maxlen = sizeof(int),
  772. .mode = 0644,
  773. .proc_handler = proc_dointvec_ms_jiffies,
  774. },
  775. {
  776. .procname = "icmp_ratemask",
  777. .data = &init_net.ipv4.sysctl_icmp_ratemask,
  778. .maxlen = sizeof(int),
  779. .mode = 0644,
  780. .proc_handler = proc_dointvec
  781. },
  782. {
  783. .procname = "ping_group_range",
  784. .data = &init_net.ipv4.sysctl_ping_group_range,
  785. .maxlen = sizeof(gid_t)*2,
  786. .mode = 0644,
  787. .proc_handler = ipv4_ping_group_range,
  788. },
  789. {
  790. .procname = "tcp_ecn",
  791. .data = &init_net.ipv4.sysctl_tcp_ecn,
  792. .maxlen = sizeof(int),
  793. .mode = 0644,
  794. .proc_handler = proc_dointvec
  795. },
  796. {
  797. .procname = "tcp_mem",
  798. .maxlen = sizeof(init_net.ipv4.sysctl_tcp_mem),
  799. .mode = 0644,
  800. .proc_handler = ipv4_tcp_mem,
  801. },
  802. { }
  803. };
  804. static __net_init int ipv4_sysctl_init_net(struct net *net)
  805. {
  806. struct ctl_table *table;
  807. table = ipv4_net_table;
  808. if (!net_eq(net, &init_net)) {
  809. table = kmemdup(table, sizeof(ipv4_net_table), GFP_KERNEL);
  810. if (table == NULL)
  811. goto err_alloc;
  812. table[0].data =
  813. &net->ipv4.sysctl_icmp_echo_ignore_all;
  814. table[1].data =
  815. &net->ipv4.sysctl_icmp_echo_ignore_broadcasts;
  816. table[2].data =
  817. &net->ipv4.sysctl_icmp_ignore_bogus_error_responses;
  818. table[3].data =
  819. &net->ipv4.sysctl_icmp_errors_use_inbound_ifaddr;
  820. table[4].data =
  821. &net->ipv4.sysctl_icmp_ratelimit;
  822. table[5].data =
  823. &net->ipv4.sysctl_icmp_ratemask;
  824. table[6].data =
  825. &net->ipv4.sysctl_ping_group_range;
  826. table[7].data =
  827. &net->ipv4.sysctl_tcp_ecn;
  828. /* Don't export sysctls to unprivileged users */
  829. if (net->user_ns != &init_user_ns)
  830. table[0].procname = NULL;
  831. }
  832. /*
  833. * Sane defaults - nobody may create ping sockets.
  834. * Boot scripts should set this to distro-specific group.
  835. */
  836. net->ipv4.sysctl_ping_group_range[0] = make_kgid(&init_user_ns, 1);
  837. net->ipv4.sysctl_ping_group_range[1] = make_kgid(&init_user_ns, 0);
  838. tcp_init_mem(net);
  839. net->ipv4.ipv4_hdr = register_net_sysctl(net, "net/ipv4", table);
  840. if (net->ipv4.ipv4_hdr == NULL)
  841. goto err_reg;
  842. return 0;
  843. err_reg:
  844. if (!net_eq(net, &init_net))
  845. kfree(table);
  846. err_alloc:
  847. return -ENOMEM;
  848. }
  849. static __net_exit void ipv4_sysctl_exit_net(struct net *net)
  850. {
  851. struct ctl_table *table;
  852. table = net->ipv4.ipv4_hdr->ctl_table_arg;
  853. unregister_net_sysctl_table(net->ipv4.ipv4_hdr);
  854. kfree(table);
  855. }
  856. static __net_initdata struct pernet_operations ipv4_sysctl_ops = {
  857. .init = ipv4_sysctl_init_net,
  858. .exit = ipv4_sysctl_exit_net,
  859. };
  860. static __init int sysctl_ipv4_init(void)
  861. {
  862. struct ctl_table_header *hdr;
  863. struct ctl_table *i;
  864. for (i = ipv4_table; i->procname; i++) {
  865. if (strcmp(i->procname, "ip_local_reserved_ports") == 0) {
  866. i->data = sysctl_local_reserved_ports;
  867. break;
  868. }
  869. }
  870. if (!i->procname)
  871. return -EINVAL;
  872. hdr = register_net_sysctl(&init_net, "net/ipv4", ipv4_table);
  873. if (hdr == NULL)
  874. return -ENOMEM;
  875. if (register_pernet_subsys(&ipv4_sysctl_ops)) {
  876. unregister_net_sysctl_table(hdr);
  877. return -ENOMEM;
  878. }
  879. return 0;
  880. }
  881. __initcall(sysctl_ipv4_init);