sysctl_net_core.c 5.6 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266
  1. /* -*- linux-c -*-
  2. * sysctl_net_core.c: sysctl interface to net core subsystem.
  3. *
  4. * Begun April 1, 1996, Mike Shaver.
  5. * Added /proc/sys/net/core directory entry (empty =) ). [MS]
  6. */
  7. #include <linux/mm.h>
  8. #include <linux/sysctl.h>
  9. #include <linux/module.h>
  10. #include <linux/socket.h>
  11. #include <linux/netdevice.h>
  12. #include <linux/ratelimit.h>
  13. #include <linux/vmalloc.h>
  14. #include <linux/init.h>
  15. #include <linux/slab.h>
  16. #include <linux/kmemleak.h>
  17. #include <net/ip.h>
  18. #include <net/sock.h>
  19. #include <net/net_ratelimit.h>
  20. static int one = 1;
  21. #ifdef CONFIG_RPS
  22. static int rps_sock_flow_sysctl(ctl_table *table, int write,
  23. void __user *buffer, size_t *lenp, loff_t *ppos)
  24. {
  25. unsigned int orig_size, size;
  26. int ret, i;
  27. ctl_table tmp = {
  28. .data = &size,
  29. .maxlen = sizeof(size),
  30. .mode = table->mode
  31. };
  32. struct rps_sock_flow_table *orig_sock_table, *sock_table;
  33. static DEFINE_MUTEX(sock_flow_mutex);
  34. mutex_lock(&sock_flow_mutex);
  35. orig_sock_table = rcu_dereference_protected(rps_sock_flow_table,
  36. lockdep_is_held(&sock_flow_mutex));
  37. size = orig_size = orig_sock_table ? orig_sock_table->mask + 1 : 0;
  38. ret = proc_dointvec(&tmp, write, buffer, lenp, ppos);
  39. if (write) {
  40. if (size) {
  41. if (size > 1<<30) {
  42. /* Enforce limit to prevent overflow */
  43. mutex_unlock(&sock_flow_mutex);
  44. return -EINVAL;
  45. }
  46. size = roundup_pow_of_two(size);
  47. if (size != orig_size) {
  48. sock_table =
  49. vmalloc(RPS_SOCK_FLOW_TABLE_SIZE(size));
  50. if (!sock_table) {
  51. mutex_unlock(&sock_flow_mutex);
  52. return -ENOMEM;
  53. }
  54. sock_table->mask = size - 1;
  55. } else
  56. sock_table = orig_sock_table;
  57. for (i = 0; i < size; i++)
  58. sock_table->ents[i] = RPS_NO_CPU;
  59. } else
  60. sock_table = NULL;
  61. if (sock_table != orig_sock_table) {
  62. rcu_assign_pointer(rps_sock_flow_table, sock_table);
  63. if (sock_table)
  64. static_key_slow_inc(&rps_needed);
  65. if (orig_sock_table) {
  66. static_key_slow_dec(&rps_needed);
  67. synchronize_rcu();
  68. vfree(orig_sock_table);
  69. }
  70. }
  71. }
  72. mutex_unlock(&sock_flow_mutex);
  73. return ret;
  74. }
  75. #endif /* CONFIG_RPS */
  76. static struct ctl_table net_core_table[] = {
  77. #ifdef CONFIG_NET
  78. {
  79. .procname = "wmem_max",
  80. .data = &sysctl_wmem_max,
  81. .maxlen = sizeof(int),
  82. .mode = 0644,
  83. .proc_handler = proc_dointvec_minmax,
  84. .extra1 = &one,
  85. },
  86. {
  87. .procname = "rmem_max",
  88. .data = &sysctl_rmem_max,
  89. .maxlen = sizeof(int),
  90. .mode = 0644,
  91. .proc_handler = proc_dointvec_minmax,
  92. .extra1 = &one,
  93. },
  94. {
  95. .procname = "wmem_default",
  96. .data = &sysctl_wmem_default,
  97. .maxlen = sizeof(int),
  98. .mode = 0644,
  99. .proc_handler = proc_dointvec_minmax,
  100. .extra1 = &one,
  101. },
  102. {
  103. .procname = "rmem_default",
  104. .data = &sysctl_rmem_default,
  105. .maxlen = sizeof(int),
  106. .mode = 0644,
  107. .proc_handler = proc_dointvec_minmax,
  108. .extra1 = &one,
  109. },
  110. {
  111. .procname = "dev_weight",
  112. .data = &weight_p,
  113. .maxlen = sizeof(int),
  114. .mode = 0644,
  115. .proc_handler = proc_dointvec
  116. },
  117. {
  118. .procname = "netdev_max_backlog",
  119. .data = &netdev_max_backlog,
  120. .maxlen = sizeof(int),
  121. .mode = 0644,
  122. .proc_handler = proc_dointvec
  123. },
  124. #ifdef CONFIG_BPF_JIT
  125. {
  126. .procname = "bpf_jit_enable",
  127. .data = &bpf_jit_enable,
  128. .maxlen = sizeof(int),
  129. .mode = 0644,
  130. .proc_handler = proc_dointvec
  131. },
  132. #endif
  133. {
  134. .procname = "netdev_tstamp_prequeue",
  135. .data = &netdev_tstamp_prequeue,
  136. .maxlen = sizeof(int),
  137. .mode = 0644,
  138. .proc_handler = proc_dointvec
  139. },
  140. {
  141. .procname = "message_cost",
  142. .data = &net_ratelimit_state.interval,
  143. .maxlen = sizeof(int),
  144. .mode = 0644,
  145. .proc_handler = proc_dointvec_jiffies,
  146. },
  147. {
  148. .procname = "message_burst",
  149. .data = &net_ratelimit_state.burst,
  150. .maxlen = sizeof(int),
  151. .mode = 0644,
  152. .proc_handler = proc_dointvec,
  153. },
  154. {
  155. .procname = "optmem_max",
  156. .data = &sysctl_optmem_max,
  157. .maxlen = sizeof(int),
  158. .mode = 0644,
  159. .proc_handler = proc_dointvec
  160. },
  161. #ifdef CONFIG_RPS
  162. {
  163. .procname = "rps_sock_flow_entries",
  164. .maxlen = sizeof(int),
  165. .mode = 0644,
  166. .proc_handler = rps_sock_flow_sysctl
  167. },
  168. #endif
  169. #endif /* CONFIG_NET */
  170. {
  171. .procname = "netdev_budget",
  172. .data = &netdev_budget,
  173. .maxlen = sizeof(int),
  174. .mode = 0644,
  175. .proc_handler = proc_dointvec
  176. },
  177. {
  178. .procname = "warnings",
  179. .data = &net_msg_warn,
  180. .maxlen = sizeof(int),
  181. .mode = 0644,
  182. .proc_handler = proc_dointvec
  183. },
  184. { }
  185. };
  186. static struct ctl_table netns_core_table[] = {
  187. {
  188. .procname = "somaxconn",
  189. .data = &init_net.core.sysctl_somaxconn,
  190. .maxlen = sizeof(int),
  191. .mode = 0644,
  192. .proc_handler = proc_dointvec
  193. },
  194. { }
  195. };
  196. static __net_init int sysctl_core_net_init(struct net *net)
  197. {
  198. struct ctl_table *tbl;
  199. net->core.sysctl_somaxconn = SOMAXCONN;
  200. tbl = netns_core_table;
  201. if (!net_eq(net, &init_net)) {
  202. tbl = kmemdup(tbl, sizeof(netns_core_table), GFP_KERNEL);
  203. if (tbl == NULL)
  204. goto err_dup;
  205. tbl[0].data = &net->core.sysctl_somaxconn;
  206. /* Don't export any sysctls to unprivileged users */
  207. if (net->user_ns != &init_user_ns) {
  208. tbl[0].procname = NULL;
  209. }
  210. }
  211. net->core.sysctl_hdr = register_net_sysctl(net, "net/core", tbl);
  212. if (net->core.sysctl_hdr == NULL)
  213. goto err_reg;
  214. return 0;
  215. err_reg:
  216. if (tbl != netns_core_table)
  217. kfree(tbl);
  218. err_dup:
  219. return -ENOMEM;
  220. }
  221. static __net_exit void sysctl_core_net_exit(struct net *net)
  222. {
  223. struct ctl_table *tbl;
  224. tbl = net->core.sysctl_hdr->ctl_table_arg;
  225. unregister_net_sysctl_table(net->core.sysctl_hdr);
  226. BUG_ON(tbl == netns_core_table);
  227. kfree(tbl);
  228. }
  229. static __net_initdata struct pernet_operations sysctl_core_ops = {
  230. .init = sysctl_core_net_init,
  231. .exit = sysctl_core_net_exit,
  232. };
  233. static __init int sysctl_core_init(void)
  234. {
  235. register_net_sysctl(&init_net, "net/core", net_core_table);
  236. return register_pernet_subsys(&sysctl_core_ops);
  237. }
  238. fs_initcall(sysctl_core_init);