blob: a7c36845b123c09f727931cfe3ef3e4ad0365432 [file] [log] [blame]
/* -*- linux-c -*-
 * sysctl_net_core.c: sysctl interface to net core subsystem.
 *
 * Begun April 1, 1996, Mike Shaver.
 * Added /proc/sys/net/core directory entry (empty =) ). [MS]
 */
7
8#include <linux/mm.h>
9#include <linux/sysctl.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070010#include <linux/module.h>
Arnaldo Carvalho de Melo20380732005-08-16 02:18:02 -030011#include <linux/socket.h>
Pavel Emelyanova37ae402007-10-23 21:13:53 -070012#include <linux/netdevice.h>
Ingo Molnar3fff4c42009-09-22 16:18:09 +020013#include <linux/ratelimit.h>
Tom Herbertfec5e652010-04-16 16:01:27 -070014#include <linux/vmalloc.h>
Pavel Emelyanov33eb9cf2007-12-05 01:37:34 -080015#include <linux/init.h>
Tejun Heo5a0e3ad2010-03-24 17:04:11 +090016#include <linux/slab.h>
Shan Wei7426a562012-04-18 18:05:46 +000017#include <linux/kmemleak.h>
Ingo Molnar3fff4c42009-09-22 16:18:09 +020018
Hannes Eder63d819c2009-02-25 10:32:14 +000019#include <net/ip.h>
Arnaldo Carvalho de Melo20380732005-08-16 02:18:02 -030020#include <net/sock.h>
David S. Millerc5c177b2011-05-27 13:41:33 -040021#include <net/net_ratelimit.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070022
#ifdef CONFIG_RPS
/*
 * rps_sock_flow_sysctl - proc handler for the "rps_sock_flow_entries" sysctl
 * @table:  sysctl entry being accessed; only its ->mode is used here
 * @write:  non-zero when userspace is writing a new value
 * @buffer: user buffer, handed straight to proc_dointvec()
 * @lenp:   in/out buffer length, handed straight to proc_dointvec()
 * @ppos:   file position, handed straight to proc_dointvec()
 *
 * A read reports the number of entries in the current rps_sock_flow_table
 * (mask + 1), or 0 when no table is installed.
 *
 * A successful write of 0 removes the table.  A non-zero value is rounded up
 * to a power of two; if that differs from the current size a new table is
 * allocated and published, otherwise the existing table is kept.  In both
 * cases every entry of the resulting table is reset to RPS_NO_CPU.
 *
 * All of this runs under a function-local mutex, so concurrent accesses to
 * this sysctl are serialised.
 *
 * Returns -EINVAL when the requested size exceeds 1<<30, -ENOMEM when the new
 * table cannot be allocated, and otherwise whatever proc_dointvec() returned.
 */
static int rps_sock_flow_sysctl(ctl_table *table, int write,
				void __user *buffer, size_t *lenp, loff_t *ppos)
{
	unsigned int orig_size, size, i;
	int ret;
	/* Temporary entry so proc_dointvec() parses/prints the local 'size'. */
	ctl_table tmp = {
		.data = &size,
		.maxlen = sizeof(size),
		.mode = table->mode
	};
	struct rps_sock_flow_table *orig_sock_table, *sock_table;
	static DEFINE_MUTEX(sock_flow_mutex);

	mutex_lock(&sock_flow_mutex);

	orig_sock_table = rcu_dereference_protected(rps_sock_flow_table,
					lockdep_is_held(&sock_flow_mutex));
	size = orig_size = orig_sock_table ? orig_sock_table->mask + 1 : 0;

	ret = proc_dointvec(&tmp, write, buffer, lenp, ppos);

	/*
	 * Nothing more to do for reads.  For writes that failed to parse,
	 * leave the installed table alone: 'size' still holds the old value
	 * and carrying on would wipe every entry of the live table.
	 */
	if (ret || !write)
		goto out;

	if (size) {
		if (size > 1<<30) {
			/* Enforce limit to prevent overflow */
			ret = -EINVAL;
			goto out;
		}
		size = roundup_pow_of_two(size);
		if (size != orig_size) {
			sock_table = vmalloc(RPS_SOCK_FLOW_TABLE_SIZE(size));
			if (!sock_table) {
				ret = -ENOMEM;
				goto out;
			}

			sock_table->mask = size - 1;
		} else {
			sock_table = orig_sock_table;
		}

		/* Fresh or reused, the table starts with no CPU recorded. */
		for (i = 0; i < size; i++)
			sock_table->ents[i] = RPS_NO_CPU;
	} else {
		sock_table = NULL;
	}

	if (sock_table != orig_sock_table) {
		rcu_assign_pointer(rps_sock_flow_table, sock_table);
		/*
		 * Take the reference for the new table before dropping the
		 * one held for the old table (presumably so the key does not
		 * bounce through zero when one table replaces another).
		 */
		if (sock_table)
			static_key_slow_inc(&rps_needed);
		if (orig_sock_table) {
			static_key_slow_dec(&rps_needed);
			/* Wait for RCU readers before freeing the old table. */
			synchronize_rcu();
			vfree(orig_sock_table);
		}
	}

out:
	mutex_unlock(&sock_flow_mutex);

	return ret;
}
#endif /* CONFIG_RPS */
87
Pavel Emelyanov33eb9cf2007-12-05 01:37:34 -080088static struct ctl_table net_core_table[] = {
Linus Torvalds1da177e2005-04-16 15:20:36 -070089#ifdef CONFIG_NET
90 {
Linus Torvalds1da177e2005-04-16 15:20:36 -070091 .procname = "wmem_max",
92 .data = &sysctl_wmem_max,
93 .maxlen = sizeof(int),
94 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -080095 .proc_handler = proc_dointvec
Linus Torvalds1da177e2005-04-16 15:20:36 -070096 },
97 {
Linus Torvalds1da177e2005-04-16 15:20:36 -070098 .procname = "rmem_max",
99 .data = &sysctl_rmem_max,
100 .maxlen = sizeof(int),
101 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -0800102 .proc_handler = proc_dointvec
Linus Torvalds1da177e2005-04-16 15:20:36 -0700103 },
104 {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700105 .procname = "wmem_default",
106 .data = &sysctl_wmem_default,
107 .maxlen = sizeof(int),
108 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -0800109 .proc_handler = proc_dointvec
Linus Torvalds1da177e2005-04-16 15:20:36 -0700110 },
111 {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700112 .procname = "rmem_default",
113 .data = &sysctl_rmem_default,
114 .maxlen = sizeof(int),
115 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -0800116 .proc_handler = proc_dointvec
Linus Torvalds1da177e2005-04-16 15:20:36 -0700117 },
118 {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700119 .procname = "dev_weight",
120 .data = &weight_p,
121 .maxlen = sizeof(int),
122 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -0800123 .proc_handler = proc_dointvec
Linus Torvalds1da177e2005-04-16 15:20:36 -0700124 },
125 {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700126 .procname = "netdev_max_backlog",
127 .data = &netdev_max_backlog,
128 .maxlen = sizeof(int),
129 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -0800130 .proc_handler = proc_dointvec
Linus Torvalds1da177e2005-04-16 15:20:36 -0700131 },
Eric Dumazet0a148422011-04-20 09:27:32 +0000132#ifdef CONFIG_BPF_JIT
133 {
134 .procname = "bpf_jit_enable",
135 .data = &bpf_jit_enable,
136 .maxlen = sizeof(int),
137 .mode = 0644,
138 .proc_handler = proc_dointvec
139 },
140#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700141 {
Eric Dumazet3b098e22010-05-15 23:57:10 -0700142 .procname = "netdev_tstamp_prequeue",
143 .data = &netdev_tstamp_prequeue,
144 .maxlen = sizeof(int),
145 .mode = 0644,
146 .proc_handler = proc_dointvec
147 },
148 {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700149 .procname = "message_cost",
Dave Young717115e2008-07-25 01:45:58 -0700150 .data = &net_ratelimit_state.interval,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700151 .maxlen = sizeof(int),
152 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -0800153 .proc_handler = proc_dointvec_jiffies,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700154 },
155 {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700156 .procname = "message_burst",
Dave Young717115e2008-07-25 01:45:58 -0700157 .data = &net_ratelimit_state.burst,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700158 .maxlen = sizeof(int),
159 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -0800160 .proc_handler = proc_dointvec,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700161 },
162 {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700163 .procname = "optmem_max",
164 .data = &sysctl_optmem_max,
165 .maxlen = sizeof(int),
166 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -0800167 .proc_handler = proc_dointvec
Linus Torvalds1da177e2005-04-16 15:20:36 -0700168 },
Tom Herbertfec5e652010-04-16 16:01:27 -0700169#ifdef CONFIG_RPS
170 {
171 .procname = "rps_sock_flow_entries",
172 .maxlen = sizeof(int),
173 .mode = 0644,
174 .proc_handler = rps_sock_flow_sysctl
175 },
176#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700177#endif /* CONFIG_NET */
178 {
Stephen Hemminger51b0bde2005-06-23 20:14:40 -0700179 .procname = "netdev_budget",
180 .data = &netdev_budget,
181 .maxlen = sizeof(int),
182 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -0800183 .proc_handler = proc_dointvec
Stephen Hemminger51b0bde2005-06-23 20:14:40 -0700184 },
Stephen Hemmingera2a316f2007-03-08 20:41:08 -0800185 {
Stephen Hemmingera2a316f2007-03-08 20:41:08 -0800186 .procname = "warnings",
187 .data = &net_msg_warn,
188 .maxlen = sizeof(int),
189 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -0800190 .proc_handler = proc_dointvec
Stephen Hemmingera2a316f2007-03-08 20:41:08 -0800191 },
Eric W. Biedermanf8572d82009-11-05 13:32:03 -0800192 { }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700193};
Pavel Emelyanov33eb9cf2007-12-05 01:37:34 -0800194
Pavel Emelyanovd5a45022008-05-19 13:49:52 -0700195static struct ctl_table netns_core_table[] = {
196 {
Pavel Emelyanovd5a45022008-05-19 13:49:52 -0700197 .procname = "somaxconn",
198 .data = &init_net.core.sysctl_somaxconn,
199 .maxlen = sizeof(int),
200 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -0800201 .proc_handler = proc_dointvec
Pavel Emelyanovd5a45022008-05-19 13:49:52 -0700202 },
Eric W. Biedermanf8572d82009-11-05 13:32:03 -0800203 { }
Pavel Emelyanovd5a45022008-05-19 13:49:52 -0700204};
205
Pavel Emelyanov024626e2007-12-08 00:09:24 -0800206static __net_init int sysctl_core_net_init(struct net *net)
207{
Pavel Emelyanovd5a45022008-05-19 13:49:52 -0700208 struct ctl_table *tbl;
Pavel Emelyanov024626e2007-12-08 00:09:24 -0800209
Pavel Emelyanov8efa6e92008-03-31 19:41:14 -0700210 net->core.sysctl_somaxconn = SOMAXCONN;
Pavel Emelyanovb8e1f9b2007-12-08 00:12:33 -0800211
Pavel Emelyanovd5a45022008-05-19 13:49:52 -0700212 tbl = netns_core_table;
Octavian Purdila09ad9bc2009-11-25 15:14:13 -0800213 if (!net_eq(net, &init_net)) {
Pavel Emelyanovd5a45022008-05-19 13:49:52 -0700214 tbl = kmemdup(tbl, sizeof(netns_core_table), GFP_KERNEL);
Pavel Emelyanov024626e2007-12-08 00:09:24 -0800215 if (tbl == NULL)
216 goto err_dup;
217
Pavel Emelyanovd5a45022008-05-19 13:49:52 -0700218 tbl[0].data = &net->core.sysctl_somaxconn;
Pavel Emelyanov024626e2007-12-08 00:09:24 -0800219 }
220
Eric W. Biedermanec8f23c2012-04-19 13:44:49 +0000221 net->core.sysctl_hdr = register_net_sysctl(net, "net/core", tbl);
Pavel Emelyanov8efa6e92008-03-31 19:41:14 -0700222 if (net->core.sysctl_hdr == NULL)
Pavel Emelyanov024626e2007-12-08 00:09:24 -0800223 goto err_reg;
224
225 return 0;
226
227err_reg:
Pavel Emelyanovd5a45022008-05-19 13:49:52 -0700228 if (tbl != netns_core_table)
Pavel Emelyanov024626e2007-12-08 00:09:24 -0800229 kfree(tbl);
230err_dup:
231 return -ENOMEM;
232}
233
234static __net_exit void sysctl_core_net_exit(struct net *net)
235{
236 struct ctl_table *tbl;
237
Pavel Emelyanov8efa6e92008-03-31 19:41:14 -0700238 tbl = net->core.sysctl_hdr->ctl_table_arg;
239 unregister_net_sysctl_table(net->core.sysctl_hdr);
Pavel Emelyanovd5a45022008-05-19 13:49:52 -0700240 BUG_ON(tbl == netns_core_table);
Pavel Emelyanov024626e2007-12-08 00:09:24 -0800241 kfree(tbl);
242}
243
244static __net_initdata struct pernet_operations sysctl_core_ops = {
245 .init = sysctl_core_net_init,
246 .exit = sysctl_core_net_exit,
247};
248
Pavel Emelyanov33eb9cf2007-12-05 01:37:34 -0800249static __init int sysctl_core_init(void)
250{
Eric W. Biederman43444752012-04-19 13:22:55 +0000251 register_net_sysctl(&init_net, "net/core", net_core_table);
Pavel Emelyanov024626e2007-12-08 00:09:24 -0800252 return register_pernet_subsys(&sysctl_core_ops);
Pavel Emelyanov33eb9cf2007-12-05 01:37:34 -0800253}
254
Alexey Dobriyanb27aead2008-11-25 18:00:48 -0800255fs_initcall(sysctl_core_init);