blob: d05559d4d9cd4bbf5d97bd1ce1f058ef016a8e3a [file] [log] [blame]
/* -*- linux-c -*-
 * sysctl_net_core.c: sysctl interface to net core subsystem.
 *
 * Begun April 1, 1996, Mike Shaver.
 * Added /proc/sys/net/core directory entry (empty =) ). [MS]
 */
7
8#include <linux/mm.h>
9#include <linux/sysctl.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070010#include <linux/module.h>
Arnaldo Carvalho de Melo20380732005-08-16 02:18:02 -030011#include <linux/socket.h>
Pavel Emelyanova37ae402007-10-23 21:13:53 -070012#include <linux/netdevice.h>
Ingo Molnar3fff4c42009-09-22 16:18:09 +020013#include <linux/ratelimit.h>
Tom Herbertfec5e652010-04-16 16:01:27 -070014#include <linux/vmalloc.h>
Pavel Emelyanov33eb9cf2007-12-05 01:37:34 -080015#include <linux/init.h>
Tejun Heo5a0e3ad2010-03-24 17:04:11 +090016#include <linux/slab.h>
Ingo Molnar3fff4c42009-09-22 16:18:09 +020017
Hannes Eder63d819c2009-02-25 10:32:14 +000018#include <net/ip.h>
Arnaldo Carvalho de Melo20380732005-08-16 02:18:02 -030019#include <net/sock.h>
David S. Millerc5c177b2011-05-27 13:41:33 -040020#include <net/net_ratelimit.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070021
Tom Herbertfec5e652010-04-16 16:01:27 -070022#ifdef CONFIG_RPS
23static int rps_sock_flow_sysctl(ctl_table *table, int write,
24 void __user *buffer, size_t *lenp, loff_t *ppos)
25{
26 unsigned int orig_size, size;
27 int ret, i;
28 ctl_table tmp = {
29 .data = &size,
30 .maxlen = sizeof(size),
31 .mode = table->mode
32 };
33 struct rps_sock_flow_table *orig_sock_table, *sock_table;
34 static DEFINE_MUTEX(sock_flow_mutex);
35
36 mutex_lock(&sock_flow_mutex);
37
Eric Dumazet6e3f7fa2010-10-25 03:02:02 +000038 orig_sock_table = rcu_dereference_protected(rps_sock_flow_table,
39 lockdep_is_held(&sock_flow_mutex));
Tom Herbertfec5e652010-04-16 16:01:27 -070040 size = orig_size = orig_sock_table ? orig_sock_table->mask + 1 : 0;
41
42 ret = proc_dointvec(&tmp, write, buffer, lenp, ppos);
43
44 if (write) {
45 if (size) {
46 if (size > 1<<30) {
47 /* Enforce limit to prevent overflow */
48 mutex_unlock(&sock_flow_mutex);
49 return -EINVAL;
50 }
51 size = roundup_pow_of_two(size);
52 if (size != orig_size) {
53 sock_table =
54 vmalloc(RPS_SOCK_FLOW_TABLE_SIZE(size));
55 if (!sock_table) {
56 mutex_unlock(&sock_flow_mutex);
57 return -ENOMEM;
58 }
59
60 sock_table->mask = size - 1;
61 } else
62 sock_table = orig_sock_table;
63
64 for (i = 0; i < size; i++)
65 sock_table->ents[i] = RPS_NO_CPU;
66 } else
67 sock_table = NULL;
68
69 if (sock_table != orig_sock_table) {
70 rcu_assign_pointer(rps_sock_flow_table, sock_table);
Eric Dumazetadc93002011-11-17 03:13:26 +000071 if (sock_table)
72 jump_label_inc(&rps_needed);
73 if (orig_sock_table) {
74 jump_label_dec(&rps_needed);
75 synchronize_rcu();
76 vfree(orig_sock_table);
77 }
Tom Herbertfec5e652010-04-16 16:01:27 -070078 }
79 }
80
81 mutex_unlock(&sock_flow_mutex);
82
83 return ret;
84}
85#endif /* CONFIG_RPS */
86
Pavel Emelyanov33eb9cf2007-12-05 01:37:34 -080087static struct ctl_table net_core_table[] = {
Linus Torvalds1da177e2005-04-16 15:20:36 -070088#ifdef CONFIG_NET
89 {
Linus Torvalds1da177e2005-04-16 15:20:36 -070090 .procname = "wmem_max",
91 .data = &sysctl_wmem_max,
92 .maxlen = sizeof(int),
93 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -080094 .proc_handler = proc_dointvec
Linus Torvalds1da177e2005-04-16 15:20:36 -070095 },
96 {
Linus Torvalds1da177e2005-04-16 15:20:36 -070097 .procname = "rmem_max",
98 .data = &sysctl_rmem_max,
99 .maxlen = sizeof(int),
100 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -0800101 .proc_handler = proc_dointvec
Linus Torvalds1da177e2005-04-16 15:20:36 -0700102 },
103 {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700104 .procname = "wmem_default",
105 .data = &sysctl_wmem_default,
106 .maxlen = sizeof(int),
107 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -0800108 .proc_handler = proc_dointvec
Linus Torvalds1da177e2005-04-16 15:20:36 -0700109 },
110 {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700111 .procname = "rmem_default",
112 .data = &sysctl_rmem_default,
113 .maxlen = sizeof(int),
114 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -0800115 .proc_handler = proc_dointvec
Linus Torvalds1da177e2005-04-16 15:20:36 -0700116 },
117 {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700118 .procname = "dev_weight",
119 .data = &weight_p,
120 .maxlen = sizeof(int),
121 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -0800122 .proc_handler = proc_dointvec
Linus Torvalds1da177e2005-04-16 15:20:36 -0700123 },
124 {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700125 .procname = "netdev_max_backlog",
126 .data = &netdev_max_backlog,
127 .maxlen = sizeof(int),
128 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -0800129 .proc_handler = proc_dointvec
Linus Torvalds1da177e2005-04-16 15:20:36 -0700130 },
Eric Dumazet0a148422011-04-20 09:27:32 +0000131#ifdef CONFIG_BPF_JIT
132 {
133 .procname = "bpf_jit_enable",
134 .data = &bpf_jit_enable,
135 .maxlen = sizeof(int),
136 .mode = 0644,
137 .proc_handler = proc_dointvec
138 },
139#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700140 {
Eric Dumazet3b098e22010-05-15 23:57:10 -0700141 .procname = "netdev_tstamp_prequeue",
142 .data = &netdev_tstamp_prequeue,
143 .maxlen = sizeof(int),
144 .mode = 0644,
145 .proc_handler = proc_dointvec
146 },
147 {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700148 .procname = "message_cost",
Dave Young717115e2008-07-25 01:45:58 -0700149 .data = &net_ratelimit_state.interval,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700150 .maxlen = sizeof(int),
151 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -0800152 .proc_handler = proc_dointvec_jiffies,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700153 },
154 {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700155 .procname = "message_burst",
Dave Young717115e2008-07-25 01:45:58 -0700156 .data = &net_ratelimit_state.burst,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700157 .maxlen = sizeof(int),
158 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -0800159 .proc_handler = proc_dointvec,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700160 },
161 {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700162 .procname = "optmem_max",
163 .data = &sysctl_optmem_max,
164 .maxlen = sizeof(int),
165 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -0800166 .proc_handler = proc_dointvec
Linus Torvalds1da177e2005-04-16 15:20:36 -0700167 },
Tom Herbertfec5e652010-04-16 16:01:27 -0700168#ifdef CONFIG_RPS
169 {
170 .procname = "rps_sock_flow_entries",
171 .maxlen = sizeof(int),
172 .mode = 0644,
173 .proc_handler = rps_sock_flow_sysctl
174 },
175#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700176#endif /* CONFIG_NET */
177 {
Stephen Hemminger51b0bde2005-06-23 20:14:40 -0700178 .procname = "netdev_budget",
179 .data = &netdev_budget,
180 .maxlen = sizeof(int),
181 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -0800182 .proc_handler = proc_dointvec
Stephen Hemminger51b0bde2005-06-23 20:14:40 -0700183 },
Stephen Hemmingera2a316f2007-03-08 20:41:08 -0800184 {
Stephen Hemmingera2a316f2007-03-08 20:41:08 -0800185 .procname = "warnings",
186 .data = &net_msg_warn,
187 .maxlen = sizeof(int),
188 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -0800189 .proc_handler = proc_dointvec
Stephen Hemmingera2a316f2007-03-08 20:41:08 -0800190 },
Eric W. Biedermanf8572d82009-11-05 13:32:03 -0800191 { }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700192};
Pavel Emelyanov33eb9cf2007-12-05 01:37:34 -0800193
Pavel Emelyanovd5a45022008-05-19 13:49:52 -0700194static struct ctl_table netns_core_table[] = {
195 {
Pavel Emelyanovd5a45022008-05-19 13:49:52 -0700196 .procname = "somaxconn",
197 .data = &init_net.core.sysctl_somaxconn,
198 .maxlen = sizeof(int),
199 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -0800200 .proc_handler = proc_dointvec
Pavel Emelyanovd5a45022008-05-19 13:49:52 -0700201 },
Eric W. Biedermanf8572d82009-11-05 13:32:03 -0800202 { }
Pavel Emelyanovd5a45022008-05-19 13:49:52 -0700203};
204
Alexey Dobriyanb27aead2008-11-25 18:00:48 -0800205__net_initdata struct ctl_path net_core_path[] = {
Eric W. Biedermanf8572d82009-11-05 13:32:03 -0800206 { .procname = "net", },
207 { .procname = "core", },
Pavel Emelyanov33eb9cf2007-12-05 01:37:34 -0800208 { },
209};
210
Pavel Emelyanov024626e2007-12-08 00:09:24 -0800211static __net_init int sysctl_core_net_init(struct net *net)
212{
Pavel Emelyanovd5a45022008-05-19 13:49:52 -0700213 struct ctl_table *tbl;
Pavel Emelyanov024626e2007-12-08 00:09:24 -0800214
Pavel Emelyanov8efa6e92008-03-31 19:41:14 -0700215 net->core.sysctl_somaxconn = SOMAXCONN;
Pavel Emelyanovb8e1f9b2007-12-08 00:12:33 -0800216
Pavel Emelyanovd5a45022008-05-19 13:49:52 -0700217 tbl = netns_core_table;
Octavian Purdila09ad9bc2009-11-25 15:14:13 -0800218 if (!net_eq(net, &init_net)) {
Pavel Emelyanovd5a45022008-05-19 13:49:52 -0700219 tbl = kmemdup(tbl, sizeof(netns_core_table), GFP_KERNEL);
Pavel Emelyanov024626e2007-12-08 00:09:24 -0800220 if (tbl == NULL)
221 goto err_dup;
222
Pavel Emelyanovd5a45022008-05-19 13:49:52 -0700223 tbl[0].data = &net->core.sysctl_somaxconn;
Pavel Emelyanov024626e2007-12-08 00:09:24 -0800224 }
225
Pavel Emelyanov8efa6e92008-03-31 19:41:14 -0700226 net->core.sysctl_hdr = register_net_sysctl_table(net,
Pavel Emelyanov024626e2007-12-08 00:09:24 -0800227 net_core_path, tbl);
Pavel Emelyanov8efa6e92008-03-31 19:41:14 -0700228 if (net->core.sysctl_hdr == NULL)
Pavel Emelyanov024626e2007-12-08 00:09:24 -0800229 goto err_reg;
230
231 return 0;
232
233err_reg:
Pavel Emelyanovd5a45022008-05-19 13:49:52 -0700234 if (tbl != netns_core_table)
Pavel Emelyanov024626e2007-12-08 00:09:24 -0800235 kfree(tbl);
236err_dup:
237 return -ENOMEM;
238}
239
240static __net_exit void sysctl_core_net_exit(struct net *net)
241{
242 struct ctl_table *tbl;
243
Pavel Emelyanov8efa6e92008-03-31 19:41:14 -0700244 tbl = net->core.sysctl_hdr->ctl_table_arg;
245 unregister_net_sysctl_table(net->core.sysctl_hdr);
Pavel Emelyanovd5a45022008-05-19 13:49:52 -0700246 BUG_ON(tbl == netns_core_table);
Pavel Emelyanov024626e2007-12-08 00:09:24 -0800247 kfree(tbl);
248}
249
250static __net_initdata struct pernet_operations sysctl_core_ops = {
251 .init = sysctl_core_net_init,
252 .exit = sysctl_core_net_exit,
253};
254
Pavel Emelyanov33eb9cf2007-12-05 01:37:34 -0800255static __init int sysctl_core_init(void)
256{
Alexey Dobriyanb27aead2008-11-25 18:00:48 -0800257 static struct ctl_table empty[1];
258
259 register_sysctl_paths(net_core_path, empty);
Pavel Emelyanovd5a45022008-05-19 13:49:52 -0700260 register_net_sysctl_rotable(net_core_path, net_core_table);
Pavel Emelyanov024626e2007-12-08 00:09:24 -0800261 return register_pernet_subsys(&sysctl_core_ops);
Pavel Emelyanov33eb9cf2007-12-05 01:37:34 -0800262}
263
Alexey Dobriyanb27aead2008-11-25 18:00:48 -0800264fs_initcall(sysctl_core_init);