]>
Commit | Line | Data |
---|---|---|
b2441318 | 1 | // SPDX-License-Identifier: GPL-2.0 |
1da177e4 LT |
2 | /* -*- linux-c -*- |
3 | * sysctl_net_core.c: sysctl interface to net core subsystem. | |
4 | * | |
5 | * Begun April 1, 1996, Mike Shaver. | |
6 | * Added /proc/sys/net/core directory entry (empty =) ). [MS] | |
7 | */ | |
8 | ||
b6459415 | 9 | #include <linux/filter.h> |
1da177e4 LT |
10 | #include <linux/mm.h> |
11 | #include <linux/sysctl.h> | |
1da177e4 | 12 | #include <linux/module.h> |
20380731 | 13 | #include <linux/socket.h> |
a37ae408 | 14 | #include <linux/netdevice.h> |
3fff4c42 | 15 | #include <linux/ratelimit.h> |
fec5e652 | 16 | #include <linux/vmalloc.h> |
33eb9cfc | 17 | #include <linux/init.h> |
5a0e3ad6 | 18 | #include <linux/slab.h> |
605cfa1b | 19 | #include <linux/sched/isolation.h> |
3fff4c42 | 20 | |
63d819ca | 21 | #include <net/ip.h> |
20380731 | 22 | #include <net/sock.h> |
c5c177b4 | 23 | #include <net/net_ratelimit.h> |
076bb0c8 | 24 | #include <net/busy_poll.h> |
6da7c8fc | 25 | #include <net/pkt_sched.h> |
1da177e4 | 26 | |
6264f58c JK |
27 | #include "dev.h" |
28 | ||
5aa3afe1 | 29 | static int int_3600 = 3600; |
b1cb59cf AK |
30 | static int min_sndbuf = SOCK_MIN_SNDBUF; |
31 | static int min_rcvbuf = SOCK_MIN_RCVBUF; | |
5f74f82e | 32 | static int max_skb_frags = MAX_SKB_FRAGS; |
cdda8891 | 33 | |
ba7a46f1 JP |
34 | static int net_msg_warn; /* Unused, but still a sysctl */ |
35 | ||
79134e6c ED |
36 | int sysctl_fb_tunnels_only_for_init_net __read_mostly = 0; |
37 | EXPORT_SYMBOL(sysctl_fb_tunnels_only_for_init_net); | |
38 | ||
856c395c CW |
39 | /* 0 - Keep current behavior: |
40 | * IPv4: inherit all current settings from init_net | |
41 | * IPv6: reset all settings to default | |
42 | * 1 - Both inherit all current settings from init_net | |
43 | * 2 - Both reset all settings to default | |
9efd6a3c | 44 | * 3 - Both inherit all settings from current netns |
856c395c CW |
45 | */ |
46 | int sysctl_devconf_inherit_init_net __read_mostly; | |
47 | EXPORT_SYMBOL(sysctl_devconf_inherit_init_net); | |
48 | ||
605cfa1b | 49 | #if IS_ENABLED(CONFIG_NET_FLOW_LIMIT) || IS_ENABLED(CONFIG_RPS) |
135746c6 PA |
50 | static void dump_cpumask(void *buffer, size_t *lenp, loff_t *ppos, |
51 | struct cpumask *mask) | |
52 | { | |
53 | char kbuf[128]; | |
54 | int len; | |
55 | ||
56 | if (*ppos || !*lenp) { | |
57 | *lenp = 0; | |
58 | return; | |
59 | } | |
60 | ||
61 | len = min(sizeof(kbuf) - 1, *lenp); | |
62 | len = scnprintf(kbuf, len, "%*pb", cpumask_pr_args(mask)); | |
63 | if (!len) { | |
64 | *lenp = 0; | |
65 | return; | |
66 | } | |
67 | ||
68 | if (len < *lenp) | |
69 | kbuf[len++] = '\n'; | |
70 | memcpy(buffer, kbuf, len); | |
71 | *lenp = len; | |
72 | *ppos += len; | |
73 | } | |
74 | #endif | |
75 | ||
fec5e652 | 76 | #ifdef CONFIG_RPS |
50bcfe8d PA |
77 | |
78 | static struct cpumask *rps_default_mask_cow_alloc(struct net *net) | |
79 | { | |
80 | struct cpumask *rps_default_mask; | |
81 | ||
82 | if (net->core.rps_default_mask) | |
83 | return net->core.rps_default_mask; | |
84 | ||
85 | rps_default_mask = kzalloc(cpumask_size(), GFP_KERNEL); | |
86 | if (!rps_default_mask) | |
87 | return NULL; | |
88 | ||
89 | /* pairs with READ_ONCE in rx_queue_default_mask() */ | |
90 | WRITE_ONCE(net->core.rps_default_mask, rps_default_mask); | |
91 | return rps_default_mask; | |
92 | } | |
605cfa1b PA |
93 | |
94 | static int rps_default_mask_sysctl(struct ctl_table *table, int write, | |
95 | void *buffer, size_t *lenp, loff_t *ppos) | |
96 | { | |
50bcfe8d | 97 | struct net *net = (struct net *)table->data; |
605cfa1b PA |
98 | int err = 0; |
99 | ||
100 | rtnl_lock(); | |
101 | if (write) { | |
50bcfe8d PA |
102 | struct cpumask *rps_default_mask = rps_default_mask_cow_alloc(net); |
103 | ||
104 | err = -ENOMEM; | |
105 | if (!rps_default_mask) | |
106 | goto done; | |
107 | ||
108 | err = cpumask_parse(buffer, rps_default_mask); | |
605cfa1b PA |
109 | if (err) |
110 | goto done; | |
111 | ||
50bcfe8d | 112 | err = rps_cpumask_housekeeping(rps_default_mask); |
605cfa1b PA |
113 | if (err) |
114 | goto done; | |
115 | } else { | |
50bcfe8d PA |
116 | dump_cpumask(buffer, lenp, ppos, |
117 | net->core.rps_default_mask ? : cpu_none_mask); | |
605cfa1b PA |
118 | } |
119 | ||
120 | done: | |
121 | rtnl_unlock(); | |
122 | return err; | |
123 | } | |
124 | ||
fe2c6338 | 125 | static int rps_sock_flow_sysctl(struct ctl_table *table, int write, |
32927393 | 126 | void *buffer, size_t *lenp, loff_t *ppos) |
fec5e652 TH |
127 | { |
128 | unsigned int orig_size, size; | |
129 | int ret, i; | |
fe2c6338 | 130 | struct ctl_table tmp = { |
fec5e652 TH |
131 | .data = &size, |
132 | .maxlen = sizeof(size), | |
133 | .mode = table->mode | |
134 | }; | |
135 | struct rps_sock_flow_table *orig_sock_table, *sock_table; | |
136 | static DEFINE_MUTEX(sock_flow_mutex); | |
137 | ||
138 | mutex_lock(&sock_flow_mutex); | |
139 | ||
6e3f7faf ED |
140 | orig_sock_table = rcu_dereference_protected(rps_sock_flow_table, |
141 | lockdep_is_held(&sock_flow_mutex)); | |
fec5e652 TH |
142 | size = orig_size = orig_sock_table ? orig_sock_table->mask + 1 : 0; |
143 | ||
144 | ret = proc_dointvec(&tmp, write, buffer, lenp, ppos); | |
145 | ||
146 | if (write) { | |
147 | if (size) { | |
93c1af6c | 148 | if (size > 1<<29) { |
fec5e652 TH |
149 | /* Enforce limit to prevent overflow */ |
150 | mutex_unlock(&sock_flow_mutex); | |
151 | return -EINVAL; | |
152 | } | |
153 | size = roundup_pow_of_two(size); | |
154 | if (size != orig_size) { | |
155 | sock_table = | |
156 | vmalloc(RPS_SOCK_FLOW_TABLE_SIZE(size)); | |
157 | if (!sock_table) { | |
158 | mutex_unlock(&sock_flow_mutex); | |
159 | return -ENOMEM; | |
160 | } | |
567e4b79 | 161 | rps_cpu_mask = roundup_pow_of_two(nr_cpu_ids) - 1; |
fec5e652 TH |
162 | sock_table->mask = size - 1; |
163 | } else | |
164 | sock_table = orig_sock_table; | |
165 | ||
166 | for (i = 0; i < size; i++) | |
167 | sock_table->ents[i] = RPS_NO_CPU; | |
168 | } else | |
169 | sock_table = NULL; | |
170 | ||
171 | if (sock_table != orig_sock_table) { | |
172 | rcu_assign_pointer(rps_sock_flow_table, sock_table); | |
13bfff25 | 173 | if (sock_table) { |
dc05360f ED |
174 | static_branch_inc(&rps_needed); |
175 | static_branch_inc(&rfs_needed); | |
13bfff25 | 176 | } |
adc9300e | 177 | if (orig_sock_table) { |
dc05360f ED |
178 | static_branch_dec(&rps_needed); |
179 | static_branch_dec(&rfs_needed); | |
aef3b8b8 | 180 | kvfree_rcu_mightsleep(orig_sock_table); |
adc9300e | 181 | } |
fec5e652 TH |
182 | } |
183 | } | |
184 | ||
185 | mutex_unlock(&sock_flow_mutex); | |
186 | ||
187 | return ret; | |
188 | } | |
189 | #endif /* CONFIG_RPS */ | |
190 | ||
99bbc707 WB |
191 | #ifdef CONFIG_NET_FLOW_LIMIT |
192 | static DEFINE_MUTEX(flow_limit_update_mutex); | |
193 | ||
fe2c6338 | 194 | static int flow_limit_cpu_sysctl(struct ctl_table *table, int write, |
32927393 | 195 | void *buffer, size_t *lenp, loff_t *ppos) |
99bbc707 WB |
196 | { |
197 | struct sd_flow_limit *cur; | |
198 | struct softnet_data *sd; | |
199 | cpumask_var_t mask; | |
200 | int i, len, ret = 0; | |
201 | ||
202 | if (!alloc_cpumask_var(&mask, GFP_KERNEL)) | |
203 | return -ENOMEM; | |
204 | ||
205 | if (write) { | |
56965ac7 | 206 | ret = cpumask_parse(buffer, mask); |
99bbc707 WB |
207 | if (ret) |
208 | goto done; | |
209 | ||
210 | mutex_lock(&flow_limit_update_mutex); | |
211 | len = sizeof(*cur) + netdev_flow_limit_table_len; | |
212 | for_each_possible_cpu(i) { | |
213 | sd = &per_cpu(softnet_data, i); | |
214 | cur = rcu_dereference_protected(sd->flow_limit, | |
215 | lockdep_is_held(&flow_limit_update_mutex)); | |
216 | if (cur && !cpumask_test_cpu(i, mask)) { | |
217 | RCU_INIT_POINTER(sd->flow_limit, NULL); | |
aef3b8b8 | 218 | kfree_rcu_mightsleep(cur); |
99bbc707 | 219 | } else if (!cur && cpumask_test_cpu(i, mask)) { |
5b59d467 ED |
220 | cur = kzalloc_node(len, GFP_KERNEL, |
221 | cpu_to_node(i)); | |
99bbc707 WB |
222 | if (!cur) { |
223 | /* not unwinding previous changes */ | |
224 | ret = -ENOMEM; | |
225 | goto write_unlock; | |
226 | } | |
227 | cur->num_buckets = netdev_flow_limit_table_len; | |
228 | rcu_assign_pointer(sd->flow_limit, cur); | |
229 | } | |
230 | } | |
231 | write_unlock: | |
232 | mutex_unlock(&flow_limit_update_mutex); | |
233 | } else { | |
99bbc707 WB |
234 | cpumask_clear(mask); |
235 | rcu_read_lock(); | |
236 | for_each_possible_cpu(i) { | |
237 | sd = &per_cpu(softnet_data, i); | |
238 | if (rcu_dereference(sd->flow_limit)) | |
239 | cpumask_set_cpu(i, mask); | |
240 | } | |
241 | rcu_read_unlock(); | |
242 | ||
135746c6 | 243 | dump_cpumask(buffer, lenp, ppos, mask); |
99bbc707 WB |
244 | } |
245 | ||
246 | done: | |
247 | free_cpumask_var(mask); | |
248 | return ret; | |
249 | } | |
250 | ||
fe2c6338 | 251 | static int flow_limit_table_len_sysctl(struct ctl_table *table, int write, |
32927393 | 252 | void *buffer, size_t *lenp, loff_t *ppos) |
99bbc707 WB |
253 | { |
254 | unsigned int old, *ptr; | |
255 | int ret; | |
256 | ||
257 | mutex_lock(&flow_limit_update_mutex); | |
258 | ||
259 | ptr = table->data; | |
260 | old = *ptr; | |
261 | ret = proc_dointvec(table, write, buffer, lenp, ppos); | |
262 | if (!ret && write && !is_power_of_2(*ptr)) { | |
263 | *ptr = old; | |
264 | ret = -EINVAL; | |
265 | } | |
266 | ||
267 | mutex_unlock(&flow_limit_update_mutex); | |
268 | return ret; | |
269 | } | |
270 | #endif /* CONFIG_NET_FLOW_LIMIT */ | |
271 | ||
6da7c8fc | 272 | #ifdef CONFIG_NET_SCHED |
273 | static int set_default_qdisc(struct ctl_table *table, int write, | |
32927393 | 274 | void *buffer, size_t *lenp, loff_t *ppos) |
6da7c8fc | 275 | { |
276 | char id[IFNAMSIZ]; | |
277 | struct ctl_table tbl = { | |
278 | .data = id, | |
279 | .maxlen = IFNAMSIZ, | |
280 | }; | |
281 | int ret; | |
282 | ||
283 | qdisc_get_default(id, IFNAMSIZ); | |
284 | ||
285 | ret = proc_dostring(&tbl, write, buffer, lenp, ppos); | |
286 | if (write && ret == 0) | |
287 | ret = qdisc_set_default(id); | |
288 | return ret; | |
289 | } | |
290 | #endif | |
291 | ||
3d48b53f | 292 | static int proc_do_dev_weight(struct ctl_table *table, int write, |
32927393 | 293 | void *buffer, size_t *lenp, loff_t *ppos) |
3d48b53f | 294 | { |
bf955b5a KI |
295 | static DEFINE_MUTEX(dev_weight_mutex); |
296 | int ret, weight; | |
3d48b53f | 297 | |
bf955b5a | 298 | mutex_lock(&dev_weight_mutex); |
3d48b53f | 299 | ret = proc_dointvec(table, write, buffer, lenp, ppos); |
bf955b5a KI |
300 | if (!ret && write) { |
301 | weight = READ_ONCE(weight_p); | |
302 | WRITE_ONCE(dev_rx_weight, weight * dev_weight_rx_bias); | |
303 | WRITE_ONCE(dev_tx_weight, weight * dev_weight_tx_bias); | |
304 | } | |
305 | mutex_unlock(&dev_weight_mutex); | |
3d48b53f MT |
306 | |
307 | return ret; | |
308 | } | |
309 | ||
960fb622 | 310 | static int proc_do_rss_key(struct ctl_table *table, int write, |
32927393 | 311 | void *buffer, size_t *lenp, loff_t *ppos) |
960fb622 ED |
312 | { |
313 | struct ctl_table fake_table; | |
314 | char buf[NETDEV_RSS_KEY_LEN * 3]; | |
315 | ||
316 | snprintf(buf, sizeof(buf), "%*phC", NETDEV_RSS_KEY_LEN, netdev_rss_key); | |
317 | fake_table.data = buf; | |
318 | fake_table.maxlen = sizeof(buf); | |
319 | return proc_dostring(&fake_table, write, buffer, lenp, ppos); | |
320 | } | |
321 | ||
2e4a3098 DB |
322 | #ifdef CONFIG_BPF_JIT |
323 | static int proc_dointvec_minmax_bpf_enable(struct ctl_table *table, int write, | |
32927393 | 324 | void *buffer, size_t *lenp, |
2e4a3098 DB |
325 | loff_t *ppos) |
326 | { | |
327 | int ret, jit_enable = *(int *)table->data; | |
174efa78 TY |
328 | int min = *(int *)table->extra1; |
329 | int max = *(int *)table->extra2; | |
2e4a3098 DB |
330 | struct ctl_table tmp = *table; |
331 | ||
332 | if (write && !capable(CAP_SYS_ADMIN)) | |
333 | return -EPERM; | |
334 | ||
335 | tmp.data = &jit_enable; | |
336 | ret = proc_dointvec_minmax(&tmp, write, buffer, lenp, ppos); | |
337 | if (write && !ret) { | |
338 | if (jit_enable < 2 || | |
63960260 | 339 | (jit_enable == 2 && bpf_dump_raw_ok(current_cred()))) { |
2e4a3098 DB |
340 | *(int *)table->data = jit_enable; |
341 | if (jit_enable == 2) | |
342 | pr_warn("bpf_jit_enable = 2 was set! NEVER use this in production, only for JIT debugging!\n"); | |
343 | } else { | |
344 | ret = -EPERM; | |
345 | } | |
346 | } | |
174efa78 TY |
347 | |
348 | if (write && ret && min == max) | |
349 | pr_info_once("CONFIG_BPF_JIT_ALWAYS_ON is enabled, bpf_jit_enable is permanently set to 1.\n"); | |
350 | ||
2e4a3098 DB |
351 | return ret; |
352 | } | |
353 | ||
1148f9ad | 354 | # ifdef CONFIG_HAVE_EBPF_JIT |
2e4a3098 DB |
355 | static int |
356 | proc_dointvec_minmax_bpf_restricted(struct ctl_table *table, int write, | |
32927393 | 357 | void *buffer, size_t *lenp, loff_t *ppos) |
2e4a3098 DB |
358 | { |
359 | if (!capable(CAP_SYS_ADMIN)) | |
360 | return -EPERM; | |
361 | ||
362 | return proc_dointvec_minmax(table, write, buffer, lenp, ppos); | |
363 | } | |
1148f9ad | 364 | # endif /* CONFIG_HAVE_EBPF_JIT */ |
fdadd049 DB |
365 | |
366 | static int | |
367 | proc_dolongvec_minmax_bpf_restricted(struct ctl_table *table, int write, | |
32927393 | 368 | void *buffer, size_t *lenp, loff_t *ppos) |
fdadd049 DB |
369 | { |
370 | if (!capable(CAP_SYS_ADMIN)) | |
371 | return -EPERM; | |
372 | ||
373 | return proc_doulongvec_minmax(table, write, buffer, lenp, ppos); | |
374 | } | |
2e4a3098 DB |
375 | #endif |
376 | ||
33eb9cfc | 377 | static struct ctl_table net_core_table[] = { |
1da177e4 | 378 | { |
1da177e4 LT |
379 | .procname = "wmem_max", |
380 | .data = &sysctl_wmem_max, | |
381 | .maxlen = sizeof(int), | |
382 | .mode = 0644, | |
cdda8891 | 383 | .proc_handler = proc_dointvec_minmax, |
b1cb59cf | 384 | .extra1 = &min_sndbuf, |
1da177e4 LT |
385 | }, |
386 | { | |
1da177e4 LT |
387 | .procname = "rmem_max", |
388 | .data = &sysctl_rmem_max, | |
389 | .maxlen = sizeof(int), | |
390 | .mode = 0644, | |
cdda8891 | 391 | .proc_handler = proc_dointvec_minmax, |
b1cb59cf | 392 | .extra1 = &min_rcvbuf, |
1da177e4 LT |
393 | }, |
394 | { | |
1da177e4 LT |
395 | .procname = "wmem_default", |
396 | .data = &sysctl_wmem_default, | |
397 | .maxlen = sizeof(int), | |
398 | .mode = 0644, | |
cdda8891 | 399 | .proc_handler = proc_dointvec_minmax, |
b1cb59cf | 400 | .extra1 = &min_sndbuf, |
1da177e4 LT |
401 | }, |
402 | { | |
1da177e4 LT |
403 | .procname = "rmem_default", |
404 | .data = &sysctl_rmem_default, | |
405 | .maxlen = sizeof(int), | |
406 | .mode = 0644, | |
cdda8891 | 407 | .proc_handler = proc_dointvec_minmax, |
b1cb59cf | 408 | .extra1 = &min_rcvbuf, |
1da177e4 LT |
409 | }, |
410 | { | |
1da177e4 LT |
411 | .procname = "dev_weight", |
412 | .data = &weight_p, | |
413 | .maxlen = sizeof(int), | |
414 | .mode = 0644, | |
3d48b53f MT |
415 | .proc_handler = proc_do_dev_weight, |
416 | }, | |
417 | { | |
418 | .procname = "dev_weight_rx_bias", | |
419 | .data = &dev_weight_rx_bias, | |
420 | .maxlen = sizeof(int), | |
421 | .mode = 0644, | |
422 | .proc_handler = proc_do_dev_weight, | |
423 | }, | |
424 | { | |
425 | .procname = "dev_weight_tx_bias", | |
426 | .data = &dev_weight_tx_bias, | |
427 | .maxlen = sizeof(int), | |
428 | .mode = 0644, | |
429 | .proc_handler = proc_do_dev_weight, | |
1da177e4 LT |
430 | }, |
431 | { | |
1da177e4 LT |
432 | .procname = "netdev_max_backlog", |
433 | .data = &netdev_max_backlog, | |
434 | .maxlen = sizeof(int), | |
435 | .mode = 0644, | |
6d9f239a | 436 | .proc_handler = proc_dointvec |
1da177e4 | 437 | }, |
960fb622 ED |
438 | { |
439 | .procname = "netdev_rss_key", | |
440 | .data = &netdev_rss_key, | |
441 | .maxlen = sizeof(int), | |
442 | .mode = 0444, | |
443 | .proc_handler = proc_do_rss_key, | |
444 | }, | |
0a14842f ED |
445 | #ifdef CONFIG_BPF_JIT |
446 | { | |
447 | .procname = "bpf_jit_enable", | |
448 | .data = &bpf_jit_enable, | |
449 | .maxlen = sizeof(int), | |
450 | .mode = 0644, | |
2e4a3098 | 451 | .proc_handler = proc_dointvec_minmax_bpf_enable, |
fa9dd599 | 452 | # ifdef CONFIG_BPF_JIT_ALWAYS_ON |
eec4844f MC |
453 | .extra1 = SYSCTL_ONE, |
454 | .extra2 = SYSCTL_ONE, | |
fa9dd599 | 455 | # else |
eec4844f | 456 | .extra1 = SYSCTL_ZERO, |
bd8a5367 | 457 | .extra2 = SYSCTL_TWO, |
fa9dd599 | 458 | # endif |
0a14842f | 459 | }, |
4f3446bb DB |
460 | # ifdef CONFIG_HAVE_EBPF_JIT |
461 | { | |
462 | .procname = "bpf_jit_harden", | |
463 | .data = &bpf_jit_harden, | |
464 | .maxlen = sizeof(int), | |
465 | .mode = 0600, | |
2e4a3098 | 466 | .proc_handler = proc_dointvec_minmax_bpf_restricted, |
eec4844f | 467 | .extra1 = SYSCTL_ZERO, |
bd8a5367 | 468 | .extra2 = SYSCTL_TWO, |
4f3446bb | 469 | }, |
74451e66 DB |
470 | { |
471 | .procname = "bpf_jit_kallsyms", | |
472 | .data = &bpf_jit_kallsyms, | |
473 | .maxlen = sizeof(int), | |
474 | .mode = 0600, | |
2e4a3098 | 475 | .proc_handler = proc_dointvec_minmax_bpf_restricted, |
eec4844f MC |
476 | .extra1 = SYSCTL_ZERO, |
477 | .extra2 = SYSCTL_ONE, | |
74451e66 | 478 | }, |
4f3446bb | 479 | # endif |
ede95a63 DB |
480 | { |
481 | .procname = "bpf_jit_limit", | |
482 | .data = &bpf_jit_limit, | |
fdadd049 | 483 | .maxlen = sizeof(long), |
ede95a63 | 484 | .mode = 0600, |
fdadd049 | 485 | .proc_handler = proc_dolongvec_minmax_bpf_restricted, |
bd8a5367 | 486 | .extra1 = SYSCTL_LONG_ONE, |
fadb7ff1 | 487 | .extra2 = &bpf_jit_limit_max, |
ede95a63 | 488 | }, |
0a14842f | 489 | #endif |
3b098e2d ED |
490 | { |
491 | .procname = "netdev_tstamp_prequeue", | |
492 | .data = &netdev_tstamp_prequeue, | |
493 | .maxlen = sizeof(int), | |
494 | .mode = 0644, | |
495 | .proc_handler = proc_dointvec | |
496 | }, | |
1da177e4 | 497 | { |
1da177e4 | 498 | .procname = "message_cost", |
717115e1 | 499 | .data = &net_ratelimit_state.interval, |
1da177e4 LT |
500 | .maxlen = sizeof(int), |
501 | .mode = 0644, | |
6d9f239a | 502 | .proc_handler = proc_dointvec_jiffies, |
1da177e4 LT |
503 | }, |
504 | { | |
1da177e4 | 505 | .procname = "message_burst", |
717115e1 | 506 | .data = &net_ratelimit_state.burst, |
1da177e4 LT |
507 | .maxlen = sizeof(int), |
508 | .mode = 0644, | |
6d9f239a | 509 | .proc_handler = proc_dointvec, |
1da177e4 | 510 | }, |
b245be1f WB |
511 | { |
512 | .procname = "tstamp_allow_data", | |
513 | .data = &sysctl_tstamp_allow_data, | |
514 | .maxlen = sizeof(int), | |
515 | .mode = 0644, | |
516 | .proc_handler = proc_dointvec_minmax, | |
eec4844f MC |
517 | .extra1 = SYSCTL_ZERO, |
518 | .extra2 = SYSCTL_ONE | |
b245be1f | 519 | }, |
fec5e652 TH |
520 | #ifdef CONFIG_RPS |
521 | { | |
522 | .procname = "rps_sock_flow_entries", | |
523 | .maxlen = sizeof(int), | |
524 | .mode = 0644, | |
525 | .proc_handler = rps_sock_flow_sysctl | |
526 | }, | |
527 | #endif | |
99bbc707 WB |
528 | #ifdef CONFIG_NET_FLOW_LIMIT |
529 | { | |
530 | .procname = "flow_limit_cpu_bitmap", | |
531 | .mode = 0644, | |
532 | .proc_handler = flow_limit_cpu_sysctl | |
533 | }, | |
534 | { | |
535 | .procname = "flow_limit_table_len", | |
536 | .data = &netdev_flow_limit_table_len, | |
537 | .maxlen = sizeof(int), | |
538 | .mode = 0644, | |
539 | .proc_handler = flow_limit_table_len_sysctl | |
540 | }, | |
541 | #endif /* CONFIG_NET_FLOW_LIMIT */ | |
e0d1095a | 542 | #ifdef CONFIG_NET_RX_BUSY_POLL |
06021292 | 543 | { |
64b0dc51 ET |
544 | .procname = "busy_poll", |
545 | .data = &sysctl_net_busy_poll, | |
eb6db622 | 546 | .maxlen = sizeof(unsigned int), |
06021292 | 547 | .mode = 0644, |
95f25521 | 548 | .proc_handler = proc_dointvec_minmax, |
eec4844f | 549 | .extra1 = SYSCTL_ZERO, |
06021292 | 550 | }, |
2d48d67f | 551 | { |
64b0dc51 ET |
552 | .procname = "busy_read", |
553 | .data = &sysctl_net_busy_read, | |
2d48d67f ET |
554 | .maxlen = sizeof(unsigned int), |
555 | .mode = 0644, | |
95f25521 | 556 | .proc_handler = proc_dointvec_minmax, |
eec4844f | 557 | .extra1 = SYSCTL_ZERO, |
2d48d67f | 558 | }, |
6da7c8fc | 559 | #endif |
560 | #ifdef CONFIG_NET_SCHED | |
561 | { | |
562 | .procname = "default_qdisc", | |
563 | .mode = 0644, | |
564 | .maxlen = IFNAMSIZ, | |
565 | .proc_handler = set_default_qdisc | |
566 | }, | |
06021292 | 567 | #endif |
51b0bded | 568 | { |
51b0bded SH |
569 | .procname = "netdev_budget", |
570 | .data = &netdev_budget, | |
571 | .maxlen = sizeof(int), | |
572 | .mode = 0644, | |
6d9f239a | 573 | .proc_handler = proc_dointvec |
51b0bded | 574 | }, |
a2a316fd | 575 | { |
a2a316fd SH |
576 | .procname = "warnings", |
577 | .data = &net_msg_warn, | |
578 | .maxlen = sizeof(int), | |
579 | .mode = 0644, | |
6d9f239a | 580 | .proc_handler = proc_dointvec |
a2a316fd | 581 | }, |
5f74f82e HWR |
582 | { |
583 | .procname = "max_skb_frags", | |
584 | .data = &sysctl_max_skb_frags, | |
585 | .maxlen = sizeof(int), | |
586 | .mode = 0644, | |
587 | .proc_handler = proc_dointvec_minmax, | |
eec4844f | 588 | .extra1 = SYSCTL_ONE, |
5f74f82e HWR |
589 | .extra2 = &max_skb_frags, |
590 | }, | |
7acf8a1e MW |
591 | { |
592 | .procname = "netdev_budget_usecs", | |
593 | .data = &netdev_budget_usecs, | |
594 | .maxlen = sizeof(unsigned int), | |
595 | .mode = 0644, | |
596 | .proc_handler = proc_dointvec_minmax, | |
eec4844f | 597 | .extra1 = SYSCTL_ZERO, |
7acf8a1e | 598 | }, |
79134e6c ED |
599 | { |
600 | .procname = "fb_tunnels_only_for_init_net", | |
601 | .data = &sysctl_fb_tunnels_only_for_init_net, | |
602 | .maxlen = sizeof(int), | |
603 | .mode = 0644, | |
604 | .proc_handler = proc_dointvec_minmax, | |
eec4844f | 605 | .extra1 = SYSCTL_ZERO, |
bd8a5367 | 606 | .extra2 = SYSCTL_TWO, |
79134e6c | 607 | }, |
856c395c CW |
608 | { |
609 | .procname = "devconf_inherit_init_net", | |
610 | .data = &sysctl_devconf_inherit_init_net, | |
611 | .maxlen = sizeof(int), | |
612 | .mode = 0644, | |
613 | .proc_handler = proc_dointvec_minmax, | |
eec4844f | 614 | .extra1 = SYSCTL_ZERO, |
4c7f24f8 | 615 | .extra2 = SYSCTL_THREE, |
856c395c | 616 | }, |
ce27ec60 ED |
617 | { |
618 | .procname = "high_order_alloc_disable", | |
619 | .data = &net_high_order_alloc_disable_key.key, | |
620 | .maxlen = sizeof(net_high_order_alloc_disable_key), | |
621 | .mode = 0644, | |
622 | .proc_handler = proc_do_static_key, | |
623 | }, | |
323ebb61 EC |
624 | { |
625 | .procname = "gro_normal_batch", | |
626 | .data = &gro_normal_batch, | |
627 | .maxlen = sizeof(unsigned int), | |
628 | .mode = 0644, | |
629 | .proc_handler = proc_dointvec_minmax, | |
630 | .extra1 = SYSCTL_ONE, | |
631 | }, | |
5aa3afe1 DV |
632 | { |
633 | .procname = "netdev_unregister_timeout_secs", | |
634 | .data = &netdev_unregister_timeout_secs, | |
635 | .maxlen = sizeof(unsigned int), | |
636 | .mode = 0644, | |
637 | .proc_handler = proc_dointvec_minmax, | |
6c996e19 | 638 | .extra1 = SYSCTL_ONE, |
5aa3afe1 DV |
639 | .extra2 = &int_3600, |
640 | }, | |
39564c3f ED |
641 | { |
642 | .procname = "skb_defer_max", | |
643 | .data = &sysctl_skb_defer_max, | |
644 | .maxlen = sizeof(unsigned int), | |
645 | .mode = 0644, | |
646 | .proc_handler = proc_dointvec_minmax, | |
647 | .extra1 = SYSCTL_ZERO, | |
648 | }, | |
f8572d8f | 649 | { } |
1da177e4 | 650 | }; |
33eb9cfc | 651 | |
d5a4502e | 652 | static struct ctl_table netns_core_table[] = { |
50bcfe8d PA |
653 | #if IS_ENABLED(CONFIG_RPS) |
654 | { | |
655 | .procname = "rps_default_mask", | |
656 | .data = &init_net, | |
657 | .mode = 0644, | |
658 | .proc_handler = rps_default_mask_sysctl | |
659 | }, | |
660 | #endif | |
d5a4502e | 661 | { |
d5a4502e PE |
662 | .procname = "somaxconn", |
663 | .data = &init_net.core.sysctl_somaxconn, | |
664 | .maxlen = sizeof(int), | |
665 | .mode = 0644, | |
eec4844f | 666 | .extra1 = SYSCTL_ZERO, |
5f671d6b | 667 | .proc_handler = proc_dointvec_minmax |
d5a4502e | 668 | }, |
f5769fae ED |
669 | { |
670 | .procname = "optmem_max", | |
671 | .data = &init_net.core.sysctl_optmem_max, | |
672 | .maxlen = sizeof(int), | |
673 | .mode = 0644, | |
674 | .extra1 = SYSCTL_ZERO, | |
675 | .proc_handler = proc_dointvec_minmax | |
676 | }, | |
e187013a AK |
677 | { |
678 | .procname = "txrehash", | |
679 | .data = &init_net.core.sysctl_txrehash, | |
680 | .maxlen = sizeof(u8), | |
681 | .mode = 0644, | |
682 | .extra1 = SYSCTL_ZERO, | |
683 | .extra2 = SYSCTL_ONE, | |
684 | .proc_handler = proc_dou8vec_minmax, | |
685 | }, | |
f8572d8f | 686 | { } |
d5a4502e PE |
687 | }; |
688 | ||
316cdaa1 MB |
689 | static int __init fb_tunnels_only_for_init_net_sysctl_setup(char *str) |
690 | { | |
691 | /* fallback tunnels for initns only */ | |
692 | if (!strncmp(str, "initns", 6)) | |
693 | sysctl_fb_tunnels_only_for_init_net = 1; | |
694 | /* no fallback tunnels anywhere */ | |
695 | else if (!strncmp(str, "none", 4)) | |
696 | sysctl_fb_tunnels_only_for_init_net = 2; | |
697 | ||
698 | return 1; | |
699 | } | |
700 | __setup("fb_tunnels=", fb_tunnels_only_for_init_net_sysctl_setup); | |
701 | ||
024626e3 | 702 | static __net_init int sysctl_core_net_init(struct net *net) |
33eb9cfc | 703 | { |
e187013a | 704 | struct ctl_table *tbl, *tmp; |
024626e3 | 705 | |
d5a4502e | 706 | tbl = netns_core_table; |
09ad9bc7 | 707 | if (!net_eq(net, &init_net)) { |
d5a4502e | 708 | tbl = kmemdup(tbl, sizeof(netns_core_table), GFP_KERNEL); |
024626e3 PE |
709 | if (tbl == NULL) |
710 | goto err_dup; | |
711 | ||
e187013a AK |
712 | for (tmp = tbl; tmp->procname; tmp++) |
713 | tmp->data += (char *)net - (char *)&init_net; | |
024626e3 PE |
714 | } |
715 | ||
c899710f JG |
716 | net->core.sysctl_hdr = register_net_sysctl_sz(net, "net/core", tbl, |
717 | ARRAY_SIZE(netns_core_table)); | |
8efa6e93 | 718 | if (net->core.sysctl_hdr == NULL) |
024626e3 | 719 | goto err_reg; |
33eb9cfc | 720 | |
024626e3 PE |
721 | return 0; |
722 | ||
723 | err_reg: | |
d5a4502e | 724 | if (tbl != netns_core_table) |
024626e3 PE |
725 | kfree(tbl); |
726 | err_dup: | |
727 | return -ENOMEM; | |
728 | } | |
729 | ||
730 | static __net_exit void sysctl_core_net_exit(struct net *net) | |
731 | { | |
732 | struct ctl_table *tbl; | |
733 | ||
8efa6e93 PE |
734 | tbl = net->core.sysctl_hdr->ctl_table_arg; |
735 | unregister_net_sysctl_table(net->core.sysctl_hdr); | |
d5a4502e | 736 | BUG_ON(tbl == netns_core_table); |
50bcfe8d PA |
737 | #if IS_ENABLED(CONFIG_RPS) |
738 | kfree(net->core.rps_default_mask); | |
739 | #endif | |
024626e3 PE |
740 | kfree(tbl); |
741 | } | |
742 | ||
743 | static __net_initdata struct pernet_operations sysctl_core_ops = { | |
744 | .init = sysctl_core_net_init, | |
745 | .exit = sysctl_core_net_exit, | |
746 | }; | |
747 | ||
748 | static __init int sysctl_core_init(void) | |
749 | { | |
43444757 | 750 | register_net_sysctl(&init_net, "net/core", net_core_table); |
024626e3 | 751 | return register_pernet_subsys(&sysctl_core_ops); |
33eb9cfc PE |
752 | } |
753 | ||
b27aeadb | 754 | fs_initcall(sysctl_core_init); |