Merge 4.14.31 into android-4.14
[GitHub/moto-9609/android_kernel_motorola_exynos9610.git] / kernel / sysctl.c
1 /*
2 * sysctl.c: General linux system control interface
3 *
4 * Begun 24 March 1995, Stephen Tweedie
5 * Added /proc support, Dec 1995
6 * Added bdflush entry and intvec min/max checking, 2/23/96, Tom Dyas.
7 * Added hooks for /proc/sys/net (minor, minor patch), 96/4/1, Mike Shaver.
8 * Added kernel/java-{interpreter,appletviewer}, 96/5/10, Mike Shaver.
9 * Dynamic registration fixes, Stephen Tweedie.
10 * Added kswapd-interval, ctrl-alt-del, printk stuff, 1/8/97, Chris Horn.
11 * Made sysctl support optional via CONFIG_SYSCTL, 1/10/97, Chris
12 * Horn.
13 * Added proc_doulongvec_ms_jiffies_minmax, 09/08/99, Carlos H. Bauer.
14 * Added proc_doulongvec_minmax, 09/08/99, Carlos H. Bauer.
15 * Changed linked lists to use list.h instead of lists.h, 02/24/00, Bill
16 * Wendling.
17 * The list_for_each() macro wasn't appropriate for the sysctl loop.
18 * Removed it and replaced it with older style, 03/23/00, Bill Wendling
19 */
20
21 #include <linux/module.h>
22 #include <linux/aio.h>
23 #include <linux/mm.h>
24 #include <linux/swap.h>
25 #include <linux/slab.h>
26 #include <linux/sysctl.h>
27 #include <linux/bitmap.h>
28 #include <linux/signal.h>
29 #include <linux/printk.h>
30 #include <linux/proc_fs.h>
31 #include <linux/security.h>
32 #include <linux/ctype.h>
33 #include <linux/kmemleak.h>
34 #include <linux/fs.h>
35 #include <linux/init.h>
36 #include <linux/kernel.h>
37 #include <linux/kobject.h>
38 #include <linux/net.h>
39 #include <linux/sysrq.h>
40 #include <linux/highuid.h>
41 #include <linux/writeback.h>
42 #include <linux/ratelimit.h>
43 #include <linux/compaction.h>
44 #include <linux/hugetlb.h>
45 #include <linux/initrd.h>
46 #include <linux/key.h>
47 #include <linux/times.h>
48 #include <linux/limits.h>
49 #include <linux/dcache.h>
50 #include <linux/dnotify.h>
51 #include <linux/syscalls.h>
52 #include <linux/vmstat.h>
53 #include <linux/nfs_fs.h>
54 #include <linux/acpi.h>
55 #include <linux/reboot.h>
56 #include <linux/ftrace.h>
57 #include <linux/perf_event.h>
58 #include <linux/kprobes.h>
59 #include <linux/pipe_fs_i.h>
60 #include <linux/oom.h>
61 #include <linux/kmod.h>
62 #include <linux/capability.h>
63 #include <linux/binfmts.h>
64 #include <linux/sched/sysctl.h>
65 #include <linux/sched/coredump.h>
66 #include <linux/kexec.h>
67 #include <linux/bpf.h>
68 #include <linux/mount.h>
69
70 #include <linux/uaccess.h>
71 #include <asm/processor.h>
72
73 #ifdef CONFIG_X86
74 #include <asm/nmi.h>
75 #include <asm/stacktrace.h>
76 #include <asm/io.h>
77 #endif
78 #ifdef CONFIG_SPARC
79 #include <asm/setup.h>
80 #endif
81 #ifdef CONFIG_BSD_PROCESS_ACCT
82 #include <linux/acct.h>
83 #endif
84 #ifdef CONFIG_RT_MUTEXES
85 #include <linux/rtmutex.h>
86 #endif
87 #if defined(CONFIG_PROVE_LOCKING) || defined(CONFIG_LOCK_STAT)
88 #include <linux/lockdep.h>
89 #endif
90 #ifdef CONFIG_CHR_DEV_SG
91 #include <scsi/sg.h>
92 #endif
93
94 #ifdef CONFIG_LOCKUP_DETECTOR
95 #include <linux/nmi.h>
96 #endif
97
98 #if defined(CONFIG_SYSCTL)
99
/* External variables that are not declared in any header file. */
extern int suid_dumpable;
#ifdef CONFIG_COREDUMP
extern int core_uses_pid;
extern char core_pattern[];
extern unsigned int core_pipe_limit;
#endif /* CONFIG_COREDUMP */
extern int pid_max;
extern int pid_max_min;
extern int pid_max_max;
extern int percpu_pagelist_fraction;
extern int latencytop_enabled;
extern unsigned int sysctl_nr_open_min;
extern unsigned int sysctl_nr_open_max;
#ifndef CONFIG_MMU
extern int sysctl_nr_trim_pages;
#endif /* !CONFIG_MMU */
115
116 /* Constants used for minimum and maximum */
117 #ifdef CONFIG_LOCKUP_DETECTOR
118 static int sixty = 60;
119 #endif
120
121 static int __maybe_unused neg_one = -1;
122
123 static int zero;
124 static int __maybe_unused one = 1;
125 static int __maybe_unused two = 2;
126 static int __maybe_unused four = 4;
127 static unsigned long one_ul = 1;
128 static int one_hundred = 100;
129 static int one_thousand = 1000;
130 #ifdef CONFIG_PRINTK
131 static int ten_thousand = 10000;
132 #endif
133 #ifdef CONFIG_PERF_EVENTS
134 static int six_hundred_forty_kb = 640 * 1024;
135 #endif
136
137 /* this is needed for the proc_doulongvec_minmax of vm_dirty_bytes */
138 static unsigned long dirty_bytes_min = 2 * PAGE_SIZE;
139
140 /* this is needed for the proc_dointvec_minmax for [fs_]overflow UID and GID */
141 static int maxolduid = 65535;
142 static int minolduid;
143
144 static int ngroups_max = NGROUPS_MAX;
145 static const int cap_last_cap = CAP_LAST_CAP;
146
147 /*this is needed for proc_doulongvec_minmax of sysctl_hung_task_timeout_secs */
148 #ifdef CONFIG_DETECT_HUNG_TASK
149 static unsigned long hung_task_timeout_max = (LONG_MAX/HZ);
150 #endif
151
152 #ifdef CONFIG_INOTIFY_USER
153 #include <linux/inotify.h>
154 #endif
155 #ifdef CONFIG_SPARC
156 #endif
157
/* Architecture- and option-specific variables declared without a header. */
#ifdef __hppa__
extern int pwrsw_enabled;
#endif /* __hppa__ */

#ifdef CONFIG_SYSCTL_ARCH_UNALIGN_ALLOW
extern int unaligned_enabled;
#endif /* CONFIG_SYSCTL_ARCH_UNALIGN_ALLOW */

#ifdef CONFIG_IA64
extern int unaligned_dump_stack;
#endif /* CONFIG_IA64 */

#ifdef CONFIG_SYSCTL_ARCH_UNALIGN_NO_WARN
extern int no_unaligned_warning;
#endif /* CONFIG_SYSCTL_ARCH_UNALIGN_NO_WARN */
173
174 #ifdef CONFIG_PROC_SYSCTL
175
/**
 * enum sysctl_writes_mode - supported sysctl write modes
 *
 * @SYSCTL_WRITES_LEGACY: each write syscall must fully contain the sysctl value
 *	to be written, and multiple writes on the same sysctl file descriptor
 *	will rewrite the sysctl value, regardless of file position. No warning
 *	is issued when the initial position is not 0.
 * @SYSCTL_WRITES_WARN: same as above but warn when the initial file position is
 *	not 0.
 * @SYSCTL_WRITES_STRICT: writes to numeric sysctl entries must always be at
 *	file position 0 and the value must be fully contained in the buffer
 *	sent to the write syscall. When dealing with strings, respect the file
 *	position, but restrict this to the max length of the buffer; anything
 *	past the max length will be ignored. Multiple writes will append
 *	to the buffer.
 *
 * These write modes control how current file position affects the behavior of
 * updating sysctl values through the proc interface on each write.
 */
enum sysctl_writes_mode {
	SYSCTL_WRITES_LEGACY		= -1,
	SYSCTL_WRITES_WARN		= 0,
	SYSCTL_WRITES_STRICT		= 1,
};
200
201 static enum sysctl_writes_mode sysctl_writes_strict = SYSCTL_WRITES_STRICT;
202
203 static int proc_do_cad_pid(struct ctl_table *table, int write,
204 void __user *buffer, size_t *lenp, loff_t *ppos);
205 static int proc_taint(struct ctl_table *table, int write,
206 void __user *buffer, size_t *lenp, loff_t *ppos);
207 #endif
208
209 #ifdef CONFIG_PRINTK
210 static int proc_dointvec_minmax_sysadmin(struct ctl_table *table, int write,
211 void __user *buffer, size_t *lenp, loff_t *ppos);
212 #endif
213
214 static int proc_dointvec_minmax_coredump(struct ctl_table *table, int write,
215 void __user *buffer, size_t *lenp, loff_t *ppos);
216 #ifdef CONFIG_COREDUMP
217 static int proc_dostring_coredump(struct ctl_table *table, int write,
218 void __user *buffer, size_t *lenp, loff_t *ppos);
219 #endif
220
#ifdef CONFIG_MAGIC_SYSRQ
/* Note: the sysrq code uses its own private copy */
static int __sysrq_enabled = CONFIG_MAGIC_SYSRQ_DEFAULT_ENABLE;

/*
 * Handler for the "sysrq" entry.  proc_dointvec() performs the actual
 * read or write; once a write has succeeded, the current value of
 * __sysrq_enabled is handed to sysrq_toggle_support().
 *
 * Returns 0 on success, otherwise the error reported by proc_dointvec().
 */
static int sysrq_sysctl_handler(struct ctl_table *table, int write,
				void __user *buffer, size_t *lenp,
				loff_t *ppos)
{
	int ret = proc_dointvec(table, write, buffer, lenp, ppos);

	/* Only a successful write changes the sysrq state. */
	if (!ret && write)
		sysrq_toggle_support(__sysrq_enabled);

	return ret;
}

#endif /* CONFIG_MAGIC_SYSRQ */
242
243 static struct ctl_table kern_table[];
244 static struct ctl_table vm_table[];
245 static struct ctl_table fs_table[];
246 static struct ctl_table debug_table[];
247 static struct ctl_table dev_table[];
248 extern struct ctl_table random_table[];
249 #ifdef CONFIG_EPOLL
250 extern struct ctl_table epoll_table[];
251 #endif
252
253 #ifdef HAVE_ARCH_PICK_MMAP_LAYOUT
254 int sysctl_legacy_va_layout;
255 #endif
256
257 /* The default sysctl tables: */
258
259 static struct ctl_table sysctl_base_table[] = {
260 {
261 .procname = "kernel",
262 .mode = 0555,
263 .child = kern_table,
264 },
265 {
266 .procname = "vm",
267 .mode = 0555,
268 .child = vm_table,
269 },
270 {
271 .procname = "fs",
272 .mode = 0555,
273 .child = fs_table,
274 },
275 {
276 .procname = "debug",
277 .mode = 0555,
278 .child = debug_table,
279 },
280 {
281 .procname = "dev",
282 .mode = 0555,
283 .child = dev_table,
284 },
285 { }
286 };
287
/* Bounds referenced by the scheduler debug entries of kern_table. */
#ifdef CONFIG_SCHED_DEBUG
static int min_sched_granularity_ns = 100000;		/* 100 usecs */
static int max_sched_granularity_ns = NSEC_PER_SEC;	/* 1 second */
static int min_wakeup_granularity_ns;			/* 0 usecs */
static int max_wakeup_granularity_ns = NSEC_PER_SEC;	/* 1 second */
#ifdef CONFIG_SMP
static int min_sched_tunable_scaling = SCHED_TUNABLESCALING_NONE;
static int max_sched_tunable_scaling = SCHED_TUNABLESCALING_END - 1;
#endif /* CONFIG_SMP */
#endif /* CONFIG_SCHED_DEBUG */

/* Bounds for the external fragmentation threshold. */
#ifdef CONFIG_COMPACTION
static int min_extfrag_threshold;
static int max_extfrag_threshold = 1000;
#endif /* CONFIG_COMPACTION */
303
304 static struct ctl_table kern_table[] = {
305 {
306 .procname = "sched_child_runs_first",
307 .data = &sysctl_sched_child_runs_first,
308 .maxlen = sizeof(unsigned int),
309 .mode = 0644,
310 .proc_handler = proc_dointvec,
311 },
312 #ifdef CONFIG_SCHED_DEBUG
313 {
314 .procname = "sched_min_granularity_ns",
315 .data = &sysctl_sched_min_granularity,
316 .maxlen = sizeof(unsigned int),
317 .mode = 0644,
318 .proc_handler = sched_proc_update_handler,
319 .extra1 = &min_sched_granularity_ns,
320 .extra2 = &max_sched_granularity_ns,
321 },
322 {
323 .procname = "sched_latency_ns",
324 .data = &sysctl_sched_latency,
325 .maxlen = sizeof(unsigned int),
326 .mode = 0644,
327 .proc_handler = sched_proc_update_handler,
328 .extra1 = &min_sched_granularity_ns,
329 .extra2 = &max_sched_granularity_ns,
330 },
331 #ifdef CONFIG_SCHED_WALT
332 {
333 .procname = "sched_use_walt_cpu_util",
334 .data = &sysctl_sched_use_walt_cpu_util,
335 .maxlen = sizeof(unsigned int),
336 .mode = 0644,
337 .proc_handler = proc_dointvec,
338 },
339 {
340 .procname = "sched_use_walt_task_util",
341 .data = &sysctl_sched_use_walt_task_util,
342 .maxlen = sizeof(unsigned int),
343 .mode = 0644,
344 .proc_handler = proc_dointvec,
345 },
346 {
347 .procname = "sched_walt_init_task_load_pct",
348 .data = &sysctl_sched_walt_init_task_load_pct,
349 .maxlen = sizeof(unsigned int),
350 .mode = 0644,
351 .proc_handler = proc_dointvec,
352 },
353 {
354 .procname = "sched_walt_cpu_high_irqload",
355 .data = &sysctl_sched_walt_cpu_high_irqload,
356 .maxlen = sizeof(unsigned int),
357 .mode = 0644,
358 .proc_handler = proc_dointvec,
359 },
360 #endif
361 {
362 .procname = "sched_sync_hint_enable",
363 .data = &sysctl_sched_sync_hint_enable,
364 .maxlen = sizeof(unsigned int),
365 .mode = 0644,
366 .proc_handler = proc_dointvec,
367 },
368 {
369 .procname = "sched_cstate_aware",
370 .data = &sysctl_sched_cstate_aware,
371 .maxlen = sizeof(unsigned int),
372 .mode = 0644,
373 .proc_handler = proc_dointvec,
374 },
375 {
376 .procname = "sched_wakeup_granularity_ns",
377 .data = &sysctl_sched_wakeup_granularity,
378 .maxlen = sizeof(unsigned int),
379 .mode = 0644,
380 .proc_handler = sched_proc_update_handler,
381 .extra1 = &min_wakeup_granularity_ns,
382 .extra2 = &max_wakeup_granularity_ns,
383 },
384 #ifdef CONFIG_SMP
385 {
386 .procname = "sched_tunable_scaling",
387 .data = &sysctl_sched_tunable_scaling,
388 .maxlen = sizeof(enum sched_tunable_scaling),
389 .mode = 0644,
390 .proc_handler = sched_proc_update_handler,
391 .extra1 = &min_sched_tunable_scaling,
392 .extra2 = &max_sched_tunable_scaling,
393 },
394 {
395 .procname = "sched_migration_cost_ns",
396 .data = &sysctl_sched_migration_cost,
397 .maxlen = sizeof(unsigned int),
398 .mode = 0644,
399 .proc_handler = proc_dointvec,
400 },
401 {
402 .procname = "sched_nr_migrate",
403 .data = &sysctl_sched_nr_migrate,
404 .maxlen = sizeof(unsigned int),
405 .mode = 0644,
406 .proc_handler = proc_dointvec,
407 },
408 {
409 .procname = "sched_time_avg_ms",
410 .data = &sysctl_sched_time_avg,
411 .maxlen = sizeof(unsigned int),
412 .mode = 0644,
413 .proc_handler = proc_dointvec_minmax,
414 .extra1 = &one,
415 },
416 #ifdef CONFIG_SCHEDSTATS
417 {
418 .procname = "sched_schedstats",
419 .data = NULL,
420 .maxlen = sizeof(unsigned int),
421 .mode = 0644,
422 .proc_handler = sysctl_schedstats,
423 .extra1 = &zero,
424 .extra2 = &one,
425 },
426 #endif /* CONFIG_SCHEDSTATS */
427 #endif /* CONFIG_SMP */
428 #ifdef CONFIG_NUMA_BALANCING
429 {
430 .procname = "numa_balancing_scan_delay_ms",
431 .data = &sysctl_numa_balancing_scan_delay,
432 .maxlen = sizeof(unsigned int),
433 .mode = 0644,
434 .proc_handler = proc_dointvec,
435 },
436 {
437 .procname = "numa_balancing_scan_period_min_ms",
438 .data = &sysctl_numa_balancing_scan_period_min,
439 .maxlen = sizeof(unsigned int),
440 .mode = 0644,
441 .proc_handler = proc_dointvec,
442 },
443 {
444 .procname = "numa_balancing_scan_period_max_ms",
445 .data = &sysctl_numa_balancing_scan_period_max,
446 .maxlen = sizeof(unsigned int),
447 .mode = 0644,
448 .proc_handler = proc_dointvec,
449 },
450 {
451 .procname = "numa_balancing_scan_size_mb",
452 .data = &sysctl_numa_balancing_scan_size,
453 .maxlen = sizeof(unsigned int),
454 .mode = 0644,
455 .proc_handler = proc_dointvec_minmax,
456 .extra1 = &one,
457 },
458 {
459 .procname = "numa_balancing",
460 .data = NULL, /* filled in by handler */
461 .maxlen = sizeof(unsigned int),
462 .mode = 0644,
463 .proc_handler = sysctl_numa_balancing,
464 .extra1 = &zero,
465 .extra2 = &one,
466 },
467 #endif /* CONFIG_NUMA_BALANCING */
468 #endif /* CONFIG_SCHED_DEBUG */
469 {
470 .procname = "sched_rt_period_us",
471 .data = &sysctl_sched_rt_period,
472 .maxlen = sizeof(unsigned int),
473 .mode = 0644,
474 .proc_handler = sched_rt_handler,
475 },
476 {
477 .procname = "sched_rt_runtime_us",
478 .data = &sysctl_sched_rt_runtime,
479 .maxlen = sizeof(int),
480 .mode = 0644,
481 .proc_handler = sched_rt_handler,
482 },
483 {
484 .procname = "sched_rr_timeslice_ms",
485 .data = &sysctl_sched_rr_timeslice,
486 .maxlen = sizeof(int),
487 .mode = 0644,
488 .proc_handler = sched_rr_handler,
489 },
490 #ifdef CONFIG_SCHED_AUTOGROUP
491 {
492 .procname = "sched_autogroup_enabled",
493 .data = &sysctl_sched_autogroup_enabled,
494 .maxlen = sizeof(unsigned int),
495 .mode = 0644,
496 .proc_handler = proc_dointvec_minmax,
497 .extra1 = &zero,
498 .extra2 = &one,
499 },
500 #endif
501 #ifdef CONFIG_CFS_BANDWIDTH
502 {
503 .procname = "sched_cfs_bandwidth_slice_us",
504 .data = &sysctl_sched_cfs_bandwidth_slice,
505 .maxlen = sizeof(unsigned int),
506 .mode = 0644,
507 .proc_handler = proc_dointvec_minmax,
508 .extra1 = &one,
509 },
510 #endif
511 #ifdef CONFIG_PROVE_LOCKING
512 {
513 .procname = "prove_locking",
514 .data = &prove_locking,
515 .maxlen = sizeof(int),
516 .mode = 0644,
517 .proc_handler = proc_dointvec,
518 },
519 #endif
520 #ifdef CONFIG_LOCK_STAT
521 {
522 .procname = "lock_stat",
523 .data = &lock_stat,
524 .maxlen = sizeof(int),
525 .mode = 0644,
526 .proc_handler = proc_dointvec,
527 },
528 #endif
529 {
530 .procname = "panic",
531 .data = &panic_timeout,
532 .maxlen = sizeof(int),
533 .mode = 0644,
534 .proc_handler = proc_dointvec,
535 },
536 #ifdef CONFIG_COREDUMP
537 {
538 .procname = "core_uses_pid",
539 .data = &core_uses_pid,
540 .maxlen = sizeof(int),
541 .mode = 0644,
542 .proc_handler = proc_dointvec,
543 },
544 {
545 .procname = "core_pattern",
546 .data = core_pattern,
547 .maxlen = CORENAME_MAX_SIZE,
548 .mode = 0644,
549 .proc_handler = proc_dostring_coredump,
550 },
551 {
552 .procname = "core_pipe_limit",
553 .data = &core_pipe_limit,
554 .maxlen = sizeof(unsigned int),
555 .mode = 0644,
556 .proc_handler = proc_dointvec,
557 },
558 #endif
559 #ifdef CONFIG_PROC_SYSCTL
560 {
561 .procname = "tainted",
562 .maxlen = sizeof(long),
563 .mode = 0644,
564 .proc_handler = proc_taint,
565 },
566 {
567 .procname = "sysctl_writes_strict",
568 .data = &sysctl_writes_strict,
569 .maxlen = sizeof(int),
570 .mode = 0644,
571 .proc_handler = proc_dointvec_minmax,
572 .extra1 = &neg_one,
573 .extra2 = &one,
574 },
575 #endif
576 #ifdef CONFIG_LATENCYTOP
577 {
578 .procname = "latencytop",
579 .data = &latencytop_enabled,
580 .maxlen = sizeof(int),
581 .mode = 0644,
582 .proc_handler = sysctl_latencytop,
583 },
584 #endif
585 #ifdef CONFIG_BLK_DEV_INITRD
586 {
587 .procname = "real-root-dev",
588 .data = &real_root_dev,
589 .maxlen = sizeof(int),
590 .mode = 0644,
591 .proc_handler = proc_dointvec,
592 },
593 #endif
594 {
595 .procname = "print-fatal-signals",
596 .data = &print_fatal_signals,
597 .maxlen = sizeof(int),
598 .mode = 0644,
599 .proc_handler = proc_dointvec,
600 },
601 #ifdef CONFIG_SPARC
602 {
603 .procname = "reboot-cmd",
604 .data = reboot_command,
605 .maxlen = 256,
606 .mode = 0644,
607 .proc_handler = proc_dostring,
608 },
609 {
610 .procname = "stop-a",
611 .data = &stop_a_enabled,
612 .maxlen = sizeof (int),
613 .mode = 0644,
614 .proc_handler = proc_dointvec,
615 },
616 {
617 .procname = "scons-poweroff",
618 .data = &scons_pwroff,
619 .maxlen = sizeof (int),
620 .mode = 0644,
621 .proc_handler = proc_dointvec,
622 },
623 #endif
624 #ifdef CONFIG_SPARC64
625 {
626 .procname = "tsb-ratio",
627 .data = &sysctl_tsb_ratio,
628 .maxlen = sizeof (int),
629 .mode = 0644,
630 .proc_handler = proc_dointvec,
631 },
632 #endif
633 #ifdef __hppa__
634 {
635 .procname = "soft-power",
636 .data = &pwrsw_enabled,
637 .maxlen = sizeof (int),
638 .mode = 0644,
639 .proc_handler = proc_dointvec,
640 },
641 #endif
642 #ifdef CONFIG_SYSCTL_ARCH_UNALIGN_ALLOW
643 {
644 .procname = "unaligned-trap",
645 .data = &unaligned_enabled,
646 .maxlen = sizeof (int),
647 .mode = 0644,
648 .proc_handler = proc_dointvec,
649 },
650 #endif
651 {
652 .procname = "ctrl-alt-del",
653 .data = &C_A_D,
654 .maxlen = sizeof(int),
655 .mode = 0644,
656 .proc_handler = proc_dointvec,
657 },
658 #ifdef CONFIG_FUNCTION_TRACER
659 {
660 .procname = "ftrace_enabled",
661 .data = &ftrace_enabled,
662 .maxlen = sizeof(int),
663 .mode = 0644,
664 .proc_handler = ftrace_enable_sysctl,
665 },
666 #endif
667 #ifdef CONFIG_STACK_TRACER
668 {
669 .procname = "stack_tracer_enabled",
670 .data = &stack_tracer_enabled,
671 .maxlen = sizeof(int),
672 .mode = 0644,
673 .proc_handler = stack_trace_sysctl,
674 },
675 #endif
676 #ifdef CONFIG_TRACING
677 {
678 .procname = "ftrace_dump_on_oops",
679 .data = &ftrace_dump_on_oops,
680 .maxlen = sizeof(int),
681 .mode = 0644,
682 .proc_handler = proc_dointvec,
683 },
684 {
685 .procname = "traceoff_on_warning",
686 .data = &__disable_trace_on_warning,
687 .maxlen = sizeof(__disable_trace_on_warning),
688 .mode = 0644,
689 .proc_handler = proc_dointvec,
690 },
691 {
692 .procname = "tracepoint_printk",
693 .data = &tracepoint_printk,
694 .maxlen = sizeof(tracepoint_printk),
695 .mode = 0644,
696 .proc_handler = tracepoint_printk_sysctl,
697 },
698 #endif
699 #ifdef CONFIG_KEXEC_CORE
700 {
701 .procname = "kexec_load_disabled",
702 .data = &kexec_load_disabled,
703 .maxlen = sizeof(int),
704 .mode = 0644,
705 /* only handle a transition from default "0" to "1" */
706 .proc_handler = proc_dointvec_minmax,
707 .extra1 = &one,
708 .extra2 = &one,
709 },
710 #endif
711 #ifdef CONFIG_MODULES
712 {
713 .procname = "modprobe",
714 .data = &modprobe_path,
715 .maxlen = KMOD_PATH_LEN,
716 .mode = 0644,
717 .proc_handler = proc_dostring,
718 },
719 {
720 .procname = "modules_disabled",
721 .data = &modules_disabled,
722 .maxlen = sizeof(int),
723 .mode = 0644,
724 /* only handle a transition from default "0" to "1" */
725 .proc_handler = proc_dointvec_minmax,
726 .extra1 = &one,
727 .extra2 = &one,
728 },
729 #endif
730 #ifdef CONFIG_UEVENT_HELPER
731 {
732 .procname = "hotplug",
733 .data = &uevent_helper,
734 .maxlen = UEVENT_HELPER_PATH_LEN,
735 .mode = 0644,
736 .proc_handler = proc_dostring,
737 },
738 #endif
739 #ifdef CONFIG_CHR_DEV_SG
740 {
741 .procname = "sg-big-buff",
742 .data = &sg_big_buff,
743 .maxlen = sizeof (int),
744 .mode = 0444,
745 .proc_handler = proc_dointvec,
746 },
747 #endif
748 #ifdef CONFIG_BSD_PROCESS_ACCT
749 {
750 .procname = "acct",
751 .data = &acct_parm,
752 .maxlen = 3*sizeof(int),
753 .mode = 0644,
754 .proc_handler = proc_dointvec,
755 },
756 #endif
757 #ifdef CONFIG_MAGIC_SYSRQ
758 {
759 .procname = "sysrq",
760 .data = &__sysrq_enabled,
761 .maxlen = sizeof (int),
762 .mode = 0644,
763 .proc_handler = sysrq_sysctl_handler,
764 },
765 #endif
766 #ifdef CONFIG_PROC_SYSCTL
767 {
768 .procname = "cad_pid",
769 .data = NULL,
770 .maxlen = sizeof (int),
771 .mode = 0600,
772 .proc_handler = proc_do_cad_pid,
773 },
774 #endif
775 {
776 .procname = "threads-max",
777 .data = NULL,
778 .maxlen = sizeof(int),
779 .mode = 0644,
780 .proc_handler = sysctl_max_threads,
781 },
782 {
783 .procname = "random",
784 .mode = 0555,
785 .child = random_table,
786 },
787 {
788 .procname = "usermodehelper",
789 .mode = 0555,
790 .child = usermodehelper_table,
791 },
792 {
793 .procname = "overflowuid",
794 .data = &overflowuid,
795 .maxlen = sizeof(int),
796 .mode = 0644,
797 .proc_handler = proc_dointvec_minmax,
798 .extra1 = &minolduid,
799 .extra2 = &maxolduid,
800 },
801 {
802 .procname = "overflowgid",
803 .data = &overflowgid,
804 .maxlen = sizeof(int),
805 .mode = 0644,
806 .proc_handler = proc_dointvec_minmax,
807 .extra1 = &minolduid,
808 .extra2 = &maxolduid,
809 },
810 #ifdef CONFIG_S390
811 #ifdef CONFIG_MATHEMU
812 {
813 .procname = "ieee_emulation_warnings",
814 .data = &sysctl_ieee_emulation_warnings,
815 .maxlen = sizeof(int),
816 .mode = 0644,
817 .proc_handler = proc_dointvec,
818 },
819 #endif
820 {
821 .procname = "userprocess_debug",
822 .data = &show_unhandled_signals,
823 .maxlen = sizeof(int),
824 .mode = 0644,
825 .proc_handler = proc_dointvec,
826 },
827 #endif
828 {
829 .procname = "pid_max",
830 .data = &pid_max,
831 .maxlen = sizeof (int),
832 .mode = 0644,
833 .proc_handler = proc_dointvec_minmax,
834 .extra1 = &pid_max_min,
835 .extra2 = &pid_max_max,
836 },
837 {
838 .procname = "panic_on_oops",
839 .data = &panic_on_oops,
840 .maxlen = sizeof(int),
841 .mode = 0644,
842 .proc_handler = proc_dointvec,
843 },
844 #if defined CONFIG_PRINTK
845 {
846 .procname = "printk",
847 .data = &console_loglevel,
848 .maxlen = 4*sizeof(int),
849 .mode = 0644,
850 .proc_handler = proc_dointvec,
851 },
852 {
853 .procname = "printk_ratelimit",
854 .data = &printk_ratelimit_state.interval,
855 .maxlen = sizeof(int),
856 .mode = 0644,
857 .proc_handler = proc_dointvec_jiffies,
858 },
859 {
860 .procname = "printk_ratelimit_burst",
861 .data = &printk_ratelimit_state.burst,
862 .maxlen = sizeof(int),
863 .mode = 0644,
864 .proc_handler = proc_dointvec,
865 },
866 {
867 .procname = "printk_delay",
868 .data = &printk_delay_msec,
869 .maxlen = sizeof(int),
870 .mode = 0644,
871 .proc_handler = proc_dointvec_minmax,
872 .extra1 = &zero,
873 .extra2 = &ten_thousand,
874 },
875 {
876 .procname = "printk_devkmsg",
877 .data = devkmsg_log_str,
878 .maxlen = DEVKMSG_STR_MAX_SIZE,
879 .mode = 0644,
880 .proc_handler = devkmsg_sysctl_set_loglvl,
881 },
882 {
883 .procname = "dmesg_restrict",
884 .data = &dmesg_restrict,
885 .maxlen = sizeof(int),
886 .mode = 0644,
887 .proc_handler = proc_dointvec_minmax_sysadmin,
888 .extra1 = &zero,
889 .extra2 = &one,
890 },
891 {
892 .procname = "kptr_restrict",
893 .data = &kptr_restrict,
894 .maxlen = sizeof(int),
895 .mode = 0644,
896 .proc_handler = proc_dointvec_minmax_sysadmin,
897 .extra1 = &zero,
898 .extra2 = &two,
899 },
900 #endif
901 {
902 .procname = "ngroups_max",
903 .data = &ngroups_max,
904 .maxlen = sizeof (int),
905 .mode = 0444,
906 .proc_handler = proc_dointvec,
907 },
908 {
909 .procname = "cap_last_cap",
910 .data = (void *)&cap_last_cap,
911 .maxlen = sizeof(int),
912 .mode = 0444,
913 .proc_handler = proc_dointvec,
914 },
915 #if defined(CONFIG_LOCKUP_DETECTOR)
916 {
917 .procname = "watchdog",
918 .data = &watchdog_user_enabled,
919 .maxlen = sizeof(int),
920 .mode = 0644,
921 .proc_handler = proc_watchdog,
922 .extra1 = &zero,
923 .extra2 = &one,
924 },
925 {
926 .procname = "watchdog_thresh",
927 .data = &watchdog_thresh,
928 .maxlen = sizeof(int),
929 .mode = 0644,
930 .proc_handler = proc_watchdog_thresh,
931 .extra1 = &zero,
932 .extra2 = &sixty,
933 },
934 {
935 .procname = "nmi_watchdog",
936 .data = &nmi_watchdog_user_enabled,
937 .maxlen = sizeof(int),
938 .mode = NMI_WATCHDOG_SYSCTL_PERM,
939 .proc_handler = proc_nmi_watchdog,
940 .extra1 = &zero,
941 .extra2 = &one,
942 },
943 {
944 .procname = "watchdog_cpumask",
945 .data = &watchdog_cpumask_bits,
946 .maxlen = NR_CPUS,
947 .mode = 0644,
948 .proc_handler = proc_watchdog_cpumask,
949 },
950 #ifdef CONFIG_SOFTLOCKUP_DETECTOR
951 {
952 .procname = "soft_watchdog",
953 .data = &soft_watchdog_user_enabled,
954 .maxlen = sizeof(int),
955 .mode = 0644,
956 .proc_handler = proc_soft_watchdog,
957 .extra1 = &zero,
958 .extra2 = &one,
959 },
960 {
961 .procname = "softlockup_panic",
962 .data = &softlockup_panic,
963 .maxlen = sizeof(int),
964 .mode = 0644,
965 .proc_handler = proc_dointvec_minmax,
966 .extra1 = &zero,
967 .extra2 = &one,
968 },
969 #ifdef CONFIG_SMP
970 {
971 .procname = "softlockup_all_cpu_backtrace",
972 .data = &sysctl_softlockup_all_cpu_backtrace,
973 .maxlen = sizeof(int),
974 .mode = 0644,
975 .proc_handler = proc_dointvec_minmax,
976 .extra1 = &zero,
977 .extra2 = &one,
978 },
979 #endif /* CONFIG_SMP */
980 #endif
981 #ifdef CONFIG_HARDLOCKUP_DETECTOR
982 {
983 .procname = "hardlockup_panic",
984 .data = &hardlockup_panic,
985 .maxlen = sizeof(int),
986 .mode = 0644,
987 .proc_handler = proc_dointvec_minmax,
988 .extra1 = &zero,
989 .extra2 = &one,
990 },
991 #ifdef CONFIG_SMP
992 {
993 .procname = "hardlockup_all_cpu_backtrace",
994 .data = &sysctl_hardlockup_all_cpu_backtrace,
995 .maxlen = sizeof(int),
996 .mode = 0644,
997 .proc_handler = proc_dointvec_minmax,
998 .extra1 = &zero,
999 .extra2 = &one,
1000 },
1001 #endif /* CONFIG_SMP */
1002 #endif
1003 #endif
1004
1005 #if defined(CONFIG_X86_LOCAL_APIC) && defined(CONFIG_X86)
1006 {
1007 .procname = "unknown_nmi_panic",
1008 .data = &unknown_nmi_panic,
1009 .maxlen = sizeof (int),
1010 .mode = 0644,
1011 .proc_handler = proc_dointvec,
1012 },
1013 #endif
1014 #if defined(CONFIG_X86)
1015 {
1016 .procname = "panic_on_unrecovered_nmi",
1017 .data = &panic_on_unrecovered_nmi,
1018 .maxlen = sizeof(int),
1019 .mode = 0644,
1020 .proc_handler = proc_dointvec,
1021 },
1022 {
1023 .procname = "panic_on_io_nmi",
1024 .data = &panic_on_io_nmi,
1025 .maxlen = sizeof(int),
1026 .mode = 0644,
1027 .proc_handler = proc_dointvec,
1028 },
1029 #ifdef CONFIG_DEBUG_STACKOVERFLOW
1030 {
1031 .procname = "panic_on_stackoverflow",
1032 .data = &sysctl_panic_on_stackoverflow,
1033 .maxlen = sizeof(int),
1034 .mode = 0644,
1035 .proc_handler = proc_dointvec,
1036 },
1037 #endif
1038 {
1039 .procname = "bootloader_type",
1040 .data = &bootloader_type,
1041 .maxlen = sizeof (int),
1042 .mode = 0444,
1043 .proc_handler = proc_dointvec,
1044 },
1045 {
1046 .procname = "bootloader_version",
1047 .data = &bootloader_version,
1048 .maxlen = sizeof (int),
1049 .mode = 0444,
1050 .proc_handler = proc_dointvec,
1051 },
1052 {
1053 .procname = "io_delay_type",
1054 .data = &io_delay_type,
1055 .maxlen = sizeof(int),
1056 .mode = 0644,
1057 .proc_handler = proc_dointvec,
1058 },
1059 #endif
1060 #if defined(CONFIG_MMU)
1061 {
1062 .procname = "randomize_va_space",
1063 .data = &randomize_va_space,
1064 .maxlen = sizeof(int),
1065 .mode = 0644,
1066 .proc_handler = proc_dointvec,
1067 },
1068 #endif
1069 #if defined(CONFIG_S390) && defined(CONFIG_SMP)
1070 {
1071 .procname = "spin_retry",
1072 .data = &spin_retry,
1073 .maxlen = sizeof (int),
1074 .mode = 0644,
1075 .proc_handler = proc_dointvec,
1076 },
1077 #endif
1078 #if defined(CONFIG_ACPI_SLEEP) && defined(CONFIG_X86)
1079 {
1080 .procname = "acpi_video_flags",
1081 .data = &acpi_realmode_flags,
1082 .maxlen = sizeof (unsigned long),
1083 .mode = 0644,
1084 .proc_handler = proc_doulongvec_minmax,
1085 },
1086 #endif
1087 #ifdef CONFIG_SYSCTL_ARCH_UNALIGN_NO_WARN
1088 {
1089 .procname = "ignore-unaligned-usertrap",
1090 .data = &no_unaligned_warning,
1091 .maxlen = sizeof (int),
1092 .mode = 0644,
1093 .proc_handler = proc_dointvec,
1094 },
1095 #endif
1096 #ifdef CONFIG_IA64
1097 {
1098 .procname = "unaligned-dump-stack",
1099 .data = &unaligned_dump_stack,
1100 .maxlen = sizeof (int),
1101 .mode = 0644,
1102 .proc_handler = proc_dointvec,
1103 },
1104 #endif
1105 #ifdef CONFIG_DETECT_HUNG_TASK
1106 {
1107 .procname = "hung_task_panic",
1108 .data = &sysctl_hung_task_panic,
1109 .maxlen = sizeof(int),
1110 .mode = 0644,
1111 .proc_handler = proc_dointvec_minmax,
1112 .extra1 = &zero,
1113 .extra2 = &one,
1114 },
1115 {
1116 .procname = "hung_task_check_count",
1117 .data = &sysctl_hung_task_check_count,
1118 .maxlen = sizeof(int),
1119 .mode = 0644,
1120 .proc_handler = proc_dointvec_minmax,
1121 .extra1 = &zero,
1122 },
1123 {
1124 .procname = "hung_task_timeout_secs",
1125 .data = &sysctl_hung_task_timeout_secs,
1126 .maxlen = sizeof(unsigned long),
1127 .mode = 0644,
1128 .proc_handler = proc_dohung_task_timeout_secs,
1129 .extra2 = &hung_task_timeout_max,
1130 },
1131 {
1132 .procname = "hung_task_warnings",
1133 .data = &sysctl_hung_task_warnings,
1134 .maxlen = sizeof(int),
1135 .mode = 0644,
1136 .proc_handler = proc_dointvec_minmax,
1137 .extra1 = &neg_one,
1138 },
1139 #endif
1140 #ifdef CONFIG_RT_MUTEXES
1141 {
1142 .procname = "max_lock_depth",
1143 .data = &max_lock_depth,
1144 .maxlen = sizeof(int),
1145 .mode = 0644,
1146 .proc_handler = proc_dointvec,
1147 },
1148 #endif
1149 {
1150 .procname = "poweroff_cmd",
1151 .data = &poweroff_cmd,
1152 .maxlen = POWEROFF_CMD_PATH_LEN,
1153 .mode = 0644,
1154 .proc_handler = proc_dostring,
1155 },
1156 #ifdef CONFIG_KEYS
1157 {
1158 .procname = "keys",
1159 .mode = 0555,
1160 .child = key_sysctls,
1161 },
1162 #endif
1163 #ifdef CONFIG_PERF_EVENTS
1164 /*
1165 * User-space scripts rely on the existence of this file
1166 * as a feature check for perf_events being enabled.
1167 *
1168 * So it's an ABI, do not remove!
1169 */
1170 {
1171 .procname = "perf_event_paranoid",
1172 .data = &sysctl_perf_event_paranoid,
1173 .maxlen = sizeof(sysctl_perf_event_paranoid),
1174 .mode = 0644,
1175 .proc_handler = proc_dointvec,
1176 },
1177 {
1178 .procname = "perf_event_mlock_kb",
1179 .data = &sysctl_perf_event_mlock,
1180 .maxlen = sizeof(sysctl_perf_event_mlock),
1181 .mode = 0644,
1182 .proc_handler = proc_dointvec,
1183 },
1184 {
1185 .procname = "perf_event_max_sample_rate",
1186 .data = &sysctl_perf_event_sample_rate,
1187 .maxlen = sizeof(sysctl_perf_event_sample_rate),
1188 .mode = 0644,
1189 .proc_handler = perf_proc_update_handler,
1190 .extra1 = &one,
1191 },
1192 {
1193 .procname = "perf_cpu_time_max_percent",
1194 .data = &sysctl_perf_cpu_time_max_percent,
1195 .maxlen = sizeof(sysctl_perf_cpu_time_max_percent),
1196 .mode = 0644,
1197 .proc_handler = perf_cpu_time_max_percent_handler,
1198 .extra1 = &zero,
1199 .extra2 = &one_hundred,
1200 },
1201 {
1202 .procname = "perf_event_max_stack",
1203 .data = &sysctl_perf_event_max_stack,
1204 .maxlen = sizeof(sysctl_perf_event_max_stack),
1205 .mode = 0644,
1206 .proc_handler = perf_event_max_stack_handler,
1207 .extra1 = &zero,
1208 .extra2 = &six_hundred_forty_kb,
1209 },
1210 {
1211 .procname = "perf_event_max_contexts_per_stack",
1212 .data = &sysctl_perf_event_max_contexts_per_stack,
1213 .maxlen = sizeof(sysctl_perf_event_max_contexts_per_stack),
1214 .mode = 0644,
1215 .proc_handler = perf_event_max_stack_handler,
1216 .extra1 = &zero,
1217 .extra2 = &one_thousand,
1218 },
1219 #endif
1220 {
1221 .procname = "panic_on_warn",
1222 .data = &panic_on_warn,
1223 .maxlen = sizeof(int),
1224 .mode = 0644,
1225 .proc_handler = proc_dointvec_minmax,
1226 .extra1 = &zero,
1227 .extra2 = &one,
1228 },
1229 #if defined(CONFIG_SMP) && defined(CONFIG_NO_HZ_COMMON)
1230 {
1231 .procname = "timer_migration",
1232 .data = &sysctl_timer_migration,
1233 .maxlen = sizeof(unsigned int),
1234 .mode = 0644,
1235 .proc_handler = timer_migration_handler,
1236 .extra1 = &zero,
1237 .extra2 = &one,
1238 },
1239 #endif
1240 #ifdef CONFIG_BPF_SYSCALL
1241 {
1242 .procname = "unprivileged_bpf_disabled",
1243 .data = &sysctl_unprivileged_bpf_disabled,
1244 .maxlen = sizeof(sysctl_unprivileged_bpf_disabled),
1245 .mode = 0644,
1246 /* only handle a transition from default "0" to "1" */
1247 .proc_handler = proc_dointvec_minmax,
1248 .extra1 = &one,
1249 .extra2 = &one,
1250 },
1251 #endif
1252 #if defined(CONFIG_TREE_RCU) || defined(CONFIG_PREEMPT_RCU)
1253 {
1254 .procname = "panic_on_rcu_stall",
1255 .data = &sysctl_panic_on_rcu_stall,
1256 .maxlen = sizeof(sysctl_panic_on_rcu_stall),
1257 .mode = 0644,
1258 .proc_handler = proc_dointvec_minmax,
1259 .extra1 = &zero,
1260 .extra2 = &one,
1261 },
1262 #endif
1263 { }
1264 };
1265
1266 static struct ctl_table vm_table[] = {
1267 {
1268 .procname = "overcommit_memory",
1269 .data = &sysctl_overcommit_memory,
1270 .maxlen = sizeof(sysctl_overcommit_memory),
1271 .mode = 0644,
1272 .proc_handler = proc_dointvec_minmax,
1273 .extra1 = &zero,
1274 .extra2 = &two,
1275 },
1276 {
1277 .procname = "panic_on_oom",
1278 .data = &sysctl_panic_on_oom,
1279 .maxlen = sizeof(sysctl_panic_on_oom),
1280 .mode = 0644,
1281 .proc_handler = proc_dointvec_minmax,
1282 .extra1 = &zero,
1283 .extra2 = &two,
1284 },
1285 {
1286 .procname = "oom_kill_allocating_task",
1287 .data = &sysctl_oom_kill_allocating_task,
1288 .maxlen = sizeof(sysctl_oom_kill_allocating_task),
1289 .mode = 0644,
1290 .proc_handler = proc_dointvec,
1291 },
1292 {
1293 .procname = "oom_dump_tasks",
1294 .data = &sysctl_oom_dump_tasks,
1295 .maxlen = sizeof(sysctl_oom_dump_tasks),
1296 .mode = 0644,
1297 .proc_handler = proc_dointvec,
1298 },
1299 {
1300 .procname = "overcommit_ratio",
1301 .data = &sysctl_overcommit_ratio,
1302 .maxlen = sizeof(sysctl_overcommit_ratio),
1303 .mode = 0644,
1304 .proc_handler = overcommit_ratio_handler,
1305 },
1306 {
1307 .procname = "overcommit_kbytes",
1308 .data = &sysctl_overcommit_kbytes,
1309 .maxlen = sizeof(sysctl_overcommit_kbytes),
1310 .mode = 0644,
1311 .proc_handler = overcommit_kbytes_handler,
1312 },
1313 {
1314 .procname = "page-cluster",
1315 .data = &page_cluster,
1316 .maxlen = sizeof(int),
1317 .mode = 0644,
1318 .proc_handler = proc_dointvec_minmax,
1319 .extra1 = &zero,
1320 },
1321 {
1322 .procname = "dirty_background_ratio",
1323 .data = &dirty_background_ratio,
1324 .maxlen = sizeof(dirty_background_ratio),
1325 .mode = 0644,
1326 .proc_handler = dirty_background_ratio_handler,
1327 .extra1 = &zero,
1328 .extra2 = &one_hundred,
1329 },
1330 {
1331 .procname = "dirty_background_bytes",
1332 .data = &dirty_background_bytes,
1333 .maxlen = sizeof(dirty_background_bytes),
1334 .mode = 0644,
1335 .proc_handler = dirty_background_bytes_handler,
1336 .extra1 = &one_ul,
1337 },
1338 {
1339 .procname = "dirty_ratio",
1340 .data = &vm_dirty_ratio,
1341 .maxlen = sizeof(vm_dirty_ratio),
1342 .mode = 0644,
1343 .proc_handler = dirty_ratio_handler,
1344 .extra1 = &zero,
1345 .extra2 = &one_hundred,
1346 },
1347 {
1348 .procname = "dirty_bytes",
1349 .data = &vm_dirty_bytes,
1350 .maxlen = sizeof(vm_dirty_bytes),
1351 .mode = 0644,
1352 .proc_handler = dirty_bytes_handler,
1353 .extra1 = &dirty_bytes_min,
1354 },
1355 {
1356 .procname = "dirty_writeback_centisecs",
1357 .data = &dirty_writeback_interval,
1358 .maxlen = sizeof(dirty_writeback_interval),
1359 .mode = 0644,
1360 .proc_handler = dirty_writeback_centisecs_handler,
1361 },
1362 {
1363 .procname = "dirty_expire_centisecs",
1364 .data = &dirty_expire_interval,
1365 .maxlen = sizeof(dirty_expire_interval),
1366 .mode = 0644,
1367 .proc_handler = proc_dointvec_minmax,
1368 .extra1 = &zero,
1369 },
1370 {
1371 .procname = "dirtytime_expire_seconds",
1372 .data = &dirtytime_expire_interval,
1373 .maxlen = sizeof(dirty_expire_interval),
1374 .mode = 0644,
1375 .proc_handler = dirtytime_interval_handler,
1376 .extra1 = &zero,
1377 },
1378 {
1379 .procname = "nr_pdflush_threads",
1380 .mode = 0444 /* read-only */,
1381 .proc_handler = pdflush_proc_obsolete,
1382 },
1383 {
1384 .procname = "swappiness",
1385 .data = &vm_swappiness,
1386 .maxlen = sizeof(vm_swappiness),
1387 .mode = 0644,
1388 .proc_handler = proc_dointvec_minmax,
1389 .extra1 = &zero,
1390 .extra2 = &one_hundred,
1391 },
1392 #ifdef CONFIG_HUGETLB_PAGE
1393 {
1394 .procname = "nr_hugepages",
1395 .data = NULL,
1396 .maxlen = sizeof(unsigned long),
1397 .mode = 0644,
1398 .proc_handler = hugetlb_sysctl_handler,
1399 },
1400 #ifdef CONFIG_NUMA
1401 {
1402 .procname = "nr_hugepages_mempolicy",
1403 .data = NULL,
1404 .maxlen = sizeof(unsigned long),
1405 .mode = 0644,
1406 .proc_handler = &hugetlb_mempolicy_sysctl_handler,
1407 },
1408 #endif
1409 {
1410 .procname = "hugetlb_shm_group",
1411 .data = &sysctl_hugetlb_shm_group,
1412 .maxlen = sizeof(gid_t),
1413 .mode = 0644,
1414 .proc_handler = proc_dointvec,
1415 },
1416 {
1417 .procname = "hugepages_treat_as_movable",
1418 .data = &hugepages_treat_as_movable,
1419 .maxlen = sizeof(int),
1420 .mode = 0644,
1421 .proc_handler = proc_dointvec,
1422 },
1423 {
1424 .procname = "nr_overcommit_hugepages",
1425 .data = NULL,
1426 .maxlen = sizeof(unsigned long),
1427 .mode = 0644,
1428 .proc_handler = hugetlb_overcommit_handler,
1429 },
1430 #endif
1431 {
1432 .procname = "lowmem_reserve_ratio",
1433 .data = &sysctl_lowmem_reserve_ratio,
1434 .maxlen = sizeof(sysctl_lowmem_reserve_ratio),
1435 .mode = 0644,
1436 .proc_handler = lowmem_reserve_ratio_sysctl_handler,
1437 },
1438 {
1439 .procname = "drop_caches",
1440 .data = &sysctl_drop_caches,
1441 .maxlen = sizeof(int),
1442 .mode = 0644,
1443 .proc_handler = drop_caches_sysctl_handler,
1444 .extra1 = &one,
1445 .extra2 = &four,
1446 },
1447 #ifdef CONFIG_COMPACTION
1448 {
1449 .procname = "compact_memory",
1450 .data = &sysctl_compact_memory,
1451 .maxlen = sizeof(int),
1452 .mode = 0200,
1453 .proc_handler = sysctl_compaction_handler,
1454 },
1455 {
1456 .procname = "extfrag_threshold",
1457 .data = &sysctl_extfrag_threshold,
1458 .maxlen = sizeof(int),
1459 .mode = 0644,
1460 .proc_handler = sysctl_extfrag_handler,
1461 .extra1 = &min_extfrag_threshold,
1462 .extra2 = &max_extfrag_threshold,
1463 },
1464 {
1465 .procname = "compact_unevictable_allowed",
1466 .data = &sysctl_compact_unevictable_allowed,
1467 .maxlen = sizeof(int),
1468 .mode = 0644,
1469 .proc_handler = proc_dointvec,
1470 .extra1 = &zero,
1471 .extra2 = &one,
1472 },
1473
1474 #endif /* CONFIG_COMPACTION */
1475 {
1476 .procname = "min_free_kbytes",
1477 .data = &min_free_kbytes,
1478 .maxlen = sizeof(min_free_kbytes),
1479 .mode = 0644,
1480 .proc_handler = min_free_kbytes_sysctl_handler,
1481 .extra1 = &zero,
1482 },
1483 {
1484 .procname = "watermark_scale_factor",
1485 .data = &watermark_scale_factor,
1486 .maxlen = sizeof(watermark_scale_factor),
1487 .mode = 0644,
1488 .proc_handler = watermark_scale_factor_sysctl_handler,
1489 .extra1 = &one,
1490 .extra2 = &one_thousand,
1491 },
1492 {
1493 .procname = "percpu_pagelist_fraction",
1494 .data = &percpu_pagelist_fraction,
1495 .maxlen = sizeof(percpu_pagelist_fraction),
1496 .mode = 0644,
1497 .proc_handler = percpu_pagelist_fraction_sysctl_handler,
1498 .extra1 = &zero,
1499 },
1500 #ifdef CONFIG_MMU
1501 {
1502 .procname = "max_map_count",
1503 .data = &sysctl_max_map_count,
1504 .maxlen = sizeof(sysctl_max_map_count),
1505 .mode = 0644,
1506 .proc_handler = proc_dointvec_minmax,
1507 .extra1 = &zero,
1508 },
1509 #else
1510 {
1511 .procname = "nr_trim_pages",
1512 .data = &sysctl_nr_trim_pages,
1513 .maxlen = sizeof(sysctl_nr_trim_pages),
1514 .mode = 0644,
1515 .proc_handler = proc_dointvec_minmax,
1516 .extra1 = &zero,
1517 },
1518 #endif
1519 {
1520 .procname = "laptop_mode",
1521 .data = &laptop_mode,
1522 .maxlen = sizeof(laptop_mode),
1523 .mode = 0644,
1524 .proc_handler = proc_dointvec_jiffies,
1525 },
1526 {
1527 .procname = "block_dump",
1528 .data = &block_dump,
1529 .maxlen = sizeof(block_dump),
1530 .mode = 0644,
1531 .proc_handler = proc_dointvec,
1532 .extra1 = &zero,
1533 },
1534 {
1535 .procname = "vfs_cache_pressure",
1536 .data = &sysctl_vfs_cache_pressure,
1537 .maxlen = sizeof(sysctl_vfs_cache_pressure),
1538 .mode = 0644,
1539 .proc_handler = proc_dointvec,
1540 .extra1 = &zero,
1541 },
1542 #ifdef HAVE_ARCH_PICK_MMAP_LAYOUT
1543 {
1544 .procname = "legacy_va_layout",
1545 .data = &sysctl_legacy_va_layout,
1546 .maxlen = sizeof(sysctl_legacy_va_layout),
1547 .mode = 0644,
1548 .proc_handler = proc_dointvec,
1549 .extra1 = &zero,
1550 },
1551 #endif
1552 #ifdef CONFIG_NUMA
1553 {
1554 .procname = "zone_reclaim_mode",
1555 .data = &node_reclaim_mode,
1556 .maxlen = sizeof(node_reclaim_mode),
1557 .mode = 0644,
1558 .proc_handler = proc_dointvec,
1559 .extra1 = &zero,
1560 },
1561 {
1562 .procname = "min_unmapped_ratio",
1563 .data = &sysctl_min_unmapped_ratio,
1564 .maxlen = sizeof(sysctl_min_unmapped_ratio),
1565 .mode = 0644,
1566 .proc_handler = sysctl_min_unmapped_ratio_sysctl_handler,
1567 .extra1 = &zero,
1568 .extra2 = &one_hundred,
1569 },
1570 {
1571 .procname = "min_slab_ratio",
1572 .data = &sysctl_min_slab_ratio,
1573 .maxlen = sizeof(sysctl_min_slab_ratio),
1574 .mode = 0644,
1575 .proc_handler = sysctl_min_slab_ratio_sysctl_handler,
1576 .extra1 = &zero,
1577 .extra2 = &one_hundred,
1578 },
1579 #endif
1580 #ifdef CONFIG_SMP
1581 {
1582 .procname = "stat_interval",
1583 .data = &sysctl_stat_interval,
1584 .maxlen = sizeof(sysctl_stat_interval),
1585 .mode = 0644,
1586 .proc_handler = proc_dointvec_jiffies,
1587 },
1588 {
1589 .procname = "stat_refresh",
1590 .data = NULL,
1591 .maxlen = 0,
1592 .mode = 0600,
1593 .proc_handler = vmstat_refresh,
1594 },
1595 #endif
1596 #ifdef CONFIG_MMU
1597 {
1598 .procname = "mmap_min_addr",
1599 .data = &dac_mmap_min_addr,
1600 .maxlen = sizeof(unsigned long),
1601 .mode = 0644,
1602 .proc_handler = mmap_min_addr_handler,
1603 },
1604 #endif
1605 #ifdef CONFIG_NUMA
1606 {
1607 .procname = "numa_zonelist_order",
1608 .data = &numa_zonelist_order,
1609 .maxlen = NUMA_ZONELIST_ORDER_LEN,
1610 .mode = 0644,
1611 .proc_handler = numa_zonelist_order_handler,
1612 },
1613 #endif
1614 #if (defined(CONFIG_X86_32) && !defined(CONFIG_UML))|| \
1615 (defined(CONFIG_SUPERH) && defined(CONFIG_VSYSCALL))
1616 {
1617 .procname = "vdso_enabled",
1618 #ifdef CONFIG_X86_32
1619 .data = &vdso32_enabled,
1620 .maxlen = sizeof(vdso32_enabled),
1621 #else
1622 .data = &vdso_enabled,
1623 .maxlen = sizeof(vdso_enabled),
1624 #endif
1625 .mode = 0644,
1626 .proc_handler = proc_dointvec,
1627 .extra1 = &zero,
1628 },
1629 #endif
1630 #ifdef CONFIG_HIGHMEM
1631 {
1632 .procname = "highmem_is_dirtyable",
1633 .data = &vm_highmem_is_dirtyable,
1634 .maxlen = sizeof(vm_highmem_is_dirtyable),
1635 .mode = 0644,
1636 .proc_handler = proc_dointvec_minmax,
1637 .extra1 = &zero,
1638 .extra2 = &one,
1639 },
1640 #endif
1641 #ifdef CONFIG_MEMORY_FAILURE
1642 {
1643 .procname = "memory_failure_early_kill",
1644 .data = &sysctl_memory_failure_early_kill,
1645 .maxlen = sizeof(sysctl_memory_failure_early_kill),
1646 .mode = 0644,
1647 .proc_handler = proc_dointvec_minmax,
1648 .extra1 = &zero,
1649 .extra2 = &one,
1650 },
1651 {
1652 .procname = "memory_failure_recovery",
1653 .data = &sysctl_memory_failure_recovery,
1654 .maxlen = sizeof(sysctl_memory_failure_recovery),
1655 .mode = 0644,
1656 .proc_handler = proc_dointvec_minmax,
1657 .extra1 = &zero,
1658 .extra2 = &one,
1659 },
1660 #endif
1661 {
1662 .procname = "user_reserve_kbytes",
1663 .data = &sysctl_user_reserve_kbytes,
1664 .maxlen = sizeof(sysctl_user_reserve_kbytes),
1665 .mode = 0644,
1666 .proc_handler = proc_doulongvec_minmax,
1667 },
1668 {
1669 .procname = "admin_reserve_kbytes",
1670 .data = &sysctl_admin_reserve_kbytes,
1671 .maxlen = sizeof(sysctl_admin_reserve_kbytes),
1672 .mode = 0644,
1673 .proc_handler = proc_doulongvec_minmax,
1674 },
1675 #ifdef CONFIG_HAVE_ARCH_MMAP_RND_BITS
1676 {
1677 .procname = "mmap_rnd_bits",
1678 .data = &mmap_rnd_bits,
1679 .maxlen = sizeof(mmap_rnd_bits),
1680 .mode = 0600,
1681 .proc_handler = proc_dointvec_minmax,
1682 .extra1 = (void *)&mmap_rnd_bits_min,
1683 .extra2 = (void *)&mmap_rnd_bits_max,
1684 },
1685 #endif
1686 #ifdef CONFIG_HAVE_ARCH_MMAP_RND_COMPAT_BITS
1687 {
1688 .procname = "mmap_rnd_compat_bits",
1689 .data = &mmap_rnd_compat_bits,
1690 .maxlen = sizeof(mmap_rnd_compat_bits),
1691 .mode = 0600,
1692 .proc_handler = proc_dointvec_minmax,
1693 .extra1 = (void *)&mmap_rnd_compat_bits_min,
1694 .extra2 = (void *)&mmap_rnd_compat_bits_max,
1695 },
1696 #endif
1697 { }
1698 };
1699
1700 static struct ctl_table fs_table[] = {
1701 {
1702 .procname = "inode-nr",
1703 .data = &inodes_stat,
1704 .maxlen = 2*sizeof(long),
1705 .mode = 0444,
1706 .proc_handler = proc_nr_inodes,
1707 },
1708 {
1709 .procname = "inode-state",
1710 .data = &inodes_stat,
1711 .maxlen = 7*sizeof(long),
1712 .mode = 0444,
1713 .proc_handler = proc_nr_inodes,
1714 },
1715 {
1716 .procname = "file-nr",
1717 .data = &files_stat,
1718 .maxlen = sizeof(files_stat),
1719 .mode = 0444,
1720 .proc_handler = proc_nr_files,
1721 },
1722 {
1723 .procname = "file-max",
1724 .data = &files_stat.max_files,
1725 .maxlen = sizeof(files_stat.max_files),
1726 .mode = 0644,
1727 .proc_handler = proc_doulongvec_minmax,
1728 },
1729 {
1730 .procname = "nr_open",
1731 .data = &sysctl_nr_open,
1732 .maxlen = sizeof(unsigned int),
1733 .mode = 0644,
1734 .proc_handler = proc_dointvec_minmax,
1735 .extra1 = &sysctl_nr_open_min,
1736 .extra2 = &sysctl_nr_open_max,
1737 },
1738 {
1739 .procname = "dentry-state",
1740 .data = &dentry_stat,
1741 .maxlen = 6*sizeof(long),
1742 .mode = 0444,
1743 .proc_handler = proc_nr_dentry,
1744 },
1745 {
1746 .procname = "overflowuid",
1747 .data = &fs_overflowuid,
1748 .maxlen = sizeof(int),
1749 .mode = 0644,
1750 .proc_handler = proc_dointvec_minmax,
1751 .extra1 = &minolduid,
1752 .extra2 = &maxolduid,
1753 },
1754 {
1755 .procname = "overflowgid",
1756 .data = &fs_overflowgid,
1757 .maxlen = sizeof(int),
1758 .mode = 0644,
1759 .proc_handler = proc_dointvec_minmax,
1760 .extra1 = &minolduid,
1761 .extra2 = &maxolduid,
1762 },
1763 #ifdef CONFIG_FILE_LOCKING
1764 {
1765 .procname = "leases-enable",
1766 .data = &leases_enable,
1767 .maxlen = sizeof(int),
1768 .mode = 0644,
1769 .proc_handler = proc_dointvec,
1770 },
1771 #endif
1772 #ifdef CONFIG_DNOTIFY
1773 {
1774 .procname = "dir-notify-enable",
1775 .data = &dir_notify_enable,
1776 .maxlen = sizeof(int),
1777 .mode = 0644,
1778 .proc_handler = proc_dointvec,
1779 },
1780 #endif
1781 #ifdef CONFIG_MMU
1782 #ifdef CONFIG_FILE_LOCKING
1783 {
1784 .procname = "lease-break-time",
1785 .data = &lease_break_time,
1786 .maxlen = sizeof(int),
1787 .mode = 0644,
1788 .proc_handler = proc_dointvec,
1789 },
1790 #endif
1791 #ifdef CONFIG_AIO
1792 {
1793 .procname = "aio-nr",
1794 .data = &aio_nr,
1795 .maxlen = sizeof(aio_nr),
1796 .mode = 0444,
1797 .proc_handler = proc_doulongvec_minmax,
1798 },
1799 {
1800 .procname = "aio-max-nr",
1801 .data = &aio_max_nr,
1802 .maxlen = sizeof(aio_max_nr),
1803 .mode = 0644,
1804 .proc_handler = proc_doulongvec_minmax,
1805 },
1806 #endif /* CONFIG_AIO */
1807 #ifdef CONFIG_INOTIFY_USER
1808 {
1809 .procname = "inotify",
1810 .mode = 0555,
1811 .child = inotify_table,
1812 },
1813 #endif
1814 #ifdef CONFIG_EPOLL
1815 {
1816 .procname = "epoll",
1817 .mode = 0555,
1818 .child = epoll_table,
1819 },
1820 #endif
1821 #endif
1822 {
1823 .procname = "protected_symlinks",
1824 .data = &sysctl_protected_symlinks,
1825 .maxlen = sizeof(int),
1826 .mode = 0600,
1827 .proc_handler = proc_dointvec_minmax,
1828 .extra1 = &zero,
1829 .extra2 = &one,
1830 },
1831 {
1832 .procname = "protected_hardlinks",
1833 .data = &sysctl_protected_hardlinks,
1834 .maxlen = sizeof(int),
1835 .mode = 0600,
1836 .proc_handler = proc_dointvec_minmax,
1837 .extra1 = &zero,
1838 .extra2 = &one,
1839 },
1840 {
1841 .procname = "suid_dumpable",
1842 .data = &suid_dumpable,
1843 .maxlen = sizeof(int),
1844 .mode = 0644,
1845 .proc_handler = proc_dointvec_minmax_coredump,
1846 .extra1 = &zero,
1847 .extra2 = &two,
1848 },
1849 #if defined(CONFIG_BINFMT_MISC) || defined(CONFIG_BINFMT_MISC_MODULE)
1850 {
1851 .procname = "binfmt_misc",
1852 .mode = 0555,
1853 .child = sysctl_mount_point,
1854 },
1855 #endif
1856 {
1857 .procname = "pipe-max-size",
1858 .data = &pipe_max_size,
1859 .maxlen = sizeof(pipe_max_size),
1860 .mode = 0644,
1861 .proc_handler = &pipe_proc_fn,
1862 .extra1 = &pipe_min_size,
1863 },
1864 {
1865 .procname = "pipe-user-pages-hard",
1866 .data = &pipe_user_pages_hard,
1867 .maxlen = sizeof(pipe_user_pages_hard),
1868 .mode = 0644,
1869 .proc_handler = proc_doulongvec_minmax,
1870 },
1871 {
1872 .procname = "pipe-user-pages-soft",
1873 .data = &pipe_user_pages_soft,
1874 .maxlen = sizeof(pipe_user_pages_soft),
1875 .mode = 0644,
1876 .proc_handler = proc_doulongvec_minmax,
1877 },
1878 {
1879 .procname = "mount-max",
1880 .data = &sysctl_mount_max,
1881 .maxlen = sizeof(unsigned int),
1882 .mode = 0644,
1883 .proc_handler = proc_dointvec_minmax,
1884 .extra1 = &one,
1885 },
1886 { }
1887 };
1888
1889 static struct ctl_table debug_table[] = {
1890 #ifdef CONFIG_SYSCTL_EXCEPTION_TRACE
1891 {
1892 .procname = "exception-trace",
1893 .data = &show_unhandled_signals,
1894 .maxlen = sizeof(int),
1895 .mode = 0644,
1896 .proc_handler = proc_dointvec
1897 },
1898 #endif
1899 #if defined(CONFIG_OPTPROBES)
1900 {
1901 .procname = "kprobes-optimization",
1902 .data = &sysctl_kprobes_optimization,
1903 .maxlen = sizeof(int),
1904 .mode = 0644,
1905 .proc_handler = proc_kprobes_optimization_handler,
1906 .extra1 = &zero,
1907 .extra2 = &one,
1908 },
1909 #endif
1910 { }
1911 };
1912
1913 static struct ctl_table dev_table[] = {
1914 { }
1915 };
1916
1917 int __init sysctl_init(void)
1918 {
1919 struct ctl_table_header *hdr;
1920
1921 hdr = register_sysctl_table(sysctl_base_table);
1922 kmemleak_not_leak(hdr);
1923 return 0;
1924 }
1925
1926 #endif /* CONFIG_SYSCTL */
1927
1928 /*
1929 * /proc/sys support
1930 */
1931
1932 #ifdef CONFIG_PROC_SYSCTL
1933
1934 static int _proc_do_string(char *data, int maxlen, int write,
1935 char __user *buffer,
1936 size_t *lenp, loff_t *ppos)
1937 {
1938 size_t len;
1939 char __user *p;
1940 char c;
1941
1942 if (!data || !maxlen || !*lenp) {
1943 *lenp = 0;
1944 return 0;
1945 }
1946
1947 if (write) {
1948 if (sysctl_writes_strict == SYSCTL_WRITES_STRICT) {
1949 /* Only continue writes not past the end of buffer. */
1950 len = strlen(data);
1951 if (len > maxlen - 1)
1952 len = maxlen - 1;
1953
1954 if (*ppos > len)
1955 return 0;
1956 len = *ppos;
1957 } else {
1958 /* Start writing from beginning of buffer. */
1959 len = 0;
1960 }
1961
1962 *ppos += *lenp;
1963 p = buffer;
1964 while ((p - buffer) < *lenp && len < maxlen - 1) {
1965 if (get_user(c, p++))
1966 return -EFAULT;
1967 if (c == 0 || c == '\n')
1968 break;
1969 data[len++] = c;
1970 }
1971 data[len] = 0;
1972 } else {
1973 len = strlen(data);
1974 if (len > maxlen)
1975 len = maxlen;
1976
1977 if (*ppos > len) {
1978 *lenp = 0;
1979 return 0;
1980 }
1981
1982 data += *ppos;
1983 len -= *ppos;
1984
1985 if (len > *lenp)
1986 len = *lenp;
1987 if (len)
1988 if (copy_to_user(buffer, data, len))
1989 return -EFAULT;
1990 if (len < *lenp) {
1991 if (put_user('\n', buffer + len))
1992 return -EFAULT;
1993 len++;
1994 }
1995 *lenp = len;
1996 *ppos += len;
1997 }
1998 return 0;
1999 }
2000
2001 static void warn_sysctl_write(struct ctl_table *table)
2002 {
2003 pr_warn_once("%s wrote to %s when file position was not 0!\n"
2004 "This will not be supported in the future. To silence this\n"
2005 "warning, set kernel.sysctl_writes_strict = -1\n",
2006 current->comm, table->procname);
2007 }
2008
2009 /**
2010 * proc_first_pos_non_zero_ignore - check if firs position is allowed
2011 * @ppos: file position
2012 * @table: the sysctl table
2013 *
2014 * Returns true if the first position is non-zero and the sysctl_writes_strict
2015 * mode indicates this is not allowed for numeric input types. String proc
2016 * hadlers can ignore the return value.
2017 */
2018 static bool proc_first_pos_non_zero_ignore(loff_t *ppos,
2019 struct ctl_table *table)
2020 {
2021 if (!*ppos)
2022 return false;
2023
2024 switch (sysctl_writes_strict) {
2025 case SYSCTL_WRITES_STRICT:
2026 return true;
2027 case SYSCTL_WRITES_WARN:
2028 warn_sysctl_write(table);
2029 return false;
2030 default:
2031 return false;
2032 }
2033 }
2034
2035 /**
2036 * proc_dostring - read a string sysctl
2037 * @table: the sysctl table
2038 * @write: %TRUE if this is a write to the sysctl file
2039 * @buffer: the user buffer
2040 * @lenp: the size of the user buffer
2041 * @ppos: file position
2042 *
2043 * Reads/writes a string from/to the user buffer. If the kernel
2044 * buffer provided is not large enough to hold the string, the
2045 * string is truncated. The copied string is %NULL-terminated.
2046 * If the string is being read by the user process, it is copied
2047 * and a newline '\n' is added. It is truncated if the buffer is
2048 * not large enough.
2049 *
2050 * Returns 0 on success.
2051 */
2052 int proc_dostring(struct ctl_table *table, int write,
2053 void __user *buffer, size_t *lenp, loff_t *ppos)
2054 {
2055 if (write)
2056 proc_first_pos_non_zero_ignore(ppos, table);
2057
2058 return _proc_do_string((char *)(table->data), table->maxlen, write,
2059 (char __user *)buffer, lenp, ppos);
2060 }
2061
/*
 * Advance *buf to the position returned by skip_spaces() and return how
 * many characters were stepped over.
 */
static size_t proc_skip_spaces(char **buf)
{
	char *start = *buf;

	*buf = skip_spaces(start);

	return *buf - start;
}
2070
/*
 * Step over leading occurrences of @v: advance *buf and shrink *size for
 * each one, stopping at the first different character or when *size
 * reaches zero.
 */
static void proc_skip_char(char **buf, size_t *size, const char v)
{
	while (*size && **buf == v) {
		(*buf)++;
		(*size)--;
	}
}
2080
2081 #define TMPBUFLEN 22
2082 /**
2083 * proc_get_long - reads an ASCII formatted integer from a user buffer
2084 *
2085 * @buf: a kernel buffer
2086 * @size: size of the kernel buffer
2087 * @val: this is where the number will be stored
2088 * @neg: set to %TRUE if number is negative
2089 * @perm_tr: a vector which contains the allowed trailers
2090 * @perm_tr_len: size of the perm_tr vector
2091 * @tr: pointer to store the trailer character
2092 *
2093 * In case of success %0 is returned and @buf and @size are updated with
2094 * the amount of bytes read. If @tr is non-NULL and a trailing
2095 * character exists (size is non-zero after returning from this
2096 * function), @tr is updated with the trailing character.
2097 */
2098 static int proc_get_long(char **buf, size_t *size,
2099 unsigned long *val, bool *neg,
2100 const char *perm_tr, unsigned perm_tr_len, char *tr)
2101 {
2102 int len;
2103 char *p, tmp[TMPBUFLEN];
2104
2105 if (!*size)
2106 return -EINVAL;
2107
2108 len = *size;
2109 if (len > TMPBUFLEN - 1)
2110 len = TMPBUFLEN - 1;
2111
2112 memcpy(tmp, *buf, len);
2113
2114 tmp[len] = 0;
2115 p = tmp;
2116 if (*p == '-' && *size > 1) {
2117 *neg = true;
2118 p++;
2119 } else
2120 *neg = false;
2121 if (!isdigit(*p))
2122 return -EINVAL;
2123
2124 *val = simple_strtoul(p, &p, 0);
2125
2126 len = p - tmp;
2127
2128 /* We don't know if the next char is whitespace thus we may accept
2129 * invalid integers (e.g. 1234...a) or two integers instead of one
2130 * (e.g. 123...1). So lets not allow such large numbers. */
2131 if (len == TMPBUFLEN - 1)
2132 return -EINVAL;
2133
2134 if (len < *size && perm_tr_len && !memchr(perm_tr, *p, perm_tr_len))
2135 return -EINVAL;
2136
2137 if (tr && (len < *size))
2138 *tr = *p;
2139
2140 *buf += len;
2141 *size -= len;
2142
2143 return 0;
2144 }
2145
2146 /**
2147 * proc_put_long - converts an integer to a decimal ASCII formatted string
2148 *
2149 * @buf: the user buffer
2150 * @size: the size of the user buffer
2151 * @val: the integer to be converted
2152 * @neg: sign of the number, %TRUE for negative
2153 *
2154 * In case of success %0 is returned and @buf and @size are updated with
2155 * the amount of bytes written.
2156 */
2157 static int proc_put_long(void __user **buf, size_t *size, unsigned long val,
2158 bool neg)
2159 {
2160 int len;
2161 char tmp[TMPBUFLEN], *p = tmp;
2162
2163 sprintf(p, "%s%lu", neg ? "-" : "", val);
2164 len = strlen(tmp);
2165 if (len > *size)
2166 len = *size;
2167 if (copy_to_user(*buf, tmp, len))
2168 return -EFAULT;
2169 *size -= len;
2170 *buf += len;
2171 return 0;
2172 }
2173 #undef TMPBUFLEN
2174
2175 static int proc_put_char(void __user **buf, size_t *size, char c)
2176 {
2177 if (*size) {
2178 char __user **buffer = (char __user **)buf;
2179 if (put_user(c, *buffer))
2180 return -EFAULT;
2181 (*size)--, (*buffer)++;
2182 *buf = *buffer;
2183 }
2184 return 0;
2185 }
2186
/*
 * Default conversion between the sign/magnitude pair used by the parser
 * and a plain int.
 *
 * write: store (*negp, *lvalp) into *valp; -EINVAL if it does not fit.
 * read:  split *valp into *negp and *lvalp.
 * @data is unused.
 */
static int do_proc_dointvec_conv(bool *negp, unsigned long *lvalp,
				 int *valp,
				 int write, void *data)
{
	if (!write) {
		int val = *valp;

		*negp = val < 0;
		*lvalp = *negp ? -(unsigned long)val : (unsigned long)val;
		return 0;
	}

	if (*negp) {
		/* the magnitude of INT_MIN is INT_MAX + 1 */
		if (*lvalp > (unsigned long) INT_MAX + 1)
			return -EINVAL;
		*valp = -*lvalp;
		return 0;
	}

	if (*lvalp > (unsigned long) INT_MAX)
		return -EINVAL;
	*valp = *lvalp;

	return 0;
}
2213
/*
 * Default conversion between an unsigned long and an unsigned int.
 *
 * write: store *lvalp into *valp; -EINVAL if it exceeds UINT_MAX.
 * read:  widen *valp into *lvalp.
 * @data is unused.
 */
static int do_proc_douintvec_conv(unsigned long *lvalp,
				  unsigned int *valp,
				  int write, void *data)
{
	if (!write) {
		*lvalp = (unsigned long)*valp;
		return 0;
	}

	if (*lvalp > UINT_MAX)
		return -EINVAL;
	*valp = *lvalp;

	return 0;
}
2228
/*
 * Characters allowed to follow a number; passed to proc_get_long() as its
 * permitted-trailer vector together with sizeof() of this array, so it
 * must not gain a terminating NUL.
 */
static const char proc_wspace_sep[] = {
	' ',
	'\t',
	'\n',
};
2230
2231 static int __do_proc_dointvec(void *tbl_data, struct ctl_table *table,
2232 int write, void __user *buffer,
2233 size_t *lenp, loff_t *ppos,
2234 int (*conv)(bool *negp, unsigned long *lvalp, int *valp,
2235 int write, void *data),
2236 void *data)
2237 {
2238 int *i, vleft, first = 1, err = 0;
2239 size_t left;
2240 char *kbuf = NULL, *p;
2241
2242 if (!tbl_data || !table->maxlen || !*lenp || (*ppos && !write)) {
2243 *lenp = 0;
2244 return 0;
2245 }
2246
2247 i = (int *) tbl_data;
2248 vleft = table->maxlen / sizeof(*i);
2249 left = *lenp;
2250
2251 if (!conv)
2252 conv = do_proc_dointvec_conv;
2253
2254 if (write) {
2255 if (proc_first_pos_non_zero_ignore(ppos, table))
2256 goto out;
2257
2258 if (left > PAGE_SIZE - 1)
2259 left = PAGE_SIZE - 1;
2260 p = kbuf = memdup_user_nul(buffer, left);
2261 if (IS_ERR(kbuf))
2262 return PTR_ERR(kbuf);
2263 }
2264
2265 for (; left && vleft--; i++, first=0) {
2266 unsigned long lval;
2267 bool neg;
2268
2269 if (write) {
2270 left -= proc_skip_spaces(&p);
2271
2272 if (!left)
2273 break;
2274 err = proc_get_long(&p, &left, &lval, &neg,
2275 proc_wspace_sep,
2276 sizeof(proc_wspace_sep), NULL);
2277 if (err)
2278 break;
2279 if (conv(&neg, &lval, i, 1, data)) {
2280 err = -EINVAL;
2281 break;
2282 }
2283 } else {
2284 if (conv(&neg, &lval, i, 0, data)) {
2285 err = -EINVAL;
2286 break;
2287 }
2288 if (!first)
2289 err = proc_put_char(&buffer, &left, '\t');
2290 if (err)
2291 break;
2292 err = proc_put_long(&buffer, &left, lval, neg);
2293 if (err)
2294 break;
2295 }
2296 }
2297
2298 if (!write && !first && left && !err)
2299 err = proc_put_char(&buffer, &left, '\n');
2300 if (write && !err && left)
2301 left -= proc_skip_spaces(&p);
2302 if (write) {
2303 kfree(kbuf);
2304 if (first)
2305 return err ? : -EINVAL;
2306 }
2307 *lenp -= left;
2308 out:
2309 *ppos += *lenp;
2310 return err;
2311 }
2312
2313 static int do_proc_dointvec(struct ctl_table *table, int write,
2314 void __user *buffer, size_t *lenp, loff_t *ppos,
2315 int (*conv)(bool *negp, unsigned long *lvalp, int *valp,
2316 int write, void *data),
2317 void *data)
2318 {
2319 return __do_proc_dointvec(table->data, table, write,
2320 buffer, lenp, ppos, conv, data);
2321 }
2322
2323 static int do_proc_douintvec_w(unsigned int *tbl_data,
2324 struct ctl_table *table,
2325 void __user *buffer,
2326 size_t *lenp, loff_t *ppos,
2327 int (*conv)(unsigned long *lvalp,
2328 unsigned int *valp,
2329 int write, void *data),
2330 void *data)
2331 {
2332 unsigned long lval;
2333 int err = 0;
2334 size_t left;
2335 bool neg;
2336 char *kbuf = NULL, *p;
2337
2338 left = *lenp;
2339
2340 if (proc_first_pos_non_zero_ignore(ppos, table))
2341 goto bail_early;
2342
2343 if (left > PAGE_SIZE - 1)
2344 left = PAGE_SIZE - 1;
2345
2346 p = kbuf = memdup_user_nul(buffer, left);
2347 if (IS_ERR(kbuf))
2348 return -EINVAL;
2349
2350 left -= proc_skip_spaces(&p);
2351 if (!left) {
2352 err = -EINVAL;
2353 goto out_free;
2354 }
2355
2356 err = proc_get_long(&p, &left, &lval, &neg,
2357 proc_wspace_sep,
2358 sizeof(proc_wspace_sep), NULL);
2359 if (err || neg) {
2360 err = -EINVAL;
2361 goto out_free;
2362 }
2363
2364 if (conv(&lval, tbl_data, 1, data)) {
2365 err = -EINVAL;
2366 goto out_free;
2367 }
2368
2369 if (!err && left)
2370 left -= proc_skip_spaces(&p);
2371
2372 out_free:
2373 kfree(kbuf);
2374 if (err)
2375 return -EINVAL;
2376
2377 return 0;
2378
2379 /* This is in keeping with old __do_proc_dointvec() */
2380 bail_early:
2381 *ppos += *lenp;
2382 return err;
2383 }
2384
2385 static int do_proc_douintvec_r(unsigned int *tbl_data, void __user *buffer,
2386 size_t *lenp, loff_t *ppos,
2387 int (*conv)(unsigned long *lvalp,
2388 unsigned int *valp,
2389 int write, void *data),
2390 void *data)
2391 {
2392 unsigned long lval;
2393 int err = 0;
2394 size_t left;
2395
2396 left = *lenp;
2397
2398 if (conv(&lval, tbl_data, 0, data)) {
2399 err = -EINVAL;
2400 goto out;
2401 }
2402
2403 err = proc_put_long(&buffer, &left, lval, false);
2404 if (err || !left)
2405 goto out;
2406
2407 err = proc_put_char(&buffer, &left, '\n');
2408
2409 out:
2410 *lenp -= left;
2411 *ppos += *lenp;
2412
2413 return err;
2414 }
2415
2416 static int __do_proc_douintvec(void *tbl_data, struct ctl_table *table,
2417 int write, void __user *buffer,
2418 size_t *lenp, loff_t *ppos,
2419 int (*conv)(unsigned long *lvalp,
2420 unsigned int *valp,
2421 int write, void *data),
2422 void *data)
2423 {
2424 unsigned int *i, vleft;
2425
2426 if (!tbl_data || !table->maxlen || !*lenp || (*ppos && !write)) {
2427 *lenp = 0;
2428 return 0;
2429 }
2430
2431 i = (unsigned int *) tbl_data;
2432 vleft = table->maxlen / sizeof(*i);
2433
2434 /*
2435 * Arrays are not supported, keep this simple. *Do not* add
2436 * support for them.
2437 */
2438 if (vleft != 1) {
2439 *lenp = 0;
2440 return -EINVAL;
2441 }
2442
2443 if (!conv)
2444 conv = do_proc_douintvec_conv;
2445
2446 if (write)
2447 return do_proc_douintvec_w(i, table, buffer, lenp, ppos,
2448 conv, data);
2449 return do_proc_douintvec_r(i, buffer, lenp, ppos, conv, data);
2450 }
2451
2452 static int do_proc_douintvec(struct ctl_table *table, int write,
2453 void __user *buffer, size_t *lenp, loff_t *ppos,
2454 int (*conv)(unsigned long *lvalp,
2455 unsigned int *valp,
2456 int write, void *data),
2457 void *data)
2458 {
2459 return __do_proc_douintvec(table->data, table, write,
2460 buffer, lenp, ppos, conv, data);
2461 }
2462
2463 /**
2464 * proc_dointvec - read a vector of integers
2465 * @table: the sysctl table
2466 * @write: %TRUE if this is a write to the sysctl file
2467 * @buffer: the user buffer
2468 * @lenp: the size of the user buffer
2469 * @ppos: file position
2470 *
2471 * Reads/writes up to table->maxlen/sizeof(unsigned int) integer
2472 * values from/to the user buffer, treated as an ASCII string.
2473 *
2474 * Returns 0 on success.
2475 */
2476 int proc_dointvec(struct ctl_table *table, int write,
2477 void __user *buffer, size_t *lenp, loff_t *ppos)
2478 {
2479 return do_proc_dointvec(table, write, buffer, lenp, ppos, NULL, NULL);
2480 }
2481
2482 /**
2483 * proc_douintvec - read a vector of unsigned integers
2484 * @table: the sysctl table
2485 * @write: %TRUE if this is a write to the sysctl file
2486 * @buffer: the user buffer
2487 * @lenp: the size of the user buffer
2488 * @ppos: file position
2489 *
2490 * Reads/writes up to table->maxlen/sizeof(unsigned int) unsigned integer
2491 * values from/to the user buffer, treated as an ASCII string.
2492 *
2493 * Returns 0 on success.
2494 */
2495 int proc_douintvec(struct ctl_table *table, int write,
2496 void __user *buffer, size_t *lenp, loff_t *ppos)
2497 {
2498 return do_proc_douintvec(table, write, buffer, lenp, ppos,
2499 do_proc_douintvec_conv, NULL);
2500 }
2501
2502 /*
2503 * Taint values can only be increased
2504 * This means we can safely use a temporary.
2505 */
2506 static int proc_taint(struct ctl_table *table, int write,
2507 void __user *buffer, size_t *lenp, loff_t *ppos)
2508 {
2509 struct ctl_table t;
2510 unsigned long tmptaint = get_taint();
2511 int err;
2512
2513 if (write && !capable(CAP_SYS_ADMIN))
2514 return -EPERM;
2515
2516 t = *table;
2517 t.data = &tmptaint;
2518 err = proc_doulongvec_minmax(&t, write, buffer, lenp, ppos);
2519 if (err < 0)
2520 return err;
2521
2522 if (write) {
2523 /*
2524 * Poor man's atomic or. Not worth adding a primitive
2525 * to everyone's atomic.h for this
2526 */
2527 int i;
2528 for (i = 0; i < BITS_PER_LONG && tmptaint >> i; i++) {
2529 if ((tmptaint >> i) & 1)
2530 add_taint(i, LOCKDEP_STILL_OK);
2531 }
2532 }
2533
2534 return err;
2535 }
2536
#ifdef CONFIG_PRINTK
/*
 * Same as proc_dointvec_minmax(), except that writes are refused with
 * -EPERM unless the caller has CAP_SYS_ADMIN.
 */
static int proc_dointvec_minmax_sysadmin(struct ctl_table *table, int write,
				void __user *buffer, size_t *lenp, loff_t *ppos)
{
	if (!write || capable(CAP_SYS_ADMIN))
		return proc_dointvec_minmax(table, write, buffer, lenp, ppos);

	return -EPERM;
}
#endif
2547
/*
 * Optional bounds handed to do_proc_dointvec_minmax_conv(); a NULL
 * pointer means that side of the range is unchecked.
 */
struct do_proc_dointvec_minmax_conv_param {
	int *min;
	int *max;
};

/*
 * Convert between a parsed (sign, magnitude) pair and a stored int,
 * enforcing the optional range in @data on write.
 *
 * On write, the magnitude in *lvalp must fit in an int once the sign in
 * *negp is applied; magnitudes that do not fit are rejected with -EINVAL
 * instead of being silently truncated into the permitted range. Values
 * outside [*min, *max] are rejected with -EINVAL as well, and *valp is
 * only updated when every check passed.
 *
 * On read, *valp is split into *negp and *lvalp.
 *
 * Returns 0 on success, -EINVAL on a rejected write.
 */
static int do_proc_dointvec_minmax_conv(bool *negp, unsigned long *lvalp,
					int *valp,
					int write, void *data)
{
	struct do_proc_dointvec_minmax_conv_param *param = data;

	if (write) {
		int val;

		if (*negp) {
			/* The largest negative magnitude is INT_MAX + 1. */
			if (*lvalp > (unsigned long)INT_MAX + 1)
				return -EINVAL;
			val = (*lvalp > (unsigned long)INT_MAX) ?
				INT_MIN : -(int)*lvalp;
		} else {
			if (*lvalp > (unsigned long)INT_MAX)
				return -EINVAL;
			val = (int)*lvalp;
		}

		if ((param->min && *param->min > val) ||
		    (param->max && *param->max < val))
			return -EINVAL;
		*valp = val;
	} else {
		int val = *valp;

		if (val < 0) {
			*negp = true;
			*lvalp = -(unsigned long)val;
		} else {
			*negp = false;
			*lvalp = (unsigned long)val;
		}
	}
	return 0;
}
2576
2577 /**
2578 * proc_dointvec_minmax - read a vector of integers with min/max values
2579 * @table: the sysctl table
2580 * @write: %TRUE if this is a write to the sysctl file
2581 * @buffer: the user buffer
2582 * @lenp: the size of the user buffer
2583 * @ppos: file position
2584 *
2585 * Reads/writes up to table->maxlen/sizeof(unsigned int) integer
2586 * values from/to the user buffer, treated as an ASCII string.
2587 *
2588 * This routine will ensure the values are within the range specified by
2589 * table->extra1 (min) and table->extra2 (max).
2590 *
2591 * Returns 0 on success.
2592 */
2593 int proc_dointvec_minmax(struct ctl_table *table, int write,
2594 void __user *buffer, size_t *lenp, loff_t *ppos)
2595 {
2596 struct do_proc_dointvec_minmax_conv_param param = {
2597 .min = (int *) table->extra1,
2598 .max = (int *) table->extra2,
2599 };
2600 return do_proc_dointvec(table, write, buffer, lenp, ppos,
2601 do_proc_dointvec_minmax_conv, &param);
2602 }
2603
/*
 * Optional bounds handed to do_proc_douintvec_minmax_conv(); a NULL
 * pointer means that side of the range is unchecked.
 */
struct do_proc_douintvec_minmax_conv_param {
	unsigned int *min;
	unsigned int *max;
};

/*
 * Convert between a parsed unsigned long and a stored unsigned int,
 * enforcing the optional range in @data on write.
 *
 * On write, the UINT_MAX check is done first, on the untruncated input,
 * so that a value which overflows unsigned int is always reported as
 * -EINVAL rather than being range-checked after wrapping around. Values
 * that fit but lie outside [*min, *max] return -ERANGE. *valp is only
 * updated when both checks passed.
 *
 * On read, *valp is widened into *lvalp.
 *
 * Returns 0 on success, -EINVAL or -ERANGE on a rejected write.
 */
static int do_proc_douintvec_minmax_conv(unsigned long *lvalp,
					 unsigned int *valp,
					 int write, void *data)
{
	struct do_proc_douintvec_minmax_conv_param *param = data;

	if (write) {
		unsigned int val;

		if (*lvalp > UINT_MAX)
			return -EINVAL;

		val = *lvalp;

		if ((param->min && *param->min > val) ||
		    (param->max && *param->max < val))
			return -ERANGE;

		*valp = val;
	} else {
		unsigned int val = *valp;

		*lvalp = (unsigned long) val;
	}

	return 0;
}
2632
2633 /**
2634 * proc_douintvec_minmax - read a vector of unsigned ints with min/max values
2635 * @table: the sysctl table
2636 * @write: %TRUE if this is a write to the sysctl file
2637 * @buffer: the user buffer
2638 * @lenp: the size of the user buffer
2639 * @ppos: file position
2640 *
2641 * Reads/writes up to table->maxlen/sizeof(unsigned int) unsigned integer
2642 * values from/to the user buffer, treated as an ASCII string. Negative
2643 * strings are not allowed.
2644 *
2645 * This routine will ensure the values are within the range specified by
2646 * table->extra1 (min) and table->extra2 (max). There is a final sanity
2647 * check for UINT_MAX to avoid having to support wrap around uses from
2648 * userspace.
2649 *
2650 * Returns 0 on success.
2651 */
2652 int proc_douintvec_minmax(struct ctl_table *table, int write,
2653 void __user *buffer, size_t *lenp, loff_t *ppos)
2654 {
2655 struct do_proc_douintvec_minmax_conv_param param = {
2656 .min = (unsigned int *) table->extra1,
2657 .max = (unsigned int *) table->extra2,
2658 };
2659 return do_proc_douintvec(table, write, buffer, lenp, ppos,
2660 do_proc_douintvec_minmax_conv, &param);
2661 }
2662
/*
 * Warn when suid_dumpable is SUID_DUMP_ROOT while core_pattern is neither
 * an absolute path nor a pipe handler. Compiles to nothing without
 * CONFIG_COREDUMP.
 */
static void validate_coredump_safety(void)
{
#ifdef CONFIG_COREDUMP
	if (suid_dumpable != SUID_DUMP_ROOT)
		return;

	if (core_pattern[0] == '/' || core_pattern[0] == '|')
		return;

	printk(KERN_WARNING
"Unsafe core_pattern used with fs.suid_dumpable=2.\n"
"Pipe handler or fully qualified core dump path required.\n"
"Set kernel.core_pattern before fs.suid_dumpable.\n"
	);
#endif
}
2676
2677 static int proc_dointvec_minmax_coredump(struct ctl_table *table, int write,
2678 void __user *buffer, size_t *lenp, loff_t *ppos)
2679 {
2680 int error = proc_dointvec_minmax(table, write, buffer, lenp, ppos);
2681 if (!error)
2682 validate_coredump_safety();
2683 return error;
2684 }
2685
#ifdef CONFIG_COREDUMP
/*
 * proc_dostring() followed, on success, by a re-check of the coredump
 * configuration.
 */
static int proc_dostring_coredump(struct ctl_table *table, int write,
		  void __user *buffer, size_t *lenp, loff_t *ppos)
{
	int error;

	error = proc_dostring(table, write, buffer, lenp, ppos);
	if (error)
		return error;

	validate_coredump_safety();
	return 0;
}
#endif
2696
2697 static int __do_proc_doulongvec_minmax(void *data, struct ctl_table *table, int write,
2698 void __user *buffer,
2699 size_t *lenp, loff_t *ppos,
2700 unsigned long convmul,
2701 unsigned long convdiv)
2702 {
2703 unsigned long *i, *min, *max;
2704 int vleft, first = 1, err = 0;
2705 size_t left;
2706 char *kbuf = NULL, *p;
2707
2708 if (!data || !table->maxlen || !*lenp || (*ppos && !write)) {
2709 *lenp = 0;
2710 return 0;
2711 }
2712
2713 i = (unsigned long *) data;
2714 min = (unsigned long *) table->extra1;
2715 max = (unsigned long *) table->extra2;
2716 vleft = table->maxlen / sizeof(unsigned long);
2717 left = *lenp;
2718
2719 if (write) {
2720 if (proc_first_pos_non_zero_ignore(ppos, table))
2721 goto out;
2722
2723 if (left > PAGE_SIZE - 1)
2724 left = PAGE_SIZE - 1;
2725 p = kbuf = memdup_user_nul(buffer, left);
2726 if (IS_ERR(kbuf))
2727 return PTR_ERR(kbuf);
2728 }
2729
2730 for (; left && vleft--; i++, first = 0) {
2731 unsigned long val;
2732
2733 if (write) {
2734 bool neg;
2735
2736 left -= proc_skip_spaces(&p);
2737
2738 err = proc_get_long(&p, &left, &val, &neg,
2739 proc_wspace_sep,
2740 sizeof(proc_wspace_sep), NULL);
2741 if (err)
2742 break;
2743 if (neg)
2744 continue;
2745 val = convmul * val / convdiv;
2746 if ((min && val < *min) || (max && val > *max))
2747 continue;
2748 *i = val;
2749 } else {
2750 val = convdiv * (*i) / convmul;
2751 if (!first) {
2752 err = proc_put_char(&buffer, &left, '\t');
2753 if (err)
2754 break;
2755 }
2756 err = proc_put_long(&buffer, &left, val, false);
2757 if (err)
2758 break;
2759 }
2760 }
2761
2762 if (!write && !first && left && !err)
2763 err = proc_put_char(&buffer, &left, '\n');
2764 if (write && !err)
2765 left -= proc_skip_spaces(&p);
2766 if (write) {
2767 kfree(kbuf);
2768 if (first)
2769 return err ? : -EINVAL;
2770 }
2771 *lenp -= left;
2772 out:
2773 *ppos += *lenp;
2774 return err;
2775 }
2776
2777 static int do_proc_doulongvec_minmax(struct ctl_table *table, int write,
2778 void __user *buffer,
2779 size_t *lenp, loff_t *ppos,
2780 unsigned long convmul,
2781 unsigned long convdiv)
2782 {
2783 return __do_proc_doulongvec_minmax(table->data, table, write,
2784 buffer, lenp, ppos, convmul, convdiv);
2785 }
2786
2787 /**
2788 * proc_doulongvec_minmax - read a vector of long integers with min/max values
2789 * @table: the sysctl table
2790 * @write: %TRUE if this is a write to the sysctl file
2791 * @buffer: the user buffer
2792 * @lenp: the size of the user buffer
2793 * @ppos: file position
2794 *
2795 * Reads/writes up to table->maxlen/sizeof(unsigned long) unsigned long
2796 * values from/to the user buffer, treated as an ASCII string.
2797 *
2798 * This routine will ensure the values are within the range specified by
2799 * table->extra1 (min) and table->extra2 (max).
2800 *
2801 * Returns 0 on success.
2802 */
2803 int proc_doulongvec_minmax(struct ctl_table *table, int write,
2804 void __user *buffer, size_t *lenp, loff_t *ppos)
2805 {
2806 return do_proc_doulongvec_minmax(table, write, buffer, lenp, ppos, 1l, 1l);
2807 }
2808
2809 /**
2810 * proc_doulongvec_ms_jiffies_minmax - read a vector of millisecond values with min/max values
2811 * @table: the sysctl table
2812 * @write: %TRUE if this is a write to the sysctl file
2813 * @buffer: the user buffer
2814 * @lenp: the size of the user buffer
2815 * @ppos: file position
2816 *
2817 * Reads/writes up to table->maxlen/sizeof(unsigned long) unsigned long
2818 * values from/to the user buffer, treated as an ASCII string. The values
2819 * are treated as milliseconds, and converted to jiffies when they are stored.
2820 *
2821 * This routine will ensure the values are within the range specified by
2822 * table->extra1 (min) and table->extra2 (max).
2823 *
2824 * Returns 0 on success.
2825 */
2826 int proc_doulongvec_ms_jiffies_minmax(struct ctl_table *table, int write,
2827 void __user *buffer,
2828 size_t *lenp, loff_t *ppos)
2829 {
2830 return do_proc_doulongvec_minmax(table, write, buffer,
2831 lenp, ppos, HZ, 1000l);
2832 }
2833
2834
2835 static int do_proc_dointvec_jiffies_conv(bool *negp, unsigned long *lvalp,
2836 int *valp,
2837 int write, void *data)
2838 {
2839 if (write) {
2840 if (*lvalp > INT_MAX / HZ)
2841 return 1;
2842 *valp = *negp ? -(*lvalp*HZ) : (*lvalp*HZ);
2843 } else {
2844 int val = *valp;
2845 unsigned long lval;
2846 if (val < 0) {
2847 *negp = true;
2848 lval = -(unsigned long)val;
2849 } else {
2850 *negp = false;
2851 lval = (unsigned long)val;
2852 }
2853 *lvalp = lval / HZ;
2854 }
2855 return 0;
2856 }
2857
2858 static int do_proc_dointvec_userhz_jiffies_conv(bool *negp, unsigned long *lvalp,
2859 int *valp,
2860 int write, void *data)
2861 {
2862 if (write) {
2863 if (USER_HZ < HZ && *lvalp > (LONG_MAX / HZ) * USER_HZ)
2864 return 1;
2865 *valp = clock_t_to_jiffies(*negp ? -*lvalp : *lvalp);
2866 } else {
2867 int val = *valp;
2868 unsigned long lval;
2869 if (val < 0) {
2870 *negp = true;
2871 lval = -(unsigned long)val;
2872 } else {
2873 *negp = false;
2874 lval = (unsigned long)val;
2875 }
2876 *lvalp = jiffies_to_clock_t(lval);
2877 }
2878 return 0;
2879 }
2880
/*
 * Conversion callback between milliseconds (user visible) and jiffies
 * (stored).
 *
 * On write, the signed value is passed through msecs_to_jiffies(); a
 * result above INT_MAX is refused with a return value of 1, otherwise it
 * is stored in *valp. On read, *valp is split into sign and magnitude and
 * the magnitude goes through jiffies_to_msecs().
 */
static int do_proc_dointvec_ms_jiffies_conv(bool *negp, unsigned long *lvalp,
					    int *valp,
					    int write, void *data)
{
	if (write) {
		unsigned long msecs = *negp ? -*lvalp : *lvalp;
		unsigned long jif = msecs_to_jiffies(msecs);

		if (jif > INT_MAX)
			return 1;

		*valp = (int)jif;
		return 0;
	}

	{
		int val = *valp;
		unsigned long magnitude;

		*negp = val < 0;
		magnitude = *negp ? -(unsigned long)val : (unsigned long)val;
		*lvalp = jiffies_to_msecs(magnitude);
	}
	return 0;
}
2905
2906 /**
2907 * proc_dointvec_jiffies - read a vector of integers as seconds
2908 * @table: the sysctl table
2909 * @write: %TRUE if this is a write to the sysctl file
2910 * @buffer: the user buffer
2911 * @lenp: the size of the user buffer
2912 * @ppos: file position
2913 *
2914 * Reads/writes up to table->maxlen/sizeof(unsigned int) integer
2915 * values from/to the user buffer, treated as an ASCII string.
2916 * The values read are assumed to be in seconds, and are converted into
2917 * jiffies.
2918 *
2919 * Returns 0 on success.
2920 */
2921 int proc_dointvec_jiffies(struct ctl_table *table, int write,
2922 void __user *buffer, size_t *lenp, loff_t *ppos)
2923 {
2924 return do_proc_dointvec(table,write,buffer,lenp,ppos,
2925 do_proc_dointvec_jiffies_conv,NULL);
2926 }
2927
2928 /**
2929 * proc_dointvec_userhz_jiffies - read a vector of integers as 1/USER_HZ seconds
2930 * @table: the sysctl table
2931 * @write: %TRUE if this is a write to the sysctl file
2932 * @buffer: the user buffer
2933 * @lenp: the size of the user buffer
2934 * @ppos: pointer to the file position
2935 *
2936 * Reads/writes up to table->maxlen/sizeof(unsigned int) integer
2937 * values from/to the user buffer, treated as an ASCII string.
2938 * The values read are assumed to be in 1/USER_HZ seconds, and
2939 * are converted into jiffies.
2940 *
2941 * Returns 0 on success.
2942 */
2943 int proc_dointvec_userhz_jiffies(struct ctl_table *table, int write,
2944 void __user *buffer, size_t *lenp, loff_t *ppos)
2945 {
2946 return do_proc_dointvec(table,write,buffer,lenp,ppos,
2947 do_proc_dointvec_userhz_jiffies_conv,NULL);
2948 }
2949
2950 /**
2951 * proc_dointvec_ms_jiffies - read a vector of integers as 1 milliseconds
2952 * @table: the sysctl table
2953 * @write: %TRUE if this is a write to the sysctl file
2954 * @buffer: the user buffer
2955 * @lenp: the size of the user buffer
2956 * @ppos: file position
2957 * @ppos: the current position in the file
2958 *
2959 * Reads/writes up to table->maxlen/sizeof(unsigned int) integer
2960 * values from/to the user buffer, treated as an ASCII string.
2961 * The values read are assumed to be in 1/1000 seconds, and
2962 * are converted into jiffies.
2963 *
2964 * Returns 0 on success.
2965 */
2966 int proc_dointvec_ms_jiffies(struct ctl_table *table, int write,
2967 void __user *buffer, size_t *lenp, loff_t *ppos)
2968 {
2969 return do_proc_dointvec(table, write, buffer, lenp, ppos,
2970 do_proc_dointvec_ms_jiffies_conv, NULL);
2971 }
2972
2973 static int proc_do_cad_pid(struct ctl_table *table, int write,
2974 void __user *buffer, size_t *lenp, loff_t *ppos)
2975 {
2976 struct pid *new_pid;
2977 pid_t tmp;
2978 int r;
2979
2980 tmp = pid_vnr(cad_pid);
2981
2982 r = __do_proc_dointvec(&tmp, table, write, buffer,
2983 lenp, ppos, NULL, NULL);
2984 if (r || !write)
2985 return r;
2986
2987 new_pid = find_get_pid(tmp);
2988 if (!new_pid)
2989 return -ESRCH;
2990
2991 put_pid(xchg(&cad_pid, new_pid));
2992 return 0;
2993 }
2994
2995 /**
2996 * proc_do_large_bitmap - read/write from/to a large bitmap
2997 * @table: the sysctl table
2998 * @write: %TRUE if this is a write to the sysctl file
2999 * @buffer: the user buffer
3000 * @lenp: the size of the user buffer
3001 * @ppos: file position
3002 *
3003 * The bitmap is stored at table->data and the bitmap length (in bits)
3004 * in table->maxlen.
3005 *
3006 * We use a range comma separated format (e.g. 1,3-4,10-10) so that
3007 * large bitmaps may be represented in a compact manner. Writing into
3008 * the file will clear the bitmap then update it with the given input.
3009 *
3010 * Returns 0 on success.
3011 */
3012 int proc_do_large_bitmap(struct ctl_table *table, int write,
3013 void __user *buffer, size_t *lenp, loff_t *ppos)
3014 {
3015 int err = 0;
3016 bool first = 1;
3017 size_t left = *lenp;
3018 unsigned long bitmap_len = table->maxlen;
3019 unsigned long *bitmap = *(unsigned long **) table->data;
3020 unsigned long *tmp_bitmap = NULL;
3021 char tr_a[] = { '-', ',', '\n' }, tr_b[] = { ',', '\n', 0 }, c;
3022
3023 if (!bitmap || !bitmap_len || !left || (*ppos && !write)) {
3024 *lenp = 0;
3025 return 0;
3026 }
3027
3028 if (write) {
3029 char *kbuf, *p;
3030
3031 if (left > PAGE_SIZE - 1)
3032 left = PAGE_SIZE - 1;
3033
3034 p = kbuf = memdup_user_nul(buffer, left);
3035 if (IS_ERR(kbuf))
3036 return PTR_ERR(kbuf);
3037
3038 tmp_bitmap = kzalloc(BITS_TO_LONGS(bitmap_len) * sizeof(unsigned long),
3039 GFP_KERNEL);
3040 if (!tmp_bitmap) {
3041 kfree(kbuf);
3042 return -ENOMEM;
3043 }
3044 proc_skip_char(&p, &left, '\n');
3045 while (!err && left) {
3046 unsigned long val_a, val_b;
3047 bool neg;
3048
3049 err = proc_get_long(&p, &left, &val_a, &neg, tr_a,
3050 sizeof(tr_a), &c);
3051 if (err)
3052 break;
3053 if (val_a >= bitmap_len || neg) {
3054 err = -EINVAL;
3055 break;
3056 }
3057
3058 val_b = val_a;
3059 if (left) {
3060 p++;
3061 left--;
3062 }
3063
3064 if (c == '-') {
3065 err = proc_get_long(&p, &left, &val_b,
3066 &neg, tr_b, sizeof(tr_b),
3067 &c);
3068 if (err)
3069 break;
3070 if (val_b >= bitmap_len || neg ||
3071 val_a > val_b) {
3072 err = -EINVAL;
3073 break;
3074 }
3075 if (left) {
3076 p++;
3077 left--;
3078 }
3079 }
3080
3081 bitmap_set(tmp_bitmap, val_a, val_b - val_a + 1);
3082 first = 0;
3083 proc_skip_char(&p, &left, '\n');
3084 }
3085 kfree(kbuf);
3086 } else {
3087 unsigned long bit_a, bit_b = 0;
3088
3089 while (left) {
3090 bit_a = find_next_bit(bitmap, bitmap_len, bit_b);
3091 if (bit_a >= bitmap_len)
3092 break;
3093 bit_b = find_next_zero_bit(bitmap, bitmap_len,
3094 bit_a + 1) - 1;
3095
3096 if (!first) {
3097 err = proc_put_char(&buffer, &left, ',');
3098 if (err)
3099 break;
3100 }
3101 err = proc_put_long(&buffer, &left, bit_a, false);
3102 if (err)
3103 break;
3104 if (bit_a != bit_b) {
3105 err = proc_put_char(&buffer, &left, '-');
3106 if (err)
3107 break;
3108 err = proc_put_long(&buffer, &left, bit_b, false);
3109 if (err)
3110 break;
3111 }
3112
3113 first = 0; bit_b++;
3114 }
3115 if (!err)
3116 err = proc_put_char(&buffer, &left, '\n');
3117 }
3118
3119 if (!err) {
3120 if (write) {
3121 if (*ppos)
3122 bitmap_or(bitmap, bitmap, tmp_bitmap, bitmap_len);
3123 else
3124 bitmap_copy(bitmap, tmp_bitmap, bitmap_len);
3125 }
3126 kfree(tmp_bitmap);
3127 *lenp -= left;
3128 *ppos += *lenp;
3129 return 0;
3130 } else {
3131 kfree(tmp_bitmap);
3132 return err;
3133 }
3134 }
3135
3136 #else /* CONFIG_PROC_SYSCTL */
3137
3138 int proc_dostring(struct ctl_table *table, int write,
3139 void __user *buffer, size_t *lenp, loff_t *ppos)
3140 {
3141 return -ENOSYS;
3142 }
3143
3144 int proc_dointvec(struct ctl_table *table, int write,
3145 void __user *buffer, size_t *lenp, loff_t *ppos)
3146 {
3147 return -ENOSYS;
3148 }
3149
3150 int proc_douintvec(struct ctl_table *table, int write,
3151 void __user *buffer, size_t *lenp, loff_t *ppos)
3152 {
3153 return -ENOSYS;
3154 }
3155
3156 int proc_dointvec_minmax(struct ctl_table *table, int write,
3157 void __user *buffer, size_t *lenp, loff_t *ppos)
3158 {
3159 return -ENOSYS;
3160 }
3161
3162 int proc_douintvec_minmax(struct ctl_table *table, int write,
3163 void __user *buffer, size_t *lenp, loff_t *ppos)
3164 {
3165 return -ENOSYS;
3166 }
3167
3168 int proc_dointvec_jiffies(struct ctl_table *table, int write,
3169 void __user *buffer, size_t *lenp, loff_t *ppos)
3170 {
3171 return -ENOSYS;
3172 }
3173
3174 int proc_dointvec_userhz_jiffies(struct ctl_table *table, int write,
3175 void __user *buffer, size_t *lenp, loff_t *ppos)
3176 {
3177 return -ENOSYS;
3178 }
3179
3180 int proc_dointvec_ms_jiffies(struct ctl_table *table, int write,
3181 void __user *buffer, size_t *lenp, loff_t *ppos)
3182 {
3183 return -ENOSYS;
3184 }
3185
3186 int proc_doulongvec_minmax(struct ctl_table *table, int write,
3187 void __user *buffer, size_t *lenp, loff_t *ppos)
3188 {
3189 return -ENOSYS;
3190 }
3191
3192 int proc_doulongvec_ms_jiffies_minmax(struct ctl_table *table, int write,
3193 void __user *buffer,
3194 size_t *lenp, loff_t *ppos)
3195 {
3196 return -ENOSYS;
3197 }
3198
3199
3200 #endif /* CONFIG_PROC_SYSCTL */
3201
3202 /*
3203 * No sense putting this after each symbol definition, twice,
3204 * exception granted :-)
3205 */
3206 EXPORT_SYMBOL(proc_dointvec);
3207 EXPORT_SYMBOL(proc_douintvec);
3208 EXPORT_SYMBOL(proc_dointvec_jiffies);
3209 EXPORT_SYMBOL(proc_dointvec_minmax);
3210 EXPORT_SYMBOL_GPL(proc_douintvec_minmax);
3211 EXPORT_SYMBOL(proc_dointvec_userhz_jiffies);
3212 EXPORT_SYMBOL(proc_dointvec_ms_jiffies);
3213 EXPORT_SYMBOL(proc_dostring);
3214 EXPORT_SYMBOL(proc_doulongvec_minmax);
3215 EXPORT_SYMBOL(proc_doulongvec_ms_jiffies_minmax);