2 * sysctl.c: General linux system control interface
4 * Begun 24 March 1995, Stephen Tweedie
5 * Added /proc support, Dec 1995
6 * Added bdflush entry and intvec min/max checking, 2/23/96, Tom Dyas.
7 * Added hooks for /proc/sys/net (minor, minor patch), 96/4/1, Mike Shaver.
8 * Added kernel/java-{interpreter,appletviewer}, 96/5/10, Mike Shaver.
9 * Dynamic registration fixes, Stephen Tweedie.
10 * Added kswapd-interval, ctrl-alt-del, printk stuff, 1/8/97, Chris Horn.
11 * Made sysctl support optional via CONFIG_SYSCTL, 1/10/97, Chris Horn.
13 * Added proc_doulongvec_ms_jiffies_minmax, 09/08/99, Carlos H. Bauer.
14 * Added proc_doulongvec_minmax, 09/08/99, Carlos H. Bauer.
15 * Changed linked lists to use list.h instead of lists.h, 02/24/00, Bill Wendling.
17 * The list_for_each() macro wasn't appropriate for the sysctl loop.
18 * Removed it and replaced it with older style, 03/23/00, Bill Wendling
21 #include <linux/module.h>
23 #include <linux/swap.h>
24 #include <linux/slab.h>
25 #include <linux/sysctl.h>
26 #include <linux/proc_fs.h>
27 #include <linux/security.h>
28 #include <linux/ctype.h>
29 #include <linux/utsname.h>
30 #include <linux/smp_lock.h>
32 #include <linux/init.h>
33 #include <linux/kernel.h>
34 #include <linux/kobject.h>
35 #include <linux/net.h>
36 #include <linux/sysrq.h>
37 #include <linux/highuid.h>
38 #include <linux/writeback.h>
39 #include <linux/hugetlb.h>
40 #include <linux/initrd.h>
41 #include <linux/key.h>
42 #include <linux/times.h>
43 #include <linux/limits.h>
44 #include <linux/dcache.h>
45 #include <linux/syscalls.h>
46 #include <linux/nfs_fs.h>
47 #include <linux/acpi.h>
48 #include <linux/reboot.h>
50 #include <asm/uaccess.h>
51 #include <asm/processor.h>
55 #include <asm/stacktrace.h>
59 static int deprecated_sysctl_warning(struct __sysctl_args *args);
61 #if defined(CONFIG_SYSCTL)
63 /* External variables not in a header file. */
65 extern int print_fatal_signals;
66 extern int sysctl_overcommit_memory;
67 extern int sysctl_overcommit_ratio;
68 extern int sysctl_panic_on_oom;
69 extern int sysctl_oom_kill_allocating_task;
70 extern int sysctl_oom_dump_tasks;
71 extern int max_threads;
72 extern int core_uses_pid;
73 extern int suid_dumpable;
74 extern char core_pattern[];
76 extern int min_free_kbytes;
77 extern int pid_max_min, pid_max_max;
78 extern int sysctl_drop_caches;
79 extern int percpu_pagelist_fraction;
80 extern int compat_log;
81 extern int maps_protect;
82 extern int sysctl_stat_interval;
83 extern int latencytop_enabled;
84 extern int sysctl_nr_open_min, sysctl_nr_open_max;
86 /* Constants used for minimum and maximum */
87 #if defined(CONFIG_DETECT_SOFTLOCKUP) || defined(CONFIG_HIGHMEM)
91 #ifdef CONFIG_DETECT_SOFTLOCKUP
92 static int sixty = 60;
100 static int one_hundred = 100;
102 /* this is needed for the proc_dointvec_minmax for [fs_]overflow UID and GID */
103 static int maxolduid = 65535;
104 static int minolduid;
105 static int min_percpu_pagelist_fract = 8;
107 static int ngroups_max = NGROUPS_MAX;
110 extern char modprobe_path[];
112 #ifdef CONFIG_CHR_DEV_SG
113 extern int sg_big_buff;
117 extern char reboot_command [];
118 extern int stop_a_enabled;
119 extern int scons_pwroff;
123 extern int pwrsw_enabled;
124 extern int unaligned_enabled;
128 #ifdef CONFIG_MATHEMU
129 extern int sysctl_ieee_emulation_warnings;
131 extern int sysctl_userprocess_debug;
132 extern int spin_retry;
135 #ifdef CONFIG_BSD_PROCESS_ACCT
136 extern int acct_parm[];
140 extern int no_unaligned_warning;
143 #ifdef CONFIG_RT_MUTEXES
144 extern int max_lock_depth;
147 #ifdef CONFIG_PROC_SYSCTL
148 static int proc_do_cad_pid(struct ctl_table *table, int write, struct file *filp,
149 void __user *buffer, size_t *lenp, loff_t *ppos);
150 static int proc_dointvec_taint(struct ctl_table *table, int write, struct file *filp,
151 void __user *buffer, size_t *lenp, loff_t *ppos);
/*
 * Built-in sysctl root and the header for the default tables.
 *
 * The two objects are initialised to refer to each other: the header's
 * ctl_entry is initialised on the root's header_list and the root's
 * header_list is initialised on the header's ctl_entry, so the default
 * header is already linked on the root's header list at compile time.
 * The forward declarations are needed because of that mutual reference.
 */
154 static struct ctl_table root_table[];
155 static struct ctl_table_root sysctl_table_root;
156 static struct ctl_table_header root_table_header = {
157 .ctl_table = root_table,
158 .ctl_entry = LIST_HEAD_INIT(sysctl_table_root.header_list),
159 .root = &sysctl_table_root,
/* root_list starts out as an empty list; register_sysctl_root() appends to it */
161 static struct ctl_table_root sysctl_table_root = {
162 .root_list = LIST_HEAD_INIT(sysctl_table_root.root_list),
163 .header_list = LIST_HEAD_INIT(root_table_header.ctl_entry),
166 static struct ctl_table kern_table[];
167 static struct ctl_table vm_table[];
168 static struct ctl_table fs_table[];
169 static struct ctl_table debug_table[];
170 static struct ctl_table dev_table[];
171 extern struct ctl_table random_table[];
172 #ifdef CONFIG_INOTIFY_USER
173 extern struct ctl_table inotify_table[];
176 #ifdef HAVE_ARCH_PICK_MMAP_LAYOUT
177 int sysctl_legacy_va_layout;
180 extern int prove_locking;
181 extern int lock_stat;
183 /* The default sysctl tables: */
185 static struct ctl_table root_table[] = {
187 .ctl_name = CTL_KERN,
188 .procname = "kernel",
205 .ctl_name = CTL_DEBUG,
208 .child = debug_table,
217 * NOTE: do not add new entries to this table unless you have read
218 * Documentation/sysctl/ctl_unnumbered.txt
223 #ifdef CONFIG_SCHED_DEBUG
224 static int min_sched_granularity_ns = 100000; /* 100 usecs */
225 static int max_sched_granularity_ns = NSEC_PER_SEC; /* 1 second */
226 static int min_wakeup_granularity_ns; /* 0 usecs */
227 static int max_wakeup_granularity_ns = NSEC_PER_SEC; /* 1 second */
230 static struct ctl_table kern_table[] = {
231 #ifdef CONFIG_SCHED_DEBUG
233 .ctl_name = CTL_UNNUMBERED,
234 .procname = "sched_min_granularity_ns",
235 .data = &sysctl_sched_min_granularity,
236 .maxlen = sizeof(unsigned int),
238 .proc_handler = &sched_nr_latency_handler,
239 .strategy = &sysctl_intvec,
240 .extra1 = &min_sched_granularity_ns,
241 .extra2 = &max_sched_granularity_ns,
244 .ctl_name = CTL_UNNUMBERED,
245 .procname = "sched_latency_ns",
246 .data = &sysctl_sched_latency,
247 .maxlen = sizeof(unsigned int),
249 .proc_handler = &sched_nr_latency_handler,
250 .strategy = &sysctl_intvec,
251 .extra1 = &min_sched_granularity_ns,
252 .extra2 = &max_sched_granularity_ns,
255 .ctl_name = CTL_UNNUMBERED,
256 .procname = "sched_wakeup_granularity_ns",
257 .data = &sysctl_sched_wakeup_granularity,
258 .maxlen = sizeof(unsigned int),
260 .proc_handler = &proc_dointvec_minmax,
261 .strategy = &sysctl_intvec,
262 .extra1 = &min_wakeup_granularity_ns,
263 .extra2 = &max_wakeup_granularity_ns,
266 .ctl_name = CTL_UNNUMBERED,
267 .procname = "sched_child_runs_first",
268 .data = &sysctl_sched_child_runs_first,
269 .maxlen = sizeof(unsigned int),
271 .proc_handler = &proc_dointvec,
274 .ctl_name = CTL_UNNUMBERED,
275 .procname = "sched_features",
276 .data = &sysctl_sched_features,
277 .maxlen = sizeof(unsigned int),
279 .proc_handler = &proc_dointvec,
282 .ctl_name = CTL_UNNUMBERED,
283 .procname = "sched_migration_cost",
284 .data = &sysctl_sched_migration_cost,
285 .maxlen = sizeof(unsigned int),
287 .proc_handler = &proc_dointvec,
290 .ctl_name = CTL_UNNUMBERED,
291 .procname = "sched_nr_migrate",
292 .data = &sysctl_sched_nr_migrate,
293 .maxlen = sizeof(unsigned int),
295 .proc_handler = &proc_dointvec,
299 .ctl_name = CTL_UNNUMBERED,
300 .procname = "sched_rt_period_us",
301 .data = &sysctl_sched_rt_period,
302 .maxlen = sizeof(unsigned int),
304 .proc_handler = &sched_rt_handler,
307 .ctl_name = CTL_UNNUMBERED,
308 .procname = "sched_rt_runtime_us",
309 .data = &sysctl_sched_rt_runtime,
310 .maxlen = sizeof(int),
312 .proc_handler = &sched_rt_handler,
315 .ctl_name = CTL_UNNUMBERED,
316 .procname = "sched_compat_yield",
317 .data = &sysctl_sched_compat_yield,
318 .maxlen = sizeof(unsigned int),
320 .proc_handler = &proc_dointvec,
322 #ifdef CONFIG_PROVE_LOCKING
324 .ctl_name = CTL_UNNUMBERED,
325 .procname = "prove_locking",
326 .data = &prove_locking,
327 .maxlen = sizeof(int),
329 .proc_handler = &proc_dointvec,
332 #ifdef CONFIG_LOCK_STAT
334 .ctl_name = CTL_UNNUMBERED,
335 .procname = "lock_stat",
337 .maxlen = sizeof(int),
339 .proc_handler = &proc_dointvec,
343 .ctl_name = KERN_PANIC,
345 .data = &panic_timeout,
346 .maxlen = sizeof(int),
348 .proc_handler = &proc_dointvec,
351 .ctl_name = KERN_CORE_USES_PID,
352 .procname = "core_uses_pid",
353 .data = &core_uses_pid,
354 .maxlen = sizeof(int),
356 .proc_handler = &proc_dointvec,
359 .ctl_name = KERN_CORE_PATTERN,
360 .procname = "core_pattern",
361 .data = core_pattern,
362 .maxlen = CORENAME_MAX_SIZE,
364 .proc_handler = &proc_dostring,
365 .strategy = &sysctl_string,
367 #ifdef CONFIG_PROC_SYSCTL
369 .procname = "tainted",
371 .maxlen = sizeof(int),
373 .proc_handler = &proc_dointvec_taint,
376 #ifdef CONFIG_LATENCYTOP
378 .procname = "latencytop",
379 .data = &latencytop_enabled,
380 .maxlen = sizeof(int),
382 .proc_handler = &proc_dointvec,
385 #ifdef CONFIG_BLK_DEV_INITRD
387 .ctl_name = KERN_REALROOTDEV,
388 .procname = "real-root-dev",
389 .data = &real_root_dev,
390 .maxlen = sizeof(int),
392 .proc_handler = &proc_dointvec,
396 .ctl_name = CTL_UNNUMBERED,
397 .procname = "print-fatal-signals",
398 .data = &print_fatal_signals,
399 .maxlen = sizeof(int),
401 .proc_handler = &proc_dointvec,
405 .ctl_name = KERN_SPARC_REBOOT,
406 .procname = "reboot-cmd",
407 .data = reboot_command,
410 .proc_handler = &proc_dostring,
411 .strategy = &sysctl_string,
414 .ctl_name = KERN_SPARC_STOP_A,
415 .procname = "stop-a",
416 .data = &stop_a_enabled,
417 .maxlen = sizeof (int),
419 .proc_handler = &proc_dointvec,
422 .ctl_name = KERN_SPARC_SCONS_PWROFF,
423 .procname = "scons-poweroff",
424 .data = &scons_pwroff,
425 .maxlen = sizeof (int),
427 .proc_handler = &proc_dointvec,
432 .ctl_name = KERN_HPPA_PWRSW,
433 .procname = "soft-power",
434 .data = &pwrsw_enabled,
435 .maxlen = sizeof (int),
437 .proc_handler = &proc_dointvec,
440 .ctl_name = KERN_HPPA_UNALIGNED,
441 .procname = "unaligned-trap",
442 .data = &unaligned_enabled,
443 .maxlen = sizeof (int),
445 .proc_handler = &proc_dointvec,
449 .ctl_name = KERN_CTLALTDEL,
450 .procname = "ctrl-alt-del",
452 .maxlen = sizeof(int),
454 .proc_handler = &proc_dointvec,
458 .ctl_name = KERN_MODPROBE,
459 .procname = "modprobe",
460 .data = &modprobe_path,
461 .maxlen = KMOD_PATH_LEN,
463 .proc_handler = &proc_dostring,
464 .strategy = &sysctl_string,
467 #if defined(CONFIG_HOTPLUG) && defined(CONFIG_NET)
469 .ctl_name = KERN_HOTPLUG,
470 .procname = "hotplug",
471 .data = &uevent_helper,
472 .maxlen = UEVENT_HELPER_PATH_LEN,
474 .proc_handler = &proc_dostring,
475 .strategy = &sysctl_string,
478 #ifdef CONFIG_CHR_DEV_SG
480 .ctl_name = KERN_SG_BIG_BUFF,
481 .procname = "sg-big-buff",
482 .data = &sg_big_buff,
483 .maxlen = sizeof (int),
485 .proc_handler = &proc_dointvec,
488 #ifdef CONFIG_BSD_PROCESS_ACCT
490 .ctl_name = KERN_ACCT,
493 .maxlen = 3*sizeof(int),
495 .proc_handler = &proc_dointvec,
498 #ifdef CONFIG_MAGIC_SYSRQ
500 .ctl_name = KERN_SYSRQ,
502 .data = &__sysrq_enabled,
503 .maxlen = sizeof (int),
505 .proc_handler = &proc_dointvec,
508 #ifdef CONFIG_PROC_SYSCTL
510 .procname = "cad_pid",
512 .maxlen = sizeof (int),
514 .proc_handler = &proc_do_cad_pid,
518 .ctl_name = KERN_MAX_THREADS,
519 .procname = "threads-max",
520 .data = &max_threads,
521 .maxlen = sizeof(int),
523 .proc_handler = &proc_dointvec,
526 .ctl_name = KERN_RANDOM,
527 .procname = "random",
529 .child = random_table,
532 .ctl_name = KERN_OVERFLOWUID,
533 .procname = "overflowuid",
534 .data = &overflowuid,
535 .maxlen = sizeof(int),
537 .proc_handler = &proc_dointvec_minmax,
538 .strategy = &sysctl_intvec,
539 .extra1 = &minolduid,
540 .extra2 = &maxolduid,
543 .ctl_name = KERN_OVERFLOWGID,
544 .procname = "overflowgid",
545 .data = &overflowgid,
546 .maxlen = sizeof(int),
548 .proc_handler = &proc_dointvec_minmax,
549 .strategy = &sysctl_intvec,
550 .extra1 = &minolduid,
551 .extra2 = &maxolduid,
554 #ifdef CONFIG_MATHEMU
556 .ctl_name = KERN_IEEE_EMULATION_WARNINGS,
557 .procname = "ieee_emulation_warnings",
558 .data = &sysctl_ieee_emulation_warnings,
559 .maxlen = sizeof(int),
561 .proc_handler = &proc_dointvec,
565 .ctl_name = KERN_S390_USER_DEBUG_LOGGING,
566 .procname = "userprocess_debug",
567 .data = &sysctl_userprocess_debug,
568 .maxlen = sizeof(int),
570 .proc_handler = &proc_dointvec,
574 .ctl_name = KERN_PIDMAX,
575 .procname = "pid_max",
577 .maxlen = sizeof (int),
579 .proc_handler = &proc_dointvec_minmax,
580 .strategy = sysctl_intvec,
581 .extra1 = &pid_max_min,
582 .extra2 = &pid_max_max,
585 .ctl_name = KERN_PANIC_ON_OOPS,
586 .procname = "panic_on_oops",
587 .data = &panic_on_oops,
588 .maxlen = sizeof(int),
590 .proc_handler = &proc_dointvec,
592 #if defined CONFIG_PRINTK
594 .ctl_name = KERN_PRINTK,
595 .procname = "printk",
596 .data = &console_loglevel,
597 .maxlen = 4*sizeof(int),
599 .proc_handler = &proc_dointvec,
602 .ctl_name = KERN_PRINTK_RATELIMIT,
603 .procname = "printk_ratelimit",
604 .data = &printk_ratelimit_jiffies,
605 .maxlen = sizeof(int),
607 .proc_handler = &proc_dointvec_jiffies,
608 .strategy = &sysctl_jiffies,
611 .ctl_name = KERN_PRINTK_RATELIMIT_BURST,
612 .procname = "printk_ratelimit_burst",
613 .data = &printk_ratelimit_burst,
614 .maxlen = sizeof(int),
616 .proc_handler = &proc_dointvec,
620 .ctl_name = KERN_NGROUPS_MAX,
621 .procname = "ngroups_max",
622 .data = &ngroups_max,
623 .maxlen = sizeof (int),
625 .proc_handler = &proc_dointvec,
627 #if defined(CONFIG_X86_LOCAL_APIC) && defined(CONFIG_X86)
629 .ctl_name = KERN_UNKNOWN_NMI_PANIC,
630 .procname = "unknown_nmi_panic",
631 .data = &unknown_nmi_panic,
632 .maxlen = sizeof (int),
634 .proc_handler = &proc_dointvec,
637 .procname = "nmi_watchdog",
638 .data = &nmi_watchdog_enabled,
639 .maxlen = sizeof (int),
641 .proc_handler = &proc_nmi_enabled,
644 #if defined(CONFIG_X86)
646 .ctl_name = KERN_PANIC_ON_NMI,
647 .procname = "panic_on_unrecovered_nmi",
648 .data = &panic_on_unrecovered_nmi,
649 .maxlen = sizeof(int),
651 .proc_handler = &proc_dointvec,
654 .ctl_name = KERN_BOOTLOADER_TYPE,
655 .procname = "bootloader_type",
656 .data = &bootloader_type,
657 .maxlen = sizeof (int),
659 .proc_handler = &proc_dointvec,
662 .ctl_name = CTL_UNNUMBERED,
663 .procname = "kstack_depth_to_print",
664 .data = &kstack_depth_to_print,
665 .maxlen = sizeof(int),
667 .proc_handler = &proc_dointvec,
670 .ctl_name = CTL_UNNUMBERED,
671 .procname = "io_delay_type",
672 .data = &io_delay_type,
673 .maxlen = sizeof(int),
675 .proc_handler = &proc_dointvec,
678 #if defined(CONFIG_MMU)
680 .ctl_name = KERN_RANDOMIZE,
681 .procname = "randomize_va_space",
682 .data = &randomize_va_space,
683 .maxlen = sizeof(int),
685 .proc_handler = &proc_dointvec,
688 #if defined(CONFIG_S390) && defined(CONFIG_SMP)
690 .ctl_name = KERN_SPIN_RETRY,
691 .procname = "spin_retry",
693 .maxlen = sizeof (int),
695 .proc_handler = &proc_dointvec,
698 #if defined(CONFIG_ACPI_SLEEP) && defined(CONFIG_X86)
700 .procname = "acpi_video_flags",
701 .data = &acpi_realmode_flags,
702 .maxlen = sizeof (unsigned long),
704 .proc_handler = &proc_doulongvec_minmax,
709 .ctl_name = KERN_IA64_UNALIGNED,
710 .procname = "ignore-unaligned-usertrap",
711 .data = &no_unaligned_warning,
712 .maxlen = sizeof (int),
714 .proc_handler = &proc_dointvec,
717 #ifdef CONFIG_DETECT_SOFTLOCKUP
719 .ctl_name = CTL_UNNUMBERED,
720 .procname = "softlockup_thresh",
721 .data = &softlockup_thresh,
722 .maxlen = sizeof(unsigned long),
724 .proc_handler = &proc_doulongvec_minmax,
725 .strategy = &sysctl_intvec,
730 .ctl_name = CTL_UNNUMBERED,
731 .procname = "hung_task_check_count",
732 .data = &sysctl_hung_task_check_count,
733 .maxlen = sizeof(unsigned long),
735 .proc_handler = &proc_doulongvec_minmax,
736 .strategy = &sysctl_intvec,
739 .ctl_name = CTL_UNNUMBERED,
740 .procname = "hung_task_timeout_secs",
741 .data = &sysctl_hung_task_timeout_secs,
742 .maxlen = sizeof(unsigned long),
744 .proc_handler = &proc_doulongvec_minmax,
745 .strategy = &sysctl_intvec,
748 .ctl_name = CTL_UNNUMBERED,
749 .procname = "hung_task_warnings",
750 .data = &sysctl_hung_task_warnings,
751 .maxlen = sizeof(unsigned long),
753 .proc_handler = &proc_doulongvec_minmax,
754 .strategy = &sysctl_intvec,
759 .ctl_name = KERN_COMPAT_LOG,
760 .procname = "compat-log",
762 .maxlen = sizeof (int),
764 .proc_handler = &proc_dointvec,
767 #ifdef CONFIG_RT_MUTEXES
769 .ctl_name = KERN_MAX_LOCK_DEPTH,
770 .procname = "max_lock_depth",
771 .data = &max_lock_depth,
772 .maxlen = sizeof(int),
774 .proc_handler = &proc_dointvec,
777 #ifdef CONFIG_PROC_FS
779 .ctl_name = CTL_UNNUMBERED,
780 .procname = "maps_protect",
781 .data = &maps_protect,
782 .maxlen = sizeof(int),
784 .proc_handler = &proc_dointvec,
788 .ctl_name = CTL_UNNUMBERED,
789 .procname = "poweroff_cmd",
790 .data = &poweroff_cmd,
791 .maxlen = POWEROFF_CMD_PATH_LEN,
793 .proc_handler = &proc_dostring,
794 .strategy = &sysctl_string,
798 .ctl_name = CTL_UNNUMBERED,
801 .child = key_sysctls,
805 * NOTE: do not add new entries to this table unless you have read
806 * Documentation/sysctl/ctl_unnumbered.txt
811 static struct ctl_table vm_table[] = {
813 .ctl_name = VM_OVERCOMMIT_MEMORY,
814 .procname = "overcommit_memory",
815 .data = &sysctl_overcommit_memory,
816 .maxlen = sizeof(sysctl_overcommit_memory),
818 .proc_handler = &proc_dointvec,
821 .ctl_name = VM_PANIC_ON_OOM,
822 .procname = "panic_on_oom",
823 .data = &sysctl_panic_on_oom,
824 .maxlen = sizeof(sysctl_panic_on_oom),
826 .proc_handler = &proc_dointvec,
829 .ctl_name = CTL_UNNUMBERED,
830 .procname = "oom_kill_allocating_task",
831 .data = &sysctl_oom_kill_allocating_task,
832 .maxlen = sizeof(sysctl_oom_kill_allocating_task),
834 .proc_handler = &proc_dointvec,
837 .ctl_name = CTL_UNNUMBERED,
838 .procname = "oom_dump_tasks",
839 .data = &sysctl_oom_dump_tasks,
840 .maxlen = sizeof(sysctl_oom_dump_tasks),
842 .proc_handler = &proc_dointvec,
845 .ctl_name = VM_OVERCOMMIT_RATIO,
846 .procname = "overcommit_ratio",
847 .data = &sysctl_overcommit_ratio,
848 .maxlen = sizeof(sysctl_overcommit_ratio),
850 .proc_handler = &proc_dointvec,
853 .ctl_name = VM_PAGE_CLUSTER,
854 .procname = "page-cluster",
855 .data = &page_cluster,
856 .maxlen = sizeof(int),
858 .proc_handler = &proc_dointvec,
861 .ctl_name = VM_DIRTY_BACKGROUND,
862 .procname = "dirty_background_ratio",
863 .data = &dirty_background_ratio,
864 .maxlen = sizeof(dirty_background_ratio),
866 .proc_handler = &proc_dointvec_minmax,
867 .strategy = &sysctl_intvec,
869 .extra2 = &one_hundred,
872 .ctl_name = VM_DIRTY_RATIO,
873 .procname = "dirty_ratio",
874 .data = &vm_dirty_ratio,
875 .maxlen = sizeof(vm_dirty_ratio),
877 .proc_handler = &dirty_ratio_handler,
878 .strategy = &sysctl_intvec,
880 .extra2 = &one_hundred,
883 .procname = "dirty_writeback_centisecs",
884 .data = &dirty_writeback_interval,
885 .maxlen = sizeof(dirty_writeback_interval),
887 .proc_handler = &dirty_writeback_centisecs_handler,
890 .procname = "dirty_expire_centisecs",
891 .data = &dirty_expire_interval,
892 .maxlen = sizeof(dirty_expire_interval),
894 .proc_handler = &proc_dointvec_userhz_jiffies,
897 .ctl_name = VM_NR_PDFLUSH_THREADS,
898 .procname = "nr_pdflush_threads",
899 .data = &nr_pdflush_threads,
900 .maxlen = sizeof nr_pdflush_threads,
901 .mode = 0444 /* read-only*/,
902 .proc_handler = &proc_dointvec,
905 .ctl_name = VM_SWAPPINESS,
906 .procname = "swappiness",
907 .data = &vm_swappiness,
908 .maxlen = sizeof(vm_swappiness),
910 .proc_handler = &proc_dointvec_minmax,
911 .strategy = &sysctl_intvec,
913 .extra2 = &one_hundred,
915 #ifdef CONFIG_HUGETLB_PAGE
917 .procname = "nr_hugepages",
918 .data = &max_huge_pages,
919 .maxlen = sizeof(unsigned long),
921 .proc_handler = &hugetlb_sysctl_handler,
922 .extra1 = (void *)&hugetlb_zero,
923 .extra2 = (void *)&hugetlb_infinity,
926 .ctl_name = VM_HUGETLB_GROUP,
927 .procname = "hugetlb_shm_group",
928 .data = &sysctl_hugetlb_shm_group,
929 .maxlen = sizeof(gid_t),
931 .proc_handler = &proc_dointvec,
934 .ctl_name = CTL_UNNUMBERED,
935 .procname = "hugepages_treat_as_movable",
936 .data = &hugepages_treat_as_movable,
937 .maxlen = sizeof(int),
939 .proc_handler = &hugetlb_treat_movable_handler,
942 .ctl_name = CTL_UNNUMBERED,
943 .procname = "nr_overcommit_hugepages",
944 .data = &sysctl_overcommit_huge_pages,
945 .maxlen = sizeof(sysctl_overcommit_huge_pages),
947 .proc_handler = &hugetlb_overcommit_handler,
951 .ctl_name = VM_LOWMEM_RESERVE_RATIO,
952 .procname = "lowmem_reserve_ratio",
953 .data = &sysctl_lowmem_reserve_ratio,
954 .maxlen = sizeof(sysctl_lowmem_reserve_ratio),
956 .proc_handler = &lowmem_reserve_ratio_sysctl_handler,
957 .strategy = &sysctl_intvec,
960 .ctl_name = VM_DROP_PAGECACHE,
961 .procname = "drop_caches",
962 .data = &sysctl_drop_caches,
963 .maxlen = sizeof(int),
965 .proc_handler = drop_caches_sysctl_handler,
966 .strategy = &sysctl_intvec,
969 .ctl_name = VM_MIN_FREE_KBYTES,
970 .procname = "min_free_kbytes",
971 .data = &min_free_kbytes,
972 .maxlen = sizeof(min_free_kbytes),
974 .proc_handler = &min_free_kbytes_sysctl_handler,
975 .strategy = &sysctl_intvec,
979 .ctl_name = VM_PERCPU_PAGELIST_FRACTION,
980 .procname = "percpu_pagelist_fraction",
981 .data = &percpu_pagelist_fraction,
982 .maxlen = sizeof(percpu_pagelist_fraction),
984 .proc_handler = &percpu_pagelist_fraction_sysctl_handler,
985 .strategy = &sysctl_intvec,
986 .extra1 = &min_percpu_pagelist_fract,
990 .ctl_name = VM_MAX_MAP_COUNT,
991 .procname = "max_map_count",
992 .data = &sysctl_max_map_count,
993 .maxlen = sizeof(sysctl_max_map_count),
995 .proc_handler = &proc_dointvec
999 .ctl_name = VM_LAPTOP_MODE,
1000 .procname = "laptop_mode",
1001 .data = &laptop_mode,
1002 .maxlen = sizeof(laptop_mode),
1004 .proc_handler = &proc_dointvec_jiffies,
1005 .strategy = &sysctl_jiffies,
1008 .ctl_name = VM_BLOCK_DUMP,
1009 .procname = "block_dump",
1010 .data = &block_dump,
1011 .maxlen = sizeof(block_dump),
1013 .proc_handler = &proc_dointvec,
1014 .strategy = &sysctl_intvec,
1018 .ctl_name = VM_VFS_CACHE_PRESSURE,
1019 .procname = "vfs_cache_pressure",
1020 .data = &sysctl_vfs_cache_pressure,
1021 .maxlen = sizeof(sysctl_vfs_cache_pressure),
1023 .proc_handler = &proc_dointvec,
1024 .strategy = &sysctl_intvec,
1027 #ifdef HAVE_ARCH_PICK_MMAP_LAYOUT
1029 .ctl_name = VM_LEGACY_VA_LAYOUT,
1030 .procname = "legacy_va_layout",
1031 .data = &sysctl_legacy_va_layout,
1032 .maxlen = sizeof(sysctl_legacy_va_layout),
1034 .proc_handler = &proc_dointvec,
1035 .strategy = &sysctl_intvec,
1041 .ctl_name = VM_ZONE_RECLAIM_MODE,
1042 .procname = "zone_reclaim_mode",
1043 .data = &zone_reclaim_mode,
1044 .maxlen = sizeof(zone_reclaim_mode),
1046 .proc_handler = &proc_dointvec,
1047 .strategy = &sysctl_intvec,
1051 .ctl_name = VM_MIN_UNMAPPED,
1052 .procname = "min_unmapped_ratio",
1053 .data = &sysctl_min_unmapped_ratio,
1054 .maxlen = sizeof(sysctl_min_unmapped_ratio),
1056 .proc_handler = &sysctl_min_unmapped_ratio_sysctl_handler,
1057 .strategy = &sysctl_intvec,
1059 .extra2 = &one_hundred,
1062 .ctl_name = VM_MIN_SLAB,
1063 .procname = "min_slab_ratio",
1064 .data = &sysctl_min_slab_ratio,
1065 .maxlen = sizeof(sysctl_min_slab_ratio),
1067 .proc_handler = &sysctl_min_slab_ratio_sysctl_handler,
1068 .strategy = &sysctl_intvec,
1070 .extra2 = &one_hundred,
1075 .ctl_name = CTL_UNNUMBERED,
1076 .procname = "stat_interval",
1077 .data = &sysctl_stat_interval,
1078 .maxlen = sizeof(sysctl_stat_interval),
1080 .proc_handler = &proc_dointvec_jiffies,
1081 .strategy = &sysctl_jiffies,
1084 #ifdef CONFIG_SECURITY
1086 .ctl_name = CTL_UNNUMBERED,
1087 .procname = "mmap_min_addr",
1088 .data = &mmap_min_addr,
1089 .maxlen = sizeof(unsigned long),
1091 .proc_handler = &proc_doulongvec_minmax,
1096 .ctl_name = CTL_UNNUMBERED,
1097 .procname = "numa_zonelist_order",
1098 .data = &numa_zonelist_order,
1099 .maxlen = NUMA_ZONELIST_ORDER_LEN,
1101 .proc_handler = &numa_zonelist_order_handler,
1102 .strategy = &sysctl_string,
1105 #if (defined(CONFIG_X86_32) && !defined(CONFIG_UML))|| \
1106 (defined(CONFIG_SUPERH) && defined(CONFIG_VSYSCALL))
1108 .ctl_name = VM_VDSO_ENABLED,
1109 .procname = "vdso_enabled",
1110 .data = &vdso_enabled,
1111 .maxlen = sizeof(vdso_enabled),
1113 .proc_handler = &proc_dointvec,
1114 .strategy = &sysctl_intvec,
1118 #ifdef CONFIG_HIGHMEM
1120 .ctl_name = CTL_UNNUMBERED,
1121 .procname = "highmem_is_dirtyable",
1122 .data = &vm_highmem_is_dirtyable,
1123 .maxlen = sizeof(vm_highmem_is_dirtyable),
1125 .proc_handler = &proc_dointvec_minmax,
1126 .strategy = &sysctl_intvec,
1132 * NOTE: do not add new entries to this table unless you have read
1133 * Documentation/sysctl/ctl_unnumbered.txt
1138 #if defined(CONFIG_BINFMT_MISC) || defined(CONFIG_BINFMT_MISC_MODULE)
1139 static struct ctl_table binfmt_misc_table[] = {
1144 static struct ctl_table fs_table[] = {
1146 .ctl_name = FS_NRINODE,
1147 .procname = "inode-nr",
1148 .data = &inodes_stat,
1149 .maxlen = 2*sizeof(int),
1151 .proc_handler = &proc_dointvec,
1154 .ctl_name = FS_STATINODE,
1155 .procname = "inode-state",
1156 .data = &inodes_stat,
1157 .maxlen = 7*sizeof(int),
1159 .proc_handler = &proc_dointvec,
1162 .procname = "file-nr",
1163 .data = &files_stat,
1164 .maxlen = 3*sizeof(int),
1166 .proc_handler = &proc_nr_files,
1169 .ctl_name = FS_MAXFILE,
1170 .procname = "file-max",
1171 .data = &files_stat.max_files,
1172 .maxlen = sizeof(int),
1174 .proc_handler = &proc_dointvec,
1177 .ctl_name = CTL_UNNUMBERED,
1178 .procname = "nr_open",
1179 .data = &sysctl_nr_open,
1180 .maxlen = sizeof(int),
1182 .proc_handler = &proc_dointvec_minmax,
1183 .extra1 = &sysctl_nr_open_min,
1184 .extra2 = &sysctl_nr_open_max,
1187 .ctl_name = FS_DENTRY,
1188 .procname = "dentry-state",
1189 .data = &dentry_stat,
1190 .maxlen = 6*sizeof(int),
1192 .proc_handler = &proc_dointvec,
1195 .ctl_name = FS_OVERFLOWUID,
1196 .procname = "overflowuid",
1197 .data = &fs_overflowuid,
1198 .maxlen = sizeof(int),
1200 .proc_handler = &proc_dointvec_minmax,
1201 .strategy = &sysctl_intvec,
1202 .extra1 = &minolduid,
1203 .extra2 = &maxolduid,
1206 .ctl_name = FS_OVERFLOWGID,
1207 .procname = "overflowgid",
1208 .data = &fs_overflowgid,
1209 .maxlen = sizeof(int),
1211 .proc_handler = &proc_dointvec_minmax,
1212 .strategy = &sysctl_intvec,
1213 .extra1 = &minolduid,
1214 .extra2 = &maxolduid,
1217 .ctl_name = FS_LEASES,
1218 .procname = "leases-enable",
1219 .data = &leases_enable,
1220 .maxlen = sizeof(int),
1222 .proc_handler = &proc_dointvec,
1224 #ifdef CONFIG_DNOTIFY
1226 .ctl_name = FS_DIR_NOTIFY,
1227 .procname = "dir-notify-enable",
1228 .data = &dir_notify_enable,
1229 .maxlen = sizeof(int),
1231 .proc_handler = &proc_dointvec,
1236 .ctl_name = FS_LEASE_TIME,
1237 .procname = "lease-break-time",
1238 .data = &lease_break_time,
1239 .maxlen = sizeof(int),
1241 .proc_handler = &proc_dointvec_minmax,
1242 .strategy = &sysctl_intvec,
1247 .procname = "aio-nr",
1249 .maxlen = sizeof(aio_nr),
1251 .proc_handler = &proc_doulongvec_minmax,
1254 .procname = "aio-max-nr",
1255 .data = &aio_max_nr,
1256 .maxlen = sizeof(aio_max_nr),
1258 .proc_handler = &proc_doulongvec_minmax,
1260 #ifdef CONFIG_INOTIFY_USER
1262 .ctl_name = FS_INOTIFY,
1263 .procname = "inotify",
1265 .child = inotify_table,
1270 .ctl_name = KERN_SETUID_DUMPABLE,
1271 .procname = "suid_dumpable",
1272 .data = &suid_dumpable,
1273 .maxlen = sizeof(int),
1275 .proc_handler = &proc_dointvec,
1277 #if defined(CONFIG_BINFMT_MISC) || defined(CONFIG_BINFMT_MISC_MODULE)
1279 .ctl_name = CTL_UNNUMBERED,
1280 .procname = "binfmt_misc",
1282 .child = binfmt_misc_table,
1286 * NOTE: do not add new entries to this table unless you have read
1287 * Documentation/sysctl/ctl_unnumbered.txt
1292 static struct ctl_table debug_table[] = {
1293 #if defined(CONFIG_X86) || defined(CONFIG_PPC)
1295 .ctl_name = CTL_UNNUMBERED,
1296 .procname = "exception-trace",
1297 .data = &show_unhandled_signals,
1298 .maxlen = sizeof(int),
1300 .proc_handler = proc_dointvec
1306 static struct ctl_table dev_table[] = {
/*
 * Spinlock taken by the header iteration and registration code in this
 * file (sysctl_head_finish(), __sysctl_head_next(), register_sysctl_root());
 * use_table(), unuse_table() and start_unregistering() expect it to be held
 * by their caller.
 */
1310 static DEFINE_SPINLOCK(sysctl_lock);
1312 /* called under sysctl_lock */
/*
 * use_table - try to start using table header @p.
 *
 * The visible code tests p->unregistering, i.e. whether an unregistration
 * is pending on this header.  The int result is tested by
 * __sysctl_head_next().
 *
 * NOTE(review): the statements after the test (the return values and,
 * presumably, the p->used accounting) are not visible in this excerpt;
 * confirm against the full file.
 */
1313 static int use_table(struct ctl_table_header *p)
1315 if (unlikely(p->unregistering))
1321 /* called under sysctl_lock */
/*
 * unuse_table - stop using table header @p.
 *
 * If an unregistration is pending (p->unregistering is set), signal the
 * completion it points to; start_unregistering() sleeps on that completion.
 *
 * NOTE(review): the line preceding the test is not visible here; it
 * presumably drops the usage count and only proceeds when it reaches
 * zero -- confirm against the full file.
 */
1322 static void unuse_table(struct ctl_table_header *p)
1325 if (unlikely(p->unregistering))
1326 complete(p->unregistering);
1329 /* called under sysctl_lock, will reacquire if has to wait */
/*
 * start_unregistering - detach header @p once nobody is using it.
 *
 * While p->used is non-zero the function publishes an on-stack completion
 * through p->unregistering, drops sysctl_lock, sleeps until the completion
 * is signalled (unuse_table() calls complete() on p->unregistering) and
 * then retakes the lock.  Finally the header is unlinked from its list
 * with list_del_init().
 */
1330 static void start_unregistering(struct ctl_table_header *p)
1333 * if p->used is 0, nobody will ever touch that entry again;
1334 * we'll eliminate all paths to it before dropping sysctl_lock
1336 if (unlikely(p->used)) {
1337 struct completion wait;
1338 init_completion(&wait);
/* make the completion reachable from unuse_table() */
1339 p->unregistering = &wait;
/* wait_for_completion() may sleep, so the spinlock is released around it */
1340 spin_unlock(&sysctl_lock);
1341 wait_for_completion(&wait);
1342 spin_lock(&sysctl_lock);
1345 * do not remove from the list until nobody holds it; walking the
1346 * list in do_sysctl() relies on that.
1348 list_del_init(&p->ctl_entry);
/*
 * sysctl_head_finish - finish with a header obtained from the iteration.
 * @head: header to release
 *
 * do_sysctl() calls this when it leaves its sysctl_head_next() loop early.
 * The work is done with sysctl_lock held.
 *
 * NOTE(review): the statement executed under the lock and any early
 * return for a NULL @head are not visible in this excerpt (presumably
 * unuse_table(head)) -- confirm against the full file.
 */
1351 void sysctl_head_finish(struct ctl_table_header *head)
1355 spin_lock(&sysctl_lock);
1357 spin_unlock(&sysctl_lock);
/*
 * lookup_header_list - choose the list of table headers to walk for @root.
 * @root:       sysctl root being examined
 * @namespaces: passed through to the root's lookup callback
 *
 * Starts from root->header_list and may replace it with the list returned
 * by root->lookup(root, namespaces).
 *
 * NOTE(review): the condition guarding the lookup call and the return
 * statement are not visible here; presumably the callback is only used
 * when root->lookup is non-NULL -- confirm against the full file.
 */
1360 static struct list_head *
1361 lookup_header_list(struct ctl_table_root *root, struct nsproxy *namespaces)
1363 struct list_head *header_list;
1364 header_list = &root->header_list;
1366 header_list = root->lookup(root, namespaces);
/*
 * __sysctl_head_next - advance the table-header iteration by one step.
 * @namespaces: handed to lookup_header_list() to choose each root's list
 * @prev:       header returned by the previous step; do_sysctl() starts an
 *              iteration by passing NULL (through sysctl_head_next())
 *
 * The walk runs under sysctl_lock.  The visible code resumes from
 * prev->ctl_entry or starts at root_table_header, and calls use_table()
 * on each candidate header.  When the current root's header list is
 * exhausted the walk follows root_list to the next ctl_table_root,
 * passing over roots whose header list is empty, and checks for having
 * wrapped round to sysctl_table_root.
 *
 * NOTE(review): several lines (branch tests, gotos, returns) are missing
 * from this excerpt, so the exact return values and whether @prev is
 * released here must be confirmed against the full file.
 */
1370 struct ctl_table_header *__sysctl_head_next(struct nsproxy *namespaces,
1371 struct ctl_table_header *prev)
1373 struct ctl_table_root *root;
1374 struct list_head *header_list;
1375 struct ctl_table_header *head;
1376 struct list_head *tmp;
1378 spin_lock(&sysctl_lock);
/* resume point when a previous header was supplied */
1381 tmp = &prev->ctl_entry;
/* starting point of a fresh iteration: the built-in default tables */
1385 tmp = &root_table_header.ctl_entry;
1387 head = list_entry(tmp, struct ctl_table_header, ctl_entry);
1389 if (!use_table(head))
1391 spin_unlock(&sysctl_lock);
/* tmp == header_list means the end of this root's list has been reached */
1396 header_list = lookup_header_list(root, namespaces);
1397 if (tmp != header_list)
/* move on to the next registered root */
1401 root = list_entry(root->root_list.next,
1402 struct ctl_table_root, root_list);
1403 if (root == &sysctl_table_root)
1405 header_list = lookup_header_list(root, namespaces);
1406 } while (list_empty(header_list));
1407 tmp = header_list->next;
1410 spin_unlock(&sysctl_lock);
/*
 * sysctl_head_next - iterate table headers as seen by the calling task.
 * @prev: header returned by the previous call (do_sysctl() passes NULL
 *        to start)
 *
 * Thin wrapper around __sysctl_head_next() that supplies
 * current->nsproxy as the namespace set.
 */
1414 struct ctl_table_header *sysctl_head_next(struct ctl_table_header *prev)
1416 return __sysctl_head_next(current->nsproxy, prev);
/*
 * register_sysctl_root - add @root to the list of sysctl roots.
 * @root: root to register
 *
 * Appends root->root_list to the tail of the list anchored at
 * sysctl_table_root.root_list, under sysctl_lock.  __sysctl_head_next()
 * follows this list when it moves from one root to the next.
 */
1419 void register_sysctl_root(struct ctl_table_root *root)
1421 spin_lock(&sysctl_lock);
1422 list_add_tail(&root->root_list, &sysctl_table_root.root_list);
1423 spin_unlock(&sysctl_lock);
1426 #ifdef CONFIG_SYSCTL_SYSCALL
1427 /* Perform the actual read/write of a sysctl table entry. */
/*
 * Visible order of operations:
 *   1. sysctl_perm(root, table, op) must allow the access;
 *   2. if the entry has a strategy callback, it is called with the
 *      name/old/new arguments;
 *   3. if the entry has both data and maxlen, sysctl_data() performs the
 *      generic transfer.
 *
 * NOTE(review): the computation of op, the handling of rc after each call
 * and the return statements are not visible in this excerpt -- confirm
 * against the full file.
 */
1428 static int do_sysctl_strategy(struct ctl_table_root *root,
1429 struct ctl_table *table,
1430 int __user *name, int nlen,
1431 void __user *oldval, size_t __user *oldlenp,
1432 void __user *newval, size_t newlen)
1440 if (sysctl_perm(root, table, op))
1443 if (table->strategy) {
1444 rc = table->strategy(table, name, nlen, oldval, oldlenp,
1452 /* If there is no strategy routine, or if the strategy returns
1453 * zero, proceed with automatic r/w */
1454 if (table->data && table->maxlen) {
1455 rc = sysctl_data(table, name, nlen, oldval, oldlenp,
/*
 * parse_table - look up a numeric sysctl name in @table.
 *
 * Reads one component of the name from user space with get_user() and
 * scans @table for an entry whose ctl_name equals it.  The scan ends at
 * an entry with neither ctl_name nor procname set.  On a match the
 * visible code checks sysctl_perm(root, table, 001), can continue in
 * table->child, and hands the entry to do_sysctl_strategy().
 *
 * NOTE(review): the branch structure (which matches descend into the
 * child and which go to do_sysctl_strategy(), how name/nlen advance, and
 * the error returns) is not visible in this excerpt -- confirm against
 * the full file.
 */
1463 static int parse_table(int __user *name, int nlen,
1464 void __user *oldval, size_t __user *oldlenp,
1465 void __user *newval, size_t newlen,
1466 struct ctl_table_root *root,
1467 struct ctl_table *table)
1473 if (get_user(n, name))
1475 for ( ; table->ctl_name || table->procname; table++) {
/* entries without a binary ctl_name get separate treatment here */
1476 if (!table->ctl_name)
1478 if (n == table->ctl_name) {
1481 if (sysctl_perm(root, table, 001))
1485 table = table->child;
1488 error = do_sysctl_strategy(root, table, name, nlen,
/*
 * do_sysctl - perform a binary sysctl request.
 * @name/@nlen:      user-space array of name components and its length
 * @oldval/@oldlenp: user buffer and length pointer for the current value
 * @newval/@newlen:  user buffer and length of the value to store
 *
 * Checks @nlen against the range 1 .. CTL_MAXNAME-1 and reads the old
 * length through @oldlenp (failing if @oldlenp is NULL or unreadable).
 * It then tries parse_table() on each header produced by
 * sysctl_head_next().  The first result other than -ENOTDIR ends the
 * walk, and that header is released with sysctl_head_finish().  error
 * starts out as -ENOTDIR.
 *
 * NOTE(review): the return statements and the condition under which the
 * old length is read are not visible in this excerpt -- confirm against
 * the full file.
 */
1497 int do_sysctl(int __user *name, int nlen, void __user *oldval, size_t __user *oldlenp,
1498 void __user *newval, size_t newlen)
1500 struct ctl_table_header *head;
1501 int error = -ENOTDIR;
1503 if (nlen <= 0 || nlen >= CTL_MAXNAME)
1507 if (!oldlenp || get_user(old_len, oldlenp))
1511 for (head = sysctl_head_next(NULL); head;
1512 head = sysctl_head_next(head)) {
1513 error = parse_table(name, nlen, oldval, oldlenp,
1515 head->root, head->ctl_table);
/* leaving the loop early: the current header has to be released by hand */
1516 if (error != -ENOTDIR) {
1517 sysctl_head_finish(head);
1524 asmlinkage long sys_sysctl(struct __sysctl_args __user *args)
1526 struct __sysctl_args tmp;
1529 if (copy_from_user(&tmp, args, sizeof(tmp)))
1532 error = deprecated_sysctl_warning(&tmp);
1537 error = do_sysctl(tmp.name, tmp.nlen, tmp.oldval, tmp.oldlenp,
1538 tmp.newval, tmp.newlen);
1543 #endif /* CONFIG_SYSCTL_SYSCALL */
1546 * sysctl_perm does NOT grant the superuser all rights automatically, because
1547 * some sysctl variables are readonly even to root.
1550 static int test_perm(int mode, int op)
1554 else if (in_egroup_p(0))
1556 if ((mode & op & 0007) == op)
1561 int sysctl_perm(struct ctl_table_root *root, struct ctl_table *table, int op)
1566 error = security_sysctl(table, op);
1570 if (root->permissions)
1571 mode = root->permissions(root, current->nsproxy, table);
1575 return test_perm(mode, op);
1578 static void sysctl_set_parent(struct ctl_table *parent, struct ctl_table *table)
1580 for (; table->ctl_name || table->procname; table++) {
1581 table->parent = parent;
1583 sysctl_set_parent(table, table->child);
1587 static __init int sysctl_init(void)
1589 sysctl_set_parent(NULL, root_table);
1590 #ifdef CONFIG_SYSCTL_SYSCALL_CHECK
1593 err = sysctl_check_table(current->nsproxy, root_table);
1599 core_initcall(sysctl_init);
1602 * __register_sysctl_paths - register a sysctl hierarchy
1603 * @root: List of sysctl headers to register on
1604 * @namespaces: Data to compute which lists of sysctl entries are visible
1605 * @path: The path to the directory the sysctl table is in.
1606 * @table: the top-level table structure
1608 * Register a sysctl table hierarchy. @table should be a filled in ctl_table
1609 * array. A completely 0 filled entry terminates the table.
1611 * The members of the &struct ctl_table structure are used as follows:
1613 * ctl_name - This is the numeric sysctl value used by sysctl(2). The number
1614 * must be unique within that level of sysctl
1616 * procname - the name of the sysctl file under /proc/sys. Set to %NULL to not
1617 * enter a sysctl file
1619 * data - a pointer to data for use by proc_handler
1621 * maxlen - the maximum size in bytes of the data
1623 * mode - the file permissions for the /proc/sys file, and for sysctl(2)
1625 * child - a pointer to the child sysctl table if this entry is a directory, or %NULL otherwise
1628 * proc_handler - the text handler routine (described below)
1630 * strategy - the strategy routine (described below)
1632 * de - for internal use by the sysctl routines
1634 * extra1, extra2 - extra pointers usable by the proc handler routines
1636 * Leaf nodes in the sysctl tree will be represented by a single file
1637 * under /proc; non-leaf nodes will be represented by directories.
1639 * sysctl(2) can automatically manage read and write requests through
1640 * the sysctl table. The data and maxlen fields of the ctl_table
1641 * struct enable minimal validation of the values being written to be
1642 * performed, and the mode field allows minimal authentication.
1644 * More sophisticated management can be enabled by the provision of a
1645 * strategy routine with the table entry. This will be called before
1646 * any automatic read or write of the data is performed.
1648 * The strategy routine may return
1650 * < 0 - Error occurred (error is passed to user process)
1652 * 0 - OK - proceed with automatic read or write.
1654 * > 0 - OK - read or write has been done by the strategy routine, so
1655 * return immediately.
1657 * There must be a proc_handler routine for any terminal nodes
1658 * mirrored under /proc/sys (non-terminals are handled by a built-in
1659 * directory handler). Several default handlers are available to
1660 * cover common cases -
1662 * proc_dostring(), proc_dointvec(), proc_dointvec_jiffies(),
1663 * proc_dointvec_userhz_jiffies(), proc_dointvec_minmax(),
1664 * proc_doulongvec_ms_jiffies_minmax(), proc_doulongvec_minmax()
1666 * It is the handler's job to read the input buffer from user memory
1667 * and process it. The handler should return 0 on success.
1669 * This routine returns %NULL on a failure to register, and a pointer
1670 * to the table header on success.
1672 struct ctl_table_header *__register_sysctl_paths(
1673 struct ctl_table_root *root,
1674 struct nsproxy *namespaces,
1675 const struct ctl_path *path, struct ctl_table *table)
1677 struct list_head *header_list;
1678 struct ctl_table_header *header;
1679 struct ctl_table *new, **prevp;
1680 unsigned int n, npath;
1682 /* Count the path components */
1683 for (npath = 0; path[npath].ctl_name || path[npath].procname; ++npath)
1687 * For each path component, allocate a 2-element ctl_table array.
1688 * The first array element will be filled with the sysctl entry
1689 * for this path component, the second will be the sentinel (ctl_name == 0 and procname == NULL).
1691 * We allocate everything in one go so that we don't have to
1692 * worry about freeing additional memory in unregister_sysctl_table.
1694 header = kzalloc(sizeof(struct ctl_table_header) +
1695 (2 * npath * sizeof(struct ctl_table)), GFP_KERNEL);
1699 new = (struct ctl_table *) (header + 1);
1701 /* Now connect the dots */
1702 prevp = &header->ctl_table;
1703 for (n = 0; n < npath; ++n, ++path) {
1704 /* Copy the procname and ctl_name */
1705 new->procname = path->procname;
1706 new->ctl_name = path->ctl_name;
1710 prevp = &new->child;
1715 header->ctl_table_arg = table;
1717 INIT_LIST_HEAD(&header->ctl_entry);
1719 header->unregistering = NULL;
1720 header->root = root;
1721 sysctl_set_parent(NULL, header->ctl_table);
1722 #ifdef CONFIG_SYSCTL_SYSCALL_CHECK
1723 if (sysctl_check_table(namespaces, header->ctl_table)) {
1728 spin_lock(&sysctl_lock);
1729 header_list = lookup_header_list(root, namespaces);
1730 list_add_tail(&header->ctl_entry, header_list);
1731 spin_unlock(&sysctl_lock);
1737 * register_sysctl_paths - register a sysctl table hierarchy
1738 * @path: The path to the directory the sysctl table is in.
1739 * @table: the top-level table structure
1741 * Register a sysctl table hierarchy. @table should be a filled in ctl_table
1742 * array. A completely 0 filled entry terminates the table.
1744 * See __register_sysctl_paths for more details.
1746 struct ctl_table_header *register_sysctl_paths(const struct ctl_path *path,
1747 struct ctl_table *table)
1749 return __register_sysctl_paths(&sysctl_table_root, current->nsproxy,
1754 * register_sysctl_table - register a sysctl table hierarchy
1755 * @table: the top-level table structure
1757 * Register a sysctl table hierarchy. @table should be a filled in ctl_table
1758 * array. A completely 0 filled entry terminates the table.
1760 * See register_sysctl_paths for more details.
1762 struct ctl_table_header *register_sysctl_table(struct ctl_table *table)
1764 static const struct ctl_path null_path[] = { {} };
1766 return register_sysctl_paths(null_path, table);
1770 * unregister_sysctl_table - unregister a sysctl table hierarchy
1771 * @header: the header returned from register_sysctl_table
1773 * Unregisters the sysctl table and all children. proc entries may not
1774 * actually be removed until they are no longer used by anyone.
1776 void unregister_sysctl_table(struct ctl_table_header * header)
1783 spin_lock(&sysctl_lock);
1784 start_unregistering(header);
1785 spin_unlock(&sysctl_lock);
1789 #else /* !CONFIG_SYSCTL */
1790 struct ctl_table_header *register_sysctl_table(struct ctl_table * table)
1795 struct ctl_table_header *register_sysctl_paths(const struct ctl_path *path,
1796 struct ctl_table *table)
1801 void unregister_sysctl_table(struct ctl_table_header * table)
1805 #endif /* CONFIG_SYSCTL */
1811 #ifdef CONFIG_PROC_SYSCTL
1813 static int _proc_do_string(void* data, int maxlen, int write,
1814 struct file *filp, void __user *buffer,
1815 size_t *lenp, loff_t *ppos)
1821 if (!data || !maxlen || !*lenp) {
1829 while (len < *lenp) {
1830 if (get_user(c, p++))
1832 if (c == 0 || c == '\n')
1838 if(copy_from_user(data, buffer, len))
1840 ((char *) data)[len] = 0;
1858 if(copy_to_user(buffer, data, len))
1861 if(put_user('\n', ((char __user *) buffer) + len))
1872 * proc_dostring - read a string sysctl
1873 * @table: the sysctl table
1874 * @write: %TRUE if this is a write to the sysctl file
1875 * @filp: the file structure
1876 * @buffer: the user buffer
1877 * @lenp: the size of the user buffer
1878 * @ppos: file position
1880 * Reads/writes a string from/to the user buffer. If the kernel
1881 * buffer provided is not large enough to hold the string, the
1882 * string is truncated. The copied string is NUL-terminated.
1883 * If the string is being read by the user process, it is copied
1884 * and a newline '\n' is added. It is truncated if the buffer is not large enough.
1887 * Returns 0 on success.
1889 int proc_dostring(struct ctl_table *table, int write, struct file *filp,
1890 void __user *buffer, size_t *lenp, loff_t *ppos)
1892 return _proc_do_string(table->data, table->maxlen, write, filp,
1893 buffer, lenp, ppos);
1897 static int do_proc_dointvec_conv(int *negp, unsigned long *lvalp,
1899 int write, void *data)
1902 *valp = *negp ? -*lvalp : *lvalp;
1907 *lvalp = (unsigned long)-val;
1910 *lvalp = (unsigned long)val;
1916 static int __do_proc_dointvec(void *tbl_data, struct ctl_table *table,
1917 int write, struct file *filp, void __user *buffer,
1918 size_t *lenp, loff_t *ppos,
1919 int (*conv)(int *negp, unsigned long *lvalp, int *valp,
1920 int write, void *data),
1923 #define TMPBUFLEN 21
1924 int *i, vleft, first=1, neg, val;
1928 char buf[TMPBUFLEN], *p;
1929 char __user *s = buffer;
1931 if (!tbl_data || !table->maxlen || !*lenp ||
1932 (*ppos && !write)) {
1937 i = (int *) tbl_data;
1938 vleft = table->maxlen / sizeof(*i);
1942 conv = do_proc_dointvec_conv;
1944 for (; left && vleft--; i++, first=0) {
1959 if (len > sizeof(buf) - 1)
1960 len = sizeof(buf) - 1;
1961 if (copy_from_user(buf, s, len))
1965 if (*p == '-' && left > 1) {
1969 if (*p < '0' || *p > '9')
1972 lval = simple_strtoul(p, &p, 0);
1975 if ((len < left) && *p && !isspace(*p))
1982 if (conv(&neg, &lval, i, 1, data))
1989 if (conv(&neg, &lval, i, 0, data))
1992 sprintf(p, "%s%lu", neg ? "-" : "", lval);
1996 if(copy_to_user(s, buf, len))
2003 if (!write && !first && left) {
2004 if(put_user('\n', s))
2011 if (get_user(c, s++))
2026 static int do_proc_dointvec(struct ctl_table *table, int write, struct file *filp,
2027 void __user *buffer, size_t *lenp, loff_t *ppos,
2028 int (*conv)(int *negp, unsigned long *lvalp, int *valp,
2029 int write, void *data),
2032 return __do_proc_dointvec(table->data, table, write, filp,
2033 buffer, lenp, ppos, conv, data);
2037 * proc_dointvec - read a vector of integers
2038 * @table: the sysctl table
2039 * @write: %TRUE if this is a write to the sysctl file
2040 * @filp: the file structure
2041 * @buffer: the user buffer
2042 * @lenp: the size of the user buffer
2043 * @ppos: file position
2045 * Reads/writes up to table->maxlen/sizeof(unsigned int) integer
2046 * values from/to the user buffer, treated as an ASCII string.
2048 * Returns 0 on success.
2050 int proc_dointvec(struct ctl_table *table, int write, struct file *filp,
2051 void __user *buffer, size_t *lenp, loff_t *ppos)
2053 return do_proc_dointvec(table,write,filp,buffer,lenp,ppos,
2061 static int do_proc_dointvec_bset_conv(int *negp, unsigned long *lvalp,
2063 int write, void *data)
2065 int op = *(int *)data;
2067 int val = *negp ? -*lvalp : *lvalp;
2069 case OP_SET: *valp = val; break;
2070 case OP_AND: *valp &= val; break;
2071 case OP_OR: *valp |= val; break;
2077 *lvalp = (unsigned long)-val;
2080 *lvalp = (unsigned long)val;
2087 * Taint values can only be increased
2089 static int proc_dointvec_taint(struct ctl_table *table, int write, struct file *filp,
2090 void __user *buffer, size_t *lenp, loff_t *ppos)
2094 if (write && !capable(CAP_SYS_ADMIN))
2098 return do_proc_dointvec(table,write,filp,buffer,lenp,ppos,
2099 do_proc_dointvec_bset_conv,&op);
2102 struct do_proc_dointvec_minmax_conv_param {
2107 static int do_proc_dointvec_minmax_conv(int *negp, unsigned long *lvalp,
2109 int write, void *data)
2111 struct do_proc_dointvec_minmax_conv_param *param = data;
2113 int val = *negp ? -*lvalp : *lvalp;
2114 if ((param->min && *param->min > val) ||
2115 (param->max && *param->max < val))
2122 *lvalp = (unsigned long)-val;
2125 *lvalp = (unsigned long)val;
2132 * proc_dointvec_minmax - read a vector of integers with min/max values
2133 * @table: the sysctl table
2134 * @write: %TRUE if this is a write to the sysctl file
2135 * @filp: the file structure
2136 * @buffer: the user buffer
2137 * @lenp: the size of the user buffer
2138 * @ppos: file position
2140 * Reads/writes up to table->maxlen/sizeof(unsigned int) integer
2141 * values from/to the user buffer, treated as an ASCII string.
2143 * This routine will ensure the values are within the range specified by
2144 * table->extra1 (min) and table->extra2 (max).
2146 * Returns 0 on success.
2148 int proc_dointvec_minmax(struct ctl_table *table, int write, struct file *filp,
2149 void __user *buffer, size_t *lenp, loff_t *ppos)
2151 struct do_proc_dointvec_minmax_conv_param param = {
2152 .min = (int *) table->extra1,
2153 .max = (int *) table->extra2,
2155 return do_proc_dointvec(table, write, filp, buffer, lenp, ppos,
2156 do_proc_dointvec_minmax_conv, ¶m);
2159 static int __do_proc_doulongvec_minmax(void *data, struct ctl_table *table, int write,
2161 void __user *buffer,
2162 size_t *lenp, loff_t *ppos,
2163 unsigned long convmul,
2164 unsigned long convdiv)
2166 #define TMPBUFLEN 21
2167 unsigned long *i, *min, *max, val;
2168 int vleft, first=1, neg;
2170 char buf[TMPBUFLEN], *p;
2171 char __user *s = buffer;
2173 if (!data || !table->maxlen || !*lenp ||
2174 (*ppos && !write)) {
2179 i = (unsigned long *) data;
2180 min = (unsigned long *) table->extra1;
2181 max = (unsigned long *) table->extra2;
2182 vleft = table->maxlen / sizeof(unsigned long);
2185 for (; left && vleft--; i++, min++, max++, first=0) {
2200 if (len > TMPBUFLEN-1)
2202 if (copy_from_user(buf, s, len))
2206 if (*p == '-' && left > 1) {
2210 if (*p < '0' || *p > '9')
2212 val = simple_strtoul(p, &p, 0) * convmul / convdiv ;
2214 if ((len < left) && *p && !isspace(*p))
2223 if ((min && val < *min) || (max && val > *max))
2230 sprintf(p, "%lu", convdiv * (*i) / convmul);
2234 if(copy_to_user(s, buf, len))
2241 if (!write && !first && left) {
2242 if(put_user('\n', s))
2249 if (get_user(c, s++))
2264 static int do_proc_doulongvec_minmax(struct ctl_table *table, int write,
2266 void __user *buffer,
2267 size_t *lenp, loff_t *ppos,
2268 unsigned long convmul,
2269 unsigned long convdiv)
2271 return __do_proc_doulongvec_minmax(table->data, table, write,
2272 filp, buffer, lenp, ppos, convmul, convdiv);
2276 * proc_doulongvec_minmax - read a vector of long integers with min/max values
2277 * @table: the sysctl table
2278 * @write: %TRUE if this is a write to the sysctl file
2279 * @filp: the file structure
2280 * @buffer: the user buffer
2281 * @lenp: the size of the user buffer
2282 * @ppos: file position
2284 * Reads/writes up to table->maxlen/sizeof(unsigned long) unsigned long
2285 * values from/to the user buffer, treated as an ASCII string.
2287 * This routine will ensure the values are within the range specified by
2288 * table->extra1 (min) and table->extra2 (max).
2290 * Returns 0 on success.
2292 int proc_doulongvec_minmax(struct ctl_table *table, int write, struct file *filp,
2293 void __user *buffer, size_t *lenp, loff_t *ppos)
2295 return do_proc_doulongvec_minmax(table, write, filp, buffer, lenp, ppos, 1l, 1l);
2299 * proc_doulongvec_ms_jiffies_minmax - read a vector of millisecond values with min/max values
2300 * @table: the sysctl table
2301 * @write: %TRUE if this is a write to the sysctl file
2302 * @filp: the file structure
2303 * @buffer: the user buffer
2304 * @lenp: the size of the user buffer
2305 * @ppos: file position
2307 * Reads/writes up to table->maxlen/sizeof(unsigned long) unsigned long
2308 * values from/to the user buffer, treated as an ASCII string. The values
2309 * are treated as milliseconds, and converted to jiffies when they are stored.
2311 * This routine will ensure the values are within the range specified by
2312 * table->extra1 (min) and table->extra2 (max).
2314 * Returns 0 on success.
2316 int proc_doulongvec_ms_jiffies_minmax(struct ctl_table *table, int write,
2318 void __user *buffer,
2319 size_t *lenp, loff_t *ppos)
2321 return do_proc_doulongvec_minmax(table, write, filp, buffer,
2322 lenp, ppos, HZ, 1000l);
2326 static int do_proc_dointvec_jiffies_conv(int *negp, unsigned long *lvalp,
2328 int write, void *data)
2331 if (*lvalp > LONG_MAX / HZ)
2333 *valp = *negp ? -(*lvalp*HZ) : (*lvalp*HZ);
2339 lval = (unsigned long)-val;
2342 lval = (unsigned long)val;
2349 static int do_proc_dointvec_userhz_jiffies_conv(int *negp, unsigned long *lvalp,
2351 int write, void *data)
2354 if (USER_HZ < HZ && *lvalp > (LONG_MAX / HZ) * USER_HZ)
2356 *valp = clock_t_to_jiffies(*negp ? -*lvalp : *lvalp);
2362 lval = (unsigned long)-val;
2365 lval = (unsigned long)val;
2367 *lvalp = jiffies_to_clock_t(lval);
2372 static int do_proc_dointvec_ms_jiffies_conv(int *negp, unsigned long *lvalp,
2374 int write, void *data)
2377 *valp = msecs_to_jiffies(*negp ? -*lvalp : *lvalp);
2383 lval = (unsigned long)-val;
2386 lval = (unsigned long)val;
2388 *lvalp = jiffies_to_msecs(lval);
2394 * proc_dointvec_jiffies - read a vector of integers as seconds
2395 * @table: the sysctl table
2396 * @write: %TRUE if this is a write to the sysctl file
2397 * @filp: the file structure
2398 * @buffer: the user buffer
2399 * @lenp: the size of the user buffer
2400 * @ppos: file position
2402 * Reads/writes up to table->maxlen/sizeof(unsigned int) integer
2403 * values from/to the user buffer, treated as an ASCII string.
2404 * The values read are assumed to be in seconds, and are converted into jiffies.
2407 * Returns 0 on success.
2409 int proc_dointvec_jiffies(struct ctl_table *table, int write, struct file *filp,
2410 void __user *buffer, size_t *lenp, loff_t *ppos)
2412 return do_proc_dointvec(table,write,filp,buffer,lenp,ppos,
2413 do_proc_dointvec_jiffies_conv,NULL);
2417 * proc_dointvec_userhz_jiffies - read a vector of integers as 1/USER_HZ seconds
2418 * @table: the sysctl table
2419 * @write: %TRUE if this is a write to the sysctl file
2420 * @filp: the file structure
2421 * @buffer: the user buffer
2422 * @lenp: the size of the user buffer
2423 * @ppos: pointer to the file position
2425 * Reads/writes up to table->maxlen/sizeof(unsigned int) integer
2426 * values from/to the user buffer, treated as an ASCII string.
2427 * The values read are assumed to be in 1/USER_HZ seconds, and
2428 * are converted into jiffies.
2430 * Returns 0 on success.
2432 int proc_dointvec_userhz_jiffies(struct ctl_table *table, int write, struct file *filp,
2433 void __user *buffer, size_t *lenp, loff_t *ppos)
2435 return do_proc_dointvec(table,write,filp,buffer,lenp,ppos,
2436 do_proc_dointvec_userhz_jiffies_conv,NULL);
2440 * proc_dointvec_ms_jiffies - read a vector of integers as milliseconds
2441 * @table: the sysctl table
2442 * @write: %TRUE if this is a write to the sysctl file
2443 * @filp: the file structure
2444 * @buffer: the user buffer
2445 * @lenp: the size of the user buffer
2446 * @ppos: the current position in the file
2449 * Reads/writes up to table->maxlen/sizeof(unsigned int) integer
2450 * values from/to the user buffer, treated as an ASCII string.
2451 * The values read are assumed to be in 1/1000 seconds, and
2452 * are converted into jiffies.
2454 * Returns 0 on success.
2456 int proc_dointvec_ms_jiffies(struct ctl_table *table, int write, struct file *filp,
2457 void __user *buffer, size_t *lenp, loff_t *ppos)
2459 return do_proc_dointvec(table, write, filp, buffer, lenp, ppos,
2460 do_proc_dointvec_ms_jiffies_conv, NULL);
2463 static int proc_do_cad_pid(struct ctl_table *table, int write, struct file *filp,
2464 void __user *buffer, size_t *lenp, loff_t *ppos)
2466 struct pid *new_pid;
2470 tmp = pid_vnr(cad_pid);
2472 r = __do_proc_dointvec(&tmp, table, write, filp, buffer,
2473 lenp, ppos, NULL, NULL);
2477 new_pid = find_get_pid(tmp);
2481 put_pid(xchg(&cad_pid, new_pid));
2485 #else /* CONFIG_PROC_SYSCTL */
2487 int proc_dostring(struct ctl_table *table, int write, struct file *filp,
2488 void __user *buffer, size_t *lenp, loff_t *ppos)
2493 int proc_dointvec(struct ctl_table *table, int write, struct file *filp,
2494 void __user *buffer, size_t *lenp, loff_t *ppos)
2499 int proc_dointvec_minmax(struct ctl_table *table, int write, struct file *filp,
2500 void __user *buffer, size_t *lenp, loff_t *ppos)
2505 int proc_dointvec_jiffies(struct ctl_table *table, int write, struct file *filp,
2506 void __user *buffer, size_t *lenp, loff_t *ppos)
2511 int proc_dointvec_userhz_jiffies(struct ctl_table *table, int write, struct file *filp,
2512 void __user *buffer, size_t *lenp, loff_t *ppos)
2517 int proc_dointvec_ms_jiffies(struct ctl_table *table, int write, struct file *filp,
2518 void __user *buffer, size_t *lenp, loff_t *ppos)
2523 int proc_doulongvec_minmax(struct ctl_table *table, int write, struct file *filp,
2524 void __user *buffer, size_t *lenp, loff_t *ppos)
2529 int proc_doulongvec_ms_jiffies_minmax(struct ctl_table *table, int write,
2531 void __user *buffer,
2532 size_t *lenp, loff_t *ppos)
2538 #endif /* CONFIG_PROC_SYSCTL */
2541 #ifdef CONFIG_SYSCTL_SYSCALL
2543 * General sysctl support routines
2546 /* The generic sysctl data routine (used if no strategy routine supplied) */
2547 int sysctl_data(struct ctl_table *table, int __user *name, int nlen,
2548 void __user *oldval, size_t __user *oldlenp,
2549 void __user *newval, size_t newlen)
2553 /* Get out if I don't have a variable */
2554 if (!table->data || !table->maxlen)
2557 if (oldval && oldlenp) {
2558 if (get_user(len, oldlenp))
2561 if (len > table->maxlen)
2562 len = table->maxlen;
2563 if (copy_to_user(oldval, table->data, len))
2565 if (put_user(len, oldlenp))
2570 if (newval && newlen) {
2571 if (newlen > table->maxlen)
2572 newlen = table->maxlen;
2574 if (copy_from_user(table->data, newval, newlen))
2580 /* The generic string strategy routine: */
2581 int sysctl_string(struct ctl_table *table, int __user *name, int nlen,
2582 void __user *oldval, size_t __user *oldlenp,
2583 void __user *newval, size_t newlen)
2585 if (!table->data || !table->maxlen)
2588 if (oldval && oldlenp) {
2590 if (get_user(bufsize, oldlenp))
2593 size_t len = strlen(table->data), copied;
2595 /* This shouldn't trigger for a well-formed sysctl */
2596 if (len > table->maxlen)
2597 len = table->maxlen;
2599 /* Copy up to a max of bufsize-1 bytes of the string */
2600 copied = (len >= bufsize) ? bufsize - 1 : len;
2602 if (copy_to_user(oldval, table->data, copied) ||
2603 put_user(0, (char __user *)(oldval + copied)))
2605 if (put_user(len, oldlenp))
2609 if (newval && newlen) {
2610 size_t len = newlen;
2611 if (len > table->maxlen)
2612 len = table->maxlen;
2613 if(copy_from_user(table->data, newval, len))
2615 if (len == table->maxlen)
2617 ((char *) table->data)[len] = 0;
2623 * This function makes sure that all of the integers in the vector
2624 * are between the minimum and maximum values given in the arrays
2625 * table->extra1 and table->extra2, respectively.
2627 int sysctl_intvec(struct ctl_table *table, int __user *name, int nlen,
2628 void __user *oldval, size_t __user *oldlenp,
2629 void __user *newval, size_t newlen)
2632 if (newval && newlen) {
2633 int __user *vec = (int __user *) newval;
2634 int *min = (int *) table->extra1;
2635 int *max = (int *) table->extra2;
2639 if (newlen % sizeof(int) != 0)
2642 if (!table->extra1 && !table->extra2)
2645 if (newlen > table->maxlen)
2646 newlen = table->maxlen;
2647 length = newlen / sizeof(int);
2649 for (i = 0; i < length; i++) {
2651 if (get_user(value, vec + i))
2653 if (min && value < min[i])
2655 if (max && value > max[i])
2662 /* Strategy function to convert jiffies to seconds */
2663 int sysctl_jiffies(struct ctl_table *table, int __user *name, int nlen,
2664 void __user *oldval, size_t __user *oldlenp,
2665 void __user *newval, size_t newlen)
2667 if (oldval && oldlenp) {
2670 if (get_user(olen, oldlenp))
2675 if (olen < sizeof(int))
2678 val = *(int *)(table->data) / HZ;
2679 if (put_user(val, (int __user *)oldval))
2681 if (put_user(sizeof(int), oldlenp))
2685 if (newval && newlen) {
2687 if (newlen != sizeof(int))
2689 if (get_user(new, (int __user *)newval))
2691 *(int *)(table->data) = new*HZ;
2696 /* Strategy function to convert jiffies to milliseconds */
2697 int sysctl_ms_jiffies(struct ctl_table *table, int __user *name, int nlen,
2698 void __user *oldval, size_t __user *oldlenp,
2699 void __user *newval, size_t newlen)
2701 if (oldval && oldlenp) {
2704 if (get_user(olen, oldlenp))
2709 if (olen < sizeof(int))
2712 val = jiffies_to_msecs(*(int *)(table->data));
2713 if (put_user(val, (int __user *)oldval))
2715 if (put_user(sizeof(int), oldlenp))
2719 if (newval && newlen) {
2721 if (newlen != sizeof(int))
2723 if (get_user(new, (int __user *)newval))
2725 *(int *)(table->data) = msecs_to_jiffies(new);
2732 #else /* CONFIG_SYSCTL_SYSCALL */
2735 asmlinkage long sys_sysctl(struct __sysctl_args __user *args)
2737 struct __sysctl_args tmp;
2740 if (copy_from_user(&tmp, args, sizeof(tmp)))
2743 error = deprecated_sysctl_warning(&tmp);
2745 /* If no error reading the parameters then just -ENOSYS ... */
2752 int sysctl_data(struct ctl_table *table, int __user *name, int nlen,
2753 void __user *oldval, size_t __user *oldlenp,
2754 void __user *newval, size_t newlen)
2759 int sysctl_string(struct ctl_table *table, int __user *name, int nlen,
2760 void __user *oldval, size_t __user *oldlenp,
2761 void __user *newval, size_t newlen)
2766 int sysctl_intvec(struct ctl_table *table, int __user *name, int nlen,
2767 void __user *oldval, size_t __user *oldlenp,
2768 void __user *newval, size_t newlen)
2773 int sysctl_jiffies(struct ctl_table *table, int __user *name, int nlen,
2774 void __user *oldval, size_t __user *oldlenp,
2775 void __user *newval, size_t newlen)
2780 int sysctl_ms_jiffies(struct ctl_table *table, int __user *name, int nlen,
2781 void __user *oldval, size_t __user *oldlenp,
2782 void __user *newval, size_t newlen)
2787 #endif /* CONFIG_SYSCTL_SYSCALL */
2789 static int deprecated_sysctl_warning(struct __sysctl_args *args)
2791 static int msg_count;
2792 int name[CTL_MAXNAME];
2795 /* Check args->nlen. */
2796 if (args->nlen < 0 || args->nlen > CTL_MAXNAME)
2799 /* Read in the sysctl name for better debug message logging */
2800 for (i = 0; i < args->nlen; i++)
2801 if (get_user(name[i], args->name + i))
2804 /* Ignore accesses to kernel.version */
2805 if ((args->nlen == 2) && (name[0] == CTL_KERN) && (name[1] == KERN_VERSION))
2808 if (msg_count < 5) {
2811 "warning: process `%s' used the deprecated sysctl "
2812 "system call with ", current->comm);
2813 for (i = 0; i < args->nlen; i++)
2814 printk("%d.", name[i]);
2821 * No sense putting this after each symbol definition, twice,
2822 * exception granted :-)
2824 EXPORT_SYMBOL(proc_dointvec);
2825 EXPORT_SYMBOL(proc_dointvec_jiffies);
2826 EXPORT_SYMBOL(proc_dointvec_minmax);
2827 EXPORT_SYMBOL(proc_dointvec_userhz_jiffies);
2828 EXPORT_SYMBOL(proc_dointvec_ms_jiffies);
2829 EXPORT_SYMBOL(proc_dostring);
2830 EXPORT_SYMBOL(proc_doulongvec_minmax);
2831 EXPORT_SYMBOL(proc_doulongvec_ms_jiffies_minmax);
2832 EXPORT_SYMBOL(register_sysctl_table);
2833 EXPORT_SYMBOL(register_sysctl_paths);
2834 EXPORT_SYMBOL(sysctl_intvec);
2835 EXPORT_SYMBOL(sysctl_jiffies);
2836 EXPORT_SYMBOL(sysctl_ms_jiffies);
2837 EXPORT_SYMBOL(sysctl_string);
2838 EXPORT_SYMBOL(sysctl_data);
2839 EXPORT_SYMBOL(unregister_sysctl_table);