Linux Audio

Check our new training course

Loading...
v4.10.11
   1/*
   2 * sysctl.c: General linux system control interface
   3 *
   4 * Begun 24 March 1995, Stephen Tweedie
   5 * Added /proc support, Dec 1995
   6 * Added bdflush entry and intvec min/max checking, 2/23/96, Tom Dyas.
   7 * Added hooks for /proc/sys/net (minor, minor patch), 96/4/1, Mike Shaver.
   8 * Added kernel/java-{interpreter,appletviewer}, 96/5/10, Mike Shaver.
   9 * Dynamic registration fixes, Stephen Tweedie.
  10 * Added kswapd-interval, ctrl-alt-del, printk stuff, 1/8/97, Chris Horn.
  11 * Made sysctl support optional via CONFIG_SYSCTL, 1/10/97, Chris
  12 *  Horn.
  13 * Added proc_doulongvec_ms_jiffies_minmax, 09/08/99, Carlos H. Bauer.
  14 * Added proc_doulongvec_minmax, 09/08/99, Carlos H. Bauer.
  15 * Changed linked lists to use list.h instead of lists.h, 02/24/00, Bill
  16 *  Wendling.
  17 * The list_for_each() macro wasn't appropriate for the sysctl loop.
  18 *  Removed it and replaced it with older style, 03/23/00, Bill Wendling
  19 */
  20
  21#include <linux/module.h>
  22#include <linux/aio.h>
  23#include <linux/mm.h>
  24#include <linux/swap.h>
  25#include <linux/slab.h>
  26#include <linux/sysctl.h>
  27#include <linux/bitmap.h>
  28#include <linux/signal.h>
  29#include <linux/printk.h>
  30#include <linux/proc_fs.h>
  31#include <linux/security.h>
  32#include <linux/ctype.h>
  33#include <linux/kmemcheck.h>
  34#include <linux/kmemleak.h>
  35#include <linux/fs.h>
  36#include <linux/init.h>
  37#include <linux/kernel.h>
  38#include <linux/kobject.h>
  39#include <linux/net.h>
  40#include <linux/sysrq.h>
  41#include <linux/highuid.h>
  42#include <linux/writeback.h>
  43#include <linux/ratelimit.h>
  44#include <linux/compaction.h>
  45#include <linux/hugetlb.h>
  46#include <linux/initrd.h>
  47#include <linux/key.h>
  48#include <linux/times.h>
  49#include <linux/limits.h>
  50#include <linux/dcache.h>
  51#include <linux/dnotify.h>
  52#include <linux/syscalls.h>
  53#include <linux/vmstat.h>
  54#include <linux/nfs_fs.h>
  55#include <linux/acpi.h>
  56#include <linux/reboot.h>
  57#include <linux/ftrace.h>
  58#include <linux/perf_event.h>
  59#include <linux/kprobes.h>
  60#include <linux/pipe_fs_i.h>
  61#include <linux/oom.h>
  62#include <linux/kmod.h>
  63#include <linux/capability.h>
  64#include <linux/binfmts.h>
  65#include <linux/sched/sysctl.h>
 
  66#include <linux/kexec.h>
  67#include <linux/bpf.h>
  68#include <linux/mount.h>
 
  69
  70#include <linux/uaccess.h>
  71#include <asm/processor.h>
  72
  73#ifdef CONFIG_X86
  74#include <asm/nmi.h>
  75#include <asm/stacktrace.h>
  76#include <asm/io.h>
  77#endif
  78#ifdef CONFIG_SPARC
  79#include <asm/setup.h>
  80#endif
  81#ifdef CONFIG_BSD_PROCESS_ACCT
  82#include <linux/acct.h>
  83#endif
  84#ifdef CONFIG_RT_MUTEXES
  85#include <linux/rtmutex.h>
  86#endif
  87#if defined(CONFIG_PROVE_LOCKING) || defined(CONFIG_LOCK_STAT)
  88#include <linux/lockdep.h>
  89#endif
  90#ifdef CONFIG_CHR_DEV_SG
  91#include <scsi/sg.h>
  92#endif
  93
  94#ifdef CONFIG_LOCKUP_DETECTOR
  95#include <linux/nmi.h>
  96#endif
  97
  98#if defined(CONFIG_SYSCTL)
  99
 100/* External variables not in a header file. */
 101extern int suid_dumpable;
 102#ifdef CONFIG_COREDUMP
 103extern int core_uses_pid;
 104extern char core_pattern[];
 105extern unsigned int core_pipe_limit;
 106#endif
 107extern int pid_max;
 108extern int pid_max_min, pid_max_max;
 109extern int percpu_pagelist_fraction;
 110extern int latencytop_enabled;
 111extern unsigned int sysctl_nr_open_min, sysctl_nr_open_max;
 112#ifndef CONFIG_MMU
 113extern int sysctl_nr_trim_pages;
 114#endif
 115
 116/* Constants used for minimum and  maximum */
 117#ifdef CONFIG_LOCKUP_DETECTOR
 118static int sixty = 60;
 119#endif
 120
 121static int __maybe_unused neg_one = -1;
 122
 123static int zero;
 124static int __maybe_unused one = 1;
 125static int __maybe_unused two = 2;
 126static int __maybe_unused four = 4;
 127static unsigned long one_ul = 1;
 128static int one_hundred = 100;
 129static int one_thousand = 1000;
 130#ifdef CONFIG_PRINTK
 131static int ten_thousand = 10000;
 132#endif
 133#ifdef CONFIG_PERF_EVENTS
 134static int six_hundred_forty_kb = 640 * 1024;
 135#endif
 136
 137/* this is needed for the proc_doulongvec_minmax of vm_dirty_bytes */
 138static unsigned long dirty_bytes_min = 2 * PAGE_SIZE;
 139
 140/* this is needed for the proc_dointvec_minmax for [fs_]overflow UID and GID */
 141static int maxolduid = 65535;
 142static int minolduid;
 143
 144static int ngroups_max = NGROUPS_MAX;
 145static const int cap_last_cap = CAP_LAST_CAP;
 146
 147/* this is needed for proc_doulongvec_minmax of sysctl_hung_task_timeout_secs */
 148#ifdef CONFIG_DETECT_HUNG_TASK
 149static unsigned long hung_task_timeout_max = (LONG_MAX/HZ);
 150#endif
 151
 152#ifdef CONFIG_INOTIFY_USER
 153#include <linux/inotify.h>
 154#endif
 155#ifdef CONFIG_SPARC
 156#endif
 157
 158#ifdef __hppa__
 159extern int pwrsw_enabled;
 160#endif
 161
 162#ifdef CONFIG_SYSCTL_ARCH_UNALIGN_ALLOW
 163extern int unaligned_enabled;
 164#endif
 165
 166#ifdef CONFIG_IA64
 167extern int unaligned_dump_stack;
 168#endif
 169
 170#ifdef CONFIG_SYSCTL_ARCH_UNALIGN_NO_WARN
 171extern int no_unaligned_warning;
 172#endif
 173
 174#ifdef CONFIG_PROC_SYSCTL
 175
 176#define SYSCTL_WRITES_LEGACY	-1
 177#define SYSCTL_WRITES_WARN	 0
 178#define SYSCTL_WRITES_STRICT	 1
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 179
 180static int sysctl_writes_strict = SYSCTL_WRITES_STRICT;
 181
 182static int proc_do_cad_pid(struct ctl_table *table, int write,
 183		  void __user *buffer, size_t *lenp, loff_t *ppos);
 184static int proc_taint(struct ctl_table *table, int write,
 185			       void __user *buffer, size_t *lenp, loff_t *ppos);
 186#endif
 187
 188#ifdef CONFIG_PRINTK
 189static int proc_dointvec_minmax_sysadmin(struct ctl_table *table, int write,
 190				void __user *buffer, size_t *lenp, loff_t *ppos);
 191#endif
 192
 193static int proc_dointvec_minmax_coredump(struct ctl_table *table, int write,
 194		void __user *buffer, size_t *lenp, loff_t *ppos);
 195#ifdef CONFIG_COREDUMP
 196static int proc_dostring_coredump(struct ctl_table *table, int write,
 197		void __user *buffer, size_t *lenp, loff_t *ppos);
 198#endif
 
 
 199
 200#ifdef CONFIG_MAGIC_SYSRQ
 201/* Note: sysrq code uses its own private copy */
 202static int __sysrq_enabled = CONFIG_MAGIC_SYSRQ_DEFAULT_ENABLE;
 203
 204static int sysrq_sysctl_handler(struct ctl_table *table, int write,
 205				void __user *buffer, size_t *lenp,
 206				loff_t *ppos)
 207{
 208	int error;
 209
 210	error = proc_dointvec(table, write, buffer, lenp, ppos);
 211	if (error)
 212		return error;
 213
 214	if (write)
 215		sysrq_toggle_support(__sysrq_enabled);
 216
 217	return 0;
 218}
 219
 220#endif
 221
 222static struct ctl_table kern_table[];
 223static struct ctl_table vm_table[];
 224static struct ctl_table fs_table[];
 225static struct ctl_table debug_table[];
 226static struct ctl_table dev_table[];
 227extern struct ctl_table random_table[];
 228#ifdef CONFIG_EPOLL
 229extern struct ctl_table epoll_table[];
 230#endif
 231
 
 
 
 
 232#ifdef HAVE_ARCH_PICK_MMAP_LAYOUT
 233int sysctl_legacy_va_layout;
 234#endif
 235
 236/* The default sysctl tables: */
 237
 238static struct ctl_table sysctl_base_table[] = {
 239	{
 240		.procname	= "kernel",
 241		.mode		= 0555,
 242		.child		= kern_table,
 243	},
 244	{
 245		.procname	= "vm",
 246		.mode		= 0555,
 247		.child		= vm_table,
 248	},
 249	{
 250		.procname	= "fs",
 251		.mode		= 0555,
 252		.child		= fs_table,
 253	},
 254	{
 255		.procname	= "debug",
 256		.mode		= 0555,
 257		.child		= debug_table,
 258	},
 259	{
 260		.procname	= "dev",
 261		.mode		= 0555,
 262		.child		= dev_table,
 263	},
 264	{ }
 265};
 266
 267#ifdef CONFIG_SCHED_DEBUG
 268static int min_sched_granularity_ns = 100000;		/* 100 usecs */
 269static int max_sched_granularity_ns = NSEC_PER_SEC;	/* 1 second */
 270static int min_wakeup_granularity_ns;			/* 0 usecs */
 271static int max_wakeup_granularity_ns = NSEC_PER_SEC;	/* 1 second */
 272#ifdef CONFIG_SMP
 273static int min_sched_tunable_scaling = SCHED_TUNABLESCALING_NONE;
 274static int max_sched_tunable_scaling = SCHED_TUNABLESCALING_END-1;
 275#endif /* CONFIG_SMP */
 276#endif /* CONFIG_SCHED_DEBUG */
 277
 278#ifdef CONFIG_COMPACTION
 279static int min_extfrag_threshold;
 280static int max_extfrag_threshold = 1000;
 281#endif
 282
 283static struct ctl_table kern_table[] = {
 284	{
 285		.procname	= "sched_child_runs_first",
 286		.data		= &sysctl_sched_child_runs_first,
 287		.maxlen		= sizeof(unsigned int),
 288		.mode		= 0644,
 289		.proc_handler	= proc_dointvec,
 290	},
 291#ifdef CONFIG_SCHED_DEBUG
 292	{
 293		.procname	= "sched_min_granularity_ns",
 294		.data		= &sysctl_sched_min_granularity,
 295		.maxlen		= sizeof(unsigned int),
 296		.mode		= 0644,
 297		.proc_handler	= sched_proc_update_handler,
 298		.extra1		= &min_sched_granularity_ns,
 299		.extra2		= &max_sched_granularity_ns,
 300	},
 301	{
 302		.procname	= "sched_latency_ns",
 303		.data		= &sysctl_sched_latency,
 304		.maxlen		= sizeof(unsigned int),
 305		.mode		= 0644,
 306		.proc_handler	= sched_proc_update_handler,
 307		.extra1		= &min_sched_granularity_ns,
 308		.extra2		= &max_sched_granularity_ns,
 309	},
 310	{
 311		.procname	= "sched_wakeup_granularity_ns",
 312		.data		= &sysctl_sched_wakeup_granularity,
 313		.maxlen		= sizeof(unsigned int),
 314		.mode		= 0644,
 315		.proc_handler	= sched_proc_update_handler,
 316		.extra1		= &min_wakeup_granularity_ns,
 317		.extra2		= &max_wakeup_granularity_ns,
 318	},
 319#ifdef CONFIG_SMP
 320	{
 321		.procname	= "sched_tunable_scaling",
 322		.data		= &sysctl_sched_tunable_scaling,
 323		.maxlen		= sizeof(enum sched_tunable_scaling),
 324		.mode		= 0644,
 325		.proc_handler	= sched_proc_update_handler,
 326		.extra1		= &min_sched_tunable_scaling,
 327		.extra2		= &max_sched_tunable_scaling,
 328	},
 329	{
 330		.procname	= "sched_migration_cost_ns",
 331		.data		= &sysctl_sched_migration_cost,
 332		.maxlen		= sizeof(unsigned int),
 333		.mode		= 0644,
 334		.proc_handler	= proc_dointvec,
 335	},
 336	{
 337		.procname	= "sched_nr_migrate",
 338		.data		= &sysctl_sched_nr_migrate,
 339		.maxlen		= sizeof(unsigned int),
 340		.mode		= 0644,
 341		.proc_handler	= proc_dointvec,
 342	},
 343	{
 344		.procname	= "sched_time_avg_ms",
 345		.data		= &sysctl_sched_time_avg,
 346		.maxlen		= sizeof(unsigned int),
 347		.mode		= 0644,
 348		.proc_handler	= proc_dointvec,
 
 349	},
 350#ifdef CONFIG_SCHEDSTATS
 351	{
 352		.procname	= "sched_schedstats",
 353		.data		= NULL,
 354		.maxlen		= sizeof(unsigned int),
 355		.mode		= 0644,
 356		.proc_handler	= sysctl_schedstats,
 357		.extra1		= &zero,
 358		.extra2		= &one,
 359	},
 360#endif /* CONFIG_SCHEDSTATS */
 361#endif /* CONFIG_SMP */
 362#ifdef CONFIG_NUMA_BALANCING
 363	{
 364		.procname	= "numa_balancing_scan_delay_ms",
 365		.data		= &sysctl_numa_balancing_scan_delay,
 366		.maxlen		= sizeof(unsigned int),
 367		.mode		= 0644,
 368		.proc_handler	= proc_dointvec,
 369	},
 370	{
 371		.procname	= "numa_balancing_scan_period_min_ms",
 372		.data		= &sysctl_numa_balancing_scan_period_min,
 373		.maxlen		= sizeof(unsigned int),
 374		.mode		= 0644,
 375		.proc_handler	= proc_dointvec,
 376	},
 377	{
 378		.procname	= "numa_balancing_scan_period_max_ms",
 379		.data		= &sysctl_numa_balancing_scan_period_max,
 380		.maxlen		= sizeof(unsigned int),
 381		.mode		= 0644,
 382		.proc_handler	= proc_dointvec,
 383	},
 384	{
 385		.procname	= "numa_balancing_scan_size_mb",
 386		.data		= &sysctl_numa_balancing_scan_size,
 387		.maxlen		= sizeof(unsigned int),
 388		.mode		= 0644,
 389		.proc_handler	= proc_dointvec_minmax,
 390		.extra1		= &one,
 391	},
 392	{
 393		.procname	= "numa_balancing",
 394		.data		= NULL, /* filled in by handler */
 395		.maxlen		= sizeof(unsigned int),
 396		.mode		= 0644,
 397		.proc_handler	= sysctl_numa_balancing,
 398		.extra1		= &zero,
 399		.extra2		= &one,
 400	},
 401#endif /* CONFIG_NUMA_BALANCING */
 402#endif /* CONFIG_SCHED_DEBUG */
 403	{
 404		.procname	= "sched_rt_period_us",
 405		.data		= &sysctl_sched_rt_period,
 406		.maxlen		= sizeof(unsigned int),
 407		.mode		= 0644,
 408		.proc_handler	= sched_rt_handler,
 409	},
 410	{
 411		.procname	= "sched_rt_runtime_us",
 412		.data		= &sysctl_sched_rt_runtime,
 413		.maxlen		= sizeof(int),
 414		.mode		= 0644,
 415		.proc_handler	= sched_rt_handler,
 416	},
 417	{
 418		.procname	= "sched_rr_timeslice_ms",
 419		.data		= &sched_rr_timeslice,
 420		.maxlen		= sizeof(int),
 421		.mode		= 0644,
 422		.proc_handler	= sched_rr_handler,
 423	},
 424#ifdef CONFIG_SCHED_AUTOGROUP
 425	{
 426		.procname	= "sched_autogroup_enabled",
 427		.data		= &sysctl_sched_autogroup_enabled,
 428		.maxlen		= sizeof(unsigned int),
 429		.mode		= 0644,
 430		.proc_handler	= proc_dointvec_minmax,
 431		.extra1		= &zero,
 432		.extra2		= &one,
 433	},
 434#endif
 435#ifdef CONFIG_CFS_BANDWIDTH
 436	{
 437		.procname	= "sched_cfs_bandwidth_slice_us",
 438		.data		= &sysctl_sched_cfs_bandwidth_slice,
 439		.maxlen		= sizeof(unsigned int),
 440		.mode		= 0644,
 441		.proc_handler	= proc_dointvec_minmax,
 442		.extra1		= &one,
 443	},
 444#endif
 445#ifdef CONFIG_PROVE_LOCKING
 446	{
 447		.procname	= "prove_locking",
 448		.data		= &prove_locking,
 449		.maxlen		= sizeof(int),
 450		.mode		= 0644,
 451		.proc_handler	= proc_dointvec,
 452	},
 453#endif
 454#ifdef CONFIG_LOCK_STAT
 455	{
 456		.procname	= "lock_stat",
 457		.data		= &lock_stat,
 458		.maxlen		= sizeof(int),
 459		.mode		= 0644,
 460		.proc_handler	= proc_dointvec,
 461	},
 462#endif
 463	{
 464		.procname	= "panic",
 465		.data		= &panic_timeout,
 466		.maxlen		= sizeof(int),
 467		.mode		= 0644,
 468		.proc_handler	= proc_dointvec,
 469	},
 470#ifdef CONFIG_COREDUMP
 471	{
 472		.procname	= "core_uses_pid",
 473		.data		= &core_uses_pid,
 474		.maxlen		= sizeof(int),
 475		.mode		= 0644,
 476		.proc_handler	= proc_dointvec,
 477	},
 478	{
 479		.procname	= "core_pattern",
 480		.data		= core_pattern,
 481		.maxlen		= CORENAME_MAX_SIZE,
 482		.mode		= 0644,
 483		.proc_handler	= proc_dostring_coredump,
 484	},
 485	{
 486		.procname	= "core_pipe_limit",
 487		.data		= &core_pipe_limit,
 488		.maxlen		= sizeof(unsigned int),
 489		.mode		= 0644,
 490		.proc_handler	= proc_dointvec,
 491	},
 492#endif
 493#ifdef CONFIG_PROC_SYSCTL
 494	{
 495		.procname	= "tainted",
 496		.maxlen 	= sizeof(long),
 497		.mode		= 0644,
 498		.proc_handler	= proc_taint,
 499	},
 500	{
 501		.procname	= "sysctl_writes_strict",
 502		.data		= &sysctl_writes_strict,
 503		.maxlen		= sizeof(int),
 504		.mode		= 0644,
 505		.proc_handler	= proc_dointvec_minmax,
 506		.extra1		= &neg_one,
 507		.extra2		= &one,
 508	},
 509#endif
 510#ifdef CONFIG_LATENCYTOP
 511	{
 512		.procname	= "latencytop",
 513		.data		= &latencytop_enabled,
 514		.maxlen		= sizeof(int),
 515		.mode		= 0644,
 516		.proc_handler	= sysctl_latencytop,
 517	},
 518#endif
 519#ifdef CONFIG_BLK_DEV_INITRD
 520	{
 521		.procname	= "real-root-dev",
 522		.data		= &real_root_dev,
 523		.maxlen		= sizeof(int),
 524		.mode		= 0644,
 525		.proc_handler	= proc_dointvec,
 526	},
 527#endif
 528	{
 529		.procname	= "print-fatal-signals",
 530		.data		= &print_fatal_signals,
 531		.maxlen		= sizeof(int),
 532		.mode		= 0644,
 533		.proc_handler	= proc_dointvec,
 534	},
 535#ifdef CONFIG_SPARC
 536	{
 537		.procname	= "reboot-cmd",
 538		.data		= reboot_command,
 539		.maxlen		= 256,
 540		.mode		= 0644,
 541		.proc_handler	= proc_dostring,
 542	},
 543	{
 544		.procname	= "stop-a",
 545		.data		= &stop_a_enabled,
 546		.maxlen		= sizeof (int),
 547		.mode		= 0644,
 548		.proc_handler	= proc_dointvec,
 549	},
 550	{
 551		.procname	= "scons-poweroff",
 552		.data		= &scons_pwroff,
 553		.maxlen		= sizeof (int),
 554		.mode		= 0644,
 555		.proc_handler	= proc_dointvec,
 556	},
 557#endif
 558#ifdef CONFIG_SPARC64
 559	{
 560		.procname	= "tsb-ratio",
 561		.data		= &sysctl_tsb_ratio,
 562		.maxlen		= sizeof (int),
 563		.mode		= 0644,
 564		.proc_handler	= proc_dointvec,
 565	},
 566#endif
 567#ifdef __hppa__
 568	{
 569		.procname	= "soft-power",
 570		.data		= &pwrsw_enabled,
 571		.maxlen		= sizeof (int),
 572	 	.mode		= 0644,
 573		.proc_handler	= proc_dointvec,
 574	},
 575#endif
 576#ifdef CONFIG_SYSCTL_ARCH_UNALIGN_ALLOW
 577	{
 578		.procname	= "unaligned-trap",
 579		.data		= &unaligned_enabled,
 580		.maxlen		= sizeof (int),
 581		.mode		= 0644,
 582		.proc_handler	= proc_dointvec,
 583	},
 584#endif
 585	{
 586		.procname	= "ctrl-alt-del",
 587		.data		= &C_A_D,
 588		.maxlen		= sizeof(int),
 589		.mode		= 0644,
 590		.proc_handler	= proc_dointvec,
 591	},
 592#ifdef CONFIG_FUNCTION_TRACER
 593	{
 594		.procname	= "ftrace_enabled",
 595		.data		= &ftrace_enabled,
 596		.maxlen		= sizeof(int),
 597		.mode		= 0644,
 598		.proc_handler	= ftrace_enable_sysctl,
 599	},
 600#endif
 601#ifdef CONFIG_STACK_TRACER
 602	{
 603		.procname	= "stack_tracer_enabled",
 604		.data		= &stack_tracer_enabled,
 605		.maxlen		= sizeof(int),
 606		.mode		= 0644,
 607		.proc_handler	= stack_trace_sysctl,
 608	},
 609#endif
 610#ifdef CONFIG_TRACING
 611	{
 612		.procname	= "ftrace_dump_on_oops",
 613		.data		= &ftrace_dump_on_oops,
 614		.maxlen		= sizeof(int),
 615		.mode		= 0644,
 616		.proc_handler	= proc_dointvec,
 617	},
 618	{
 619		.procname	= "traceoff_on_warning",
 620		.data		= &__disable_trace_on_warning,
 621		.maxlen		= sizeof(__disable_trace_on_warning),
 622		.mode		= 0644,
 623		.proc_handler	= proc_dointvec,
 624	},
 625	{
 626		.procname	= "tracepoint_printk",
 627		.data		= &tracepoint_printk,
 628		.maxlen		= sizeof(tracepoint_printk),
 629		.mode		= 0644,
 630		.proc_handler	= tracepoint_printk_sysctl,
 631	},
 632#endif
 633#ifdef CONFIG_KEXEC_CORE
 634	{
 635		.procname	= "kexec_load_disabled",
 636		.data		= &kexec_load_disabled,
 637		.maxlen		= sizeof(int),
 638		.mode		= 0644,
 639		/* only handle a transition from default "0" to "1" */
 640		.proc_handler	= proc_dointvec_minmax,
 641		.extra1		= &one,
 642		.extra2		= &one,
 643	},
 644#endif
 645#ifdef CONFIG_MODULES
 646	{
 647		.procname	= "modprobe",
 648		.data		= &modprobe_path,
 649		.maxlen		= KMOD_PATH_LEN,
 650		.mode		= 0644,
 651		.proc_handler	= proc_dostring,
 652	},
 653	{
 654		.procname	= "modules_disabled",
 655		.data		= &modules_disabled,
 656		.maxlen		= sizeof(int),
 657		.mode		= 0644,
 658		/* only handle a transition from default "0" to "1" */
 659		.proc_handler	= proc_dointvec_minmax,
 660		.extra1		= &one,
 661		.extra2		= &one,
 662	},
 663#endif
 664#ifdef CONFIG_UEVENT_HELPER
 665	{
 666		.procname	= "hotplug",
 667		.data		= &uevent_helper,
 668		.maxlen		= UEVENT_HELPER_PATH_LEN,
 669		.mode		= 0644,
 670		.proc_handler	= proc_dostring,
 671	},
 672#endif
 673#ifdef CONFIG_CHR_DEV_SG
 674	{
 675		.procname	= "sg-big-buff",
 676		.data		= &sg_big_buff,
 677		.maxlen		= sizeof (int),
 678		.mode		= 0444,
 679		.proc_handler	= proc_dointvec,
 680	},
 681#endif
 682#ifdef CONFIG_BSD_PROCESS_ACCT
 683	{
 684		.procname	= "acct",
 685		.data		= &acct_parm,
 686		.maxlen		= 3*sizeof(int),
 687		.mode		= 0644,
 688		.proc_handler	= proc_dointvec,
 689	},
 690#endif
 691#ifdef CONFIG_MAGIC_SYSRQ
 692	{
 693		.procname	= "sysrq",
 694		.data		= &__sysrq_enabled,
 695		.maxlen		= sizeof (int),
 696		.mode		= 0644,
 697		.proc_handler	= sysrq_sysctl_handler,
 698	},
 699#endif
 700#ifdef CONFIG_PROC_SYSCTL
 701	{
 702		.procname	= "cad_pid",
 703		.data		= NULL,
 704		.maxlen		= sizeof (int),
 705		.mode		= 0600,
 706		.proc_handler	= proc_do_cad_pid,
 707	},
 708#endif
 709	{
 710		.procname	= "threads-max",
 711		.data		= NULL,
 712		.maxlen		= sizeof(int),
 713		.mode		= 0644,
 714		.proc_handler	= sysctl_max_threads,
 715	},
 716	{
 717		.procname	= "random",
 718		.mode		= 0555,
 719		.child		= random_table,
 720	},
 721	{
 722		.procname	= "usermodehelper",
 723		.mode		= 0555,
 724		.child		= usermodehelper_table,
 725	},
 
 
 
 
 
 
 
 726	{
 727		.procname	= "overflowuid",
 728		.data		= &overflowuid,
 729		.maxlen		= sizeof(int),
 730		.mode		= 0644,
 731		.proc_handler	= proc_dointvec_minmax,
 732		.extra1		= &minolduid,
 733		.extra2		= &maxolduid,
 734	},
 735	{
 736		.procname	= "overflowgid",
 737		.data		= &overflowgid,
 738		.maxlen		= sizeof(int),
 739		.mode		= 0644,
 740		.proc_handler	= proc_dointvec_minmax,
 741		.extra1		= &minolduid,
 742		.extra2		= &maxolduid,
 743	},
 744#ifdef CONFIG_S390
 745#ifdef CONFIG_MATHEMU
 746	{
 747		.procname	= "ieee_emulation_warnings",
 748		.data		= &sysctl_ieee_emulation_warnings,
 749		.maxlen		= sizeof(int),
 750		.mode		= 0644,
 751		.proc_handler	= proc_dointvec,
 752	},
 753#endif
 754	{
 755		.procname	= "userprocess_debug",
 756		.data		= &show_unhandled_signals,
 757		.maxlen		= sizeof(int),
 758		.mode		= 0644,
 759		.proc_handler	= proc_dointvec,
 760	},
 761#endif
 762	{
 763		.procname	= "pid_max",
 764		.data		= &pid_max,
 765		.maxlen		= sizeof (int),
 766		.mode		= 0644,
 767		.proc_handler	= proc_dointvec_minmax,
 768		.extra1		= &pid_max_min,
 769		.extra2		= &pid_max_max,
 770	},
 771	{
 772		.procname	= "panic_on_oops",
 773		.data		= &panic_on_oops,
 774		.maxlen		= sizeof(int),
 775		.mode		= 0644,
 776		.proc_handler	= proc_dointvec,
 777	},
 778#if defined CONFIG_PRINTK
 779	{
 780		.procname	= "printk",
 781		.data		= &console_loglevel,
 782		.maxlen		= 4*sizeof(int),
 783		.mode		= 0644,
 784		.proc_handler	= proc_dointvec,
 785	},
 786	{
 787		.procname	= "printk_ratelimit",
 788		.data		= &printk_ratelimit_state.interval,
 789		.maxlen		= sizeof(int),
 790		.mode		= 0644,
 791		.proc_handler	= proc_dointvec_jiffies,
 792	},
 793	{
 794		.procname	= "printk_ratelimit_burst",
 795		.data		= &printk_ratelimit_state.burst,
 796		.maxlen		= sizeof(int),
 797		.mode		= 0644,
 798		.proc_handler	= proc_dointvec,
 799	},
 800	{
 801		.procname	= "printk_delay",
 802		.data		= &printk_delay_msec,
 803		.maxlen		= sizeof(int),
 804		.mode		= 0644,
 805		.proc_handler	= proc_dointvec_minmax,
 806		.extra1		= &zero,
 807		.extra2		= &ten_thousand,
 808	},
 809	{
 810		.procname	= "printk_devkmsg",
 811		.data		= devkmsg_log_str,
 812		.maxlen		= DEVKMSG_STR_MAX_SIZE,
 813		.mode		= 0644,
 814		.proc_handler	= devkmsg_sysctl_set_loglvl,
 815	},
 816	{
 817		.procname	= "dmesg_restrict",
 818		.data		= &dmesg_restrict,
 819		.maxlen		= sizeof(int),
 820		.mode		= 0644,
 821		.proc_handler	= proc_dointvec_minmax_sysadmin,
 822		.extra1		= &zero,
 823		.extra2		= &one,
 824	},
 825	{
 826		.procname	= "kptr_restrict",
 827		.data		= &kptr_restrict,
 828		.maxlen		= sizeof(int),
 829		.mode		= 0644,
 830		.proc_handler	= proc_dointvec_minmax_sysadmin,
 831		.extra1		= &zero,
 832		.extra2		= &two,
 833	},
 834#endif
 835	{
 836		.procname	= "ngroups_max",
 837		.data		= &ngroups_max,
 838		.maxlen		= sizeof (int),
 839		.mode		= 0444,
 840		.proc_handler	= proc_dointvec,
 841	},
 842	{
 843		.procname	= "cap_last_cap",
 844		.data		= (void *)&cap_last_cap,
 845		.maxlen		= sizeof(int),
 846		.mode		= 0444,
 847		.proc_handler	= proc_dointvec,
 848	},
 849#if defined(CONFIG_LOCKUP_DETECTOR)
 850	{
 851		.procname       = "watchdog",
 852		.data           = &watchdog_user_enabled,
 853		.maxlen         = sizeof (int),
 854		.mode           = 0644,
 855		.proc_handler   = proc_watchdog,
 856		.extra1		= &zero,
 857		.extra2		= &one,
 858	},
 859	{
 860		.procname	= "watchdog_thresh",
 861		.data		= &watchdog_thresh,
 862		.maxlen		= sizeof(int),
 863		.mode		= 0644,
 864		.proc_handler	= proc_watchdog_thresh,
 865		.extra1		= &zero,
 866		.extra2		= &sixty,
 867	},
 868	{
 869		.procname       = "nmi_watchdog",
 870		.data           = &nmi_watchdog_enabled,
 871		.maxlen         = sizeof (int),
 872		.mode           = 0644,
 873		.proc_handler   = proc_nmi_watchdog,
 874		.extra1		= &zero,
 875#if defined(CONFIG_HAVE_NMI_WATCHDOG) || defined(CONFIG_HARDLOCKUP_DETECTOR)
 876		.extra2		= &one,
 877#else
 878		.extra2		= &zero,
 879#endif
 880	},
 881	{
 882		.procname       = "soft_watchdog",
 883		.data           = &soft_watchdog_enabled,
 884		.maxlen         = sizeof (int),
 885		.mode           = 0644,
 886		.proc_handler   = proc_soft_watchdog,
 887		.extra1		= &zero,
 888		.extra2		= &one,
 889	},
 890	{
 891		.procname	= "watchdog_cpumask",
 892		.data		= &watchdog_cpumask_bits,
 893		.maxlen		= NR_CPUS,
 894		.mode		= 0644,
 895		.proc_handler	= proc_watchdog_cpumask,
 896	},
 
 
 
 
 
 
 
 
 
 
 897	{
 898		.procname	= "softlockup_panic",
 899		.data		= &softlockup_panic,
 900		.maxlen		= sizeof(int),
 901		.mode		= 0644,
 902		.proc_handler	= proc_dointvec_minmax,
 903		.extra1		= &zero,
 904		.extra2		= &one,
 905	},
 906#ifdef CONFIG_HARDLOCKUP_DETECTOR
 907	{
 908		.procname	= "hardlockup_panic",
 909		.data		= &hardlockup_panic,
 910		.maxlen		= sizeof(int),
 911		.mode		= 0644,
 912		.proc_handler	= proc_dointvec_minmax,
 913		.extra1		= &zero,
 914		.extra2		= &one,
 915	},
 
 916#endif
 917#ifdef CONFIG_SMP
 918	{
 919		.procname	= "softlockup_all_cpu_backtrace",
 920		.data		= &sysctl_softlockup_all_cpu_backtrace,
 921		.maxlen		= sizeof(int),
 922		.mode		= 0644,
 923		.proc_handler	= proc_dointvec_minmax,
 924		.extra1		= &zero,
 925		.extra2		= &one,
 926	},
 
 927	{
 928		.procname	= "hardlockup_all_cpu_backtrace",
 929		.data		= &sysctl_hardlockup_all_cpu_backtrace,
 930		.maxlen		= sizeof(int),
 931		.mode		= 0644,
 932		.proc_handler	= proc_dointvec_minmax,
 933		.extra1		= &zero,
 934		.extra2		= &one,
 935	},
 936#endif /* CONFIG_SMP */
 937#endif
 
 
 938#if defined(CONFIG_X86_LOCAL_APIC) && defined(CONFIG_X86)
 939	{
 940		.procname       = "unknown_nmi_panic",
 941		.data           = &unknown_nmi_panic,
 942		.maxlen         = sizeof (int),
 943		.mode           = 0644,
 944		.proc_handler   = proc_dointvec,
 945	},
 946#endif
 947#if defined(CONFIG_X86)
 948	{
 949		.procname	= "panic_on_unrecovered_nmi",
 950		.data		= &panic_on_unrecovered_nmi,
 951		.maxlen		= sizeof(int),
 952		.mode		= 0644,
 953		.proc_handler	= proc_dointvec,
 954	},
 955	{
 956		.procname	= "panic_on_io_nmi",
 957		.data		= &panic_on_io_nmi,
 958		.maxlen		= sizeof(int),
 959		.mode		= 0644,
 960		.proc_handler	= proc_dointvec,
 961	},
 962#ifdef CONFIG_DEBUG_STACKOVERFLOW
 963	{
 964		.procname	= "panic_on_stackoverflow",
 965		.data		= &sysctl_panic_on_stackoverflow,
 966		.maxlen		= sizeof(int),
 967		.mode		= 0644,
 968		.proc_handler	= proc_dointvec,
 969	},
 970#endif
 971	{
 972		.procname	= "bootloader_type",
 973		.data		= &bootloader_type,
 974		.maxlen		= sizeof (int),
 975		.mode		= 0444,
 976		.proc_handler	= proc_dointvec,
 977	},
 978	{
 979		.procname	= "bootloader_version",
 980		.data		= &bootloader_version,
 981		.maxlen		= sizeof (int),
 982		.mode		= 0444,
 983		.proc_handler	= proc_dointvec,
 984	},
 985	{
 986		.procname	= "io_delay_type",
 987		.data		= &io_delay_type,
 988		.maxlen		= sizeof(int),
 989		.mode		= 0644,
 990		.proc_handler	= proc_dointvec,
 991	},
 992#endif
 993#if defined(CONFIG_MMU)
 994	{
 995		.procname	= "randomize_va_space",
 996		.data		= &randomize_va_space,
 997		.maxlen		= sizeof(int),
 998		.mode		= 0644,
 999		.proc_handler	= proc_dointvec,
1000	},
1001#endif
1002#if defined(CONFIG_S390) && defined(CONFIG_SMP)
1003	{
1004		.procname	= "spin_retry",
1005		.data		= &spin_retry,
1006		.maxlen		= sizeof (int),
1007		.mode		= 0644,
1008		.proc_handler	= proc_dointvec,
1009	},
1010#endif
1011#if	defined(CONFIG_ACPI_SLEEP) && defined(CONFIG_X86)
1012	{
1013		.procname	= "acpi_video_flags",
1014		.data		= &acpi_realmode_flags,
1015		.maxlen		= sizeof (unsigned long),
1016		.mode		= 0644,
1017		.proc_handler	= proc_doulongvec_minmax,
1018	},
1019#endif
1020#ifdef CONFIG_SYSCTL_ARCH_UNALIGN_NO_WARN
1021	{
1022		.procname	= "ignore-unaligned-usertrap",
1023		.data		= &no_unaligned_warning,
1024		.maxlen		= sizeof (int),
1025	 	.mode		= 0644,
1026		.proc_handler	= proc_dointvec,
1027	},
1028#endif
1029#ifdef CONFIG_IA64
1030	{
1031		.procname	= "unaligned-dump-stack",
1032		.data		= &unaligned_dump_stack,
1033		.maxlen		= sizeof (int),
1034		.mode		= 0644,
1035		.proc_handler	= proc_dointvec,
1036	},
1037#endif
1038#ifdef CONFIG_DETECT_HUNG_TASK
1039	{
1040		.procname	= "hung_task_panic",
1041		.data		= &sysctl_hung_task_panic,
1042		.maxlen		= sizeof(int),
1043		.mode		= 0644,
1044		.proc_handler	= proc_dointvec_minmax,
1045		.extra1		= &zero,
1046		.extra2		= &one,
1047	},
1048	{
1049		.procname	= "hung_task_check_count",
1050		.data		= &sysctl_hung_task_check_count,
1051		.maxlen		= sizeof(int),
1052		.mode		= 0644,
1053		.proc_handler	= proc_dointvec_minmax,
1054		.extra1		= &zero,
1055	},
1056	{
1057		.procname	= "hung_task_timeout_secs",
1058		.data		= &sysctl_hung_task_timeout_secs,
1059		.maxlen		= sizeof(unsigned long),
1060		.mode		= 0644,
1061		.proc_handler	= proc_dohung_task_timeout_secs,
1062		.extra2		= &hung_task_timeout_max,
1063	},
1064	{
1065		.procname	= "hung_task_warnings",
1066		.data		= &sysctl_hung_task_warnings,
1067		.maxlen		= sizeof(int),
1068		.mode		= 0644,
1069		.proc_handler	= proc_dointvec_minmax,
1070		.extra1		= &neg_one,
1071	},
1072#endif
1073#ifdef CONFIG_RT_MUTEXES
1074	{
1075		.procname	= "max_lock_depth",
1076		.data		= &max_lock_depth,
1077		.maxlen		= sizeof(int),
1078		.mode		= 0644,
1079		.proc_handler	= proc_dointvec,
1080	},
1081#endif
1082	{
1083		.procname	= "poweroff_cmd",
1084		.data		= &poweroff_cmd,
1085		.maxlen		= POWEROFF_CMD_PATH_LEN,
1086		.mode		= 0644,
1087		.proc_handler	= proc_dostring,
1088	},
1089#ifdef CONFIG_KEYS
1090	{
1091		.procname	= "keys",
1092		.mode		= 0555,
1093		.child		= key_sysctls,
1094	},
1095#endif
1096#ifdef CONFIG_PERF_EVENTS
1097	/*
1098	 * User-space scripts rely on the existence of this file
1099	 * as a feature check for perf_events being enabled.
1100	 *
1101	 * So it's an ABI, do not remove!
1102	 */
1103	{
1104		.procname	= "perf_event_paranoid",
1105		.data		= &sysctl_perf_event_paranoid,
1106		.maxlen		= sizeof(sysctl_perf_event_paranoid),
1107		.mode		= 0644,
1108		.proc_handler	= proc_dointvec,
1109	},
1110	{
1111		.procname	= "perf_event_mlock_kb",
1112		.data		= &sysctl_perf_event_mlock,
1113		.maxlen		= sizeof(sysctl_perf_event_mlock),
1114		.mode		= 0644,
1115		.proc_handler	= proc_dointvec,
1116	},
1117	{
1118		.procname	= "perf_event_max_sample_rate",
1119		.data		= &sysctl_perf_event_sample_rate,
1120		.maxlen		= sizeof(sysctl_perf_event_sample_rate),
1121		.mode		= 0644,
1122		.proc_handler	= perf_proc_update_handler,
1123		.extra1		= &one,
1124	},
1125	{
1126		.procname	= "perf_cpu_time_max_percent",
1127		.data		= &sysctl_perf_cpu_time_max_percent,
1128		.maxlen		= sizeof(sysctl_perf_cpu_time_max_percent),
1129		.mode		= 0644,
1130		.proc_handler	= perf_cpu_time_max_percent_handler,
1131		.extra1		= &zero,
1132		.extra2		= &one_hundred,
1133	},
1134	{
1135		.procname	= "perf_event_max_stack",
1136		.data		= &sysctl_perf_event_max_stack,
1137		.maxlen		= sizeof(sysctl_perf_event_max_stack),
1138		.mode		= 0644,
1139		.proc_handler	= perf_event_max_stack_handler,
1140		.extra1		= &zero,
1141		.extra2		= &six_hundred_forty_kb,
1142	},
1143	{
1144		.procname	= "perf_event_max_contexts_per_stack",
1145		.data		= &sysctl_perf_event_max_contexts_per_stack,
1146		.maxlen		= sizeof(sysctl_perf_event_max_contexts_per_stack),
1147		.mode		= 0644,
1148		.proc_handler	= perf_event_max_stack_handler,
1149		.extra1		= &zero,
1150		.extra2		= &one_thousand,
1151	},
1152#endif
1153#ifdef CONFIG_KMEMCHECK
1154	{
1155		.procname	= "kmemcheck",
1156		.data		= &kmemcheck_enabled,
1157		.maxlen		= sizeof(int),
1158		.mode		= 0644,
1159		.proc_handler	= proc_dointvec,
1160	},
1161#endif
1162	{
1163		.procname	= "panic_on_warn",
1164		.data		= &panic_on_warn,
1165		.maxlen		= sizeof(int),
1166		.mode		= 0644,
1167		.proc_handler	= proc_dointvec_minmax,
1168		.extra1		= &zero,
1169		.extra2		= &one,
1170	},
1171#if defined(CONFIG_SMP) && defined(CONFIG_NO_HZ_COMMON)
1172	{
1173		.procname	= "timer_migration",
1174		.data		= &sysctl_timer_migration,
1175		.maxlen		= sizeof(unsigned int),
1176		.mode		= 0644,
1177		.proc_handler	= timer_migration_handler,
 
 
1178	},
1179#endif
1180#ifdef CONFIG_BPF_SYSCALL
1181	{
1182		.procname	= "unprivileged_bpf_disabled",
1183		.data		= &sysctl_unprivileged_bpf_disabled,
1184		.maxlen		= sizeof(sysctl_unprivileged_bpf_disabled),
1185		.mode		= 0644,
1186		/* only handle a transition from default "0" to "1" */
1187		.proc_handler	= proc_dointvec_minmax,
1188		.extra1		= &one,
1189		.extra2		= &one,
1190	},
1191#endif
1192#if defined(CONFIG_TREE_RCU) || defined(CONFIG_PREEMPT_RCU)
1193	{
1194		.procname	= "panic_on_rcu_stall",
1195		.data		= &sysctl_panic_on_rcu_stall,
1196		.maxlen		= sizeof(sysctl_panic_on_rcu_stall),
1197		.mode		= 0644,
1198		.proc_handler	= proc_dointvec_minmax,
1199		.extra1		= &zero,
1200		.extra2		= &one,
1201	},
1202#endif
1203	{ }
1204};
1205
1206static struct ctl_table vm_table[] = {
1207	{
1208		.procname	= "overcommit_memory",
1209		.data		= &sysctl_overcommit_memory,
1210		.maxlen		= sizeof(sysctl_overcommit_memory),
1211		.mode		= 0644,
1212		.proc_handler	= proc_dointvec_minmax,
1213		.extra1		= &zero,
1214		.extra2		= &two,
1215	},
1216	{
1217		.procname	= "panic_on_oom",
1218		.data		= &sysctl_panic_on_oom,
1219		.maxlen		= sizeof(sysctl_panic_on_oom),
1220		.mode		= 0644,
1221		.proc_handler	= proc_dointvec_minmax,
1222		.extra1		= &zero,
1223		.extra2		= &two,
1224	},
1225	{
1226		.procname	= "oom_kill_allocating_task",
1227		.data		= &sysctl_oom_kill_allocating_task,
1228		.maxlen		= sizeof(sysctl_oom_kill_allocating_task),
1229		.mode		= 0644,
1230		.proc_handler	= proc_dointvec,
1231	},
1232	{
1233		.procname	= "oom_dump_tasks",
1234		.data		= &sysctl_oom_dump_tasks,
1235		.maxlen		= sizeof(sysctl_oom_dump_tasks),
1236		.mode		= 0644,
1237		.proc_handler	= proc_dointvec,
1238	},
1239	{
1240		.procname	= "overcommit_ratio",
1241		.data		= &sysctl_overcommit_ratio,
1242		.maxlen		= sizeof(sysctl_overcommit_ratio),
1243		.mode		= 0644,
1244		.proc_handler	= overcommit_ratio_handler,
1245	},
1246	{
1247		.procname	= "overcommit_kbytes",
1248		.data		= &sysctl_overcommit_kbytes,
1249		.maxlen		= sizeof(sysctl_overcommit_kbytes),
1250		.mode		= 0644,
1251		.proc_handler	= overcommit_kbytes_handler,
1252	},
1253	{
1254		.procname	= "page-cluster", 
1255		.data		= &page_cluster,
1256		.maxlen		= sizeof(int),
1257		.mode		= 0644,
1258		.proc_handler	= proc_dointvec_minmax,
1259		.extra1		= &zero,
1260	},
1261	{
1262		.procname	= "dirty_background_ratio",
1263		.data		= &dirty_background_ratio,
1264		.maxlen		= sizeof(dirty_background_ratio),
1265		.mode		= 0644,
1266		.proc_handler	= dirty_background_ratio_handler,
1267		.extra1		= &zero,
1268		.extra2		= &one_hundred,
1269	},
1270	{
1271		.procname	= "dirty_background_bytes",
1272		.data		= &dirty_background_bytes,
1273		.maxlen		= sizeof(dirty_background_bytes),
1274		.mode		= 0644,
1275		.proc_handler	= dirty_background_bytes_handler,
1276		.extra1		= &one_ul,
1277	},
1278	{
1279		.procname	= "dirty_ratio",
1280		.data		= &vm_dirty_ratio,
1281		.maxlen		= sizeof(vm_dirty_ratio),
1282		.mode		= 0644,
1283		.proc_handler	= dirty_ratio_handler,
1284		.extra1		= &zero,
1285		.extra2		= &one_hundred,
1286	},
1287	{
1288		.procname	= "dirty_bytes",
1289		.data		= &vm_dirty_bytes,
1290		.maxlen		= sizeof(vm_dirty_bytes),
1291		.mode		= 0644,
1292		.proc_handler	= dirty_bytes_handler,
1293		.extra1		= &dirty_bytes_min,
1294	},
1295	{
1296		.procname	= "dirty_writeback_centisecs",
1297		.data		= &dirty_writeback_interval,
1298		.maxlen		= sizeof(dirty_writeback_interval),
1299		.mode		= 0644,
1300		.proc_handler	= dirty_writeback_centisecs_handler,
1301	},
1302	{
1303		.procname	= "dirty_expire_centisecs",
1304		.data		= &dirty_expire_interval,
1305		.maxlen		= sizeof(dirty_expire_interval),
1306		.mode		= 0644,
1307		.proc_handler	= proc_dointvec_minmax,
1308		.extra1		= &zero,
1309	},
1310	{
1311		.procname	= "dirtytime_expire_seconds",
1312		.data		= &dirtytime_expire_interval,
1313		.maxlen		= sizeof(dirty_expire_interval),
1314		.mode		= 0644,
1315		.proc_handler	= dirtytime_interval_handler,
1316		.extra1		= &zero,
1317	},
1318	{
1319		.procname       = "nr_pdflush_threads",
1320		.mode           = 0444 /* read-only */,
1321		.proc_handler   = pdflush_proc_obsolete,
1322	},
1323	{
1324		.procname	= "swappiness",
1325		.data		= &vm_swappiness,
1326		.maxlen		= sizeof(vm_swappiness),
1327		.mode		= 0644,
1328		.proc_handler	= proc_dointvec_minmax,
1329		.extra1		= &zero,
1330		.extra2		= &one_hundred,
1331	},
1332#ifdef CONFIG_HUGETLB_PAGE
1333	{
1334		.procname	= "nr_hugepages",
1335		.data		= NULL,
1336		.maxlen		= sizeof(unsigned long),
1337		.mode		= 0644,
1338		.proc_handler	= hugetlb_sysctl_handler,
1339	},
1340#ifdef CONFIG_NUMA
1341	{
1342		.procname       = "nr_hugepages_mempolicy",
1343		.data           = NULL,
1344		.maxlen         = sizeof(unsigned long),
1345		.mode           = 0644,
1346		.proc_handler   = &hugetlb_mempolicy_sysctl_handler,
1347	},
 
 
 
 
 
 
 
 
 
1348#endif
1349	 {
1350		.procname	= "hugetlb_shm_group",
1351		.data		= &sysctl_hugetlb_shm_group,
1352		.maxlen		= sizeof(gid_t),
1353		.mode		= 0644,
1354		.proc_handler	= proc_dointvec,
1355	 },
1356	 {
1357		.procname	= "hugepages_treat_as_movable",
1358		.data		= &hugepages_treat_as_movable,
1359		.maxlen		= sizeof(int),
1360		.mode		= 0644,
1361		.proc_handler	= proc_dointvec,
1362	},
1363	{
1364		.procname	= "nr_overcommit_hugepages",
1365		.data		= NULL,
1366		.maxlen		= sizeof(unsigned long),
1367		.mode		= 0644,
1368		.proc_handler	= hugetlb_overcommit_handler,
1369	},
1370#endif
1371	{
1372		.procname	= "lowmem_reserve_ratio",
1373		.data		= &sysctl_lowmem_reserve_ratio,
1374		.maxlen		= sizeof(sysctl_lowmem_reserve_ratio),
1375		.mode		= 0644,
1376		.proc_handler	= lowmem_reserve_ratio_sysctl_handler,
1377	},
1378	{
1379		.procname	= "drop_caches",
1380		.data		= &sysctl_drop_caches,
1381		.maxlen		= sizeof(int),
1382		.mode		= 0644,
1383		.proc_handler	= drop_caches_sysctl_handler,
1384		.extra1		= &one,
1385		.extra2		= &four,
1386	},
1387#ifdef CONFIG_COMPACTION
1388	{
1389		.procname	= "compact_memory",
1390		.data		= &sysctl_compact_memory,
1391		.maxlen		= sizeof(int),
1392		.mode		= 0200,
1393		.proc_handler	= sysctl_compaction_handler,
1394	},
1395	{
1396		.procname	= "extfrag_threshold",
1397		.data		= &sysctl_extfrag_threshold,
1398		.maxlen		= sizeof(int),
1399		.mode		= 0644,
1400		.proc_handler	= sysctl_extfrag_handler,
1401		.extra1		= &min_extfrag_threshold,
1402		.extra2		= &max_extfrag_threshold,
1403	},
1404	{
1405		.procname	= "compact_unevictable_allowed",
1406		.data		= &sysctl_compact_unevictable_allowed,
1407		.maxlen		= sizeof(int),
1408		.mode		= 0644,
1409		.proc_handler	= proc_dointvec,
1410		.extra1		= &zero,
1411		.extra2		= &one,
1412	},
1413
1414#endif /* CONFIG_COMPACTION */
1415	{
1416		.procname	= "min_free_kbytes",
1417		.data		= &min_free_kbytes,
1418		.maxlen		= sizeof(min_free_kbytes),
1419		.mode		= 0644,
1420		.proc_handler	= min_free_kbytes_sysctl_handler,
1421		.extra1		= &zero,
1422	},
1423	{
1424		.procname	= "watermark_scale_factor",
1425		.data		= &watermark_scale_factor,
1426		.maxlen		= sizeof(watermark_scale_factor),
1427		.mode		= 0644,
1428		.proc_handler	= watermark_scale_factor_sysctl_handler,
1429		.extra1		= &one,
1430		.extra2		= &one_thousand,
1431	},
1432	{
1433		.procname	= "percpu_pagelist_fraction",
1434		.data		= &percpu_pagelist_fraction,
1435		.maxlen		= sizeof(percpu_pagelist_fraction),
1436		.mode		= 0644,
1437		.proc_handler	= percpu_pagelist_fraction_sysctl_handler,
1438		.extra1		= &zero,
1439	},
1440#ifdef CONFIG_MMU
1441	{
1442		.procname	= "max_map_count",
1443		.data		= &sysctl_max_map_count,
1444		.maxlen		= sizeof(sysctl_max_map_count),
1445		.mode		= 0644,
1446		.proc_handler	= proc_dointvec_minmax,
1447		.extra1		= &zero,
1448	},
1449#else
1450	{
1451		.procname	= "nr_trim_pages",
1452		.data		= &sysctl_nr_trim_pages,
1453		.maxlen		= sizeof(sysctl_nr_trim_pages),
1454		.mode		= 0644,
1455		.proc_handler	= proc_dointvec_minmax,
1456		.extra1		= &zero,
1457	},
1458#endif
1459	{
1460		.procname	= "laptop_mode",
1461		.data		= &laptop_mode,
1462		.maxlen		= sizeof(laptop_mode),
1463		.mode		= 0644,
1464		.proc_handler	= proc_dointvec_jiffies,
1465	},
1466	{
1467		.procname	= "block_dump",
1468		.data		= &block_dump,
1469		.maxlen		= sizeof(block_dump),
1470		.mode		= 0644,
1471		.proc_handler	= proc_dointvec,
1472		.extra1		= &zero,
1473	},
1474	{
1475		.procname	= "vfs_cache_pressure",
1476		.data		= &sysctl_vfs_cache_pressure,
1477		.maxlen		= sizeof(sysctl_vfs_cache_pressure),
1478		.mode		= 0644,
1479		.proc_handler	= proc_dointvec,
1480		.extra1		= &zero,
1481	},
1482#ifdef HAVE_ARCH_PICK_MMAP_LAYOUT
1483	{
1484		.procname	= "legacy_va_layout",
1485		.data		= &sysctl_legacy_va_layout,
1486		.maxlen		= sizeof(sysctl_legacy_va_layout),
1487		.mode		= 0644,
1488		.proc_handler	= proc_dointvec,
1489		.extra1		= &zero,
1490	},
1491#endif
1492#ifdef CONFIG_NUMA
1493	{
1494		.procname	= "zone_reclaim_mode",
1495		.data		= &node_reclaim_mode,
1496		.maxlen		= sizeof(node_reclaim_mode),
1497		.mode		= 0644,
1498		.proc_handler	= proc_dointvec,
1499		.extra1		= &zero,
1500	},
1501	{
1502		.procname	= "min_unmapped_ratio",
1503		.data		= &sysctl_min_unmapped_ratio,
1504		.maxlen		= sizeof(sysctl_min_unmapped_ratio),
1505		.mode		= 0644,
1506		.proc_handler	= sysctl_min_unmapped_ratio_sysctl_handler,
1507		.extra1		= &zero,
1508		.extra2		= &one_hundred,
1509	},
1510	{
1511		.procname	= "min_slab_ratio",
1512		.data		= &sysctl_min_slab_ratio,
1513		.maxlen		= sizeof(sysctl_min_slab_ratio),
1514		.mode		= 0644,
1515		.proc_handler	= sysctl_min_slab_ratio_sysctl_handler,
1516		.extra1		= &zero,
1517		.extra2		= &one_hundred,
1518	},
1519#endif
1520#ifdef CONFIG_SMP
1521	{
1522		.procname	= "stat_interval",
1523		.data		= &sysctl_stat_interval,
1524		.maxlen		= sizeof(sysctl_stat_interval),
1525		.mode		= 0644,
1526		.proc_handler	= proc_dointvec_jiffies,
1527	},
1528	{
1529		.procname	= "stat_refresh",
1530		.data		= NULL,
1531		.maxlen		= 0,
1532		.mode		= 0600,
1533		.proc_handler	= vmstat_refresh,
1534	},
1535#endif
1536#ifdef CONFIG_MMU
1537	{
1538		.procname	= "mmap_min_addr",
1539		.data		= &dac_mmap_min_addr,
1540		.maxlen		= sizeof(unsigned long),
1541		.mode		= 0644,
1542		.proc_handler	= mmap_min_addr_handler,
1543	},
1544#endif
1545#ifdef CONFIG_NUMA
1546	{
1547		.procname	= "numa_zonelist_order",
1548		.data		= &numa_zonelist_order,
1549		.maxlen		= NUMA_ZONELIST_ORDER_LEN,
1550		.mode		= 0644,
1551		.proc_handler	= numa_zonelist_order_handler,
1552	},
1553#endif
1554#if (defined(CONFIG_X86_32) && !defined(CONFIG_UML))|| \
1555   (defined(CONFIG_SUPERH) && defined(CONFIG_VSYSCALL))
1556	{
1557		.procname	= "vdso_enabled",
1558#ifdef CONFIG_X86_32
1559		.data		= &vdso32_enabled,
1560		.maxlen		= sizeof(vdso32_enabled),
1561#else
1562		.data		= &vdso_enabled,
1563		.maxlen		= sizeof(vdso_enabled),
1564#endif
1565		.mode		= 0644,
1566		.proc_handler	= proc_dointvec,
1567		.extra1		= &zero,
1568	},
1569#endif
1570#ifdef CONFIG_HIGHMEM
1571	{
1572		.procname	= "highmem_is_dirtyable",
1573		.data		= &vm_highmem_is_dirtyable,
1574		.maxlen		= sizeof(vm_highmem_is_dirtyable),
1575		.mode		= 0644,
1576		.proc_handler	= proc_dointvec_minmax,
1577		.extra1		= &zero,
1578		.extra2		= &one,
1579	},
1580#endif
1581#ifdef CONFIG_MEMORY_FAILURE
1582	{
1583		.procname	= "memory_failure_early_kill",
1584		.data		= &sysctl_memory_failure_early_kill,
1585		.maxlen		= sizeof(sysctl_memory_failure_early_kill),
1586		.mode		= 0644,
1587		.proc_handler	= proc_dointvec_minmax,
1588		.extra1		= &zero,
1589		.extra2		= &one,
1590	},
1591	{
1592		.procname	= "memory_failure_recovery",
1593		.data		= &sysctl_memory_failure_recovery,
1594		.maxlen		= sizeof(sysctl_memory_failure_recovery),
1595		.mode		= 0644,
1596		.proc_handler	= proc_dointvec_minmax,
1597		.extra1		= &zero,
1598		.extra2		= &one,
1599	},
1600#endif
1601	{
1602		.procname	= "user_reserve_kbytes",
1603		.data		= &sysctl_user_reserve_kbytes,
1604		.maxlen		= sizeof(sysctl_user_reserve_kbytes),
1605		.mode		= 0644,
1606		.proc_handler	= proc_doulongvec_minmax,
1607	},
1608	{
1609		.procname	= "admin_reserve_kbytes",
1610		.data		= &sysctl_admin_reserve_kbytes,
1611		.maxlen		= sizeof(sysctl_admin_reserve_kbytes),
1612		.mode		= 0644,
1613		.proc_handler	= proc_doulongvec_minmax,
1614	},
1615#ifdef CONFIG_HAVE_ARCH_MMAP_RND_BITS
1616	{
1617		.procname	= "mmap_rnd_bits",
1618		.data		= &mmap_rnd_bits,
1619		.maxlen		= sizeof(mmap_rnd_bits),
1620		.mode		= 0600,
1621		.proc_handler	= proc_dointvec_minmax,
1622		.extra1		= (void *)&mmap_rnd_bits_min,
1623		.extra2		= (void *)&mmap_rnd_bits_max,
1624	},
1625#endif
1626#ifdef CONFIG_HAVE_ARCH_MMAP_RND_COMPAT_BITS
1627	{
1628		.procname	= "mmap_rnd_compat_bits",
1629		.data		= &mmap_rnd_compat_bits,
1630		.maxlen		= sizeof(mmap_rnd_compat_bits),
1631		.mode		= 0600,
1632		.proc_handler	= proc_dointvec_minmax,
1633		.extra1		= (void *)&mmap_rnd_compat_bits_min,
1634		.extra2		= (void *)&mmap_rnd_compat_bits_max,
1635	},
1636#endif
1637	{ }
1638};
1639
/*
 * Filesystem-related sysctl entries (the warning text in
 * validate_coredump_safety() refers to one of them as fs.suid_dumpable).
 *
 * Each entry gives the file name, backing variable and size, permission
 * bits and the handler used for reads and writes; .extra1/.extra2 carry
 * the lower/upper bound for the *_minmax handlers.  The table ends with
 * an empty entry.
 */
static struct ctl_table fs_table[] = {
	/* Statistics exported with mode 0444 */
	{
		.procname	= "inode-nr",
		.data		= &inodes_stat,
		.maxlen		= 2*sizeof(long),
		.mode		= 0444,
		.proc_handler	= proc_nr_inodes,
	},
	{
		/* Same backing object as inode-nr, but exposes 7 longs */
		.procname	= "inode-state",
		.data		= &inodes_stat,
		.maxlen		= 7*sizeof(long),
		.mode		= 0444,
		.proc_handler	= proc_nr_inodes,
	},
	{
		.procname	= "file-nr",
		.data		= &files_stat,
		.maxlen		= sizeof(files_stat),
		.mode		= 0444,
		.proc_handler	= proc_nr_files,
	},
	{
		.procname	= "file-max",
		.data		= &files_stat.max_files,
		.maxlen		= sizeof(files_stat.max_files),
		.mode		= 0644,
		.proc_handler	= proc_doulongvec_minmax,
	},
	{
		.procname	= "nr_open",
		.data		= &sysctl_nr_open,
		.maxlen		= sizeof(unsigned int),
		.mode		= 0644,
		.proc_handler	= proc_dointvec_minmax,
		.extra1		= &sysctl_nr_open_min,
		.extra2		= &sysctl_nr_open_max,
	},
	{
		.procname	= "dentry-state",
		.data		= &dentry_stat,
		.maxlen		= 6*sizeof(long),
		.mode		= 0444,
		.proc_handler	= proc_nr_dentry,
	},
	{
		.procname	= "overflowuid",
		.data		= &fs_overflowuid,
		.maxlen		= sizeof(int),
		.mode		= 0644,
		.proc_handler	= proc_dointvec_minmax,
		.extra1		= &minolduid,
		.extra2		= &maxolduid,
	},
	{
		/* Uses the same minolduid/maxolduid bounds as overflowuid */
		.procname	= "overflowgid",
		.data		= &fs_overflowgid,
		.maxlen		= sizeof(int),
		.mode		= 0644,
		.proc_handler	= proc_dointvec_minmax,
		.extra1		= &minolduid,
		.extra2		= &maxolduid,
	},
#ifdef CONFIG_FILE_LOCKING
	{
		.procname	= "leases-enable",
		.data		= &leases_enable,
		.maxlen		= sizeof(int),
		.mode		= 0644,
		.proc_handler	= proc_dointvec,
	},
#endif
#ifdef CONFIG_DNOTIFY
	{
		.procname	= "dir-notify-enable",
		.data		= &dir_notify_enable,
		.maxlen		= sizeof(int),
		.mode		= 0644,
		.proc_handler	= proc_dointvec,
	},
#endif
	/* Everything up to the matching #endif is only built with CONFIG_MMU */
#ifdef CONFIG_MMU
#ifdef CONFIG_FILE_LOCKING
	{
		.procname	= "lease-break-time",
		.data		= &lease_break_time,
		.maxlen		= sizeof(int),
		.mode		= 0644,
		.proc_handler	= proc_dointvec,
	},
#endif
#ifdef CONFIG_AIO
	{
		.procname	= "aio-nr",
		.data		= &aio_nr,
		.maxlen		= sizeof(aio_nr),
		.mode		= 0444,
		.proc_handler	= proc_doulongvec_minmax,
	},
	{
		.procname	= "aio-max-nr",
		.data		= &aio_max_nr,
		.maxlen		= sizeof(aio_max_nr),
		.mode		= 0644,
		.proc_handler	= proc_doulongvec_minmax,
	},
#endif /* CONFIG_AIO */
#ifdef CONFIG_INOTIFY_USER
	{
		/* Directory entry: no data/handler, only a child table */
		.procname	= "inotify",
		.mode		= 0555,
		.child		= inotify_table,
	},
#endif	
#ifdef CONFIG_EPOLL
	{
		/* Directory entry: no data/handler, only a child table */
		.procname	= "epoll",
		.mode		= 0555,
		.child		= epoll_table,
	},
#endif
#endif
	/* The two link-protection knobs use mode 0600 and accept only 0..1 */
	{
		.procname	= "protected_symlinks",
		.data		= &sysctl_protected_symlinks,
		.maxlen		= sizeof(int),
		.mode		= 0600,
		.proc_handler	= proc_dointvec_minmax,
		.extra1		= &zero,
		.extra2		= &one,
	},
	{
		.procname	= "protected_hardlinks",
		.data		= &sysctl_protected_hardlinks,
		.maxlen		= sizeof(int),
		.mode		= 0600,
		.proc_handler	= proc_dointvec_minmax,
		.extra1		= &zero,
		.extra2		= &one,
	},
	{
		.procname	= "suid_dumpable",
		.data		= &suid_dumpable,
		.maxlen		= sizeof(int),
		.mode		= 0644,
		.proc_handler	= proc_dointvec_minmax_coredump,
		.extra1		= &zero,
		.extra2		= &two,
	},
#if defined(CONFIG_BINFMT_MISC) || defined(CONFIG_BINFMT_MISC_MODULE)
	{
		.procname	= "binfmt_misc",
		.mode		= 0555,
		.child		= sysctl_mount_point,
	},
#endif
	{
		.procname	= "pipe-max-size",
		.data		= &pipe_max_size,
		.maxlen		= sizeof(int),
		.mode		= 0644,
		.proc_handler	= &pipe_proc_fn,
		.extra1		= &pipe_min_size,
	},
	{
		.procname	= "pipe-user-pages-hard",
		.data		= &pipe_user_pages_hard,
		.maxlen		= sizeof(pipe_user_pages_hard),
		.mode		= 0644,
		.proc_handler	= proc_doulongvec_minmax,
	},
	{
		.procname	= "pipe-user-pages-soft",
		.data		= &pipe_user_pages_soft,
		.maxlen		= sizeof(pipe_user_pages_soft),
		.mode		= 0644,
		.proc_handler	= proc_doulongvec_minmax,
	},
	{
		/* Lower bound of one; no upper bound is supplied */
		.procname	= "mount-max",
		.data		= &sysctl_mount_max,
		.maxlen		= sizeof(unsigned int),
		.mode		= 0644,
		.proc_handler	= proc_dointvec_minmax,
		.extra1		= &one,
	},
	{ }
};
1828
1829static struct ctl_table debug_table[] = {
1830#ifdef CONFIG_SYSCTL_EXCEPTION_TRACE
1831	{
1832		.procname	= "exception-trace",
1833		.data		= &show_unhandled_signals,
1834		.maxlen		= sizeof(int),
1835		.mode		= 0644,
1836		.proc_handler	= proc_dointvec
1837	},
1838#endif
1839#if defined(CONFIG_OPTPROBES)
1840	{
1841		.procname	= "kprobes-optimization",
1842		.data		= &sysctl_kprobes_optimization,
1843		.maxlen		= sizeof(int),
1844		.mode		= 0644,
1845		.proc_handler	= proc_kprobes_optimization_handler,
1846		.extra1		= &zero,
1847		.extra2		= &one,
1848	},
1849#endif
1850	{ }
1851};
1852
/* Holds only the empty entry: no sysctl files are defined in this table. */
static struct ctl_table dev_table[] = {
	{ }
};
1856
1857int __init sysctl_init(void)
1858{
1859	struct ctl_table_header *hdr;
1860
1861	hdr = register_sysctl_table(sysctl_base_table);
1862	kmemleak_not_leak(hdr);
1863	return 0;
1864}
1865
1866#endif /* CONFIG_SYSCTL */
1867
1868/*
1869 * /proc/sys support
1870 */
1871
1872#ifdef CONFIG_PROC_SYSCTL
1873
1874static int _proc_do_string(char *data, int maxlen, int write,
1875			   char __user *buffer,
1876			   size_t *lenp, loff_t *ppos)
1877{
1878	size_t len;
1879	char __user *p;
1880	char c;
1881
1882	if (!data || !maxlen || !*lenp) {
1883		*lenp = 0;
1884		return 0;
1885	}
1886
1887	if (write) {
1888		if (sysctl_writes_strict == SYSCTL_WRITES_STRICT) {
1889			/* Only continue writes not past the end of buffer. */
1890			len = strlen(data);
1891			if (len > maxlen - 1)
1892				len = maxlen - 1;
1893
1894			if (*ppos > len)
1895				return 0;
1896			len = *ppos;
1897		} else {
1898			/* Start writing from beginning of buffer. */
1899			len = 0;
1900		}
1901
1902		*ppos += *lenp;
1903		p = buffer;
1904		while ((p - buffer) < *lenp && len < maxlen - 1) {
1905			if (get_user(c, p++))
1906				return -EFAULT;
1907			if (c == 0 || c == '\n')
1908				break;
1909			data[len++] = c;
1910		}
1911		data[len] = 0;
1912	} else {
1913		len = strlen(data);
1914		if (len > maxlen)
1915			len = maxlen;
1916
1917		if (*ppos > len) {
1918			*lenp = 0;
1919			return 0;
1920		}
1921
1922		data += *ppos;
1923		len  -= *ppos;
1924
1925		if (len > *lenp)
1926			len = *lenp;
1927		if (len)
1928			if (copy_to_user(buffer, data, len))
1929				return -EFAULT;
1930		if (len < *lenp) {
1931			if (put_user('\n', buffer + len))
1932				return -EFAULT;
1933			len++;
1934		}
1935		*lenp = len;
1936		*ppos += len;
1937	}
1938	return 0;
1939}
1940
1941static void warn_sysctl_write(struct ctl_table *table)
1942{
1943	pr_warn_once("%s wrote to %s when file position was not 0!\n"
1944		"This will not be supported in the future. To silence this\n"
1945		"warning, set kernel.sysctl_writes_strict = -1\n",
1946		current->comm, table->procname);
1947}
1948
1949/**
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1950 * proc_dostring - read a string sysctl
1951 * @table: the sysctl table
1952 * @write: %TRUE if this is a write to the sysctl file
1953 * @buffer: the user buffer
1954 * @lenp: the size of the user buffer
1955 * @ppos: file position
1956 *
1957 * Reads/writes a string from/to the user buffer. If the kernel
1958 * buffer provided is not large enough to hold the string, the
1959 * string is truncated. The copied string is %NULL-terminated.
1960 * If the string is being read by the user process, it is copied
1961 * and a newline '\n' is added. It is truncated if the buffer is
1962 * not large enough.
1963 *
1964 * Returns 0 on success.
1965 */
1966int proc_dostring(struct ctl_table *table, int write,
1967		  void __user *buffer, size_t *lenp, loff_t *ppos)
1968{
1969	if (write && *ppos && sysctl_writes_strict == SYSCTL_WRITES_WARN)
1970		warn_sysctl_write(table);
1971
1972	return _proc_do_string((char *)(table->data), table->maxlen, write,
1973			       (char __user *)buffer, lenp, ppos);
1974}
1975
1976static size_t proc_skip_spaces(char **buf)
1977{
1978	size_t ret;
1979	char *tmp = skip_spaces(*buf);
1980	ret = tmp - *buf;
1981	*buf = tmp;
1982	return ret;
1983}
1984
/*
 * Skip a leading run of the character @v: advance *buf and decrement
 * *size for each occurrence, stopping at the first different character
 * or when *size reaches zero.
 */
static void proc_skip_char(char **buf, size_t *size, const char v)
{
	for (; *size && **buf == v; (*size)--)
		(*buf)++;
}
1994
1995#define TMPBUFLEN 22
1996/**
1997 * proc_get_long - reads an ASCII formatted integer from a user buffer
1998 *
1999 * @buf: a kernel buffer
2000 * @size: size of the kernel buffer
2001 * @val: this is where the number will be stored
2002 * @neg: set to %TRUE if number is negative
2003 * @perm_tr: a vector which contains the allowed trailers
2004 * @perm_tr_len: size of the perm_tr vector
2005 * @tr: pointer to store the trailer character
2006 *
2007 * In case of success %0 is returned and @buf and @size are updated with
2008 * the amount of bytes read. If @tr is non-NULL and a trailing
2009 * character exists (size is non-zero after returning from this
2010 * function), @tr is updated with the trailing character.
2011 */
2012static int proc_get_long(char **buf, size_t *size,
2013			  unsigned long *val, bool *neg,
2014			  const char *perm_tr, unsigned perm_tr_len, char *tr)
2015{
2016	int len;
2017	char *p, tmp[TMPBUFLEN];
2018
2019	if (!*size)
2020		return -EINVAL;
2021
2022	len = *size;
2023	if (len > TMPBUFLEN - 1)
2024		len = TMPBUFLEN - 1;
2025
2026	memcpy(tmp, *buf, len);
2027
2028	tmp[len] = 0;
2029	p = tmp;
2030	if (*p == '-' && *size > 1) {
2031		*neg = true;
2032		p++;
2033	} else
2034		*neg = false;
2035	if (!isdigit(*p))
2036		return -EINVAL;
2037
2038	*val = simple_strtoul(p, &p, 0);
2039
2040	len = p - tmp;
2041
2042	/* We don't know if the next char is whitespace thus we may accept
2043	 * invalid integers (e.g. 1234...a) or two integers instead of one
2044	 * (e.g. 123...1). So lets not allow such large numbers. */
2045	if (len == TMPBUFLEN - 1)
2046		return -EINVAL;
2047
2048	if (len < *size && perm_tr_len && !memchr(perm_tr, *p, perm_tr_len))
2049		return -EINVAL;
2050
2051	if (tr && (len < *size))
2052		*tr = *p;
2053
2054	*buf += len;
2055	*size -= len;
2056
2057	return 0;
2058}
2059
2060/**
2061 * proc_put_long - converts an integer to a decimal ASCII formatted string
2062 *
2063 * @buf: the user buffer
2064 * @size: the size of the user buffer
2065 * @val: the integer to be converted
2066 * @neg: sign of the number, %TRUE for negative
2067 *
2068 * In case of success %0 is returned and @buf and @size are updated with
2069 * the amount of bytes written.
2070 */
2071static int proc_put_long(void __user **buf, size_t *size, unsigned long val,
2072			  bool neg)
2073{
2074	int len;
2075	char tmp[TMPBUFLEN], *p = tmp;
2076
2077	sprintf(p, "%s%lu", neg ? "-" : "", val);
2078	len = strlen(tmp);
2079	if (len > *size)
2080		len = *size;
2081	if (copy_to_user(*buf, tmp, len))
2082		return -EFAULT;
2083	*size -= len;
2084	*buf += len;
2085	return 0;
2086}
2087#undef TMPBUFLEN
2088
2089static int proc_put_char(void __user **buf, size_t *size, char c)
2090{
2091	if (*size) {
2092		char __user **buffer = (char __user **)buf;
2093		if (put_user(c, *buffer))
2094			return -EFAULT;
2095		(*size)--, (*buffer)++;
2096		*buf = *buffer;
2097	}
2098	return 0;
2099}
2100
/*
 * Convert between a signed int and the (sign, magnitude) pair used by
 * the text parsing/formatting helpers.
 *
 * write != 0: combine *negp and *lvalp into *valp, rejecting magnitudes
 *             that do not fit in an int with -EINVAL.
 * write == 0: split *valp into *negp and *lvalp.
 *
 * @data is unused.  Returns 0 on success.
 */
static int do_proc_dointvec_conv(bool *negp, unsigned long *lvalp,
				 int *valp,
				 int write, void *data)
{
	unsigned long limit;
	int cur;

	if (!write) {
		cur = *valp;
		*negp = cur < 0;
		*lvalp = *negp ? -(unsigned long)cur : (unsigned long)cur;
		return 0;
	}

	/* Negative numbers may have a magnitude one larger than INT_MAX. */
	limit = *negp ? (unsigned long) INT_MAX + 1 : (unsigned long) INT_MAX;
	if (*lvalp > limit)
		return -EINVAL;

	*valp = *negp ? -*lvalp : *lvalp;
	return 0;
}
2127
/*
 * Convert between an unsigned int (stored through @valp) and the
 * (sign, magnitude) pair used by the text parsing/formatting helpers.
 *
 * write != 0: store *lvalp through @valp.  Negative input and values
 *             larger than UINT_MAX are rejected with -EINVAL instead of
 *             being silently truncated.
 * write == 0: load the value as unsigned into *lvalp and clear *negp so
 *             the caller never prints a sign taken from an uninitialised
 *             flag.
 *
 * @data is unused.  Returns 0 on success.
 */
static int do_proc_douintvec_conv(bool *negp, unsigned long *lvalp,
				 int *valp,
				 int write, void *data)
{
	if (write) {
		if (*negp)
			return -EINVAL;
		if (*lvalp > UINT_MAX)
			return -EINVAL;
		*(unsigned int *)valp = (unsigned int)*lvalp;
	} else {
		unsigned int val = *valp;

		*negp = false;
		*lvalp = (unsigned long)val;
	}
	return 0;
}
2142
/* Characters accepted as the trailer after a number when parsing writes. */
static const char proc_wspace_sep[] = { ' ', '\t', '\n' };

/*
 * Core reader/writer for a vector of ints exposed as ASCII text.
 *
 * @tbl_data: the int array backing the entry
 * @table:    the sysctl entry; ->maxlen determines the number of ints
 * @write:    non-zero to parse user text into the array, zero to format
 *            the array into the user buffer
 * @buffer:   the user buffer
 * @lenp:     in: size of @buffer; out: bytes consumed or produced
 * @ppos:     file position, advanced by the final *lenp
 * @conv:     per-value conversion callback; do_proc_dointvec_conv is used
 *            when NULL
 * @data:     opaque argument passed through to @conv
 *
 * Returns 0 on success, the error from the copy/parse helpers, or -EINVAL
 * when @conv rejects a value or a write contains no parsable value.
 */
static int __do_proc_dointvec(void *tbl_data, struct ctl_table *table,
		  int write, void __user *buffer,
		  size_t *lenp, loff_t *ppos,
		  int (*conv)(bool *negp, unsigned long *lvalp, int *valp,
			      int write, void *data),
		  void *data)
{
	int *i, vleft, first = 1, err = 0;
	size_t left;
	char *kbuf = NULL, *p;
	
	/* Nothing to do: no backing data, empty buffer, or a read that has
	 * already advanced past position 0. */
	if (!tbl_data || !table->maxlen || !*lenp || (*ppos && !write)) {
		*lenp = 0;
		return 0;
	}
	
	i = (int *) tbl_data;
	/* vleft: number of ints in the vector; left: user bytes remaining */
	vleft = table->maxlen / sizeof(*i);
	left = *lenp;

	if (!conv)
		conv = do_proc_dointvec_conv;

	if (write) {
		if (*ppos) {
			switch (sysctl_writes_strict) {
			case SYSCTL_WRITES_STRICT:
				/* Skip parsing entirely; only *ppos is advanced. */
				goto out;
			case SYSCTL_WRITES_WARN:
				warn_sysctl_write(table);
				break;
			default:
				break;
			}
		}

		/* Cap the input and work on a NUL-terminated kernel copy. */
		if (left > PAGE_SIZE - 1)
			left = PAGE_SIZE - 1;
		p = kbuf = memdup_user_nul(buffer, left);
		if (IS_ERR(kbuf))
			return PTR_ERR(kbuf);
	}

	/* One iteration per vector element, while input/output space remains;
	 * 'first' is cleared once an element has been fully processed. */
	for (; left && vleft--; i++, first=0) {
		unsigned long lval;
		bool neg;

		if (write) {
			left -= proc_skip_spaces(&p);

			if (!left)
				break;
			err = proc_get_long(&p, &left, &lval, &neg,
					     proc_wspace_sep,
					     sizeof(proc_wspace_sep), NULL);
			if (err)
				break;
			if (conv(&neg, &lval, i, 1, data)) {
				err = -EINVAL;
				break;
			}
		} else {
			if (conv(&neg, &lval, i, 0, data)) {
				err = -EINVAL;
				break;
			}
			/* Values after the first are separated by a tab. */
			if (!first)
				err = proc_put_char(&buffer, &left, '\t');
			if (err)
				break;
			err = proc_put_long(&buffer, &left, lval, neg);
			if (err)
				break;
		}
	}

	/* Read: finish the line if at least one value was emitted. */
	if (!write && !first && left && !err)
		err = proc_put_char(&buffer, &left, '\n');
	/* Write: swallow trailing whitespace so it counts as consumed. */
	if (write && !err && left)
		left -= proc_skip_spaces(&p);
	if (write) {
		kfree(kbuf);
		/* No value was parsed at all: report the error, or -EINVAL. */
		if (first)
			return err ? : -EINVAL;
	}
	/* Report the number of bytes actually consumed/produced. */
	*lenp -= left;
out:
	*ppos += *lenp;
	return err;
}
2235
2236static int do_proc_dointvec(struct ctl_table *table, int write,
2237		  void __user *buffer, size_t *lenp, loff_t *ppos,
2238		  int (*conv)(bool *negp, unsigned long *lvalp, int *valp,
2239			      int write, void *data),
2240		  void *data)
2241{
2242	return __do_proc_dointvec(table->data, table, write,
2243			buffer, lenp, ppos, conv, data);
2244}
2245
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2246/**
2247 * proc_dointvec - read a vector of integers
2248 * @table: the sysctl table
2249 * @write: %TRUE if this is a write to the sysctl file
2250 * @buffer: the user buffer
2251 * @lenp: the size of the user buffer
2252 * @ppos: file position
2253 *
2254 * Reads/writes up to table->maxlen/sizeof(unsigned int) integer
2255 * values from/to the user buffer, treated as an ASCII string. 
2256 *
2257 * Returns 0 on success.
2258 */
2259int proc_dointvec(struct ctl_table *table, int write,
2260		     void __user *buffer, size_t *lenp, loff_t *ppos)
2261{
2262	return do_proc_dointvec(table, write, buffer, lenp, ppos, NULL, NULL);
2263}
2264
2265/**
2266 * proc_douintvec - read a vector of unsigned integers
2267 * @table: the sysctl table
2268 * @write: %TRUE if this is a write to the sysctl file
2269 * @buffer: the user buffer
2270 * @lenp: the size of the user buffer
2271 * @ppos: file position
2272 *
2273 * Reads/writes up to table->maxlen/sizeof(unsigned int) unsigned integer
2274 * values from/to the user buffer, treated as an ASCII string.
2275 *
2276 * Returns 0 on success.
2277 */
2278int proc_douintvec(struct ctl_table *table, int write,
2279		     void __user *buffer, size_t *lenp, loff_t *ppos)
2280{
2281	return do_proc_dointvec(table, write, buffer, lenp, ppos,
2282				do_proc_douintvec_conv, NULL);
2283}
2284
2285/*
2286 * Taint values can only be increased
2287 * This means we can safely use a temporary.
2288 */
2289static int proc_taint(struct ctl_table *table, int write,
2290			       void __user *buffer, size_t *lenp, loff_t *ppos)
2291{
2292	struct ctl_table t;
2293	unsigned long tmptaint = get_taint();
2294	int err;
2295
2296	if (write && !capable(CAP_SYS_ADMIN))
2297		return -EPERM;
2298
2299	t = *table;
2300	t.data = &tmptaint;
2301	err = proc_doulongvec_minmax(&t, write, buffer, lenp, ppos);
2302	if (err < 0)
2303		return err;
2304
2305	if (write) {
2306		/*
2307		 * Poor man's atomic or. Not worth adding a primitive
2308		 * to everyone's atomic.h for this
2309		 */
2310		int i;
2311		for (i = 0; i < BITS_PER_LONG && tmptaint >> i; i++) {
2312			if ((tmptaint >> i) & 1)
2313				add_taint(i, LOCKDEP_STILL_OK);
2314		}
2315	}
2316
2317	return err;
2318}
2319
#ifdef CONFIG_PRINTK
/*
 * proc_dointvec_minmax() variant whose writes additionally require
 * CAP_SYS_ADMIN; reads are passed straight through.
 */
static int proc_dointvec_minmax_sysadmin(struct ctl_table *table, int write,
				void __user *buffer, size_t *lenp, loff_t *ppos)
{
	if (!write || capable(CAP_SYS_ADMIN))
		return proc_dointvec_minmax(table, write, buffer, lenp, ppos);

	return -EPERM;
}
#endif
2330
 
 
 
 
 
 
 
 
 
/*
 * Bounds passed to do_proc_dointvec_minmax_conv().  A NULL pointer means
 * that side of the range is unbounded.
 */
struct do_proc_dointvec_minmax_conv_param {
	int *min;	/* smallest accepted value, or NULL */
	int *max;	/* largest accepted value, or NULL */
};

/*
 * Range-checked variant of the signed int conversion.
 *
 * write != 0: combine *negp and *lvalp into an int and store it in *valp
 *             if it lies within [min, max].  The magnitude is checked
 *             against the int range first, so an over-large number is
 *             rejected rather than truncated into a value that could
 *             slip past the bounds.
 * write == 0: split *valp into *negp and *lvalp.
 *
 * @data points to a struct do_proc_dointvec_minmax_conv_param.
 * Returns 0 on success or -EINVAL for an out-of-range value.
 */
static int do_proc_dointvec_minmax_conv(bool *negp, unsigned long *lvalp,
					int *valp,
					int write, void *data)
{
	struct do_proc_dointvec_minmax_conv_param *param = data;
	if (write) {
		int val;

		if (*negp) {
			/* INT_MIN has a magnitude one larger than INT_MAX. */
			if (*lvalp > (unsigned long) INT_MAX + 1)
				return -EINVAL;
			val = -*lvalp;
		} else {
			if (*lvalp > (unsigned long) INT_MAX)
				return -EINVAL;
			val = *lvalp;
		}
		if ((param->min && *param->min > val) ||
		    (param->max && *param->max < val))
			return -EINVAL;
		*valp = val;
	} else {
		int val = *valp;
		if (val < 0) {
			*negp = true;
			*lvalp = -(unsigned long)val;
		} else {
			*negp = false;
			*lvalp = (unsigned long)val;
		}
	}
	return 0;
}
2359
2360/**
2361 * proc_dointvec_minmax - read a vector of integers with min/max values
2362 * @table: the sysctl table
2363 * @write: %TRUE if this is a write to the sysctl file
2364 * @buffer: the user buffer
2365 * @lenp: the size of the user buffer
2366 * @ppos: file position
2367 *
2368 * Reads/writes up to table->maxlen/sizeof(unsigned int) integer
2369 * values from/to the user buffer, treated as an ASCII string.
2370 *
2371 * This routine will ensure the values are within the range specified by
2372 * table->extra1 (min) and table->extra2 (max).
2373 *
2374 * Returns 0 on success.
2375 */
2376int proc_dointvec_minmax(struct ctl_table *table, int write,
2377		  void __user *buffer, size_t *lenp, loff_t *ppos)
2378{
2379	struct do_proc_dointvec_minmax_conv_param param = {
2380		.min = (int *) table->extra1,
2381		.max = (int *) table->extra2,
2382	};
2383	return do_proc_dointvec(table, write, buffer, lenp, ppos,
2384				do_proc_dointvec_minmax_conv, &param);
2385}
2386
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
/*
 * Warn when suid_dumpable is SUID_DUMP_ROOT while core_pattern starts with
 * neither '/' nor '|'. Compiles to an empty function without
 * CONFIG_COREDUMP.
 */
static void validate_coredump_safety(void)
{
#ifdef CONFIG_COREDUMP
	char lead;

	if (suid_dumpable != SUID_DUMP_ROOT)
		return;

	lead = core_pattern[0];
	if (lead == '/' || lead == '|')
		return;

	printk(KERN_WARNING
"Unsafe core_pattern used with fs.suid_dumpable=2.\n"
"Pipe handler or fully qualified core dump path required.\n"
"Set kernel.core_pattern before fs.suid_dumpable.\n"
	);
#endif
}
2400
2401static int proc_dointvec_minmax_coredump(struct ctl_table *table, int write,
2402		void __user *buffer, size_t *lenp, loff_t *ppos)
2403{
2404	int error = proc_dointvec_minmax(table, write, buffer, lenp, ppos);
2405	if (!error)
2406		validate_coredump_safety();
2407	return error;
2408}
2409
#ifdef CONFIG_COREDUMP
/*
 * proc_dostring() followed, on success only, by a re-check of the core
 * dump settings via validate_coredump_safety().
 */
static int proc_dostring_coredump(struct ctl_table *table, int write,
		  void __user *buffer, size_t *lenp, loff_t *ppos)
{
	int error;

	error = proc_dostring(table, write, buffer, lenp, ppos);
	if (error)
		return error;

	validate_coredump_safety();
	return 0;
}
#endif
2420
2421static int __do_proc_doulongvec_minmax(void *data, struct ctl_table *table, int write,
2422				     void __user *buffer,
2423				     size_t *lenp, loff_t *ppos,
2424				     unsigned long convmul,
2425				     unsigned long convdiv)
2426{
2427	unsigned long *i, *min, *max;
2428	int vleft, first = 1, err = 0;
2429	size_t left;
2430	char *kbuf = NULL, *p;
2431
2432	if (!data || !table->maxlen || !*lenp || (*ppos && !write)) {
2433		*lenp = 0;
2434		return 0;
2435	}
2436
2437	i = (unsigned long *) data;
2438	min = (unsigned long *) table->extra1;
2439	max = (unsigned long *) table->extra2;
2440	vleft = table->maxlen / sizeof(unsigned long);
2441	left = *lenp;
2442
2443	if (write) {
2444		if (*ppos) {
2445			switch (sysctl_writes_strict) {
2446			case SYSCTL_WRITES_STRICT:
2447				goto out;
2448			case SYSCTL_WRITES_WARN:
2449				warn_sysctl_write(table);
2450				break;
2451			default:
2452				break;
2453			}
2454		}
2455
2456		if (left > PAGE_SIZE - 1)
2457			left = PAGE_SIZE - 1;
2458		p = kbuf = memdup_user_nul(buffer, left);
2459		if (IS_ERR(kbuf))
2460			return PTR_ERR(kbuf);
2461	}
2462
2463	for (; left && vleft--; i++, first = 0) {
2464		unsigned long val;
2465
2466		if (write) {
2467			bool neg;
2468
2469			left -= proc_skip_spaces(&p);
2470
2471			err = proc_get_long(&p, &left, &val, &neg,
2472					     proc_wspace_sep,
2473					     sizeof(proc_wspace_sep), NULL);
2474			if (err)
2475				break;
2476			if (neg)
2477				continue;
2478			val = convmul * val / convdiv;
2479			if ((min && val < *min) || (max && val > *max))
2480				continue;
2481			*i = val;
2482		} else {
2483			val = convdiv * (*i) / convmul;
2484			if (!first) {
2485				err = proc_put_char(&buffer, &left, '\t');
2486				if (err)
2487					break;
2488			}
2489			err = proc_put_long(&buffer, &left, val, false);
2490			if (err)
2491				break;
2492		}
2493	}
2494
2495	if (!write && !first && left && !err)
2496		err = proc_put_char(&buffer, &left, '\n');
2497	if (write && !err)
2498		left -= proc_skip_spaces(&p);
2499	if (write) {
2500		kfree(kbuf);
2501		if (first)
2502			return err ? : -EINVAL;
2503	}
2504	*lenp -= left;
2505out:
2506	*ppos += *lenp;
2507	return err;
2508}
2509
2510static int do_proc_doulongvec_minmax(struct ctl_table *table, int write,
2511				     void __user *buffer,
2512				     size_t *lenp, loff_t *ppos,
2513				     unsigned long convmul,
2514				     unsigned long convdiv)
2515{
2516	return __do_proc_doulongvec_minmax(table->data, table, write,
2517			buffer, lenp, ppos, convmul, convdiv);
2518}
2519
2520/**
2521 * proc_doulongvec_minmax - read a vector of long integers with min/max values
2522 * @table: the sysctl table
2523 * @write: %TRUE if this is a write to the sysctl file
2524 * @buffer: the user buffer
2525 * @lenp: the size of the user buffer
2526 * @ppos: file position
2527 *
2528 * Reads/writes up to table->maxlen/sizeof(unsigned long) unsigned long
2529 * values from/to the user buffer, treated as an ASCII string.
2530 *
2531 * This routine will ensure the values are within the range specified by
2532 * table->extra1 (min) and table->extra2 (max).
2533 *
2534 * Returns 0 on success.
2535 */
2536int proc_doulongvec_minmax(struct ctl_table *table, int write,
2537			   void __user *buffer, size_t *lenp, loff_t *ppos)
2538{
2539    return do_proc_doulongvec_minmax(table, write, buffer, lenp, ppos, 1l, 1l);
2540}
2541
2542/**
2543 * proc_doulongvec_ms_jiffies_minmax - read a vector of millisecond values with min/max values
2544 * @table: the sysctl table
2545 * @write: %TRUE if this is a write to the sysctl file
2546 * @buffer: the user buffer
2547 * @lenp: the size of the user buffer
2548 * @ppos: file position
2549 *
2550 * Reads/writes up to table->maxlen/sizeof(unsigned long) unsigned long
2551 * values from/to the user buffer, treated as an ASCII string. The values
2552 * are treated as milliseconds, and converted to jiffies when they are stored.
2553 *
2554 * This routine will ensure the values are within the range specified by
2555 * table->extra1 (min) and table->extra2 (max).
2556 *
2557 * Returns 0 on success.
2558 */
2559int proc_doulongvec_ms_jiffies_minmax(struct ctl_table *table, int write,
2560				      void __user *buffer,
2561				      size_t *lenp, loff_t *ppos)
2562{
2563    return do_proc_doulongvec_minmax(table, write, buffer,
2564				     lenp, ppos, HZ, 1000l);
2565}
2566
2567
2568static int do_proc_dointvec_jiffies_conv(bool *negp, unsigned long *lvalp,
2569					 int *valp,
2570					 int write, void *data)
2571{
2572	if (write) {
2573		if (*lvalp > LONG_MAX / HZ)
2574			return 1;
2575		*valp = *negp ? -(*lvalp*HZ) : (*lvalp*HZ);
2576	} else {
2577		int val = *valp;
2578		unsigned long lval;
2579		if (val < 0) {
2580			*negp = true;
2581			lval = -(unsigned long)val;
2582		} else {
2583			*negp = false;
2584			lval = (unsigned long)val;
2585		}
2586		*lvalp = lval / HZ;
2587	}
2588	return 0;
2589}
2590
2591static int do_proc_dointvec_userhz_jiffies_conv(bool *negp, unsigned long *lvalp,
2592						int *valp,
2593						int write, void *data)
2594{
2595	if (write) {
2596		if (USER_HZ < HZ && *lvalp > (LONG_MAX / HZ) * USER_HZ)
2597			return 1;
2598		*valp = clock_t_to_jiffies(*negp ? -*lvalp : *lvalp);
2599	} else {
2600		int val = *valp;
2601		unsigned long lval;
2602		if (val < 0) {
2603			*negp = true;
2604			lval = -(unsigned long)val;
2605		} else {
2606			*negp = false;
2607			lval = (unsigned long)val;
2608		}
2609		*lvalp = jiffies_to_clock_t(lval);
2610	}
2611	return 0;
2612}
2613
2614static int do_proc_dointvec_ms_jiffies_conv(bool *negp, unsigned long *lvalp,
2615					    int *valp,
2616					    int write, void *data)
2617{
2618	if (write) {
2619		unsigned long jif = msecs_to_jiffies(*negp ? -*lvalp : *lvalp);
2620
2621		if (jif > INT_MAX)
2622			return 1;
2623		*valp = (int)jif;
2624	} else {
2625		int val = *valp;
2626		unsigned long lval;
2627		if (val < 0) {
2628			*negp = true;
2629			lval = -(unsigned long)val;
2630		} else {
2631			*negp = false;
2632			lval = (unsigned long)val;
2633		}
2634		*lvalp = jiffies_to_msecs(lval);
2635	}
2636	return 0;
2637}
2638
2639/**
2640 * proc_dointvec_jiffies - read a vector of integers as seconds
2641 * @table: the sysctl table
2642 * @write: %TRUE if this is a write to the sysctl file
2643 * @buffer: the user buffer
2644 * @lenp: the size of the user buffer
2645 * @ppos: file position
2646 *
2647 * Reads/writes up to table->maxlen/sizeof(unsigned int) integer
2648 * values from/to the user buffer, treated as an ASCII string. 
2649 * The values read are assumed to be in seconds, and are converted into
2650 * jiffies.
2651 *
2652 * Returns 0 on success.
2653 */
2654int proc_dointvec_jiffies(struct ctl_table *table, int write,
2655			  void __user *buffer, size_t *lenp, loff_t *ppos)
2656{
2657    return do_proc_dointvec(table,write,buffer,lenp,ppos,
2658		    	    do_proc_dointvec_jiffies_conv,NULL);
2659}
2660
2661/**
2662 * proc_dointvec_userhz_jiffies - read a vector of integers as 1/USER_HZ seconds
2663 * @table: the sysctl table
2664 * @write: %TRUE if this is a write to the sysctl file
2665 * @buffer: the user buffer
2666 * @lenp: the size of the user buffer
2667 * @ppos: pointer to the file position
2668 *
2669 * Reads/writes up to table->maxlen/sizeof(unsigned int) integer
2670 * values from/to the user buffer, treated as an ASCII string. 
2671 * The values read are assumed to be in 1/USER_HZ seconds, and 
2672 * are converted into jiffies.
2673 *
2674 * Returns 0 on success.
2675 */
2676int proc_dointvec_userhz_jiffies(struct ctl_table *table, int write,
2677				 void __user *buffer, size_t *lenp, loff_t *ppos)
2678{
2679    return do_proc_dointvec(table,write,buffer,lenp,ppos,
2680		    	    do_proc_dointvec_userhz_jiffies_conv,NULL);
2681}
2682
2683/**
2684 * proc_dointvec_ms_jiffies - read a vector of integers as 1 milliseconds
2685 * @table: the sysctl table
2686 * @write: %TRUE if this is a write to the sysctl file
2687 * @buffer: the user buffer
2688 * @lenp: the size of the user buffer
2689 * @ppos: file position
2690 * @ppos: the current position in the file
2691 *
2692 * Reads/writes up to table->maxlen/sizeof(unsigned int) integer
2693 * values from/to the user buffer, treated as an ASCII string. 
2694 * The values read are assumed to be in 1/1000 seconds, and 
2695 * are converted into jiffies.
2696 *
2697 * Returns 0 on success.
2698 */
2699int proc_dointvec_ms_jiffies(struct ctl_table *table, int write,
2700			     void __user *buffer, size_t *lenp, loff_t *ppos)
2701{
2702	return do_proc_dointvec(table, write, buffer, lenp, ppos,
2703				do_proc_dointvec_ms_jiffies_conv, NULL);
2704}
2705
2706static int proc_do_cad_pid(struct ctl_table *table, int write,
2707			   void __user *buffer, size_t *lenp, loff_t *ppos)
2708{
2709	struct pid *new_pid;
2710	pid_t tmp;
2711	int r;
2712
2713	tmp = pid_vnr(cad_pid);
2714
2715	r = __do_proc_dointvec(&tmp, table, write, buffer,
2716			       lenp, ppos, NULL, NULL);
2717	if (r || !write)
2718		return r;
2719
2720	new_pid = find_get_pid(tmp);
2721	if (!new_pid)
2722		return -ESRCH;
2723
2724	put_pid(xchg(&cad_pid, new_pid));
2725	return 0;
2726}
2727
2728/**
2729 * proc_do_large_bitmap - read/write from/to a large bitmap
2730 * @table: the sysctl table
2731 * @write: %TRUE if this is a write to the sysctl file
2732 * @buffer: the user buffer
2733 * @lenp: the size of the user buffer
2734 * @ppos: file position
2735 *
2736 * The bitmap is stored at table->data and the bitmap length (in bits)
2737 * in table->maxlen.
2738 *
2739 * We use a range comma separated format (e.g. 1,3-4,10-10) so that
2740 * large bitmaps may be represented in a compact manner. Writing into
2741 * the file will clear the bitmap then update it with the given input.
2742 *
2743 * Returns 0 on success.
2744 */
2745int proc_do_large_bitmap(struct ctl_table *table, int write,
2746			 void __user *buffer, size_t *lenp, loff_t *ppos)
2747{
2748	int err = 0;
2749	bool first = 1;
2750	size_t left = *lenp;
2751	unsigned long bitmap_len = table->maxlen;
2752	unsigned long *bitmap = *(unsigned long **) table->data;
2753	unsigned long *tmp_bitmap = NULL;
2754	char tr_a[] = { '-', ',', '\n' }, tr_b[] = { ',', '\n', 0 }, c;
2755
2756	if (!bitmap || !bitmap_len || !left || (*ppos && !write)) {
2757		*lenp = 0;
2758		return 0;
2759	}
2760
2761	if (write) {
2762		char *kbuf, *p;
2763
2764		if (left > PAGE_SIZE - 1)
2765			left = PAGE_SIZE - 1;
2766
2767		p = kbuf = memdup_user_nul(buffer, left);
2768		if (IS_ERR(kbuf))
2769			return PTR_ERR(kbuf);
2770
2771		tmp_bitmap = kzalloc(BITS_TO_LONGS(bitmap_len) * sizeof(unsigned long),
2772				     GFP_KERNEL);
2773		if (!tmp_bitmap) {
2774			kfree(kbuf);
2775			return -ENOMEM;
2776		}
2777		proc_skip_char(&p, &left, '\n');
2778		while (!err && left) {
2779			unsigned long val_a, val_b;
2780			bool neg;
2781
2782			err = proc_get_long(&p, &left, &val_a, &neg, tr_a,
2783					     sizeof(tr_a), &c);
2784			if (err)
2785				break;
2786			if (val_a >= bitmap_len || neg) {
2787				err = -EINVAL;
2788				break;
2789			}
2790
2791			val_b = val_a;
2792			if (left) {
2793				p++;
2794				left--;
2795			}
2796
2797			if (c == '-') {
2798				err = proc_get_long(&p, &left, &val_b,
2799						     &neg, tr_b, sizeof(tr_b),
2800						     &c);
2801				if (err)
2802					break;
2803				if (val_b >= bitmap_len || neg ||
2804				    val_a > val_b) {
2805					err = -EINVAL;
2806					break;
2807				}
2808				if (left) {
2809					p++;
2810					left--;
2811				}
2812			}
2813
2814			bitmap_set(tmp_bitmap, val_a, val_b - val_a + 1);
2815			first = 0;
2816			proc_skip_char(&p, &left, '\n');
2817		}
2818		kfree(kbuf);
2819	} else {
2820		unsigned long bit_a, bit_b = 0;
2821
2822		while (left) {
2823			bit_a = find_next_bit(bitmap, bitmap_len, bit_b);
2824			if (bit_a >= bitmap_len)
2825				break;
2826			bit_b = find_next_zero_bit(bitmap, bitmap_len,
2827						   bit_a + 1) - 1;
2828
2829			if (!first) {
2830				err = proc_put_char(&buffer, &left, ',');
2831				if (err)
2832					break;
2833			}
2834			err = proc_put_long(&buffer, &left, bit_a, false);
2835			if (err)
2836				break;
2837			if (bit_a != bit_b) {
2838				err = proc_put_char(&buffer, &left, '-');
2839				if (err)
2840					break;
2841				err = proc_put_long(&buffer, &left, bit_b, false);
2842				if (err)
2843					break;
2844			}
2845
2846			first = 0; bit_b++;
2847		}
2848		if (!err)
2849			err = proc_put_char(&buffer, &left, '\n');
2850	}
2851
2852	if (!err) {
2853		if (write) {
2854			if (*ppos)
2855				bitmap_or(bitmap, bitmap, tmp_bitmap, bitmap_len);
2856			else
2857				bitmap_copy(bitmap, tmp_bitmap, bitmap_len);
2858		}
2859		kfree(tmp_bitmap);
2860		*lenp -= left;
2861		*ppos += *lenp;
2862		return 0;
2863	} else {
2864		kfree(tmp_bitmap);
2865		return err;
2866	}
 
 
 
2867}
2868
2869#else /* CONFIG_PROC_SYSCTL */
2870
2871int proc_dostring(struct ctl_table *table, int write,
2872		  void __user *buffer, size_t *lenp, loff_t *ppos)
2873{
2874	return -ENOSYS;
2875}
2876
2877int proc_dointvec(struct ctl_table *table, int write,
2878		  void __user *buffer, size_t *lenp, loff_t *ppos)
2879{
2880	return -ENOSYS;
2881}
2882
2883int proc_douintvec(struct ctl_table *table, int write,
2884		  void __user *buffer, size_t *lenp, loff_t *ppos)
2885{
2886	return -ENOSYS;
2887}
2888
2889int proc_dointvec_minmax(struct ctl_table *table, int write,
2890		    void __user *buffer, size_t *lenp, loff_t *ppos)
2891{
2892	return -ENOSYS;
2893}
2894
 
 
 
 
 
 
2895int proc_dointvec_jiffies(struct ctl_table *table, int write,
2896		    void __user *buffer, size_t *lenp, loff_t *ppos)
2897{
2898	return -ENOSYS;
2899}
2900
2901int proc_dointvec_userhz_jiffies(struct ctl_table *table, int write,
2902		    void __user *buffer, size_t *lenp, loff_t *ppos)
2903{
2904	return -ENOSYS;
2905}
2906
2907int proc_dointvec_ms_jiffies(struct ctl_table *table, int write,
2908			     void __user *buffer, size_t *lenp, loff_t *ppos)
2909{
2910	return -ENOSYS;
2911}
2912
2913int proc_doulongvec_minmax(struct ctl_table *table, int write,
2914		    void __user *buffer, size_t *lenp, loff_t *ppos)
2915{
2916	return -ENOSYS;
2917}
2918
2919int proc_doulongvec_ms_jiffies_minmax(struct ctl_table *table, int write,
2920				      void __user *buffer,
2921				      size_t *lenp, loff_t *ppos)
2922{
2923    return -ENOSYS;
2924}
2925
2926
2927#endif /* CONFIG_PROC_SYSCTL */
2928
2929/*
2930 * No sense putting this after each symbol definition, twice,
2931 * exception granted :-)
2932 */
2933EXPORT_SYMBOL(proc_dointvec);
2934EXPORT_SYMBOL(proc_douintvec);
2935EXPORT_SYMBOL(proc_dointvec_jiffies);
2936EXPORT_SYMBOL(proc_dointvec_minmax);
 
2937EXPORT_SYMBOL(proc_dointvec_userhz_jiffies);
2938EXPORT_SYMBOL(proc_dointvec_ms_jiffies);
2939EXPORT_SYMBOL(proc_dostring);
2940EXPORT_SYMBOL(proc_doulongvec_minmax);
2941EXPORT_SYMBOL(proc_doulongvec_ms_jiffies_minmax);
v4.17
   1/*
   2 * sysctl.c: General linux system control interface
   3 *
   4 * Begun 24 March 1995, Stephen Tweedie
   5 * Added /proc support, Dec 1995
   6 * Added bdflush entry and intvec min/max checking, 2/23/96, Tom Dyas.
   7 * Added hooks for /proc/sys/net (minor, minor patch), 96/4/1, Mike Shaver.
   8 * Added kernel/java-{interpreter,appletviewer}, 96/5/10, Mike Shaver.
   9 * Dynamic registration fixes, Stephen Tweedie.
  10 * Added kswapd-interval, ctrl-alt-del, printk stuff, 1/8/97, Chris Horn.
  11 * Made sysctl support optional via CONFIG_SYSCTL, 1/10/97, Chris
  12 *  Horn.
  13 * Added proc_doulongvec_ms_jiffies_minmax, 09/08/99, Carlos H. Bauer.
  14 * Added proc_doulongvec_minmax, 09/08/99, Carlos H. Bauer.
  15 * Changed linked lists to use list.h instead of lists.h, 02/24/00, Bill
  16 *  Wendling.
  17 * The list_for_each() macro wasn't appropriate for the sysctl loop.
  18 *  Removed it and replaced it with older style, 03/23/00, Bill Wendling
  19 */
  20
  21#include <linux/module.h>
  22#include <linux/aio.h>
  23#include <linux/mm.h>
  24#include <linux/swap.h>
  25#include <linux/slab.h>
  26#include <linux/sysctl.h>
  27#include <linux/bitmap.h>
  28#include <linux/signal.h>
  29#include <linux/printk.h>
  30#include <linux/proc_fs.h>
  31#include <linux/security.h>
  32#include <linux/ctype.h>
 
  33#include <linux/kmemleak.h>
  34#include <linux/fs.h>
  35#include <linux/init.h>
  36#include <linux/kernel.h>
  37#include <linux/kobject.h>
  38#include <linux/net.h>
  39#include <linux/sysrq.h>
  40#include <linux/highuid.h>
  41#include <linux/writeback.h>
  42#include <linux/ratelimit.h>
  43#include <linux/compaction.h>
  44#include <linux/hugetlb.h>
  45#include <linux/initrd.h>
  46#include <linux/key.h>
  47#include <linux/times.h>
  48#include <linux/limits.h>
  49#include <linux/dcache.h>
  50#include <linux/dnotify.h>
  51#include <linux/syscalls.h>
  52#include <linux/vmstat.h>
  53#include <linux/nfs_fs.h>
  54#include <linux/acpi.h>
  55#include <linux/reboot.h>
  56#include <linux/ftrace.h>
  57#include <linux/perf_event.h>
  58#include <linux/kprobes.h>
  59#include <linux/pipe_fs_i.h>
  60#include <linux/oom.h>
  61#include <linux/kmod.h>
  62#include <linux/capability.h>
  63#include <linux/binfmts.h>
  64#include <linux/sched/sysctl.h>
  65#include <linux/sched/coredump.h>
  66#include <linux/kexec.h>
  67#include <linux/bpf.h>
  68#include <linux/mount.h>
  69#include <linux/pipe_fs_i.h>
  70
  71#include <linux/uaccess.h>
  72#include <asm/processor.h>
  73
  74#ifdef CONFIG_X86
  75#include <asm/nmi.h>
  76#include <asm/stacktrace.h>
  77#include <asm/io.h>
  78#endif
  79#ifdef CONFIG_SPARC
  80#include <asm/setup.h>
  81#endif
  82#ifdef CONFIG_BSD_PROCESS_ACCT
  83#include <linux/acct.h>
  84#endif
  85#ifdef CONFIG_RT_MUTEXES
  86#include <linux/rtmutex.h>
  87#endif
  88#if defined(CONFIG_PROVE_LOCKING) || defined(CONFIG_LOCK_STAT)
  89#include <linux/lockdep.h>
  90#endif
  91#ifdef CONFIG_CHR_DEV_SG
  92#include <scsi/sg.h>
  93#endif
  94
  95#ifdef CONFIG_LOCKUP_DETECTOR
  96#include <linux/nmi.h>
  97#endif
  98
  99#if defined(CONFIG_SYSCTL)
 100
 101/* External variables not in a header file. */
 102extern int suid_dumpable;
 103#ifdef CONFIG_COREDUMP
 104extern int core_uses_pid;
 105extern char core_pattern[];
 106extern unsigned int core_pipe_limit;
 107#endif
 108extern int pid_max;
 109extern int pid_max_min, pid_max_max;
 110extern int percpu_pagelist_fraction;
 111extern int latencytop_enabled;
 112extern unsigned int sysctl_nr_open_min, sysctl_nr_open_max;
 113#ifndef CONFIG_MMU
 114extern int sysctl_nr_trim_pages;
 115#endif
 116
 117/* Constants used for minimum and  maximum */
 118#ifdef CONFIG_LOCKUP_DETECTOR
 119static int sixty = 60;
 120#endif
 121
 122static int __maybe_unused neg_one = -1;
 123
 124static int zero;
 125static int __maybe_unused one = 1;
 126static int __maybe_unused two = 2;
 127static int __maybe_unused four = 4;
 128static unsigned long one_ul = 1;
 129static int one_hundred = 100;
 130static int one_thousand = 1000;
 131#ifdef CONFIG_PRINTK
 132static int ten_thousand = 10000;
 133#endif
 134#ifdef CONFIG_PERF_EVENTS
 135static int six_hundred_forty_kb = 640 * 1024;
 136#endif
 137
 138/* this is needed for the proc_doulongvec_minmax of vm_dirty_bytes */
 139static unsigned long dirty_bytes_min = 2 * PAGE_SIZE;
 140
 141/* this is needed for the proc_dointvec_minmax for [fs_]overflow UID and GID */
 142static int maxolduid = 65535;
 143static int minolduid;
 144
 145static int ngroups_max = NGROUPS_MAX;
 146static const int cap_last_cap = CAP_LAST_CAP;
 147
 148/*this is needed for proc_doulongvec_minmax of sysctl_hung_task_timeout_secs */
 149#ifdef CONFIG_DETECT_HUNG_TASK
 150static unsigned long hung_task_timeout_max = (LONG_MAX/HZ);
 151#endif
 152
 153#ifdef CONFIG_INOTIFY_USER
 154#include <linux/inotify.h>
 155#endif
 156#ifdef CONFIG_SPARC
 157#endif
 158
 159#ifdef __hppa__
 160extern int pwrsw_enabled;
 161#endif
 162
 163#ifdef CONFIG_SYSCTL_ARCH_UNALIGN_ALLOW
 164extern int unaligned_enabled;
 165#endif
 166
 167#ifdef CONFIG_IA64
 168extern int unaligned_dump_stack;
 169#endif
 170
 171#ifdef CONFIG_SYSCTL_ARCH_UNALIGN_NO_WARN
 172extern int no_unaligned_warning;
 173#endif
 174
 175#ifdef CONFIG_PROC_SYSCTL
 176
 177/**
 178 * enum sysctl_writes_mode - supported sysctl write modes
 179 *
 180 * @SYSCTL_WRITES_LEGACY: each write syscall must fully contain the sysctl value
 181 * 	to be written, and multiple writes on the same sysctl file descriptor
 182 * 	will rewrite the sysctl value, regardless of file position. No warning
 183 * 	is issued when the initial position is not 0.
 184 * @SYSCTL_WRITES_WARN: same as above but warn when the initial file position is
 185 * 	not 0.
 186 * @SYSCTL_WRITES_STRICT: writes to numeric sysctl entries must always be at
 187 * 	file position 0 and the value must be fully contained in the buffer
 188 * 	sent to the write syscall. If dealing with strings respect the file
 189 * 	position, but restrict this to the max length of the buffer, anything
 190 * 	passed the max lenght will be ignored. Multiple writes will append
 191 * 	to the buffer.
 192 *
 193 * These write modes control how current file position affects the behavior of
 194 * updating sysctl values through the proc interface on each write.
 195 */
 196enum sysctl_writes_mode {
 197	SYSCTL_WRITES_LEGACY		= -1,
 198	SYSCTL_WRITES_WARN		= 0,
 199	SYSCTL_WRITES_STRICT		= 1,
 200};
 201
 202static enum sysctl_writes_mode sysctl_writes_strict = SYSCTL_WRITES_STRICT;
 203
 204static int proc_do_cad_pid(struct ctl_table *table, int write,
 205		  void __user *buffer, size_t *lenp, loff_t *ppos);
 206static int proc_taint(struct ctl_table *table, int write,
 207			       void __user *buffer, size_t *lenp, loff_t *ppos);
 208#endif
 209
 210#ifdef CONFIG_PRINTK
 211static int proc_dointvec_minmax_sysadmin(struct ctl_table *table, int write,
 212				void __user *buffer, size_t *lenp, loff_t *ppos);
 213#endif
 214
 215static int proc_dointvec_minmax_coredump(struct ctl_table *table, int write,
 216		void __user *buffer, size_t *lenp, loff_t *ppos);
 217#ifdef CONFIG_COREDUMP
 218static int proc_dostring_coredump(struct ctl_table *table, int write,
 219		void __user *buffer, size_t *lenp, loff_t *ppos);
 220#endif
 221static int proc_dopipe_max_size(struct ctl_table *table, int write,
 222		void __user *buffer, size_t *lenp, loff_t *ppos);
 223
 224#ifdef CONFIG_MAGIC_SYSRQ
 225/* Note: sysrq code uses its own private copy */
 226static int __sysrq_enabled = CONFIG_MAGIC_SYSRQ_DEFAULT_ENABLE;
 227
 228static int sysrq_sysctl_handler(struct ctl_table *table, int write,
 229				void __user *buffer, size_t *lenp,
 230				loff_t *ppos)
 231{
 232	int error;
 233
 234	error = proc_dointvec(table, write, buffer, lenp, ppos);
 235	if (error)
 236		return error;
 237
 238	if (write)
 239		sysrq_toggle_support(__sysrq_enabled);
 240
 241	return 0;
 242}
 243
 244#endif
 245
 246static struct ctl_table kern_table[];
 247static struct ctl_table vm_table[];
 248static struct ctl_table fs_table[];
 249static struct ctl_table debug_table[];
 250static struct ctl_table dev_table[];
 251extern struct ctl_table random_table[];
 252#ifdef CONFIG_EPOLL
 253extern struct ctl_table epoll_table[];
 254#endif
 255
 256#ifdef CONFIG_FW_LOADER_USER_HELPER
 257extern struct ctl_table firmware_config_table[];
 258#endif
 259
 260#ifdef HAVE_ARCH_PICK_MMAP_LAYOUT
 261int sysctl_legacy_va_layout;
 262#endif
 263
 264/* The default sysctl tables: */
 265
 266static struct ctl_table sysctl_base_table[] = {
 267	{
 268		.procname	= "kernel",
 269		.mode		= 0555,
 270		.child		= kern_table,
 271	},
 272	{
 273		.procname	= "vm",
 274		.mode		= 0555,
 275		.child		= vm_table,
 276	},
 277	{
 278		.procname	= "fs",
 279		.mode		= 0555,
 280		.child		= fs_table,
 281	},
 282	{
 283		.procname	= "debug",
 284		.mode		= 0555,
 285		.child		= debug_table,
 286	},
 287	{
 288		.procname	= "dev",
 289		.mode		= 0555,
 290		.child		= dev_table,
 291	},
 292	{ }
 293};
 294
 295#ifdef CONFIG_SCHED_DEBUG
 296static int min_sched_granularity_ns = 100000;		/* 100 usecs */
 297static int max_sched_granularity_ns = NSEC_PER_SEC;	/* 1 second */
 298static int min_wakeup_granularity_ns;			/* 0 usecs */
 299static int max_wakeup_granularity_ns = NSEC_PER_SEC;	/* 1 second */
 300#ifdef CONFIG_SMP
 301static int min_sched_tunable_scaling = SCHED_TUNABLESCALING_NONE;
 302static int max_sched_tunable_scaling = SCHED_TUNABLESCALING_END-1;
 303#endif /* CONFIG_SMP */
 304#endif /* CONFIG_SCHED_DEBUG */
 305
 306#ifdef CONFIG_COMPACTION
 307static int min_extfrag_threshold;
 308static int max_extfrag_threshold = 1000;
 309#endif
 310
 311static struct ctl_table kern_table[] = {
 312	{
 313		.procname	= "sched_child_runs_first",
 314		.data		= &sysctl_sched_child_runs_first,
 315		.maxlen		= sizeof(unsigned int),
 316		.mode		= 0644,
 317		.proc_handler	= proc_dointvec,
 318	},
 319#ifdef CONFIG_SCHED_DEBUG
 320	{
 321		.procname	= "sched_min_granularity_ns",
 322		.data		= &sysctl_sched_min_granularity,
 323		.maxlen		= sizeof(unsigned int),
 324		.mode		= 0644,
 325		.proc_handler	= sched_proc_update_handler,
 326		.extra1		= &min_sched_granularity_ns,
 327		.extra2		= &max_sched_granularity_ns,
 328	},
 329	{
 330		.procname	= "sched_latency_ns",
 331		.data		= &sysctl_sched_latency,
 332		.maxlen		= sizeof(unsigned int),
 333		.mode		= 0644,
 334		.proc_handler	= sched_proc_update_handler,
 335		.extra1		= &min_sched_granularity_ns,
 336		.extra2		= &max_sched_granularity_ns,
 337	},
 338	{
 339		.procname	= "sched_wakeup_granularity_ns",
 340		.data		= &sysctl_sched_wakeup_granularity,
 341		.maxlen		= sizeof(unsigned int),
 342		.mode		= 0644,
 343		.proc_handler	= sched_proc_update_handler,
 344		.extra1		= &min_wakeup_granularity_ns,
 345		.extra2		= &max_wakeup_granularity_ns,
 346	},
 347#ifdef CONFIG_SMP
 348	{
 349		.procname	= "sched_tunable_scaling",
 350		.data		= &sysctl_sched_tunable_scaling,
 351		.maxlen		= sizeof(enum sched_tunable_scaling),
 352		.mode		= 0644,
 353		.proc_handler	= sched_proc_update_handler,
 354		.extra1		= &min_sched_tunable_scaling,
 355		.extra2		= &max_sched_tunable_scaling,
 356	},
 357	{
 358		.procname	= "sched_migration_cost_ns",
 359		.data		= &sysctl_sched_migration_cost,
 360		.maxlen		= sizeof(unsigned int),
 361		.mode		= 0644,
 362		.proc_handler	= proc_dointvec,
 363	},
 364	{
 365		.procname	= "sched_nr_migrate",
 366		.data		= &sysctl_sched_nr_migrate,
 367		.maxlen		= sizeof(unsigned int),
 368		.mode		= 0644,
 369		.proc_handler	= proc_dointvec,
 370	},
 371	{
 372		.procname	= "sched_time_avg_ms",
 373		.data		= &sysctl_sched_time_avg,
 374		.maxlen		= sizeof(unsigned int),
 375		.mode		= 0644,
 376		.proc_handler	= proc_dointvec_minmax,
 377		.extra1		= &one,
 378	},
 379#ifdef CONFIG_SCHEDSTATS
 380	{
 381		.procname	= "sched_schedstats",
 382		.data		= NULL,
 383		.maxlen		= sizeof(unsigned int),
 384		.mode		= 0644,
 385		.proc_handler	= sysctl_schedstats,
 386		.extra1		= &zero,
 387		.extra2		= &one,
 388	},
 389#endif /* CONFIG_SCHEDSTATS */
 390#endif /* CONFIG_SMP */
 391#ifdef CONFIG_NUMA_BALANCING
 392	{
 393		.procname	= "numa_balancing_scan_delay_ms",
 394		.data		= &sysctl_numa_balancing_scan_delay,
 395		.maxlen		= sizeof(unsigned int),
 396		.mode		= 0644,
 397		.proc_handler	= proc_dointvec,
 398	},
 399	{
 400		.procname	= "numa_balancing_scan_period_min_ms",
 401		.data		= &sysctl_numa_balancing_scan_period_min,
 402		.maxlen		= sizeof(unsigned int),
 403		.mode		= 0644,
 404		.proc_handler	= proc_dointvec,
 405	},
 406	{
 407		.procname	= "numa_balancing_scan_period_max_ms",
 408		.data		= &sysctl_numa_balancing_scan_period_max,
 409		.maxlen		= sizeof(unsigned int),
 410		.mode		= 0644,
 411		.proc_handler	= proc_dointvec,
 412	},
 413	{
 414		.procname	= "numa_balancing_scan_size_mb",
 415		.data		= &sysctl_numa_balancing_scan_size,
 416		.maxlen		= sizeof(unsigned int),
 417		.mode		= 0644,
 418		.proc_handler	= proc_dointvec_minmax,
 419		.extra1		= &one,
 420	},
 421	{
 422		.procname	= "numa_balancing",
 423		.data		= NULL, /* filled in by handler */
 424		.maxlen		= sizeof(unsigned int),
 425		.mode		= 0644,
 426		.proc_handler	= sysctl_numa_balancing,
 427		.extra1		= &zero,
 428		.extra2		= &one,
 429	},
 430#endif /* CONFIG_NUMA_BALANCING */
 431#endif /* CONFIG_SCHED_DEBUG */
 432	{
 433		.procname	= "sched_rt_period_us",
 434		.data		= &sysctl_sched_rt_period,
 435		.maxlen		= sizeof(unsigned int),
 436		.mode		= 0644,
 437		.proc_handler	= sched_rt_handler,
 438	},
 439	{
 440		.procname	= "sched_rt_runtime_us",
 441		.data		= &sysctl_sched_rt_runtime,
 442		.maxlen		= sizeof(int),
 443		.mode		= 0644,
 444		.proc_handler	= sched_rt_handler,
 445	},
 446	{
 447		.procname	= "sched_rr_timeslice_ms",
 448		.data		= &sysctl_sched_rr_timeslice,
 449		.maxlen		= sizeof(int),
 450		.mode		= 0644,
 451		.proc_handler	= sched_rr_handler,
 452	},
 453#ifdef CONFIG_SCHED_AUTOGROUP
 454	{
 455		.procname	= "sched_autogroup_enabled",
 456		.data		= &sysctl_sched_autogroup_enabled,
 457		.maxlen		= sizeof(unsigned int),
 458		.mode		= 0644,
 459		.proc_handler	= proc_dointvec_minmax,
 460		.extra1		= &zero,
 461		.extra2		= &one,
 462	},
 463#endif
 464#ifdef CONFIG_CFS_BANDWIDTH
 465	{
 466		.procname	= "sched_cfs_bandwidth_slice_us",
 467		.data		= &sysctl_sched_cfs_bandwidth_slice,
 468		.maxlen		= sizeof(unsigned int),
 469		.mode		= 0644,
 470		.proc_handler	= proc_dointvec_minmax,
 471		.extra1		= &one,
 472	},
 473#endif
 474#ifdef CONFIG_PROVE_LOCKING
 475	{
 476		.procname	= "prove_locking",
 477		.data		= &prove_locking,
 478		.maxlen		= sizeof(int),
 479		.mode		= 0644,
 480		.proc_handler	= proc_dointvec,
 481	},
 482#endif
 483#ifdef CONFIG_LOCK_STAT
 484	{
 485		.procname	= "lock_stat",
 486		.data		= &lock_stat,
 487		.maxlen		= sizeof(int),
 488		.mode		= 0644,
 489		.proc_handler	= proc_dointvec,
 490	},
 491#endif
 492	{
 493		.procname	= "panic",
 494		.data		= &panic_timeout,
 495		.maxlen		= sizeof(int),
 496		.mode		= 0644,
 497		.proc_handler	= proc_dointvec,
 498	},
 499#ifdef CONFIG_COREDUMP
 500	{
 501		.procname	= "core_uses_pid",
 502		.data		= &core_uses_pid,
 503		.maxlen		= sizeof(int),
 504		.mode		= 0644,
 505		.proc_handler	= proc_dointvec,
 506	},
 507	{
 508		.procname	= "core_pattern",
 509		.data		= core_pattern,
 510		.maxlen		= CORENAME_MAX_SIZE,
 511		.mode		= 0644,
 512		.proc_handler	= proc_dostring_coredump,
 513	},
 514	{
 515		.procname	= "core_pipe_limit",
 516		.data		= &core_pipe_limit,
 517		.maxlen		= sizeof(unsigned int),
 518		.mode		= 0644,
 519		.proc_handler	= proc_dointvec,
 520	},
 521#endif
 522#ifdef CONFIG_PROC_SYSCTL
 523	{
 524		.procname	= "tainted",
 525		.maxlen 	= sizeof(long),
 526		.mode		= 0644,
 527		.proc_handler	= proc_taint,
 528	},
 529	{
 530		.procname	= "sysctl_writes_strict",
 531		.data		= &sysctl_writes_strict,
 532		.maxlen		= sizeof(int),
 533		.mode		= 0644,
 534		.proc_handler	= proc_dointvec_minmax,
 535		.extra1		= &neg_one,
 536		.extra2		= &one,
 537	},
 538#endif
 539#ifdef CONFIG_LATENCYTOP
 540	{
 541		.procname	= "latencytop",
 542		.data		= &latencytop_enabled,
 543		.maxlen		= sizeof(int),
 544		.mode		= 0644,
 545		.proc_handler	= sysctl_latencytop,
 546	},
 547#endif
 548#ifdef CONFIG_BLK_DEV_INITRD
 549	{
 550		.procname	= "real-root-dev",
 551		.data		= &real_root_dev,
 552		.maxlen		= sizeof(int),
 553		.mode		= 0644,
 554		.proc_handler	= proc_dointvec,
 555	},
 556#endif
 557	{
 558		.procname	= "print-fatal-signals",
 559		.data		= &print_fatal_signals,
 560		.maxlen		= sizeof(int),
 561		.mode		= 0644,
 562		.proc_handler	= proc_dointvec,
 563	},
 564#ifdef CONFIG_SPARC
 565	{
 566		.procname	= "reboot-cmd",
 567		.data		= reboot_command,
 568		.maxlen		= 256,
 569		.mode		= 0644,
 570		.proc_handler	= proc_dostring,
 571	},
 572	{
 573		.procname	= "stop-a",
 574		.data		= &stop_a_enabled,
 575		.maxlen		= sizeof (int),
 576		.mode		= 0644,
 577		.proc_handler	= proc_dointvec,
 578	},
 579	{
 580		.procname	= "scons-poweroff",
 581		.data		= &scons_pwroff,
 582		.maxlen		= sizeof (int),
 583		.mode		= 0644,
 584		.proc_handler	= proc_dointvec,
 585	},
 586#endif
 587#ifdef CONFIG_SPARC64
 588	{
 589		.procname	= "tsb-ratio",
 590		.data		= &sysctl_tsb_ratio,
 591		.maxlen		= sizeof (int),
 592		.mode		= 0644,
 593		.proc_handler	= proc_dointvec,
 594	},
 595#endif
 596#ifdef __hppa__
 597	{
 598		.procname	= "soft-power",
 599		.data		= &pwrsw_enabled,
 600		.maxlen		= sizeof (int),
 601	 	.mode		= 0644,
 602		.proc_handler	= proc_dointvec,
 603	},
 604#endif
 605#ifdef CONFIG_SYSCTL_ARCH_UNALIGN_ALLOW
 606	{
 607		.procname	= "unaligned-trap",
 608		.data		= &unaligned_enabled,
 609		.maxlen		= sizeof (int),
 610		.mode		= 0644,
 611		.proc_handler	= proc_dointvec,
 612	},
 613#endif
 614	{
 615		.procname	= "ctrl-alt-del",
 616		.data		= &C_A_D,
 617		.maxlen		= sizeof(int),
 618		.mode		= 0644,
 619		.proc_handler	= proc_dointvec,
 620	},
 621#ifdef CONFIG_FUNCTION_TRACER
 622	{
 623		.procname	= "ftrace_enabled",
 624		.data		= &ftrace_enabled,
 625		.maxlen		= sizeof(int),
 626		.mode		= 0644,
 627		.proc_handler	= ftrace_enable_sysctl,
 628	},
 629#endif
 630#ifdef CONFIG_STACK_TRACER
 631	{
 632		.procname	= "stack_tracer_enabled",
 633		.data		= &stack_tracer_enabled,
 634		.maxlen		= sizeof(int),
 635		.mode		= 0644,
 636		.proc_handler	= stack_trace_sysctl,
 637	},
 638#endif
 639#ifdef CONFIG_TRACING
 640	{
 641		.procname	= "ftrace_dump_on_oops",
 642		.data		= &ftrace_dump_on_oops,
 643		.maxlen		= sizeof(int),
 644		.mode		= 0644,
 645		.proc_handler	= proc_dointvec,
 646	},
 647	{
 648		.procname	= "traceoff_on_warning",
 649		.data		= &__disable_trace_on_warning,
 650		.maxlen		= sizeof(__disable_trace_on_warning),
 651		.mode		= 0644,
 652		.proc_handler	= proc_dointvec,
 653	},
 654	{
 655		.procname	= "tracepoint_printk",
 656		.data		= &tracepoint_printk,
 657		.maxlen		= sizeof(tracepoint_printk),
 658		.mode		= 0644,
 659		.proc_handler	= tracepoint_printk_sysctl,
 660	},
 661#endif
 662#ifdef CONFIG_KEXEC_CORE
 663	{
 664		.procname	= "kexec_load_disabled",
 665		.data		= &kexec_load_disabled,
 666		.maxlen		= sizeof(int),
 667		.mode		= 0644,
 668		/* only handle a transition from default "0" to "1" */
 669		.proc_handler	= proc_dointvec_minmax,
 670		.extra1		= &one,
 671		.extra2		= &one,
 672	},
 673#endif
 674#ifdef CONFIG_MODULES
 675	{
 676		.procname	= "modprobe",
 677		.data		= &modprobe_path,
 678		.maxlen		= KMOD_PATH_LEN,
 679		.mode		= 0644,
 680		.proc_handler	= proc_dostring,
 681	},
 682	{
 683		.procname	= "modules_disabled",
 684		.data		= &modules_disabled,
 685		.maxlen		= sizeof(int),
 686		.mode		= 0644,
 687		/* only handle a transition from default "0" to "1" */
 688		.proc_handler	= proc_dointvec_minmax,
 689		.extra1		= &one,
 690		.extra2		= &one,
 691	},
 692#endif
 693#ifdef CONFIG_UEVENT_HELPER
 694	{
 695		.procname	= "hotplug",
 696		.data		= &uevent_helper,
 697		.maxlen		= UEVENT_HELPER_PATH_LEN,
 698		.mode		= 0644,
 699		.proc_handler	= proc_dostring,
 700	},
 701#endif
 702#ifdef CONFIG_CHR_DEV_SG
 703	{
 704		.procname	= "sg-big-buff",
 705		.data		= &sg_big_buff,
 706		.maxlen		= sizeof (int),
 707		.mode		= 0444,
 708		.proc_handler	= proc_dointvec,
 709	},
 710#endif
 711#ifdef CONFIG_BSD_PROCESS_ACCT
 712	{
 713		.procname	= "acct",
 714		.data		= &acct_parm,
 715		.maxlen		= 3*sizeof(int),
 716		.mode		= 0644,
 717		.proc_handler	= proc_dointvec,
 718	},
 719#endif
 720#ifdef CONFIG_MAGIC_SYSRQ
 721	{
 722		.procname	= "sysrq",
 723		.data		= &__sysrq_enabled,
 724		.maxlen		= sizeof (int),
 725		.mode		= 0644,
 726		.proc_handler	= sysrq_sysctl_handler,
 727	},
 728#endif
 729#ifdef CONFIG_PROC_SYSCTL
 730	{
 731		.procname	= "cad_pid",
 732		.data		= NULL,
 733		.maxlen		= sizeof (int),
 734		.mode		= 0600,
 735		.proc_handler	= proc_do_cad_pid,
 736	},
 737#endif
 738	{
 739		.procname	= "threads-max",
 740		.data		= NULL,
 741		.maxlen		= sizeof(int),
 742		.mode		= 0644,
 743		.proc_handler	= sysctl_max_threads,
 744	},
 745	{
 746		.procname	= "random",
 747		.mode		= 0555,
 748		.child		= random_table,
 749	},
 750	{
 751		.procname	= "usermodehelper",
 752		.mode		= 0555,
 753		.child		= usermodehelper_table,
 754	},
 755#ifdef CONFIG_FW_LOADER_USER_HELPER
 756	{
 757		.procname	= "firmware_config",
 758		.mode		= 0555,
 759		.child		= firmware_config_table,
 760	},
 761#endif
 762	{
 763		.procname	= "overflowuid",
 764		.data		= &overflowuid,
 765		.maxlen		= sizeof(int),
 766		.mode		= 0644,
 767		.proc_handler	= proc_dointvec_minmax,
 768		.extra1		= &minolduid,
 769		.extra2		= &maxolduid,
 770	},
 771	{
 772		.procname	= "overflowgid",
 773		.data		= &overflowgid,
 774		.maxlen		= sizeof(int),
 775		.mode		= 0644,
 776		.proc_handler	= proc_dointvec_minmax,
 777		.extra1		= &minolduid,
 778		.extra2		= &maxolduid,
 779	},
 780#ifdef CONFIG_S390
 781#ifdef CONFIG_MATHEMU
 782	{
 783		.procname	= "ieee_emulation_warnings",
 784		.data		= &sysctl_ieee_emulation_warnings,
 785		.maxlen		= sizeof(int),
 786		.mode		= 0644,
 787		.proc_handler	= proc_dointvec,
 788	},
 789#endif
 790	{
 791		.procname	= "userprocess_debug",
 792		.data		= &show_unhandled_signals,
 793		.maxlen		= sizeof(int),
 794		.mode		= 0644,
 795		.proc_handler	= proc_dointvec,
 796	},
 797#endif
 798	{
 799		.procname	= "pid_max",
 800		.data		= &pid_max,
 801		.maxlen		= sizeof (int),
 802		.mode		= 0644,
 803		.proc_handler	= proc_dointvec_minmax,
 804		.extra1		= &pid_max_min,
 805		.extra2		= &pid_max_max,
 806	},
 807	{
 808		.procname	= "panic_on_oops",
 809		.data		= &panic_on_oops,
 810		.maxlen		= sizeof(int),
 811		.mode		= 0644,
 812		.proc_handler	= proc_dointvec,
 813	},
 814#if defined CONFIG_PRINTK
 815	{
 816		.procname	= "printk",
 817		.data		= &console_loglevel,
 818		.maxlen		= 4*sizeof(int),
 819		.mode		= 0644,
 820		.proc_handler	= proc_dointvec,
 821	},
 822	{
 823		.procname	= "printk_ratelimit",
 824		.data		= &printk_ratelimit_state.interval,
 825		.maxlen		= sizeof(int),
 826		.mode		= 0644,
 827		.proc_handler	= proc_dointvec_jiffies,
 828	},
 829	{
 830		.procname	= "printk_ratelimit_burst",
 831		.data		= &printk_ratelimit_state.burst,
 832		.maxlen		= sizeof(int),
 833		.mode		= 0644,
 834		.proc_handler	= proc_dointvec,
 835	},
 836	{
 837		.procname	= "printk_delay",
 838		.data		= &printk_delay_msec,
 839		.maxlen		= sizeof(int),
 840		.mode		= 0644,
 841		.proc_handler	= proc_dointvec_minmax,
 842		.extra1		= &zero,
 843		.extra2		= &ten_thousand,
 844	},
 845	{
 846		.procname	= "printk_devkmsg",
 847		.data		= devkmsg_log_str,
 848		.maxlen		= DEVKMSG_STR_MAX_SIZE,
 849		.mode		= 0644,
 850		.proc_handler	= devkmsg_sysctl_set_loglvl,
 851	},
 852	{
 853		.procname	= "dmesg_restrict",
 854		.data		= &dmesg_restrict,
 855		.maxlen		= sizeof(int),
 856		.mode		= 0644,
 857		.proc_handler	= proc_dointvec_minmax_sysadmin,
 858		.extra1		= &zero,
 859		.extra2		= &one,
 860	},
 861	{
 862		.procname	= "kptr_restrict",
 863		.data		= &kptr_restrict,
 864		.maxlen		= sizeof(int),
 865		.mode		= 0644,
 866		.proc_handler	= proc_dointvec_minmax_sysadmin,
 867		.extra1		= &zero,
 868		.extra2		= &two,
 869	},
 870#endif
 871	{
 872		.procname	= "ngroups_max",
 873		.data		= &ngroups_max,
 874		.maxlen		= sizeof (int),
 875		.mode		= 0444,
 876		.proc_handler	= proc_dointvec,
 877	},
 878	{
 879		.procname	= "cap_last_cap",
 880		.data		= (void *)&cap_last_cap,
 881		.maxlen		= sizeof(int),
 882		.mode		= 0444,
 883		.proc_handler	= proc_dointvec,
 884	},
 885#if defined(CONFIG_LOCKUP_DETECTOR)
 886	{
 887		.procname       = "watchdog",
 888		.data		= &watchdog_user_enabled,
 889		.maxlen		= sizeof(int),
 890		.mode		= 0644,
 891		.proc_handler   = proc_watchdog,
 892		.extra1		= &zero,
 893		.extra2		= &one,
 894	},
 895	{
 896		.procname	= "watchdog_thresh",
 897		.data		= &watchdog_thresh,
 898		.maxlen		= sizeof(int),
 899		.mode		= 0644,
 900		.proc_handler	= proc_watchdog_thresh,
 901		.extra1		= &zero,
 902		.extra2		= &sixty,
 903	},
 904	{
 905		.procname       = "nmi_watchdog",
 906		.data		= &nmi_watchdog_user_enabled,
 907		.maxlen		= sizeof(int),
 908		.mode		= NMI_WATCHDOG_SYSCTL_PERM,
 909		.proc_handler   = proc_nmi_watchdog,
 910		.extra1		= &zero,
 
 
 
 
 
 
 
 
 
 
 
 
 
 911		.extra2		= &one,
 912	},
 913	{
 914		.procname	= "watchdog_cpumask",
 915		.data		= &watchdog_cpumask_bits,
 916		.maxlen		= NR_CPUS,
 917		.mode		= 0644,
 918		.proc_handler	= proc_watchdog_cpumask,
 919	},
 920#ifdef CONFIG_SOFTLOCKUP_DETECTOR
 921	{
 922		.procname       = "soft_watchdog",
 923		.data		= &soft_watchdog_user_enabled,
 924		.maxlen		= sizeof(int),
 925		.mode		= 0644,
 926		.proc_handler   = proc_soft_watchdog,
 927		.extra1		= &zero,
 928		.extra2		= &one,
 929	},
 930	{
 931		.procname	= "softlockup_panic",
 932		.data		= &softlockup_panic,
 933		.maxlen		= sizeof(int),
 934		.mode		= 0644,
 935		.proc_handler	= proc_dointvec_minmax,
 936		.extra1		= &zero,
 937		.extra2		= &one,
 938	},
 939#ifdef CONFIG_SMP
 940	{
 941		.procname	= "softlockup_all_cpu_backtrace",
 942		.data		= &sysctl_softlockup_all_cpu_backtrace,
 943		.maxlen		= sizeof(int),
 944		.mode		= 0644,
 945		.proc_handler	= proc_dointvec_minmax,
 946		.extra1		= &zero,
 947		.extra2		= &one,
 948	},
 949#endif /* CONFIG_SMP */
 950#endif
 951#ifdef CONFIG_HARDLOCKUP_DETECTOR
 952	{
 953		.procname	= "hardlockup_panic",
 954		.data		= &hardlockup_panic,
 955		.maxlen		= sizeof(int),
 956		.mode		= 0644,
 957		.proc_handler	= proc_dointvec_minmax,
 958		.extra1		= &zero,
 959		.extra2		= &one,
 960	},
 961#ifdef CONFIG_SMP
 962	{
 963		.procname	= "hardlockup_all_cpu_backtrace",
 964		.data		= &sysctl_hardlockup_all_cpu_backtrace,
 965		.maxlen		= sizeof(int),
 966		.mode		= 0644,
 967		.proc_handler	= proc_dointvec_minmax,
 968		.extra1		= &zero,
 969		.extra2		= &one,
 970	},
 971#endif /* CONFIG_SMP */
 972#endif
 973#endif
 974
 975#if defined(CONFIG_X86_LOCAL_APIC) && defined(CONFIG_X86)
 976	{
 977		.procname       = "unknown_nmi_panic",
 978		.data           = &unknown_nmi_panic,
 979		.maxlen         = sizeof (int),
 980		.mode           = 0644,
 981		.proc_handler   = proc_dointvec,
 982	},
 983#endif
 984#if defined(CONFIG_X86)
 985	{
 986		.procname	= "panic_on_unrecovered_nmi",
 987		.data		= &panic_on_unrecovered_nmi,
 988		.maxlen		= sizeof(int),
 989		.mode		= 0644,
 990		.proc_handler	= proc_dointvec,
 991	},
 992	{
 993		.procname	= "panic_on_io_nmi",
 994		.data		= &panic_on_io_nmi,
 995		.maxlen		= sizeof(int),
 996		.mode		= 0644,
 997		.proc_handler	= proc_dointvec,
 998	},
 999#ifdef CONFIG_DEBUG_STACKOVERFLOW
1000	{
1001		.procname	= "panic_on_stackoverflow",
1002		.data		= &sysctl_panic_on_stackoverflow,
1003		.maxlen		= sizeof(int),
1004		.mode		= 0644,
1005		.proc_handler	= proc_dointvec,
1006	},
1007#endif
1008	{
1009		.procname	= "bootloader_type",
1010		.data		= &bootloader_type,
1011		.maxlen		= sizeof (int),
1012		.mode		= 0444,
1013		.proc_handler	= proc_dointvec,
1014	},
1015	{
1016		.procname	= "bootloader_version",
1017		.data		= &bootloader_version,
1018		.maxlen		= sizeof (int),
1019		.mode		= 0444,
1020		.proc_handler	= proc_dointvec,
1021	},
1022	{
1023		.procname	= "io_delay_type",
1024		.data		= &io_delay_type,
1025		.maxlen		= sizeof(int),
1026		.mode		= 0644,
1027		.proc_handler	= proc_dointvec,
1028	},
1029#endif
1030#if defined(CONFIG_MMU)
1031	{
1032		.procname	= "randomize_va_space",
1033		.data		= &randomize_va_space,
1034		.maxlen		= sizeof(int),
1035		.mode		= 0644,
1036		.proc_handler	= proc_dointvec,
1037	},
1038#endif
1039#if defined(CONFIG_S390) && defined(CONFIG_SMP)
1040	{
1041		.procname	= "spin_retry",
1042		.data		= &spin_retry,
1043		.maxlen		= sizeof (int),
1044		.mode		= 0644,
1045		.proc_handler	= proc_dointvec,
1046	},
1047#endif
1048#if	defined(CONFIG_ACPI_SLEEP) && defined(CONFIG_X86)
1049	{
1050		.procname	= "acpi_video_flags",
1051		.data		= &acpi_realmode_flags,
1052		.maxlen		= sizeof (unsigned long),
1053		.mode		= 0644,
1054		.proc_handler	= proc_doulongvec_minmax,
1055	},
1056#endif
1057#ifdef CONFIG_SYSCTL_ARCH_UNALIGN_NO_WARN
1058	{
1059		.procname	= "ignore-unaligned-usertrap",
1060		.data		= &no_unaligned_warning,
1061		.maxlen		= sizeof (int),
1062	 	.mode		= 0644,
1063		.proc_handler	= proc_dointvec,
1064	},
1065#endif
1066#ifdef CONFIG_IA64
1067	{
1068		.procname	= "unaligned-dump-stack",
1069		.data		= &unaligned_dump_stack,
1070		.maxlen		= sizeof (int),
1071		.mode		= 0644,
1072		.proc_handler	= proc_dointvec,
1073	},
1074#endif
1075#ifdef CONFIG_DETECT_HUNG_TASK
1076	{
1077		.procname	= "hung_task_panic",
1078		.data		= &sysctl_hung_task_panic,
1079		.maxlen		= sizeof(int),
1080		.mode		= 0644,
1081		.proc_handler	= proc_dointvec_minmax,
1082		.extra1		= &zero,
1083		.extra2		= &one,
1084	},
1085	{
1086		.procname	= "hung_task_check_count",
1087		.data		= &sysctl_hung_task_check_count,
1088		.maxlen		= sizeof(int),
1089		.mode		= 0644,
1090		.proc_handler	= proc_dointvec_minmax,
1091		.extra1		= &zero,
1092	},
1093	{
1094		.procname	= "hung_task_timeout_secs",
1095		.data		= &sysctl_hung_task_timeout_secs,
1096		.maxlen		= sizeof(unsigned long),
1097		.mode		= 0644,
1098		.proc_handler	= proc_dohung_task_timeout_secs,
1099		.extra2		= &hung_task_timeout_max,
1100	},
1101	{
1102		.procname	= "hung_task_warnings",
1103		.data		= &sysctl_hung_task_warnings,
1104		.maxlen		= sizeof(int),
1105		.mode		= 0644,
1106		.proc_handler	= proc_dointvec_minmax,
1107		.extra1		= &neg_one,
1108	},
1109#endif
1110#ifdef CONFIG_RT_MUTEXES
1111	{
1112		.procname	= "max_lock_depth",
1113		.data		= &max_lock_depth,
1114		.maxlen		= sizeof(int),
1115		.mode		= 0644,
1116		.proc_handler	= proc_dointvec,
1117	},
1118#endif
1119	{
1120		.procname	= "poweroff_cmd",
1121		.data		= &poweroff_cmd,
1122		.maxlen		= POWEROFF_CMD_PATH_LEN,
1123		.mode		= 0644,
1124		.proc_handler	= proc_dostring,
1125	},
1126#ifdef CONFIG_KEYS
1127	{
1128		.procname	= "keys",
1129		.mode		= 0555,
1130		.child		= key_sysctls,
1131	},
1132#endif
1133#ifdef CONFIG_PERF_EVENTS
1134	/*
1135	 * User-space scripts rely on the existence of this file
1136	 * as a feature check for perf_events being enabled.
1137	 *
1138	 * So it's an ABI, do not remove!
1139	 */
1140	{
1141		.procname	= "perf_event_paranoid",
1142		.data		= &sysctl_perf_event_paranoid,
1143		.maxlen		= sizeof(sysctl_perf_event_paranoid),
1144		.mode		= 0644,
1145		.proc_handler	= proc_dointvec,
1146	},
1147	{
1148		.procname	= "perf_event_mlock_kb",
1149		.data		= &sysctl_perf_event_mlock,
1150		.maxlen		= sizeof(sysctl_perf_event_mlock),
1151		.mode		= 0644,
1152		.proc_handler	= proc_dointvec,
1153	},
1154	{
1155		.procname	= "perf_event_max_sample_rate",
1156		.data		= &sysctl_perf_event_sample_rate,
1157		.maxlen		= sizeof(sysctl_perf_event_sample_rate),
1158		.mode		= 0644,
1159		.proc_handler	= perf_proc_update_handler,
1160		.extra1		= &one,
1161	},
1162	{
1163		.procname	= "perf_cpu_time_max_percent",
1164		.data		= &sysctl_perf_cpu_time_max_percent,
1165		.maxlen		= sizeof(sysctl_perf_cpu_time_max_percent),
1166		.mode		= 0644,
1167		.proc_handler	= perf_cpu_time_max_percent_handler,
1168		.extra1		= &zero,
1169		.extra2		= &one_hundred,
1170	},
1171	{
1172		.procname	= "perf_event_max_stack",
1173		.data		= &sysctl_perf_event_max_stack,
1174		.maxlen		= sizeof(sysctl_perf_event_max_stack),
1175		.mode		= 0644,
1176		.proc_handler	= perf_event_max_stack_handler,
1177		.extra1		= &zero,
1178		.extra2		= &six_hundred_forty_kb,
1179	},
1180	{
1181		.procname	= "perf_event_max_contexts_per_stack",
1182		.data		= &sysctl_perf_event_max_contexts_per_stack,
1183		.maxlen		= sizeof(sysctl_perf_event_max_contexts_per_stack),
1184		.mode		= 0644,
1185		.proc_handler	= perf_event_max_stack_handler,
1186		.extra1		= &zero,
1187		.extra2		= &one_thousand,
1188	},
1189#endif
 
 
 
 
 
 
 
 
 
1190	{
1191		.procname	= "panic_on_warn",
1192		.data		= &panic_on_warn,
1193		.maxlen		= sizeof(int),
1194		.mode		= 0644,
1195		.proc_handler	= proc_dointvec_minmax,
1196		.extra1		= &zero,
1197		.extra2		= &one,
1198	},
1199#if defined(CONFIG_SMP) && defined(CONFIG_NO_HZ_COMMON)
1200	{
1201		.procname	= "timer_migration",
1202		.data		= &sysctl_timer_migration,
1203		.maxlen		= sizeof(unsigned int),
1204		.mode		= 0644,
1205		.proc_handler	= timer_migration_handler,
1206		.extra1		= &zero,
1207		.extra2		= &one,
1208	},
1209#endif
1210#ifdef CONFIG_BPF_SYSCALL
1211	{
1212		.procname	= "unprivileged_bpf_disabled",
1213		.data		= &sysctl_unprivileged_bpf_disabled,
1214		.maxlen		= sizeof(sysctl_unprivileged_bpf_disabled),
1215		.mode		= 0644,
1216		/* only handle a transition from default "0" to "1" */
1217		.proc_handler	= proc_dointvec_minmax,
1218		.extra1		= &one,
1219		.extra2		= &one,
1220	},
1221#endif
1222#if defined(CONFIG_TREE_RCU) || defined(CONFIG_PREEMPT_RCU)
1223	{
1224		.procname	= "panic_on_rcu_stall",
1225		.data		= &sysctl_panic_on_rcu_stall,
1226		.maxlen		= sizeof(sysctl_panic_on_rcu_stall),
1227		.mode		= 0644,
1228		.proc_handler	= proc_dointvec_minmax,
1229		.extra1		= &zero,
1230		.extra2		= &one,
1231	},
1232#endif
1233	{ }
1234};
1235
1236static struct ctl_table vm_table[] = {
1237	{
1238		.procname	= "overcommit_memory",
1239		.data		= &sysctl_overcommit_memory,
1240		.maxlen		= sizeof(sysctl_overcommit_memory),
1241		.mode		= 0644,
1242		.proc_handler	= proc_dointvec_minmax,
1243		.extra1		= &zero,
1244		.extra2		= &two,
1245	},
1246	{
1247		.procname	= "panic_on_oom",
1248		.data		= &sysctl_panic_on_oom,
1249		.maxlen		= sizeof(sysctl_panic_on_oom),
1250		.mode		= 0644,
1251		.proc_handler	= proc_dointvec_minmax,
1252		.extra1		= &zero,
1253		.extra2		= &two,
1254	},
1255	{
1256		.procname	= "oom_kill_allocating_task",
1257		.data		= &sysctl_oom_kill_allocating_task,
1258		.maxlen		= sizeof(sysctl_oom_kill_allocating_task),
1259		.mode		= 0644,
1260		.proc_handler	= proc_dointvec,
1261	},
1262	{
1263		.procname	= "oom_dump_tasks",
1264		.data		= &sysctl_oom_dump_tasks,
1265		.maxlen		= sizeof(sysctl_oom_dump_tasks),
1266		.mode		= 0644,
1267		.proc_handler	= proc_dointvec,
1268	},
1269	{
1270		.procname	= "overcommit_ratio",
1271		.data		= &sysctl_overcommit_ratio,
1272		.maxlen		= sizeof(sysctl_overcommit_ratio),
1273		.mode		= 0644,
1274		.proc_handler	= overcommit_ratio_handler,
1275	},
1276	{
1277		.procname	= "overcommit_kbytes",
1278		.data		= &sysctl_overcommit_kbytes,
1279		.maxlen		= sizeof(sysctl_overcommit_kbytes),
1280		.mode		= 0644,
1281		.proc_handler	= overcommit_kbytes_handler,
1282	},
1283	{
1284		.procname	= "page-cluster", 
1285		.data		= &page_cluster,
1286		.maxlen		= sizeof(int),
1287		.mode		= 0644,
1288		.proc_handler	= proc_dointvec_minmax,
1289		.extra1		= &zero,
1290	},
1291	{
1292		.procname	= "dirty_background_ratio",
1293		.data		= &dirty_background_ratio,
1294		.maxlen		= sizeof(dirty_background_ratio),
1295		.mode		= 0644,
1296		.proc_handler	= dirty_background_ratio_handler,
1297		.extra1		= &zero,
1298		.extra2		= &one_hundred,
1299	},
1300	{
1301		.procname	= "dirty_background_bytes",
1302		.data		= &dirty_background_bytes,
1303		.maxlen		= sizeof(dirty_background_bytes),
1304		.mode		= 0644,
1305		.proc_handler	= dirty_background_bytes_handler,
1306		.extra1		= &one_ul,
1307	},
1308	{
1309		.procname	= "dirty_ratio",
1310		.data		= &vm_dirty_ratio,
1311		.maxlen		= sizeof(vm_dirty_ratio),
1312		.mode		= 0644,
1313		.proc_handler	= dirty_ratio_handler,
1314		.extra1		= &zero,
1315		.extra2		= &one_hundred,
1316	},
1317	{
1318		.procname	= "dirty_bytes",
1319		.data		= &vm_dirty_bytes,
1320		.maxlen		= sizeof(vm_dirty_bytes),
1321		.mode		= 0644,
1322		.proc_handler	= dirty_bytes_handler,
1323		.extra1		= &dirty_bytes_min,
1324	},
1325	{
1326		.procname	= "dirty_writeback_centisecs",
1327		.data		= &dirty_writeback_interval,
1328		.maxlen		= sizeof(dirty_writeback_interval),
1329		.mode		= 0644,
1330		.proc_handler	= dirty_writeback_centisecs_handler,
1331	},
1332	{
1333		.procname	= "dirty_expire_centisecs",
1334		.data		= &dirty_expire_interval,
1335		.maxlen		= sizeof(dirty_expire_interval),
1336		.mode		= 0644,
1337		.proc_handler	= proc_dointvec_minmax,
1338		.extra1		= &zero,
1339	},
1340	{
1341		.procname	= "dirtytime_expire_seconds",
1342		.data		= &dirtytime_expire_interval,
1343		.maxlen		= sizeof(dirtytime_expire_interval),
1344		.mode		= 0644,
1345		.proc_handler	= dirtytime_interval_handler,
1346		.extra1		= &zero,
1347	},
1348	{
 
 
 
 
 
1349		.procname	= "swappiness",
1350		.data		= &vm_swappiness,
1351		.maxlen		= sizeof(vm_swappiness),
1352		.mode		= 0644,
1353		.proc_handler	= proc_dointvec_minmax,
1354		.extra1		= &zero,
1355		.extra2		= &one_hundred,
1356	},
1357#ifdef CONFIG_HUGETLB_PAGE
1358	{
1359		.procname	= "nr_hugepages",
1360		.data		= NULL,
1361		.maxlen		= sizeof(unsigned long),
1362		.mode		= 0644,
1363		.proc_handler	= hugetlb_sysctl_handler,
1364	},
1365#ifdef CONFIG_NUMA
1366	{
1367		.procname       = "nr_hugepages_mempolicy",
1368		.data           = NULL,
1369		.maxlen         = sizeof(unsigned long),
1370		.mode           = 0644,
1371		.proc_handler   = &hugetlb_mempolicy_sysctl_handler,
1372	},
1373	{
1374		.procname		= "numa_stat",
1375		.data			= &sysctl_vm_numa_stat,
1376		.maxlen			= sizeof(int),
1377		.mode			= 0644,
1378		.proc_handler	= sysctl_vm_numa_stat_handler,
1379		.extra1			= &zero,
1380		.extra2			= &one,
1381	},
1382#endif
1383	 {
1384		.procname	= "hugetlb_shm_group",
1385		.data		= &sysctl_hugetlb_shm_group,
1386		.maxlen		= sizeof(gid_t),
1387		.mode		= 0644,
1388		.proc_handler	= proc_dointvec,
1389	 },
 
 
 
 
 
 
 
1390	{
1391		.procname	= "nr_overcommit_hugepages",
1392		.data		= NULL,
1393		.maxlen		= sizeof(unsigned long),
1394		.mode		= 0644,
1395		.proc_handler	= hugetlb_overcommit_handler,
1396	},
1397#endif
1398	{
1399		.procname	= "lowmem_reserve_ratio",
1400		.data		= &sysctl_lowmem_reserve_ratio,
1401		.maxlen		= sizeof(sysctl_lowmem_reserve_ratio),
1402		.mode		= 0644,
1403		.proc_handler	= lowmem_reserve_ratio_sysctl_handler,
1404	},
1405	{
1406		.procname	= "drop_caches",
1407		.data		= &sysctl_drop_caches,
1408		.maxlen		= sizeof(int),
1409		.mode		= 0644,
1410		.proc_handler	= drop_caches_sysctl_handler,
1411		.extra1		= &one,
1412		.extra2		= &four,
1413	},
1414#ifdef CONFIG_COMPACTION
1415	{
1416		.procname	= "compact_memory",
1417		.data		= &sysctl_compact_memory,
1418		.maxlen		= sizeof(int),
1419		.mode		= 0200,
1420		.proc_handler	= sysctl_compaction_handler,
1421	},
1422	{
1423		.procname	= "extfrag_threshold",
1424		.data		= &sysctl_extfrag_threshold,
1425		.maxlen		= sizeof(int),
1426		.mode		= 0644,
1427		.proc_handler	= sysctl_extfrag_handler,
1428		.extra1		= &min_extfrag_threshold,
1429		.extra2		= &max_extfrag_threshold,
1430	},
1431	{
1432		.procname	= "compact_unevictable_allowed",
1433		.data		= &sysctl_compact_unevictable_allowed,
1434		.maxlen		= sizeof(int),
1435		.mode		= 0644,
1436		.proc_handler	= proc_dointvec,
1437		.extra1		= &zero,
1438		.extra2		= &one,
1439	},
1440
1441#endif /* CONFIG_COMPACTION */
1442	{
1443		.procname	= "min_free_kbytes",
1444		.data		= &min_free_kbytes,
1445		.maxlen		= sizeof(min_free_kbytes),
1446		.mode		= 0644,
1447		.proc_handler	= min_free_kbytes_sysctl_handler,
1448		.extra1		= &zero,
1449	},
1450	{
1451		.procname	= "watermark_scale_factor",
1452		.data		= &watermark_scale_factor,
1453		.maxlen		= sizeof(watermark_scale_factor),
1454		.mode		= 0644,
1455		.proc_handler	= watermark_scale_factor_sysctl_handler,
1456		.extra1		= &one,
1457		.extra2		= &one_thousand,
1458	},
1459	{
1460		.procname	= "percpu_pagelist_fraction",
1461		.data		= &percpu_pagelist_fraction,
1462		.maxlen		= sizeof(percpu_pagelist_fraction),
1463		.mode		= 0644,
1464		.proc_handler	= percpu_pagelist_fraction_sysctl_handler,
1465		.extra1		= &zero,
1466	},
1467#ifdef CONFIG_MMU
1468	{
1469		.procname	= "max_map_count",
1470		.data		= &sysctl_max_map_count,
1471		.maxlen		= sizeof(sysctl_max_map_count),
1472		.mode		= 0644,
1473		.proc_handler	= proc_dointvec_minmax,
1474		.extra1		= &zero,
1475	},
1476#else
1477	{
1478		.procname	= "nr_trim_pages",
1479		.data		= &sysctl_nr_trim_pages,
1480		.maxlen		= sizeof(sysctl_nr_trim_pages),
1481		.mode		= 0644,
1482		.proc_handler	= proc_dointvec_minmax,
1483		.extra1		= &zero,
1484	},
1485#endif
1486	{
1487		.procname	= "laptop_mode",
1488		.data		= &laptop_mode,
1489		.maxlen		= sizeof(laptop_mode),
1490		.mode		= 0644,
1491		.proc_handler	= proc_dointvec_jiffies,
1492	},
1493	{
1494		.procname	= "block_dump",
1495		.data		= &block_dump,
1496		.maxlen		= sizeof(block_dump),
1497		.mode		= 0644,
1498		.proc_handler	= proc_dointvec,
1499		.extra1		= &zero,
1500	},
1501	{
1502		.procname	= "vfs_cache_pressure",
1503		.data		= &sysctl_vfs_cache_pressure,
1504		.maxlen		= sizeof(sysctl_vfs_cache_pressure),
1505		.mode		= 0644,
1506		.proc_handler	= proc_dointvec,
1507		.extra1		= &zero,
1508	},
1509#ifdef HAVE_ARCH_PICK_MMAP_LAYOUT
1510	{
1511		.procname	= "legacy_va_layout",
1512		.data		= &sysctl_legacy_va_layout,
1513		.maxlen		= sizeof(sysctl_legacy_va_layout),
1514		.mode		= 0644,
1515		.proc_handler	= proc_dointvec,
1516		.extra1		= &zero,
1517	},
1518#endif
1519#ifdef CONFIG_NUMA
1520	{
1521		.procname	= "zone_reclaim_mode",
1522		.data		= &node_reclaim_mode,
1523		.maxlen		= sizeof(node_reclaim_mode),
1524		.mode		= 0644,
1525		.proc_handler	= proc_dointvec,
1526		.extra1		= &zero,
1527	},
1528	{
1529		.procname	= "min_unmapped_ratio",
1530		.data		= &sysctl_min_unmapped_ratio,
1531		.maxlen		= sizeof(sysctl_min_unmapped_ratio),
1532		.mode		= 0644,
1533		.proc_handler	= sysctl_min_unmapped_ratio_sysctl_handler,
1534		.extra1		= &zero,
1535		.extra2		= &one_hundred,
1536	},
1537	{
1538		.procname	= "min_slab_ratio",
1539		.data		= &sysctl_min_slab_ratio,
1540		.maxlen		= sizeof(sysctl_min_slab_ratio),
1541		.mode		= 0644,
1542		.proc_handler	= sysctl_min_slab_ratio_sysctl_handler,
1543		.extra1		= &zero,
1544		.extra2		= &one_hundred,
1545	},
1546#endif
1547#ifdef CONFIG_SMP
1548	{
1549		.procname	= "stat_interval",
1550		.data		= &sysctl_stat_interval,
1551		.maxlen		= sizeof(sysctl_stat_interval),
1552		.mode		= 0644,
1553		.proc_handler	= proc_dointvec_jiffies,
1554	},
1555	{
1556		.procname	= "stat_refresh",
1557		.data		= NULL,
1558		.maxlen		= 0,
1559		.mode		= 0600,
1560		.proc_handler	= vmstat_refresh,
1561	},
1562#endif
1563#ifdef CONFIG_MMU
1564	{
1565		.procname	= "mmap_min_addr",
1566		.data		= &dac_mmap_min_addr,
1567		.maxlen		= sizeof(unsigned long),
1568		.mode		= 0644,
1569		.proc_handler	= mmap_min_addr_handler,
1570	},
1571#endif
1572#ifdef CONFIG_NUMA
1573	{
1574		.procname	= "numa_zonelist_order",
1575		.data		= &numa_zonelist_order,
1576		.maxlen		= NUMA_ZONELIST_ORDER_LEN,
1577		.mode		= 0644,
1578		.proc_handler	= numa_zonelist_order_handler,
1579	},
1580#endif
1581#if (defined(CONFIG_X86_32) && !defined(CONFIG_UML))|| \
1582   (defined(CONFIG_SUPERH) && defined(CONFIG_VSYSCALL))
1583	{
1584		.procname	= "vdso_enabled",
1585#ifdef CONFIG_X86_32
1586		.data		= &vdso32_enabled,
1587		.maxlen		= sizeof(vdso32_enabled),
1588#else
1589		.data		= &vdso_enabled,
1590		.maxlen		= sizeof(vdso_enabled),
1591#endif
1592		.mode		= 0644,
1593		.proc_handler	= proc_dointvec,
1594		.extra1		= &zero,
1595	},
1596#endif
1597#ifdef CONFIG_HIGHMEM
1598	{
1599		.procname	= "highmem_is_dirtyable",
1600		.data		= &vm_highmem_is_dirtyable,
1601		.maxlen		= sizeof(vm_highmem_is_dirtyable),
1602		.mode		= 0644,
1603		.proc_handler	= proc_dointvec_minmax,
1604		.extra1		= &zero,
1605		.extra2		= &one,
1606	},
1607#endif
1608#ifdef CONFIG_MEMORY_FAILURE
1609	{
1610		.procname	= "memory_failure_early_kill",
1611		.data		= &sysctl_memory_failure_early_kill,
1612		.maxlen		= sizeof(sysctl_memory_failure_early_kill),
1613		.mode		= 0644,
1614		.proc_handler	= proc_dointvec_minmax,
1615		.extra1		= &zero,
1616		.extra2		= &one,
1617	},
1618	{
1619		.procname	= "memory_failure_recovery",
1620		.data		= &sysctl_memory_failure_recovery,
1621		.maxlen		= sizeof(sysctl_memory_failure_recovery),
1622		.mode		= 0644,
1623		.proc_handler	= proc_dointvec_minmax,
1624		.extra1		= &zero,
1625		.extra2		= &one,
1626	},
1627#endif
1628	{
1629		.procname	= "user_reserve_kbytes",
1630		.data		= &sysctl_user_reserve_kbytes,
1631		.maxlen		= sizeof(sysctl_user_reserve_kbytes),
1632		.mode		= 0644,
1633		.proc_handler	= proc_doulongvec_minmax,
1634	},
1635	{
1636		.procname	= "admin_reserve_kbytes",
1637		.data		= &sysctl_admin_reserve_kbytes,
1638		.maxlen		= sizeof(sysctl_admin_reserve_kbytes),
1639		.mode		= 0644,
1640		.proc_handler	= proc_doulongvec_minmax,
1641	},
1642#ifdef CONFIG_HAVE_ARCH_MMAP_RND_BITS
1643	{
1644		.procname	= "mmap_rnd_bits",
1645		.data		= &mmap_rnd_bits,
1646		.maxlen		= sizeof(mmap_rnd_bits),
1647		.mode		= 0600,
1648		.proc_handler	= proc_dointvec_minmax,
1649		.extra1		= (void *)&mmap_rnd_bits_min,
1650		.extra2		= (void *)&mmap_rnd_bits_max,
1651	},
1652#endif
1653#ifdef CONFIG_HAVE_ARCH_MMAP_RND_COMPAT_BITS
1654	{
1655		.procname	= "mmap_rnd_compat_bits",
1656		.data		= &mmap_rnd_compat_bits,
1657		.maxlen		= sizeof(mmap_rnd_compat_bits),
1658		.mode		= 0600,
1659		.proc_handler	= proc_dointvec_minmax,
1660		.extra1		= (void *)&mmap_rnd_compat_bits_min,
1661		.extra2		= (void *)&mmap_rnd_compat_bits_max,
1662	},
1663#endif
1664	{ }
1665};
1666
1667static struct ctl_table fs_table[] = {
1668	{
1669		.procname	= "inode-nr",
1670		.data		= &inodes_stat,
1671		.maxlen		= 2*sizeof(long),
1672		.mode		= 0444,
1673		.proc_handler	= proc_nr_inodes,
1674	},
1675	{
1676		.procname	= "inode-state",
1677		.data		= &inodes_stat,
1678		.maxlen		= 7*sizeof(long),
1679		.mode		= 0444,
1680		.proc_handler	= proc_nr_inodes,
1681	},
1682	{
1683		.procname	= "file-nr",
1684		.data		= &files_stat,
1685		.maxlen		= sizeof(files_stat),
1686		.mode		= 0444,
1687		.proc_handler	= proc_nr_files,
1688	},
1689	{
1690		.procname	= "file-max",
1691		.data		= &files_stat.max_files,
1692		.maxlen		= sizeof(files_stat.max_files),
1693		.mode		= 0644,
1694		.proc_handler	= proc_doulongvec_minmax,
1695	},
1696	{
1697		.procname	= "nr_open",
1698		.data		= &sysctl_nr_open,
1699		.maxlen		= sizeof(unsigned int),
1700		.mode		= 0644,
1701		.proc_handler	= proc_dointvec_minmax,
1702		.extra1		= &sysctl_nr_open_min,
1703		.extra2		= &sysctl_nr_open_max,
1704	},
1705	{
1706		.procname	= "dentry-state",
1707		.data		= &dentry_stat,
1708		.maxlen		= 6*sizeof(long),
1709		.mode		= 0444,
1710		.proc_handler	= proc_nr_dentry,
1711	},
1712	{
1713		.procname	= "overflowuid",
1714		.data		= &fs_overflowuid,
1715		.maxlen		= sizeof(int),
1716		.mode		= 0644,
1717		.proc_handler	= proc_dointvec_minmax,
1718		.extra1		= &minolduid,
1719		.extra2		= &maxolduid,
1720	},
1721	{
1722		.procname	= "overflowgid",
1723		.data		= &fs_overflowgid,
1724		.maxlen		= sizeof(int),
1725		.mode		= 0644,
1726		.proc_handler	= proc_dointvec_minmax,
1727		.extra1		= &minolduid,
1728		.extra2		= &maxolduid,
1729	},
1730#ifdef CONFIG_FILE_LOCKING
1731	{
1732		.procname	= "leases-enable",
1733		.data		= &leases_enable,
1734		.maxlen		= sizeof(int),
1735		.mode		= 0644,
1736		.proc_handler	= proc_dointvec,
1737	},
1738#endif
1739#ifdef CONFIG_DNOTIFY
1740	{
1741		.procname	= "dir-notify-enable",
1742		.data		= &dir_notify_enable,
1743		.maxlen		= sizeof(int),
1744		.mode		= 0644,
1745		.proc_handler	= proc_dointvec,
1746	},
1747#endif
1748#ifdef CONFIG_MMU
1749#ifdef CONFIG_FILE_LOCKING
1750	{
1751		.procname	= "lease-break-time",
1752		.data		= &lease_break_time,
1753		.maxlen		= sizeof(int),
1754		.mode		= 0644,
1755		.proc_handler	= proc_dointvec,
1756	},
1757#endif
1758#ifdef CONFIG_AIO
1759	{
1760		.procname	= "aio-nr",
1761		.data		= &aio_nr,
1762		.maxlen		= sizeof(aio_nr),
1763		.mode		= 0444,
1764		.proc_handler	= proc_doulongvec_minmax,
1765	},
1766	{
1767		.procname	= "aio-max-nr",
1768		.data		= &aio_max_nr,
1769		.maxlen		= sizeof(aio_max_nr),
1770		.mode		= 0644,
1771		.proc_handler	= proc_doulongvec_minmax,
1772	},
1773#endif /* CONFIG_AIO */
1774#ifdef CONFIG_INOTIFY_USER
1775	{
1776		.procname	= "inotify",
1777		.mode		= 0555,
1778		.child		= inotify_table,
1779	},
1780#endif	
1781#ifdef CONFIG_EPOLL
1782	{
1783		.procname	= "epoll",
1784		.mode		= 0555,
1785		.child		= epoll_table,
1786	},
1787#endif
1788#endif
1789	{
1790		.procname	= "protected_symlinks",
1791		.data		= &sysctl_protected_symlinks,
1792		.maxlen		= sizeof(int),
1793		.mode		= 0600,
1794		.proc_handler	= proc_dointvec_minmax,
1795		.extra1		= &zero,
1796		.extra2		= &one,
1797	},
1798	{
1799		.procname	= "protected_hardlinks",
1800		.data		= &sysctl_protected_hardlinks,
1801		.maxlen		= sizeof(int),
1802		.mode		= 0600,
1803		.proc_handler	= proc_dointvec_minmax,
1804		.extra1		= &zero,
1805		.extra2		= &one,
1806	},
1807	{
1808		.procname	= "suid_dumpable",
1809		.data		= &suid_dumpable,
1810		.maxlen		= sizeof(int),
1811		.mode		= 0644,
1812		.proc_handler	= proc_dointvec_minmax_coredump,
1813		.extra1		= &zero,
1814		.extra2		= &two,
1815	},
1816#if defined(CONFIG_BINFMT_MISC) || defined(CONFIG_BINFMT_MISC_MODULE)
1817	{
1818		.procname	= "binfmt_misc",
1819		.mode		= 0555,
1820		.child		= sysctl_mount_point,
1821	},
1822#endif
1823	{
1824		.procname	= "pipe-max-size",
1825		.data		= &pipe_max_size,
1826		.maxlen		= sizeof(pipe_max_size),
1827		.mode		= 0644,
1828		.proc_handler	= proc_dopipe_max_size,
 
1829	},
1830	{
1831		.procname	= "pipe-user-pages-hard",
1832		.data		= &pipe_user_pages_hard,
1833		.maxlen		= sizeof(pipe_user_pages_hard),
1834		.mode		= 0644,
1835		.proc_handler	= proc_doulongvec_minmax,
1836	},
1837	{
1838		.procname	= "pipe-user-pages-soft",
1839		.data		= &pipe_user_pages_soft,
1840		.maxlen		= sizeof(pipe_user_pages_soft),
1841		.mode		= 0644,
1842		.proc_handler	= proc_doulongvec_minmax,
1843	},
1844	{
1845		.procname	= "mount-max",
1846		.data		= &sysctl_mount_max,
1847		.maxlen		= sizeof(unsigned int),
1848		.mode		= 0644,
1849		.proc_handler	= proc_dointvec_minmax,
1850		.extra1		= &one,
1851	},
1852	{ }
1853};
1854
1855static struct ctl_table debug_table[] = {
1856#ifdef CONFIG_SYSCTL_EXCEPTION_TRACE
1857	{
1858		.procname	= "exception-trace",
1859		.data		= &show_unhandled_signals,
1860		.maxlen		= sizeof(int),
1861		.mode		= 0644,
1862		.proc_handler	= proc_dointvec
1863	},
1864#endif
1865#if defined(CONFIG_OPTPROBES)
1866	{
1867		.procname	= "kprobes-optimization",
1868		.data		= &sysctl_kprobes_optimization,
1869		.maxlen		= sizeof(int),
1870		.mode		= 0644,
1871		.proc_handler	= proc_kprobes_optimization_handler,
1872		.extra1		= &zero,
1873		.extra2		= &one,
1874	},
1875#endif
1876	{ }
1877};
1878
1879static struct ctl_table dev_table[] = {
1880	{ }
1881};
1882
1883int __init sysctl_init(void)
1884{
1885	struct ctl_table_header *hdr;
1886
1887	hdr = register_sysctl_table(sysctl_base_table);
1888	kmemleak_not_leak(hdr);
1889	return 0;
1890}
1891
1892#endif /* CONFIG_SYSCTL */
1893
1894/*
1895 * /proc/sys support
1896 */
1897
1898#ifdef CONFIG_PROC_SYSCTL
1899
1900static int _proc_do_string(char *data, int maxlen, int write,
1901			   char __user *buffer,
1902			   size_t *lenp, loff_t *ppos)
1903{
1904	size_t len;
1905	char __user *p;
1906	char c;
1907
1908	if (!data || !maxlen || !*lenp) {
1909		*lenp = 0;
1910		return 0;
1911	}
1912
1913	if (write) {
1914		if (sysctl_writes_strict == SYSCTL_WRITES_STRICT) {
1915			/* Only continue writes not past the end of buffer. */
1916			len = strlen(data);
1917			if (len > maxlen - 1)
1918				len = maxlen - 1;
1919
1920			if (*ppos > len)
1921				return 0;
1922			len = *ppos;
1923		} else {
1924			/* Start writing from beginning of buffer. */
1925			len = 0;
1926		}
1927
1928		*ppos += *lenp;
1929		p = buffer;
1930		while ((p - buffer) < *lenp && len < maxlen - 1) {
1931			if (get_user(c, p++))
1932				return -EFAULT;
1933			if (c == 0 || c == '\n')
1934				break;
1935			data[len++] = c;
1936		}
1937		data[len] = 0;
1938	} else {
1939		len = strlen(data);
1940		if (len > maxlen)
1941			len = maxlen;
1942
1943		if (*ppos > len) {
1944			*lenp = 0;
1945			return 0;
1946		}
1947
1948		data += *ppos;
1949		len  -= *ppos;
1950
1951		if (len > *lenp)
1952			len = *lenp;
1953		if (len)
1954			if (copy_to_user(buffer, data, len))
1955				return -EFAULT;
1956		if (len < *lenp) {
1957			if (put_user('\n', buffer + len))
1958				return -EFAULT;
1959			len++;
1960		}
1961		*lenp = len;
1962		*ppos += len;
1963	}
1964	return 0;
1965}
1966
1967static void warn_sysctl_write(struct ctl_table *table)
1968{
1969	pr_warn_once("%s wrote to %s when file position was not 0!\n"
1970		"This will not be supported in the future. To silence this\n"
1971		"warning, set kernel.sysctl_writes_strict = -1\n",
1972		current->comm, table->procname);
1973}
1974
1975/**
1976 * proc_first_pos_non_zero_ignore - check if firs position is allowed
1977 * @ppos: file position
1978 * @table: the sysctl table
1979 *
1980 * Returns true if the first position is non-zero and the sysctl_writes_strict
1981 * mode indicates this is not allowed for numeric input types. String proc
1982 * hadlers can ignore the return value.
1983 */
1984static bool proc_first_pos_non_zero_ignore(loff_t *ppos,
1985					   struct ctl_table *table)
1986{
1987	if (!*ppos)
1988		return false;
1989
1990	switch (sysctl_writes_strict) {
1991	case SYSCTL_WRITES_STRICT:
1992		return true;
1993	case SYSCTL_WRITES_WARN:
1994		warn_sysctl_write(table);
1995		return false;
1996	default:
1997		return false;
1998	}
1999}
2000
2001/**
2002 * proc_dostring - read a string sysctl
2003 * @table: the sysctl table
2004 * @write: %TRUE if this is a write to the sysctl file
2005 * @buffer: the user buffer
2006 * @lenp: the size of the user buffer
2007 * @ppos: file position
2008 *
2009 * Reads/writes a string from/to the user buffer. If the kernel
2010 * buffer provided is not large enough to hold the string, the
2011 * string is truncated. The copied string is %NULL-terminated.
2012 * If the string is being read by the user process, it is copied
2013 * and a newline '\n' is added. It is truncated if the buffer is
2014 * not large enough.
2015 *
2016 * Returns 0 on success.
2017 */
2018int proc_dostring(struct ctl_table *table, int write,
2019		  void __user *buffer, size_t *lenp, loff_t *ppos)
2020{
2021	if (write)
2022		proc_first_pos_non_zero_ignore(ppos, table);
2023
2024	return _proc_do_string((char *)(table->data), table->maxlen, write,
2025			       (char __user *)buffer, lenp, ppos);
2026}
2027
/*
 * Advance *buf to the position reported by skip_spaces() and return how
 * many bytes were stepped over.
 */
static size_t proc_skip_spaces(char **buf)
{
	char *start = *buf;

	*buf = skip_spaces(start);
	return *buf - start;
}
2036
/*
 * Step over leading occurrences of @v: while *size is non-zero and the
 * current byte equals @v, advance *buf and decrement *size.
 */
static void proc_skip_char(char **buf, size_t *size, const char v)
{
	for (; *size && **buf == v; (*buf)++)
		(*size)--;
}
2046
2047#define TMPBUFLEN 22
2048/**
2049 * proc_get_long - reads an ASCII formatted integer from a user buffer
2050 *
2051 * @buf: a kernel buffer
2052 * @size: size of the kernel buffer
2053 * @val: this is where the number will be stored
2054 * @neg: set to %TRUE if number is negative
2055 * @perm_tr: a vector which contains the allowed trailers
2056 * @perm_tr_len: size of the perm_tr vector
2057 * @tr: pointer to store the trailer character
2058 *
2059 * In case of success %0 is returned and @buf and @size are updated with
2060 * the amount of bytes read. If @tr is non-NULL and a trailing
2061 * character exists (size is non-zero after returning from this
2062 * function), @tr is updated with the trailing character.
2063 */
2064static int proc_get_long(char **buf, size_t *size,
2065			  unsigned long *val, bool *neg,
2066			  const char *perm_tr, unsigned perm_tr_len, char *tr)
2067{
2068	int len;
2069	char *p, tmp[TMPBUFLEN];
2070
2071	if (!*size)
2072		return -EINVAL;
2073
2074	len = *size;
2075	if (len > TMPBUFLEN - 1)
2076		len = TMPBUFLEN - 1;
2077
2078	memcpy(tmp, *buf, len);
2079
2080	tmp[len] = 0;
2081	p = tmp;
2082	if (*p == '-' && *size > 1) {
2083		*neg = true;
2084		p++;
2085	} else
2086		*neg = false;
2087	if (!isdigit(*p))
2088		return -EINVAL;
2089
2090	*val = simple_strtoul(p, &p, 0);
2091
2092	len = p - tmp;
2093
2094	/* We don't know if the next char is whitespace thus we may accept
2095	 * invalid integers (e.g. 1234...a) or two integers instead of one
2096	 * (e.g. 123...1). So lets not allow such large numbers. */
2097	if (len == TMPBUFLEN - 1)
2098		return -EINVAL;
2099
2100	if (len < *size && perm_tr_len && !memchr(perm_tr, *p, perm_tr_len))
2101		return -EINVAL;
2102
2103	if (tr && (len < *size))
2104		*tr = *p;
2105
2106	*buf += len;
2107	*size -= len;
2108
2109	return 0;
2110}
2111
2112/**
2113 * proc_put_long - converts an integer to a decimal ASCII formatted string
2114 *
2115 * @buf: the user buffer
2116 * @size: the size of the user buffer
2117 * @val: the integer to be converted
2118 * @neg: sign of the number, %TRUE for negative
2119 *
2120 * In case of success %0 is returned and @buf and @size are updated with
2121 * the amount of bytes written.
2122 */
2123static int proc_put_long(void __user **buf, size_t *size, unsigned long val,
2124			  bool neg)
2125{
2126	int len;
2127	char tmp[TMPBUFLEN], *p = tmp;
2128
2129	sprintf(p, "%s%lu", neg ? "-" : "", val);
2130	len = strlen(tmp);
2131	if (len > *size)
2132		len = *size;
2133	if (copy_to_user(*buf, tmp, len))
2134		return -EFAULT;
2135	*size -= len;
2136	*buf += len;
2137	return 0;
2138}
2139#undef TMPBUFLEN
2140
2141static int proc_put_char(void __user **buf, size_t *size, char c)
2142{
2143	if (*size) {
2144		char __user **buffer = (char __user **)buf;
2145		if (put_user(c, *buffer))
2146			return -EFAULT;
2147		(*size)--, (*buffer)++;
2148		*buf = *buffer;
2149	}
2150	return 0;
2151}
2152
/*
 * Default conversion between the (sign, magnitude) pair used by the
 * parser and a plain int.
 *
 * Write: rejects magnitudes that do not fit an int (-EINVAL), otherwise
 * stores the signed value in *valp.
 * Read: splits *valp into *negp and *lvalp.
 *
 * @data is unused.
 */
static int do_proc_dointvec_conv(bool *negp, unsigned long *lvalp,
				 int *valp,
				 int write, void *data)
{
	if (!write) {
		int cur = *valp;

		if (cur < 0) {
			*negp = true;
			*lvalp = -(unsigned long)cur;
		} else {
			*negp = false;
			*lvalp = (unsigned long)cur;
		}
		return 0;
	}

	if (*negp) {
		/* The negative range reaches one further than the positive. */
		if (*lvalp > (unsigned long) INT_MAX + 1)
			return -EINVAL;
		*valp = -*lvalp;
		return 0;
	}

	if (*lvalp > (unsigned long) INT_MAX)
		return -EINVAL;
	*valp = *lvalp;
	return 0;
}
2179
/*
 * Default conversion between an unsigned long and an unsigned int.
 *
 * Write: values above UINT_MAX are rejected with -EINVAL, anything else
 * is stored in *valp.
 * Read: *valp is widened into *lvalp.
 *
 * @data is unused.
 */
static int do_proc_douintvec_conv(unsigned long *lvalp,
				  unsigned int *valp,
				  int write, void *data)
{
	if (!write) {
		*lvalp = (unsigned long)*valp;
		return 0;
	}

	if (*lvalp > UINT_MAX)
		return -EINVAL;

	*valp = *lvalp;
	return 0;
}
2194
/*
 * Characters allowed to follow a parsed number.  Callers pass
 * sizeof(proc_wspace_sep) as the element count, so this must stay a
 * plain character list without a terminating NUL.
 */
static const char proc_wspace_sep[] = {
	' ',
	'\t',
	'\n',
};
2196
2197static int __do_proc_dointvec(void *tbl_data, struct ctl_table *table,
2198		  int write, void __user *buffer,
2199		  size_t *lenp, loff_t *ppos,
2200		  int (*conv)(bool *negp, unsigned long *lvalp, int *valp,
2201			      int write, void *data),
2202		  void *data)
2203{
2204	int *i, vleft, first = 1, err = 0;
2205	size_t left;
2206	char *kbuf = NULL, *p;
2207	
2208	if (!tbl_data || !table->maxlen || !*lenp || (*ppos && !write)) {
2209		*lenp = 0;
2210		return 0;
2211	}
2212	
2213	i = (int *) tbl_data;
2214	vleft = table->maxlen / sizeof(*i);
2215	left = *lenp;
2216
2217	if (!conv)
2218		conv = do_proc_dointvec_conv;
2219
2220	if (write) {
2221		if (proc_first_pos_non_zero_ignore(ppos, table))
2222			goto out;
 
 
 
 
 
 
 
 
 
2223
2224		if (left > PAGE_SIZE - 1)
2225			left = PAGE_SIZE - 1;
2226		p = kbuf = memdup_user_nul(buffer, left);
2227		if (IS_ERR(kbuf))
2228			return PTR_ERR(kbuf);
2229	}
2230
2231	for (; left && vleft--; i++, first=0) {
2232		unsigned long lval;
2233		bool neg;
2234
2235		if (write) {
2236			left -= proc_skip_spaces(&p);
2237
2238			if (!left)
2239				break;
2240			err = proc_get_long(&p, &left, &lval, &neg,
2241					     proc_wspace_sep,
2242					     sizeof(proc_wspace_sep), NULL);
2243			if (err)
2244				break;
2245			if (conv(&neg, &lval, i, 1, data)) {
2246				err = -EINVAL;
2247				break;
2248			}
2249		} else {
2250			if (conv(&neg, &lval, i, 0, data)) {
2251				err = -EINVAL;
2252				break;
2253			}
2254			if (!first)
2255				err = proc_put_char(&buffer, &left, '\t');
2256			if (err)
2257				break;
2258			err = proc_put_long(&buffer, &left, lval, neg);
2259			if (err)
2260				break;
2261		}
2262	}
2263
2264	if (!write && !first && left && !err)
2265		err = proc_put_char(&buffer, &left, '\n');
2266	if (write && !err && left)
2267		left -= proc_skip_spaces(&p);
2268	if (write) {
2269		kfree(kbuf);
2270		if (first)
2271			return err ? : -EINVAL;
2272	}
2273	*lenp -= left;
2274out:
2275	*ppos += *lenp;
2276	return err;
2277}
2278
2279static int do_proc_dointvec(struct ctl_table *table, int write,
2280		  void __user *buffer, size_t *lenp, loff_t *ppos,
2281		  int (*conv)(bool *negp, unsigned long *lvalp, int *valp,
2282			      int write, void *data),
2283		  void *data)
2284{
2285	return __do_proc_dointvec(table->data, table, write,
2286			buffer, lenp, ppos, conv, data);
2287}
2288
2289static int do_proc_douintvec_w(unsigned int *tbl_data,
2290			       struct ctl_table *table,
2291			       void __user *buffer,
2292			       size_t *lenp, loff_t *ppos,
2293			       int (*conv)(unsigned long *lvalp,
2294					   unsigned int *valp,
2295					   int write, void *data),
2296			       void *data)
2297{
2298	unsigned long lval;
2299	int err = 0;
2300	size_t left;
2301	bool neg;
2302	char *kbuf = NULL, *p;
2303
2304	left = *lenp;
2305
2306	if (proc_first_pos_non_zero_ignore(ppos, table))
2307		goto bail_early;
2308
2309	if (left > PAGE_SIZE - 1)
2310		left = PAGE_SIZE - 1;
2311
2312	p = kbuf = memdup_user_nul(buffer, left);
2313	if (IS_ERR(kbuf))
2314		return -EINVAL;
2315
2316	left -= proc_skip_spaces(&p);
2317	if (!left) {
2318		err = -EINVAL;
2319		goto out_free;
2320	}
2321
2322	err = proc_get_long(&p, &left, &lval, &neg,
2323			     proc_wspace_sep,
2324			     sizeof(proc_wspace_sep), NULL);
2325	if (err || neg) {
2326		err = -EINVAL;
2327		goto out_free;
2328	}
2329
2330	if (conv(&lval, tbl_data, 1, data)) {
2331		err = -EINVAL;
2332		goto out_free;
2333	}
2334
2335	if (!err && left)
2336		left -= proc_skip_spaces(&p);
2337
2338out_free:
2339	kfree(kbuf);
2340	if (err)
2341		return -EINVAL;
2342
2343	return 0;
2344
2345	/* This is in keeping with old __do_proc_dointvec() */
2346bail_early:
2347	*ppos += *lenp;
2348	return err;
2349}
2350
2351static int do_proc_douintvec_r(unsigned int *tbl_data, void __user *buffer,
2352			       size_t *lenp, loff_t *ppos,
2353			       int (*conv)(unsigned long *lvalp,
2354					   unsigned int *valp,
2355					   int write, void *data),
2356			       void *data)
2357{
2358	unsigned long lval;
2359	int err = 0;
2360	size_t left;
2361
2362	left = *lenp;
2363
2364	if (conv(&lval, tbl_data, 0, data)) {
2365		err = -EINVAL;
2366		goto out;
2367	}
2368
2369	err = proc_put_long(&buffer, &left, lval, false);
2370	if (err || !left)
2371		goto out;
2372
2373	err = proc_put_char(&buffer, &left, '\n');
2374
2375out:
2376	*lenp -= left;
2377	*ppos += *lenp;
2378
2379	return err;
2380}
2381
2382static int __do_proc_douintvec(void *tbl_data, struct ctl_table *table,
2383			       int write, void __user *buffer,
2384			       size_t *lenp, loff_t *ppos,
2385			       int (*conv)(unsigned long *lvalp,
2386					   unsigned int *valp,
2387					   int write, void *data),
2388			       void *data)
2389{
2390	unsigned int *i, vleft;
2391
2392	if (!tbl_data || !table->maxlen || !*lenp || (*ppos && !write)) {
2393		*lenp = 0;
2394		return 0;
2395	}
2396
2397	i = (unsigned int *) tbl_data;
2398	vleft = table->maxlen / sizeof(*i);
2399
2400	/*
2401	 * Arrays are not supported, keep this simple. *Do not* add
2402	 * support for them.
2403	 */
2404	if (vleft != 1) {
2405		*lenp = 0;
2406		return -EINVAL;
2407	}
2408
2409	if (!conv)
2410		conv = do_proc_douintvec_conv;
2411
2412	if (write)
2413		return do_proc_douintvec_w(i, table, buffer, lenp, ppos,
2414					   conv, data);
2415	return do_proc_douintvec_r(i, buffer, lenp, ppos, conv, data);
2416}
2417
2418static int do_proc_douintvec(struct ctl_table *table, int write,
2419			     void __user *buffer, size_t *lenp, loff_t *ppos,
2420			     int (*conv)(unsigned long *lvalp,
2421					 unsigned int *valp,
2422					 int write, void *data),
2423			     void *data)
2424{
2425	return __do_proc_douintvec(table->data, table, write,
2426				   buffer, lenp, ppos, conv, data);
2427}
2428
2429/**
2430 * proc_dointvec - read a vector of integers
2431 * @table: the sysctl table
2432 * @write: %TRUE if this is a write to the sysctl file
2433 * @buffer: the user buffer
2434 * @lenp: the size of the user buffer
2435 * @ppos: file position
2436 *
2437 * Reads/writes up to table->maxlen/sizeof(unsigned int) integer
2438 * values from/to the user buffer, treated as an ASCII string. 
2439 *
2440 * Returns 0 on success.
2441 */
2442int proc_dointvec(struct ctl_table *table, int write,
2443		     void __user *buffer, size_t *lenp, loff_t *ppos)
2444{
2445	return do_proc_dointvec(table, write, buffer, lenp, ppos, NULL, NULL);
2446}
2447
2448/**
2449 * proc_douintvec - read a vector of unsigned integers
2450 * @table: the sysctl table
2451 * @write: %TRUE if this is a write to the sysctl file
2452 * @buffer: the user buffer
2453 * @lenp: the size of the user buffer
2454 * @ppos: file position
2455 *
2456 * Reads/writes up to table->maxlen/sizeof(unsigned int) unsigned integer
2457 * values from/to the user buffer, treated as an ASCII string.
2458 *
2459 * Returns 0 on success.
2460 */
2461int proc_douintvec(struct ctl_table *table, int write,
2462		     void __user *buffer, size_t *lenp, loff_t *ppos)
2463{
2464	return do_proc_douintvec(table, write, buffer, lenp, ppos,
2465				 do_proc_douintvec_conv, NULL);
2466}
2467
2468/*
2469 * Taint values can only be increased
2470 * This means we can safely use a temporary.
2471 */
2472static int proc_taint(struct ctl_table *table, int write,
2473			       void __user *buffer, size_t *lenp, loff_t *ppos)
2474{
2475	struct ctl_table t;
2476	unsigned long tmptaint = get_taint();
2477	int err;
2478
2479	if (write && !capable(CAP_SYS_ADMIN))
2480		return -EPERM;
2481
2482	t = *table;
2483	t.data = &tmptaint;
2484	err = proc_doulongvec_minmax(&t, write, buffer, lenp, ppos);
2485	if (err < 0)
2486		return err;
2487
2488	if (write) {
2489		/*
2490		 * Poor man's atomic or. Not worth adding a primitive
2491		 * to everyone's atomic.h for this
2492		 */
2493		int i;
2494		for (i = 0; i < BITS_PER_LONG && tmptaint >> i; i++) {
2495			if ((tmptaint >> i) & 1)
2496				add_taint(i, LOCKDEP_STILL_OK);
2497		}
2498	}
2499
2500	return err;
2501}
2502
2503#ifdef CONFIG_PRINTK
2504static int proc_dointvec_minmax_sysadmin(struct ctl_table *table, int write,
2505				void __user *buffer, size_t *lenp, loff_t *ppos)
2506{
2507	if (write && !capable(CAP_SYS_ADMIN))
2508		return -EPERM;
2509
2510	return proc_dointvec_minmax(table, write, buffer, lenp, ppos);
2511}
2512#endif
2513
/**
 * struct do_proc_dointvec_minmax_conv_param - proc_dointvec_minmax() range checking structure
 * @min: pointer to minimum allowable value
 * @max: pointer to maximum allowable value
 *
 * The do_proc_dointvec_minmax_conv_param structure provides the
 * minimum and maximum values for doing range checking for those sysctl
 * parameters that use the proc_dointvec_minmax() handler.
 */
struct do_proc_dointvec_minmax_conv_param {
	int *min;
	int *max;
};

/*
 * Converter for proc_dointvec_minmax().
 *
 * @negp:  sign of the value (input on write, output on read)
 * @lvalp: magnitude of the value (input on write, output on read)
 * @valp:  the int being read or written
 * @write: non-zero when storing a parsed value
 * @data:  struct do_proc_dointvec_minmax_conv_param with optional bounds
 *
 * Write: the magnitude is first checked to fit an int.  Without this
 * check the narrowing from unsigned long could wrap an oversized input
 * into the permitted window and have it accepted.  The signed value is
 * then compared against the optional bounds and only stored if it
 * passes; *valp is left untouched on failure.
 * Read: *valp is split into sign and magnitude.
 *
 * Returns 0 on success or -EINVAL when the value is rejected.
 */
static int do_proc_dointvec_minmax_conv(bool *negp, unsigned long *lvalp,
					int *valp,
					int write, void *data)
{
	struct do_proc_dointvec_minmax_conv_param *param = data;

	if (write) {
		int val;

		if (*negp) {
			/* |INT_MIN| is one larger than INT_MAX. */
			if (*lvalp > (unsigned long) INT_MAX + 1)
				return -EINVAL;
			val = -*lvalp;
		} else {
			if (*lvalp > (unsigned long) INT_MAX)
				return -EINVAL;
			val = *lvalp;
		}

		if ((param->min && *param->min > val) ||
		    (param->max && *param->max < val))
			return -EINVAL;
		*valp = val;
	} else {
		int val = *valp;

		if (val < 0) {
			*negp = true;
			*lvalp = -(unsigned long)val;
		} else {
			*negp = false;
			*lvalp = (unsigned long)val;
		}
	}
	return 0;
}
2551
2552/**
2553 * proc_dointvec_minmax - read a vector of integers with min/max values
2554 * @table: the sysctl table
2555 * @write: %TRUE if this is a write to the sysctl file
2556 * @buffer: the user buffer
2557 * @lenp: the size of the user buffer
2558 * @ppos: file position
2559 *
2560 * Reads/writes up to table->maxlen/sizeof(unsigned int) integer
2561 * values from/to the user buffer, treated as an ASCII string.
2562 *
2563 * This routine will ensure the values are within the range specified by
2564 * table->extra1 (min) and table->extra2 (max).
2565 *
2566 * Returns 0 on success or -EINVAL on write when the range check fails.
2567 */
2568int proc_dointvec_minmax(struct ctl_table *table, int write,
2569		  void __user *buffer, size_t *lenp, loff_t *ppos)
2570{
2571	struct do_proc_dointvec_minmax_conv_param param = {
2572		.min = (int *) table->extra1,
2573		.max = (int *) table->extra2,
2574	};
2575	return do_proc_dointvec(table, write, buffer, lenp, ppos,
2576				do_proc_dointvec_minmax_conv, &param);
2577}
2578
/**
 * struct do_proc_douintvec_minmax_conv_param - proc_douintvec_minmax() range checking structure
 * @min: pointer to minimum allowable value
 * @max: pointer to maximum allowable value
 *
 * Carries the optional lower and upper bound used when range checking
 * sysctl parameters that go through the proc_douintvec_minmax() handler.
 */
struct do_proc_douintvec_minmax_conv_param {
	unsigned int *min;
	unsigned int *max;
};

/*
 * Converter for proc_douintvec_minmax().
 *
 * Write: a value above UINT_MAX is rejected with -EINVAL; a value outside
 * the optional bounds in @data is rejected with -ERANGE; otherwise it is
 * stored in *valp.
 * Read: *valp is widened into *lvalp.
 */
static int do_proc_douintvec_minmax_conv(unsigned long *lvalp,
					 unsigned int *valp,
					 int write, void *data)
{
	struct do_proc_douintvec_minmax_conv_param *bounds = data;
	unsigned int candidate;

	if (!write) {
		*lvalp = (unsigned long) *valp;
		return 0;
	}

	if (*lvalp > UINT_MAX)
		return -EINVAL;

	candidate = *lvalp;

	if (bounds->min && *bounds->min > candidate)
		return -ERANGE;
	if (bounds->max && *bounds->max < candidate)
		return -ERANGE;

	*valp = candidate;
	return 0;
}
2617
2618/**
2619 * proc_douintvec_minmax - read a vector of unsigned ints with min/max values
2620 * @table: the sysctl table
2621 * @write: %TRUE if this is a write to the sysctl file
2622 * @buffer: the user buffer
2623 * @lenp: the size of the user buffer
2624 * @ppos: file position
2625 *
2626 * Reads/writes up to table->maxlen/sizeof(unsigned int) unsigned integer
2627 * values from/to the user buffer, treated as an ASCII string. Negative
2628 * strings are not allowed.
2629 *
2630 * This routine will ensure the values are within the range specified by
2631 * table->extra1 (min) and table->extra2 (max). There is a final sanity
2632 * check for UINT_MAX to avoid having to support wrap around uses from
2633 * userspace.
2634 *
2635 * Returns 0 on success or -ERANGE on write when the range check fails.
2636 */
2637int proc_douintvec_minmax(struct ctl_table *table, int write,
2638			  void __user *buffer, size_t *lenp, loff_t *ppos)
2639{
2640	struct do_proc_douintvec_minmax_conv_param param = {
2641		.min = (unsigned int *) table->extra1,
2642		.max = (unsigned int *) table->extra2,
2643	};
2644	return do_proc_douintvec(table, write, buffer, lenp, ppos,
2645				 do_proc_douintvec_minmax_conv, &param);
2646}
2647
/*
 * Converter for the pipe-max-size sysctl.
 *
 * Write: the requested size is passed through round_pipe_size(); a result
 * of 0 is treated as invalid (-EINVAL), anything else is stored.
 * Read: *valp is widened into *lvalp.
 *
 * @data is unused.
 */
static int do_proc_dopipe_max_size_conv(unsigned long *lvalp,
					unsigned int *valp,
					int write, void *data)
{
	unsigned int rounded;

	if (!write) {
		*lvalp = (unsigned long) *valp;
		return 0;
	}

	rounded = round_pipe_size(*lvalp);
	if (rounded == 0)
		return -EINVAL;

	*valp = rounded;
	return 0;
}
2667
2668static int proc_dopipe_max_size(struct ctl_table *table, int write,
2669				void __user *buffer, size_t *lenp, loff_t *ppos)
2670{
2671	return do_proc_douintvec(table, write, buffer, lenp, ppos,
2672				 do_proc_dopipe_max_size_conv, NULL);
2673}
2674
/*
 * Warn when suid_dumpable is SUID_DUMP_ROOT while core_pattern starts
 * with neither '/' nor '|'.  Compiles to nothing without CONFIG_COREDUMP.
 */
static void validate_coredump_safety(void)
{
#ifdef CONFIG_COREDUMP
	if (suid_dumpable != SUID_DUMP_ROOT)
		return;

	/* An absolute path or a pipe handler is considered safe. */
	if (core_pattern[0] == '/' || core_pattern[0] == '|')
		return;

	printk(KERN_WARNING
"Unsafe core_pattern used with fs.suid_dumpable=2.\n"
"Pipe handler or fully qualified core dump path required.\n"
"Set kernel.core_pattern before fs.suid_dumpable.\n"
	);
#endif
}
2688
2689static int proc_dointvec_minmax_coredump(struct ctl_table *table, int write,
2690		void __user *buffer, size_t *lenp, loff_t *ppos)
2691{
2692	int error = proc_dointvec_minmax(table, write, buffer, lenp, ppos);
2693	if (!error)
2694		validate_coredump_safety();
2695	return error;
2696}
2697
2698#ifdef CONFIG_COREDUMP
2699static int proc_dostring_coredump(struct ctl_table *table, int write,
2700		  void __user *buffer, size_t *lenp, loff_t *ppos)
2701{
2702	int error = proc_dostring(table, write, buffer, lenp, ppos);
2703	if (!error)
2704		validate_coredump_safety();
2705	return error;
2706}
2707#endif
2708
2709static int __do_proc_doulongvec_minmax(void *data, struct ctl_table *table, int write,
2710				     void __user *buffer,
2711				     size_t *lenp, loff_t *ppos,
2712				     unsigned long convmul,
2713				     unsigned long convdiv)
2714{
2715	unsigned long *i, *min, *max;
2716	int vleft, first = 1, err = 0;
2717	size_t left;
2718	char *kbuf = NULL, *p;
2719
2720	if (!data || !table->maxlen || !*lenp || (*ppos && !write)) {
2721		*lenp = 0;
2722		return 0;
2723	}
2724
2725	i = (unsigned long *) data;
2726	min = (unsigned long *) table->extra1;
2727	max = (unsigned long *) table->extra2;
2728	vleft = table->maxlen / sizeof(unsigned long);
2729	left = *lenp;
2730
2731	if (write) {
2732		if (proc_first_pos_non_zero_ignore(ppos, table))
2733			goto out;
 
 
 
 
 
 
 
 
 
2734
2735		if (left > PAGE_SIZE - 1)
2736			left = PAGE_SIZE - 1;
2737		p = kbuf = memdup_user_nul(buffer, left);
2738		if (IS_ERR(kbuf))
2739			return PTR_ERR(kbuf);
2740	}
2741
2742	for (; left && vleft--; i++, first = 0) {
2743		unsigned long val;
2744
2745		if (write) {
2746			bool neg;
2747
2748			left -= proc_skip_spaces(&p);
2749
2750			err = proc_get_long(&p, &left, &val, &neg,
2751					     proc_wspace_sep,
2752					     sizeof(proc_wspace_sep), NULL);
2753			if (err)
2754				break;
2755			if (neg)
2756				continue;
2757			val = convmul * val / convdiv;
2758			if ((min && val < *min) || (max && val > *max))
2759				continue;
2760			*i = val;
2761		} else {
2762			val = convdiv * (*i) / convmul;
2763			if (!first) {
2764				err = proc_put_char(&buffer, &left, '\t');
2765				if (err)
2766					break;
2767			}
2768			err = proc_put_long(&buffer, &left, val, false);
2769			if (err)
2770				break;
2771		}
2772	}
2773
2774	if (!write && !first && left && !err)
2775		err = proc_put_char(&buffer, &left, '\n');
2776	if (write && !err)
2777		left -= proc_skip_spaces(&p);
2778	if (write) {
2779		kfree(kbuf);
2780		if (first)
2781			return err ? : -EINVAL;
2782	}
2783	*lenp -= left;
2784out:
2785	*ppos += *lenp;
2786	return err;
2787}
2788
2789static int do_proc_doulongvec_minmax(struct ctl_table *table, int write,
2790				     void __user *buffer,
2791				     size_t *lenp, loff_t *ppos,
2792				     unsigned long convmul,
2793				     unsigned long convdiv)
2794{
2795	return __do_proc_doulongvec_minmax(table->data, table, write,
2796			buffer, lenp, ppos, convmul, convdiv);
2797}
2798
2799/**
2800 * proc_doulongvec_minmax - read a vector of long integers with min/max values
2801 * @table: the sysctl table
2802 * @write: %TRUE if this is a write to the sysctl file
2803 * @buffer: the user buffer
2804 * @lenp: the size of the user buffer
2805 * @ppos: file position
2806 *
2807 * Reads/writes up to table->maxlen/sizeof(unsigned long) unsigned long
2808 * values from/to the user buffer, treated as an ASCII string.
2809 *
2810 * This routine will ensure the values are within the range specified by
2811 * table->extra1 (min) and table->extra2 (max).
2812 *
2813 * Returns 0 on success.
2814 */
2815int proc_doulongvec_minmax(struct ctl_table *table, int write,
2816			   void __user *buffer, size_t *lenp, loff_t *ppos)
2817{
2818    return do_proc_doulongvec_minmax(table, write, buffer, lenp, ppos, 1l, 1l);
2819}
2820
2821/**
2822 * proc_doulongvec_ms_jiffies_minmax - read a vector of millisecond values with min/max values
2823 * @table: the sysctl table
2824 * @write: %TRUE if this is a write to the sysctl file
2825 * @buffer: the user buffer
2826 * @lenp: the size of the user buffer
2827 * @ppos: file position
2828 *
2829 * Reads/writes up to table->maxlen/sizeof(unsigned long) unsigned long
2830 * values from/to the user buffer, treated as an ASCII string. The values
2831 * are treated as milliseconds, and converted to jiffies when they are stored.
2832 *
2833 * This routine will ensure the values are within the range specified by
2834 * table->extra1 (min) and table->extra2 (max).
2835 *
2836 * Returns 0 on success.
2837 */
2838int proc_doulongvec_ms_jiffies_minmax(struct ctl_table *table, int write,
2839				      void __user *buffer,
2840				      size_t *lenp, loff_t *ppos)
2841{
2842    return do_proc_doulongvec_minmax(table, write, buffer,
2843				     lenp, ppos, HZ, 1000l);
2844}
2845
2846
2847static int do_proc_dointvec_jiffies_conv(bool *negp, unsigned long *lvalp,
2848					 int *valp,
2849					 int write, void *data)
2850{
2851	if (write) {
2852		if (*lvalp > INT_MAX / HZ)
2853			return 1;
2854		*valp = *negp ? -(*lvalp*HZ) : (*lvalp*HZ);
2855	} else {
2856		int val = *valp;
2857		unsigned long lval;
2858		if (val < 0) {
2859			*negp = true;
2860			lval = -(unsigned long)val;
2861		} else {
2862			*negp = false;
2863			lval = (unsigned long)val;
2864		}
2865		*lvalp = lval / HZ;
2866	}
2867	return 0;
2868}
2869
2870static int do_proc_dointvec_userhz_jiffies_conv(bool *negp, unsigned long *lvalp,
2871						int *valp,
2872						int write, void *data)
2873{
2874	if (write) {
2875		if (USER_HZ < HZ && *lvalp > (LONG_MAX / HZ) * USER_HZ)
2876			return 1;
2877		*valp = clock_t_to_jiffies(*negp ? -*lvalp : *lvalp);
2878	} else {
2879		int val = *valp;
2880		unsigned long lval;
2881		if (val < 0) {
2882			*negp = true;
2883			lval = -(unsigned long)val;
2884		} else {
2885			*negp = false;
2886			lval = (unsigned long)val;
2887		}
2888		*lvalp = jiffies_to_clock_t(lval);
2889	}
2890	return 0;
2891}
2892
/*
 * Conversion callback between a sign/magnitude pair (*negp, *lvalp) and an
 * int value (*valp), going through msecs_to_jiffies() on write and
 * jiffies_to_msecs() on read.
 *
 * write != 0: convert the (possibly negated) input; if the result is
 *             larger than INT_MAX return 1 without storing, otherwise
 *             store it in *valp.
 * write == 0: split *valp into sign and magnitude and report the
 *             converted magnitude.
 *
 * @data is unused. Returns 0 unless the range check above fails.
 */
static int do_proc_dointvec_ms_jiffies_conv(bool *negp, unsigned long *lvalp,
					    int *valp,
					    int write, void *data)
{
	unsigned long magnitude;
	bool negative;
	int stored;

	if (write) {
		unsigned long jif;

		negative = *negp;
		jif = msecs_to_jiffies(negative ? -*lvalp : *lvalp);
		if (jif > INT_MAX)
			return 1;

		*valp = (int)jif;
		return 0;
	}

	stored = *valp;
	negative = stored < 0;
	/* Negate in unsigned arithmetic so the most negative int is safe. */
	magnitude = (unsigned long)stored;
	if (negative)
		magnitude = -magnitude;

	*negp = negative;
	*lvalp = jiffies_to_msecs(magnitude);
	return 0;
}
2917
2918/**
2919 * proc_dointvec_jiffies - read a vector of integers as seconds
2920 * @table: the sysctl table
2921 * @write: %TRUE if this is a write to the sysctl file
2922 * @buffer: the user buffer
2923 * @lenp: the size of the user buffer
2924 * @ppos: file position
2925 *
2926 * Reads/writes up to table->maxlen/sizeof(unsigned int) integer
2927 * values from/to the user buffer, treated as an ASCII string. 
2928 * The values read are assumed to be in seconds, and are converted into
2929 * jiffies.
2930 *
2931 * Returns 0 on success.
2932 */
2933int proc_dointvec_jiffies(struct ctl_table *table, int write,
2934			  void __user *buffer, size_t *lenp, loff_t *ppos)
2935{
2936    return do_proc_dointvec(table,write,buffer,lenp,ppos,
2937		    	    do_proc_dointvec_jiffies_conv,NULL);
2938}
2939
2940/**
2941 * proc_dointvec_userhz_jiffies - read a vector of integers as 1/USER_HZ seconds
2942 * @table: the sysctl table
2943 * @write: %TRUE if this is a write to the sysctl file
2944 * @buffer: the user buffer
2945 * @lenp: the size of the user buffer
2946 * @ppos: pointer to the file position
2947 *
2948 * Reads/writes up to table->maxlen/sizeof(unsigned int) integer
2949 * values from/to the user buffer, treated as an ASCII string. 
2950 * The values read are assumed to be in 1/USER_HZ seconds, and 
2951 * are converted into jiffies.
2952 *
2953 * Returns 0 on success.
2954 */
2955int proc_dointvec_userhz_jiffies(struct ctl_table *table, int write,
2956				 void __user *buffer, size_t *lenp, loff_t *ppos)
2957{
2958    return do_proc_dointvec(table,write,buffer,lenp,ppos,
2959		    	    do_proc_dointvec_userhz_jiffies_conv,NULL);
2960}
2961
2962/**
2963 * proc_dointvec_ms_jiffies - read a vector of integers as 1 milliseconds
2964 * @table: the sysctl table
2965 * @write: %TRUE if this is a write to the sysctl file
2966 * @buffer: the user buffer
2967 * @lenp: the size of the user buffer
2968 * @ppos: file position
2969 * @ppos: the current position in the file
2970 *
2971 * Reads/writes up to table->maxlen/sizeof(unsigned int) integer
2972 * values from/to the user buffer, treated as an ASCII string. 
2973 * The values read are assumed to be in 1/1000 seconds, and 
2974 * are converted into jiffies.
2975 *
2976 * Returns 0 on success.
2977 */
2978int proc_dointvec_ms_jiffies(struct ctl_table *table, int write,
2979			     void __user *buffer, size_t *lenp, loff_t *ppos)
2980{
2981	return do_proc_dointvec(table, write, buffer, lenp, ppos,
2982				do_proc_dointvec_ms_jiffies_conv, NULL);
2983}
2984
2985static int proc_do_cad_pid(struct ctl_table *table, int write,
2986			   void __user *buffer, size_t *lenp, loff_t *ppos)
2987{
2988	struct pid *new_pid;
2989	pid_t tmp;
2990	int r;
2991
2992	tmp = pid_vnr(cad_pid);
2993
2994	r = __do_proc_dointvec(&tmp, table, write, buffer,
2995			       lenp, ppos, NULL, NULL);
2996	if (r || !write)
2997		return r;
2998
2999	new_pid = find_get_pid(tmp);
3000	if (!new_pid)
3001		return -ESRCH;
3002
3003	put_pid(xchg(&cad_pid, new_pid));
3004	return 0;
3005}
3006
3007/**
3008 * proc_do_large_bitmap - read/write from/to a large bitmap
3009 * @table: the sysctl table
3010 * @write: %TRUE if this is a write to the sysctl file
3011 * @buffer: the user buffer
3012 * @lenp: the size of the user buffer
3013 * @ppos: file position
3014 *
3015 * The bitmap is stored at table->data and the bitmap length (in bits)
3016 * in table->maxlen.
3017 *
3018 * We use a range comma separated format (e.g. 1,3-4,10-10) so that
3019 * large bitmaps may be represented in a compact manner. Writing into
3020 * the file will clear the bitmap then update it with the given input.
3021 *
3022 * Returns 0 on success.
3023 */
3024int proc_do_large_bitmap(struct ctl_table *table, int write,
3025			 void __user *buffer, size_t *lenp, loff_t *ppos)
3026{
3027	int err = 0;
3028	bool first = 1;
3029	size_t left = *lenp;
3030	unsigned long bitmap_len = table->maxlen;
3031	unsigned long *bitmap = *(unsigned long **) table->data;
3032	unsigned long *tmp_bitmap = NULL;
3033	char tr_a[] = { '-', ',', '\n' }, tr_b[] = { ',', '\n', 0 }, c;
3034
3035	if (!bitmap || !bitmap_len || !left || (*ppos && !write)) {
3036		*lenp = 0;
3037		return 0;
3038	}
3039
3040	if (write) {
3041		char *kbuf, *p;
3042
3043		if (left > PAGE_SIZE - 1)
3044			left = PAGE_SIZE - 1;
3045
3046		p = kbuf = memdup_user_nul(buffer, left);
3047		if (IS_ERR(kbuf))
3048			return PTR_ERR(kbuf);
3049
3050		tmp_bitmap = kzalloc(BITS_TO_LONGS(bitmap_len) * sizeof(unsigned long),
3051				     GFP_KERNEL);
3052		if (!tmp_bitmap) {
3053			kfree(kbuf);
3054			return -ENOMEM;
3055		}
3056		proc_skip_char(&p, &left, '\n');
3057		while (!err && left) {
3058			unsigned long val_a, val_b;
3059			bool neg;
3060
3061			err = proc_get_long(&p, &left, &val_a, &neg, tr_a,
3062					     sizeof(tr_a), &c);
3063			if (err)
3064				break;
3065			if (val_a >= bitmap_len || neg) {
3066				err = -EINVAL;
3067				break;
3068			}
3069
3070			val_b = val_a;
3071			if (left) {
3072				p++;
3073				left--;
3074			}
3075
3076			if (c == '-') {
3077				err = proc_get_long(&p, &left, &val_b,
3078						     &neg, tr_b, sizeof(tr_b),
3079						     &c);
3080				if (err)
3081					break;
3082				if (val_b >= bitmap_len || neg ||
3083				    val_a > val_b) {
3084					err = -EINVAL;
3085					break;
3086				}
3087				if (left) {
3088					p++;
3089					left--;
3090				}
3091			}
3092
3093			bitmap_set(tmp_bitmap, val_a, val_b - val_a + 1);
3094			first = 0;
3095			proc_skip_char(&p, &left, '\n');
3096		}
3097		kfree(kbuf);
3098	} else {
3099		unsigned long bit_a, bit_b = 0;
3100
3101		while (left) {
3102			bit_a = find_next_bit(bitmap, bitmap_len, bit_b);
3103			if (bit_a >= bitmap_len)
3104				break;
3105			bit_b = find_next_zero_bit(bitmap, bitmap_len,
3106						   bit_a + 1) - 1;
3107
3108			if (!first) {
3109				err = proc_put_char(&buffer, &left, ',');
3110				if (err)
3111					break;
3112			}
3113			err = proc_put_long(&buffer, &left, bit_a, false);
3114			if (err)
3115				break;
3116			if (bit_a != bit_b) {
3117				err = proc_put_char(&buffer, &left, '-');
3118				if (err)
3119					break;
3120				err = proc_put_long(&buffer, &left, bit_b, false);
3121				if (err)
3122					break;
3123			}
3124
3125			first = 0; bit_b++;
3126		}
3127		if (!err)
3128			err = proc_put_char(&buffer, &left, '\n');
3129	}
3130
3131	if (!err) {
3132		if (write) {
3133			if (*ppos)
3134				bitmap_or(bitmap, bitmap, tmp_bitmap, bitmap_len);
3135			else
3136				bitmap_copy(bitmap, tmp_bitmap, bitmap_len);
3137		}
 
3138		*lenp -= left;
3139		*ppos += *lenp;
 
 
 
 
3140	}
3141
3142	kfree(tmp_bitmap);
3143	return err;
3144}
3145
3146#else /* CONFIG_PROC_SYSCTL */
3147
3148int proc_dostring(struct ctl_table *table, int write,
3149		  void __user *buffer, size_t *lenp, loff_t *ppos)
3150{
3151	return -ENOSYS;
3152}
3153
3154int proc_dointvec(struct ctl_table *table, int write,
3155		  void __user *buffer, size_t *lenp, loff_t *ppos)
3156{
3157	return -ENOSYS;
3158}
3159
3160int proc_douintvec(struct ctl_table *table, int write,
3161		  void __user *buffer, size_t *lenp, loff_t *ppos)
3162{
3163	return -ENOSYS;
3164}
3165
3166int proc_dointvec_minmax(struct ctl_table *table, int write,
3167		    void __user *buffer, size_t *lenp, loff_t *ppos)
3168{
3169	return -ENOSYS;
3170}
3171
3172int proc_douintvec_minmax(struct ctl_table *table, int write,
3173			  void __user *buffer, size_t *lenp, loff_t *ppos)
3174{
3175	return -ENOSYS;
3176}
3177
3178int proc_dointvec_jiffies(struct ctl_table *table, int write,
3179		    void __user *buffer, size_t *lenp, loff_t *ppos)
3180{
3181	return -ENOSYS;
3182}
3183
3184int proc_dointvec_userhz_jiffies(struct ctl_table *table, int write,
3185		    void __user *buffer, size_t *lenp, loff_t *ppos)
3186{
3187	return -ENOSYS;
3188}
3189
3190int proc_dointvec_ms_jiffies(struct ctl_table *table, int write,
3191			     void __user *buffer, size_t *lenp, loff_t *ppos)
3192{
3193	return -ENOSYS;
3194}
3195
3196int proc_doulongvec_minmax(struct ctl_table *table, int write,
3197		    void __user *buffer, size_t *lenp, loff_t *ppos)
3198{
3199	return -ENOSYS;
3200}
3201
3202int proc_doulongvec_ms_jiffies_minmax(struct ctl_table *table, int write,
3203				      void __user *buffer,
3204				      size_t *lenp, loff_t *ppos)
3205{
3206    return -ENOSYS;
3207}
3208
3209
3210#endif /* CONFIG_PROC_SYSCTL */
3211
/*
 * The handlers exported below are defined in both branches of the
 * CONFIG_PROC_SYSCTL conditional above, so the exports are collected
 * here once rather than repeated after each definition - exception
 * granted :-)
 */

/* string handler */
EXPORT_SYMBOL(proc_dostring);

/* int vector handlers */
EXPORT_SYMBOL(proc_dointvec);
EXPORT_SYMBOL(proc_dointvec_minmax);
EXPORT_SYMBOL(proc_dointvec_jiffies);
EXPORT_SYMBOL(proc_dointvec_userhz_jiffies);
EXPORT_SYMBOL(proc_dointvec_ms_jiffies);

/* unsigned int vector handlers */
EXPORT_SYMBOL(proc_douintvec);
EXPORT_SYMBOL_GPL(proc_douintvec_minmax);

/* unsigned long vector handlers */
EXPORT_SYMBOL(proc_doulongvec_minmax);
EXPORT_SYMBOL(proc_doulongvec_ms_jiffies_minmax);