// SPDX-License-Identifier: GPL-2.0-only
/*
 * sysctl.c: General linux system control interface
 *
 * Begun 24 March 1995, Stephen Tweedie
 * Added /proc support, Dec 1995
 * Added bdflush entry and intvec min/max checking, 2/23/96, Tom Dyas.
 * Added hooks for /proc/sys/net (minor, minor patch), 96/4/1, Mike Shaver.
 * Added kernel/java-{interpreter,appletviewer}, 96/5/10, Mike Shaver.
 * Dynamic registration fixes, Stephen Tweedie.
 * Added kswapd-interval, ctrl-alt-del, printk stuff, 1/8/97, Chris Horn.
 * Made sysctl support optional via CONFIG_SYSCTL, 1/10/97, Chris
 *  Horn.
 * Added proc_doulongvec_ms_jiffies_minmax, 09/08/99, Carlos H. Bauer.
 * Added proc_doulongvec_minmax, 09/08/99, Carlos H. Bauer.
 * Changed linked lists to use list.h instead of lists.h, 02/24/00, Bill
 *  Wendling.
 * The list_for_each() macro wasn't appropriate for the sysctl loop.
 *  Removed it and replaced it with older style, 03/23/00, Bill Wendling
 */

#include <linux/module.h>
#include <linux/mm.h>
#include <linux/swap.h>
#include <linux/slab.h>
#include <linux/sysctl.h>
#include <linux/bitmap.h>
#include <linux/signal.h>
#include <linux/panic.h>
#include <linux/printk.h>
#include <linux/proc_fs.h>
#include <linux/security.h>
#include <linux/ctype.h>
#include <linux/kmemleak.h>
#include <linux/filter.h>
#include <linux/fs.h>
#include <linux/init.h>
#include <linux/kernel.h>
#include <linux/kobject.h>
#include <linux/net.h>
#include <linux/sysrq.h>
#include <linux/highuid.h>
#include <linux/writeback.h>
#include <linux/ratelimit.h>
#include <linux/compaction.h>
#include <linux/hugetlb.h>
#include <linux/initrd.h>
#include <linux/key.h>
#include <linux/times.h>
#include <linux/limits.h>
#include <linux/dcache.h>
#include <linux/syscalls.h>
#include <linux/vmstat.h>
#include <linux/nfs_fs.h>
#include <linux/acpi.h>
#include <linux/reboot.h>
#include <linux/ftrace.h>
#include <linux/perf_event.h>
#include <linux/oom.h>
#include <linux/kmod.h>
#include <linux/capability.h>
#include <linux/binfmts.h>
#include <linux/sched/sysctl.h>
#include <linux/kexec.h>
#include <linux/mount.h>
#include <linux/userfaultfd_k.h>
#include <linux/latencytop.h>
#include <linux/pid.h>
#include <linux/delayacct.h>

#include "../lib/kstrtox.h"

#include <linux/uaccess.h>
#include <asm/processor.h>

#ifdef CONFIG_X86
#include <asm/nmi.h>
#include <asm/stacktrace.h>
#include <asm/io.h>
#endif
#ifdef CONFIG_SPARC
#include <asm/setup.h>
#endif
#ifdef CONFIG_BSD_PROCESS_ACCT
#include <linux/acct.h>
#endif
#ifdef CONFIG_RT_MUTEXES
#include <linux/rtmutex.h>
#endif
#if defined(CONFIG_PROVE_LOCKING) || defined(CONFIG_LOCK_STAT)
#include <linux/lockdep.h>
#endif

#if defined(CONFIG_SYSCTL)

/* Constants used for minimum and maximum */

#ifdef CONFIG_PERF_EVENTS
static const int six_hundred_forty_kb = 640 * 1024;
#endif

/* this is needed for the proc_doulongvec_minmax of vm_dirty_bytes */
static const unsigned long dirty_bytes_min = 2 * PAGE_SIZE;

static const int ngroups_max = NGROUPS_MAX;
static const int cap_last_cap = CAP_LAST_CAP;

#ifdef CONFIG_PROC_SYSCTL

/**
 * enum sysctl_writes_mode - supported sysctl write modes
 *
 * @SYSCTL_WRITES_LEGACY: each write syscall must fully contain the sysctl value
 *	to be written, and multiple writes on the same sysctl file descriptor
 *	will rewrite the sysctl value, regardless of file position. No warning
 *	is issued when the initial position is not 0.
 * @SYSCTL_WRITES_WARN: same as above but warn when the initial file position is
 *	not 0.
119 * @SYSCTL_WRITES_STRICT: writes to numeric sysctl entries must always be at 120 * file position 0 and the value must be fully contained in the buffer 121 * sent to the write syscall. If dealing with strings respect the file 122 * position, but restrict this to the max length of the buffer, anything 123 * passed the max length will be ignored. Multiple writes will append 124 * to the buffer. 125 * 126 * These write modes control how current file position affects the behavior of 127 * updating sysctl values through the proc interface on each write. 128 */ 129 enum sysctl_writes_mode { 130 SYSCTL_WRITES_LEGACY = -1, 131 SYSCTL_WRITES_WARN = 0, 132 SYSCTL_WRITES_STRICT = 1, 133 }; 134 135 static enum sysctl_writes_mode sysctl_writes_strict = SYSCTL_WRITES_STRICT; 136 #endif /* CONFIG_PROC_SYSCTL */ 137 138 #if defined(HAVE_ARCH_PICK_MMAP_LAYOUT) || \ 139 defined(CONFIG_ARCH_WANT_DEFAULT_TOPDOWN_MMAP_LAYOUT) 140 int sysctl_legacy_va_layout; 141 #endif 142 143 #ifdef CONFIG_COMPACTION 144 /* min_extfrag_threshold is SYSCTL_ZERO */; 145 static const int max_extfrag_threshold = 1000; 146 #endif 147 148 #endif /* CONFIG_SYSCTL */ 149 150 /* 151 * /proc/sys support 152 */ 153 154 #ifdef CONFIG_PROC_SYSCTL 155 156 static int _proc_do_string(char *data, int maxlen, int write, 157 char *buffer, size_t *lenp, loff_t *ppos) 158 { 159 size_t len; 160 char c, *p; 161 162 if (!data || !maxlen || !*lenp) { 163 *lenp = 0; 164 return 0; 165 } 166 167 if (write) { 168 if (sysctl_writes_strict == SYSCTL_WRITES_STRICT) { 169 /* Only continue writes not past the end of buffer. */ 170 len = strlen(data); 171 if (len > maxlen - 1) 172 len = maxlen - 1; 173 174 if (*ppos > len) 175 return 0; 176 len = *ppos; 177 } else { 178 /* Start writing from beginning of buffer. 
*/ 179 len = 0; 180 } 181 182 *ppos += *lenp; 183 p = buffer; 184 while ((p - buffer) < *lenp && len < maxlen - 1) { 185 c = *(p++); 186 if (c == 0 || c == '\n') 187 break; 188 data[len++] = c; 189 } 190 data[len] = 0; 191 } else { 192 len = strlen(data); 193 if (len > maxlen) 194 len = maxlen; 195 196 if (*ppos > len) { 197 *lenp = 0; 198 return 0; 199 } 200 201 data += *ppos; 202 len -= *ppos; 203 204 if (len > *lenp) 205 len = *lenp; 206 if (len) 207 memcpy(buffer, data, len); 208 if (len < *lenp) { 209 buffer[len] = '\n'; 210 len++; 211 } 212 *lenp = len; 213 *ppos += len; 214 } 215 return 0; 216 } 217 218 static void warn_sysctl_write(struct ctl_table *table) 219 { 220 pr_warn_once("%s wrote to %s when file position was not 0!\n" 221 "This will not be supported in the future. To silence this\n" 222 "warning, set kernel.sysctl_writes_strict = -1\n", 223 current->comm, table->procname); 224 } 225 226 /** 227 * proc_first_pos_non_zero_ignore - check if first position is allowed 228 * @ppos: file position 229 * @table: the sysctl table 230 * 231 * Returns true if the first position is non-zero and the sysctl_writes_strict 232 * mode indicates this is not allowed for numeric input types. String proc 233 * handlers can ignore the return value. 234 */ 235 static bool proc_first_pos_non_zero_ignore(loff_t *ppos, 236 struct ctl_table *table) 237 { 238 if (!*ppos) 239 return false; 240 241 switch (sysctl_writes_strict) { 242 case SYSCTL_WRITES_STRICT: 243 return true; 244 case SYSCTL_WRITES_WARN: 245 warn_sysctl_write(table); 246 return false; 247 default: 248 return false; 249 } 250 } 251 252 /** 253 * proc_dostring - read a string sysctl 254 * @table: the sysctl table 255 * @write: %TRUE if this is a write to the sysctl file 256 * @buffer: the user buffer 257 * @lenp: the size of the user buffer 258 * @ppos: file position 259 * 260 * Reads/writes a string from/to the user buffer. 
If the kernel 261 * buffer provided is not large enough to hold the string, the 262 * string is truncated. The copied string is %NULL-terminated. 263 * If the string is being read by the user process, it is copied 264 * and a newline '\n' is added. It is truncated if the buffer is 265 * not large enough. 266 * 267 * Returns 0 on success. 268 */ 269 int proc_dostring(struct ctl_table *table, int write, 270 void *buffer, size_t *lenp, loff_t *ppos) 271 { 272 if (write) 273 proc_first_pos_non_zero_ignore(ppos, table); 274 275 return _proc_do_string(table->data, table->maxlen, write, buffer, lenp, 276 ppos); 277 } 278 279 static size_t proc_skip_spaces(char **buf) 280 { 281 size_t ret; 282 char *tmp = skip_spaces(*buf); 283 ret = tmp - *buf; 284 *buf = tmp; 285 return ret; 286 } 287 288 static void proc_skip_char(char **buf, size_t *size, const char v) 289 { 290 while (*size) { 291 if (**buf != v) 292 break; 293 (*size)--; 294 (*buf)++; 295 } 296 } 297 298 /** 299 * strtoul_lenient - parse an ASCII formatted integer from a buffer and only 300 * fail on overflow 301 * 302 * @cp: kernel buffer containing the string to parse 303 * @endp: pointer to store the trailing characters 304 * @base: the base to use 305 * @res: where the parsed integer will be stored 306 * 307 * In case of success 0 is returned and @res will contain the parsed integer, 308 * @endp will hold any trailing characters. 309 * This function will fail the parse on overflow. If there wasn't an overflow 310 * the function will defer the decision what characters count as invalid to the 311 * caller. 
312 */ 313 static int strtoul_lenient(const char *cp, char **endp, unsigned int base, 314 unsigned long *res) 315 { 316 unsigned long long result; 317 unsigned int rv; 318 319 cp = _parse_integer_fixup_radix(cp, &base); 320 rv = _parse_integer(cp, base, &result); 321 if ((rv & KSTRTOX_OVERFLOW) || (result != (unsigned long)result)) 322 return -ERANGE; 323 324 cp += rv; 325 326 if (endp) 327 *endp = (char *)cp; 328 329 *res = (unsigned long)result; 330 return 0; 331 } 332 333 #define TMPBUFLEN 22 334 /** 335 * proc_get_long - reads an ASCII formatted integer from a user buffer 336 * 337 * @buf: a kernel buffer 338 * @size: size of the kernel buffer 339 * @val: this is where the number will be stored 340 * @neg: set to %TRUE if number is negative 341 * @perm_tr: a vector which contains the allowed trailers 342 * @perm_tr_len: size of the perm_tr vector 343 * @tr: pointer to store the trailer character 344 * 345 * In case of success %0 is returned and @buf and @size are updated with 346 * the amount of bytes read. If @tr is non-NULL and a trailing 347 * character exists (size is non-zero after returning from this 348 * function), @tr is updated with the trailing character. 349 */ 350 static int proc_get_long(char **buf, size_t *size, 351 unsigned long *val, bool *neg, 352 const char *perm_tr, unsigned perm_tr_len, char *tr) 353 { 354 int len; 355 char *p, tmp[TMPBUFLEN]; 356 357 if (!*size) 358 return -EINVAL; 359 360 len = *size; 361 if (len > TMPBUFLEN - 1) 362 len = TMPBUFLEN - 1; 363 364 memcpy(tmp, *buf, len); 365 366 tmp[len] = 0; 367 p = tmp; 368 if (*p == '-' && *size > 1) { 369 *neg = true; 370 p++; 371 } else 372 *neg = false; 373 if (!isdigit(*p)) 374 return -EINVAL; 375 376 if (strtoul_lenient(p, &p, 0, val)) 377 return -EINVAL; 378 379 len = p - tmp; 380 381 /* We don't know if the next char is whitespace thus we may accept 382 * invalid integers (e.g. 1234...a) or two integers instead of one 383 * (e.g. 123...1). So lets not allow such large numbers. 
*/ 384 if (len == TMPBUFLEN - 1) 385 return -EINVAL; 386 387 if (len < *size && perm_tr_len && !memchr(perm_tr, *p, perm_tr_len)) 388 return -EINVAL; 389 390 if (tr && (len < *size)) 391 *tr = *p; 392 393 *buf += len; 394 *size -= len; 395 396 return 0; 397 } 398 399 /** 400 * proc_put_long - converts an integer to a decimal ASCII formatted string 401 * 402 * @buf: the user buffer 403 * @size: the size of the user buffer 404 * @val: the integer to be converted 405 * @neg: sign of the number, %TRUE for negative 406 * 407 * In case of success @buf and @size are updated with the amount of bytes 408 * written. 409 */ 410 static void proc_put_long(void **buf, size_t *size, unsigned long val, bool neg) 411 { 412 int len; 413 char tmp[TMPBUFLEN], *p = tmp; 414 415 sprintf(p, "%s%lu", neg ? "-" : "", val); 416 len = strlen(tmp); 417 if (len > *size) 418 len = *size; 419 memcpy(*buf, tmp, len); 420 *size -= len; 421 *buf += len; 422 } 423 #undef TMPBUFLEN 424 425 static void proc_put_char(void **buf, size_t *size, char c) 426 { 427 if (*size) { 428 char **buffer = (char **)buf; 429 **buffer = c; 430 431 (*size)--; 432 (*buffer)++; 433 *buf = *buffer; 434 } 435 } 436 437 static int do_proc_dobool_conv(bool *negp, unsigned long *lvalp, 438 int *valp, 439 int write, void *data) 440 { 441 if (write) { 442 *(bool *)valp = *lvalp; 443 } else { 444 int val = *(bool *)valp; 445 446 *lvalp = (unsigned long)val; 447 *negp = false; 448 } 449 return 0; 450 } 451 452 static int do_proc_dointvec_conv(bool *negp, unsigned long *lvalp, 453 int *valp, 454 int write, void *data) 455 { 456 if (write) { 457 if (*negp) { 458 if (*lvalp > (unsigned long) INT_MAX + 1) 459 return -EINVAL; 460 *valp = -*lvalp; 461 } else { 462 if (*lvalp > (unsigned long) INT_MAX) 463 return -EINVAL; 464 *valp = *lvalp; 465 } 466 } else { 467 int val = *valp; 468 if (val < 0) { 469 *negp = true; 470 *lvalp = -(unsigned long)val; 471 } else { 472 *negp = false; 473 *lvalp = (unsigned long)val; 474 } 475 } 476 return 
0; 477 } 478 479 static int do_proc_douintvec_conv(unsigned long *lvalp, 480 unsigned int *valp, 481 int write, void *data) 482 { 483 if (write) { 484 if (*lvalp > UINT_MAX) 485 return -EINVAL; 486 *valp = *lvalp; 487 } else { 488 unsigned int val = *valp; 489 *lvalp = (unsigned long)val; 490 } 491 return 0; 492 } 493 494 static const char proc_wspace_sep[] = { ' ', '\t', '\n' }; 495 496 static int __do_proc_dointvec(void *tbl_data, struct ctl_table *table, 497 int write, void *buffer, 498 size_t *lenp, loff_t *ppos, 499 int (*conv)(bool *negp, unsigned long *lvalp, int *valp, 500 int write, void *data), 501 void *data) 502 { 503 int *i, vleft, first = 1, err = 0; 504 size_t left; 505 char *p; 506 507 if (!tbl_data || !table->maxlen || !*lenp || (*ppos && !write)) { 508 *lenp = 0; 509 return 0; 510 } 511 512 i = (int *) tbl_data; 513 vleft = table->maxlen / sizeof(*i); 514 left = *lenp; 515 516 if (!conv) 517 conv = do_proc_dointvec_conv; 518 519 if (write) { 520 if (proc_first_pos_non_zero_ignore(ppos, table)) 521 goto out; 522 523 if (left > PAGE_SIZE - 1) 524 left = PAGE_SIZE - 1; 525 p = buffer; 526 } 527 528 for (; left && vleft--; i++, first=0) { 529 unsigned long lval; 530 bool neg; 531 532 if (write) { 533 left -= proc_skip_spaces(&p); 534 535 if (!left) 536 break; 537 err = proc_get_long(&p, &left, &lval, &neg, 538 proc_wspace_sep, 539 sizeof(proc_wspace_sep), NULL); 540 if (err) 541 break; 542 if (conv(&neg, &lval, i, 1, data)) { 543 err = -EINVAL; 544 break; 545 } 546 } else { 547 if (conv(&neg, &lval, i, 0, data)) { 548 err = -EINVAL; 549 break; 550 } 551 if (!first) 552 proc_put_char(&buffer, &left, '\t'); 553 proc_put_long(&buffer, &left, lval, neg); 554 } 555 } 556 557 if (!write && !first && left && !err) 558 proc_put_char(&buffer, &left, '\n'); 559 if (write && !err && left) 560 left -= proc_skip_spaces(&p); 561 if (write && first) 562 return err ? 
: -EINVAL; 563 *lenp -= left; 564 out: 565 *ppos += *lenp; 566 return err; 567 } 568 569 static int do_proc_dointvec(struct ctl_table *table, int write, 570 void *buffer, size_t *lenp, loff_t *ppos, 571 int (*conv)(bool *negp, unsigned long *lvalp, int *valp, 572 int write, void *data), 573 void *data) 574 { 575 return __do_proc_dointvec(table->data, table, write, 576 buffer, lenp, ppos, conv, data); 577 } 578 579 static int do_proc_douintvec_w(unsigned int *tbl_data, 580 struct ctl_table *table, 581 void *buffer, 582 size_t *lenp, loff_t *ppos, 583 int (*conv)(unsigned long *lvalp, 584 unsigned int *valp, 585 int write, void *data), 586 void *data) 587 { 588 unsigned long lval; 589 int err = 0; 590 size_t left; 591 bool neg; 592 char *p = buffer; 593 594 left = *lenp; 595 596 if (proc_first_pos_non_zero_ignore(ppos, table)) 597 goto bail_early; 598 599 if (left > PAGE_SIZE - 1) 600 left = PAGE_SIZE - 1; 601 602 left -= proc_skip_spaces(&p); 603 if (!left) { 604 err = -EINVAL; 605 goto out_free; 606 } 607 608 err = proc_get_long(&p, &left, &lval, &neg, 609 proc_wspace_sep, 610 sizeof(proc_wspace_sep), NULL); 611 if (err || neg) { 612 err = -EINVAL; 613 goto out_free; 614 } 615 616 if (conv(&lval, tbl_data, 1, data)) { 617 err = -EINVAL; 618 goto out_free; 619 } 620 621 if (!err && left) 622 left -= proc_skip_spaces(&p); 623 624 out_free: 625 if (err) 626 return -EINVAL; 627 628 return 0; 629 630 /* This is in keeping with old __do_proc_dointvec() */ 631 bail_early: 632 *ppos += *lenp; 633 return err; 634 } 635 636 static int do_proc_douintvec_r(unsigned int *tbl_data, void *buffer, 637 size_t *lenp, loff_t *ppos, 638 int (*conv)(unsigned long *lvalp, 639 unsigned int *valp, 640 int write, void *data), 641 void *data) 642 { 643 unsigned long lval; 644 int err = 0; 645 size_t left; 646 647 left = *lenp; 648 649 if (conv(&lval, tbl_data, 0, data)) { 650 err = -EINVAL; 651 goto out; 652 } 653 654 proc_put_long(&buffer, &left, lval, false); 655 if (!left) 656 goto out; 
657 658 proc_put_char(&buffer, &left, '\n'); 659 660 out: 661 *lenp -= left; 662 *ppos += *lenp; 663 664 return err; 665 } 666 667 static int __do_proc_douintvec(void *tbl_data, struct ctl_table *table, 668 int write, void *buffer, 669 size_t *lenp, loff_t *ppos, 670 int (*conv)(unsigned long *lvalp, 671 unsigned int *valp, 672 int write, void *data), 673 void *data) 674 { 675 unsigned int *i, vleft; 676 677 if (!tbl_data || !table->maxlen || !*lenp || (*ppos && !write)) { 678 *lenp = 0; 679 return 0; 680 } 681 682 i = (unsigned int *) tbl_data; 683 vleft = table->maxlen / sizeof(*i); 684 685 /* 686 * Arrays are not supported, keep this simple. *Do not* add 687 * support for them. 688 */ 689 if (vleft != 1) { 690 *lenp = 0; 691 return -EINVAL; 692 } 693 694 if (!conv) 695 conv = do_proc_douintvec_conv; 696 697 if (write) 698 return do_proc_douintvec_w(i, table, buffer, lenp, ppos, 699 conv, data); 700 return do_proc_douintvec_r(i, buffer, lenp, ppos, conv, data); 701 } 702 703 int do_proc_douintvec(struct ctl_table *table, int write, 704 void *buffer, size_t *lenp, loff_t *ppos, 705 int (*conv)(unsigned long *lvalp, 706 unsigned int *valp, 707 int write, void *data), 708 void *data) 709 { 710 return __do_proc_douintvec(table->data, table, write, 711 buffer, lenp, ppos, conv, data); 712 } 713 714 /** 715 * proc_dobool - read/write a bool 716 * @table: the sysctl table 717 * @write: %TRUE if this is a write to the sysctl file 718 * @buffer: the user buffer 719 * @lenp: the size of the user buffer 720 * @ppos: file position 721 * 722 * Reads/writes up to table->maxlen/sizeof(unsigned int) integer 723 * values from/to the user buffer, treated as an ASCII string. 724 * 725 * Returns 0 on success. 
726 */ 727 int proc_dobool(struct ctl_table *table, int write, void *buffer, 728 size_t *lenp, loff_t *ppos) 729 { 730 return do_proc_dointvec(table, write, buffer, lenp, ppos, 731 do_proc_dobool_conv, NULL); 732 } 733 734 /** 735 * proc_dointvec - read a vector of integers 736 * @table: the sysctl table 737 * @write: %TRUE if this is a write to the sysctl file 738 * @buffer: the user buffer 739 * @lenp: the size of the user buffer 740 * @ppos: file position 741 * 742 * Reads/writes up to table->maxlen/sizeof(unsigned int) integer 743 * values from/to the user buffer, treated as an ASCII string. 744 * 745 * Returns 0 on success. 746 */ 747 int proc_dointvec(struct ctl_table *table, int write, void *buffer, 748 size_t *lenp, loff_t *ppos) 749 { 750 return do_proc_dointvec(table, write, buffer, lenp, ppos, NULL, NULL); 751 } 752 753 #ifdef CONFIG_COMPACTION 754 static int proc_dointvec_minmax_warn_RT_change(struct ctl_table *table, 755 int write, void *buffer, size_t *lenp, loff_t *ppos) 756 { 757 int ret, old; 758 759 if (!IS_ENABLED(CONFIG_PREEMPT_RT) || !write) 760 return proc_dointvec_minmax(table, write, buffer, lenp, ppos); 761 762 old = *(int *)table->data; 763 ret = proc_dointvec_minmax(table, write, buffer, lenp, ppos); 764 if (ret) 765 return ret; 766 if (old != *(int *)table->data) 767 pr_warn_once("sysctl attribute %s changed by %s[%d]\n", 768 table->procname, current->comm, 769 task_pid_nr(current)); 770 return ret; 771 } 772 #endif 773 774 /** 775 * proc_douintvec - read a vector of unsigned integers 776 * @table: the sysctl table 777 * @write: %TRUE if this is a write to the sysctl file 778 * @buffer: the user buffer 779 * @lenp: the size of the user buffer 780 * @ppos: file position 781 * 782 * Reads/writes up to table->maxlen/sizeof(unsigned int) unsigned integer 783 * values from/to the user buffer, treated as an ASCII string. 784 * 785 * Returns 0 on success. 
786 */ 787 int proc_douintvec(struct ctl_table *table, int write, void *buffer, 788 size_t *lenp, loff_t *ppos) 789 { 790 return do_proc_douintvec(table, write, buffer, lenp, ppos, 791 do_proc_douintvec_conv, NULL); 792 } 793 794 /* 795 * Taint values can only be increased 796 * This means we can safely use a temporary. 797 */ 798 static int proc_taint(struct ctl_table *table, int write, 799 void *buffer, size_t *lenp, loff_t *ppos) 800 { 801 struct ctl_table t; 802 unsigned long tmptaint = get_taint(); 803 int err; 804 805 if (write && !capable(CAP_SYS_ADMIN)) 806 return -EPERM; 807 808 t = *table; 809 t.data = &tmptaint; 810 err = proc_doulongvec_minmax(&t, write, buffer, lenp, ppos); 811 if (err < 0) 812 return err; 813 814 if (write) { 815 int i; 816 817 /* 818 * If we are relying on panic_on_taint not producing 819 * false positives due to userspace input, bail out 820 * before setting the requested taint flags. 821 */ 822 if (panic_on_taint_nousertaint && (tmptaint & panic_on_taint)) 823 return -EINVAL; 824 825 /* 826 * Poor man's atomic or. Not worth adding a primitive 827 * to everyone's atomic.h for this 828 */ 829 for (i = 0; i < TAINT_FLAGS_COUNT; i++) 830 if ((1UL << i) & tmptaint) 831 add_taint(i, LOCKDEP_STILL_OK); 832 } 833 834 return err; 835 } 836 837 /** 838 * struct do_proc_dointvec_minmax_conv_param - proc_dointvec_minmax() range checking structure 839 * @min: pointer to minimum allowable value 840 * @max: pointer to maximum allowable value 841 * 842 * The do_proc_dointvec_minmax_conv_param structure provides the 843 * minimum and maximum values for doing range checking for those sysctl 844 * parameters that use the proc_dointvec_minmax() handler. 
845 */ 846 struct do_proc_dointvec_minmax_conv_param { 847 int *min; 848 int *max; 849 }; 850 851 static int do_proc_dointvec_minmax_conv(bool *negp, unsigned long *lvalp, 852 int *valp, 853 int write, void *data) 854 { 855 int tmp, ret; 856 struct do_proc_dointvec_minmax_conv_param *param = data; 857 /* 858 * If writing, first do so via a temporary local int so we can 859 * bounds-check it before touching *valp. 860 */ 861 int *ip = write ? &tmp : valp; 862 863 ret = do_proc_dointvec_conv(negp, lvalp, ip, write, data); 864 if (ret) 865 return ret; 866 867 if (write) { 868 if ((param->min && *param->min > tmp) || 869 (param->max && *param->max < tmp)) 870 return -EINVAL; 871 *valp = tmp; 872 } 873 874 return 0; 875 } 876 877 /** 878 * proc_dointvec_minmax - read a vector of integers with min/max values 879 * @table: the sysctl table 880 * @write: %TRUE if this is a write to the sysctl file 881 * @buffer: the user buffer 882 * @lenp: the size of the user buffer 883 * @ppos: file position 884 * 885 * Reads/writes up to table->maxlen/sizeof(unsigned int) integer 886 * values from/to the user buffer, treated as an ASCII string. 887 * 888 * This routine will ensure the values are within the range specified by 889 * table->extra1 (min) and table->extra2 (max). 890 * 891 * Returns 0 on success or -EINVAL on write when the range check fails. 
892 */ 893 int proc_dointvec_minmax(struct ctl_table *table, int write, 894 void *buffer, size_t *lenp, loff_t *ppos) 895 { 896 struct do_proc_dointvec_minmax_conv_param param = { 897 .min = (int *) table->extra1, 898 .max = (int *) table->extra2, 899 }; 900 return do_proc_dointvec(table, write, buffer, lenp, ppos, 901 do_proc_dointvec_minmax_conv, ¶m); 902 } 903 904 /** 905 * struct do_proc_douintvec_minmax_conv_param - proc_douintvec_minmax() range checking structure 906 * @min: pointer to minimum allowable value 907 * @max: pointer to maximum allowable value 908 * 909 * The do_proc_douintvec_minmax_conv_param structure provides the 910 * minimum and maximum values for doing range checking for those sysctl 911 * parameters that use the proc_douintvec_minmax() handler. 912 */ 913 struct do_proc_douintvec_minmax_conv_param { 914 unsigned int *min; 915 unsigned int *max; 916 }; 917 918 static int do_proc_douintvec_minmax_conv(unsigned long *lvalp, 919 unsigned int *valp, 920 int write, void *data) 921 { 922 int ret; 923 unsigned int tmp; 924 struct do_proc_douintvec_minmax_conv_param *param = data; 925 /* write via temporary local uint for bounds-checking */ 926 unsigned int *up = write ? &tmp : valp; 927 928 ret = do_proc_douintvec_conv(lvalp, up, write, data); 929 if (ret) 930 return ret; 931 932 if (write) { 933 if ((param->min && *param->min > tmp) || 934 (param->max && *param->max < tmp)) 935 return -ERANGE; 936 937 *valp = tmp; 938 } 939 940 return 0; 941 } 942 943 /** 944 * proc_douintvec_minmax - read a vector of unsigned ints with min/max values 945 * @table: the sysctl table 946 * @write: %TRUE if this is a write to the sysctl file 947 * @buffer: the user buffer 948 * @lenp: the size of the user buffer 949 * @ppos: file position 950 * 951 * Reads/writes up to table->maxlen/sizeof(unsigned int) unsigned integer 952 * values from/to the user buffer, treated as an ASCII string. Negative 953 * strings are not allowed. 
954 * 955 * This routine will ensure the values are within the range specified by 956 * table->extra1 (min) and table->extra2 (max). There is a final sanity 957 * check for UINT_MAX to avoid having to support wrap around uses from 958 * userspace. 959 * 960 * Returns 0 on success or -ERANGE on write when the range check fails. 961 */ 962 int proc_douintvec_minmax(struct ctl_table *table, int write, 963 void *buffer, size_t *lenp, loff_t *ppos) 964 { 965 struct do_proc_douintvec_minmax_conv_param param = { 966 .min = (unsigned int *) table->extra1, 967 .max = (unsigned int *) table->extra2, 968 }; 969 return do_proc_douintvec(table, write, buffer, lenp, ppos, 970 do_proc_douintvec_minmax_conv, ¶m); 971 } 972 973 /** 974 * proc_dou8vec_minmax - read a vector of unsigned chars with min/max values 975 * @table: the sysctl table 976 * @write: %TRUE if this is a write to the sysctl file 977 * @buffer: the user buffer 978 * @lenp: the size of the user buffer 979 * @ppos: file position 980 * 981 * Reads/writes up to table->maxlen/sizeof(u8) unsigned chars 982 * values from/to the user buffer, treated as an ASCII string. Negative 983 * strings are not allowed. 984 * 985 * This routine will ensure the values are within the range specified by 986 * table->extra1 (min) and table->extra2 (max). 987 * 988 * Returns 0 on success or an error on write when the range check fails. 989 */ 990 int proc_dou8vec_minmax(struct ctl_table *table, int write, 991 void *buffer, size_t *lenp, loff_t *ppos) 992 { 993 struct ctl_table tmp; 994 unsigned int min = 0, max = 255U, val; 995 u8 *data = table->data; 996 struct do_proc_douintvec_minmax_conv_param param = { 997 .min = &min, 998 .max = &max, 999 }; 1000 int res; 1001 1002 /* Do not support arrays yet. 
*/ 1003 if (table->maxlen != sizeof(u8)) 1004 return -EINVAL; 1005 1006 if (table->extra1) { 1007 min = *(unsigned int *) table->extra1; 1008 if (min > 255U) 1009 return -EINVAL; 1010 } 1011 if (table->extra2) { 1012 max = *(unsigned int *) table->extra2; 1013 if (max > 255U) 1014 return -EINVAL; 1015 } 1016 1017 tmp = *table; 1018 1019 tmp.maxlen = sizeof(val); 1020 tmp.data = &val; 1021 val = *data; 1022 res = do_proc_douintvec(&tmp, write, buffer, lenp, ppos, 1023 do_proc_douintvec_minmax_conv, ¶m); 1024 if (res) 1025 return res; 1026 if (write) 1027 *data = val; 1028 return 0; 1029 } 1030 EXPORT_SYMBOL_GPL(proc_dou8vec_minmax); 1031 1032 #ifdef CONFIG_MAGIC_SYSRQ 1033 static int sysrq_sysctl_handler(struct ctl_table *table, int write, 1034 void *buffer, size_t *lenp, loff_t *ppos) 1035 { 1036 int tmp, ret; 1037 1038 tmp = sysrq_mask(); 1039 1040 ret = __do_proc_dointvec(&tmp, table, write, buffer, 1041 lenp, ppos, NULL, NULL); 1042 if (ret || !write) 1043 return ret; 1044 1045 if (write) 1046 sysrq_toggle_support(tmp); 1047 1048 return 0; 1049 } 1050 #endif 1051 1052 static int __do_proc_doulongvec_minmax(void *data, struct ctl_table *table, 1053 int write, void *buffer, size_t *lenp, loff_t *ppos, 1054 unsigned long convmul, unsigned long convdiv) 1055 { 1056 unsigned long *i, *min, *max; 1057 int vleft, first = 1, err = 0; 1058 size_t left; 1059 char *p; 1060 1061 if (!data || !table->maxlen || !*lenp || (*ppos && !write)) { 1062 *lenp = 0; 1063 return 0; 1064 } 1065 1066 i = (unsigned long *) data; 1067 min = (unsigned long *) table->extra1; 1068 max = (unsigned long *) table->extra2; 1069 vleft = table->maxlen / sizeof(unsigned long); 1070 left = *lenp; 1071 1072 if (write) { 1073 if (proc_first_pos_non_zero_ignore(ppos, table)) 1074 goto out; 1075 1076 if (left > PAGE_SIZE - 1) 1077 left = PAGE_SIZE - 1; 1078 p = buffer; 1079 } 1080 1081 for (; left && vleft--; i++, first = 0) { 1082 unsigned long val; 1083 1084 if (write) { 1085 bool neg; 1086 1087 left 
-= proc_skip_spaces(&p); 1088 if (!left) 1089 break; 1090 1091 err = proc_get_long(&p, &left, &val, &neg, 1092 proc_wspace_sep, 1093 sizeof(proc_wspace_sep), NULL); 1094 if (err || neg) { 1095 err = -EINVAL; 1096 break; 1097 } 1098 1099 val = convmul * val / convdiv; 1100 if ((min && val < *min) || (max && val > *max)) { 1101 err = -EINVAL; 1102 break; 1103 } 1104 *i = val; 1105 } else { 1106 val = convdiv * (*i) / convmul; 1107 if (!first) 1108 proc_put_char(&buffer, &left, '\t'); 1109 proc_put_long(&buffer, &left, val, false); 1110 } 1111 } 1112 1113 if (!write && !first && left && !err) 1114 proc_put_char(&buffer, &left, '\n'); 1115 if (write && !err) 1116 left -= proc_skip_spaces(&p); 1117 if (write && first) 1118 return err ? : -EINVAL; 1119 *lenp -= left; 1120 out: 1121 *ppos += *lenp; 1122 return err; 1123 } 1124 1125 static int do_proc_doulongvec_minmax(struct ctl_table *table, int write, 1126 void *buffer, size_t *lenp, loff_t *ppos, unsigned long convmul, 1127 unsigned long convdiv) 1128 { 1129 return __do_proc_doulongvec_minmax(table->data, table, write, 1130 buffer, lenp, ppos, convmul, convdiv); 1131 } 1132 1133 /** 1134 * proc_doulongvec_minmax - read a vector of long integers with min/max values 1135 * @table: the sysctl table 1136 * @write: %TRUE if this is a write to the sysctl file 1137 * @buffer: the user buffer 1138 * @lenp: the size of the user buffer 1139 * @ppos: file position 1140 * 1141 * Reads/writes up to table->maxlen/sizeof(unsigned long) unsigned long 1142 * values from/to the user buffer, treated as an ASCII string. 1143 * 1144 * This routine will ensure the values are within the range specified by 1145 * table->extra1 (min) and table->extra2 (max). 1146 * 1147 * Returns 0 on success. 
1148 */ 1149 int proc_doulongvec_minmax(struct ctl_table *table, int write, 1150 void *buffer, size_t *lenp, loff_t *ppos) 1151 { 1152 return do_proc_doulongvec_minmax(table, write, buffer, lenp, ppos, 1l, 1l); 1153 } 1154 1155 /** 1156 * proc_doulongvec_ms_jiffies_minmax - read a vector of millisecond values with min/max values 1157 * @table: the sysctl table 1158 * @write: %TRUE if this is a write to the sysctl file 1159 * @buffer: the user buffer 1160 * @lenp: the size of the user buffer 1161 * @ppos: file position 1162 * 1163 * Reads/writes up to table->maxlen/sizeof(unsigned long) unsigned long 1164 * values from/to the user buffer, treated as an ASCII string. The values 1165 * are treated as milliseconds, and converted to jiffies when they are stored. 1166 * 1167 * This routine will ensure the values are within the range specified by 1168 * table->extra1 (min) and table->extra2 (max). 1169 * 1170 * Returns 0 on success. 1171 */ 1172 int proc_doulongvec_ms_jiffies_minmax(struct ctl_table *table, int write, 1173 void *buffer, size_t *lenp, loff_t *ppos) 1174 { 1175 return do_proc_doulongvec_minmax(table, write, buffer, 1176 lenp, ppos, HZ, 1000l); 1177 } 1178 1179 1180 static int do_proc_dointvec_jiffies_conv(bool *negp, unsigned long *lvalp, 1181 int *valp, 1182 int write, void *data) 1183 { 1184 if (write) { 1185 if (*lvalp > INT_MAX / HZ) 1186 return 1; 1187 *valp = *negp ? -(*lvalp*HZ) : (*lvalp*HZ); 1188 } else { 1189 int val = *valp; 1190 unsigned long lval; 1191 if (val < 0) { 1192 *negp = true; 1193 lval = -(unsigned long)val; 1194 } else { 1195 *negp = false; 1196 lval = (unsigned long)val; 1197 } 1198 *lvalp = lval / HZ; 1199 } 1200 return 0; 1201 } 1202 1203 static int do_proc_dointvec_userhz_jiffies_conv(bool *negp, unsigned long *lvalp, 1204 int *valp, 1205 int write, void *data) 1206 { 1207 if (write) { 1208 if (USER_HZ < HZ && *lvalp > (LONG_MAX / HZ) * USER_HZ) 1209 return 1; 1210 *valp = clock_t_to_jiffies(*negp ? 
-*lvalp : *lvalp); 1211 } else { 1212 int val = *valp; 1213 unsigned long lval; 1214 if (val < 0) { 1215 *negp = true; 1216 lval = -(unsigned long)val; 1217 } else { 1218 *negp = false; 1219 lval = (unsigned long)val; 1220 } 1221 *lvalp = jiffies_to_clock_t(lval); 1222 } 1223 return 0; 1224 } 1225 1226 static int do_proc_dointvec_ms_jiffies_conv(bool *negp, unsigned long *lvalp, 1227 int *valp, 1228 int write, void *data) 1229 { 1230 if (write) { 1231 unsigned long jif = msecs_to_jiffies(*negp ? -*lvalp : *lvalp); 1232 1233 if (jif > INT_MAX) 1234 return 1; 1235 *valp = (int)jif; 1236 } else { 1237 int val = *valp; 1238 unsigned long lval; 1239 if (val < 0) { 1240 *negp = true; 1241 lval = -(unsigned long)val; 1242 } else { 1243 *negp = false; 1244 lval = (unsigned long)val; 1245 } 1246 *lvalp = jiffies_to_msecs(lval); 1247 } 1248 return 0; 1249 } 1250 1251 /** 1252 * proc_dointvec_jiffies - read a vector of integers as seconds 1253 * @table: the sysctl table 1254 * @write: %TRUE if this is a write to the sysctl file 1255 * @buffer: the user buffer 1256 * @lenp: the size of the user buffer 1257 * @ppos: file position 1258 * 1259 * Reads/writes up to table->maxlen/sizeof(unsigned int) integer 1260 * values from/to the user buffer, treated as an ASCII string. 1261 * The values read are assumed to be in seconds, and are converted into 1262 * jiffies. 1263 * 1264 * Returns 0 on success. 
1265 */ 1266 int proc_dointvec_jiffies(struct ctl_table *table, int write, 1267 void *buffer, size_t *lenp, loff_t *ppos) 1268 { 1269 return do_proc_dointvec(table,write,buffer,lenp,ppos, 1270 do_proc_dointvec_jiffies_conv,NULL); 1271 } 1272 1273 /** 1274 * proc_dointvec_userhz_jiffies - read a vector of integers as 1/USER_HZ seconds 1275 * @table: the sysctl table 1276 * @write: %TRUE if this is a write to the sysctl file 1277 * @buffer: the user buffer 1278 * @lenp: the size of the user buffer 1279 * @ppos: pointer to the file position 1280 * 1281 * Reads/writes up to table->maxlen/sizeof(unsigned int) integer 1282 * values from/to the user buffer, treated as an ASCII string. 1283 * The values read are assumed to be in 1/USER_HZ seconds, and 1284 * are converted into jiffies. 1285 * 1286 * Returns 0 on success. 1287 */ 1288 int proc_dointvec_userhz_jiffies(struct ctl_table *table, int write, 1289 void *buffer, size_t *lenp, loff_t *ppos) 1290 { 1291 return do_proc_dointvec(table,write,buffer,lenp,ppos, 1292 do_proc_dointvec_userhz_jiffies_conv,NULL); 1293 } 1294 1295 /** 1296 * proc_dointvec_ms_jiffies - read a vector of integers as 1 milliseconds 1297 * @table: the sysctl table 1298 * @write: %TRUE if this is a write to the sysctl file 1299 * @buffer: the user buffer 1300 * @lenp: the size of the user buffer 1301 * @ppos: file position 1302 * @ppos: the current position in the file 1303 * 1304 * Reads/writes up to table->maxlen/sizeof(unsigned int) integer 1305 * values from/to the user buffer, treated as an ASCII string. 1306 * The values read are assumed to be in 1/1000 seconds, and 1307 * are converted into jiffies. 1308 * 1309 * Returns 0 on success. 
1310 */ 1311 int proc_dointvec_ms_jiffies(struct ctl_table *table, int write, void *buffer, 1312 size_t *lenp, loff_t *ppos) 1313 { 1314 return do_proc_dointvec(table, write, buffer, lenp, ppos, 1315 do_proc_dointvec_ms_jiffies_conv, NULL); 1316 } 1317 1318 static int proc_do_cad_pid(struct ctl_table *table, int write, void *buffer, 1319 size_t *lenp, loff_t *ppos) 1320 { 1321 struct pid *new_pid; 1322 pid_t tmp; 1323 int r; 1324 1325 tmp = pid_vnr(cad_pid); 1326 1327 r = __do_proc_dointvec(&tmp, table, write, buffer, 1328 lenp, ppos, NULL, NULL); 1329 if (r || !write) 1330 return r; 1331 1332 new_pid = find_get_pid(tmp); 1333 if (!new_pid) 1334 return -ESRCH; 1335 1336 put_pid(xchg(&cad_pid, new_pid)); 1337 return 0; 1338 } 1339 1340 /** 1341 * proc_do_large_bitmap - read/write from/to a large bitmap 1342 * @table: the sysctl table 1343 * @write: %TRUE if this is a write to the sysctl file 1344 * @buffer: the user buffer 1345 * @lenp: the size of the user buffer 1346 * @ppos: file position 1347 * 1348 * The bitmap is stored at table->data and the bitmap length (in bits) 1349 * in table->maxlen. 1350 * 1351 * We use a range comma separated format (e.g. 1,3-4,10-10) so that 1352 * large bitmaps may be represented in a compact manner. Writing into 1353 * the file will clear the bitmap then update it with the given input. 1354 * 1355 * Returns 0 on success. 
 */
int proc_do_large_bitmap(struct ctl_table *table, int write,
			 void *buffer, size_t *lenp, loff_t *ppos)
{
	int err = 0;
	size_t left = *lenp;
	unsigned long bitmap_len = table->maxlen;
	/* table->data holds a pointer to the bitmap pointer, hence the extra deref */
	unsigned long *bitmap = *(unsigned long **) table->data;
	unsigned long *tmp_bitmap = NULL;
	/*
	 * tr_a is handed to proc_get_long() for the first number of an item,
	 * tr_b for the second number of an "a-b" range; c receives a character
	 * back from proc_get_long() and is compared against '-' below.
	 * NOTE(review): presumably these are the permitted trailing characters
	 * and c is the terminator actually seen - confirm against proc_get_long().
	 */
	char tr_a[] = { '-', ',', '\n' }, tr_b[] = { ',', '\n', 0 }, c;

	/*
	 * Nothing to transfer: no bitmap, zero-length bitmap, empty buffer, or
	 * a read that does not start at file position 0.
	 */
	if (!bitmap || !bitmap_len || !left || (*ppos && !write)) {
		*lenp = 0;
		return 0;
	}

	if (write) {
		char *p = buffer;
		size_t skipped = 0;

		/* Parse at most PAGE_SIZE - 1 bytes in one call */
		if (left > PAGE_SIZE - 1) {
			left = PAGE_SIZE - 1;
			/* How much of the buffer we'll skip this pass */
			skipped = *lenp - left;
		}

		/* Build the result in a scratch bitmap; it is merged in only if parsing succeeds */
		tmp_bitmap = bitmap_zalloc(bitmap_len, GFP_KERNEL);
		if (!tmp_bitmap)
			return -ENOMEM;
		proc_skip_char(&p, &left, '\n');
		while (!err && left) {
			unsigned long val_a, val_b;
			bool neg;
			size_t saved_left;

			/* In case we stop parsing mid-number, we can reset */
			saved_left = left;
			err = proc_get_long(&p, &left, &val_a, &neg, tr_a,
					     sizeof(tr_a), &c);
			/*
			 * If we consumed the entirety of a truncated buffer or
			 * only one char is left (may be a "-"), then stop here,
			 * reset, & come back for more.
			 */
			if ((left <= 1) && skipped) {
				left = saved_left;
				break;
			}

			if (err)
				break;
			/* Bit numbers must be non-negative and inside the bitmap */
			if (val_a >= bitmap_len || neg) {
				err = -EINVAL;
				break;
			}

			/* A lone number is treated as the range val_a-val_a */
			val_b = val_a;
			if (left) {
				p++;
				left--;
			}

			if (c == '-') {
				err = proc_get_long(&p, &left, &val_b,
						     &neg, tr_b, sizeof(tr_b),
						     &c);
				/*
				 * If we consumed all of a truncated buffer,
				 * then stop here, reset, & come back for more.
				 */
				if (!left && skipped) {
					left = saved_left;
					break;
				}

				if (err)
					break;
				/* Range end must be in bounds and not below its start */
				if (val_b >= bitmap_len || neg ||
				    val_a > val_b) {
					err = -EINVAL;
					break;
				}
				if (left) {
					p++;
					left--;
				}
			}

			bitmap_set(tmp_bitmap, val_a, val_b - val_a + 1);
			proc_skip_char(&p, &left, '\n');
		}
		/* Count the bytes beyond the PAGE_SIZE - 1 cap as not consumed */
		left += skipped;
	} else {
		unsigned long bit_a, bit_b = 0;
		bool first = 1;

		/*
		 * Emit each run of set bits as "a" or "a-b", separated by
		 * commas, for as long as there is room in the buffer.
		 */
		while (left) {
			bit_a = find_next_bit(bitmap, bitmap_len, bit_b);
			if (bit_a >= bitmap_len)
				break;
			/* Last set bit of the run that starts at bit_a */
			bit_b = find_next_zero_bit(bitmap, bitmap_len,
						   bit_a + 1) - 1;

			if (!first)
				proc_put_char(&buffer, &left, ',');
			proc_put_long(&buffer, &left, bit_a, false);
			if (bit_a != bit_b) {
				proc_put_char(&buffer, &left, '-');
				proc_put_long(&buffer, &left, bit_b, false);
			}

			first = 0; bit_b++;
		}
		proc_put_char(&buffer, &left, '\n');
	}

	if (!err) {
		if (write) {
			/*
			 * A write at a non-zero position is OR-ed into the
			 * existing bitmap; a write at position 0 replaces it.
			 */
			if (*ppos)
				bitmap_or(bitmap, bitmap, tmp_bitmap, bitmap_len);
			else
				bitmap_copy(bitmap, tmp_bitmap, bitmap_len);
		}
		/* Report the bytes actually handled and advance the file position */
		*lenp -= left;
		*ppos += *lenp;
	}

	/* tmp_bitmap is still NULL on the read path */
	bitmap_free(tmp_bitmap);
	return err;
}

#else /* CONFIG_PROC_SYSCTL */

/*
 * Without CONFIG_PROC_SYSCTL the handlers below are stubs that accept the
 * usual handler arguments and simply return -ENOSYS.
 */

int proc_dostring(struct ctl_table *table, int write,
		  void *buffer, size_t *lenp, loff_t *ppos)
{
	return -ENOSYS;
}

int proc_dobool(struct ctl_table *table, int write,
		void *buffer, size_t *lenp, loff_t *ppos)
{
	return -ENOSYS;
}

int proc_dointvec(struct ctl_table *table, int write,
		  void *buffer, size_t *lenp, loff_t *ppos)
{
	return -ENOSYS;
}

int proc_douintvec(struct ctl_table *table, int write,
		  void *buffer, size_t *lenp, loff_t *ppos)
{
	return -ENOSYS;
}

int proc_dointvec_minmax(struct ctl_table *table, int write,
		    void *buffer, size_t *lenp,
loff_t *ppos) 1515 { 1516 return -ENOSYS; 1517 } 1518 1519 int proc_douintvec_minmax(struct ctl_table *table, int write, 1520 void *buffer, size_t *lenp, loff_t *ppos) 1521 { 1522 return -ENOSYS; 1523 } 1524 1525 int proc_dou8vec_minmax(struct ctl_table *table, int write, 1526 void *buffer, size_t *lenp, loff_t *ppos) 1527 { 1528 return -ENOSYS; 1529 } 1530 1531 int proc_dointvec_jiffies(struct ctl_table *table, int write, 1532 void *buffer, size_t *lenp, loff_t *ppos) 1533 { 1534 return -ENOSYS; 1535 } 1536 1537 int proc_dointvec_userhz_jiffies(struct ctl_table *table, int write, 1538 void *buffer, size_t *lenp, loff_t *ppos) 1539 { 1540 return -ENOSYS; 1541 } 1542 1543 int proc_dointvec_ms_jiffies(struct ctl_table *table, int write, 1544 void *buffer, size_t *lenp, loff_t *ppos) 1545 { 1546 return -ENOSYS; 1547 } 1548 1549 int proc_doulongvec_minmax(struct ctl_table *table, int write, 1550 void *buffer, size_t *lenp, loff_t *ppos) 1551 { 1552 return -ENOSYS; 1553 } 1554 1555 int proc_doulongvec_ms_jiffies_minmax(struct ctl_table *table, int write, 1556 void *buffer, size_t *lenp, loff_t *ppos) 1557 { 1558 return -ENOSYS; 1559 } 1560 1561 int proc_do_large_bitmap(struct ctl_table *table, int write, 1562 void *buffer, size_t *lenp, loff_t *ppos) 1563 { 1564 return -ENOSYS; 1565 } 1566 1567 #endif /* CONFIG_PROC_SYSCTL */ 1568 1569 #if defined(CONFIG_SYSCTL) 1570 int proc_do_static_key(struct ctl_table *table, int write, 1571 void *buffer, size_t *lenp, loff_t *ppos) 1572 { 1573 struct static_key *key = (struct static_key *)table->data; 1574 static DEFINE_MUTEX(static_key_mutex); 1575 int val, ret; 1576 struct ctl_table tmp = { 1577 .data = &val, 1578 .maxlen = sizeof(val), 1579 .mode = table->mode, 1580 .extra1 = SYSCTL_ZERO, 1581 .extra2 = SYSCTL_ONE, 1582 }; 1583 1584 if (write && !capable(CAP_SYS_ADMIN)) 1585 return -EPERM; 1586 1587 mutex_lock(&static_key_mutex); 1588 val = static_key_enabled(key); 1589 ret = proc_dointvec_minmax(&tmp, write, buffer, lenp, 
ppos); 1590 if (write && !ret) { 1591 if (val) 1592 static_key_enable(key); 1593 else 1594 static_key_disable(key); 1595 } 1596 mutex_unlock(&static_key_mutex); 1597 return ret; 1598 } 1599 1600 static struct ctl_table kern_table[] = { 1601 { 1602 .procname = "sched_child_runs_first", 1603 .data = &sysctl_sched_child_runs_first, 1604 .maxlen = sizeof(unsigned int), 1605 .mode = 0644, 1606 .proc_handler = proc_dointvec, 1607 }, 1608 #ifdef CONFIG_SCHEDSTATS 1609 { 1610 .procname = "sched_schedstats", 1611 .data = NULL, 1612 .maxlen = sizeof(unsigned int), 1613 .mode = 0644, 1614 .proc_handler = sysctl_schedstats, 1615 .extra1 = SYSCTL_ZERO, 1616 .extra2 = SYSCTL_ONE, 1617 }, 1618 #endif /* CONFIG_SCHEDSTATS */ 1619 #ifdef CONFIG_TASK_DELAY_ACCT 1620 { 1621 .procname = "task_delayacct", 1622 .data = NULL, 1623 .maxlen = sizeof(unsigned int), 1624 .mode = 0644, 1625 .proc_handler = sysctl_delayacct, 1626 .extra1 = SYSCTL_ZERO, 1627 .extra2 = SYSCTL_ONE, 1628 }, 1629 #endif /* CONFIG_TASK_DELAY_ACCT */ 1630 #ifdef CONFIG_NUMA_BALANCING 1631 { 1632 .procname = "numa_balancing", 1633 .data = NULL, /* filled in by handler */ 1634 .maxlen = sizeof(unsigned int), 1635 .mode = 0644, 1636 .proc_handler = sysctl_numa_balancing, 1637 .extra1 = SYSCTL_ZERO, 1638 .extra2 = SYSCTL_FOUR, 1639 }, 1640 #endif /* CONFIG_NUMA_BALANCING */ 1641 { 1642 .procname = "sched_rt_period_us", 1643 .data = &sysctl_sched_rt_period, 1644 .maxlen = sizeof(unsigned int), 1645 .mode = 0644, 1646 .proc_handler = sched_rt_handler, 1647 }, 1648 { 1649 .procname = "sched_rt_runtime_us", 1650 .data = &sysctl_sched_rt_runtime, 1651 .maxlen = sizeof(int), 1652 .mode = 0644, 1653 .proc_handler = sched_rt_handler, 1654 }, 1655 { 1656 .procname = "sched_deadline_period_max_us", 1657 .data = &sysctl_sched_dl_period_max, 1658 .maxlen = sizeof(unsigned int), 1659 .mode = 0644, 1660 .proc_handler = proc_dointvec, 1661 }, 1662 { 1663 .procname = "sched_deadline_period_min_us", 1664 .data = 
&sysctl_sched_dl_period_min,
		.maxlen		= sizeof(unsigned int),
		.mode		= 0644,
		.proc_handler	= proc_dointvec,
	},
	{
		.procname	= "sched_rr_timeslice_ms",
		.data		= &sysctl_sched_rr_timeslice,
		.maxlen		= sizeof(int),
		.mode		= 0644,
		.proc_handler	= sched_rr_handler,
	},
#ifdef CONFIG_UCLAMP_TASK
	{
		.procname	= "sched_util_clamp_min",
		.data		= &sysctl_sched_uclamp_util_min,
		.maxlen		= sizeof(unsigned int),
		.mode		= 0644,
		.proc_handler	= sysctl_sched_uclamp_handler,
	},
	{
		.procname	= "sched_util_clamp_max",
		.data		= &sysctl_sched_uclamp_util_max,
		.maxlen		= sizeof(unsigned int),
		.mode		= 0644,
		.proc_handler	= sysctl_sched_uclamp_handler,
	},
	{
		.procname	= "sched_util_clamp_min_rt_default",
		.data		= &sysctl_sched_uclamp_util_min_rt_default,
		.maxlen		= sizeof(unsigned int),
		.mode		= 0644,
		.proc_handler	= sysctl_sched_uclamp_handler,
	},
#endif
#ifdef CONFIG_CFS_BANDWIDTH
	{
		.procname	= "sched_cfs_bandwidth_slice_us",
		.data		= &sysctl_sched_cfs_bandwidth_slice,
		.maxlen		= sizeof(unsigned int),
		.mode		= 0644,
		.proc_handler	= proc_dointvec_minmax,
		/* lower bound only: no .extra2 is set */
		.extra1		= SYSCTL_ONE,
	},
#endif
#if defined(CONFIG_ENERGY_MODEL) && defined(CONFIG_CPU_FREQ_GOV_SCHEDUTIL)
	{
		.procname	= "sched_energy_aware",
		.data		= &sysctl_sched_energy_aware,
		.maxlen		= sizeof(unsigned int),
		.mode		= 0644,
		.proc_handler	= sched_energy_aware_handler,
		.extra1		= SYSCTL_ZERO,
		.extra2		= SYSCTL_ONE,
	},
#endif
#ifdef CONFIG_PROVE_LOCKING
	{
		.procname	= "prove_locking",
		.data		= &prove_locking,
		.maxlen		= sizeof(int),
		.mode		= 0644,
		.proc_handler	= proc_dointvec,
	},
#endif
#ifdef CONFIG_LOCK_STAT
	{
		.procname	= "lock_stat",
		.data		= &lock_stat,
		.maxlen		= sizeof(int),
		.mode		= 0644,
		.proc_handler	= proc_dointvec,
	},
#endif
	{
		.procname	= "panic",
		.data		= &panic_timeout,
		.maxlen		= sizeof(int),
		.mode		= 0644,
		.proc_handler	= proc_dointvec,
	},
#ifdef CONFIG_PROC_SYSCTL
	{
		/* no .data is set for this entry */
		.procname	= "tainted",
		.maxlen 	= sizeof(long),
		.mode		= 0644,
		.proc_handler	= proc_taint,
	},
	{
		.procname	= "sysctl_writes_strict",
		.data		= &sysctl_writes_strict,
		.maxlen		= sizeof(int),
		.mode		= 0644,
		.proc_handler	= proc_dointvec_minmax,
		.extra1		= SYSCTL_NEG_ONE,
		.extra2		= SYSCTL_ONE,
	},
#endif
#ifdef CONFIG_LATENCYTOP
	{
		.procname	= "latencytop",
		.data		= &latencytop_enabled,
		.maxlen		= sizeof(int),
		.mode		= 0644,
		.proc_handler	= sysctl_latencytop,
	},
#endif
#ifdef CONFIG_BLK_DEV_INITRD
	{
		.procname	= "real-root-dev",
		.data		= &real_root_dev,
		.maxlen		= sizeof(int),
		.mode		= 0644,
		.proc_handler	= proc_dointvec,
	},
#endif
	{
		.procname	= "print-fatal-signals",
		.data		= &print_fatal_signals,
		.maxlen		= sizeof(int),
		.mode		= 0644,
		.proc_handler	= proc_dointvec,
	},
#ifdef CONFIG_SPARC
	{
		/* string entry: .data is the buffer itself, .maxlen a fixed 256 */
		.procname	= "reboot-cmd",
		.data		= reboot_command,
		.maxlen		= 256,
		.mode		= 0644,
		.proc_handler	= proc_dostring,
	},
	{
		.procname	= "stop-a",
		.data		= &stop_a_enabled,
		.maxlen		= sizeof (int),
		.mode		= 0644,
		.proc_handler	= proc_dointvec,
	},
	{
		.procname	= "scons-poweroff",
		.data		= &scons_pwroff,
		.maxlen		= sizeof (int),
		.mode		= 0644,
		.proc_handler	= proc_dointvec,
	},
#endif
#ifdef CONFIG_SPARC64
	{
		.procname	= "tsb-ratio",
		.data		= &sysctl_tsb_ratio,
		.maxlen		= sizeof (int),
		.mode		= 0644,
		.proc_handler	= proc_dointvec,
	},
#endif
#ifdef CONFIG_PARISC
	{
		.procname	= "soft-power",
		.data		= &pwrsw_enabled,
		.maxlen		= sizeof (int),
		.mode		= 0644,
		.proc_handler	= proc_dointvec,
	},
#endif
#ifdef CONFIG_SYSCTL_ARCH_UNALIGN_ALLOW
	{
		.procname	= "unaligned-trap",
		.data		= &unaligned_enabled,
		.maxlen		= sizeof (int),
		.mode		= 0644,
		.proc_handler	= proc_dointvec,
	},
#endif
	{
		.procname	= "ctrl-alt-del",
		.data		= &C_A_D,
		.maxlen		= sizeof(int),
		.mode		= 0644,
		.proc_handler	= proc_dointvec,
	},
#ifdef CONFIG_FUNCTION_TRACER
	{
		.procname	= "ftrace_enabled",
		.data		= &ftrace_enabled,
		.maxlen		= sizeof(int),
		.mode		= 0644,
		.proc_handler	= ftrace_enable_sysctl,
	},
#endif
#ifdef CONFIG_STACK_TRACER
	{
		.procname	= "stack_tracer_enabled",
		.data		= &stack_tracer_enabled,
		.maxlen		= sizeof(int),
		.mode		= 0644,
		.proc_handler	= stack_trace_sysctl,
	},
#endif
#ifdef CONFIG_TRACING
	{
		.procname	= "ftrace_dump_on_oops",
		.data		= &ftrace_dump_on_oops,
		.maxlen		= sizeof(int),
		.mode		= 0644,
		.proc_handler	= proc_dointvec,
	},
	{
		.procname	= "traceoff_on_warning",
		.data		= &__disable_trace_on_warning,
		.maxlen		= sizeof(__disable_trace_on_warning),
		.mode		= 0644,
		.proc_handler	= proc_dointvec,
	},
	{
		.procname	= "tracepoint_printk",
		.data		= &tracepoint_printk,
		.maxlen		= sizeof(tracepoint_printk),
		.mode		= 0644,
		.proc_handler	= tracepoint_printk_sysctl,
	},
#endif
#ifdef CONFIG_KEXEC_CORE
	{
		.procname	= "kexec_load_disabled",
		.data		= &kexec_load_disabled,
		.maxlen		= sizeof(int),
		.mode		= 0644,
		/* only handle a transition from default "0" to "1" */
		.proc_handler	= proc_dointvec_minmax,
		/* min and max are both SYSCTL_ONE */
		.extra1		= SYSCTL_ONE,
		.extra2		= SYSCTL_ONE,
	},
#endif
#ifdef CONFIG_MODULES
	{
		.procname	= "modprobe",
		.data		= &modprobe_path,
		.maxlen		= KMOD_PATH_LEN,
		.mode		= 0644,
		.proc_handler	= proc_dostring,
	},
	{
		.procname	= "modules_disabled",
		.data		= &modules_disabled,
		.maxlen		= sizeof(int),
		.mode		= 0644,
		/* only handle a transition from default "0" to "1" */
		.proc_handler	= proc_dointvec_minmax,
		/* min and max are both SYSCTL_ONE */
		.extra1		= SYSCTL_ONE,
		.extra2		= SYSCTL_ONE,
	},
#endif
#ifdef CONFIG_UEVENT_HELPER
	{
		.procname	= "hotplug",
		.data		= &uevent_helper,
		.maxlen		= UEVENT_HELPER_PATH_LEN,
		.mode		= 0644,
		.proc_handler	= proc_dostring,
	},
#endif
#ifdef CONFIG_BSD_PROCESS_ACCT
	{
		/* vector entry: room for three ints */
		.procname	= "acct",
		.data		= &acct_parm,
		.maxlen		= 3*sizeof(int),
		.mode		= 0644,
		.proc_handler	= proc_dointvec,
	},
#endif
#ifdef CONFIG_MAGIC_SYSRQ
	{
		.procname	= "sysrq",
		.data		= NULL,
		.maxlen		= sizeof (int),
		.mode		= 0644,
		.proc_handler	= sysrq_sysctl_handler,
	},
#endif
#ifdef CONFIG_PROC_SYSCTL
	{
		/*
		 * proc_do_cad_pid() works on cad_pid directly, so .data
		 * stays NULL; mode 0600 limits access to the owner.
		 */
		.procname	= "cad_pid",
		.data		= NULL,
		.maxlen		= sizeof (int),
		.mode		= 0600,
		.proc_handler	= proc_do_cad_pid,
	},
#endif
	{
		.procname	= "threads-max",
		.data		= NULL,
		.maxlen		= sizeof(int),
		.mode		= 0644,
		.proc_handler	= sysctl_max_threads,
	},
	{
		/* no handler: this entry only links a sub-table through .child */
		.procname	= "usermodehelper",
		.mode		= 0555,
		.child		= usermodehelper_table,
	},
	{
		.procname	= "overflowuid",
		.data		= &overflowuid,
		.maxlen		= sizeof(int),
		.mode		= 0644,
		.proc_handler	= proc_dointvec_minmax,
		.extra1		= SYSCTL_ZERO,
		.extra2		= SYSCTL_MAXOLDUID,
	},
	{
		.procname	= "overflowgid",
		.data		= &overflowgid,
		.maxlen		= sizeof(int),
		.mode		= 0644,
		.proc_handler	= proc_dointvec_minmax,
		.extra1		= SYSCTL_ZERO,
		.extra2		= SYSCTL_MAXOLDUID,
	},
#ifdef CONFIG_S390
	{
		.procname	= "userprocess_debug",
		.data		= &show_unhandled_signals,
		.maxlen		= sizeof(int),
		.mode		= 0644,
		.proc_handler	= proc_dointvec,
	},
#endif
#ifdef CONFIG_SMP
	{
		.procname	= "oops_all_cpu_backtrace",
		.data		= &sysctl_oops_all_cpu_backtrace,
		.maxlen		= sizeof(int),
		.mode		= 0644,
		.proc_handler	= proc_dointvec_minmax,
		.extra1		= SYSCTL_ZERO,
		.extra2		= SYSCTL_ONE,
	},
#endif /* CONFIG_SMP */
	{
		.procname	= "pid_max",
		.data		= &pid_max,
		.maxlen		= sizeof (int),
		.mode		= 0644,
		.proc_handler	= proc_dointvec_minmax,
		.extra1		= &pid_max_min,
		.extra2		= &pid_max_max,
	},
	{
		.procname	= "panic_on_oops",
		.data		= &panic_on_oops,
		.maxlen		= sizeof(int),
		.mode		= 0644,
		.proc_handler	= proc_dointvec,
	},
	{
		.procname	= "panic_print",
		.data		= &panic_print,
		.maxlen		= sizeof(unsigned long),
		.mode		= 0644,
		.proc_handler	= proc_doulongvec_minmax,
	},
	{
		/*
		 * Mode 0444 (no write bits); ngroups_max is a static const
		 * int, so the cast drops const to fit the .data field.
		 */
		.procname	= "ngroups_max",
		.data		= (void *)&ngroups_max,
		.maxlen		= sizeof (int),
		.mode		= 0444,
		.proc_handler	= proc_dointvec,
	},
	{
		/* Mode 0444; same const-dropping cast as ngroups_max */
		.procname	= "cap_last_cap",
		.data		= (void *)&cap_last_cap,
		.maxlen		= sizeof(int),
		.mode		= 0444,
		.proc_handler	= proc_dointvec,
	},
#if defined(CONFIG_X86_LOCAL_APIC) && defined(CONFIG_X86)
	{
		.procname       = "unknown_nmi_panic",
		.data           = &unknown_nmi_panic,
		.maxlen         = sizeof (int),
		.mode           = 0644,
		.proc_handler   = proc_dointvec,
	},
#endif

#if (defined(CONFIG_X86_32) || defined(CONFIG_PARISC)) && \
	defined(CONFIG_DEBUG_STACKOVERFLOW)
	{
		.procname	= "panic_on_stackoverflow",
		.data		= &sysctl_panic_on_stackoverflow,
		.maxlen		= sizeof(int),
		.mode		= 0644,
		.proc_handler	= proc_dointvec,
	},
#endif
#if defined(CONFIG_X86)
	{
		.procname	= "panic_on_unrecovered_nmi",
		.data		= &panic_on_unrecovered_nmi,
		.maxlen		= sizeof(int),
		.mode		= 0644,
		.proc_handler	= proc_dointvec,
	},
	{
		.procname	= "panic_on_io_nmi",
		.data		= &panic_on_io_nmi,
		.maxlen		= sizeof(int),
		.mode		= 0644,
		.proc_handler	= proc_dointvec,
	},
	{
		.procname	= "bootloader_type",
		.data		= &bootloader_type,
		.maxlen		= sizeof (int),
		.mode		= 0444,
		.proc_handler	= proc_dointvec,
	},
	{
		.procname	= "bootloader_version",
		.data		= &bootloader_version,
		.maxlen		= sizeof (int),
		.mode		= 0444,
		.proc_handler	= proc_dointvec,
	},
	{
		.procname	= "io_delay_type",
		.data		= &io_delay_type,
		.maxlen		= sizeof(int),
		.mode		= 0644,
		.proc_handler	= proc_dointvec,
	},
#endif
#if defined(CONFIG_MMU)
	{
		.procname	= "randomize_va_space",
		.data		= &randomize_va_space,
		.maxlen		= sizeof(int),
		.mode		= 0644,
		.proc_handler	= proc_dointvec,
	},
#endif
#if defined(CONFIG_S390) && defined(CONFIG_SMP)
	{
		.procname	= "spin_retry",
		.data		= &spin_retry,
		.maxlen		= sizeof (int),
		.mode		= 0644,
		.proc_handler	= proc_dointvec,
	},
#endif
#if	defined(CONFIG_ACPI_SLEEP) && defined(CONFIG_X86)
	{
		.procname	= "acpi_video_flags",
		.data		= &acpi_realmode_flags,
		.maxlen		= sizeof (unsigned long),
		.mode		= 0644,
		.proc_handler	= proc_doulongvec_minmax,
	},
#endif
#ifdef CONFIG_SYSCTL_ARCH_UNALIGN_NO_WARN
	{
		.procname	= "ignore-unaligned-usertrap",
		.data		= &no_unaligned_warning,
		.maxlen		= sizeof (int),
		.mode		= 0644,
		.proc_handler	= proc_dointvec,
	},
#endif
#ifdef CONFIG_IA64
	{
		.procname	= "unaligned-dump-stack",
		.data		= &unaligned_dump_stack,
		.maxlen		= sizeof (int),
		.mode		= 0644,
		.proc_handler	= proc_dointvec,
	},
#endif
#ifdef CONFIG_RT_MUTEXES
	{
		.procname	= "max_lock_depth",
		.data		= &max_lock_depth,
		.maxlen		= sizeof(int),
		.mode		= 0644,
		.proc_handler	= proc_dointvec,
	},
#endif
	{
		.procname	= "poweroff_cmd",
		.data		= &poweroff_cmd,
		.maxlen		= POWEROFF_CMD_PATH_LEN,
		.mode		= 0644,
		.proc_handler	= proc_dostring,
	},
#ifdef CONFIG_KEYS
	{
		/* no handler: this entry only links a sub-table through .child */
		.procname	= "keys",
		.mode		= 0555,
		.child		= key_sysctls,
	},
#endif
#ifdef CONFIG_PERF_EVENTS
	/*
	 * User-space scripts rely on the existence of this file
	 * as a feature check for perf_events being enabled.
	 *
	 * So it's an ABI, do not remove!
	 */
	{
		.procname	= "perf_event_paranoid",
		.data		= &sysctl_perf_event_paranoid,
		.maxlen		= sizeof(sysctl_perf_event_paranoid),
		.mode		= 0644,
		.proc_handler	= proc_dointvec,
	},
	{
		.procname	= "perf_event_mlock_kb",
		.data		= &sysctl_perf_event_mlock,
		.maxlen		= sizeof(sysctl_perf_event_mlock),
		.mode		= 0644,
		.proc_handler	= proc_dointvec,
	},
	{
		.procname	= "perf_event_max_sample_rate",
		.data		= &sysctl_perf_event_sample_rate,
		.maxlen		= sizeof(sysctl_perf_event_sample_rate),
		.mode		= 0644,
		.proc_handler	= perf_proc_update_handler,
		.extra1		= SYSCTL_ONE,
	},
	{
		.procname	= "perf_cpu_time_max_percent",
		.data		= &sysctl_perf_cpu_time_max_percent,
		.maxlen		= sizeof(sysctl_perf_cpu_time_max_percent),
		.mode		= 0644,
		.proc_handler	= perf_cpu_time_max_percent_handler,
		.extra1		= SYSCTL_ZERO,
		.extra2		= SYSCTL_ONE_HUNDRED,
	},
	{
		.procname	= "perf_event_max_stack",
		.data		= &sysctl_perf_event_max_stack,
		.maxlen		= sizeof(sysctl_perf_event_max_stack),
		.mode		= 0644,
		.proc_handler	= perf_event_max_stack_handler,
		.extra1		= SYSCTL_ZERO,
		/* six_hundred_forty_kb is the file-local const 640 * 1024 */
		.extra2		= (void *)&six_hundred_forty_kb,
	},
	{
		.procname	= "perf_event_max_contexts_per_stack",
		.data		= &sysctl_perf_event_max_contexts_per_stack,
		.maxlen		= sizeof(sysctl_perf_event_max_contexts_per_stack),
		.mode		= 0644,
		.proc_handler	= perf_event_max_stack_handler,
		.extra1		= SYSCTL_ZERO,
		.extra2		= SYSCTL_ONE_THOUSAND,
	},
#endif
	{
		.procname	= "panic_on_warn",
		.data		= &panic_on_warn,
		.maxlen		= sizeof(int),
		.mode		= 0644,
		.proc_handler	= proc_dointvec_minmax,
		.extra1		= SYSCTL_ZERO,
		.extra2		= SYSCTL_ONE,
	},
#if defined(CONFIG_TREE_RCU)
	{
		.procname	= "panic_on_rcu_stall",
		.data		= &sysctl_panic_on_rcu_stall,
		.maxlen		= sizeof(sysctl_panic_on_rcu_stall),
		.mode		= 0644,
		.proc_handler	= proc_dointvec_minmax,
		.extra1		= SYSCTL_ZERO,
		.extra2		= SYSCTL_ONE,
	},
#endif
/* NOTE(review): same guard as the block just above; the two could share one #if */
#if defined(CONFIG_TREE_RCU)
	{
		.procname	= "max_rcu_stall_to_panic",
		.data		= &sysctl_max_rcu_stall_to_panic,
		.maxlen		= sizeof(sysctl_max_rcu_stall_to_panic),
		.mode		= 0644,
		.proc_handler	= proc_dointvec_minmax,
		.extra1		= SYSCTL_ONE,
		.extra2		= SYSCTL_INT_MAX,
	},
#endif
	/* empty final entry; presumably the end-of-table sentinel */
	{ }
};

static struct ctl_table vm_table[] = {
	{
		.procname	= "overcommit_memory",
		.data		= &sysctl_overcommit_memory,
		.maxlen		= sizeof(sysctl_overcommit_memory),
		.mode		= 0644,
		.proc_handler	= overcommit_policy_handler,
		.extra1		= SYSCTL_ZERO,
		.extra2		= SYSCTL_TWO,
	},
	{
		.procname	= "panic_on_oom",
		.data		= &sysctl_panic_on_oom,
		.maxlen		= sizeof(sysctl_panic_on_oom),
		.mode		= 0644,
		.proc_handler	= proc_dointvec_minmax,
		.extra1		= SYSCTL_ZERO,
		.extra2		= SYSCTL_TWO,
	},
	{
		.procname	= "oom_kill_allocating_task",
		.data		= &sysctl_oom_kill_allocating_task,
		.maxlen		= sizeof(sysctl_oom_kill_allocating_task),
		.mode		= 0644,
		.proc_handler	= proc_dointvec,
	},
	{
		.procname	= "oom_dump_tasks",
		.data		= &sysctl_oom_dump_tasks,
		.maxlen		= sizeof(sysctl_oom_dump_tasks),
		.mode		= 0644,
		.proc_handler	= proc_dointvec,
	},
	{
		.procname	=
"overcommit_ratio", 2290 .data = &sysctl_overcommit_ratio, 2291 .maxlen = sizeof(sysctl_overcommit_ratio), 2292 .mode = 0644, 2293 .proc_handler = overcommit_ratio_handler, 2294 }, 2295 { 2296 .procname = "overcommit_kbytes", 2297 .data = &sysctl_overcommit_kbytes, 2298 .maxlen = sizeof(sysctl_overcommit_kbytes), 2299 .mode = 0644, 2300 .proc_handler = overcommit_kbytes_handler, 2301 }, 2302 { 2303 .procname = "page-cluster", 2304 .data = &page_cluster, 2305 .maxlen = sizeof(int), 2306 .mode = 0644, 2307 .proc_handler = proc_dointvec_minmax, 2308 .extra1 = SYSCTL_ZERO, 2309 }, 2310 { 2311 .procname = "dirty_background_ratio", 2312 .data = &dirty_background_ratio, 2313 .maxlen = sizeof(dirty_background_ratio), 2314 .mode = 0644, 2315 .proc_handler = dirty_background_ratio_handler, 2316 .extra1 = SYSCTL_ZERO, 2317 .extra2 = SYSCTL_ONE_HUNDRED, 2318 }, 2319 { 2320 .procname = "dirty_background_bytes", 2321 .data = &dirty_background_bytes, 2322 .maxlen = sizeof(dirty_background_bytes), 2323 .mode = 0644, 2324 .proc_handler = dirty_background_bytes_handler, 2325 .extra1 = SYSCTL_LONG_ONE, 2326 }, 2327 { 2328 .procname = "dirty_ratio", 2329 .data = &vm_dirty_ratio, 2330 .maxlen = sizeof(vm_dirty_ratio), 2331 .mode = 0644, 2332 .proc_handler = dirty_ratio_handler, 2333 .extra1 = SYSCTL_ZERO, 2334 .extra2 = SYSCTL_ONE_HUNDRED, 2335 }, 2336 { 2337 .procname = "dirty_bytes", 2338 .data = &vm_dirty_bytes, 2339 .maxlen = sizeof(vm_dirty_bytes), 2340 .mode = 0644, 2341 .proc_handler = dirty_bytes_handler, 2342 .extra1 = (void *)&dirty_bytes_min, 2343 }, 2344 { 2345 .procname = "dirty_writeback_centisecs", 2346 .data = &dirty_writeback_interval, 2347 .maxlen = sizeof(dirty_writeback_interval), 2348 .mode = 0644, 2349 .proc_handler = dirty_writeback_centisecs_handler, 2350 }, 2351 { 2352 .procname = "dirty_expire_centisecs", 2353 .data = &dirty_expire_interval, 2354 .maxlen = sizeof(dirty_expire_interval), 2355 .mode = 0644, 2356 .proc_handler = proc_dointvec_minmax, 2357 .extra1 
= SYSCTL_ZERO, 2358 }, 2359 { 2360 .procname = "dirtytime_expire_seconds", 2361 .data = &dirtytime_expire_interval, 2362 .maxlen = sizeof(dirtytime_expire_interval), 2363 .mode = 0644, 2364 .proc_handler = dirtytime_interval_handler, 2365 .extra1 = SYSCTL_ZERO, 2366 }, 2367 { 2368 .procname = "swappiness", 2369 .data = &vm_swappiness, 2370 .maxlen = sizeof(vm_swappiness), 2371 .mode = 0644, 2372 .proc_handler = proc_dointvec_minmax, 2373 .extra1 = SYSCTL_ZERO, 2374 .extra2 = SYSCTL_TWO_HUNDRED, 2375 }, 2376 #ifdef CONFIG_HUGETLB_PAGE 2377 { 2378 .procname = "nr_hugepages", 2379 .data = NULL, 2380 .maxlen = sizeof(unsigned long), 2381 .mode = 0644, 2382 .proc_handler = hugetlb_sysctl_handler, 2383 }, 2384 #ifdef CONFIG_NUMA 2385 { 2386 .procname = "nr_hugepages_mempolicy", 2387 .data = NULL, 2388 .maxlen = sizeof(unsigned long), 2389 .mode = 0644, 2390 .proc_handler = &hugetlb_mempolicy_sysctl_handler, 2391 }, 2392 { 2393 .procname = "numa_stat", 2394 .data = &sysctl_vm_numa_stat, 2395 .maxlen = sizeof(int), 2396 .mode = 0644, 2397 .proc_handler = sysctl_vm_numa_stat_handler, 2398 .extra1 = SYSCTL_ZERO, 2399 .extra2 = SYSCTL_ONE, 2400 }, 2401 #endif 2402 { 2403 .procname = "hugetlb_shm_group", 2404 .data = &sysctl_hugetlb_shm_group, 2405 .maxlen = sizeof(gid_t), 2406 .mode = 0644, 2407 .proc_handler = proc_dointvec, 2408 }, 2409 { 2410 .procname = "nr_overcommit_hugepages", 2411 .data = NULL, 2412 .maxlen = sizeof(unsigned long), 2413 .mode = 0644, 2414 .proc_handler = hugetlb_overcommit_handler, 2415 }, 2416 #endif 2417 { 2418 .procname = "lowmem_reserve_ratio", 2419 .data = &sysctl_lowmem_reserve_ratio, 2420 .maxlen = sizeof(sysctl_lowmem_reserve_ratio), 2421 .mode = 0644, 2422 .proc_handler = lowmem_reserve_ratio_sysctl_handler, 2423 }, 2424 { 2425 .procname = "drop_caches", 2426 .data = &sysctl_drop_caches, 2427 .maxlen = sizeof(int), 2428 .mode = 0200, 2429 .proc_handler = drop_caches_sysctl_handler, 2430 .extra1 = SYSCTL_ONE, 2431 .extra2 = SYSCTL_FOUR, 2432 
}, 2433 #ifdef CONFIG_COMPACTION 2434 { 2435 .procname = "compact_memory", 2436 .data = NULL, 2437 .maxlen = sizeof(int), 2438 .mode = 0200, 2439 .proc_handler = sysctl_compaction_handler, 2440 }, 2441 { 2442 .procname = "compaction_proactiveness", 2443 .data = &sysctl_compaction_proactiveness, 2444 .maxlen = sizeof(sysctl_compaction_proactiveness), 2445 .mode = 0644, 2446 .proc_handler = compaction_proactiveness_sysctl_handler, 2447 .extra1 = SYSCTL_ZERO, 2448 .extra2 = SYSCTL_ONE_HUNDRED, 2449 }, 2450 { 2451 .procname = "extfrag_threshold", 2452 .data = &sysctl_extfrag_threshold, 2453 .maxlen = sizeof(int), 2454 .mode = 0644, 2455 .proc_handler = proc_dointvec_minmax, 2456 .extra1 = SYSCTL_ZERO, 2457 .extra2 = (void *)&max_extfrag_threshold, 2458 }, 2459 { 2460 .procname = "compact_unevictable_allowed", 2461 .data = &sysctl_compact_unevictable_allowed, 2462 .maxlen = sizeof(int), 2463 .mode = 0644, 2464 .proc_handler = proc_dointvec_minmax_warn_RT_change, 2465 .extra1 = SYSCTL_ZERO, 2466 .extra2 = SYSCTL_ONE, 2467 }, 2468 2469 #endif /* CONFIG_COMPACTION */ 2470 { 2471 .procname = "min_free_kbytes", 2472 .data = &min_free_kbytes, 2473 .maxlen = sizeof(min_free_kbytes), 2474 .mode = 0644, 2475 .proc_handler = min_free_kbytes_sysctl_handler, 2476 .extra1 = SYSCTL_ZERO, 2477 }, 2478 { 2479 .procname = "watermark_boost_factor", 2480 .data = &watermark_boost_factor, 2481 .maxlen = sizeof(watermark_boost_factor), 2482 .mode = 0644, 2483 .proc_handler = proc_dointvec_minmax, 2484 .extra1 = SYSCTL_ZERO, 2485 }, 2486 { 2487 .procname = "watermark_scale_factor", 2488 .data = &watermark_scale_factor, 2489 .maxlen = sizeof(watermark_scale_factor), 2490 .mode = 0644, 2491 .proc_handler = watermark_scale_factor_sysctl_handler, 2492 .extra1 = SYSCTL_ONE, 2493 .extra2 = SYSCTL_THREE_THOUSAND, 2494 }, 2495 { 2496 .procname = "percpu_pagelist_high_fraction", 2497 .data = &percpu_pagelist_high_fraction, 2498 .maxlen = sizeof(percpu_pagelist_high_fraction), 2499 .mode = 0644, 2500 
.proc_handler = percpu_pagelist_high_fraction_sysctl_handler, 2501 .extra1 = SYSCTL_ZERO, 2502 }, 2503 { 2504 .procname = "page_lock_unfairness", 2505 .data = &sysctl_page_lock_unfairness, 2506 .maxlen = sizeof(sysctl_page_lock_unfairness), 2507 .mode = 0644, 2508 .proc_handler = proc_dointvec_minmax, 2509 .extra1 = SYSCTL_ZERO, 2510 }, 2511 #ifdef CONFIG_MMU 2512 { 2513 .procname = "max_map_count", 2514 .data = &sysctl_max_map_count, 2515 .maxlen = sizeof(sysctl_max_map_count), 2516 .mode = 0644, 2517 .proc_handler = proc_dointvec_minmax, 2518 .extra1 = SYSCTL_ZERO, 2519 }, 2520 #else 2521 { 2522 .procname = "nr_trim_pages", 2523 .data = &sysctl_nr_trim_pages, 2524 .maxlen = sizeof(sysctl_nr_trim_pages), 2525 .mode = 0644, 2526 .proc_handler = proc_dointvec_minmax, 2527 .extra1 = SYSCTL_ZERO, 2528 }, 2529 #endif 2530 { 2531 .procname = "laptop_mode", 2532 .data = &laptop_mode, 2533 .maxlen = sizeof(laptop_mode), 2534 .mode = 0644, 2535 .proc_handler = proc_dointvec_jiffies, 2536 }, 2537 { 2538 .procname = "vfs_cache_pressure", 2539 .data = &sysctl_vfs_cache_pressure, 2540 .maxlen = sizeof(sysctl_vfs_cache_pressure), 2541 .mode = 0644, 2542 .proc_handler = proc_dointvec_minmax, 2543 .extra1 = SYSCTL_ZERO, 2544 }, 2545 #if defined(HAVE_ARCH_PICK_MMAP_LAYOUT) || \ 2546 defined(CONFIG_ARCH_WANT_DEFAULT_TOPDOWN_MMAP_LAYOUT) 2547 { 2548 .procname = "legacy_va_layout", 2549 .data = &sysctl_legacy_va_layout, 2550 .maxlen = sizeof(sysctl_legacy_va_layout), 2551 .mode = 0644, 2552 .proc_handler = proc_dointvec_minmax, 2553 .extra1 = SYSCTL_ZERO, 2554 }, 2555 #endif 2556 #ifdef CONFIG_NUMA 2557 { 2558 .procname = "zone_reclaim_mode", 2559 .data = &node_reclaim_mode, 2560 .maxlen = sizeof(node_reclaim_mode), 2561 .mode = 0644, 2562 .proc_handler = proc_dointvec_minmax, 2563 .extra1 = SYSCTL_ZERO, 2564 }, 2565 { 2566 .procname = "min_unmapped_ratio", 2567 .data = &sysctl_min_unmapped_ratio, 2568 .maxlen = sizeof(sysctl_min_unmapped_ratio), 2569 .mode = 0644, 2570 .proc_handler 
= sysctl_min_unmapped_ratio_sysctl_handler, 2571 .extra1 = SYSCTL_ZERO, 2572 .extra2 = SYSCTL_ONE_HUNDRED, 2573 }, 2574 { 2575 .procname = "min_slab_ratio", 2576 .data = &sysctl_min_slab_ratio, 2577 .maxlen = sizeof(sysctl_min_slab_ratio), 2578 .mode = 0644, 2579 .proc_handler = sysctl_min_slab_ratio_sysctl_handler, 2580 .extra1 = SYSCTL_ZERO, 2581 .extra2 = SYSCTL_ONE_HUNDRED, 2582 }, 2583 #endif 2584 #ifdef CONFIG_SMP 2585 { 2586 .procname = "stat_interval", 2587 .data = &sysctl_stat_interval, 2588 .maxlen = sizeof(sysctl_stat_interval), 2589 .mode = 0644, 2590 .proc_handler = proc_dointvec_jiffies, 2591 }, 2592 { 2593 .procname = "stat_refresh", 2594 .data = NULL, 2595 .maxlen = 0, 2596 .mode = 0600, 2597 .proc_handler = vmstat_refresh, 2598 }, 2599 #endif 2600 #ifdef CONFIG_MMU 2601 { 2602 .procname = "mmap_min_addr", 2603 .data = &dac_mmap_min_addr, 2604 .maxlen = sizeof(unsigned long), 2605 .mode = 0644, 2606 .proc_handler = mmap_min_addr_handler, 2607 }, 2608 #endif 2609 #ifdef CONFIG_NUMA 2610 { 2611 .procname = "numa_zonelist_order", 2612 .data = &numa_zonelist_order, 2613 .maxlen = NUMA_ZONELIST_ORDER_LEN, 2614 .mode = 0644, 2615 .proc_handler = numa_zonelist_order_handler, 2616 }, 2617 #endif 2618 #if (defined(CONFIG_X86_32) && !defined(CONFIG_UML))|| \ 2619 (defined(CONFIG_SUPERH) && defined(CONFIG_VSYSCALL)) 2620 { 2621 .procname = "vdso_enabled", 2622 #ifdef CONFIG_X86_32 2623 .data = &vdso32_enabled, 2624 .maxlen = sizeof(vdso32_enabled), 2625 #else 2626 .data = &vdso_enabled, 2627 .maxlen = sizeof(vdso_enabled), 2628 #endif 2629 .mode = 0644, 2630 .proc_handler = proc_dointvec, 2631 .extra1 = SYSCTL_ZERO, 2632 }, 2633 #endif 2634 #ifdef CONFIG_HIGHMEM 2635 { 2636 .procname = "highmem_is_dirtyable", 2637 .data = &vm_highmem_is_dirtyable, 2638 .maxlen = sizeof(vm_highmem_is_dirtyable), 2639 .mode = 0644, 2640 .proc_handler = proc_dointvec_minmax, 2641 .extra1 = SYSCTL_ZERO, 2642 .extra2 = SYSCTL_ONE, 2643 }, 2644 #endif 2645 #ifdef 
CONFIG_MEMORY_FAILURE 2646 { 2647 .procname = "memory_failure_early_kill", 2648 .data = &sysctl_memory_failure_early_kill, 2649 .maxlen = sizeof(sysctl_memory_failure_early_kill), 2650 .mode = 0644, 2651 .proc_handler = proc_dointvec_minmax, 2652 .extra1 = SYSCTL_ZERO, 2653 .extra2 = SYSCTL_ONE, 2654 }, 2655 { 2656 .procname = "memory_failure_recovery", 2657 .data = &sysctl_memory_failure_recovery, 2658 .maxlen = sizeof(sysctl_memory_failure_recovery), 2659 .mode = 0644, 2660 .proc_handler = proc_dointvec_minmax, 2661 .extra1 = SYSCTL_ZERO, 2662 .extra2 = SYSCTL_ONE, 2663 }, 2664 #endif 2665 { 2666 .procname = "user_reserve_kbytes", 2667 .data = &sysctl_user_reserve_kbytes, 2668 .maxlen = sizeof(sysctl_user_reserve_kbytes), 2669 .mode = 0644, 2670 .proc_handler = proc_doulongvec_minmax, 2671 }, 2672 { 2673 .procname = "admin_reserve_kbytes", 2674 .data = &sysctl_admin_reserve_kbytes, 2675 .maxlen = sizeof(sysctl_admin_reserve_kbytes), 2676 .mode = 0644, 2677 .proc_handler = proc_doulongvec_minmax, 2678 }, 2679 #ifdef CONFIG_HAVE_ARCH_MMAP_RND_BITS 2680 { 2681 .procname = "mmap_rnd_bits", 2682 .data = &mmap_rnd_bits, 2683 .maxlen = sizeof(mmap_rnd_bits), 2684 .mode = 0600, 2685 .proc_handler = proc_dointvec_minmax, 2686 .extra1 = (void *)&mmap_rnd_bits_min, 2687 .extra2 = (void *)&mmap_rnd_bits_max, 2688 }, 2689 #endif 2690 #ifdef CONFIG_HAVE_ARCH_MMAP_RND_COMPAT_BITS 2691 { 2692 .procname = "mmap_rnd_compat_bits", 2693 .data = &mmap_rnd_compat_bits, 2694 .maxlen = sizeof(mmap_rnd_compat_bits), 2695 .mode = 0600, 2696 .proc_handler = proc_dointvec_minmax, 2697 .extra1 = (void *)&mmap_rnd_compat_bits_min, 2698 .extra2 = (void *)&mmap_rnd_compat_bits_max, 2699 }, 2700 #endif 2701 #ifdef CONFIG_USERFAULTFD 2702 { 2703 .procname = "unprivileged_userfaultfd", 2704 .data = &sysctl_unprivileged_userfaultfd, 2705 .maxlen = sizeof(sysctl_unprivileged_userfaultfd), 2706 .mode = 0644, 2707 .proc_handler = proc_dointvec_minmax, 2708 .extra1 = SYSCTL_ZERO, 2709 .extra2 = 
SYSCTL_ONE, 2710 }, 2711 #endif 2712 { } 2713 }; 2714 2715 static struct ctl_table debug_table[] = { 2716 #ifdef CONFIG_SYSCTL_EXCEPTION_TRACE 2717 { 2718 .procname = "exception-trace", 2719 .data = &show_unhandled_signals, 2720 .maxlen = sizeof(int), 2721 .mode = 0644, 2722 .proc_handler = proc_dointvec 2723 }, 2724 #endif 2725 { } 2726 }; 2727 2728 static struct ctl_table dev_table[] = { 2729 { } 2730 }; 2731 2732 DECLARE_SYSCTL_BASE(kernel, kern_table); 2733 DECLARE_SYSCTL_BASE(vm, vm_table); 2734 DECLARE_SYSCTL_BASE(debug, debug_table); 2735 DECLARE_SYSCTL_BASE(dev, dev_table); 2736 2737 int __init sysctl_init_bases(void) 2738 { 2739 register_sysctl_base(kernel); 2740 register_sysctl_base(vm); 2741 register_sysctl_base(debug); 2742 register_sysctl_base(dev); 2743 2744 return 0; 2745 } 2746 #endif /* CONFIG_SYSCTL */ 2747 /* 2748 * No sense putting this after each symbol definition, twice, 2749 * exception granted :-) 2750 */ 2751 EXPORT_SYMBOL(proc_dobool); 2752 EXPORT_SYMBOL(proc_dointvec); 2753 EXPORT_SYMBOL(proc_douintvec); 2754 EXPORT_SYMBOL(proc_dointvec_jiffies); 2755 EXPORT_SYMBOL(proc_dointvec_minmax); 2756 EXPORT_SYMBOL_GPL(proc_douintvec_minmax); 2757 EXPORT_SYMBOL(proc_dointvec_userhz_jiffies); 2758 EXPORT_SYMBOL(proc_dointvec_ms_jiffies); 2759 EXPORT_SYMBOL(proc_dostring); 2760 EXPORT_SYMBOL(proc_doulongvec_minmax); 2761 EXPORT_SYMBOL(proc_doulongvec_ms_jiffies_minmax); 2762 EXPORT_SYMBOL(proc_do_large_bitmap); 2763