1 // SPDX-License-Identifier: GPL-2.0-only 2 /* 3 * sysctl.c: General linux system control interface 4 * 5 * Begun 24 March 1995, Stephen Tweedie 6 * Added /proc support, Dec 1995 7 * Added bdflush entry and intvec min/max checking, 2/23/96, Tom Dyas. 8 * Added hooks for /proc/sys/net (minor, minor patch), 96/4/1, Mike Shaver. 9 * Added kernel/java-{interpreter,appletviewer}, 96/5/10, Mike Shaver. 10 * Dynamic registration fixes, Stephen Tweedie. 11 * Added kswapd-interval, ctrl-alt-del, printk stuff, 1/8/97, Chris Horn. 12 * Made sysctl support optional via CONFIG_SYSCTL, 1/10/97, Chris 13 * Horn. 14 * Added proc_doulongvec_ms_jiffies_minmax, 09/08/99, Carlos H. Bauer. 15 * Added proc_doulongvec_minmax, 09/08/99, Carlos H. Bauer. 16 * Changed linked lists to use list.h instead of lists.h, 02/24/00, Bill 17 * Wendling. 18 * The list_for_each() macro wasn't appropriate for the sysctl loop. 19 * Removed it and replaced it with older style, 03/23/00, Bill Wendling 20 */ 21 22 #include <linux/module.h> 23 #include <linux/aio.h> 24 #include <linux/mm.h> 25 #include <linux/swap.h> 26 #include <linux/slab.h> 27 #include <linux/sysctl.h> 28 #include <linux/bitmap.h> 29 #include <linux/signal.h> 30 #include <linux/panic.h> 31 #include <linux/printk.h> 32 #include <linux/proc_fs.h> 33 #include <linux/security.h> 34 #include <linux/ctype.h> 35 #include <linux/kmemleak.h> 36 #include <linux/fs.h> 37 #include <linux/init.h> 38 #include <linux/kernel.h> 39 #include <linux/kobject.h> 40 #include <linux/net.h> 41 #include <linux/sysrq.h> 42 #include <linux/highuid.h> 43 #include <linux/writeback.h> 44 #include <linux/ratelimit.h> 45 #include <linux/compaction.h> 46 #include <linux/hugetlb.h> 47 #include <linux/initrd.h> 48 #include <linux/key.h> 49 #include <linux/times.h> 50 #include <linux/limits.h> 51 #include <linux/dcache.h> 52 #include <linux/dnotify.h> 53 #include <linux/syscalls.h> 54 #include <linux/vmstat.h> 55 #include <linux/nfs_fs.h> 56 #include <linux/acpi.h> 57 #include <linux/reboot.h> 58 #include <linux/ftrace.h> 59 #include <linux/perf_event.h> 60 #include <linux/kprobes.h> 61 #include <linux/pipe_fs_i.h> 62 #include <linux/oom.h> 63 #include <linux/kmod.h> 64 #include <linux/capability.h> 65 #include <linux/binfmts.h> 66 #include <linux/sched/sysctl.h> 67 #include <linux/sched/coredump.h> 68 #include <linux/kexec.h> 69 #include <linux/bpf.h> 70 #include <linux/mount.h> 71 #include <linux/userfaultfd_k.h> 72 #include <linux/coredump.h> 73 #include <linux/latencytop.h> 74 #include <linux/pid.h> 75 76 #include "../lib/kstrtox.h" 77 78 #include <linux/uaccess.h> 79 #include <asm/processor.h> 80 81 #ifdef CONFIG_X86 82 #include <asm/nmi.h> 83 #include <asm/stacktrace.h> 84 #include <asm/io.h> 85 #endif 86 #ifdef CONFIG_SPARC 87 #include <asm/setup.h> 88 #endif 89 #ifdef CONFIG_BSD_PROCESS_ACCT 90 #include <linux/acct.h> 91 #endif 92 #ifdef CONFIG_RT_MUTEXES 93 #include <linux/rtmutex.h> 94 #endif 95 #if defined(CONFIG_PROVE_LOCKING) || defined(CONFIG_LOCK_STAT) 96 #include <linux/lockdep.h> 97 #endif 98 #ifdef CONFIG_CHR_DEV_SG 99 #include <scsi/sg.h> 100 #endif 101 #ifdef CONFIG_STACKLEAK_RUNTIME_DISABLE 102 #include <linux/stackleak.h> 103 #endif 104 #ifdef CONFIG_LOCKUP_DETECTOR 105 #include <linux/nmi.h> 106 #endif 107 108 #if defined(CONFIG_SYSCTL) 109 110 /* Constants used for minimum and maximum */ 111 #ifdef CONFIG_LOCKUP_DETECTOR 112 static int sixty = 60; 113 #endif 114 115 static int __maybe_unused neg_one = -1; 116 static int __maybe_unused two = 2; 117 static int __maybe_unused four = 4; 118 static unsigned long zero_ul; 119 static unsigned long one_ul = 1; 120 static unsigned long long_max = LONG_MAX; 121 static int one_hundred = 100; 122 static int two_hundred = 200; 123 static int one_thousand = 1000; 124 #ifdef CONFIG_PRINTK 125 static int ten_thousand = 10000; 126 #endif 127 #ifdef CONFIG_PERF_EVENTS 128 static int six_hundred_forty_kb = 640 * 1024; 129 #endif 130 131 /* this is needed for the proc_doulongvec_minmax of vm_dirty_bytes */ 132 static unsigned long dirty_bytes_min = 2 * PAGE_SIZE; 133 134 /* this is needed for the proc_dointvec_minmax for [fs_]overflow UID and GID */ 135 static int maxolduid = 65535; 136 static int minolduid; 137 138 static int ngroups_max = NGROUPS_MAX; 139 static const int cap_last_cap = CAP_LAST_CAP; 140 141 /* 142 * This is needed for proc_doulongvec_minmax of sysctl_hung_task_timeout_secs 143 * and hung_task_check_interval_secs 144 */ 145 #ifdef CONFIG_DETECT_HUNG_TASK 146 static unsigned long hung_task_timeout_max = (LONG_MAX/HZ); 147 #endif 148 149 #ifdef CONFIG_INOTIFY_USER 150 #include <linux/inotify.h> 151 #endif 152 #ifdef CONFIG_FANOTIFY 153 #include <linux/fanotify.h> 154 #endif 155 156 #ifdef CONFIG_PROC_SYSCTL 157 158 /** 159 * enum sysctl_writes_mode - supported sysctl write modes 160 * 161 * @SYSCTL_WRITES_LEGACY: each write syscall must fully contain the sysctl value 162 * to be written, and multiple writes on the same sysctl file descriptor 163 * will rewrite the sysctl value, regardless of file position. No warning 164 * is issued when the initial position is not 0. 165 * @SYSCTL_WRITES_WARN: same as above but warn when the initial file position is 166 * not 0. 167 * @SYSCTL_WRITES_STRICT: writes to numeric sysctl entries must always be at 168 * file position 0 and the value must be fully contained in the buffer 169 * sent to the write syscall. If dealing with strings respect the file 170 * position, but restrict this to the max length of the buffer, anything 171 * passed the max length will be ignored. Multiple writes will append 172 * to the buffer. 173 * 174 * These write modes control how current file position affects the behavior of 175 * updating sysctl values through the proc interface on each write. 176 */ 177 enum sysctl_writes_mode { 178 SYSCTL_WRITES_LEGACY = -1, 179 SYSCTL_WRITES_WARN = 0, 180 SYSCTL_WRITES_STRICT = 1, 181 }; 182 183 static enum sysctl_writes_mode sysctl_writes_strict = SYSCTL_WRITES_STRICT; 184 #endif /* CONFIG_PROC_SYSCTL */ 185 186 #if defined(HAVE_ARCH_PICK_MMAP_LAYOUT) || \ 187 defined(CONFIG_ARCH_WANT_DEFAULT_TOPDOWN_MMAP_LAYOUT) 188 int sysctl_legacy_va_layout; 189 #endif 190 191 #ifdef CONFIG_COMPACTION 192 static int min_extfrag_threshold; 193 static int max_extfrag_threshold = 1000; 194 #endif 195 196 #endif /* CONFIG_SYSCTL */ 197 198 #if defined(CONFIG_BPF_SYSCALL) && defined(CONFIG_SYSCTL) 199 static int bpf_stats_handler(struct ctl_table *table, int write, 200 void *buffer, size_t *lenp, loff_t *ppos) 201 { 202 struct static_key *key = (struct static_key *)table->data; 203 static int saved_val; 204 int val, ret; 205 struct ctl_table tmp = { 206 .data = &val, 207 .maxlen = sizeof(val), 208 .mode = table->mode, 209 .extra1 = SYSCTL_ZERO, 210 .extra2 = SYSCTL_ONE, 211 }; 212 213 if (write && !capable(CAP_SYS_ADMIN)) 214 return -EPERM; 215 216 mutex_lock(&bpf_stats_enabled_mutex); 217 val = saved_val; 218 ret = proc_dointvec_minmax(&tmp, write, buffer, lenp, ppos); 219 if (write && !ret && val != saved_val) { 220 if (val) 221 static_key_slow_inc(key); 222 else 223 static_key_slow_dec(key); 224 saved_val = val; 225 } 226 mutex_unlock(&bpf_stats_enabled_mutex); 227 return ret; 228 } 229 230 static int bpf_unpriv_handler(struct ctl_table *table, int write, 231 void *buffer, size_t *lenp, loff_t *ppos) 232 { 233 int ret, unpriv_enable = *(int *)table->data; 234 bool locked_state = unpriv_enable == 1; 235 struct ctl_table tmp = *table; 236 237 if (write && !capable(CAP_SYS_ADMIN)) 238 return -EPERM; 239 240 tmp.data = &unpriv_enable; 241 ret = proc_dointvec_minmax(&tmp, write, buffer, lenp, ppos); 242 if (write && !ret) { 243 if (locked_state && unpriv_enable != 1) 244 return -EPERM; 245 *(int *)table->data = unpriv_enable; 246 } 247 return ret; 248 } 249 #endif /* CONFIG_BPF_SYSCALL && CONFIG_SYSCTL */ 250 251 /* 252 * /proc/sys support 253 */ 254 255 #ifdef CONFIG_PROC_SYSCTL 256 257 static int _proc_do_string(char *data, int maxlen, int write, 258 char *buffer, size_t *lenp, loff_t *ppos) 259 { 260 size_t len; 261 char c, *p; 262 263 if (!data || !maxlen || !*lenp) { 264 *lenp = 0; 265 return 0; 266 } 267 268 if (write) { 269 if (sysctl_writes_strict == SYSCTL_WRITES_STRICT) { 270 /* Only continue writes not past the end of buffer. */ 271 len = strlen(data); 272 if (len > maxlen - 1) 273 len = maxlen - 1; 274 275 if (*ppos > len) 276 return 0; 277 len = *ppos; 278 } else { 279 /* Start writing from beginning of buffer. */ 280 len = 0; 281 } 282 283 *ppos += *lenp; 284 p = buffer; 285 while ((p - buffer) < *lenp && len < maxlen - 1) { 286 c = *(p++); 287 if (c == 0 || c == '\n') 288 break; 289 data[len++] = c; 290 } 291 data[len] = 0; 292 } else { 293 len = strlen(data); 294 if (len > maxlen) 295 len = maxlen; 296 297 if (*ppos > len) { 298 *lenp = 0; 299 return 0; 300 } 301 302 data += *ppos; 303 len -= *ppos; 304 305 if (len > *lenp) 306 len = *lenp; 307 if (len) 308 memcpy(buffer, data, len); 309 if (len < *lenp) { 310 buffer[len] = '\n'; 311 len++; 312 } 313 *lenp = len; 314 *ppos += len; 315 } 316 return 0; 317 } 318 319 static void warn_sysctl_write(struct ctl_table *table) 320 { 321 pr_warn_once("%s wrote to %s when file position was not 0!\n" 322 "This will not be supported in the future. To silence this\n" 323 "warning, set kernel.sysctl_writes_strict = -1\n", 324 current->comm, table->procname); 325 } 326 327 /** 328 * proc_first_pos_non_zero_ignore - check if first position is allowed 329 * @ppos: file position 330 * @table: the sysctl table 331 * 332 * Returns true if the first position is non-zero and the sysctl_writes_strict 333 * mode indicates this is not allowed for numeric input types. String proc 334 * handlers can ignore the return value. 335 */ 336 static bool proc_first_pos_non_zero_ignore(loff_t *ppos, 337 struct ctl_table *table) 338 { 339 if (!*ppos) 340 return false; 341 342 switch (sysctl_writes_strict) { 343 case SYSCTL_WRITES_STRICT: 344 return true; 345 case SYSCTL_WRITES_WARN: 346 warn_sysctl_write(table); 347 return false; 348 default: 349 return false; 350 } 351 } 352 353 /** 354 * proc_dostring - read a string sysctl 355 * @table: the sysctl table 356 * @write: %TRUE if this is a write to the sysctl file 357 * @buffer: the user buffer 358 * @lenp: the size of the user buffer 359 * @ppos: file position 360 * 361 * Reads/writes a string from/to the user buffer. If the kernel 362 * buffer provided is not large enough to hold the string, the 363 * string is truncated. The copied string is %NULL-terminated. 364 * If the string is being read by the user process, it is copied 365 * and a newline '\n' is added. It is truncated if the buffer is 366 * not large enough. 367 * 368 * Returns 0 on success. 369 */ 370 int proc_dostring(struct ctl_table *table, int write, 371 void *buffer, size_t *lenp, loff_t *ppos) 372 { 373 if (write) 374 proc_first_pos_non_zero_ignore(ppos, table); 375 376 return _proc_do_string(table->data, table->maxlen, write, buffer, lenp, 377 ppos); 378 } 379 380 static size_t proc_skip_spaces(char **buf) 381 { 382 size_t ret; 383 char *tmp = skip_spaces(*buf); 384 ret = tmp - *buf; 385 *buf = tmp; 386 return ret; 387 } 388 389 static void proc_skip_char(char **buf, size_t *size, const char v) 390 { 391 while (*size) { 392 if (**buf != v) 393 break; 394 (*size)--; 395 (*buf)++; 396 } 397 } 398 399 /** 400 * strtoul_lenient - parse an ASCII formatted integer from a buffer and only 401 * fail on overflow 402 * 403 * @cp: kernel buffer containing the string to parse 404 * @endp: pointer to store the trailing characters 405 * @base: the base to use 406 * @res: where the parsed integer will be stored 407 * 408 * In case of success 0 is returned and @res will contain the parsed integer, 409 * @endp will hold any trailing characters. 410 * This function will fail the parse on overflow. If there wasn't an overflow 411 * the function will defer the decision what characters count as invalid to the 412 * caller. 413 */ 414 static int strtoul_lenient(const char *cp, char **endp, unsigned int base, 415 unsigned long *res) 416 { 417 unsigned long long result; 418 unsigned int rv; 419 420 cp = _parse_integer_fixup_radix(cp, &base); 421 rv = _parse_integer(cp, base, &result); 422 if ((rv & KSTRTOX_OVERFLOW) || (result != (unsigned long)result)) 423 return -ERANGE; 424 425 cp += rv; 426 427 if (endp) 428 *endp = (char *)cp; 429 430 *res = (unsigned long)result; 431 return 0; 432 } 433 434 #define TMPBUFLEN 22 435 /** 436 * proc_get_long - reads an ASCII formatted integer from a user buffer 437 * 438 * @buf: a kernel buffer 439 * @size: size of the kernel buffer 440 * @val: this is where the number will be stored 441 * @neg: set to %TRUE if number is negative 442 * @perm_tr: a vector which contains the allowed trailers 443 * @perm_tr_len: size of the perm_tr vector 444 * @tr: pointer to store the trailer character 445 * 446 * In case of success %0 is returned and @buf and @size are updated with 447 * the amount of bytes read. If @tr is non-NULL and a trailing 448 * character exists (size is non-zero after returning from this 449 * function), @tr is updated with the trailing character. 450 */ 451 static int proc_get_long(char **buf, size_t *size, 452 unsigned long *val, bool *neg, 453 const char *perm_tr, unsigned perm_tr_len, char *tr) 454 { 455 int len; 456 char *p, tmp[TMPBUFLEN]; 457 458 if (!*size) 459 return -EINVAL; 460 461 len = *size; 462 if (len > TMPBUFLEN - 1) 463 len = TMPBUFLEN - 1; 464 465 memcpy(tmp, *buf, len); 466 467 tmp[len] = 0; 468 p = tmp; 469 if (*p == '-' && *size > 1) { 470 *neg = true; 471 p++; 472 } else 473 *neg = false; 474 if (!isdigit(*p)) 475 return -EINVAL; 476 477 if (strtoul_lenient(p, &p, 0, val)) 478 return -EINVAL; 479 480 len = p - tmp; 481 482 /* We don't know if the next char is whitespace thus we may accept 483 * invalid integers (e.g. 1234...a) or two integers instead of one 484 * (e.g. 123...1). So lets not allow such large numbers. */ 485 if (len == TMPBUFLEN - 1) 486 return -EINVAL; 487 488 if (len < *size && perm_tr_len && !memchr(perm_tr, *p, perm_tr_len)) 489 return -EINVAL; 490 491 if (tr && (len < *size)) 492 *tr = *p; 493 494 *buf += len; 495 *size -= len; 496 497 return 0; 498 } 499 500 /** 501 * proc_put_long - converts an integer to a decimal ASCII formatted string 502 * 503 * @buf: the user buffer 504 * @size: the size of the user buffer 505 * @val: the integer to be converted 506 * @neg: sign of the number, %TRUE for negative 507 * 508 * In case of success @buf and @size are updated with the amount of bytes 509 * written. 510 */ 511 static void proc_put_long(void **buf, size_t *size, unsigned long val, bool neg) 512 { 513 int len; 514 char tmp[TMPBUFLEN], *p = tmp; 515 516 sprintf(p, "%s%lu", neg ? "-" : "", val); 517 len = strlen(tmp); 518 if (len > *size) 519 len = *size; 520 memcpy(*buf, tmp, len); 521 *size -= len; 522 *buf += len; 523 } 524 #undef TMPBUFLEN 525 526 static void proc_put_char(void **buf, size_t *size, char c) 527 { 528 if (*size) { 529 char **buffer = (char **)buf; 530 **buffer = c; 531 532 (*size)--; 533 (*buffer)++; 534 *buf = *buffer; 535 } 536 } 537 538 static int do_proc_dointvec_conv(bool *negp, unsigned long *lvalp, 539 int *valp, 540 int write, void *data) 541 { 542 if (write) { 543 if (*negp) { 544 if (*lvalp > (unsigned long) INT_MAX + 1) 545 return -EINVAL; 546 *valp = -*lvalp; 547 } else { 548 if (*lvalp > (unsigned long) INT_MAX) 549 return -EINVAL; 550 *valp = *lvalp; 551 } 552 } else { 553 int val = *valp; 554 if (val < 0) { 555 *negp = true; 556 *lvalp = -(unsigned long)val; 557 } else { 558 *negp = false; 559 *lvalp = (unsigned long)val; 560 } 561 } 562 return 0; 563 } 564 565 static int do_proc_douintvec_conv(unsigned long *lvalp, 566 unsigned int *valp, 567 int write, void *data) 568 { 569 if (write) { 570 if (*lvalp > UINT_MAX) 571 return -EINVAL; 572 *valp = *lvalp; 573 } else { 574 unsigned int val = *valp; 575 *lvalp = (unsigned long)val; 576 } 577 return 0; 578 } 579 580 static const char proc_wspace_sep[] = { ' ', '\t', '\n' }; 581 582 static int __do_proc_dointvec(void *tbl_data, struct ctl_table *table, 583 int write, void *buffer, 584 size_t *lenp, loff_t *ppos, 585 int (*conv)(bool *negp, unsigned long *lvalp, int *valp, 586 int write, void *data), 587 void *data) 588 { 589 int *i, vleft, first = 1, err = 0; 590 size_t left; 591 char *p; 592 593 if (!tbl_data || !table->maxlen || !*lenp || (*ppos && !write)) { 594 *lenp = 0; 595 return 0; 596 } 597 598 i = (int *) tbl_data; 599 vleft = table->maxlen / sizeof(*i); 600 left = *lenp; 601 602 if (!conv) 603 conv = do_proc_dointvec_conv; 604 605 if (write) { 606 if (proc_first_pos_non_zero_ignore(ppos, table)) 607 goto out; 608 609 if (left > PAGE_SIZE - 1) 610 left = PAGE_SIZE - 1; 611 p = buffer; 612 } 613 614 for (; left && vleft--; i++, first=0) { 615 unsigned long lval; 616 bool neg; 617 618 if (write) { 619 left -= proc_skip_spaces(&p); 620 621 if (!left) 622 break; 623 err = proc_get_long(&p, &left, &lval, &neg, 624 proc_wspace_sep, 625 sizeof(proc_wspace_sep), NULL); 626 if (err) 627 break; 628 if (conv(&neg, &lval, i, 1, data)) { 629 err = -EINVAL; 630 break; 631 } 632 } else { 633 if (conv(&neg, &lval, i, 0, data)) { 634 err = -EINVAL; 635 break; 636 } 637 if (!first) 638 proc_put_char(&buffer, &left, '\t'); 639 proc_put_long(&buffer, &left, lval, neg); 640 } 641 } 642 643 if (!write && !first && left && !err) 644 proc_put_char(&buffer, &left, '\n'); 645 if (write && !err && left) 646 left -= proc_skip_spaces(&p); 647 if (write && first) 648 return err ? : -EINVAL; 649 *lenp -= left; 650 out: 651 *ppos += *lenp; 652 return err; 653 } 654 655 static int do_proc_dointvec(struct ctl_table *table, int write, 656 void *buffer, size_t *lenp, loff_t *ppos, 657 int (*conv)(bool *negp, unsigned long *lvalp, int *valp, 658 int write, void *data), 659 void *data) 660 { 661 return __do_proc_dointvec(table->data, table, write, 662 buffer, lenp, ppos, conv, data); 663 } 664 665 static int do_proc_douintvec_w(unsigned int *tbl_data, 666 struct ctl_table *table, 667 void *buffer, 668 size_t *lenp, loff_t *ppos, 669 int (*conv)(unsigned long *lvalp, 670 unsigned int *valp, 671 int write, void *data), 672 void *data) 673 { 674 unsigned long lval; 675 int err = 0; 676 size_t left; 677 bool neg; 678 char *p = buffer; 679 680 left = *lenp; 681 682 if (proc_first_pos_non_zero_ignore(ppos, table)) 683 goto bail_early; 684 685 if (left > PAGE_SIZE - 1) 686 left = PAGE_SIZE - 1; 687 688 left -= proc_skip_spaces(&p); 689 if (!left) { 690 err = -EINVAL; 691 goto out_free; 692 } 693 694 err = proc_get_long(&p, &left, &lval, &neg, 695 proc_wspace_sep, 696 sizeof(proc_wspace_sep), NULL); 697 if (err || neg) { 698 err = -EINVAL; 699 goto out_free; 700 } 701 702 if (conv(&lval, tbl_data, 1, data)) { 703 err = -EINVAL; 704 goto out_free; 705 } 706 707 if (!err && left) 708 left -= proc_skip_spaces(&p); 709 710 out_free: 711 if (err) 712 return -EINVAL; 713 714 return 0; 715 716 /* This is in keeping with old __do_proc_dointvec() */ 717 bail_early: 718 *ppos += *lenp; 719 return err; 720 } 721 722 static int do_proc_douintvec_r(unsigned int *tbl_data, void *buffer, 723 size_t *lenp, loff_t *ppos, 724 int (*conv)(unsigned long *lvalp, 725 unsigned int *valp, 726 int write, void *data), 727 void *data) 728 { 729 unsigned long lval; 730 int err = 0; 731 size_t left; 732 733 left = *lenp; 734 735 if (conv(&lval, tbl_data, 0, data)) { 736 err = -EINVAL; 737 goto out; 738 } 739 740 proc_put_long(&buffer, &left, lval, false); 741 if (!left) 742 goto out; 743 744 proc_put_char(&buffer, &left, '\n'); 745 746 out: 747 *lenp -= left; 748 *ppos += *lenp; 749 750 return err; 751 } 752 753 static int __do_proc_douintvec(void *tbl_data, struct ctl_table *table, 754 int write, void *buffer, 755 size_t *lenp, loff_t *ppos, 756 int (*conv)(unsigned long *lvalp, 757 unsigned int *valp, 758 int write, void *data), 759 void *data) 760 { 761 unsigned int *i, vleft; 762 763 if (!tbl_data || !table->maxlen || !*lenp || (*ppos && !write)) { 764 *lenp = 0; 765 return 0; 766 } 767 768 i = (unsigned int *) tbl_data; 769 vleft = table->maxlen / sizeof(*i); 770 771 /* 772 * Arrays are not supported, keep this simple. *Do not* add 773 * support for them. 774 */ 775 if (vleft != 1) { 776 *lenp = 0; 777 return -EINVAL; 778 } 779 780 if (!conv) 781 conv = do_proc_douintvec_conv; 782 783 if (write) 784 return do_proc_douintvec_w(i, table, buffer, lenp, ppos, 785 conv, data); 786 return do_proc_douintvec_r(i, buffer, lenp, ppos, conv, data); 787 } 788 789 static int do_proc_douintvec(struct ctl_table *table, int write, 790 void *buffer, size_t *lenp, loff_t *ppos, 791 int (*conv)(unsigned long *lvalp, 792 unsigned int *valp, 793 int write, void *data), 794 void *data) 795 { 796 return __do_proc_douintvec(table->data, table, write, 797 buffer, lenp, ppos, conv, data); 798 } 799 800 /** 801 * proc_dointvec - read a vector of integers 802 * @table: the sysctl table 803 * @write: %TRUE if this is a write to the sysctl file 804 * @buffer: the user buffer 805 * @lenp: the size of the user buffer 806 * @ppos: file position 807 * 808 * Reads/writes up to table->maxlen/sizeof(unsigned int) integer 809 * values from/to the user buffer, treated as an ASCII string. 810 * 811 * Returns 0 on success. 812 */ 813 int proc_dointvec(struct ctl_table *table, int write, void *buffer, 814 size_t *lenp, loff_t *ppos) 815 { 816 return do_proc_dointvec(table, write, buffer, lenp, ppos, NULL, NULL); 817 } 818 819 #ifdef CONFIG_COMPACTION 820 static int proc_dointvec_minmax_warn_RT_change(struct ctl_table *table, 821 int write, void *buffer, size_t *lenp, loff_t *ppos) 822 { 823 int ret, old; 824 825 if (!IS_ENABLED(CONFIG_PREEMPT_RT) || !write) 826 return proc_dointvec_minmax(table, write, buffer, lenp, ppos); 827 828 old = *(int *)table->data; 829 ret = proc_dointvec_minmax(table, write, buffer, lenp, ppos); 830 if (ret) 831 return ret; 832 if (old != *(int *)table->data) 833 pr_warn_once("sysctl attribute %s changed by %s[%d]\n", 834 table->procname, current->comm, 835 task_pid_nr(current)); 836 return ret; 837 } 838 #endif 839 840 /** 841 * proc_douintvec - read a vector of unsigned integers 842 * @table: the sysctl table 843 * @write: %TRUE if this is a write to the sysctl file 844 * @buffer: the user buffer 845 * @lenp: the size of the user buffer 846 * @ppos: file position 847 * 848 * Reads/writes up to table->maxlen/sizeof(unsigned int) unsigned integer 849 * values from/to the user buffer, treated as an ASCII string. 850 * 851 * Returns 0 on success. 852 */ 853 int proc_douintvec(struct ctl_table *table, int write, void *buffer, 854 size_t *lenp, loff_t *ppos) 855 { 856 return do_proc_douintvec(table, write, buffer, lenp, ppos, 857 do_proc_douintvec_conv, NULL); 858 } 859 860 /* 861 * Taint values can only be increased 862 * This means we can safely use a temporary. 863 */ 864 static int proc_taint(struct ctl_table *table, int write, 865 void *buffer, size_t *lenp, loff_t *ppos) 866 { 867 struct ctl_table t; 868 unsigned long tmptaint = get_taint(); 869 int err; 870 871 if (write && !capable(CAP_SYS_ADMIN)) 872 return -EPERM; 873 874 t = *table; 875 t.data = &tmptaint; 876 err = proc_doulongvec_minmax(&t, write, buffer, lenp, ppos); 877 if (err < 0) 878 return err; 879 880 if (write) { 881 int i; 882 883 /* 884 * If we are relying on panic_on_taint not producing 885 * false positives due to userspace input, bail out 886 * before setting the requested taint flags. 887 */ 888 if (panic_on_taint_nousertaint && (tmptaint & panic_on_taint)) 889 return -EINVAL; 890 891 /* 892 * Poor man's atomic or. Not worth adding a primitive 893 * to everyone's atomic.h for this 894 */ 895 for (i = 0; i < TAINT_FLAGS_COUNT; i++) 896 if ((1UL << i) & tmptaint) 897 add_taint(i, LOCKDEP_STILL_OK); 898 } 899 900 return err; 901 } 902 903 #ifdef CONFIG_PRINTK 904 static int proc_dointvec_minmax_sysadmin(struct ctl_table *table, int write, 905 void *buffer, size_t *lenp, loff_t *ppos) 906 { 907 if (write && !capable(CAP_SYS_ADMIN)) 908 return -EPERM; 909 910 return proc_dointvec_minmax(table, write, buffer, lenp, ppos); 911 } 912 #endif 913 914 /** 915 * struct do_proc_dointvec_minmax_conv_param - proc_dointvec_minmax() range checking structure 916 * @min: pointer to minimum allowable value 917 * @max: pointer to maximum allowable value 918 * 919 * The do_proc_dointvec_minmax_conv_param structure provides the 920 * minimum and maximum values for doing range checking for those sysctl 921 * parameters that use the proc_dointvec_minmax() handler. 922 */ 923 struct do_proc_dointvec_minmax_conv_param { 924 int *min; 925 int *max; 926 }; 927 928 static int do_proc_dointvec_minmax_conv(bool *negp, unsigned long *lvalp, 929 int *valp, 930 int write, void *data) 931 { 932 int tmp, ret; 933 struct do_proc_dointvec_minmax_conv_param *param = data; 934 /* 935 * If writing, first do so via a temporary local int so we can 936 * bounds-check it before touching *valp. 937 */ 938 int *ip = write ? &tmp : valp; 939 940 ret = do_proc_dointvec_conv(negp, lvalp, ip, write, data); 941 if (ret) 942 return ret; 943 944 if (write) { 945 if ((param->min && *param->min > tmp) || 946 (param->max && *param->max < tmp)) 947 return -EINVAL; 948 *valp = tmp; 949 } 950 951 return 0; 952 } 953 954 /** 955 * proc_dointvec_minmax - read a vector of integers with min/max values 956 * @table: the sysctl table 957 * @write: %TRUE if this is a write to the sysctl file 958 * @buffer: the user buffer 959 * @lenp: the size of the user buffer 960 * @ppos: file position 961 * 962 * Reads/writes up to table->maxlen/sizeof(unsigned int) integer 963 * values from/to the user buffer, treated as an ASCII string. 964 * 965 * This routine will ensure the values are within the range specified by 966 * table->extra1 (min) and table->extra2 (max). 967 * 968 * Returns 0 on success or -EINVAL on write when the range check fails. 969 */ 970 int proc_dointvec_minmax(struct ctl_table *table, int write, 971 void *buffer, size_t *lenp, loff_t *ppos) 972 { 973 struct do_proc_dointvec_minmax_conv_param param = { 974 .min = (int *) table->extra1, 975 .max = (int *) table->extra2, 976 }; 977 return do_proc_dointvec(table, write, buffer, lenp, ppos, 978 do_proc_dointvec_minmax_conv, ¶m); 979 } 980 981 /** 982 * struct do_proc_douintvec_minmax_conv_param - proc_douintvec_minmax() range checking structure 983 * @min: pointer to minimum allowable value 984 * @max: pointer to maximum allowable value 985 * 986 * The do_proc_douintvec_minmax_conv_param structure provides the 987 * minimum and maximum values for doing range checking for those sysctl 988 * parameters that use the proc_douintvec_minmax() handler. 989 */ 990 struct do_proc_douintvec_minmax_conv_param { 991 unsigned int *min; 992 unsigned int *max; 993 }; 994 995 static int do_proc_douintvec_minmax_conv(unsigned long *lvalp, 996 unsigned int *valp, 997 int write, void *data) 998 { 999 int ret; 1000 unsigned int tmp; 1001 struct do_proc_douintvec_minmax_conv_param *param = data; 1002 /* write via temporary local uint for bounds-checking */ 1003 unsigned int *up = write ? &tmp : valp; 1004 1005 ret = do_proc_douintvec_conv(lvalp, up, write, data); 1006 if (ret) 1007 return ret; 1008 1009 if (write) { 1010 if ((param->min && *param->min > tmp) || 1011 (param->max && *param->max < tmp)) 1012 return -ERANGE; 1013 1014 *valp = tmp; 1015 } 1016 1017 return 0; 1018 } 1019 1020 /** 1021 * proc_douintvec_minmax - read a vector of unsigned ints with min/max values 1022 * @table: the sysctl table 1023 * @write: %TRUE if this is a write to the sysctl file 1024 * @buffer: the user buffer 1025 * @lenp: the size of the user buffer 1026 * @ppos: file position 1027 * 1028 * Reads/writes up to table->maxlen/sizeof(unsigned int) unsigned integer 1029 * values from/to the user buffer, treated as an ASCII string. Negative 1030 * strings are not allowed. 1031 * 1032 * This routine will ensure the values are within the range specified by 1033 * table->extra1 (min) and table->extra2 (max). There is a final sanity 1034 * check for UINT_MAX to avoid having to support wrap around uses from 1035 * userspace. 1036 * 1037 * Returns 0 on success or -ERANGE on write when the range check fails. 1038 */ 1039 int proc_douintvec_minmax(struct ctl_table *table, int write, 1040 void *buffer, size_t *lenp, loff_t *ppos) 1041 { 1042 struct do_proc_douintvec_minmax_conv_param param = { 1043 .min = (unsigned int *) table->extra1, 1044 .max = (unsigned int *) table->extra2, 1045 }; 1046 return do_proc_douintvec(table, write, buffer, lenp, ppos, 1047 do_proc_douintvec_minmax_conv, ¶m); 1048 } 1049 1050 /** 1051 * proc_dou8vec_minmax - read a vector of unsigned chars with min/max values 1052 * @table: the sysctl table 1053 * @write: %TRUE if this is a write to the sysctl file 1054 * @buffer: the user buffer 1055 * @lenp: the size of the user buffer 1056 * @ppos: file position 1057 * 1058 * Reads/writes up to table->maxlen/sizeof(u8) unsigned chars 1059 * values from/to the user buffer, treated as an ASCII string. Negative 1060 * strings are not allowed. 1061 * 1062 * This routine will ensure the values are within the range specified by 1063 * table->extra1 (min) and table->extra2 (max). 1064 * 1065 * Returns 0 on success or an error on write when the range check fails. 1066 */ 1067 int proc_dou8vec_minmax(struct ctl_table *table, int write, 1068 void *buffer, size_t *lenp, loff_t *ppos) 1069 { 1070 struct ctl_table tmp; 1071 unsigned int min = 0, max = 255U, val; 1072 u8 *data = table->data; 1073 struct do_proc_douintvec_minmax_conv_param param = { 1074 .min = &min, 1075 .max = &max, 1076 }; 1077 int res; 1078 1079 /* Do not support arrays yet. */ 1080 if (table->maxlen != sizeof(u8)) 1081 return -EINVAL; 1082 1083 if (table->extra1) { 1084 min = *(unsigned int *) table->extra1; 1085 if (min > 255U) 1086 return -EINVAL; 1087 } 1088 if (table->extra2) { 1089 max = *(unsigned int *) table->extra2; 1090 if (max > 255U) 1091 return -EINVAL; 1092 } 1093 1094 tmp = *table; 1095 1096 tmp.maxlen = sizeof(val); 1097 tmp.data = &val; 1098 val = *data; 1099 res = do_proc_douintvec(&tmp, write, buffer, lenp, ppos, 1100 do_proc_douintvec_minmax_conv, ¶m); 1101 if (res) 1102 return res; 1103 if (write) 1104 *data = val; 1105 return 0; 1106 } 1107 EXPORT_SYMBOL_GPL(proc_dou8vec_minmax); 1108 1109 static int do_proc_dopipe_max_size_conv(unsigned long *lvalp, 1110 unsigned int *valp, 1111 int write, void *data) 1112 { 1113 if (write) { 1114 unsigned int val; 1115 1116 val = round_pipe_size(*lvalp); 1117 if (val == 0) 1118 return -EINVAL; 1119 1120 *valp = val; 1121 } else { 1122 unsigned int val = *valp; 1123 *lvalp = (unsigned long) val; 1124 } 1125 1126 return 0; 1127 } 1128 1129 static int proc_dopipe_max_size(struct ctl_table *table, int write, 1130 void *buffer, size_t *lenp, loff_t *ppos) 1131 { 1132 return do_proc_douintvec(table, write, buffer, lenp, ppos, 1133 do_proc_dopipe_max_size_conv, NULL); 1134 } 1135 1136 static void validate_coredump_safety(void) 1137 { 1138 #ifdef CONFIG_COREDUMP 1139 if (suid_dumpable == SUID_DUMP_ROOT && 1140 core_pattern[0] != '/' && core_pattern[0] != '|') { 1141 printk(KERN_WARNING 1142 "Unsafe core_pattern used with fs.suid_dumpable=2.\n" 1143 "Pipe handler or fully qualified core dump path required.\n" 1144 "Set kernel.core_pattern before fs.suid_dumpable.\n" 1145 ); 1146 } 1147 #endif 1148 } 1149 1150 static int proc_dointvec_minmax_coredump(struct ctl_table *table, int write, 1151 void *buffer, size_t *lenp, loff_t *ppos) 1152 { 1153 int error = proc_dointvec_minmax(table, write, buffer, lenp, ppos); 1154 if (!error) 1155 validate_coredump_safety(); 1156 return error; 1157 } 1158 1159 #ifdef CONFIG_COREDUMP 1160 static int proc_dostring_coredump(struct ctl_table *table, int write, 1161 void *buffer, size_t *lenp, loff_t *ppos) 1162 { 1163 int error = proc_dostring(table, write, buffer, lenp, ppos); 1164 if (!error) 1165 validate_coredump_safety(); 1166 return error; 1167 } 1168 #endif 1169 1170 #ifdef CONFIG_MAGIC_SYSRQ 1171 static int sysrq_sysctl_handler(struct ctl_table *table, int write, 1172 void *buffer, size_t *lenp, loff_t *ppos) 1173 { 1174 int tmp, ret; 1175 1176 tmp = sysrq_mask(); 1177 1178 ret = __do_proc_dointvec(&tmp, table, write, buffer, 1179 lenp, ppos, NULL, NULL); 1180 if (ret || !write) 1181 return ret; 1182 1183 if (write) 1184 sysrq_toggle_support(tmp); 1185 1186 return 0; 1187 } 1188 #endif 1189 1190 static int __do_proc_doulongvec_minmax(void *data, struct ctl_table *table, 1191 int write, void *buffer, size_t *lenp, loff_t *ppos, 1192 unsigned long convmul, unsigned long convdiv) 1193 { 1194 unsigned long *i, *min, *max; 1195 int vleft, first = 1, err = 0; 1196 size_t left; 1197 char *p; 1198 1199 if (!data || !table->maxlen || !*lenp || (*ppos && !write)) { 1200 *lenp = 0; 1201 return 0; 1202 } 1203 1204 i = (unsigned long *) data; 1205 min = (unsigned long *) table->extra1; 1206 max = (unsigned long *) table->extra2; 1207 vleft = table->maxlen / sizeof(unsigned long); 1208 left = *lenp; 1209 1210 if (write) { 1211 if (proc_first_pos_non_zero_ignore(ppos, table)) 1212 goto out; 1213 1214 if (left > PAGE_SIZE - 1) 1215 left = PAGE_SIZE - 1; 1216 p = buffer; 1217 } 1218 1219 for (; left && vleft--; i++, first = 0) { 1220 unsigned long val; 1221 1222 if (write) { 1223 bool neg; 1224 1225 left -= proc_skip_spaces(&p); 1226 if (!left) 1227 break; 1228 1229 err = proc_get_long(&p, &left, &val, &neg, 1230 proc_wspace_sep, 1231 sizeof(proc_wspace_sep), NULL); 1232 if (err) 1233 break; 1234 if (neg) 1235 continue; 1236 val = convmul * val / convdiv; 1237 if ((min && val < *min) || (max && val > *max)) { 1238 err = -EINVAL; 1239 break; 1240 } 1241 *i = val; 1242 } else { 1243 val = convdiv * (*i) / convmul; 1244 if (!first) 1245 proc_put_char(&buffer, &left, '\t'); 1246 proc_put_long(&buffer, &left, val, false); 1247 } 1248 } 1249 1250 if (!write && !first && left && !err) 1251 proc_put_char(&buffer, &left, '\n'); 1252 if (write && !err) 1253 left -= proc_skip_spaces(&p); 1254 if (write && first) 1255 return err ? : -EINVAL; 1256 *lenp -= left; 1257 out: 1258 *ppos += *lenp; 1259 return err; 1260 } 1261 1262 static int do_proc_doulongvec_minmax(struct ctl_table *table, int write, 1263 void *buffer, size_t *lenp, loff_t *ppos, unsigned long convmul, 1264 unsigned long convdiv) 1265 { 1266 return __do_proc_doulongvec_minmax(table->data, table, write, 1267 buffer, lenp, ppos, convmul, convdiv); 1268 } 1269 1270 /** 1271 * proc_doulongvec_minmax - read a vector of long integers with min/max values 1272 * @table: the sysctl table 1273 * @write: %TRUE if this is a write to the sysctl file 1274 * @buffer: the user buffer 1275 * @lenp: the size of the user buffer 1276 * @ppos: file position 1277 * 1278 * Reads/writes up to table->maxlen/sizeof(unsigned long) unsigned long 1279 * values from/to the user buffer, treated as an ASCII string. 1280 * 1281 * This routine will ensure the values are within the range specified by 1282 * table->extra1 (min) and table->extra2 (max). 1283 * 1284 * Returns 0 on success. 1285 */ 1286 int proc_doulongvec_minmax(struct ctl_table *table, int write, 1287 void *buffer, size_t *lenp, loff_t *ppos) 1288 { 1289 return do_proc_doulongvec_minmax(table, write, buffer, lenp, ppos, 1l, 1l); 1290 } 1291 1292 /** 1293 * proc_doulongvec_ms_jiffies_minmax - read a vector of millisecond values with min/max values 1294 * @table: the sysctl table 1295 * @write: %TRUE if this is a write to the sysctl file 1296 * @buffer: the user buffer 1297 * @lenp: the size of the user buffer 1298 * @ppos: file position 1299 * 1300 * Reads/writes up to table->maxlen/sizeof(unsigned long) unsigned long 1301 * values from/to the user buffer, treated as an ASCII string. The values 1302 * are treated as milliseconds, and converted to jiffies when they are stored. 1303 * 1304 * This routine will ensure the values are within the range specified by 1305 * table->extra1 (min) and table->extra2 (max). 1306 * 1307 * Returns 0 on success. 1308 */ 1309 int proc_doulongvec_ms_jiffies_minmax(struct ctl_table *table, int write, 1310 void *buffer, size_t *lenp, loff_t *ppos) 1311 { 1312 return do_proc_doulongvec_minmax(table, write, buffer, 1313 lenp, ppos, HZ, 1000l); 1314 } 1315 1316 1317 static int do_proc_dointvec_jiffies_conv(bool *negp, unsigned long *lvalp, 1318 int *valp, 1319 int write, void *data) 1320 { 1321 if (write) { 1322 if (*lvalp > INT_MAX / HZ) 1323 return 1; 1324 *valp = *negp ? -(*lvalp*HZ) : (*lvalp*HZ); 1325 } else { 1326 int val = *valp; 1327 unsigned long lval; 1328 if (val < 0) { 1329 *negp = true; 1330 lval = -(unsigned long)val; 1331 } else { 1332 *negp = false; 1333 lval = (unsigned long)val; 1334 } 1335 *lvalp = lval / HZ; 1336 } 1337 return 0; 1338 } 1339 1340 static int do_proc_dointvec_userhz_jiffies_conv(bool *negp, unsigned long *lvalp, 1341 int *valp, 1342 int write, void *data) 1343 { 1344 if (write) { 1345 if (USER_HZ < HZ && *lvalp > (LONG_MAX / HZ) * USER_HZ) 1346 return 1; 1347 *valp = clock_t_to_jiffies(*negp ? -*lvalp : *lvalp); 1348 } else { 1349 int val = *valp; 1350 unsigned long lval; 1351 if (val < 0) { 1352 *negp = true; 1353 lval = -(unsigned long)val; 1354 } else { 1355 *negp = false; 1356 lval = (unsigned long)val; 1357 } 1358 *lvalp = jiffies_to_clock_t(lval); 1359 } 1360 return 0; 1361 } 1362 1363 static int do_proc_dointvec_ms_jiffies_conv(bool *negp, unsigned long *lvalp, 1364 int *valp, 1365 int write, void *data) 1366 { 1367 if (write) { 1368 unsigned long jif = msecs_to_jiffies(*negp ? -*lvalp : *lvalp); 1369 1370 if (jif > INT_MAX) 1371 return 1; 1372 *valp = (int)jif; 1373 } else { 1374 int val = *valp; 1375 unsigned long lval; 1376 if (val < 0) { 1377 *negp = true; 1378 lval = -(unsigned long)val; 1379 } else { 1380 *negp = false; 1381 lval = (unsigned long)val; 1382 } 1383 *lvalp = jiffies_to_msecs(lval); 1384 } 1385 return 0; 1386 } 1387 1388 /** 1389 * proc_dointvec_jiffies - read a vector of integers as seconds 1390 * @table: the sysctl table 1391 * @write: %TRUE if this is a write to the sysctl file 1392 * @buffer: the user buffer 1393 * @lenp: the size of the user buffer 1394 * @ppos: file position 1395 * 1396 * Reads/writes up to table->maxlen/sizeof(unsigned int) integer 1397 * values from/to the user buffer, treated as an ASCII string. 1398 * The values read are assumed to be in seconds, and are converted into 1399 * jiffies. 1400 * 1401 * Returns 0 on success. 1402 */ 1403 int proc_dointvec_jiffies(struct ctl_table *table, int write, 1404 void *buffer, size_t *lenp, loff_t *ppos) 1405 { 1406 return do_proc_dointvec(table,write,buffer,lenp,ppos, 1407 do_proc_dointvec_jiffies_conv,NULL); 1408 } 1409 1410 /** 1411 * proc_dointvec_userhz_jiffies - read a vector of integers as 1/USER_HZ seconds 1412 * @table: the sysctl table 1413 * @write: %TRUE if this is a write to the sysctl file 1414 * @buffer: the user buffer 1415 * @lenp: the size of the user buffer 1416 * @ppos: pointer to the file position 1417 * 1418 * Reads/writes up to table->maxlen/sizeof(unsigned int) integer 1419 * values from/to the user buffer, treated as an ASCII string. 1420 * The values read are assumed to be in 1/USER_HZ seconds, and 1421 * are converted into jiffies. 1422 * 1423 * Returns 0 on success. 1424 */ 1425 int proc_dointvec_userhz_jiffies(struct ctl_table *table, int write, 1426 void *buffer, size_t *lenp, loff_t *ppos) 1427 { 1428 return do_proc_dointvec(table,write,buffer,lenp,ppos, 1429 do_proc_dointvec_userhz_jiffies_conv,NULL); 1430 } 1431 1432 /** 1433 * proc_dointvec_ms_jiffies - read a vector of integers as 1 milliseconds 1434 * @table: the sysctl table 1435 * @write: %TRUE if this is a write to the sysctl file 1436 * @buffer: the user buffer 1437 * @lenp: the size of the user buffer 1438 * @ppos: file position 1439 * @ppos: the current position in the file 1440 * 1441 * Reads/writes up to table->maxlen/sizeof(unsigned int) integer 1442 * values from/to the user buffer, treated as an ASCII string. 1443 * The values read are assumed to be in 1/1000 seconds, and 1444 * are converted into jiffies. 1445 * 1446 * Returns 0 on success. 1447 */ 1448 int proc_dointvec_ms_jiffies(struct ctl_table *table, int write, void *buffer, 1449 size_t *lenp, loff_t *ppos) 1450 { 1451 return do_proc_dointvec(table, write, buffer, lenp, ppos, 1452 do_proc_dointvec_ms_jiffies_conv, NULL); 1453 } 1454 1455 static int proc_do_cad_pid(struct ctl_table *table, int write, void *buffer, 1456 size_t *lenp, loff_t *ppos) 1457 { 1458 struct pid *new_pid; 1459 pid_t tmp; 1460 int r; 1461 1462 tmp = pid_vnr(cad_pid); 1463 1464 r = __do_proc_dointvec(&tmp, table, write, buffer, 1465 lenp, ppos, NULL, NULL); 1466 if (r || !write) 1467 return r; 1468 1469 new_pid = find_get_pid(tmp); 1470 if (!new_pid) 1471 return -ESRCH; 1472 1473 put_pid(xchg(&cad_pid, new_pid)); 1474 return 0; 1475 } 1476 1477 /** 1478 * proc_do_large_bitmap - read/write from/to a large bitmap 1479 * @table: the sysctl table 1480 * @write: %TRUE if this is a write to the sysctl file 1481 * @buffer: the user buffer 1482 * @lenp: the size of the user buffer 1483 * @ppos: file position 1484 * 1485 * The bitmap is stored at table->data and the bitmap length (in bits) 1486 * in table->maxlen. 1487 * 1488 * We use a range comma separated format (e.g. 1,3-4,10-10) so that 1489 * large bitmaps may be represented in a compact manner. Writing into 1490 * the file will clear the bitmap then update it with the given input. 1491 * 1492 * Returns 0 on success. 1493 */ 1494 int proc_do_large_bitmap(struct ctl_table *table, int write, 1495 void *buffer, size_t *lenp, loff_t *ppos) 1496 { 1497 int err = 0; 1498 size_t left = *lenp; 1499 unsigned long bitmap_len = table->maxlen; 1500 unsigned long *bitmap = *(unsigned long **) table->data; 1501 unsigned long *tmp_bitmap = NULL; 1502 char tr_a[] = { '-', ',', '\n' }, tr_b[] = { ',', '\n', 0 }, c; 1503 1504 if (!bitmap || !bitmap_len || !left || (*ppos && !write)) { 1505 *lenp = 0; 1506 return 0; 1507 } 1508 1509 if (write) { 1510 char *p = buffer; 1511 size_t skipped = 0; 1512 1513 if (left > PAGE_SIZE - 1) { 1514 left = PAGE_SIZE - 1; 1515 /* How much of the buffer we'll skip this pass */ 1516 skipped = *lenp - left; 1517 } 1518 1519 tmp_bitmap = bitmap_zalloc(bitmap_len, GFP_KERNEL); 1520 if (!tmp_bitmap) 1521 return -ENOMEM; 1522 proc_skip_char(&p, &left, '\n'); 1523 while (!err && left) { 1524 unsigned long val_a, val_b; 1525 bool neg; 1526 size_t saved_left; 1527 1528 /* In case we stop parsing mid-number, we can reset */ 1529 saved_left = left; 1530 err = proc_get_long(&p, &left, &val_a, &neg, tr_a, 1531 sizeof(tr_a), &c); 1532 /* 1533 * If we consumed the entirety of a truncated buffer or 1534 * only one char is left (may be a "-"), then stop here, 1535 * reset, & come back for more. 1536 */ 1537 if ((left <= 1) && skipped) { 1538 left = saved_left; 1539 break; 1540 } 1541 1542 if (err) 1543 break; 1544 if (val_a >= bitmap_len || neg) { 1545 err = -EINVAL; 1546 break; 1547 } 1548 1549 val_b = val_a; 1550 if (left) { 1551 p++; 1552 left--; 1553 } 1554 1555 if (c == '-') { 1556 err = proc_get_long(&p, &left, &val_b, 1557 &neg, tr_b, sizeof(tr_b), 1558 &c); 1559 /* 1560 * If we consumed all of a truncated buffer or 1561 * then stop here, reset, & come back for more. 1562 */ 1563 if (!left && skipped) { 1564 left = saved_left; 1565 break; 1566 } 1567 1568 if (err) 1569 break; 1570 if (val_b >= bitmap_len || neg || 1571 val_a > val_b) { 1572 err = -EINVAL; 1573 break; 1574 } 1575 if (left) { 1576 p++; 1577 left--; 1578 } 1579 } 1580 1581 bitmap_set(tmp_bitmap, val_a, val_b - val_a + 1); 1582 proc_skip_char(&p, &left, '\n'); 1583 } 1584 left += skipped; 1585 } else { 1586 unsigned long bit_a, bit_b = 0; 1587 bool first = 1; 1588 1589 while (left) { 1590 bit_a = find_next_bit(bitmap, bitmap_len, bit_b); 1591 if (bit_a >= bitmap_len) 1592 break; 1593 bit_b = find_next_zero_bit(bitmap, bitmap_len, 1594 bit_a + 1) - 1; 1595 1596 if (!first) 1597 proc_put_char(&buffer, &left, ','); 1598 proc_put_long(&buffer, &left, bit_a, false); 1599 if (bit_a != bit_b) { 1600 proc_put_char(&buffer, &left, '-'); 1601 proc_put_long(&buffer, &left, bit_b, false); 1602 } 1603 1604 first = 0; bit_b++; 1605 } 1606 proc_put_char(&buffer, &left, '\n'); 1607 } 1608 1609 if (!err) { 1610 if (write) { 1611 if (*ppos) 1612 bitmap_or(bitmap, bitmap, tmp_bitmap, bitmap_len); 1613 else 1614 bitmap_copy(bitmap, tmp_bitmap, bitmap_len); 1615 } 1616 *lenp -= left; 1617 *ppos += *lenp; 1618 } 1619 1620 bitmap_free(tmp_bitmap); 1621 return err; 1622 } 1623 1624 #else /* CONFIG_PROC_SYSCTL */ 1625 1626 int proc_dostring(struct ctl_table *table, int write, 1627 void *buffer, size_t *lenp, loff_t *ppos) 1628 { 1629 return -ENOSYS; 1630 } 1631 1632 int proc_dointvec(struct ctl_table *table, int write, 1633 void *buffer, size_t *lenp, loff_t *ppos) 1634 { 1635 return -ENOSYS; 1636 } 1637 1638 int proc_douintvec(struct ctl_table *table, int write, 1639 void *buffer, size_t *lenp, loff_t *ppos) 1640 { 1641 return -ENOSYS; 1642 } 1643 1644 int proc_dointvec_minmax(struct ctl_table *table, int write, 1645 void *buffer, size_t *lenp, loff_t *ppos) 1646 { 1647 return -ENOSYS; 1648 } 1649 1650 int proc_douintvec_minmax(struct ctl_table *table, int write, 1651 void *buffer, size_t *lenp, loff_t *ppos) 1652 { 1653 return -ENOSYS; 1654 } 1655 1656 int proc_dou8vec_minmax(struct ctl_table *table, int write, 1657 void *buffer, size_t *lenp, loff_t *ppos) 1658 { 1659 return -ENOSYS; 1660 } 1661 1662 int proc_dointvec_jiffies(struct ctl_table *table, int write, 1663 void *buffer, size_t *lenp, loff_t *ppos) 1664 { 1665 return -ENOSYS; 1666 } 1667 1668 int proc_dointvec_userhz_jiffies(struct ctl_table *table, int write, 1669 void *buffer, size_t *lenp, loff_t *ppos) 1670 { 1671 return -ENOSYS; 1672 } 1673 1674 int proc_dointvec_ms_jiffies(struct ctl_table *table, int write, 1675 void *buffer, size_t *lenp, loff_t *ppos) 1676 { 1677 return -ENOSYS; 1678 } 1679 1680 int proc_doulongvec_minmax(struct ctl_table *table, int write, 1681 void *buffer, size_t *lenp, loff_t *ppos) 1682 { 1683 return -ENOSYS; 1684 } 1685 1686 int proc_doulongvec_ms_jiffies_minmax(struct ctl_table *table, int write, 1687 void *buffer, size_t *lenp, loff_t *ppos) 1688 { 1689 return -ENOSYS; 1690 } 1691 1692 int proc_do_large_bitmap(struct ctl_table *table, int write, 1693 void *buffer, size_t *lenp, loff_t *ppos) 1694 { 1695 return -ENOSYS; 1696 } 1697 1698 #endif /* CONFIG_PROC_SYSCTL */ 1699 1700 #if defined(CONFIG_SYSCTL) 1701 int proc_do_static_key(struct ctl_table *table, int write, 1702 void *buffer, size_t *lenp, loff_t *ppos) 1703 { 1704 struct static_key *key = (struct static_key *)table->data; 1705 static DEFINE_MUTEX(static_key_mutex); 1706 int val, ret; 1707 struct ctl_table tmp = { 1708 .data = &val, 1709 .maxlen = sizeof(val), 1710 .mode = table->mode, 1711 .extra1 = SYSCTL_ZERO, 1712 .extra2 = SYSCTL_ONE, 1713 }; 1714 1715 if (write && !capable(CAP_SYS_ADMIN)) 1716 return -EPERM; 1717 1718 mutex_lock(&static_key_mutex); 1719 val = static_key_enabled(key); 1720 ret = proc_dointvec_minmax(&tmp, write, buffer, lenp, ppos); 1721 if (write && !ret) { 1722 if (val) 1723 static_key_enable(key); 1724 else 1725 static_key_disable(key); 1726 } 1727 mutex_unlock(&static_key_mutex); 1728 return ret; 1729 } 1730 1731 static struct ctl_table kern_table[] = { 1732 { 1733 .procname = "sched_child_runs_first", 1734 .data = &sysctl_sched_child_runs_first, 1735 .maxlen = sizeof(unsigned int), 1736 .mode = 0644, 1737 .proc_handler = proc_dointvec, 1738 }, 1739 #ifdef CONFIG_SCHEDSTATS 1740 { 1741 .procname = "sched_schedstats", 1742 .data = NULL, 1743 .maxlen = sizeof(unsigned int), 1744 .mode = 0644, 1745 .proc_handler = sysctl_schedstats, 1746 .extra1 = SYSCTL_ZERO, 1747 .extra2 = SYSCTL_ONE, 1748 }, 1749 #endif /* CONFIG_SCHEDSTATS */ 1750 #ifdef CONFIG_NUMA_BALANCING 1751 { 1752 .procname = "numa_balancing", 1753 .data = NULL, /* filled in by handler */ 1754 .maxlen = sizeof(unsigned int), 1755 .mode = 0644, 1756 .proc_handler = sysctl_numa_balancing, 1757 .extra1 = SYSCTL_ZERO, 1758 .extra2 = SYSCTL_ONE, 1759 }, 1760 #endif /* CONFIG_NUMA_BALANCING */ 1761 { 1762 .procname = "sched_rt_period_us", 1763 .data = &sysctl_sched_rt_period, 1764 .maxlen = sizeof(unsigned int), 1765 .mode = 0644, 1766 .proc_handler = sched_rt_handler, 1767 }, 1768 { 1769 .procname = "sched_rt_runtime_us", 1770 .data = &sysctl_sched_rt_runtime, 1771 .maxlen = sizeof(int), 1772 .mode = 0644, 1773 .proc_handler = sched_rt_handler, 1774 }, 1775 { 1776 .procname = "sched_deadline_period_max_us", 1777 .data = &sysctl_sched_dl_period_max, 1778 .maxlen = sizeof(unsigned int), 1779 .mode = 0644, 1780 .proc_handler = proc_dointvec, 1781 }, 1782 { 1783 .procname = "sched_deadline_period_min_us", 1784 .data = &sysctl_sched_dl_period_min, 1785 .maxlen = sizeof(unsigned int), 1786 .mode = 0644, 1787 .proc_handler = proc_dointvec, 1788 }, 1789 { 1790 .procname = "sched_rr_timeslice_ms", 1791 .data = &sysctl_sched_rr_timeslice, 1792 .maxlen = sizeof(int), 1793 .mode = 0644, 1794 .proc_handler = sched_rr_handler, 1795 }, 1796 #ifdef CONFIG_UCLAMP_TASK 1797 { 1798 .procname = "sched_util_clamp_min", 1799 .data = &sysctl_sched_uclamp_util_min, 1800 .maxlen = sizeof(unsigned int), 1801 .mode = 0644, 1802 .proc_handler = sysctl_sched_uclamp_handler, 1803 }, 1804 { 1805 .procname = "sched_util_clamp_max", 1806 .data = &sysctl_sched_uclamp_util_max, 1807 .maxlen = sizeof(unsigned int), 1808 .mode = 0644, 1809 .proc_handler = sysctl_sched_uclamp_handler, 1810 }, 1811 { 1812 .procname = "sched_util_clamp_min_rt_default", 1813 .data = &sysctl_sched_uclamp_util_min_rt_default, 1814 .maxlen = sizeof(unsigned int), 1815 .mode = 0644, 1816 .proc_handler = sysctl_sched_uclamp_handler, 1817 }, 1818 #endif 1819 #ifdef CONFIG_SCHED_AUTOGROUP 1820 { 1821 .procname = "sched_autogroup_enabled", 1822 .data = &sysctl_sched_autogroup_enabled, 1823 .maxlen = sizeof(unsigned int), 1824 .mode = 0644, 1825 .proc_handler = proc_dointvec_minmax, 1826 .extra1 = SYSCTL_ZERO, 1827 .extra2 = SYSCTL_ONE, 1828 }, 1829 #endif 1830 #ifdef CONFIG_CFS_BANDWIDTH 1831 { 1832 .procname = "sched_cfs_bandwidth_slice_us", 1833 .data = &sysctl_sched_cfs_bandwidth_slice, 1834 .maxlen = sizeof(unsigned int), 1835 .mode = 0644, 1836 .proc_handler = proc_dointvec_minmax, 1837 .extra1 = SYSCTL_ONE, 1838 }, 1839 #endif 1840 #if defined(CONFIG_ENERGY_MODEL) && defined(CONFIG_CPU_FREQ_GOV_SCHEDUTIL) 1841 { 1842 .procname = "sched_energy_aware", 1843 .data = &sysctl_sched_energy_aware, 1844 .maxlen = sizeof(unsigned int), 1845 .mode = 0644, 1846 .proc_handler = sched_energy_aware_handler, 1847 .extra1 = SYSCTL_ZERO, 1848 .extra2 = SYSCTL_ONE, 1849 }, 1850 #endif 1851 #ifdef CONFIG_PROVE_LOCKING 1852 { 1853 .procname = "prove_locking", 1854 .data = &prove_locking, 1855 .maxlen = sizeof(int), 1856 .mode = 0644, 1857 .proc_handler = proc_dointvec, 1858 }, 1859 #endif 1860 #ifdef CONFIG_LOCK_STAT 1861 { 1862 .procname = "lock_stat", 1863 .data = &lock_stat, 1864 .maxlen = sizeof(int), 1865 .mode = 0644, 1866 .proc_handler = proc_dointvec, 1867 }, 1868 #endif 1869 { 1870 .procname = "panic", 1871 .data = &panic_timeout, 1872 .maxlen = sizeof(int), 1873 .mode = 0644, 1874 .proc_handler = proc_dointvec, 1875 }, 1876 #ifdef CONFIG_COREDUMP 1877 { 1878 .procname = "core_uses_pid", 1879 .data = &core_uses_pid, 1880 .maxlen = sizeof(int), 1881 .mode = 0644, 1882 .proc_handler = proc_dointvec, 1883 }, 1884 { 1885 .procname = "core_pattern", 1886 .data = core_pattern, 1887 .maxlen = CORENAME_MAX_SIZE, 1888 .mode = 0644, 1889 .proc_handler = proc_dostring_coredump, 1890 }, 1891 { 1892 .procname = "core_pipe_limit", 1893 .data = &core_pipe_limit, 1894 .maxlen = sizeof(unsigned int), 1895 .mode = 0644, 1896 .proc_handler = proc_dointvec, 1897 }, 1898 #endif 1899 #ifdef CONFIG_PROC_SYSCTL 1900 { 1901 .procname = "tainted", 1902 .maxlen = sizeof(long), 1903 .mode = 0644, 1904 .proc_handler = proc_taint, 1905 }, 1906 { 1907 .procname = "sysctl_writes_strict", 1908 .data = &sysctl_writes_strict, 1909 .maxlen = sizeof(int), 1910 .mode = 0644, 1911 .proc_handler = proc_dointvec_minmax, 1912 .extra1 = &neg_one, 1913 .extra2 = SYSCTL_ONE, 1914 }, 1915 #endif 1916 #ifdef CONFIG_LATENCYTOP 1917 { 1918 .procname = "latencytop", 1919 .data = &latencytop_enabled, 1920 .maxlen = sizeof(int), 1921 .mode = 0644, 1922 .proc_handler = sysctl_latencytop, 1923 }, 1924 #endif 1925 #ifdef CONFIG_BLK_DEV_INITRD 1926 { 1927 .procname = "real-root-dev", 1928 .data = &real_root_dev, 1929 .maxlen = sizeof(int), 1930 .mode = 0644, 1931 .proc_handler = proc_dointvec, 1932 }, 1933 #endif 1934 { 1935 .procname = "print-fatal-signals", 1936 .data = &print_fatal_signals, 1937 .maxlen = sizeof(int), 1938 .mode = 0644, 1939 .proc_handler = proc_dointvec, 1940 }, 1941 #ifdef CONFIG_SPARC 1942 { 1943 .procname = "reboot-cmd", 1944 .data = reboot_command, 1945 .maxlen = 256, 1946 .mode = 0644, 1947 .proc_handler = proc_dostring, 1948 }, 1949 { 1950 .procname = "stop-a", 1951 .data = &stop_a_enabled, 1952 .maxlen = sizeof (int), 1953 .mode = 0644, 1954 .proc_handler = proc_dointvec, 1955 }, 1956 { 1957 .procname = "scons-poweroff", 1958 .data = &scons_pwroff, 1959 .maxlen = sizeof (int), 1960 .mode = 0644, 1961 .proc_handler = proc_dointvec, 1962 }, 1963 #endif 1964 #ifdef CONFIG_SPARC64 1965 { 1966 .procname = "tsb-ratio", 1967 .data = &sysctl_tsb_ratio, 1968 .maxlen = sizeof (int), 1969 .mode = 0644, 1970 .proc_handler = proc_dointvec, 1971 }, 1972 #endif 1973 #ifdef CONFIG_PARISC 1974 { 1975 .procname = "soft-power", 1976 .data = &pwrsw_enabled, 1977 .maxlen = sizeof (int), 1978 .mode = 0644, 1979 .proc_handler = proc_dointvec, 1980 }, 1981 #endif 1982 #ifdef CONFIG_SYSCTL_ARCH_UNALIGN_ALLOW 1983 { 1984 .procname = "unaligned-trap", 1985 .data = &unaligned_enabled, 1986 .maxlen = sizeof (int), 1987 .mode = 0644, 1988 .proc_handler = proc_dointvec, 1989 }, 1990 #endif 1991 { 1992 .procname = "ctrl-alt-del", 1993 .data = &C_A_D, 1994 .maxlen = sizeof(int), 1995 .mode = 0644, 1996 .proc_handler = proc_dointvec, 1997 }, 1998 #ifdef CONFIG_FUNCTION_TRACER 1999 { 2000 .procname = "ftrace_enabled", 2001 .data = &ftrace_enabled, 2002 .maxlen = sizeof(int), 2003 .mode = 0644, 2004 .proc_handler = ftrace_enable_sysctl, 2005 }, 2006 #endif 2007 #ifdef CONFIG_STACK_TRACER 2008 { 2009 .procname = "stack_tracer_enabled", 2010 .data = &stack_tracer_enabled, 2011 .maxlen = sizeof(int), 2012 .mode = 0644, 2013 .proc_handler = stack_trace_sysctl, 2014 }, 2015 #endif 2016 #ifdef CONFIG_TRACING 2017 { 2018 .procname = "ftrace_dump_on_oops", 2019 .data = &ftrace_dump_on_oops, 2020 .maxlen = sizeof(int), 2021 .mode = 0644, 2022 .proc_handler = proc_dointvec, 2023 }, 2024 { 2025 .procname = "traceoff_on_warning", 2026 .data = &__disable_trace_on_warning, 2027 .maxlen = sizeof(__disable_trace_on_warning), 2028 .mode = 0644, 2029 .proc_handler = proc_dointvec, 2030 }, 2031 { 2032 .procname = "tracepoint_printk", 2033 .data = &tracepoint_printk, 2034 .maxlen = sizeof(tracepoint_printk), 2035 .mode = 0644, 2036 .proc_handler = tracepoint_printk_sysctl, 2037 }, 2038 #endif 2039 #ifdef CONFIG_KEXEC_CORE 2040 { 2041 .procname = "kexec_load_disabled", 2042 .data = &kexec_load_disabled, 2043 .maxlen = sizeof(int), 2044 .mode = 0644, 2045 /* only handle a transition from default "0" to "1" */ 2046 .proc_handler = proc_dointvec_minmax, 2047 .extra1 = SYSCTL_ONE, 2048 .extra2 = SYSCTL_ONE, 2049 }, 2050 #endif 2051 #ifdef CONFIG_MODULES 2052 { 2053 .procname = "modprobe", 2054 .data = &modprobe_path, 2055 .maxlen = KMOD_PATH_LEN, 2056 .mode = 0644, 2057 .proc_handler = proc_dostring, 2058 }, 2059 { 2060 .procname = "modules_disabled", 2061 .data = &modules_disabled, 2062 .maxlen = sizeof(int), 2063 .mode = 0644, 2064 /* only handle a transition from default "0" to "1" */ 2065 .proc_handler = proc_dointvec_minmax, 2066 .extra1 = SYSCTL_ONE, 2067 .extra2 = SYSCTL_ONE, 2068 }, 2069 #endif 2070 #ifdef CONFIG_UEVENT_HELPER 2071 { 2072 .procname = "hotplug", 2073 .data = &uevent_helper, 2074 .maxlen = UEVENT_HELPER_PATH_LEN, 2075 .mode = 0644, 2076 .proc_handler = proc_dostring, 2077 }, 2078 #endif 2079 #ifdef CONFIG_CHR_DEV_SG 2080 { 2081 .procname = "sg-big-buff", 2082 .data = &sg_big_buff, 2083 .maxlen = sizeof (int), 2084 .mode = 0444, 2085 .proc_handler = proc_dointvec, 2086 }, 2087 #endif 2088 #ifdef CONFIG_BSD_PROCESS_ACCT 2089 { 2090 .procname = "acct", 2091 .data = &acct_parm, 2092 .maxlen = 3*sizeof(int), 2093 .mode = 0644, 2094 .proc_handler = proc_dointvec, 2095 }, 2096 #endif 2097 #ifdef CONFIG_MAGIC_SYSRQ 2098 { 2099 .procname = "sysrq", 2100 .data = NULL, 2101 .maxlen = sizeof (int), 2102 .mode = 0644, 2103 .proc_handler = sysrq_sysctl_handler, 2104 }, 2105 #endif 2106 #ifdef CONFIG_PROC_SYSCTL 2107 { 2108 .procname = "cad_pid", 2109 .data = NULL, 2110 .maxlen = sizeof (int), 2111 .mode = 0600, 2112 .proc_handler = proc_do_cad_pid, 2113 }, 2114 #endif 2115 { 2116 .procname = "threads-max", 2117 .data = NULL, 2118 .maxlen = sizeof(int), 2119 .mode = 0644, 2120 .proc_handler = sysctl_max_threads, 2121 }, 2122 { 2123 .procname = "random", 2124 .mode = 0555, 2125 .child = random_table, 2126 }, 2127 { 2128 .procname = "usermodehelper", 2129 .mode = 0555, 2130 .child = usermodehelper_table, 2131 }, 2132 #ifdef CONFIG_FW_LOADER_USER_HELPER 2133 { 2134 .procname = "firmware_config", 2135 .mode = 0555, 2136 .child = firmware_config_table, 2137 }, 2138 #endif 2139 { 2140 .procname = "overflowuid", 2141 .data = &overflowuid, 2142 .maxlen = sizeof(int), 2143 .mode = 0644, 2144 .proc_handler = proc_dointvec_minmax, 2145 .extra1 = &minolduid, 2146 .extra2 = &maxolduid, 2147 }, 2148 { 2149 .procname = "overflowgid", 2150 .data = &overflowgid, 2151 .maxlen = sizeof(int), 2152 .mode = 0644, 2153 .proc_handler = proc_dointvec_minmax, 2154 .extra1 = &minolduid, 2155 .extra2 = &maxolduid, 2156 }, 2157 #ifdef CONFIG_S390 2158 { 2159 .procname = "userprocess_debug", 2160 .data = &show_unhandled_signals, 2161 .maxlen = sizeof(int), 2162 .mode = 0644, 2163 .proc_handler = proc_dointvec, 2164 }, 2165 #endif 2166 #ifdef CONFIG_SMP 2167 { 2168 .procname = "oops_all_cpu_backtrace", 2169 .data = &sysctl_oops_all_cpu_backtrace, 2170 .maxlen = sizeof(int), 2171 .mode = 0644, 2172 .proc_handler = proc_dointvec_minmax, 2173 .extra1 = SYSCTL_ZERO, 2174 .extra2 = SYSCTL_ONE, 2175 }, 2176 #endif /* CONFIG_SMP */ 2177 { 2178 .procname = "pid_max", 2179 .data = &pid_max, 2180 .maxlen = sizeof (int), 2181 .mode = 0644, 2182 .proc_handler = proc_dointvec_minmax, 2183 .extra1 = &pid_max_min, 2184 .extra2 = &pid_max_max, 2185 }, 2186 { 2187 .procname = "panic_on_oops", 2188 .data = &panic_on_oops, 2189 .maxlen = sizeof(int), 2190 .mode = 0644, 2191 .proc_handler = proc_dointvec, 2192 }, 2193 { 2194 .procname = "panic_print", 2195 .data = &panic_print, 2196 .maxlen = sizeof(unsigned long), 2197 .mode = 0644, 2198 .proc_handler = proc_doulongvec_minmax, 2199 }, 2200 #if defined CONFIG_PRINTK 2201 { 2202 .procname = "printk", 2203 .data = &console_loglevel, 2204 .maxlen = 4*sizeof(int), 2205 .mode = 0644, 2206 .proc_handler = proc_dointvec, 2207 }, 2208 { 2209 .procname = "printk_ratelimit", 2210 .data = &printk_ratelimit_state.interval, 2211 .maxlen = sizeof(int), 2212 .mode = 0644, 2213 .proc_handler = proc_dointvec_jiffies, 2214 }, 2215 { 2216 .procname = "printk_ratelimit_burst", 2217 .data = &printk_ratelimit_state.burst, 2218 .maxlen = sizeof(int), 2219 .mode = 0644, 2220 .proc_handler = proc_dointvec, 2221 }, 2222 { 2223 .procname = "printk_delay", 2224 .data = &printk_delay_msec, 2225 .maxlen = sizeof(int), 2226 .mode = 0644, 2227 .proc_handler = proc_dointvec_minmax, 2228 .extra1 = SYSCTL_ZERO, 2229 .extra2 = &ten_thousand, 2230 }, 2231 { 2232 .procname = "printk_devkmsg", 2233 .data = devkmsg_log_str, 2234 .maxlen = DEVKMSG_STR_MAX_SIZE, 2235 .mode = 0644, 2236 .proc_handler = devkmsg_sysctl_set_loglvl, 2237 }, 2238 { 2239 .procname = "dmesg_restrict", 2240 .data = &dmesg_restrict, 2241 .maxlen = sizeof(int), 2242 .mode = 0644, 2243 .proc_handler = proc_dointvec_minmax_sysadmin, 2244 .extra1 = SYSCTL_ZERO, 2245 .extra2 = SYSCTL_ONE, 2246 }, 2247 { 2248 .procname = "kptr_restrict", 2249 .data = &kptr_restrict, 2250 .maxlen = sizeof(int), 2251 .mode = 0644, 2252 .proc_handler = proc_dointvec_minmax_sysadmin, 2253 .extra1 = SYSCTL_ZERO, 2254 .extra2 = &two, 2255 }, 2256 #endif 2257 { 2258 .procname = "ngroups_max", 2259 .data = &ngroups_max, 2260 .maxlen = sizeof (int), 2261 .mode = 0444, 2262 .proc_handler = proc_dointvec, 2263 }, 2264 { 2265 .procname = "cap_last_cap", 2266 .data = (void *)&cap_last_cap, 2267 .maxlen = sizeof(int), 2268 .mode = 0444, 2269 .proc_handler = proc_dointvec, 2270 }, 2271 #if defined(CONFIG_LOCKUP_DETECTOR) 2272 { 2273 .procname = "watchdog", 2274 .data = &watchdog_user_enabled, 2275 .maxlen = sizeof(int), 2276 .mode = 0644, 2277 .proc_handler = proc_watchdog, 2278 .extra1 = SYSCTL_ZERO, 2279 .extra2 = SYSCTL_ONE, 2280 }, 2281 { 2282 .procname = "watchdog_thresh", 2283 .data = &watchdog_thresh, 2284 .maxlen = sizeof(int), 2285 .mode = 0644, 2286 .proc_handler = proc_watchdog_thresh, 2287 .extra1 = SYSCTL_ZERO, 2288 .extra2 = &sixty, 2289 }, 2290 { 2291 .procname = "nmi_watchdog", 2292 .data = &nmi_watchdog_user_enabled, 2293 .maxlen = sizeof(int), 2294 .mode = NMI_WATCHDOG_SYSCTL_PERM, 2295 .proc_handler = proc_nmi_watchdog, 2296 .extra1 = SYSCTL_ZERO, 2297 .extra2 = SYSCTL_ONE, 2298 }, 2299 { 2300 .procname = "watchdog_cpumask", 2301 .data = &watchdog_cpumask_bits, 2302 .maxlen = NR_CPUS, 2303 .mode = 0644, 2304 .proc_handler = proc_watchdog_cpumask, 2305 }, 2306 #ifdef CONFIG_SOFTLOCKUP_DETECTOR 2307 { 2308 .procname = "soft_watchdog", 2309 .data = &soft_watchdog_user_enabled, 2310 .maxlen = sizeof(int), 2311 .mode = 0644, 2312 .proc_handler = proc_soft_watchdog, 2313 .extra1 = SYSCTL_ZERO, 2314 .extra2 = SYSCTL_ONE, 2315 }, 2316 { 2317 .procname = "softlockup_panic", 2318 .data = &softlockup_panic, 2319 .maxlen = sizeof(int), 2320 .mode = 0644, 2321 .proc_handler = proc_dointvec_minmax, 2322 .extra1 = SYSCTL_ZERO, 2323 .extra2 = SYSCTL_ONE, 2324 }, 2325 #ifdef CONFIG_SMP 2326 { 2327 .procname = "softlockup_all_cpu_backtrace", 2328 .data = &sysctl_softlockup_all_cpu_backtrace, 2329 .maxlen = sizeof(int), 2330 .mode = 0644, 2331 .proc_handler = proc_dointvec_minmax, 2332 .extra1 = SYSCTL_ZERO, 2333 .extra2 = SYSCTL_ONE, 2334 }, 2335 #endif /* CONFIG_SMP */ 2336 #endif 2337 #ifdef CONFIG_HARDLOCKUP_DETECTOR 2338 { 2339 .procname = "hardlockup_panic", 2340 .data = &hardlockup_panic, 2341 .maxlen = sizeof(int), 2342 .mode = 0644, 2343 .proc_handler = proc_dointvec_minmax, 2344 .extra1 = SYSCTL_ZERO, 2345 .extra2 = SYSCTL_ONE, 2346 }, 2347 #ifdef CONFIG_SMP 2348 { 2349 .procname = "hardlockup_all_cpu_backtrace", 2350 .data = &sysctl_hardlockup_all_cpu_backtrace, 2351 .maxlen = sizeof(int), 2352 .mode = 0644, 2353 .proc_handler = proc_dointvec_minmax, 2354 .extra1 = SYSCTL_ZERO, 2355 .extra2 = SYSCTL_ONE, 2356 }, 2357 #endif /* CONFIG_SMP */ 2358 #endif 2359 #endif 2360 2361 #if defined(CONFIG_X86_LOCAL_APIC) && defined(CONFIG_X86) 2362 { 2363 .procname = "unknown_nmi_panic", 2364 .data = &unknown_nmi_panic, 2365 .maxlen = sizeof (int), 2366 .mode = 0644, 2367 .proc_handler = proc_dointvec, 2368 }, 2369 #endif 2370 2371 #if (defined(CONFIG_X86_32) || defined(CONFIG_PARISC)) && \ 2372 defined(CONFIG_DEBUG_STACKOVERFLOW) 2373 { 2374 .procname = "panic_on_stackoverflow", 2375 .data = &sysctl_panic_on_stackoverflow, 2376 .maxlen = sizeof(int), 2377 .mode = 0644, 2378 .proc_handler = proc_dointvec, 2379 }, 2380 #endif 2381 #if defined(CONFIG_X86) 2382 { 2383 .procname = "panic_on_unrecovered_nmi", 2384 .data = &panic_on_unrecovered_nmi, 2385 .maxlen = sizeof(int), 2386 .mode = 0644, 2387 .proc_handler = proc_dointvec, 2388 }, 2389 { 2390 .procname = "panic_on_io_nmi", 2391 .data = &panic_on_io_nmi, 2392 .maxlen = sizeof(int), 2393 .mode = 0644, 2394 .proc_handler = proc_dointvec, 2395 }, 2396 { 2397 .procname = "bootloader_type", 2398 .data = &bootloader_type, 2399 .maxlen = sizeof (int), 2400 .mode = 0444, 2401 .proc_handler = proc_dointvec, 2402 }, 2403 { 2404 .procname = "bootloader_version", 2405 .data = &bootloader_version, 2406 .maxlen = sizeof (int), 2407 .mode = 0444, 2408 .proc_handler = proc_dointvec, 2409 }, 2410 { 2411 .procname = "io_delay_type", 2412 .data = &io_delay_type, 2413 .maxlen = sizeof(int), 2414 .mode = 0644, 2415 .proc_handler = proc_dointvec, 2416 }, 2417 #endif 2418 #if defined(CONFIG_MMU) 2419 { 2420 .procname = "randomize_va_space", 2421 .data = &randomize_va_space, 2422 .maxlen = sizeof(int), 2423 .mode = 0644, 2424 .proc_handler = proc_dointvec, 2425 }, 2426 #endif 2427 #if defined(CONFIG_S390) && defined(CONFIG_SMP) 2428 { 2429 .procname = "spin_retry", 2430 .data = &spin_retry, 2431 .maxlen = sizeof (int), 2432 .mode = 0644, 2433 .proc_handler = proc_dointvec, 2434 }, 2435 #endif 2436 #if defined(CONFIG_ACPI_SLEEP) && defined(CONFIG_X86) 2437 { 2438 .procname = "acpi_video_flags", 2439 .data = &acpi_realmode_flags, 2440 .maxlen = sizeof (unsigned long), 2441 .mode = 0644, 2442 .proc_handler = proc_doulongvec_minmax, 2443 }, 2444 #endif 2445 #ifdef CONFIG_SYSCTL_ARCH_UNALIGN_NO_WARN 2446 { 2447 .procname = "ignore-unaligned-usertrap", 2448 .data = &no_unaligned_warning, 2449 .maxlen = sizeof (int), 2450 .mode = 0644, 2451 .proc_handler = proc_dointvec, 2452 }, 2453 #endif 2454 #ifdef CONFIG_IA64 2455 { 2456 .procname = "unaligned-dump-stack", 2457 .data = &unaligned_dump_stack, 2458 .maxlen = sizeof (int), 2459 .mode = 0644, 2460 .proc_handler = proc_dointvec, 2461 }, 2462 #endif 2463 #ifdef CONFIG_DETECT_HUNG_TASK 2464 #ifdef CONFIG_SMP 2465 { 2466 .procname = "hung_task_all_cpu_backtrace", 2467 .data = &sysctl_hung_task_all_cpu_backtrace, 2468 .maxlen = sizeof(int), 2469 .mode = 0644, 2470 .proc_handler = proc_dointvec_minmax, 2471 .extra1 = SYSCTL_ZERO, 2472 .extra2 = SYSCTL_ONE, 2473 }, 2474 #endif /* CONFIG_SMP */ 2475 { 2476 .procname = "hung_task_panic", 2477 .data = &sysctl_hung_task_panic, 2478 .maxlen = sizeof(int), 2479 .mode = 0644, 2480 .proc_handler = proc_dointvec_minmax, 2481 .extra1 = SYSCTL_ZERO, 2482 .extra2 = SYSCTL_ONE, 2483 }, 2484 { 2485 .procname = "hung_task_check_count", 2486 .data = &sysctl_hung_task_check_count, 2487 .maxlen = sizeof(int), 2488 .mode = 0644, 2489 .proc_handler = proc_dointvec_minmax, 2490 .extra1 = SYSCTL_ZERO, 2491 }, 2492 { 2493 .procname = "hung_task_timeout_secs", 2494 .data = &sysctl_hung_task_timeout_secs, 2495 .maxlen = sizeof(unsigned long), 2496 .mode = 0644, 2497 .proc_handler = proc_dohung_task_timeout_secs, 2498 .extra2 = &hung_task_timeout_max, 2499 }, 2500 { 2501 .procname = "hung_task_check_interval_secs", 2502 .data = &sysctl_hung_task_check_interval_secs, 2503 .maxlen = sizeof(unsigned long), 2504 .mode = 0644, 2505 .proc_handler = proc_dohung_task_timeout_secs, 2506 .extra2 = &hung_task_timeout_max, 2507 }, 2508 { 2509 .procname = "hung_task_warnings", 2510 .data = &sysctl_hung_task_warnings, 2511 .maxlen = sizeof(int), 2512 .mode = 0644, 2513 .proc_handler = proc_dointvec_minmax, 2514 .extra1 = &neg_one, 2515 }, 2516 #endif 2517 #ifdef CONFIG_RT_MUTEXES 2518 { 2519 .procname = "max_lock_depth", 2520 .data = &max_lock_depth, 2521 .maxlen = sizeof(int), 2522 .mode = 0644, 2523 .proc_handler = proc_dointvec, 2524 }, 2525 #endif 2526 { 2527 .procname = "poweroff_cmd", 2528 .data = &poweroff_cmd, 2529 .maxlen = POWEROFF_CMD_PATH_LEN, 2530 .mode = 0644, 2531 .proc_handler = proc_dostring, 2532 }, 2533 #ifdef CONFIG_KEYS 2534 { 2535 .procname = "keys", 2536 .mode = 0555, 2537 .child = key_sysctls, 2538 }, 2539 #endif 2540 #ifdef CONFIG_PERF_EVENTS 2541 /* 2542 * User-space scripts rely on the existence of this file 2543 * as a feature check for perf_events being enabled. 2544 * 2545 * So it's an ABI, do not remove! 2546 */ 2547 { 2548 .procname = "perf_event_paranoid", 2549 .data = &sysctl_perf_event_paranoid, 2550 .maxlen = sizeof(sysctl_perf_event_paranoid), 2551 .mode = 0644, 2552 .proc_handler = proc_dointvec, 2553 }, 2554 { 2555 .procname = "perf_event_mlock_kb", 2556 .data = &sysctl_perf_event_mlock, 2557 .maxlen = sizeof(sysctl_perf_event_mlock), 2558 .mode = 0644, 2559 .proc_handler = proc_dointvec, 2560 }, 2561 { 2562 .procname = "perf_event_max_sample_rate", 2563 .data = &sysctl_perf_event_sample_rate, 2564 .maxlen = sizeof(sysctl_perf_event_sample_rate), 2565 .mode = 0644, 2566 .proc_handler = perf_proc_update_handler, 2567 .extra1 = SYSCTL_ONE, 2568 }, 2569 { 2570 .procname = "perf_cpu_time_max_percent", 2571 .data = &sysctl_perf_cpu_time_max_percent, 2572 .maxlen = sizeof(sysctl_perf_cpu_time_max_percent), 2573 .mode = 0644, 2574 .proc_handler = perf_cpu_time_max_percent_handler, 2575 .extra1 = SYSCTL_ZERO, 2576 .extra2 = &one_hundred, 2577 }, 2578 { 2579 .procname = "perf_event_max_stack", 2580 .data = &sysctl_perf_event_max_stack, 2581 .maxlen = sizeof(sysctl_perf_event_max_stack), 2582 .mode = 0644, 2583 .proc_handler = perf_event_max_stack_handler, 2584 .extra1 = SYSCTL_ZERO, 2585 .extra2 = &six_hundred_forty_kb, 2586 }, 2587 { 2588 .procname = "perf_event_max_contexts_per_stack", 2589 .data = &sysctl_perf_event_max_contexts_per_stack, 2590 .maxlen = sizeof(sysctl_perf_event_max_contexts_per_stack), 2591 .mode = 0644, 2592 .proc_handler = perf_event_max_stack_handler, 2593 .extra1 = SYSCTL_ZERO, 2594 .extra2 = &one_thousand, 2595 }, 2596 #endif 2597 { 2598 .procname = "panic_on_warn", 2599 .data = &panic_on_warn, 2600 .maxlen = sizeof(int), 2601 .mode = 0644, 2602 .proc_handler = proc_dointvec_minmax, 2603 .extra1 = SYSCTL_ZERO, 2604 .extra2 = SYSCTL_ONE, 2605 }, 2606 #if defined(CONFIG_SMP) && defined(CONFIG_NO_HZ_COMMON) 2607 { 2608 .procname = "timer_migration", 2609 .data = &sysctl_timer_migration, 2610 .maxlen = sizeof(unsigned int), 2611 .mode = 0644, 2612 .proc_handler = timer_migration_handler, 2613 .extra1 = SYSCTL_ZERO, 2614 .extra2 = SYSCTL_ONE, 2615 }, 2616 #endif 2617 #ifdef CONFIG_BPF_SYSCALL 2618 { 2619 .procname = "unprivileged_bpf_disabled", 2620 .data = &sysctl_unprivileged_bpf_disabled, 2621 .maxlen = sizeof(sysctl_unprivileged_bpf_disabled), 2622 .mode = 0644, 2623 .proc_handler = bpf_unpriv_handler, 2624 .extra1 = SYSCTL_ZERO, 2625 .extra2 = &two, 2626 }, 2627 { 2628 .procname = "bpf_stats_enabled", 2629 .data = &bpf_stats_enabled_key.key, 2630 .maxlen = sizeof(bpf_stats_enabled_key), 2631 .mode = 0644, 2632 .proc_handler = bpf_stats_handler, 2633 }, 2634 #endif 2635 #if defined(CONFIG_TREE_RCU) 2636 { 2637 .procname = "panic_on_rcu_stall", 2638 .data = &sysctl_panic_on_rcu_stall, 2639 .maxlen = sizeof(sysctl_panic_on_rcu_stall), 2640 .mode = 0644, 2641 .proc_handler = proc_dointvec_minmax, 2642 .extra1 = SYSCTL_ZERO, 2643 .extra2 = SYSCTL_ONE, 2644 }, 2645 #endif 2646 #if defined(CONFIG_TREE_RCU) 2647 { 2648 .procname = "max_rcu_stall_to_panic", 2649 .data = &sysctl_max_rcu_stall_to_panic, 2650 .maxlen = sizeof(sysctl_max_rcu_stall_to_panic), 2651 .mode = 0644, 2652 .proc_handler = proc_dointvec_minmax, 2653 .extra1 = SYSCTL_ONE, 2654 .extra2 = SYSCTL_INT_MAX, 2655 }, 2656 #endif 2657 #ifdef CONFIG_STACKLEAK_RUNTIME_DISABLE 2658 { 2659 .procname = "stack_erasing", 2660 .data = NULL, 2661 .maxlen = sizeof(int), 2662 .mode = 0600, 2663 .proc_handler = stack_erasing_sysctl, 2664 .extra1 = SYSCTL_ZERO, 2665 .extra2 = SYSCTL_ONE, 2666 }, 2667 #endif 2668 { } 2669 }; 2670 2671 static struct ctl_table vm_table[] = { 2672 { 2673 .procname = "overcommit_memory", 2674 .data = &sysctl_overcommit_memory, 2675 .maxlen = sizeof(sysctl_overcommit_memory), 2676 .mode = 0644, 2677 .proc_handler = overcommit_policy_handler, 2678 .extra1 = SYSCTL_ZERO, 2679 .extra2 = &two, 2680 }, 2681 { 2682 .procname = "panic_on_oom", 2683 .data = &sysctl_panic_on_oom, 2684 .maxlen = sizeof(sysctl_panic_on_oom), 2685 .mode = 0644, 2686 .proc_handler = proc_dointvec_minmax, 2687 .extra1 = SYSCTL_ZERO, 2688 .extra2 = &two, 2689 }, 2690 { 2691 .procname = "oom_kill_allocating_task", 2692 .data = &sysctl_oom_kill_allocating_task, 2693 .maxlen = sizeof(sysctl_oom_kill_allocating_task), 2694 .mode = 0644, 2695 .proc_handler = proc_dointvec, 2696 }, 2697 { 2698 .procname = "oom_dump_tasks", 2699 .data = &sysctl_oom_dump_tasks, 2700 .maxlen = sizeof(sysctl_oom_dump_tasks), 2701 .mode = 0644, 2702 .proc_handler = proc_dointvec, 2703 }, 2704 { 2705 .procname = "overcommit_ratio", 2706 .data = &sysctl_overcommit_ratio, 2707 .maxlen = sizeof(sysctl_overcommit_ratio), 2708 .mode = 0644, 2709 .proc_handler = overcommit_ratio_handler, 2710 }, 2711 { 2712 .procname = "overcommit_kbytes", 2713 .data = &sysctl_overcommit_kbytes, 2714 .maxlen = sizeof(sysctl_overcommit_kbytes), 2715 .mode = 0644, 2716 .proc_handler = overcommit_kbytes_handler, 2717 }, 2718 { 2719 .procname = "page-cluster", 2720 .data = &page_cluster, 2721 .maxlen = sizeof(int), 2722 .mode = 0644, 2723 .proc_handler = proc_dointvec_minmax, 2724 .extra1 = SYSCTL_ZERO, 2725 }, 2726 { 2727 .procname = "dirty_background_ratio", 2728 .data = &dirty_background_ratio, 2729 .maxlen = sizeof(dirty_background_ratio), 2730 .mode = 0644, 2731 .proc_handler = dirty_background_ratio_handler, 2732 .extra1 = SYSCTL_ZERO, 2733 .extra2 = &one_hundred, 2734 }, 2735 { 2736 .procname = "dirty_background_bytes", 2737 .data = &dirty_background_bytes, 2738 .maxlen = sizeof(dirty_background_bytes), 2739 .mode = 0644, 2740 .proc_handler = dirty_background_bytes_handler, 2741 .extra1 = &one_ul, 2742 }, 2743 { 2744 .procname = "dirty_ratio", 2745 .data = &vm_dirty_ratio, 2746 .maxlen = sizeof(vm_dirty_ratio), 2747 .mode = 0644, 2748 .proc_handler = dirty_ratio_handler, 2749 .extra1 = SYSCTL_ZERO, 2750 .extra2 = &one_hundred, 2751 }, 2752 { 2753 .procname = "dirty_bytes", 2754 .data = &vm_dirty_bytes, 2755 .maxlen = sizeof(vm_dirty_bytes), 2756 .mode = 0644, 2757 .proc_handler = dirty_bytes_handler, 2758 .extra1 = &dirty_bytes_min, 2759 }, 2760 { 2761 .procname = "dirty_writeback_centisecs", 2762 .data = &dirty_writeback_interval, 2763 .maxlen = sizeof(dirty_writeback_interval), 2764 .mode = 0644, 2765 .proc_handler = dirty_writeback_centisecs_handler, 2766 }, 2767 { 2768 .procname = "dirty_expire_centisecs", 2769 .data = &dirty_expire_interval, 2770 .maxlen = sizeof(dirty_expire_interval), 2771 .mode = 0644, 2772 .proc_handler = proc_dointvec_minmax, 2773 .extra1 = SYSCTL_ZERO, 2774 }, 2775 { 2776 .procname = "dirtytime_expire_seconds", 2777 .data = &dirtytime_expire_interval, 2778 .maxlen = sizeof(dirtytime_expire_interval), 2779 .mode = 0644, 2780 .proc_handler = dirtytime_interval_handler, 2781 .extra1 = SYSCTL_ZERO, 2782 }, 2783 { 2784 .procname = "swappiness", 2785 .data = &vm_swappiness, 2786 .maxlen = sizeof(vm_swappiness), 2787 .mode = 0644, 2788 .proc_handler = proc_dointvec_minmax, 2789 .extra1 = SYSCTL_ZERO, 2790 .extra2 = &two_hundred, 2791 }, 2792 #ifdef CONFIG_HUGETLB_PAGE 2793 { 2794 .procname = "nr_hugepages", 2795 .data = NULL, 2796 .maxlen = sizeof(unsigned long), 2797 .mode = 0644, 2798 .proc_handler = hugetlb_sysctl_handler, 2799 }, 2800 #ifdef CONFIG_NUMA 2801 { 2802 .procname = "nr_hugepages_mempolicy", 2803 .data = NULL, 2804 .maxlen = sizeof(unsigned long), 2805 .mode = 0644, 2806 .proc_handler = &hugetlb_mempolicy_sysctl_handler, 2807 }, 2808 { 2809 .procname = "numa_stat", 2810 .data = &sysctl_vm_numa_stat, 2811 .maxlen = sizeof(int), 2812 .mode = 0644, 2813 .proc_handler = sysctl_vm_numa_stat_handler, 2814 .extra1 = SYSCTL_ZERO, 2815 .extra2 = SYSCTL_ONE, 2816 }, 2817 #endif 2818 { 2819 .procname = "hugetlb_shm_group", 2820 .data = &sysctl_hugetlb_shm_group, 2821 .maxlen = sizeof(gid_t), 2822 .mode = 0644, 2823 .proc_handler = proc_dointvec, 2824 }, 2825 { 2826 .procname = "nr_overcommit_hugepages", 2827 .data = NULL, 2828 .maxlen = sizeof(unsigned long), 2829 .mode = 0644, 2830 .proc_handler = hugetlb_overcommit_handler, 2831 }, 2832 #endif 2833 { 2834 .procname = "lowmem_reserve_ratio", 2835 .data = &sysctl_lowmem_reserve_ratio, 2836 .maxlen = sizeof(sysctl_lowmem_reserve_ratio), 2837 .mode = 0644, 2838 .proc_handler = lowmem_reserve_ratio_sysctl_handler, 2839 }, 2840 { 2841 .procname = "drop_caches", 2842 .data = &sysctl_drop_caches, 2843 .maxlen = sizeof(int), 2844 .mode = 0200, 2845 .proc_handler = drop_caches_sysctl_handler, 2846 .extra1 = SYSCTL_ONE, 2847 .extra2 = &four, 2848 }, 2849 #ifdef CONFIG_COMPACTION 2850 { 2851 .procname = "compact_memory", 2852 .data = NULL, 2853 .maxlen = sizeof(int), 2854 .mode = 0200, 2855 .proc_handler = sysctl_compaction_handler, 2856 }, 2857 { 2858 .procname = "compaction_proactiveness", 2859 .data = &sysctl_compaction_proactiveness, 2860 .maxlen = sizeof(sysctl_compaction_proactiveness), 2861 .mode = 0644, 2862 .proc_handler = proc_dointvec_minmax, 2863 .extra1 = SYSCTL_ZERO, 2864 .extra2 = &one_hundred, 2865 }, 2866 { 2867 .procname = "extfrag_threshold", 2868 .data = &sysctl_extfrag_threshold, 2869 .maxlen = sizeof(int), 2870 .mode = 0644, 2871 .proc_handler = proc_dointvec_minmax, 2872 .extra1 = &min_extfrag_threshold, 2873 .extra2 = &max_extfrag_threshold, 2874 }, 2875 { 2876 .procname = "compact_unevictable_allowed", 2877 .data = &sysctl_compact_unevictable_allowed, 2878 .maxlen = sizeof(int), 2879 .mode = 0644, 2880 .proc_handler = proc_dointvec_minmax_warn_RT_change, 2881 .extra1 = SYSCTL_ZERO, 2882 .extra2 = SYSCTL_ONE, 2883 }, 2884 2885 #endif /* CONFIG_COMPACTION */ 2886 { 2887 .procname = "min_free_kbytes", 2888 .data = &min_free_kbytes, 2889 .maxlen = sizeof(min_free_kbytes), 2890 .mode = 0644, 2891 .proc_handler = min_free_kbytes_sysctl_handler, 2892 .extra1 = SYSCTL_ZERO, 2893 }, 2894 { 2895 .procname = "watermark_boost_factor", 2896 .data = &watermark_boost_factor, 2897 .maxlen = sizeof(watermark_boost_factor), 2898 .mode = 0644, 2899 .proc_handler = proc_dointvec_minmax, 2900 .extra1 = SYSCTL_ZERO, 2901 }, 2902 { 2903 .procname = "watermark_scale_factor", 2904 .data = &watermark_scale_factor, 2905 .maxlen = sizeof(watermark_scale_factor), 2906 .mode = 0644, 2907 .proc_handler = watermark_scale_factor_sysctl_handler, 2908 .extra1 = SYSCTL_ONE, 2909 .extra2 = &one_thousand, 2910 }, 2911 { 2912 .procname = "percpu_pagelist_high_fraction", 2913 .data = &percpu_pagelist_high_fraction, 2914 .maxlen = sizeof(percpu_pagelist_high_fraction), 2915 .mode = 0644, 2916 .proc_handler = percpu_pagelist_high_fraction_sysctl_handler, 2917 .extra1 = SYSCTL_ZERO, 2918 }, 2919 { 2920 .procname = "page_lock_unfairness", 2921 .data = &sysctl_page_lock_unfairness, 2922 .maxlen = sizeof(sysctl_page_lock_unfairness), 2923 .mode = 0644, 2924 .proc_handler = proc_dointvec_minmax, 2925 .extra1 = SYSCTL_ZERO, 2926 }, 2927 #ifdef CONFIG_MMU 2928 { 2929 .procname = "max_map_count", 2930 .data = &sysctl_max_map_count, 2931 .maxlen = sizeof(sysctl_max_map_count), 2932 .mode = 0644, 2933 .proc_handler = proc_dointvec_minmax, 2934 .extra1 = SYSCTL_ZERO, 2935 }, 2936 #else 2937 { 2938 .procname = "nr_trim_pages", 2939 .data = &sysctl_nr_trim_pages, 2940 .maxlen = sizeof(sysctl_nr_trim_pages), 2941 .mode = 0644, 2942 .proc_handler = proc_dointvec_minmax, 2943 .extra1 = SYSCTL_ZERO, 2944 }, 2945 #endif 2946 { 2947 .procname = "laptop_mode", 2948 .data = &laptop_mode, 2949 .maxlen = sizeof(laptop_mode), 2950 .mode = 0644, 2951 .proc_handler = proc_dointvec_jiffies, 2952 }, 2953 { 2954 .procname = "block_dump", 2955 .data = &block_dump, 2956 .maxlen = sizeof(block_dump), 2957 .mode = 0644, 2958 .proc_handler = proc_dointvec_minmax, 2959 .extra1 = SYSCTL_ZERO, 2960 }, 2961 { 2962 .procname = "vfs_cache_pressure", 2963 .data = &sysctl_vfs_cache_pressure, 2964 .maxlen = sizeof(sysctl_vfs_cache_pressure), 2965 .mode = 0644, 2966 .proc_handler = proc_dointvec_minmax, 2967 .extra1 = SYSCTL_ZERO, 2968 }, 2969 #if defined(HAVE_ARCH_PICK_MMAP_LAYOUT) || \ 2970 defined(CONFIG_ARCH_WANT_DEFAULT_TOPDOWN_MMAP_LAYOUT) 2971 { 2972 .procname = "legacy_va_layout", 2973 .data = &sysctl_legacy_va_layout, 2974 .maxlen = sizeof(sysctl_legacy_va_layout), 2975 .mode = 0644, 2976 .proc_handler = proc_dointvec_minmax, 2977 .extra1 = SYSCTL_ZERO, 2978 }, 2979 #endif 2980 #ifdef CONFIG_NUMA 2981 { 2982 .procname = "zone_reclaim_mode", 2983 .data = &node_reclaim_mode, 2984 .maxlen = sizeof(node_reclaim_mode), 2985 .mode = 0644, 2986 .proc_handler = proc_dointvec_minmax, 2987 .extra1 = SYSCTL_ZERO, 2988 }, 2989 { 2990 .procname = "min_unmapped_ratio", 2991 .data = &sysctl_min_unmapped_ratio, 2992 .maxlen = sizeof(sysctl_min_unmapped_ratio), 2993 .mode = 0644, 2994 .proc_handler = sysctl_min_unmapped_ratio_sysctl_handler, 2995 .extra1 = SYSCTL_ZERO, 2996 .extra2 = &one_hundred, 2997 }, 2998 { 2999 .procname = "min_slab_ratio", 3000 .data = &sysctl_min_slab_ratio, 3001 .maxlen = sizeof(sysctl_min_slab_ratio), 3002 .mode = 0644, 3003 .proc_handler = sysctl_min_slab_ratio_sysctl_handler, 3004 .extra1 = SYSCTL_ZERO, 3005 .extra2 = &one_hundred, 3006 }, 3007 #endif 3008 #ifdef CONFIG_SMP 3009 { 3010 .procname = "stat_interval", 3011 .data = &sysctl_stat_interval, 3012 .maxlen = sizeof(sysctl_stat_interval), 3013 .mode = 0644, 3014 .proc_handler = proc_dointvec_jiffies, 3015 }, 3016 { 3017 .procname = "stat_refresh", 3018 .data = NULL, 3019 .maxlen = 0, 3020 .mode = 0600, 3021 .proc_handler = vmstat_refresh, 3022 }, 3023 #endif 3024 #ifdef CONFIG_MMU 3025 { 3026 .procname = "mmap_min_addr", 3027 .data = &dac_mmap_min_addr, 3028 .maxlen = sizeof(unsigned long), 3029 .mode = 0644, 3030 .proc_handler = mmap_min_addr_handler, 3031 }, 3032 #endif 3033 #ifdef CONFIG_NUMA 3034 { 3035 .procname = "numa_zonelist_order", 3036 .data = &numa_zonelist_order, 3037 .maxlen = NUMA_ZONELIST_ORDER_LEN, 3038 .mode = 0644, 3039 .proc_handler = numa_zonelist_order_handler, 3040 }, 3041 #endif 3042 #if (defined(CONFIG_X86_32) && !defined(CONFIG_UML))|| \ 3043 (defined(CONFIG_SUPERH) && defined(CONFIG_VSYSCALL)) 3044 { 3045 .procname = "vdso_enabled", 3046 #ifdef CONFIG_X86_32 3047 .data = &vdso32_enabled, 3048 .maxlen = sizeof(vdso32_enabled), 3049 #else 3050 .data = &vdso_enabled, 3051 .maxlen = sizeof(vdso_enabled), 3052 #endif 3053 .mode = 0644, 3054 .proc_handler = proc_dointvec, 3055 .extra1 = SYSCTL_ZERO, 3056 }, 3057 #endif 3058 #ifdef CONFIG_HIGHMEM 3059 { 3060 .procname = "highmem_is_dirtyable", 3061 .data = &vm_highmem_is_dirtyable, 3062 .maxlen = sizeof(vm_highmem_is_dirtyable), 3063 .mode = 0644, 3064 .proc_handler = proc_dointvec_minmax, 3065 .extra1 = SYSCTL_ZERO, 3066 .extra2 = SYSCTL_ONE, 3067 }, 3068 #endif 3069 #ifdef CONFIG_MEMORY_FAILURE 3070 { 3071 .procname = "memory_failure_early_kill", 3072 .data = &sysctl_memory_failure_early_kill, 3073 .maxlen = sizeof(sysctl_memory_failure_early_kill), 3074 .mode = 0644, 3075 .proc_handler = proc_dointvec_minmax, 3076 .extra1 = SYSCTL_ZERO, 3077 .extra2 = SYSCTL_ONE, 3078 }, 3079 { 3080 .procname = "memory_failure_recovery", 3081 .data = &sysctl_memory_failure_recovery, 3082 .maxlen = sizeof(sysctl_memory_failure_recovery), 3083 .mode = 0644, 3084 .proc_handler = proc_dointvec_minmax, 3085 .extra1 = SYSCTL_ZERO, 3086 .extra2 = SYSCTL_ONE, 3087 }, 3088 #endif 3089 { 3090 .procname = "user_reserve_kbytes", 3091 .data = &sysctl_user_reserve_kbytes, 3092 .maxlen = sizeof(sysctl_user_reserve_kbytes), 3093 .mode = 0644, 3094 .proc_handler = proc_doulongvec_minmax, 3095 }, 3096 { 3097 .procname = "admin_reserve_kbytes", 3098 .data = &sysctl_admin_reserve_kbytes, 3099 .maxlen = sizeof(sysctl_admin_reserve_kbytes), 3100 .mode = 0644, 3101 .proc_handler = proc_doulongvec_minmax, 3102 }, 3103 #ifdef CONFIG_HAVE_ARCH_MMAP_RND_BITS 3104 { 3105 .procname = "mmap_rnd_bits", 3106 .data = &mmap_rnd_bits, 3107 .maxlen = sizeof(mmap_rnd_bits), 3108 .mode = 0600, 3109 .proc_handler = proc_dointvec_minmax, 3110 .extra1 = (void *)&mmap_rnd_bits_min, 3111 .extra2 = (void *)&mmap_rnd_bits_max, 3112 }, 3113 #endif 3114 #ifdef CONFIG_HAVE_ARCH_MMAP_RND_COMPAT_BITS 3115 { 3116 .procname = "mmap_rnd_compat_bits", 3117 .data = &mmap_rnd_compat_bits, 3118 .maxlen = sizeof(mmap_rnd_compat_bits), 3119 .mode = 0600, 3120 .proc_handler = proc_dointvec_minmax, 3121 .extra1 = (void *)&mmap_rnd_compat_bits_min, 3122 .extra2 = (void *)&mmap_rnd_compat_bits_max, 3123 }, 3124 #endif 3125 #ifdef CONFIG_USERFAULTFD 3126 { 3127 .procname = "unprivileged_userfaultfd", 3128 .data = &sysctl_unprivileged_userfaultfd, 3129 .maxlen = sizeof(sysctl_unprivileged_userfaultfd), 3130 .mode = 0644, 3131 .proc_handler = proc_dointvec_minmax, 3132 .extra1 = SYSCTL_ZERO, 3133 .extra2 = SYSCTL_ONE, 3134 }, 3135 #endif 3136 { } 3137 }; 3138 3139 static struct ctl_table fs_table[] = { 3140 { 3141 .procname = "inode-nr", 3142 .data = &inodes_stat, 3143 .maxlen = 2*sizeof(long), 3144 .mode = 0444, 3145 .proc_handler = proc_nr_inodes, 3146 }, 3147 { 3148 .procname = "inode-state", 3149 .data = &inodes_stat, 3150 .maxlen = 7*sizeof(long), 3151 .mode = 0444, 3152 .proc_handler = proc_nr_inodes, 3153 }, 3154 { 3155 .procname = "file-nr", 3156 .data = &files_stat, 3157 .maxlen = sizeof(files_stat), 3158 .mode = 0444, 3159 .proc_handler = proc_nr_files, 3160 }, 3161 { 3162 .procname = "file-max", 3163 .data = &files_stat.max_files, 3164 .maxlen = sizeof(files_stat.max_files), 3165 .mode = 0644, 3166 .proc_handler = proc_doulongvec_minmax, 3167 .extra1 = &zero_ul, 3168 .extra2 = &long_max, 3169 }, 3170 { 3171 .procname = "nr_open", 3172 .data = &sysctl_nr_open, 3173 .maxlen = sizeof(unsigned int), 3174 .mode = 0644, 3175 .proc_handler = proc_dointvec_minmax, 3176 .extra1 = &sysctl_nr_open_min, 3177 .extra2 = &sysctl_nr_open_max, 3178 }, 3179 { 3180 .procname = "dentry-state", 3181 .data = &dentry_stat, 3182 .maxlen = 6*sizeof(long), 3183 .mode = 0444, 3184 .proc_handler = proc_nr_dentry, 3185 }, 3186 { 3187 .procname = "overflowuid", 3188 .data = &fs_overflowuid, 3189 .maxlen = sizeof(int), 3190 .mode = 0644, 3191 .proc_handler = proc_dointvec_minmax, 3192 .extra1 = &minolduid, 3193 .extra2 = &maxolduid, 3194 }, 3195 { 3196 .procname = "overflowgid", 3197 .data = &fs_overflowgid, 3198 .maxlen = sizeof(int), 3199 .mode = 0644, 3200 .proc_handler = proc_dointvec_minmax, 3201 .extra1 = &minolduid, 3202 .extra2 = &maxolduid, 3203 }, 3204 #ifdef CONFIG_FILE_LOCKING 3205 { 3206 .procname = "leases-enable", 3207 .data = &leases_enable, 3208 .maxlen = sizeof(int), 3209 .mode = 0644, 3210 .proc_handler = proc_dointvec, 3211 }, 3212 #endif 3213 #ifdef CONFIG_DNOTIFY 3214 { 3215 .procname = "dir-notify-enable", 3216 .data = &dir_notify_enable, 3217 .maxlen = sizeof(int), 3218 .mode = 0644, 3219 .proc_handler = proc_dointvec, 3220 }, 3221 #endif 3222 #ifdef CONFIG_MMU 3223 #ifdef CONFIG_FILE_LOCKING 3224 { 3225 .procname = "lease-break-time", 3226 .data = &lease_break_time, 3227 .maxlen = sizeof(int), 3228 .mode = 0644, 3229 .proc_handler = proc_dointvec, 3230 }, 3231 #endif 3232 #ifdef CONFIG_AIO 3233 { 3234 .procname = "aio-nr", 3235 .data = &aio_nr, 3236 .maxlen = sizeof(aio_nr), 3237 .mode = 0444, 3238 .proc_handler = proc_doulongvec_minmax, 3239 }, 3240 { 3241 .procname = "aio-max-nr", 3242 .data = &aio_max_nr, 3243 .maxlen = sizeof(aio_max_nr), 3244 .mode = 0644, 3245 .proc_handler = proc_doulongvec_minmax, 3246 }, 3247 #endif /* CONFIG_AIO */ 3248 #ifdef CONFIG_INOTIFY_USER 3249 { 3250 .procname = "inotify", 3251 .mode = 0555, 3252 .child = inotify_table, 3253 }, 3254 #endif 3255 #ifdef CONFIG_FANOTIFY 3256 { 3257 .procname = "fanotify", 3258 .mode = 0555, 3259 .child = fanotify_table, 3260 }, 3261 #endif 3262 #ifdef CONFIG_EPOLL 3263 { 3264 .procname = "epoll", 3265 .mode = 0555, 3266 .child = epoll_table, 3267 }, 3268 #endif 3269 #endif 3270 { 3271 .procname = "protected_symlinks", 3272 .data = &sysctl_protected_symlinks, 3273 .maxlen = sizeof(int), 3274 .mode = 0600, 3275 .proc_handler = proc_dointvec_minmax, 3276 .extra1 = SYSCTL_ZERO, 3277 .extra2 = SYSCTL_ONE, 3278 }, 3279 { 3280 .procname = "protected_hardlinks", 3281 .data = &sysctl_protected_hardlinks, 3282 .maxlen = sizeof(int), 3283 .mode = 0600, 3284 .proc_handler = proc_dointvec_minmax, 3285 .extra1 = SYSCTL_ZERO, 3286 .extra2 = SYSCTL_ONE, 3287 }, 3288 { 3289 .procname = "protected_fifos", 3290 .data = &sysctl_protected_fifos, 3291 .maxlen = sizeof(int), 3292 .mode = 0600, 3293 .proc_handler = proc_dointvec_minmax, 3294 .extra1 = SYSCTL_ZERO, 3295 .extra2 = &two, 3296 }, 3297 { 3298 .procname = "protected_regular", 3299 .data = &sysctl_protected_regular, 3300 .maxlen = sizeof(int), 3301 .mode = 0600, 3302 .proc_handler = proc_dointvec_minmax, 3303 .extra1 = SYSCTL_ZERO, 3304 .extra2 = &two, 3305 }, 3306 { 3307 .procname = "suid_dumpable", 3308 .data = &suid_dumpable, 3309 .maxlen = sizeof(int), 3310 .mode = 0644, 3311 .proc_handler = proc_dointvec_minmax_coredump, 3312 .extra1 = SYSCTL_ZERO, 3313 .extra2 = &two, 3314 }, 3315 #if defined(CONFIG_BINFMT_MISC) || defined(CONFIG_BINFMT_MISC_MODULE) 3316 { 3317 .procname = "binfmt_misc", 3318 .mode = 0555, 3319 .child = sysctl_mount_point, 3320 }, 3321 #endif 3322 { 3323 .procname = "pipe-max-size", 3324 .data = &pipe_max_size, 3325 .maxlen = sizeof(pipe_max_size), 3326 .mode = 0644, 3327 .proc_handler = proc_dopipe_max_size, 3328 }, 3329 { 3330 .procname = "pipe-user-pages-hard", 3331 .data = &pipe_user_pages_hard, 3332 .maxlen = sizeof(pipe_user_pages_hard), 3333 .mode = 0644, 3334 .proc_handler = proc_doulongvec_minmax, 3335 }, 3336 { 3337 .procname = "pipe-user-pages-soft", 3338 .data = &pipe_user_pages_soft, 3339 .maxlen = sizeof(pipe_user_pages_soft), 3340 .mode = 0644, 3341 .proc_handler = proc_doulongvec_minmax, 3342 }, 3343 { 3344 .procname = "mount-max", 3345 .data = &sysctl_mount_max, 3346 .maxlen = sizeof(unsigned int), 3347 .mode = 0644, 3348 .proc_handler = proc_dointvec_minmax, 3349 .extra1 = SYSCTL_ONE, 3350 }, 3351 { } 3352 }; 3353 3354 static struct ctl_table debug_table[] = { 3355 #ifdef CONFIG_SYSCTL_EXCEPTION_TRACE 3356 { 3357 .procname = "exception-trace", 3358 .data = &show_unhandled_signals, 3359 .maxlen = sizeof(int), 3360 .mode = 0644, 3361 .proc_handler = proc_dointvec 3362 }, 3363 #endif 3364 #if defined(CONFIG_OPTPROBES) 3365 { 3366 .procname = "kprobes-optimization", 3367 .data = &sysctl_kprobes_optimization, 3368 .maxlen = sizeof(int), 3369 .mode = 0644, 3370 .proc_handler = proc_kprobes_optimization_handler, 3371 .extra1 = SYSCTL_ZERO, 3372 .extra2 = SYSCTL_ONE, 3373 }, 3374 #endif 3375 { } 3376 }; 3377 3378 static struct ctl_table dev_table[] = { 3379 { } 3380 }; 3381 3382 static struct ctl_table sysctl_base_table[] = { 3383 { 3384 .procname = "kernel", 3385 .mode = 0555, 3386 .child = kern_table, 3387 }, 3388 { 3389 .procname = "vm", 3390 .mode = 0555, 3391 .child = vm_table, 3392 }, 3393 { 3394 .procname = "fs", 3395 .mode = 0555, 3396 .child = fs_table, 3397 }, 3398 { 3399 .procname = "debug", 3400 .mode = 0555, 3401 .child = debug_table, 3402 }, 3403 { 3404 .procname = "dev", 3405 .mode = 0555, 3406 .child = dev_table, 3407 }, 3408 { } 3409 }; 3410 3411 int __init sysctl_init(void) 3412 { 3413 struct ctl_table_header *hdr; 3414 3415 hdr = register_sysctl_table(sysctl_base_table); 3416 kmemleak_not_leak(hdr); 3417 return 0; 3418 } 3419 #endif /* CONFIG_SYSCTL */ 3420 /* 3421 * No sense putting this after each symbol definition, twice, 3422 * exception granted :-) 3423 */ 3424 EXPORT_SYMBOL(proc_dointvec); 3425 EXPORT_SYMBOL(proc_douintvec); 3426 EXPORT_SYMBOL(proc_dointvec_jiffies); 3427 EXPORT_SYMBOL(proc_dointvec_minmax); 3428 EXPORT_SYMBOL_GPL(proc_douintvec_minmax); 3429 EXPORT_SYMBOL(proc_dointvec_userhz_jiffies); 3430 EXPORT_SYMBOL(proc_dointvec_ms_jiffies); 3431 EXPORT_SYMBOL(proc_dostring); 3432 EXPORT_SYMBOL(proc_doulongvec_minmax); 3433 EXPORT_SYMBOL(proc_doulongvec_ms_jiffies_minmax); 3434 EXPORT_SYMBOL(proc_do_large_bitmap); 3435