1 /* 2 * kernel/power/main.c - PM subsystem core functionality. 3 * 4 * Copyright (c) 2003 Patrick Mochel 5 * Copyright (c) 2003 Open Source Development Lab 6 * 7 * This file is released under the GPLv2 8 * 9 */ 10 11 #include <linux/module.h> 12 #include <linux/suspend.h> 13 #include <linux/kobject.h> 14 #include <linux/string.h> 15 #include <linux/delay.h> 16 #include <linux/errno.h> 17 #include <linux/kmod.h> 18 #include <linux/init.h> 19 #include <linux/console.h> 20 #include <linux/cpu.h> 21 #include <linux/resume-trace.h> 22 #include <linux/freezer.h> 23 #include <linux/vmstat.h> 24 #include <linux/syscalls.h> 25 26 #include "power.h" 27 28 DEFINE_MUTEX(pm_mutex); 29 30 unsigned int pm_flags; 31 EXPORT_SYMBOL(pm_flags); 32 33 #ifdef CONFIG_PM_SLEEP 34 35 /* Routines for PM-transition notifications */ 36 37 static BLOCKING_NOTIFIER_HEAD(pm_chain_head); 38 39 int register_pm_notifier(struct notifier_block *nb) 40 { 41 return blocking_notifier_chain_register(&pm_chain_head, nb); 42 } 43 EXPORT_SYMBOL_GPL(register_pm_notifier); 44 45 int unregister_pm_notifier(struct notifier_block *nb) 46 { 47 return blocking_notifier_chain_unregister(&pm_chain_head, nb); 48 } 49 EXPORT_SYMBOL_GPL(unregister_pm_notifier); 50 51 int pm_notifier_call_chain(unsigned long val) 52 { 53 return (blocking_notifier_call_chain(&pm_chain_head, val, NULL) 54 == NOTIFY_BAD) ? -EINVAL : 0; 55 } 56 57 #ifdef CONFIG_PM_DEBUG 58 int pm_test_level = TEST_NONE; 59 60 static const char * const pm_tests[__TEST_AFTER_LAST] = { 61 [TEST_NONE] = "none", 62 [TEST_CORE] = "core", 63 [TEST_CPUS] = "processors", 64 [TEST_PLATFORM] = "platform", 65 [TEST_DEVICES] = "devices", 66 [TEST_FREEZER] = "freezer", 67 }; 68 69 static ssize_t pm_test_show(struct kobject *kobj, struct kobj_attribute *attr, 70 char *buf) 71 { 72 char *s = buf; 73 int level; 74 75 for (level = TEST_FIRST; level <= TEST_MAX; level++) 76 if (pm_tests[level]) { 77 if (level == pm_test_level) 78 s += sprintf(s, "[%s] ", pm_tests[level]); 79 else 80 s += sprintf(s, "%s ", pm_tests[level]); 81 } 82 83 if (s != buf) 84 /* convert the last space to a newline */ 85 *(s-1) = '\n'; 86 87 return (s - buf); 88 } 89 90 static ssize_t pm_test_store(struct kobject *kobj, struct kobj_attribute *attr, 91 const char *buf, size_t n) 92 { 93 const char * const *s; 94 int level; 95 char *p; 96 int len; 97 int error = -EINVAL; 98 99 p = memchr(buf, '\n', n); 100 len = p ? p - buf : n; 101 102 mutex_lock(&pm_mutex); 103 104 level = TEST_FIRST; 105 for (s = &pm_tests[level]; level <= TEST_MAX; s++, level++) 106 if (*s && len == strlen(*s) && !strncmp(buf, *s, len)) { 107 pm_test_level = level; 108 error = 0; 109 break; 110 } 111 112 mutex_unlock(&pm_mutex); 113 114 return error ? error : n; 115 } 116 117 power_attr(pm_test); 118 #endif /* CONFIG_PM_DEBUG */ 119 120 #endif /* CONFIG_PM_SLEEP */ 121 122 #ifdef CONFIG_SUSPEND 123 124 static int suspend_test(int level) 125 { 126 #ifdef CONFIG_PM_DEBUG 127 if (pm_test_level == level) { 128 printk(KERN_INFO "suspend debug: Waiting for 5 seconds.\n"); 129 mdelay(5000); 130 return 1; 131 } 132 #endif /* !CONFIG_PM_DEBUG */ 133 return 0; 134 } 135 136 #ifdef CONFIG_PM_TEST_SUSPEND 137 138 /* 139 * We test the system suspend code by setting an RTC wakealarm a short 140 * time in the future, then suspending. Suspending the devices won't 141 * normally take long ... some systems only need a few milliseconds. 142 * 143 * The time it takes is system-specific though, so when we test this 144 * during system bootup we allow a LOT of time. 145 */ 146 #define TEST_SUSPEND_SECONDS 5 147 148 static unsigned long suspend_test_start_time; 149 150 static void suspend_test_start(void) 151 { 152 /* FIXME Use better timebase than "jiffies", ideally a clocksource. 153 * What we want is a hardware counter that will work correctly even 154 * during the irqs-are-off stages of the suspend/resume cycle... 155 */ 156 suspend_test_start_time = jiffies; 157 } 158 159 static void suspend_test_finish(const char *label) 160 { 161 long nj = jiffies - suspend_test_start_time; 162 unsigned msec; 163 164 msec = jiffies_to_msecs(abs(nj)); 165 pr_info("PM: %s took %d.%03d seconds\n", label, 166 msec / 1000, msec % 1000); 167 168 /* Warning on suspend means the RTC alarm period needs to be 169 * larger -- the system was sooo slooowwww to suspend that the 170 * alarm (should have) fired before the system went to sleep! 171 * 172 * Warning on either suspend or resume also means the system 173 * has some performance issues. The stack dump of a WARN_ON 174 * is more likely to get the right attention than a printk... 175 */ 176 WARN(msec > (TEST_SUSPEND_SECONDS * 1000), "Component: %s\n", label); 177 } 178 179 #else 180 181 static void suspend_test_start(void) 182 { 183 } 184 185 static void suspend_test_finish(const char *label) 186 { 187 } 188 189 #endif 190 191 /* This is just an arbitrary number */ 192 #define FREE_PAGE_NUMBER (100) 193 194 static struct platform_suspend_ops *suspend_ops; 195 196 /** 197 * suspend_set_ops - Set the global suspend method table. 198 * @ops: Pointer to ops structure. 199 */ 200 201 void suspend_set_ops(struct platform_suspend_ops *ops) 202 { 203 mutex_lock(&pm_mutex); 204 suspend_ops = ops; 205 mutex_unlock(&pm_mutex); 206 } 207 208 /** 209 * suspend_valid_only_mem - generic memory-only valid callback 210 * 211 * Platform drivers that implement mem suspend only and only need 212 * to check for that in their .valid callback can use this instead 213 * of rolling their own .valid callback. 214 */ 215 int suspend_valid_only_mem(suspend_state_t state) 216 { 217 return state == PM_SUSPEND_MEM; 218 } 219 220 /** 221 * suspend_prepare - Do prep work before entering low-power state. 222 * 223 * This is common code that is called for each state that we're entering. 224 * Run suspend notifiers, allocate a console and stop all processes. 225 */ 226 static int suspend_prepare(void) 227 { 228 int error; 229 unsigned int free_pages; 230 231 if (!suspend_ops || !suspend_ops->enter) 232 return -EPERM; 233 234 pm_prepare_console(); 235 236 error = pm_notifier_call_chain(PM_SUSPEND_PREPARE); 237 if (error) 238 goto Finish; 239 240 error = usermodehelper_disable(); 241 if (error) 242 goto Finish; 243 244 if (suspend_freeze_processes()) { 245 error = -EAGAIN; 246 goto Thaw; 247 } 248 249 free_pages = global_page_state(NR_FREE_PAGES); 250 if (free_pages < FREE_PAGE_NUMBER) { 251 pr_debug("PM: free some memory\n"); 252 shrink_all_memory(FREE_PAGE_NUMBER - free_pages); 253 if (nr_free_pages() < FREE_PAGE_NUMBER) { 254 error = -ENOMEM; 255 printk(KERN_ERR "PM: No enough memory\n"); 256 } 257 } 258 if (!error) 259 return 0; 260 261 Thaw: 262 suspend_thaw_processes(); 263 usermodehelper_enable(); 264 Finish: 265 pm_notifier_call_chain(PM_POST_SUSPEND); 266 pm_restore_console(); 267 return error; 268 } 269 270 /* default implementation */ 271 void __attribute__ ((weak)) arch_suspend_disable_irqs(void) 272 { 273 local_irq_disable(); 274 } 275 276 /* default implementation */ 277 void __attribute__ ((weak)) arch_suspend_enable_irqs(void) 278 { 279 local_irq_enable(); 280 } 281 282 /** 283 * suspend_enter - enter the desired system sleep state. 284 * @state: state to enter 285 * 286 * This function should be called after devices have been suspended. 287 */ 288 static int suspend_enter(suspend_state_t state) 289 { 290 int error; 291 292 device_pm_lock(); 293 294 if (suspend_ops->prepare) { 295 error = suspend_ops->prepare(); 296 if (error) 297 goto Done; 298 } 299 300 error = device_power_down(PMSG_SUSPEND); 301 if (error) { 302 printk(KERN_ERR "PM: Some devices failed to power down\n"); 303 goto Platfrom_finish; 304 } 305 306 if (suspend_ops->prepare_late) { 307 error = suspend_ops->prepare_late(); 308 if (error) 309 goto Power_up_devices; 310 } 311 312 if (suspend_test(TEST_PLATFORM)) 313 goto Platform_wake; 314 315 error = disable_nonboot_cpus(); 316 if (error || suspend_test(TEST_CPUS)) 317 goto Enable_cpus; 318 319 arch_suspend_disable_irqs(); 320 BUG_ON(!irqs_disabled()); 321 322 error = sysdev_suspend(PMSG_SUSPEND); 323 if (!error) { 324 if (!suspend_test(TEST_CORE)) 325 error = suspend_ops->enter(state); 326 sysdev_resume(); 327 } 328 329 arch_suspend_enable_irqs(); 330 BUG_ON(irqs_disabled()); 331 332 Enable_cpus: 333 enable_nonboot_cpus(); 334 335 Platform_wake: 336 if (suspend_ops->wake) 337 suspend_ops->wake(); 338 339 Power_up_devices: 340 device_power_up(PMSG_RESUME); 341 342 Platfrom_finish: 343 if (suspend_ops->finish) 344 suspend_ops->finish(); 345 346 Done: 347 device_pm_unlock(); 348 349 return error; 350 } 351 352 /** 353 * suspend_devices_and_enter - suspend devices and enter the desired system 354 * sleep state. 355 * @state: state to enter 356 */ 357 int suspend_devices_and_enter(suspend_state_t state) 358 { 359 int error; 360 361 if (!suspend_ops) 362 return -ENOSYS; 363 364 if (suspend_ops->begin) { 365 error = suspend_ops->begin(state); 366 if (error) 367 goto Close; 368 } 369 suspend_console(); 370 suspend_test_start(); 371 error = device_suspend(PMSG_SUSPEND); 372 if (error) { 373 printk(KERN_ERR "PM: Some devices failed to suspend\n"); 374 goto Recover_platform; 375 } 376 suspend_test_finish("suspend devices"); 377 if (suspend_test(TEST_DEVICES)) 378 goto Recover_platform; 379 380 suspend_enter(state); 381 382 Resume_devices: 383 suspend_test_start(); 384 device_resume(PMSG_RESUME); 385 suspend_test_finish("resume devices"); 386 resume_console(); 387 Close: 388 if (suspend_ops->end) 389 suspend_ops->end(); 390 return error; 391 392 Recover_platform: 393 if (suspend_ops->recover) 394 suspend_ops->recover(); 395 goto Resume_devices; 396 } 397 398 /** 399 * suspend_finish - Do final work before exiting suspend sequence. 400 * 401 * Call platform code to clean up, restart processes, and free the 402 * console that we've allocated. This is not called for suspend-to-disk. 403 */ 404 static void suspend_finish(void) 405 { 406 suspend_thaw_processes(); 407 usermodehelper_enable(); 408 pm_notifier_call_chain(PM_POST_SUSPEND); 409 pm_restore_console(); 410 } 411 412 413 414 415 static const char * const pm_states[PM_SUSPEND_MAX] = { 416 [PM_SUSPEND_STANDBY] = "standby", 417 [PM_SUSPEND_MEM] = "mem", 418 }; 419 420 static inline int valid_state(suspend_state_t state) 421 { 422 /* All states need lowlevel support and need to be valid 423 * to the lowlevel implementation, no valid callback 424 * implies that none are valid. */ 425 if (!suspend_ops || !suspend_ops->valid || !suspend_ops->valid(state)) 426 return 0; 427 return 1; 428 } 429 430 431 /** 432 * enter_state - Do common work of entering low-power state. 433 * @state: pm_state structure for state we're entering. 434 * 435 * Make sure we're the only ones trying to enter a sleep state. Fail 436 * if someone has beat us to it, since we don't want anything weird to 437 * happen when we wake up. 438 * Then, do the setup for suspend, enter the state, and cleaup (after 439 * we've woken up). 440 */ 441 static int enter_state(suspend_state_t state) 442 { 443 int error; 444 445 if (!valid_state(state)) 446 return -ENODEV; 447 448 if (!mutex_trylock(&pm_mutex)) 449 return -EBUSY; 450 451 printk(KERN_INFO "PM: Syncing filesystems ... "); 452 sys_sync(); 453 printk("done.\n"); 454 455 pr_debug("PM: Preparing system for %s sleep\n", pm_states[state]); 456 error = suspend_prepare(); 457 if (error) 458 goto Unlock; 459 460 if (suspend_test(TEST_FREEZER)) 461 goto Finish; 462 463 pr_debug("PM: Entering %s sleep\n", pm_states[state]); 464 error = suspend_devices_and_enter(state); 465 466 Finish: 467 pr_debug("PM: Finishing wakeup.\n"); 468 suspend_finish(); 469 Unlock: 470 mutex_unlock(&pm_mutex); 471 return error; 472 } 473 474 475 /** 476 * pm_suspend - Externally visible function for suspending system. 477 * @state: Enumerated value of state to enter. 478 * 479 * Determine whether or not value is within range, get state 480 * structure, and enter (above). 481 */ 482 483 int pm_suspend(suspend_state_t state) 484 { 485 if (state > PM_SUSPEND_ON && state <= PM_SUSPEND_MAX) 486 return enter_state(state); 487 return -EINVAL; 488 } 489 490 EXPORT_SYMBOL(pm_suspend); 491 492 #endif /* CONFIG_SUSPEND */ 493 494 struct kobject *power_kobj; 495 496 /** 497 * state - control system power state. 498 * 499 * show() returns what states are supported, which is hard-coded to 500 * 'standby' (Power-On Suspend), 'mem' (Suspend-to-RAM), and 501 * 'disk' (Suspend-to-Disk). 502 * 503 * store() accepts one of those strings, translates it into the 504 * proper enumerated value, and initiates a suspend transition. 505 */ 506 507 static ssize_t state_show(struct kobject *kobj, struct kobj_attribute *attr, 508 char *buf) 509 { 510 char *s = buf; 511 #ifdef CONFIG_SUSPEND 512 int i; 513 514 for (i = 0; i < PM_SUSPEND_MAX; i++) { 515 if (pm_states[i] && valid_state(i)) 516 s += sprintf(s,"%s ", pm_states[i]); 517 } 518 #endif 519 #ifdef CONFIG_HIBERNATION 520 s += sprintf(s, "%s\n", "disk"); 521 #else 522 if (s != buf) 523 /* convert the last space to a newline */ 524 *(s-1) = '\n'; 525 #endif 526 return (s - buf); 527 } 528 529 static ssize_t state_store(struct kobject *kobj, struct kobj_attribute *attr, 530 const char *buf, size_t n) 531 { 532 #ifdef CONFIG_SUSPEND 533 suspend_state_t state = PM_SUSPEND_STANDBY; 534 const char * const *s; 535 #endif 536 char *p; 537 int len; 538 int error = -EINVAL; 539 540 p = memchr(buf, '\n', n); 541 len = p ? p - buf : n; 542 543 /* First, check if we are requested to hibernate */ 544 if (len == 4 && !strncmp(buf, "disk", len)) { 545 error = hibernate(); 546 goto Exit; 547 } 548 549 #ifdef CONFIG_SUSPEND 550 for (s = &pm_states[state]; state < PM_SUSPEND_MAX; s++, state++) { 551 if (*s && len == strlen(*s) && !strncmp(buf, *s, len)) 552 break; 553 } 554 if (state < PM_SUSPEND_MAX && *s) 555 error = enter_state(state); 556 #endif 557 558 Exit: 559 return error ? error : n; 560 } 561 562 power_attr(state); 563 564 #ifdef CONFIG_PM_TRACE 565 int pm_trace_enabled; 566 567 static ssize_t pm_trace_show(struct kobject *kobj, struct kobj_attribute *attr, 568 char *buf) 569 { 570 return sprintf(buf, "%d\n", pm_trace_enabled); 571 } 572 573 static ssize_t 574 pm_trace_store(struct kobject *kobj, struct kobj_attribute *attr, 575 const char *buf, size_t n) 576 { 577 int val; 578 579 if (sscanf(buf, "%d", &val) == 1) { 580 pm_trace_enabled = !!val; 581 return n; 582 } 583 return -EINVAL; 584 } 585 586 power_attr(pm_trace); 587 #endif /* CONFIG_PM_TRACE */ 588 589 static struct attribute * g[] = { 590 &state_attr.attr, 591 #ifdef CONFIG_PM_TRACE 592 &pm_trace_attr.attr, 593 #endif 594 #if defined(CONFIG_PM_SLEEP) && defined(CONFIG_PM_DEBUG) 595 &pm_test_attr.attr, 596 #endif 597 NULL, 598 }; 599 600 static struct attribute_group attr_group = { 601 .attrs = g, 602 }; 603 604 605 static int __init pm_init(void) 606 { 607 power_kobj = kobject_create_and_add("power", NULL); 608 if (!power_kobj) 609 return -ENOMEM; 610 return sysfs_create_group(power_kobj, &attr_group); 611 } 612 613 core_initcall(pm_init); 614 615 616 #ifdef CONFIG_PM_TEST_SUSPEND 617 618 #include <linux/rtc.h> 619 620 /* 621 * To test system suspend, we need a hands-off mechanism to resume the 622 * system. RTCs wake alarms are a common self-contained mechanism. 623 */ 624 625 static void __init test_wakealarm(struct rtc_device *rtc, suspend_state_t state) 626 { 627 static char err_readtime[] __initdata = 628 KERN_ERR "PM: can't read %s time, err %d\n"; 629 static char err_wakealarm [] __initdata = 630 KERN_ERR "PM: can't set %s wakealarm, err %d\n"; 631 static char err_suspend[] __initdata = 632 KERN_ERR "PM: suspend test failed, error %d\n"; 633 static char info_test[] __initdata = 634 KERN_INFO "PM: test RTC wakeup from '%s' suspend\n"; 635 636 unsigned long now; 637 struct rtc_wkalrm alm; 638 int status; 639 640 /* this may fail if the RTC hasn't been initialized */ 641 status = rtc_read_time(rtc, &alm.time); 642 if (status < 0) { 643 printk(err_readtime, dev_name(&rtc->dev), status); 644 return; 645 } 646 rtc_tm_to_time(&alm.time, &now); 647 648 memset(&alm, 0, sizeof alm); 649 rtc_time_to_tm(now + TEST_SUSPEND_SECONDS, &alm.time); 650 alm.enabled = true; 651 652 status = rtc_set_alarm(rtc, &alm); 653 if (status < 0) { 654 printk(err_wakealarm, dev_name(&rtc->dev), status); 655 return; 656 } 657 658 if (state == PM_SUSPEND_MEM) { 659 printk(info_test, pm_states[state]); 660 status = pm_suspend(state); 661 if (status == -ENODEV) 662 state = PM_SUSPEND_STANDBY; 663 } 664 if (state == PM_SUSPEND_STANDBY) { 665 printk(info_test, pm_states[state]); 666 status = pm_suspend(state); 667 } 668 if (status < 0) 669 printk(err_suspend, status); 670 671 /* Some platforms can't detect that the alarm triggered the 672 * wakeup, or (accordingly) disable it after it afterwards. 673 * It's supposed to give oneshot behavior; cope. 674 */ 675 alm.enabled = false; 676 rtc_set_alarm(rtc, &alm); 677 } 678 679 static int __init has_wakealarm(struct device *dev, void *name_ptr) 680 { 681 struct rtc_device *candidate = to_rtc_device(dev); 682 683 if (!candidate->ops->set_alarm) 684 return 0; 685 if (!device_may_wakeup(candidate->dev.parent)) 686 return 0; 687 688 *(const char **)name_ptr = dev_name(dev); 689 return 1; 690 } 691 692 /* 693 * Kernel options like "test_suspend=mem" force suspend/resume sanity tests 694 * at startup time. They're normally disabled, for faster boot and because 695 * we can't know which states really work on this particular system. 696 */ 697 static suspend_state_t test_state __initdata = PM_SUSPEND_ON; 698 699 static char warn_bad_state[] __initdata = 700 KERN_WARNING "PM: can't test '%s' suspend state\n"; 701 702 static int __init setup_test_suspend(char *value) 703 { 704 unsigned i; 705 706 /* "=mem" ==> "mem" */ 707 value++; 708 for (i = 0; i < PM_SUSPEND_MAX; i++) { 709 if (!pm_states[i]) 710 continue; 711 if (strcmp(pm_states[i], value) != 0) 712 continue; 713 test_state = (__force suspend_state_t) i; 714 return 0; 715 } 716 printk(warn_bad_state, value); 717 return 0; 718 } 719 __setup("test_suspend", setup_test_suspend); 720 721 static int __init test_suspend(void) 722 { 723 static char warn_no_rtc[] __initdata = 724 KERN_WARNING "PM: no wakealarm-capable RTC driver is ready\n"; 725 726 char *pony = NULL; 727 struct rtc_device *rtc = NULL; 728 729 /* PM is initialized by now; is that state testable? */ 730 if (test_state == PM_SUSPEND_ON) 731 goto done; 732 if (!valid_state(test_state)) { 733 printk(warn_bad_state, pm_states[test_state]); 734 goto done; 735 } 736 737 /* RTCs have initialized by now too ... can we use one? */ 738 class_find_device(rtc_class, NULL, &pony, has_wakealarm); 739 if (pony) 740 rtc = rtc_class_open(pony); 741 if (!rtc) { 742 printk(warn_no_rtc); 743 goto done; 744 } 745 746 /* go for it */ 747 test_wakealarm(rtc, test_state); 748 rtc_class_close(rtc); 749 done: 750 return 0; 751 } 752 late_initcall(test_suspend); 753 754 #endif /* CONFIG_PM_TEST_SUSPEND */ 755