xref: /openbmc/linux/arch/x86/power/cpu.c (revision a71c8bc5dfefbbf80ef90739791554ef7ea4401b)
108687aecSSergio Luis /*
208687aecSSergio Luis  * Suspend support specific for i386/x86-64.
308687aecSSergio Luis  *
408687aecSSergio Luis  * Distribute under GPLv2
508687aecSSergio Luis  *
608687aecSSergio Luis  * Copyright (c) 2007 Rafael J. Wysocki <rjw@sisk.pl>
7a2531293SPavel Machek  * Copyright (c) 2002 Pavel Machek <pavel@ucw.cz>
808687aecSSergio Luis  * Copyright (c) 2001 Patrick Mochel <mochel@osdl.org>
908687aecSSergio Luis  */
1008687aecSSergio Luis 
1108687aecSSergio Luis #include <linux/suspend.h>
1269c60c88SPaul Gortmaker #include <linux/export.h>
1308687aecSSergio Luis #include <linux/smp.h>
1408687aecSSergio Luis 
1508687aecSSergio Luis #include <asm/pgtable.h>
1608687aecSSergio Luis #include <asm/proto.h>
1708687aecSSergio Luis #include <asm/mtrr.h>
1808687aecSSergio Luis #include <asm/page.h>
1908687aecSSergio Luis #include <asm/mce.h>
2008687aecSSergio Luis #include <asm/xcr.h>
2108687aecSSergio Luis #include <asm/suspend.h>
22eadb8a09SIngo Molnar #include <asm/debugreg.h>
231361b83aSLinus Torvalds #include <asm/fpu-internal.h> /* pcntxt_mask */
24*a71c8bc5SFenghua Yu #include <asm/cpu.h>
2508687aecSSergio Luis 
2608687aecSSergio Luis #ifdef CONFIG_X86_32
2708687aecSSergio Luis static struct saved_context saved_context;
2808687aecSSergio Luis 
2908687aecSSergio Luis unsigned long saved_context_ebx;
3008687aecSSergio Luis unsigned long saved_context_esp, saved_context_ebp;
3108687aecSSergio Luis unsigned long saved_context_esi, saved_context_edi;
3208687aecSSergio Luis unsigned long saved_context_eflags;
3308687aecSSergio Luis #else
3408687aecSSergio Luis /* CONFIG_X86_64 */
3508687aecSSergio Luis struct saved_context saved_context;
3608687aecSSergio Luis #endif
3708687aecSSergio Luis 
3808687aecSSergio Luis /**
3908687aecSSergio Luis  *	__save_processor_state - save CPU registers before creating a
4008687aecSSergio Luis  *		hibernation image and before restoring the memory state from it
4108687aecSSergio Luis  *	@ctxt - structure to store the registers contents in
4208687aecSSergio Luis  *
4308687aecSSergio Luis  *	NOTE: If there is a CPU register the modification of which by the
4408687aecSSergio Luis  *	boot kernel (ie. the kernel used for loading the hibernation image)
4508687aecSSergio Luis  *	might affect the operations of the restored target kernel (ie. the one
4608687aecSSergio Luis  *	saved in the hibernation image), then its contents must be saved by this
4708687aecSSergio Luis  *	function.  In other words, if kernel A is hibernated and different
4808687aecSSergio Luis  *	kernel B is used for loading the hibernation image into memory, the
4908687aecSSergio Luis  *	kernel A's __save_processor_state() function must save all registers
5008687aecSSergio Luis  *	needed by kernel A, so that it can operate correctly after the resume
5108687aecSSergio Luis  *	regardless of what kernel B does in the meantime.
5208687aecSSergio Luis  */
5308687aecSSergio Luis static void __save_processor_state(struct saved_context *ctxt)
5408687aecSSergio Luis {
5508687aecSSergio Luis #ifdef CONFIG_X86_32
5608687aecSSergio Luis 	mtrr_save_fixed_ranges(NULL);
5708687aecSSergio Luis #endif
5808687aecSSergio Luis 	kernel_fpu_begin();
5908687aecSSergio Luis 
6008687aecSSergio Luis 	/*
6108687aecSSergio Luis 	 * descriptor tables
6208687aecSSergio Luis 	 */
6308687aecSSergio Luis #ifdef CONFIG_X86_32
6408687aecSSergio Luis 	store_gdt(&ctxt->gdt);
6508687aecSSergio Luis 	store_idt(&ctxt->idt);
6608687aecSSergio Luis #else
6708687aecSSergio Luis /* CONFIG_X86_64 */
6808687aecSSergio Luis 	store_gdt((struct desc_ptr *)&ctxt->gdt_limit);
6908687aecSSergio Luis 	store_idt((struct desc_ptr *)&ctxt->idt_limit);
7008687aecSSergio Luis #endif
7108687aecSSergio Luis 	store_tr(ctxt->tr);
7208687aecSSergio Luis 
7308687aecSSergio Luis 	/* XMM0..XMM15 should be handled by kernel_fpu_begin(). */
7408687aecSSergio Luis 	/*
7508687aecSSergio Luis 	 * segment registers
7608687aecSSergio Luis 	 */
7708687aecSSergio Luis #ifdef CONFIG_X86_32
7808687aecSSergio Luis 	savesegment(es, ctxt->es);
7908687aecSSergio Luis 	savesegment(fs, ctxt->fs);
8008687aecSSergio Luis 	savesegment(gs, ctxt->gs);
8108687aecSSergio Luis 	savesegment(ss, ctxt->ss);
8208687aecSSergio Luis #else
8308687aecSSergio Luis /* CONFIG_X86_64 */
8408687aecSSergio Luis 	asm volatile ("movw %%ds, %0" : "=m" (ctxt->ds));
8508687aecSSergio Luis 	asm volatile ("movw %%es, %0" : "=m" (ctxt->es));
8608687aecSSergio Luis 	asm volatile ("movw %%fs, %0" : "=m" (ctxt->fs));
8708687aecSSergio Luis 	asm volatile ("movw %%gs, %0" : "=m" (ctxt->gs));
8808687aecSSergio Luis 	asm volatile ("movw %%ss, %0" : "=m" (ctxt->ss));
8908687aecSSergio Luis 
9008687aecSSergio Luis 	rdmsrl(MSR_FS_BASE, ctxt->fs_base);
9108687aecSSergio Luis 	rdmsrl(MSR_GS_BASE, ctxt->gs_base);
9208687aecSSergio Luis 	rdmsrl(MSR_KERNEL_GS_BASE, ctxt->gs_kernel_base);
9308687aecSSergio Luis 	mtrr_save_fixed_ranges(NULL);
9408687aecSSergio Luis 
9508687aecSSergio Luis 	rdmsrl(MSR_EFER, ctxt->efer);
9608687aecSSergio Luis #endif
9708687aecSSergio Luis 
9808687aecSSergio Luis 	/*
9908687aecSSergio Luis 	 * control registers
10008687aecSSergio Luis 	 */
10108687aecSSergio Luis 	ctxt->cr0 = read_cr0();
10208687aecSSergio Luis 	ctxt->cr2 = read_cr2();
10308687aecSSergio Luis 	ctxt->cr3 = read_cr3();
10408687aecSSergio Luis #ifdef CONFIG_X86_32
10508687aecSSergio Luis 	ctxt->cr4 = read_cr4_safe();
10608687aecSSergio Luis #else
10708687aecSSergio Luis /* CONFIG_X86_64 */
10808687aecSSergio Luis 	ctxt->cr4 = read_cr4();
10908687aecSSergio Luis 	ctxt->cr8 = read_cr8();
11008687aecSSergio Luis #endif
11185a0e753SOndrej Zary 	ctxt->misc_enable_saved = !rdmsrl_safe(MSR_IA32_MISC_ENABLE,
11285a0e753SOndrej Zary 					       &ctxt->misc_enable);
11308687aecSSergio Luis }
11408687aecSSergio Luis 
11508687aecSSergio Luis /* Needed by apm.c */
11608687aecSSergio Luis void save_processor_state(void)
11708687aecSSergio Luis {
11808687aecSSergio Luis 	__save_processor_state(&saved_context);
119b74f05d6SMarcelo Tosatti 	x86_platform.save_sched_clock_state();
12008687aecSSergio Luis }
12108687aecSSergio Luis #ifdef CONFIG_X86_32
12208687aecSSergio Luis EXPORT_SYMBOL(save_processor_state);
12308687aecSSergio Luis #endif
12408687aecSSergio Luis 
12508687aecSSergio Luis static void do_fpu_end(void)
12608687aecSSergio Luis {
12708687aecSSergio Luis 	/*
12808687aecSSergio Luis 	 * Restore FPU regs if necessary.
12908687aecSSergio Luis 	 */
13008687aecSSergio Luis 	kernel_fpu_end();
13108687aecSSergio Luis }
13208687aecSSergio Luis 
13308687aecSSergio Luis static void fix_processor_context(void)
13408687aecSSergio Luis {
13508687aecSSergio Luis 	int cpu = smp_processor_id();
13608687aecSSergio Luis 	struct tss_struct *t = &per_cpu(init_tss, cpu);
13708687aecSSergio Luis 
13808687aecSSergio Luis 	set_tss_desc(cpu, t);	/*
13908687aecSSergio Luis 				 * This just modifies memory; should not be
14008687aecSSergio Luis 				 * necessary. But... This is necessary, because
14108687aecSSergio Luis 				 * 386 hardware has concept of busy TSS or some
14208687aecSSergio Luis 				 * similar stupidity.
14308687aecSSergio Luis 				 */
14408687aecSSergio Luis 
14508687aecSSergio Luis #ifdef CONFIG_X86_64
14608687aecSSergio Luis 	get_cpu_gdt_table(cpu)[GDT_ENTRY_TSS].type = 9;
14708687aecSSergio Luis 
14808687aecSSergio Luis 	syscall_init();				/* This sets MSR_*STAR and related */
14908687aecSSergio Luis #endif
15008687aecSSergio Luis 	load_TR_desc();				/* This does ltr */
15108687aecSSergio Luis 	load_LDT(&current->active_mm->context);	/* This does lldt */
15208687aecSSergio Luis }
15308687aecSSergio Luis 
15408687aecSSergio Luis /**
15508687aecSSergio Luis  *	__restore_processor_state - restore the contents of CPU registers saved
15608687aecSSergio Luis  *		by __save_processor_state()
15708687aecSSergio Luis  *	@ctxt - structure to load the registers contents from
15808687aecSSergio Luis  */
15908687aecSSergio Luis static void __restore_processor_state(struct saved_context *ctxt)
16008687aecSSergio Luis {
16185a0e753SOndrej Zary 	if (ctxt->misc_enable_saved)
16285a0e753SOndrej Zary 		wrmsrl(MSR_IA32_MISC_ENABLE, ctxt->misc_enable);
16308687aecSSergio Luis 	/*
16408687aecSSergio Luis 	 * control registers
16508687aecSSergio Luis 	 */
16608687aecSSergio Luis 	/* cr4 was introduced in the Pentium CPU */
16708687aecSSergio Luis #ifdef CONFIG_X86_32
16808687aecSSergio Luis 	if (ctxt->cr4)
16908687aecSSergio Luis 		write_cr4(ctxt->cr4);
17008687aecSSergio Luis #else
17108687aecSSergio Luis /* CONFIG X86_64 */
17208687aecSSergio Luis 	wrmsrl(MSR_EFER, ctxt->efer);
17308687aecSSergio Luis 	write_cr8(ctxt->cr8);
17408687aecSSergio Luis 	write_cr4(ctxt->cr4);
17508687aecSSergio Luis #endif
17608687aecSSergio Luis 	write_cr3(ctxt->cr3);
17708687aecSSergio Luis 	write_cr2(ctxt->cr2);
17808687aecSSergio Luis 	write_cr0(ctxt->cr0);
17908687aecSSergio Luis 
18008687aecSSergio Luis 	/*
18108687aecSSergio Luis 	 * now restore the descriptor tables to their proper values
18208687aecSSergio Luis 	 * ltr is done i fix_processor_context().
18308687aecSSergio Luis 	 */
18408687aecSSergio Luis #ifdef CONFIG_X86_32
18508687aecSSergio Luis 	load_gdt(&ctxt->gdt);
18608687aecSSergio Luis 	load_idt(&ctxt->idt);
18708687aecSSergio Luis #else
18808687aecSSergio Luis /* CONFIG_X86_64 */
18908687aecSSergio Luis 	load_gdt((const struct desc_ptr *)&ctxt->gdt_limit);
19008687aecSSergio Luis 	load_idt((const struct desc_ptr *)&ctxt->idt_limit);
19108687aecSSergio Luis #endif
19208687aecSSergio Luis 
19308687aecSSergio Luis 	/*
19408687aecSSergio Luis 	 * segment registers
19508687aecSSergio Luis 	 */
19608687aecSSergio Luis #ifdef CONFIG_X86_32
19708687aecSSergio Luis 	loadsegment(es, ctxt->es);
19808687aecSSergio Luis 	loadsegment(fs, ctxt->fs);
19908687aecSSergio Luis 	loadsegment(gs, ctxt->gs);
20008687aecSSergio Luis 	loadsegment(ss, ctxt->ss);
20108687aecSSergio Luis 
20208687aecSSergio Luis 	/*
20308687aecSSergio Luis 	 * sysenter MSRs
20408687aecSSergio Luis 	 */
20508687aecSSergio Luis 	if (boot_cpu_has(X86_FEATURE_SEP))
20608687aecSSergio Luis 		enable_sep_cpu();
20708687aecSSergio Luis #else
20808687aecSSergio Luis /* CONFIG_X86_64 */
20908687aecSSergio Luis 	asm volatile ("movw %0, %%ds" :: "r" (ctxt->ds));
21008687aecSSergio Luis 	asm volatile ("movw %0, %%es" :: "r" (ctxt->es));
21108687aecSSergio Luis 	asm volatile ("movw %0, %%fs" :: "r" (ctxt->fs));
21208687aecSSergio Luis 	load_gs_index(ctxt->gs);
21308687aecSSergio Luis 	asm volatile ("movw %0, %%ss" :: "r" (ctxt->ss));
21408687aecSSergio Luis 
21508687aecSSergio Luis 	wrmsrl(MSR_FS_BASE, ctxt->fs_base);
21608687aecSSergio Luis 	wrmsrl(MSR_GS_BASE, ctxt->gs_base);
21708687aecSSergio Luis 	wrmsrl(MSR_KERNEL_GS_BASE, ctxt->gs_kernel_base);
21808687aecSSergio Luis #endif
21908687aecSSergio Luis 
22008687aecSSergio Luis 	/*
22108687aecSSergio Luis 	 * restore XCR0 for xsave capable cpu's.
22208687aecSSergio Luis 	 */
22308687aecSSergio Luis 	if (cpu_has_xsave)
22408687aecSSergio Luis 		xsetbv(XCR_XFEATURE_ENABLED_MASK, pcntxt_mask);
22508687aecSSergio Luis 
22608687aecSSergio Luis 	fix_processor_context();
22708687aecSSergio Luis 
22808687aecSSergio Luis 	do_fpu_end();
229dba69d10SMarcelo Tosatti 	x86_platform.restore_sched_clock_state();
230d0af9eedSSuresh Siddha 	mtrr_bp_restore();
23108687aecSSergio Luis }
23208687aecSSergio Luis 
23308687aecSSergio Luis /* Needed by apm.c */
23408687aecSSergio Luis void restore_processor_state(void)
23508687aecSSergio Luis {
23608687aecSSergio Luis 	__restore_processor_state(&saved_context);
23708687aecSSergio Luis }
23808687aecSSergio Luis #ifdef CONFIG_X86_32
23908687aecSSergio Luis EXPORT_SYMBOL(restore_processor_state);
24008687aecSSergio Luis #endif
241209efae1SFenghua Yu 
242209efae1SFenghua Yu /*
243209efae1SFenghua Yu  * When bsp_check() is called in hibernate and suspend, cpu hotplug
244209efae1SFenghua Yu  * is disabled already. So it's unnessary to handle race condition between
245209efae1SFenghua Yu  * cpumask query and cpu hotplug.
246209efae1SFenghua Yu  */
247209efae1SFenghua Yu static int bsp_check(void)
248209efae1SFenghua Yu {
249209efae1SFenghua Yu 	if (cpumask_first(cpu_online_mask) != 0) {
250209efae1SFenghua Yu 		pr_warn("CPU0 is offline.\n");
251209efae1SFenghua Yu 		return -ENODEV;
252209efae1SFenghua Yu 	}
253209efae1SFenghua Yu 
254209efae1SFenghua Yu 	return 0;
255209efae1SFenghua Yu }
256209efae1SFenghua Yu 
257209efae1SFenghua Yu static int bsp_pm_callback(struct notifier_block *nb, unsigned long action,
258209efae1SFenghua Yu 			   void *ptr)
259209efae1SFenghua Yu {
260209efae1SFenghua Yu 	int ret = 0;
261209efae1SFenghua Yu 
262209efae1SFenghua Yu 	switch (action) {
263209efae1SFenghua Yu 	case PM_SUSPEND_PREPARE:
264209efae1SFenghua Yu 	case PM_HIBERNATION_PREPARE:
265209efae1SFenghua Yu 		ret = bsp_check();
266209efae1SFenghua Yu 		break;
267*a71c8bc5SFenghua Yu #ifdef CONFIG_DEBUG_HOTPLUG_CPU0
268*a71c8bc5SFenghua Yu 	case PM_RESTORE_PREPARE:
269*a71c8bc5SFenghua Yu 		/*
270*a71c8bc5SFenghua Yu 		 * When system resumes from hibernation, online CPU0 because
271*a71c8bc5SFenghua Yu 		 * 1. it's required for resume and
272*a71c8bc5SFenghua Yu 		 * 2. the CPU was online before hibernation
273*a71c8bc5SFenghua Yu 		 */
274*a71c8bc5SFenghua Yu 		if (!cpu_online(0))
275*a71c8bc5SFenghua Yu 			_debug_hotplug_cpu(0, 1);
276*a71c8bc5SFenghua Yu 		break;
277*a71c8bc5SFenghua Yu 	case PM_POST_RESTORE:
278*a71c8bc5SFenghua Yu 		/*
279*a71c8bc5SFenghua Yu 		 * When a resume really happens, this code won't be called.
280*a71c8bc5SFenghua Yu 		 *
281*a71c8bc5SFenghua Yu 		 * This code is called only when user space hibernation software
282*a71c8bc5SFenghua Yu 		 * prepares for snapshot device during boot time. So we just
283*a71c8bc5SFenghua Yu 		 * call _debug_hotplug_cpu() to restore to CPU0's state prior to
284*a71c8bc5SFenghua Yu 		 * preparing the snapshot device.
285*a71c8bc5SFenghua Yu 		 *
286*a71c8bc5SFenghua Yu 		 * This works for normal boot case in our CPU0 hotplug debug
287*a71c8bc5SFenghua Yu 		 * mode, i.e. CPU0 is offline and user mode hibernation
288*a71c8bc5SFenghua Yu 		 * software initializes during boot time.
289*a71c8bc5SFenghua Yu 		 *
290*a71c8bc5SFenghua Yu 		 * If CPU0 is online and user application accesses snapshot
291*a71c8bc5SFenghua Yu 		 * device after boot time, this will offline CPU0 and user may
292*a71c8bc5SFenghua Yu 		 * see different CPU0 state before and after accessing
293*a71c8bc5SFenghua Yu 		 * the snapshot device. But hopefully this is not a case when
294*a71c8bc5SFenghua Yu 		 * user debugging CPU0 hotplug. Even if users hit this case,
295*a71c8bc5SFenghua Yu 		 * they can easily online CPU0 back.
296*a71c8bc5SFenghua Yu 		 *
297*a71c8bc5SFenghua Yu 		 * To simplify this debug code, we only consider normal boot
298*a71c8bc5SFenghua Yu 		 * case. Otherwise we need to remember CPU0's state and restore
299*a71c8bc5SFenghua Yu 		 * to that state and resolve racy conditions etc.
300*a71c8bc5SFenghua Yu 		 */
301*a71c8bc5SFenghua Yu 		_debug_hotplug_cpu(0, 0);
302*a71c8bc5SFenghua Yu 		break;
303*a71c8bc5SFenghua Yu #endif
304209efae1SFenghua Yu 	default:
305209efae1SFenghua Yu 		break;
306209efae1SFenghua Yu 	}
307209efae1SFenghua Yu 	return notifier_from_errno(ret);
308209efae1SFenghua Yu }
309209efae1SFenghua Yu 
310209efae1SFenghua Yu static int __init bsp_pm_check_init(void)
311209efae1SFenghua Yu {
312209efae1SFenghua Yu 	/*
313209efae1SFenghua Yu 	 * Set this bsp_pm_callback as lower priority than
314209efae1SFenghua Yu 	 * cpu_hotplug_pm_callback. So cpu_hotplug_pm_callback will be called
315209efae1SFenghua Yu 	 * earlier to disable cpu hotplug before bsp online check.
316209efae1SFenghua Yu 	 */
317209efae1SFenghua Yu 	pm_notifier(bsp_pm_callback, -INT_MAX);
318209efae1SFenghua Yu 	return 0;
319209efae1SFenghua Yu }
320209efae1SFenghua Yu 
321209efae1SFenghua Yu core_initcall(bsp_pm_check_init);
322