xref: /openbmc/linux/arch/x86/kernel/idt.c (revision d15cb3da)
1 // SPDX-License-Identifier: GPL-2.0-only
2 /*
3  * Interrupt descriptor table related code
4  */
5 #include <linux/interrupt.h>
6 
7 #include <asm/cpu_entry_area.h>
8 #include <asm/set_memory.h>
9 #include <asm/traps.h>
10 #include <asm/proto.h>
11 #include <asm/desc.h>
12 #include <asm/hw_irq.h>
13 #include <asm/idtentry.h>
14 
15 #define DPL0		0x0
16 #define DPL3		0x3
17 
18 #define DEFAULT_STACK	0
19 
20 #define G(_vector, _addr, _ist, _type, _dpl, _segment)	\
21 	{						\
22 		.vector		= _vector,		\
23 		.bits.ist	= _ist,			\
24 		.bits.type	= _type,		\
25 		.bits.dpl	= _dpl,			\
26 		.bits.p		= 1,			\
27 		.addr		= _addr,		\
28 		.segment	= _segment,		\
29 	}
30 
31 /* Interrupt gate */
32 #define INTG(_vector, _addr)				\
33 	G(_vector, _addr, DEFAULT_STACK, GATE_INTERRUPT, DPL0, __KERNEL_CS)
34 
35 /* System interrupt gate */
36 #define SYSG(_vector, _addr)				\
37 	G(_vector, _addr, DEFAULT_STACK, GATE_INTERRUPT, DPL3, __KERNEL_CS)
38 
39 #ifdef CONFIG_X86_64
40 /*
41  * Interrupt gate with interrupt stack. The _ist index is the index in
42  * the tss.ist[] array, but for the descriptor it needs to start at 1.
43  */
44 #define ISTG(_vector, _addr, _ist)			\
45 	G(_vector, _addr, _ist + 1, GATE_INTERRUPT, DPL0, __KERNEL_CS)
46 #else
47 #define ISTG(_vector, _addr, _ist)	INTG(_vector, _addr)
48 #endif
49 
50 /* Task gate */
51 #define TSKG(_vector, _gdt)				\
52 	G(_vector, NULL, DEFAULT_STACK, GATE_TASK, DPL0, _gdt << 3)
53 
54 #define IDT_TABLE_SIZE		(IDT_ENTRIES * sizeof(gate_desc))
55 
56 static bool idt_setup_done __initdata;
57 
58 /*
59  * Early traps running on the DEFAULT_STACK because the other interrupt
60  * stacks work only after cpu_init().
61  */
62 static const __initconst struct idt_data early_idts[] = {
63 	INTG(X86_TRAP_DB,		asm_exc_debug),
64 	SYSG(X86_TRAP_BP,		asm_exc_int3),
65 
66 #ifdef CONFIG_X86_32
67 	/*
68 	 * Not possible on 64-bit. See idt_setup_early_pf() for details.
69 	 */
70 	INTG(X86_TRAP_PF,		asm_exc_page_fault),
71 #endif
72 };
73 
74 /*
75  * The default IDT entries which are set up in trap_init() before
76  * cpu_init() is invoked. Interrupt stacks cannot be used at that point and
77  * the traps which use them are reinitialized with IST after cpu_init() has
78  * set up TSS.
79  */
80 static const __initconst struct idt_data def_idts[] = {
81 	INTG(X86_TRAP_DE,		asm_exc_divide_error),
82 	ISTG(X86_TRAP_NMI,		asm_exc_nmi, IST_INDEX_NMI),
83 	INTG(X86_TRAP_BR,		asm_exc_bounds),
84 	INTG(X86_TRAP_UD,		asm_exc_invalid_op),
85 	INTG(X86_TRAP_NM,		asm_exc_device_not_available),
86 	INTG(X86_TRAP_OLD_MF,		asm_exc_coproc_segment_overrun),
87 	INTG(X86_TRAP_TS,		asm_exc_invalid_tss),
88 	INTG(X86_TRAP_NP,		asm_exc_segment_not_present),
89 	INTG(X86_TRAP_SS,		asm_exc_stack_segment),
90 	INTG(X86_TRAP_GP,		asm_exc_general_protection),
91 	INTG(X86_TRAP_SPURIOUS,		asm_exc_spurious_interrupt_bug),
92 	INTG(X86_TRAP_MF,		asm_exc_coprocessor_error),
93 	INTG(X86_TRAP_AC,		asm_exc_alignment_check),
94 	INTG(X86_TRAP_XF,		asm_exc_simd_coprocessor_error),
95 
96 #ifdef CONFIG_X86_32
97 	TSKG(X86_TRAP_DF,		GDT_ENTRY_DOUBLEFAULT_TSS),
98 #else
99 	ISTG(X86_TRAP_DF,		asm_exc_double_fault, IST_INDEX_DF),
100 #endif
101 	ISTG(X86_TRAP_DB,		asm_exc_debug, IST_INDEX_DB),
102 
103 #ifdef CONFIG_X86_MCE
104 	ISTG(X86_TRAP_MC,		asm_exc_machine_check, IST_INDEX_MCE),
105 #endif
106 
107 #ifdef CONFIG_AMD_MEM_ENCRYPT
108 	ISTG(X86_TRAP_VC,		asm_exc_vmm_communication, IST_INDEX_VC),
109 #endif
110 
111 	SYSG(X86_TRAP_OF,		asm_exc_overflow),
112 #if defined(CONFIG_IA32_EMULATION)
113 	SYSG(IA32_SYSCALL_VECTOR,	entry_INT80_compat),
114 #elif defined(CONFIG_X86_32)
115 	SYSG(IA32_SYSCALL_VECTOR,	entry_INT80_32),
116 #endif
117 };
118 
119 /*
120  * The APIC and SMP idt entries
121  */
122 static const __initconst struct idt_data apic_idts[] = {
123 #ifdef CONFIG_SMP
124 	INTG(RESCHEDULE_VECTOR,			asm_sysvec_reschedule_ipi),
125 	INTG(CALL_FUNCTION_VECTOR,		asm_sysvec_call_function),
126 	INTG(CALL_FUNCTION_SINGLE_VECTOR,	asm_sysvec_call_function_single),
127 	INTG(IRQ_MOVE_CLEANUP_VECTOR,		asm_sysvec_irq_move_cleanup),
128 	INTG(REBOOT_VECTOR,			asm_sysvec_reboot),
129 #endif
130 
131 #ifdef CONFIG_X86_THERMAL_VECTOR
132 	INTG(THERMAL_APIC_VECTOR,		asm_sysvec_thermal),
133 #endif
134 
135 #ifdef CONFIG_X86_MCE_THRESHOLD
136 	INTG(THRESHOLD_APIC_VECTOR,		asm_sysvec_threshold),
137 #endif
138 
139 #ifdef CONFIG_X86_MCE_AMD
140 	INTG(DEFERRED_ERROR_VECTOR,		asm_sysvec_deferred_error),
141 #endif
142 
143 #ifdef CONFIG_X86_LOCAL_APIC
144 	INTG(LOCAL_TIMER_VECTOR,		asm_sysvec_apic_timer_interrupt),
145 	INTG(X86_PLATFORM_IPI_VECTOR,		asm_sysvec_x86_platform_ipi),
146 # ifdef CONFIG_HAVE_KVM
147 	INTG(POSTED_INTR_VECTOR,		asm_sysvec_kvm_posted_intr_ipi),
148 	INTG(POSTED_INTR_WAKEUP_VECTOR,		asm_sysvec_kvm_posted_intr_wakeup_ipi),
149 	INTG(POSTED_INTR_NESTED_VECTOR,		asm_sysvec_kvm_posted_intr_nested_ipi),
150 # endif
151 # ifdef CONFIG_IRQ_WORK
152 	INTG(IRQ_WORK_VECTOR,			asm_sysvec_irq_work),
153 # endif
154 	INTG(SPURIOUS_APIC_VECTOR,		asm_sysvec_spurious_apic_interrupt),
155 	INTG(ERROR_APIC_VECTOR,			asm_sysvec_error_interrupt),
156 #endif
157 };
158 
159 /* Must be page-aligned because the real IDT is used in the cpu entry area */
160 static gate_desc idt_table[IDT_ENTRIES] __page_aligned_bss;
161 
162 static struct desc_ptr idt_descr __ro_after_init = {
163 	.size		= IDT_TABLE_SIZE - 1,
164 	.address	= (unsigned long) idt_table,
165 };
166 
167 void load_current_idt(void)
168 {
169 	lockdep_assert_irqs_disabled();
170 	load_idt(&idt_descr);
171 }
172 
173 #ifdef CONFIG_X86_F00F_BUG
174 bool idt_is_f00f_address(unsigned long address)
175 {
176 	return ((address - idt_descr.address) >> 3) == 6;
177 }
178 #endif
179 
180 static __init void
181 idt_setup_from_table(gate_desc *idt, const struct idt_data *t, int size, bool sys)
182 {
183 	gate_desc desc;
184 
185 	for (; size > 0; t++, size--) {
186 		idt_init_desc(&desc, t);
187 		write_idt_entry(idt, t->vector, &desc);
188 		if (sys)
189 			set_bit(t->vector, system_vectors);
190 	}
191 }
192 
193 static __init void set_intr_gate(unsigned int n, const void *addr)
194 {
195 	struct idt_data data;
196 
197 	init_idt_data(&data, n, addr);
198 
199 	idt_setup_from_table(idt_table, &data, 1, false);
200 }
201 
202 /**
203  * idt_setup_early_traps - Initialize the idt table with early traps
204  *
205  * On X8664 these traps do not use interrupt stacks as they can't work
206  * before cpu_init() is invoked and sets up TSS. The IST variants are
207  * installed after that.
208  */
209 void __init idt_setup_early_traps(void)
210 {
211 	idt_setup_from_table(idt_table, early_idts, ARRAY_SIZE(early_idts),
212 			     true);
213 	load_idt(&idt_descr);
214 }
215 
216 /**
217  * idt_setup_traps - Initialize the idt table with default traps
218  */
219 void __init idt_setup_traps(void)
220 {
221 	idt_setup_from_table(idt_table, def_idts, ARRAY_SIZE(def_idts), true);
222 }
223 
224 #ifdef CONFIG_X86_64
225 /*
226  * Early traps running on the DEFAULT_STACK because the other interrupt
227  * stacks work only after cpu_init().
228  */
229 static const __initconst struct idt_data early_pf_idts[] = {
230 	INTG(X86_TRAP_PF,		asm_exc_page_fault),
231 };
232 
233 /**
234  * idt_setup_early_pf - Initialize the idt table with early pagefault handler
235  *
236  * On X8664 this does not use interrupt stacks as they can't work before
237  * cpu_init() is invoked and sets up TSS. The IST variant is installed
238  * after that.
239  *
240  * Note, that X86_64 cannot install the real #PF handler in
241  * idt_setup_early_traps() because the memory initialization needs the #PF
242  * handler from the early_idt_handler_array to initialize the early page
243  * tables.
244  */
245 void __init idt_setup_early_pf(void)
246 {
247 	idt_setup_from_table(idt_table, early_pf_idts,
248 			     ARRAY_SIZE(early_pf_idts), true);
249 }
250 #endif
251 
252 static void __init idt_map_in_cea(void)
253 {
254 	/*
255 	 * Set the IDT descriptor to a fixed read-only location in the cpu
256 	 * entry area, so that the "sidt" instruction will not leak the
257 	 * location of the kernel, and to defend the IDT against arbitrary
258 	 * memory write vulnerabilities.
259 	 */
260 	cea_set_pte(CPU_ENTRY_AREA_RO_IDT_VADDR, __pa_symbol(idt_table),
261 		    PAGE_KERNEL_RO);
262 	idt_descr.address = CPU_ENTRY_AREA_RO_IDT;
263 }
264 
265 /**
266  * idt_setup_apic_and_irq_gates - Setup APIC/SMP and normal interrupt gates
267  */
268 void __init idt_setup_apic_and_irq_gates(void)
269 {
270 	int i = FIRST_EXTERNAL_VECTOR;
271 	void *entry;
272 
273 	idt_setup_from_table(idt_table, apic_idts, ARRAY_SIZE(apic_idts), true);
274 
275 	for_each_clear_bit_from(i, system_vectors, FIRST_SYSTEM_VECTOR) {
276 		entry = irq_entries_start + IDT_ALIGN * (i - FIRST_EXTERNAL_VECTOR);
277 		set_intr_gate(i, entry);
278 	}
279 
280 #ifdef CONFIG_X86_LOCAL_APIC
281 	for_each_clear_bit_from(i, system_vectors, NR_VECTORS) {
282 		/*
283 		 * Don't set the non assigned system vectors in the
284 		 * system_vectors bitmap. Otherwise they show up in
285 		 * /proc/interrupts.
286 		 */
287 		entry = spurious_entries_start + IDT_ALIGN * (i - FIRST_SYSTEM_VECTOR);
288 		set_intr_gate(i, entry);
289 	}
290 #endif
291 	/* Map IDT into CPU entry area and reload it. */
292 	idt_map_in_cea();
293 	load_idt(&idt_descr);
294 
295 	/* Make the IDT table read only */
296 	set_memory_ro((unsigned long)&idt_table, 1);
297 
298 	idt_setup_done = true;
299 }
300 
301 /**
302  * idt_setup_early_handler - Initializes the idt table with early handlers
303  */
304 void __init idt_setup_early_handler(void)
305 {
306 	int i;
307 
308 	for (i = 0; i < NUM_EXCEPTION_VECTORS; i++)
309 		set_intr_gate(i, early_idt_handler_array[i]);
310 #ifdef CONFIG_X86_32
311 	for ( ; i < NR_VECTORS; i++)
312 		set_intr_gate(i, early_ignore_irq);
313 #endif
314 	load_idt(&idt_descr);
315 }
316 
317 /**
318  * idt_invalidate - Invalidate interrupt descriptor table
319  */
320 void idt_invalidate(void)
321 {
322 	static const struct desc_ptr idt = { .address = 0, .size = 0 };
323 
324 	load_idt(&idt);
325 }
326 
327 void __init alloc_intr_gate(unsigned int n, const void *addr)
328 {
329 	if (WARN_ON(n < FIRST_SYSTEM_VECTOR))
330 		return;
331 
332 	if (WARN_ON(idt_setup_done))
333 		return;
334 
335 	if (!WARN_ON(test_and_set_bit(n, system_vectors)))
336 		set_intr_gate(n, addr);
337 }
338