xref: /openbmc/linux/arch/mips/math-emu/dsemul.c (revision 4f2c0a4acffbec01079c28f839422e64ddeff004)
1b2441318SGreg Kroah-Hartman // SPDX-License-Identifier: GPL-2.0
2432c6bacSPaul Burton #include <linux/err.h>
3432c6bacSPaul Burton #include <linux/slab.h>
4589ee628SIngo Molnar #include <linux/mm_types.h>
5f719ff9bSIngo Molnar #include <linux/sched/task.h>
6432c6bacSPaul Burton 
71da177e4SLinus Torvalds #include <asm/branch.h>
81da177e4SLinus Torvalds #include <asm/cacheflush.h>
91da177e4SLinus Torvalds #include <asm/fpu_emulator.h>
10cd8ee345SRalf Baechle #include <asm/inst.h>
11cd8ee345SRalf Baechle #include <asm/mipsregs.h>
127c0f6ba6SLinus Torvalds #include <linux/uaccess.h>
131da177e4SLinus Torvalds 
14432c6bacSPaul Burton /**
15432c6bacSPaul Burton  * struct emuframe - The 'emulation' frame structure
16432c6bacSPaul Burton  * @emul:	The instruction to 'emulate'.
17432c6bacSPaul Burton  * @badinst:	A break instruction to cause a return to the kernel.
181da177e4SLinus Torvalds  *
19432c6bacSPaul Burton  * This structure defines the frames placed within the delay slot emulation
20432c6bacSPaul Burton  * page in response to a call to mips_dsemul(). Each thread may be allocated
21432c6bacSPaul Burton  * only one frame at any given time. The kernel stores within it the
22432c6bacSPaul Burton  * instruction to be 'emulated' followed by a break instruction, then
23432c6bacSPaul Burton  * executes the frame in user mode. The break causes a trap to the kernel
24432c6bacSPaul Burton  * which leads to do_dsemulret() being called unless the instruction in
25432c6bacSPaul Burton  * @emul causes a trap itself, is a branch, or a signal is delivered to
26432c6bacSPaul Burton  * the thread. In these cases the allocated frame will either be reused by
27432c6bacSPaul Burton  * a subsequent delay slot 'emulation', or be freed during signal delivery or
28432c6bacSPaul Burton  * upon thread exit.
29432c6bacSPaul Burton  *
30432c6bacSPaul Burton  * This approach is used because:
31432c6bacSPaul Burton  *
32432c6bacSPaul Burton  * - Actually emulating all instructions isn't feasible. We would need to
33432c6bacSPaul Burton  *   be able to handle instructions from all revisions of the MIPS ISA,
34432c6bacSPaul Burton  *   all ASEs & all vendor instruction set extensions. This would be a
35432c6bacSPaul Burton  *   whole lot of work & continual maintenance burden as new instructions
36432c6bacSPaul Burton  *   are introduced, and in the case of some vendor extensions may not
37432c6bacSPaul Burton  *   even be possible. Thus we need to take the approach of actually
38432c6bacSPaul Burton  *   executing the instruction.
39432c6bacSPaul Burton  *
40432c6bacSPaul Burton  * - We must execute the instruction within user context. If we were to
41432c6bacSPaul Burton  *   execute the instruction in kernel mode then it would have access to
42432c6bacSPaul Burton  *   kernel resources without very careful checks, leaving us with a
43432c6bacSPaul Burton  *   high potential for security or stability issues to arise.
44432c6bacSPaul Burton  *
45432c6bacSPaul Burton  * - We used to place the frame on the users stack, but this requires
46432c6bacSPaul Burton  *   that the stack be executable. This is bad for security so the
47432c6bacSPaul Burton  *   per-process page is now used instead.
48432c6bacSPaul Burton  *
49432c6bacSPaul Burton  * - The instruction in @emul may be something entirely invalid for a
50432c6bacSPaul Burton  *   delay slot. The user may (intentionally or otherwise) place a branch
51432c6bacSPaul Burton  *   in a delay slot, or a kernel mode instruction, or something else
52432c6bacSPaul Burton  *   which generates an exception. Thus we can't rely upon the break in
53432c6bacSPaul Burton  *   @badinst always being hit. For this reason we track the index of the
54432c6bacSPaul Burton  *   frame allocated to each thread, allowing us to clean it up at later
55432c6bacSPaul Burton  *   points such as signal delivery or thread exit.
56432c6bacSPaul Burton  *
57432c6bacSPaul Burton  * - The user may generate a fake struct emuframe if they wish, invoking
58432c6bacSPaul Burton  *   the BRK_MEMU break instruction themselves. We must therefore not
59432c6bacSPaul Burton  *   trust that BRK_MEMU means there's actually a valid frame allocated
60432c6bacSPaul Burton  *   to the thread, and must not allow the user to do anything they
61432c6bacSPaul Burton  *   couldn't already.
621da177e4SLinus Torvalds  */
631da177e4SLinus Torvalds struct emuframe {
641da177e4SLinus Torvalds 	mips_instruction	emul;
651da177e4SLinus Torvalds 	mips_instruction	badinst;
661da177e4SLinus Torvalds };
671da177e4SLinus Torvalds 
68432c6bacSPaul Burton static const int emupage_frame_count = PAGE_SIZE / sizeof(struct emuframe);
69432c6bacSPaul Burton 
dsemul_page(void)70432c6bacSPaul Burton static inline __user struct emuframe *dsemul_page(void)
71432c6bacSPaul Burton {
72432c6bacSPaul Burton 	return (__user struct emuframe *)STACK_TOP;
73432c6bacSPaul Burton }
74432c6bacSPaul Burton 
alloc_emuframe(void)75432c6bacSPaul Burton static int alloc_emuframe(void)
76432c6bacSPaul Burton {
77432c6bacSPaul Burton 	mm_context_t *mm_ctx = &current->mm->context;
78432c6bacSPaul Burton 	int idx;
79432c6bacSPaul Burton 
80432c6bacSPaul Burton retry:
81432c6bacSPaul Burton 	spin_lock(&mm_ctx->bd_emupage_lock);
82432c6bacSPaul Burton 
83432c6bacSPaul Burton 	/* Ensure we have an allocation bitmap */
84432c6bacSPaul Burton 	if (!mm_ctx->bd_emupage_allocmap) {
85*8512670dSChristophe JAILLET 		mm_ctx->bd_emupage_allocmap = bitmap_zalloc(emupage_frame_count,
86432c6bacSPaul Burton 							    GFP_ATOMIC);
87432c6bacSPaul Burton 		if (!mm_ctx->bd_emupage_allocmap) {
88432c6bacSPaul Burton 			idx = BD_EMUFRAME_NONE;
89432c6bacSPaul Burton 			goto out_unlock;
90432c6bacSPaul Burton 		}
91432c6bacSPaul Burton 	}
92432c6bacSPaul Burton 
93432c6bacSPaul Burton 	/* Attempt to allocate a single bit/frame */
94432c6bacSPaul Burton 	idx = bitmap_find_free_region(mm_ctx->bd_emupage_allocmap,
95432c6bacSPaul Burton 				      emupage_frame_count, 0);
96432c6bacSPaul Burton 	if (idx < 0) {
97e4553573SMaciej W. Rozycki 		/*
98432c6bacSPaul Burton 		 * Failed to allocate a frame. We'll wait until one becomes
99432c6bacSPaul Burton 		 * available. We unlock the page so that other threads actually
100432c6bacSPaul Burton 		 * get the opportunity to free their frames, which means
101432c6bacSPaul Burton 		 * technically the result of bitmap_full may be incorrect.
102432c6bacSPaul Burton 		 * However the worst case is that we repeat all this and end up
103432c6bacSPaul Burton 		 * back here again.
104e4553573SMaciej W. Rozycki 		 */
105432c6bacSPaul Burton 		spin_unlock(&mm_ctx->bd_emupage_lock);
106432c6bacSPaul Burton 		if (!wait_event_killable(mm_ctx->bd_emupage_queue,
107432c6bacSPaul Burton 			!bitmap_full(mm_ctx->bd_emupage_allocmap,
108432c6bacSPaul Burton 				     emupage_frame_count)))
109432c6bacSPaul Burton 			goto retry;
110432c6bacSPaul Burton 
111432c6bacSPaul Burton 		/* Received a fatal signal - just give in */
112432c6bacSPaul Burton 		return BD_EMUFRAME_NONE;
113432c6bacSPaul Burton 	}
114432c6bacSPaul Burton 
115432c6bacSPaul Burton 	/* Success! */
116432c6bacSPaul Burton 	pr_debug("allocate emuframe %d to %d\n", idx, current->pid);
117432c6bacSPaul Burton out_unlock:
118432c6bacSPaul Burton 	spin_unlock(&mm_ctx->bd_emupage_lock);
119432c6bacSPaul Burton 	return idx;
120432c6bacSPaul Burton }
121432c6bacSPaul Burton 
free_emuframe(int idx,struct mm_struct * mm)122432c6bacSPaul Burton static void free_emuframe(int idx, struct mm_struct *mm)
123432c6bacSPaul Burton {
124432c6bacSPaul Burton 	mm_context_t *mm_ctx = &mm->context;
125432c6bacSPaul Burton 
126432c6bacSPaul Burton 	spin_lock(&mm_ctx->bd_emupage_lock);
127432c6bacSPaul Burton 
128432c6bacSPaul Burton 	pr_debug("free emuframe %d from %d\n", idx, current->pid);
129432c6bacSPaul Burton 	bitmap_clear(mm_ctx->bd_emupage_allocmap, idx, 1);
130432c6bacSPaul Burton 
131432c6bacSPaul Burton 	/* If some thread is waiting for a frame, now's its chance */
132432c6bacSPaul Burton 	wake_up(&mm_ctx->bd_emupage_queue);
133432c6bacSPaul Burton 
134432c6bacSPaul Burton 	spin_unlock(&mm_ctx->bd_emupage_lock);
135432c6bacSPaul Burton }
136432c6bacSPaul Burton 
within_emuframe(struct pt_regs * regs)137432c6bacSPaul Burton static bool within_emuframe(struct pt_regs *regs)
138432c6bacSPaul Burton {
139432c6bacSPaul Burton 	unsigned long base = (unsigned long)dsemul_page();
140432c6bacSPaul Burton 
141432c6bacSPaul Burton 	if (regs->cp0_epc < base)
142432c6bacSPaul Burton 		return false;
143432c6bacSPaul Burton 	if (regs->cp0_epc >= (base + PAGE_SIZE))
144432c6bacSPaul Burton 		return false;
145432c6bacSPaul Burton 
146432c6bacSPaul Burton 	return true;
147432c6bacSPaul Burton }
148432c6bacSPaul Burton 
dsemul_thread_cleanup(struct task_struct * tsk)149432c6bacSPaul Burton bool dsemul_thread_cleanup(struct task_struct *tsk)
150432c6bacSPaul Burton {
151432c6bacSPaul Burton 	int fr_idx;
152432c6bacSPaul Burton 
153432c6bacSPaul Burton 	/* Clear any allocated frame, retrieving its index */
154432c6bacSPaul Burton 	fr_idx = atomic_xchg(&tsk->thread.bd_emu_frame, BD_EMUFRAME_NONE);
155432c6bacSPaul Burton 
156432c6bacSPaul Burton 	/* If no frame was allocated, we're done */
157432c6bacSPaul Burton 	if (fr_idx == BD_EMUFRAME_NONE)
158432c6bacSPaul Burton 		return false;
159432c6bacSPaul Burton 
160432c6bacSPaul Burton 	task_lock(tsk);
161432c6bacSPaul Burton 
162432c6bacSPaul Burton 	/* Free the frame that this thread had allocated */
163432c6bacSPaul Burton 	if (tsk->mm)
164432c6bacSPaul Burton 		free_emuframe(fr_idx, tsk->mm);
165432c6bacSPaul Burton 
166432c6bacSPaul Burton 	task_unlock(tsk);
167432c6bacSPaul Burton 	return true;
168432c6bacSPaul Burton }
169432c6bacSPaul Burton 
dsemul_thread_rollback(struct pt_regs * regs)170432c6bacSPaul Burton bool dsemul_thread_rollback(struct pt_regs *regs)
171432c6bacSPaul Burton {
172432c6bacSPaul Burton 	struct emuframe __user *fr;
173432c6bacSPaul Burton 	int fr_idx;
174432c6bacSPaul Burton 
175432c6bacSPaul Burton 	/* Do nothing if we're not executing from a frame */
176432c6bacSPaul Burton 	if (!within_emuframe(regs))
177432c6bacSPaul Burton 		return false;
178432c6bacSPaul Burton 
179432c6bacSPaul Burton 	/* Find the frame being executed */
180432c6bacSPaul Burton 	fr_idx = atomic_read(&current->thread.bd_emu_frame);
181432c6bacSPaul Burton 	if (fr_idx == BD_EMUFRAME_NONE)
182432c6bacSPaul Burton 		return false;
183432c6bacSPaul Burton 	fr = &dsemul_page()[fr_idx];
184432c6bacSPaul Burton 
185432c6bacSPaul Burton 	/*
186432c6bacSPaul Burton 	 * If the PC is at the emul instruction, roll back to the branch. If
187432c6bacSPaul Burton 	 * PC is at the badinst (break) instruction, we've already emulated the
188432c6bacSPaul Burton 	 * instruction so progress to the continue PC. If it's anything else
189432c6bacSPaul Burton 	 * then something is amiss & the user has branched into some other area
190432c6bacSPaul Burton 	 * of the emupage - we'll free the allocated frame anyway.
191432c6bacSPaul Burton 	 */
192432c6bacSPaul Burton 	if (msk_isa16_mode(regs->cp0_epc) == (unsigned long)&fr->emul)
193432c6bacSPaul Burton 		regs->cp0_epc = current->thread.bd_emu_branch_pc;
194432c6bacSPaul Burton 	else if (msk_isa16_mode(regs->cp0_epc) == (unsigned long)&fr->badinst)
195432c6bacSPaul Burton 		regs->cp0_epc = current->thread.bd_emu_cont_pc;
196432c6bacSPaul Burton 
197432c6bacSPaul Burton 	atomic_set(&current->thread.bd_emu_frame, BD_EMUFRAME_NONE);
198432c6bacSPaul Burton 	free_emuframe(fr_idx, current->mm);
199432c6bacSPaul Burton 	return true;
200432c6bacSPaul Burton }
201432c6bacSPaul Burton 
dsemul_mm_cleanup(struct mm_struct * mm)202432c6bacSPaul Burton void dsemul_mm_cleanup(struct mm_struct *mm)
203432c6bacSPaul Burton {
204432c6bacSPaul Burton 	mm_context_t *mm_ctx = &mm->context;
205432c6bacSPaul Burton 
206*8512670dSChristophe JAILLET 	bitmap_free(mm_ctx->bd_emupage_allocmap);
207432c6bacSPaul Burton }
208432c6bacSPaul Burton 
/*
 * mips_dsemul() - Arrange for a delay slot instruction to be executed
 * @regs:	User register context.
 * @ir:		The instruction found in the delay slot.
 * @branch_pc:	PC of the branch, recorded for use on rollback.
 * @cont_pc:	PC at which to continue once @ir has been executed.
 *
 * NOPs (and, in microMIPS mode, NOP16 & ADDIUPC) are dealt with directly.
 * Anything else is written, followed by a break instruction, into an
 * emulation frame in user memory and EPC is pointed at that frame.
 *
 * Returns -1 if the instruction was handled here and no frame needs to be
 * executed, 0 if EPC now points at a frame, or SIGBUS if no frame could be
 * allocated or written.
 */
int mips_dsemul(struct pt_regs *regs, mips_instruction ir,
		unsigned long branch_pc, unsigned long cont_pc)
{
	int isa16 = get_isa16_mode(regs->cp0_epc);
	mips_instruction break_math;
	unsigned long fr_uaddr;
	struct emuframe fr;
	int fr_idx, ret;

	/* NOP is easy */
	if (ir == 0)
		return -1;

	/* microMIPS instructions */
	if (isa16) {
		union mips_instruction insn = { .word = ir };

		/* NOP16 aka MOVE16 $0, $0 */
		if ((ir >> 16) == MM_NOP16)
			return -1;

		/* ADDIUPC */
		if (insn.mm_a_format.opcode == mm_addiupc_op) {
			unsigned int rs;
			s32 v;

			rs = (((insn.mm_a_format.rs + 0xe) & 0xf) + 2);
			v = regs->cp0_epc & ~3;
			v += insn.mm_a_format.simmediate << 2;
			regs->regs[rs] = (long)v;
			return -1;
		}
	}

	pr_debug("dsemul 0x%08lx cont at 0x%08lx\n", regs->cp0_epc, cont_pc);

	/* Allocate a frame if we don't already have one */
	fr_idx = atomic_read(&current->thread.bd_emu_frame);
	if (fr_idx == BD_EMUFRAME_NONE)
		fr_idx = alloc_emuframe();
	if (fr_idx == BD_EMUFRAME_NONE)
		return SIGBUS;

	/* Retrieve the appropriately encoded break instruction */
	break_math = BREAK_MATH(isa16);

	/* Write the instructions to the frame */
	if (isa16) {
		union mips_instruction _emul = {
			.halfword = { ir >> 16, ir }
		};
		union mips_instruction _badinst = {
			.halfword = { break_math >> 16, break_math }
		};

		fr.emul = _emul.word;
		fr.badinst = _badinst.word;
	} else {
		fr.emul = ir;
		fr.badinst = break_math;
	}

	/* Write the frame to user memory */
	fr_uaddr = (unsigned long)&dsemul_page()[fr_idx];
	ret = access_process_vm(current, fr_uaddr, &fr, sizeof(fr),
				FOLL_FORCE | FOLL_WRITE);
	if (unlikely(ret != sizeof(fr))) {
		MIPS_FPU_EMU_INC_STATS(errors);

		/*
		 * fr_idx may be a frame this thread already owned rather
		 * than one allocated above. Forget it before freeing it,
		 * otherwise the thread would keep a stale index & could
		 * later reuse or free a frame which by then belongs to
		 * another thread.
		 */
		atomic_set(&current->thread.bd_emu_frame, BD_EMUFRAME_NONE);
		free_emuframe(fr_idx, current->mm);
		return SIGBUS;
	}

	/* Record the PC of the branch, PC to continue from & frame index */
	current->thread.bd_emu_branch_pc = branch_pc;
	current->thread.bd_emu_cont_pc = cont_pc;
	atomic_set(&current->thread.bd_emu_frame, fr_idx);

	/* Change user register context to execute the frame */
	regs->cp0_epc = fr_uaddr | isa16;

	return 0;
}
2911da177e4SLinus Torvalds 
do_dsemulret(struct pt_regs * xcp)292432c6bacSPaul Burton bool do_dsemulret(struct pt_regs *xcp)
2931da177e4SLinus Torvalds {
294432c6bacSPaul Burton 	/* Cleanup the allocated frame, returning if there wasn't one */
295432c6bacSPaul Burton 	if (!dsemul_thread_cleanup(current)) {
296b6ee75edSDavid Daney 		MIPS_FPU_EMU_INC_STATS(errors);
297432c6bacSPaul Burton 		return false;
2981da177e4SLinus Torvalds 	}
2991da177e4SLinus Torvalds 
3001da177e4SLinus Torvalds 	/* Set EPC to return to post-branch instruction */
301432c6bacSPaul Burton 	xcp->cp0_epc = current->thread.bd_emu_cont_pc;
302432c6bacSPaul Burton 	pr_debug("dsemulret to 0x%08lx\n", xcp->cp0_epc);
303116e7111SPaul Burton 	MIPS_FPU_EMU_INC_STATS(ds_emul);
304432c6bacSPaul Burton 	return true;
3051da177e4SLinus Torvalds }
306