184778508Sblueswir1 /*
284778508Sblueswir1 * mmap support for qemu
384778508Sblueswir1 *
484778508Sblueswir1 * Copyright (c) 2003 - 2008 Fabrice Bellard
584778508Sblueswir1 *
684778508Sblueswir1 * This program is free software; you can redistribute it and/or modify
784778508Sblueswir1 * it under the terms of the GNU General Public License as published by
884778508Sblueswir1 * the Free Software Foundation; either version 2 of the License, or
984778508Sblueswir1 * (at your option) any later version.
1084778508Sblueswir1 *
1184778508Sblueswir1 * This program is distributed in the hope that it will be useful,
1284778508Sblueswir1 * but WITHOUT ANY WARRANTY; without even the implied warranty of
1384778508Sblueswir1 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
1484778508Sblueswir1 * GNU General Public License for more details.
1584778508Sblueswir1 *
1684778508Sblueswir1 * You should have received a copy of the GNU General Public License
178167ee88SBlue Swirl * along with this program; if not, see <http://www.gnu.org/licenses/>.
1884778508Sblueswir1 */
192231197cSPeter Maydell #include "qemu/osdep.h"
2074781c08SPhilippe Mathieu-Daudé #include "exec/page-protection.h"
2184778508Sblueswir1
2284778508Sblueswir1 #include "qemu.h"
2384778508Sblueswir1
/* Process-wide mutex guarding the guest memory-map state. */
static pthread_mutex_t mmap_mutex = PTHREAD_MUTEX_INITIALIZER;
/* Per-thread nesting depth of mmap_lock() calls (0 == not held). */
static __thread int mmap_lock_count;

/*
 * Acquire the mmap lock for the calling thread.
 *
 * The lock nests: only the outermost call (depth 0 -> 1) actually takes
 * mmap_mutex; inner calls merely bump the per-thread depth counter.
 */
void mmap_lock(void)
{
    int depth = mmap_lock_count;

    mmap_lock_count = depth + 1;
    if (depth == 0) {
        pthread_mutex_lock(&mmap_mutex);
    }
}
3384778508Sblueswir1
mmap_unlock(void)3484778508Sblueswir1 void mmap_unlock(void)
3584778508Sblueswir1 {
36990ef918SRichard Henderson assert(mmap_lock_count > 0);
3784778508Sblueswir1 if (--mmap_lock_count == 0) {
3884778508Sblueswir1 pthread_mutex_unlock(&mmap_mutex);
3984778508Sblueswir1 }
4084778508Sblueswir1 }
4184778508Sblueswir1
have_mmap_lock(void)42301e40edSAlex Bennée bool have_mmap_lock(void)
43301e40edSAlex Bennée {
44301e40edSAlex Bennée return mmap_lock_count > 0 ? true : false;
45301e40edSAlex Bennée }
46301e40edSAlex Bennée
4784778508Sblueswir1 /* Grab lock to make sure things are in a consistent state after fork(). */
mmap_fork_start(void)4884778508Sblueswir1 void mmap_fork_start(void)
4984778508Sblueswir1 {
5084778508Sblueswir1 if (mmap_lock_count)
5184778508Sblueswir1 abort();
5284778508Sblueswir1 pthread_mutex_lock(&mmap_mutex);
5384778508Sblueswir1 }
5484778508Sblueswir1
mmap_fork_end(int child)5584778508Sblueswir1 void mmap_fork_end(int child)
5684778508Sblueswir1 {
5784778508Sblueswir1 if (child)
5884778508Sblueswir1 pthread_mutex_init(&mmap_mutex, NULL);
5984778508Sblueswir1 else
6084778508Sblueswir1 pthread_mutex_unlock(&mmap_mutex);
6184778508Sblueswir1 }
6284778508Sblueswir1
6384778508Sblueswir1 /* NOTE: all the constants are the HOST ones, but addresses are target. */
target_mprotect(abi_ulong start,abi_ulong len,int prot)6484778508Sblueswir1 int target_mprotect(abi_ulong start, abi_ulong len, int prot)
6584778508Sblueswir1 {
6684778508Sblueswir1 abi_ulong end, host_start, host_end, addr;
6784778508Sblueswir1 int prot1, ret;
6884778508Sblueswir1
6945b8765eSWarner Losh qemu_log_mask(CPU_LOG_PAGE, "mprotect: start=0x" TARGET_ABI_FMT_lx
706a3b9bfdSWarner Losh " len=0x" TARGET_ABI_FMT_lx " prot=%c%c%c\n", start, len,
7184778508Sblueswir1 prot & PROT_READ ? 'r' : '-',
7284778508Sblueswir1 prot & PROT_WRITE ? 'w' : '-',
7384778508Sblueswir1 prot & PROT_EXEC ? 'x' : '-');
7484778508Sblueswir1 if ((start & ~TARGET_PAGE_MASK) != 0)
7584778508Sblueswir1 return -EINVAL;
7684778508Sblueswir1 len = TARGET_PAGE_ALIGN(len);
7784778508Sblueswir1 end = start + len;
7884778508Sblueswir1 if (end < start)
7984778508Sblueswir1 return -EINVAL;
8084778508Sblueswir1 prot &= PROT_READ | PROT_WRITE | PROT_EXEC;
8184778508Sblueswir1 if (len == 0)
8284778508Sblueswir1 return 0;
8384778508Sblueswir1
8484778508Sblueswir1 mmap_lock();
8584778508Sblueswir1 host_start = start & qemu_host_page_mask;
8684778508Sblueswir1 host_end = HOST_PAGE_ALIGN(end);
8784778508Sblueswir1 if (start > host_start) {
8884778508Sblueswir1 /* handle host page containing start */
8984778508Sblueswir1 prot1 = prot;
9084778508Sblueswir1 for (addr = host_start; addr < start; addr += TARGET_PAGE_SIZE) {
9184778508Sblueswir1 prot1 |= page_get_flags(addr);
9284778508Sblueswir1 }
9384778508Sblueswir1 if (host_end == host_start + qemu_host_page_size) {
9484778508Sblueswir1 for (addr = end; addr < host_end; addr += TARGET_PAGE_SIZE) {
9584778508Sblueswir1 prot1 |= page_get_flags(addr);
9684778508Sblueswir1 }
9784778508Sblueswir1 end = host_end;
9884778508Sblueswir1 }
993e8f1628SRichard Henderson ret = mprotect(g2h_untagged(host_start),
10086b7c551SBALATON Zoltan qemu_host_page_size, prot1 & PAGE_RWX);
10184778508Sblueswir1 if (ret != 0)
10284778508Sblueswir1 goto error;
10384778508Sblueswir1 host_start += qemu_host_page_size;
10484778508Sblueswir1 }
10584778508Sblueswir1 if (end < host_end) {
10684778508Sblueswir1 prot1 = prot;
10784778508Sblueswir1 for (addr = end; addr < host_end; addr += TARGET_PAGE_SIZE) {
10884778508Sblueswir1 prot1 |= page_get_flags(addr);
10984778508Sblueswir1 }
1103e8f1628SRichard Henderson ret = mprotect(g2h_untagged(host_end - qemu_host_page_size),
11186b7c551SBALATON Zoltan qemu_host_page_size, prot1 & PAGE_RWX);
11284778508Sblueswir1 if (ret != 0)
11384778508Sblueswir1 goto error;
11484778508Sblueswir1 host_end -= qemu_host_page_size;
11584778508Sblueswir1 }
11684778508Sblueswir1
11784778508Sblueswir1 /* handle the pages in the middle */
11884778508Sblueswir1 if (host_start < host_end) {
1193e8f1628SRichard Henderson ret = mprotect(g2h_untagged(host_start), host_end - host_start, prot);
12084778508Sblueswir1 if (ret != 0)
12184778508Sblueswir1 goto error;
12284778508Sblueswir1 }
12349840a4aSRichard Henderson page_set_flags(start, start + len - 1, prot | PAGE_VALID);
12484778508Sblueswir1 mmap_unlock();
12584778508Sblueswir1 return 0;
12684778508Sblueswir1 error:
12784778508Sblueswir1 mmap_unlock();
12884778508Sblueswir1 return ret;
12984778508Sblueswir1 }
13084778508Sblueswir1
/*
 * Read @len bytes at file @offset of @fd into @p on behalf of target_mmap.
 *
 * Short reads are continued from where they stopped and reads interrupted
 * by a signal (EINTR) are retried.  Hitting EOF counts as success; when
 * @zero is set, the part of the buffer that could not be filled is cleared.
 *
 * Returns true on success, false on any other pread() error.
 */
static bool mmap_pread(int fd, void *p, size_t len, off_t offset, bool zero)
{
    for (;;) {
        ssize_t got = pread(fd, p, len, offset);

        if (likely(got == len)) {
            /* Everything that was still outstanding has arrived. */
            return true;
        }
        if (got < 0) {
            if (errno == EINTR) {
                continue;
            }
            return false;
        }
        if (got == 0) {
            /* End of file. */
            if (zero) {
                memset(p, 0, len);
            }
            return true;
        }

        /* Short read: advance past what we received and ask again. */
        p += got;
        len -= got;
        offset += got;
    }
}
164*5b73b248SRichard Henderson
165*5b73b248SRichard Henderson /*
166a6b2d060SWarner Losh * map an incomplete host page
167a6b2d060SWarner Losh *
168a6b2d060SWarner Losh * mmap_frag can be called with a valid fd, if flags doesn't contain one of
169a6b2d060SWarner Losh * MAP_ANON, MAP_STACK, MAP_GUARD. If we need to map a page in those cases, we
170a6b2d060SWarner Losh * pass fd == -1. However, if flags contains MAP_GUARD then MAP_ANON cannot be
171a6b2d060SWarner Losh * added.
172a6b2d060SWarner Losh *
173a6b2d060SWarner Losh * * If fd is valid (not -1) we want to map the pages with MAP_ANON.
174a6b2d060SWarner Losh * * If flags contains MAP_GUARD we don't want to add MAP_ANON because it
175a6b2d060SWarner Losh * will be rejected. See kern_mmap's enforcing of constraints for MAP_GUARD
176a6b2d060SWarner Losh * in sys/vm/vm_mmap.c.
177a6b2d060SWarner Losh * * If flags contains MAP_ANON it doesn't matter if we add it or not.
178a6b2d060SWarner Losh * * If flags contains MAP_STACK, mmap adds MAP_ANON when called so doesn't
179a6b2d060SWarner Losh * matter if we add it or not either. See enforcing of constraints for
180a6b2d060SWarner Losh * MAP_STACK in kern_mmap.
181a6b2d060SWarner Losh *
182a6b2d060SWarner Losh * Don't add MAP_ANON for the flags that use fd == -1 without specifying the
183a6b2d060SWarner Losh * flags directly, with the assumption that future flags that require fd == -1
184a6b2d060SWarner Losh * will also not require MAP_ANON.
185a6b2d060SWarner Losh */
mmap_frag(abi_ulong real_start,abi_ulong start,abi_ulong end,int prot,int flags,int fd,abi_ulong offset)18684778508Sblueswir1 static int mmap_frag(abi_ulong real_start,
18784778508Sblueswir1 abi_ulong start, abi_ulong end,
18884778508Sblueswir1 int prot, int flags, int fd, abi_ulong offset)
18984778508Sblueswir1 {
19084778508Sblueswir1 abi_ulong real_end, addr;
19184778508Sblueswir1 void *host_start;
19284778508Sblueswir1 int prot1, prot_new;
19384778508Sblueswir1
19484778508Sblueswir1 real_end = real_start + qemu_host_page_size;
1953e8f1628SRichard Henderson host_start = g2h_untagged(real_start);
19684778508Sblueswir1
19784778508Sblueswir1 /* get the protection of the target pages outside the mapping */
19884778508Sblueswir1 prot1 = 0;
19984778508Sblueswir1 for (addr = real_start; addr < real_end; addr++) {
20084778508Sblueswir1 if (addr < start || addr >= end)
20184778508Sblueswir1 prot1 |= page_get_flags(addr);
20284778508Sblueswir1 }
20384778508Sblueswir1
20484778508Sblueswir1 if (prot1 == 0) {
205a6b2d060SWarner Losh /* no page was there, so we allocate one. See also above. */
20684778508Sblueswir1 void *p = mmap(host_start, qemu_host_page_size, prot,
207a6b2d060SWarner Losh flags | ((fd != -1) ? MAP_ANON : 0), -1, 0);
20884778508Sblueswir1 if (p == MAP_FAILED)
20984778508Sblueswir1 return -1;
21084778508Sblueswir1 prot1 = prot;
21184778508Sblueswir1 }
21286b7c551SBALATON Zoltan prot1 &= PAGE_RWX;
21384778508Sblueswir1
21484778508Sblueswir1 prot_new = prot | prot1;
215a6b2d060SWarner Losh if (fd != -1) {
21684778508Sblueswir1 /* msync() won't work here, so we return an error if write is
21784778508Sblueswir1 possible while it is a shared mapping */
2186c173b3cSblueswir1 if ((flags & TARGET_BSD_MAP_FLAGMASK) == MAP_SHARED &&
21984778508Sblueswir1 (prot & PROT_WRITE))
220059bca46SBlue Swirl return -1;
22184778508Sblueswir1
22284778508Sblueswir1 /* adjust protection to be able to read */
22384778508Sblueswir1 if (!(prot1 & PROT_WRITE))
22484778508Sblueswir1 mprotect(host_start, qemu_host_page_size, prot1 | PROT_WRITE);
22584778508Sblueswir1
22684778508Sblueswir1 /* read the corresponding file data */
227*5b73b248SRichard Henderson if (!mmap_pread(fd, g2h_untagged(start), end - start, offset, true)) {
22826778ac3SMikaël Urankar return -1;
22926778ac3SMikaël Urankar }
23084778508Sblueswir1
23184778508Sblueswir1 /* put final protection */
23284778508Sblueswir1 if (prot_new != (prot1 | PROT_WRITE))
23384778508Sblueswir1 mprotect(host_start, qemu_host_page_size, prot_new);
23484778508Sblueswir1 } else {
23584778508Sblueswir1 if (prot_new != prot1) {
23684778508Sblueswir1 mprotect(host_start, qemu_host_page_size, prot_new);
23784778508Sblueswir1 }
238948516a3SMikaël Urankar if (prot_new & PROT_WRITE) {
239948516a3SMikaël Urankar memset(g2h_untagged(start), 0, end - start);
240948516a3SMikaël Urankar }
24184778508Sblueswir1 }
24284778508Sblueswir1 return 0;
24384778508Sblueswir1 }
24484778508Sblueswir1
/*
 * Default guest address at which mmap_find_vma_aligned() starts searching
 * when its caller passes start == 0.  mmap_next_start begins at
 * TASK_UNMAPPED_BASE and is moved past each allocation that was placed from
 * the default start at or above TASK_UNMAPPED_BASE.
 */
245be04f210SWarner Losh #if HOST_LONG_BITS == 64 && TARGET_ABI_BITS == 64
246be04f210SWarner Losh # define TASK_UNMAPPED_BASE (1ul << 38)
247be04f210SWarner Losh #else
248be04f210SWarner Losh # define TASK_UNMAPPED_BASE 0x40000000
249be04f210SWarner Losh #endif
250be04f210SWarner Losh abi_ulong mmap_next_start = TASK_UNMAPPED_BASE;
25184778508Sblueswir1
252be04f210SWarner Losh /*
253be04f210SWarner Losh * Subroutine of mmap_find_vma, used when we have pre-allocated a chunk of guest
254be04f210SWarner Losh * address space.
25584778508Sblueswir1 */
mmap_find_vma_reserved(abi_ulong start,abi_ulong size,abi_ulong alignment)256be04f210SWarner Losh static abi_ulong mmap_find_vma_reserved(abi_ulong start, abi_ulong size,
257be04f210SWarner Losh abi_ulong alignment)
25884778508Sblueswir1 {
259f12294b5SRichard Henderson abi_ulong ret;
26084778508Sblueswir1
261f12294b5SRichard Henderson ret = page_find_range_empty(start, reserved_va, size, alignment);
262f12294b5SRichard Henderson if (ret == -1 && start > TARGET_PAGE_SIZE) {
263f12294b5SRichard Henderson /* Restart at the beginning of the address space. */
264f12294b5SRichard Henderson ret = page_find_range_empty(TARGET_PAGE_SIZE, start - 1,
265f12294b5SRichard Henderson size, alignment);
26684778508Sblueswir1 }
267be04f210SWarner Losh
268f12294b5SRichard Henderson return ret;
26984778508Sblueswir1 }
27084778508Sblueswir1
271be04f210SWarner Losh /*
272be04f210SWarner Losh * Find and reserve a free memory area of size 'size'. The search
273be04f210SWarner Losh * starts at 'start'.
274be04f210SWarner Losh * It must be called with mmap_lock() held.
275be04f210SWarner Losh * Return -1 if error.
276be04f210SWarner Losh */
mmap_find_vma_aligned(abi_ulong start,abi_ulong size,abi_ulong alignment)277be04f210SWarner Losh static abi_ulong mmap_find_vma_aligned(abi_ulong start, abi_ulong size,
278be04f210SWarner Losh abi_ulong alignment)
279be04f210SWarner Losh {
280be04f210SWarner Losh void *ptr, *prev;
281be04f210SWarner Losh abi_ulong addr;
282be04f210SWarner Losh int flags;
283be04f210SWarner Losh int wrapped, repeat;
284be04f210SWarner Losh
285be04f210SWarner Losh /* If 'start' == 0, then a default start address is used. */
286be04f210SWarner Losh if (start == 0) {
287be04f210SWarner Losh start = mmap_next_start;
288be04f210SWarner Losh } else {
289be04f210SWarner Losh start &= qemu_host_page_mask;
290be04f210SWarner Losh }
291be04f210SWarner Losh
292be04f210SWarner Losh size = HOST_PAGE_ALIGN(size);
293be04f210SWarner Losh
294be04f210SWarner Losh if (reserved_va) {
295be04f210SWarner Losh return mmap_find_vma_reserved(start, size,
2960f2f3247SWarner Losh (alignment != 0 ? 1 << alignment :
2970f2f3247SWarner Losh MAX(qemu_host_page_size, TARGET_PAGE_SIZE)));
298be04f210SWarner Losh }
299be04f210SWarner Losh
300be04f210SWarner Losh addr = start;
301be04f210SWarner Losh wrapped = repeat = 0;
302be04f210SWarner Losh prev = 0;
303953b69ccSWarner Losh flags = MAP_ANON | MAP_PRIVATE;
304be04f210SWarner Losh if (alignment != 0) {
305be04f210SWarner Losh flags |= MAP_ALIGNED(alignment);
306be04f210SWarner Losh }
307be04f210SWarner Losh
308be04f210SWarner Losh for (;; prev = ptr) {
309be04f210SWarner Losh /*
310be04f210SWarner Losh * Reserve needed memory area to avoid a race.
311be04f210SWarner Losh * It should be discarded using:
312be04f210SWarner Losh * - mmap() with MAP_FIXED flag
313be04f210SWarner Losh * - mremap() with MREMAP_FIXED flag
314be04f210SWarner Losh * - shmat() with SHM_REMAP flag
315be04f210SWarner Losh */
316be04f210SWarner Losh ptr = mmap(g2h_untagged(addr), size, PROT_NONE,
317be04f210SWarner Losh flags, -1, 0);
318be04f210SWarner Losh
319be04f210SWarner Losh /* ENOMEM, if host address space has no memory */
320be04f210SWarner Losh if (ptr == MAP_FAILED) {
321be04f210SWarner Losh return (abi_ulong)-1;
322be04f210SWarner Losh }
323be04f210SWarner Losh
324be04f210SWarner Losh /*
325be04f210SWarner Losh * Count the number of sequential returns of the same address.
326be04f210SWarner Losh * This is used to modify the search algorithm below.
327be04f210SWarner Losh */
328be04f210SWarner Losh repeat = (ptr == prev ? repeat + 1 : 0);
329be04f210SWarner Losh
330be04f210SWarner Losh if (h2g_valid(ptr + size - 1)) {
331be04f210SWarner Losh addr = h2g(ptr);
332be04f210SWarner Losh
333be04f210SWarner Losh if ((addr & ~TARGET_PAGE_MASK) == 0) {
334be04f210SWarner Losh /* Success. */
335be04f210SWarner Losh if (start == mmap_next_start && addr >= TASK_UNMAPPED_BASE) {
336be04f210SWarner Losh mmap_next_start = addr + size;
337be04f210SWarner Losh }
338be04f210SWarner Losh return addr;
339be04f210SWarner Losh }
340be04f210SWarner Losh
341be04f210SWarner Losh /* The address is not properly aligned for the target. */
342be04f210SWarner Losh switch (repeat) {
343be04f210SWarner Losh case 0:
344be04f210SWarner Losh /*
345be04f210SWarner Losh * Assume the result that the kernel gave us is the
346be04f210SWarner Losh * first with enough free space, so start again at the
347be04f210SWarner Losh * next higher target page.
348be04f210SWarner Losh */
349be04f210SWarner Losh addr = TARGET_PAGE_ALIGN(addr);
350be04f210SWarner Losh break;
351be04f210SWarner Losh case 1:
352be04f210SWarner Losh /*
353be04f210SWarner Losh * Sometimes the kernel decides to perform the allocation
354be04f210SWarner Losh * at the top end of memory instead.
355be04f210SWarner Losh */
356be04f210SWarner Losh addr &= TARGET_PAGE_MASK;
357be04f210SWarner Losh break;
358be04f210SWarner Losh case 2:
359be04f210SWarner Losh /* Start over at low memory. */
360be04f210SWarner Losh addr = 0;
361be04f210SWarner Losh break;
362be04f210SWarner Losh default:
363be04f210SWarner Losh /* Fail. This unaligned block must the last. */
364be04f210SWarner Losh addr = -1;
365be04f210SWarner Losh break;
366be04f210SWarner Losh }
367be04f210SWarner Losh } else {
368be04f210SWarner Losh /*
369be04f210SWarner Losh * Since the result the kernel gave didn't fit, start
370be04f210SWarner Losh * again at low memory. If any repetition, fail.
371be04f210SWarner Losh */
372be04f210SWarner Losh addr = (repeat ? -1 : 0);
373be04f210SWarner Losh }
374be04f210SWarner Losh
375be04f210SWarner Losh /* Unmap and try again. */
376be04f210SWarner Losh munmap(ptr, size);
377be04f210SWarner Losh
378be04f210SWarner Losh /* ENOMEM if we checked the whole of the target address space. */
379be04f210SWarner Losh if (addr == (abi_ulong)-1) {
380be04f210SWarner Losh return (abi_ulong)-1;
381be04f210SWarner Losh } else if (addr == 0) {
382be04f210SWarner Losh if (wrapped) {
383be04f210SWarner Losh return (abi_ulong)-1;
384be04f210SWarner Losh }
385be04f210SWarner Losh wrapped = 1;
386be04f210SWarner Losh /*
387be04f210SWarner Losh * Don't actually use 0 when wrapping, instead indicate
388be04f210SWarner Losh * that we'd truly like an allocation in low memory.
389be04f210SWarner Losh */
390be04f210SWarner Losh addr = TARGET_PAGE_SIZE;
391be04f210SWarner Losh } else if (wrapped && addr >= start) {
392be04f210SWarner Losh return (abi_ulong)-1;
393be04f210SWarner Losh }
394be04f210SWarner Losh }
395be04f210SWarner Losh }
396be04f210SWarner Losh
/*
 * Find a free guest memory area of 'size' bytes, searching from 'start',
 * with no alignment request beyond the default.
 * Thin wrapper around mmap_find_vma_aligned(); see there for the contract.
 */
abi_ulong mmap_find_vma(abi_ulong start, abi_ulong size)
{
    const abi_ulong no_alignment = 0;

    return mmap_find_vma_aligned(start, size, no_alignment);
}
401be04f210SWarner Losh
40284778508Sblueswir1 /* NOTE: all the constants are the HOST ones */
target_mmap(abi_ulong start,abi_ulong len,int prot,int flags,int fd,off_t offset)40384778508Sblueswir1 abi_long target_mmap(abi_ulong start, abi_ulong len, int prot,
404be04f210SWarner Losh int flags, int fd, off_t offset)
40584778508Sblueswir1 {
40684778508Sblueswir1 abi_ulong ret, end, real_start, real_end, retaddr, host_offset, host_len;
40784778508Sblueswir1
40884778508Sblueswir1 mmap_lock();
40945b8765eSWarner Losh if (qemu_loglevel_mask(CPU_LOG_PAGE)) {
41045b8765eSWarner Losh qemu_log("mmap: start=0x" TARGET_ABI_FMT_lx
4116a3b9bfdSWarner Losh " len=0x" TARGET_ABI_FMT_lx " prot=%c%c%c flags=",
41284778508Sblueswir1 start, len,
41384778508Sblueswir1 prot & PROT_READ ? 'r' : '-',
41484778508Sblueswir1 prot & PROT_WRITE ? 'w' : '-',
41584778508Sblueswir1 prot & PROT_EXEC ? 'x' : '-');
4166a3b9bfdSWarner Losh if (flags & MAP_ALIGNMENT_MASK) {
41745b8765eSWarner Losh qemu_log("MAP_ALIGNED(%u) ",
41845b8765eSWarner Losh (flags & MAP_ALIGNMENT_MASK) >> MAP_ALIGNMENT_SHIFT);
41984778508Sblueswir1 }
4206a3b9bfdSWarner Losh if (flags & MAP_GUARD) {
42145b8765eSWarner Losh qemu_log("MAP_GUARD ");
4226a3b9bfdSWarner Losh }
4236a3b9bfdSWarner Losh if (flags & MAP_FIXED) {
42445b8765eSWarner Losh qemu_log("MAP_FIXED ");
4256a3b9bfdSWarner Losh }
426953b69ccSWarner Losh if (flags & MAP_ANON) {
42745b8765eSWarner Losh qemu_log("MAP_ANON ");
4286a3b9bfdSWarner Losh }
4296a3b9bfdSWarner Losh if (flags & MAP_EXCL) {
43045b8765eSWarner Losh qemu_log("MAP_EXCL ");
4316a3b9bfdSWarner Losh }
4326a3b9bfdSWarner Losh if (flags & MAP_PRIVATE) {
43345b8765eSWarner Losh qemu_log("MAP_PRIVATE ");
4346a3b9bfdSWarner Losh }
4356a3b9bfdSWarner Losh if (flags & MAP_SHARED) {
43645b8765eSWarner Losh qemu_log("MAP_SHARED ");
4376a3b9bfdSWarner Losh }
4386a3b9bfdSWarner Losh if (flags & MAP_NOCORE) {
43945b8765eSWarner Losh qemu_log("MAP_NOCORE ");
4406a3b9bfdSWarner Losh }
4416a3b9bfdSWarner Losh if (flags & MAP_STACK) {
44245b8765eSWarner Losh qemu_log("MAP_STACK ");
4436a3b9bfdSWarner Losh }
44445b8765eSWarner Losh qemu_log("fd=%d offset=0x%lx\n", fd, offset);
44584778508Sblueswir1 }
44684778508Sblueswir1
447953b69ccSWarner Losh if ((flags & MAP_ANON) && fd != -1) {
448be04f210SWarner Losh errno = EINVAL;
449be04f210SWarner Losh goto fail;
450be04f210SWarner Losh }
451be04f210SWarner Losh if (flags & MAP_STACK) {
452be04f210SWarner Losh if ((fd != -1) || ((prot & (PROT_READ | PROT_WRITE)) !=
453be04f210SWarner Losh (PROT_READ | PROT_WRITE))) {
454be04f210SWarner Losh errno = EINVAL;
455be04f210SWarner Losh goto fail;
456be04f210SWarner Losh }
457be04f210SWarner Losh }
458be04f210SWarner Losh if ((flags & MAP_GUARD) && (prot != PROT_NONE || fd != -1 ||
459be04f210SWarner Losh offset != 0 || (flags & (MAP_SHARED | MAP_PRIVATE |
460be04f210SWarner Losh /* MAP_PREFAULT | */ /* MAP_PREFAULT not in mman.h */
461be04f210SWarner Losh MAP_PREFAULT_READ | MAP_ANON | MAP_STACK)) != 0)) {
462be04f210SWarner Losh errno = EINVAL;
463be04f210SWarner Losh goto fail;
464be04f210SWarner Losh }
465be04f210SWarner Losh
46684778508Sblueswir1 if (offset & ~TARGET_PAGE_MASK) {
46784778508Sblueswir1 errno = EINVAL;
46884778508Sblueswir1 goto fail;
46984778508Sblueswir1 }
47084778508Sblueswir1
471be04f210SWarner Losh if (len == 0) {
472be04f210SWarner Losh errno = EINVAL;
473be04f210SWarner Losh goto fail;
474be04f210SWarner Losh }
47514837a3fSWarner Losh
47614837a3fSWarner Losh /* Check for overflows */
47714837a3fSWarner Losh len = TARGET_PAGE_ALIGN(len);
47814837a3fSWarner Losh if (len == 0) {
47914837a3fSWarner Losh errno = ENOMEM;
48014837a3fSWarner Losh goto fail;
48114837a3fSWarner Losh }
48214837a3fSWarner Losh
48384778508Sblueswir1 real_start = start & qemu_host_page_mask;
48484778508Sblueswir1 host_offset = offset & qemu_host_page_mask;
485be04f210SWarner Losh
486be04f210SWarner Losh /*
487be04f210SWarner Losh * If the user is asking for the kernel to find a location, do that
488be04f210SWarner Losh * before we truncate the length for mapping files below.
489be04f210SWarner Losh */
490be04f210SWarner Losh if (!(flags & MAP_FIXED)) {
49184778508Sblueswir1 host_len = len + offset - host_offset;
49284778508Sblueswir1 host_len = HOST_PAGE_ALIGN(host_len);
493be04f210SWarner Losh if ((flags & MAP_ALIGNMENT_MASK) != 0)
494be04f210SWarner Losh start = mmap_find_vma_aligned(real_start, host_len,
495be04f210SWarner Losh (flags & MAP_ALIGNMENT_MASK) >> MAP_ALIGNMENT_SHIFT);
496be04f210SWarner Losh else
497be04f210SWarner Losh start = mmap_find_vma(real_start, host_len);
498be04f210SWarner Losh if (start == (abi_ulong)-1) {
49984778508Sblueswir1 errno = ENOMEM;
50084778508Sblueswir1 goto fail;
50184778508Sblueswir1 }
502be04f210SWarner Losh }
503be04f210SWarner Losh
504be04f210SWarner Losh /*
505be04f210SWarner Losh * When mapping files into a memory area larger than the file, accesses
506be04f210SWarner Losh * to pages beyond the file size will cause a SIGBUS.
507be04f210SWarner Losh *
508be04f210SWarner Losh * For example, if mmaping a file of 100 bytes on a host with 4K pages
509be04f210SWarner Losh * emulating a target with 8K pages, the target expects to be able to
510be04f210SWarner Losh * access the first 8K. But the host will trap us on any access beyond
511be04f210SWarner Losh * 4K.
512be04f210SWarner Losh *
513be04f210SWarner Losh * When emulating a target with a larger page-size than the hosts, we
514be04f210SWarner Losh * may need to truncate file maps at EOF and add extra anonymous pages
515be04f210SWarner Losh * up to the targets page boundary.
516be04f210SWarner Losh */
517be04f210SWarner Losh
5188e3b0cbbSMarc-André Lureau if ((qemu_real_host_page_size() < qemu_host_page_size) && fd != -1) {
519be04f210SWarner Losh struct stat sb;
520be04f210SWarner Losh
521be04f210SWarner Losh if (fstat(fd, &sb) == -1) {
522be04f210SWarner Losh goto fail;
523be04f210SWarner Losh }
524be04f210SWarner Losh
525be04f210SWarner Losh /* Are we trying to create a map beyond EOF?. */
526be04f210SWarner Losh if (offset + len > sb.st_size) {
527be04f210SWarner Losh /*
528be04f210SWarner Losh * If so, truncate the file map at eof aligned with
529be04f210SWarner Losh * the hosts real pagesize. Additional anonymous maps
530be04f210SWarner Losh * will be created beyond EOF.
531be04f210SWarner Losh */
532be04f210SWarner Losh len = REAL_HOST_PAGE_ALIGN(sb.st_size - offset);
533be04f210SWarner Losh }
534be04f210SWarner Losh }
535be04f210SWarner Losh
536be04f210SWarner Losh if (!(flags & MAP_FIXED)) {
537be04f210SWarner Losh unsigned long host_start;
538be04f210SWarner Losh void *p;
539be04f210SWarner Losh
540be04f210SWarner Losh host_len = len + offset - host_offset;
541be04f210SWarner Losh host_len = HOST_PAGE_ALIGN(host_len);
542be04f210SWarner Losh
543be04f210SWarner Losh /*
544be04f210SWarner Losh * Note: we prefer to control the mapping address. It is
545be04f210SWarner Losh * especially important if qemu_host_page_size >
546be04f210SWarner Losh * qemu_real_host_page_size
547be04f210SWarner Losh */
548be04f210SWarner Losh p = mmap(g2h_untagged(start), host_len, prot,
549953b69ccSWarner Losh flags | MAP_FIXED | ((fd != -1) ? MAP_ANON : 0), -1, 0);
55084778508Sblueswir1 if (p == MAP_FAILED)
55184778508Sblueswir1 goto fail;
55284778508Sblueswir1 /* update start so that it points to the file position at 'offset' */
55384778508Sblueswir1 host_start = (unsigned long)p;
554be04f210SWarner Losh if (fd != -1) {
555be04f210SWarner Losh p = mmap(g2h_untagged(start), len, prot,
556be04f210SWarner Losh flags | MAP_FIXED, fd, host_offset);
557be04f210SWarner Losh if (p == MAP_FAILED) {
558be04f210SWarner Losh munmap(g2h_untagged(start), host_len);
559be04f210SWarner Losh goto fail;
560be04f210SWarner Losh }
56184778508Sblueswir1 host_start += offset - host_offset;
562be04f210SWarner Losh }
56384778508Sblueswir1 start = h2g(host_start);
56484778508Sblueswir1 } else {
56584778508Sblueswir1 if (start & ~TARGET_PAGE_MASK) {
56684778508Sblueswir1 errno = EINVAL;
56784778508Sblueswir1 goto fail;
56884778508Sblueswir1 }
56984778508Sblueswir1 end = start + len;
57084778508Sblueswir1 real_end = HOST_PAGE_ALIGN(end);
57184778508Sblueswir1
572be04f210SWarner Losh /*
573be04f210SWarner Losh * Test if requested memory area fits target address space
574be04f210SWarner Losh * It can fail only on 64-bit host with 32-bit target.
575be04f210SWarner Losh * On any other target/host host mmap() handles this error correctly.
576be04f210SWarner Losh */
5770fc76b68SKyle Evans if (!guest_range_valid_untagged(start, len)) {
578be04f210SWarner Losh errno = EINVAL;
57984778508Sblueswir1 goto fail;
58084778508Sblueswir1 }
58184778508Sblueswir1
582be04f210SWarner Losh /*
583be04f210SWarner Losh * worst case: we cannot map the file because the offset is not
584be04f210SWarner Losh * aligned, so we read it
585be04f210SWarner Losh */
586a6b2d060SWarner Losh if (fd != -1 &&
58784778508Sblueswir1 (offset & ~qemu_host_page_mask) != (start & ~qemu_host_page_mask)) {
588be04f210SWarner Losh /*
589be04f210SWarner Losh * msync() won't work here, so we return an error if write is
590be04f210SWarner Losh * possible while it is a shared mapping
591be04f210SWarner Losh */
5926c173b3cSblueswir1 if ((flags & TARGET_BSD_MAP_FLAGMASK) == MAP_SHARED &&
59384778508Sblueswir1 (prot & PROT_WRITE)) {
59484778508Sblueswir1 errno = EINVAL;
59584778508Sblueswir1 goto fail;
59684778508Sblueswir1 }
59784778508Sblueswir1 retaddr = target_mmap(start, len, prot | PROT_WRITE,
59884778508Sblueswir1 MAP_FIXED | MAP_PRIVATE | MAP_ANON,
59984778508Sblueswir1 -1, 0);
60084778508Sblueswir1 if (retaddr == -1)
60184778508Sblueswir1 goto fail;
602*5b73b248SRichard Henderson if (!mmap_pread(fd, g2h_untagged(start), len, offset, false)) {
60326778ac3SMikaël Urankar goto fail;
60426778ac3SMikaël Urankar }
60584778508Sblueswir1 if (!(prot & PROT_WRITE)) {
60684778508Sblueswir1 ret = target_mprotect(start, len, prot);
60791a5addaSWarner Losh assert(ret == 0);
60884778508Sblueswir1 }
60984778508Sblueswir1 goto the_end;
61084778508Sblueswir1 }
61184778508Sblueswir1
6120fc76b68SKyle Evans /* Reject the mapping if any page within the range is mapped */
6139c255cb5SRichard Henderson if ((flags & MAP_EXCL) && !page_check_range_empty(start, end - 1)) {
6140fc76b68SKyle Evans errno = EINVAL;
6150fc76b68SKyle Evans goto fail;
6160fc76b68SKyle Evans }
6170fc76b68SKyle Evans
61884778508Sblueswir1 /* handle the start of the mapping */
61984778508Sblueswir1 if (start > real_start) {
62084778508Sblueswir1 if (real_end == real_start + qemu_host_page_size) {
62184778508Sblueswir1 /* one single host page */
62284778508Sblueswir1 ret = mmap_frag(real_start, start, end,
62384778508Sblueswir1 prot, flags, fd, offset);
62484778508Sblueswir1 if (ret == -1)
62584778508Sblueswir1 goto fail;
62684778508Sblueswir1 goto the_end1;
62784778508Sblueswir1 }
62884778508Sblueswir1 ret = mmap_frag(real_start, start, real_start + qemu_host_page_size,
62984778508Sblueswir1 prot, flags, fd, offset);
63084778508Sblueswir1 if (ret == -1)
63184778508Sblueswir1 goto fail;
63284778508Sblueswir1 real_start += qemu_host_page_size;
63384778508Sblueswir1 }
63484778508Sblueswir1 /* handle the end of the mapping */
63584778508Sblueswir1 if (end < real_end) {
63684778508Sblueswir1 ret = mmap_frag(real_end - qemu_host_page_size,
637be04f210SWarner Losh real_end - qemu_host_page_size, end,
63884778508Sblueswir1 prot, flags, fd,
63984778508Sblueswir1 offset + real_end - qemu_host_page_size - start);
64084778508Sblueswir1 if (ret == -1)
64184778508Sblueswir1 goto fail;
64284778508Sblueswir1 real_end -= qemu_host_page_size;
64384778508Sblueswir1 }
64484778508Sblueswir1
64584778508Sblueswir1 /* map the middle (easier) */
64684778508Sblueswir1 if (real_start < real_end) {
64784778508Sblueswir1 void *p;
64884778508Sblueswir1 unsigned long offset1;
64984778508Sblueswir1 if (flags & MAP_ANON)
65084778508Sblueswir1 offset1 = 0;
65184778508Sblueswir1 else
65284778508Sblueswir1 offset1 = offset + real_start - start;
6533e8f1628SRichard Henderson p = mmap(g2h_untagged(real_start), real_end - real_start,
65484778508Sblueswir1 prot, flags, fd, offset1);
65584778508Sblueswir1 if (p == MAP_FAILED)
65684778508Sblueswir1 goto fail;
65784778508Sblueswir1 }
65884778508Sblueswir1 }
65984778508Sblueswir1 the_end1:
66049840a4aSRichard Henderson page_set_flags(start, start + len - 1, prot | PAGE_VALID);
66184778508Sblueswir1 the_end:
66284778508Sblueswir1 #ifdef DEBUG_MMAP
6636a3b9bfdSWarner Losh printf("ret=0x" TARGET_ABI_FMT_lx "\n", start);
66484778508Sblueswir1 page_dump(stdout);
66584778508Sblueswir1 printf("\n");
66684778508Sblueswir1 #endif
66784778508Sblueswir1 mmap_unlock();
66884778508Sblueswir1 return start;
66984778508Sblueswir1 fail:
67084778508Sblueswir1 mmap_unlock();
67184778508Sblueswir1 return -1;
67284778508Sblueswir1 }
67384778508Sblueswir1
/*
 * Re-cover the guest range [start, start + size) with an inaccessible
 * (PROT_NONE) private anonymous host mapping placed with MAP_FIXED.
 *
 * Only whole host pages are remapped.  A partially covered host page at
 * either edge of the range is left alone when any target page in it that
 * lies outside the range still has non-zero flags according to
 * page_get_flags().
 *
 * The result of the host mmap() call is not checked.
 */
void mmap_reserve(abi_ulong start, abi_ulong size)
{
    abi_ulong host_start = start & qemu_host_page_mask;
    abi_ulong host_end = HOST_PAGE_ALIGN(start + size);
    abi_ulong guest_end = start + size;
    abi_ulong page;

    if (host_start < start) {
        /* First host page is shared: collect flags of the pages before us. */
        int head_flags = 0;

        page = host_start;
        while (page < start) {
            head_flags |= page_get_flags(page);
            page += TARGET_PAGE_SIZE;
        }
        if (host_end == host_start + qemu_host_page_size) {
            /*
             * The whole range lives in one host page, so the pages after
             * the range count as well; the tail check below is then
             * skipped because guest_end is moved up to host_end.
             */
            page = guest_end;
            while (page < host_end) {
                head_flags |= page_get_flags(page);
                page += TARGET_PAGE_SIZE;
            }
            guest_end = host_end;
        }
        if (head_flags) {
            /* Something else still uses this host page: keep it. */
            host_start += qemu_host_page_size;
        }
    }

    if (guest_end < host_end) {
        /* Last host page is shared: collect flags of the pages after us. */
        int tail_flags = 0;

        page = guest_end;
        while (page < host_end) {
            tail_flags |= page_get_flags(page);
            page += TARGET_PAGE_SIZE;
        }
        if (tail_flags) {
            host_end -= qemu_host_page_size;
        }
    }

    if (host_end != host_start) {
        mmap(g2h_untagged(host_start), host_end - host_start, PROT_NONE,
             MAP_FIXED | MAP_ANON | MAP_PRIVATE, -1, 0);
    }
}
715be04f210SWarner Losh
/*
 * Unmap the guest range [start, start + len).
 *
 * start must be aligned to the target page size; len is rounded up to a
 * multiple of the target page size.  Only whole host pages are released:
 * a host page at either edge of the range is kept when any target page in
 * it that lies outside the range still has non-zero flags according to
 * page_get_flags().  When reserved_va is set the host pages are handed to
 * mmap_reserve() instead of being passed to munmap().
 *
 * Returns -EINVAL if start is misaligned, if the rounded length is zero,
 * or if the range wraps around the guest address space.  Otherwise
 * returns 0, or the return value of the host munmap() call when that
 * call is made.  The page flags of the range are cleared only when the
 * result is 0.
 */
int target_munmap(abi_ulong start, abi_ulong len)
{
    abi_ulong end, last, real_start, real_end, addr;
    int prot, ret;

#ifdef DEBUG_MMAP
    printf("munmap: start=0x" TARGET_ABI_FMT_lx " len=0x"
           TARGET_ABI_FMT_lx "\n",
           start, len);
#endif
    if (start & ~TARGET_PAGE_MASK) {
        return -EINVAL;
    }
    len = TARGET_PAGE_ALIGN(len);
    if (len == 0) {
        return -EINVAL;
    }
    /*
     * Reject a range whose last byte wraps below start, in the same way
     * target_msync() rejects end < start.  Without this check nothing
     * would be unmapped on the host, yet the page-flag update below would
     * still run with last < start and the call would report success.
     * A range that ends exactly at the top of the address space
     * (start + len == 0) does not trip this check and is handled as
     * before.
     */
    last = start + len - 1;
    if (last < start) {
        return -EINVAL;
    }

    mmap_lock();
    end = start + len;
    real_start = start & qemu_host_page_mask;
    real_end = HOST_PAGE_ALIGN(end);

    if (start > real_start) {
        /* handle host page containing start */
        prot = 0;
        for (addr = real_start; addr < start; addr += TARGET_PAGE_SIZE) {
            prot |= page_get_flags(addr);
        }
        if (real_end == real_start + qemu_host_page_size) {
            /*
             * The range sits inside a single host page: the target pages
             * after it count too, and moving end up to real_end skips the
             * separate tail check below.
             */
            for (addr = end; addr < real_end; addr += TARGET_PAGE_SIZE) {
                prot |= page_get_flags(addr);
            }
            end = real_end;
        }
        if (prot != 0) {
            /* host page still in use by other target pages: keep it */
            real_start += qemu_host_page_size;
        }
    }
    if (end < real_end) {
        /* handle host page containing end */
        prot = 0;
        for (addr = end; addr < real_end; addr += TARGET_PAGE_SIZE) {
            prot |= page_get_flags(addr);
        }
        if (prot != 0) {
            real_end -= qemu_host_page_size;
        }
    }

    ret = 0;
    /* unmap what we can */
    if (real_start < real_end) {
        if (reserved_va) {
            mmap_reserve(real_start, real_end - real_start);
        } else {
            ret = munmap(g2h_untagged(real_start), real_end - real_start);
        }
    }

    if (ret == 0) {
        page_set_flags(start, last, 0);
    }
    mmap_unlock();
    return ret;
}
77684778508Sblueswir1
/*
 * Synchronise the guest range [start, start + len) with its backing store
 * by calling the host msync() with the given flags.
 *
 * start must be aligned to the target page size; len is rounded up to a
 * multiple of the target page size.  The start address is rounded down to
 * a host page boundary before being handed to msync().
 *
 * Returns -EINVAL if start is misaligned or the range wraps around,
 * 0 without calling the host if the rounded length is zero, and otherwise
 * the return value of msync().
 */
int target_msync(abi_ulong start, abi_ulong len, int flags)
{
    abi_ulong limit;
    abi_ulong host_start;

    if ((start & ~TARGET_PAGE_MASK) != 0) {
        return -EINVAL;
    }

    len = TARGET_PAGE_ALIGN(len);
    limit = start + len;
    if (limit < start) {
        /* address arithmetic wrapped */
        return -EINVAL;
    }
    if (limit == start) {
        /* empty range: nothing to sync */
        return 0;
    }

    host_start = start & qemu_host_page_mask;
    return msync(g2h_untagged(host_start), limit - host_start, flags);
}
793