184778508Sblueswir1 /* 284778508Sblueswir1 * mmap support for qemu 384778508Sblueswir1 * 484778508Sblueswir1 * Copyright (c) 2003 - 2008 Fabrice Bellard 584778508Sblueswir1 * 684778508Sblueswir1 * This program is free software; you can redistribute it and/or modify 784778508Sblueswir1 * it under the terms of the GNU General Public License as published by 884778508Sblueswir1 * the Free Software Foundation; either version 2 of the License, or 984778508Sblueswir1 * (at your option) any later version. 1084778508Sblueswir1 * 1184778508Sblueswir1 * This program is distributed in the hope that it will be useful, 1284778508Sblueswir1 * but WITHOUT ANY WARRANTY; without even the implied warranty of 1384778508Sblueswir1 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the 1484778508Sblueswir1 * GNU General Public License for more details. 1584778508Sblueswir1 * 1684778508Sblueswir1 * You should have received a copy of the GNU General Public License 178167ee88SBlue Swirl * along with this program; if not, see <http://www.gnu.org/licenses/>. 1884778508Sblueswir1 */ 192231197cSPeter Maydell #include "qemu/osdep.h" 2074781c08SPhilippe Mathieu-Daudé #include "exec/page-protection.h" 2184778508Sblueswir1 2284778508Sblueswir1 #include "qemu.h" 2384778508Sblueswir1 2495992b67SAlex Bennée static pthread_mutex_t mmap_mutex = PTHREAD_MUTEX_INITIALIZER; 2506943a62SPeter Maydell static __thread int mmap_lock_count; 2684778508Sblueswir1 2784778508Sblueswir1 void mmap_lock(void) 2884778508Sblueswir1 { 2984778508Sblueswir1 if (mmap_lock_count++ == 0) { 3084778508Sblueswir1 pthread_mutex_lock(&mmap_mutex); 3184778508Sblueswir1 } 3284778508Sblueswir1 } 3384778508Sblueswir1 3484778508Sblueswir1 void mmap_unlock(void) 3584778508Sblueswir1 { 36990ef918SRichard Henderson assert(mmap_lock_count > 0); 3784778508Sblueswir1 if (--mmap_lock_count == 0) { 3884778508Sblueswir1 pthread_mutex_unlock(&mmap_mutex); 3984778508Sblueswir1 } 4084778508Sblueswir1 } 4184778508Sblueswir1 42301e40edSAlex Bennée bool have_mmap_lock(void) 43301e40edSAlex Bennée { 44301e40edSAlex Bennée return mmap_lock_count > 0 ? true : false; 45301e40edSAlex Bennée } 46301e40edSAlex Bennée 4784778508Sblueswir1 /* Grab lock to make sure things are in a consistent state after fork(). */ 4884778508Sblueswir1 void mmap_fork_start(void) 4984778508Sblueswir1 { 5084778508Sblueswir1 if (mmap_lock_count) 5184778508Sblueswir1 abort(); 5284778508Sblueswir1 pthread_mutex_lock(&mmap_mutex); 5384778508Sblueswir1 } 5484778508Sblueswir1 5584778508Sblueswir1 void mmap_fork_end(int child) 5684778508Sblueswir1 { 5784778508Sblueswir1 if (child) 5884778508Sblueswir1 pthread_mutex_init(&mmap_mutex, NULL); 5984778508Sblueswir1 else 6084778508Sblueswir1 pthread_mutex_unlock(&mmap_mutex); 6184778508Sblueswir1 } 6284778508Sblueswir1 6384778508Sblueswir1 /* NOTE: all the constants are the HOST ones, but addresses are target. */ 6484778508Sblueswir1 int target_mprotect(abi_ulong start, abi_ulong len, int prot) 6584778508Sblueswir1 { 6684778508Sblueswir1 abi_ulong end, host_start, host_end, addr; 6784778508Sblueswir1 int prot1, ret; 6884778508Sblueswir1 6945b8765eSWarner Losh qemu_log_mask(CPU_LOG_PAGE, "mprotect: start=0x" TARGET_ABI_FMT_lx 706a3b9bfdSWarner Losh " len=0x" TARGET_ABI_FMT_lx " prot=%c%c%c\n", start, len, 7184778508Sblueswir1 prot & PROT_READ ? 'r' : '-', 7284778508Sblueswir1 prot & PROT_WRITE ? 'w' : '-', 7384778508Sblueswir1 prot & PROT_EXEC ? 'x' : '-'); 7484778508Sblueswir1 if ((start & ~TARGET_PAGE_MASK) != 0) 7584778508Sblueswir1 return -EINVAL; 7684778508Sblueswir1 len = TARGET_PAGE_ALIGN(len); 7784778508Sblueswir1 end = start + len; 7884778508Sblueswir1 if (end < start) 7984778508Sblueswir1 return -EINVAL; 8084778508Sblueswir1 prot &= PROT_READ | PROT_WRITE | PROT_EXEC; 8184778508Sblueswir1 if (len == 0) 8284778508Sblueswir1 return 0; 8384778508Sblueswir1 8484778508Sblueswir1 mmap_lock(); 8584778508Sblueswir1 host_start = start & qemu_host_page_mask; 8684778508Sblueswir1 host_end = HOST_PAGE_ALIGN(end); 8784778508Sblueswir1 if (start > host_start) { 8884778508Sblueswir1 /* handle host page containing start */ 8984778508Sblueswir1 prot1 = prot; 9084778508Sblueswir1 for (addr = host_start; addr < start; addr += TARGET_PAGE_SIZE) { 9184778508Sblueswir1 prot1 |= page_get_flags(addr); 9284778508Sblueswir1 } 9384778508Sblueswir1 if (host_end == host_start + qemu_host_page_size) { 9484778508Sblueswir1 for (addr = end; addr < host_end; addr += TARGET_PAGE_SIZE) { 9584778508Sblueswir1 prot1 |= page_get_flags(addr); 9684778508Sblueswir1 } 9784778508Sblueswir1 end = host_end; 9884778508Sblueswir1 } 993e8f1628SRichard Henderson ret = mprotect(g2h_untagged(host_start), 10086b7c551SBALATON Zoltan qemu_host_page_size, prot1 & PAGE_RWX); 10184778508Sblueswir1 if (ret != 0) 10284778508Sblueswir1 goto error; 10384778508Sblueswir1 host_start += qemu_host_page_size; 10484778508Sblueswir1 } 10584778508Sblueswir1 if (end < host_end) { 10684778508Sblueswir1 prot1 = prot; 10784778508Sblueswir1 for (addr = end; addr < host_end; addr += TARGET_PAGE_SIZE) { 10884778508Sblueswir1 prot1 |= page_get_flags(addr); 10984778508Sblueswir1 } 1103e8f1628SRichard Henderson ret = mprotect(g2h_untagged(host_end - qemu_host_page_size), 11186b7c551SBALATON Zoltan qemu_host_page_size, prot1 & PAGE_RWX); 11284778508Sblueswir1 if (ret != 0) 11384778508Sblueswir1 goto error; 11484778508Sblueswir1 host_end -= qemu_host_page_size; 11584778508Sblueswir1 } 11684778508Sblueswir1 11784778508Sblueswir1 /* handle the pages in the middle */ 11884778508Sblueswir1 if (host_start < host_end) { 1193e8f1628SRichard Henderson ret = mprotect(g2h_untagged(host_start), host_end - host_start, prot); 12084778508Sblueswir1 if (ret != 0) 12184778508Sblueswir1 goto error; 12284778508Sblueswir1 } 12349840a4aSRichard Henderson page_set_flags(start, start + len - 1, prot | PAGE_VALID); 12484778508Sblueswir1 mmap_unlock(); 12584778508Sblueswir1 return 0; 12684778508Sblueswir1 error: 12784778508Sblueswir1 mmap_unlock(); 12884778508Sblueswir1 return ret; 12984778508Sblueswir1 } 13084778508Sblueswir1 131a6b2d060SWarner Losh /* 132*5b73b248SRichard Henderson * Perform a pread on behalf of target_mmap. We can reach EOF, we can be 133*5b73b248SRichard Henderson * interrupted by signals, and in general there's no good error return path. 134*5b73b248SRichard Henderson * If @zero, zero the rest of the block at EOF. 135*5b73b248SRichard Henderson * Return true on success. 136*5b73b248SRichard Henderson */ 137*5b73b248SRichard Henderson static bool mmap_pread(int fd, void *p, size_t len, off_t offset, bool zero) 138*5b73b248SRichard Henderson { 139*5b73b248SRichard Henderson while (1) { 140*5b73b248SRichard Henderson ssize_t r = pread(fd, p, len, offset); 141*5b73b248SRichard Henderson 142*5b73b248SRichard Henderson if (likely(r == len)) { 143*5b73b248SRichard Henderson /* Complete */ 144*5b73b248SRichard Henderson return true; 145*5b73b248SRichard Henderson } 146*5b73b248SRichard Henderson if (r == 0) { 147*5b73b248SRichard Henderson /* EOF */ 148*5b73b248SRichard Henderson if (zero) { 149*5b73b248SRichard Henderson memset(p, 0, len); 150*5b73b248SRichard Henderson } 151*5b73b248SRichard Henderson return true; 152*5b73b248SRichard Henderson } 153*5b73b248SRichard Henderson if (r > 0) { 154*5b73b248SRichard Henderson /* Short read */ 155*5b73b248SRichard Henderson p += r; 156*5b73b248SRichard Henderson len -= r; 157*5b73b248SRichard Henderson offset += r; 158*5b73b248SRichard Henderson } else if (errno != EINTR) { 159*5b73b248SRichard Henderson /* Error */ 160*5b73b248SRichard Henderson return false; 161*5b73b248SRichard Henderson } 162*5b73b248SRichard Henderson } 163*5b73b248SRichard Henderson } 164*5b73b248SRichard Henderson 165*5b73b248SRichard Henderson /* 166a6b2d060SWarner Losh * map an incomplete host page 167a6b2d060SWarner Losh * 168a6b2d060SWarner Losh * mmap_frag can be called with a valid fd, if flags doesn't contain one of 169a6b2d060SWarner Losh * MAP_ANON, MAP_STACK, MAP_GUARD. If we need to map a page in those cases, we 170a6b2d060SWarner Losh * pass fd == -1. However, if flags contains MAP_GUARD then MAP_ANON cannot be 171a6b2d060SWarner Losh * added. 172a6b2d060SWarner Losh * 173a6b2d060SWarner Losh * * If fd is valid (not -1) we want to map the pages with MAP_ANON. 174a6b2d060SWarner Losh * * If flags contains MAP_GUARD we don't want to add MAP_ANON because it 175a6b2d060SWarner Losh * will be rejected. See kern_mmap's enforcing of constraints for MAP_GUARD 176a6b2d060SWarner Losh * in sys/vm/vm_mmap.c. 177a6b2d060SWarner Losh * * If flags contains MAP_ANON it doesn't matter if we add it or not. 178a6b2d060SWarner Losh * * If flags contains MAP_STACK, mmap adds MAP_ANON when called so doesn't 179a6b2d060SWarner Losh * matter if we add it or not either. See enforcing of constraints for 180a6b2d060SWarner Losh * MAP_STACK in kern_mmap. 181a6b2d060SWarner Losh * 182a6b2d060SWarner Losh * Don't add MAP_ANON for the flags that use fd == -1 without specifying the 183a6b2d060SWarner Losh * flags directly, with the assumption that future flags that require fd == -1 184a6b2d060SWarner Losh * will also not require MAP_ANON. 185a6b2d060SWarner Losh */ 18684778508Sblueswir1 static int mmap_frag(abi_ulong real_start, 18784778508Sblueswir1 abi_ulong start, abi_ulong end, 18884778508Sblueswir1 int prot, int flags, int fd, abi_ulong offset) 18984778508Sblueswir1 { 19084778508Sblueswir1 abi_ulong real_end, addr; 19184778508Sblueswir1 void *host_start; 19284778508Sblueswir1 int prot1, prot_new; 19384778508Sblueswir1 19484778508Sblueswir1 real_end = real_start + qemu_host_page_size; 1953e8f1628SRichard Henderson host_start = g2h_untagged(real_start); 19684778508Sblueswir1 19784778508Sblueswir1 /* get the protection of the target pages outside the mapping */ 19884778508Sblueswir1 prot1 = 0; 19984778508Sblueswir1 for (addr = real_start; addr < real_end; addr++) { 20084778508Sblueswir1 if (addr < start || addr >= end) 20184778508Sblueswir1 prot1 |= page_get_flags(addr); 20284778508Sblueswir1 } 20384778508Sblueswir1 20484778508Sblueswir1 if (prot1 == 0) { 205a6b2d060SWarner Losh /* no page was there, so we allocate one. See also above. */ 20684778508Sblueswir1 void *p = mmap(host_start, qemu_host_page_size, prot, 207a6b2d060SWarner Losh flags | ((fd != -1) ? MAP_ANON : 0), -1, 0); 20884778508Sblueswir1 if (p == MAP_FAILED) 20984778508Sblueswir1 return -1; 21084778508Sblueswir1 prot1 = prot; 21184778508Sblueswir1 } 21286b7c551SBALATON Zoltan prot1 &= PAGE_RWX; 21384778508Sblueswir1 21484778508Sblueswir1 prot_new = prot | prot1; 215a6b2d060SWarner Losh if (fd != -1) { 21684778508Sblueswir1 /* msync() won't work here, so we return an error if write is 21784778508Sblueswir1 possible while it is a shared mapping */ 2186c173b3cSblueswir1 if ((flags & TARGET_BSD_MAP_FLAGMASK) == MAP_SHARED && 21984778508Sblueswir1 (prot & PROT_WRITE)) 220059bca46SBlue Swirl return -1; 22184778508Sblueswir1 22284778508Sblueswir1 /* adjust protection to be able to read */ 22384778508Sblueswir1 if (!(prot1 & PROT_WRITE)) 22484778508Sblueswir1 mprotect(host_start, qemu_host_page_size, prot1 | PROT_WRITE); 22584778508Sblueswir1 22684778508Sblueswir1 /* read the corresponding file data */ 227*5b73b248SRichard Henderson if (!mmap_pread(fd, g2h_untagged(start), end - start, offset, true)) { 22826778ac3SMikaël Urankar return -1; 22926778ac3SMikaël Urankar } 23084778508Sblueswir1 23184778508Sblueswir1 /* put final protection */ 23284778508Sblueswir1 if (prot_new != (prot1 | PROT_WRITE)) 23384778508Sblueswir1 mprotect(host_start, qemu_host_page_size, prot_new); 23484778508Sblueswir1 } else { 23584778508Sblueswir1 if (prot_new != prot1) { 23684778508Sblueswir1 mprotect(host_start, qemu_host_page_size, prot_new); 23784778508Sblueswir1 } 238948516a3SMikaël Urankar if (prot_new & PROT_WRITE) { 239948516a3SMikaël Urankar memset(g2h_untagged(start), 0, end - start); 240948516a3SMikaël Urankar } 24184778508Sblueswir1 } 24284778508Sblueswir1 return 0; 24384778508Sblueswir1 } 24484778508Sblueswir1 245be04f210SWarner Losh #if HOST_LONG_BITS == 64 && TARGET_ABI_BITS == 64 246be04f210SWarner Losh # define TASK_UNMAPPED_BASE (1ul << 38) 247be04f210SWarner Losh #else 248be04f210SWarner Losh # define TASK_UNMAPPED_BASE 0x40000000 249be04f210SWarner Losh #endif 250be04f210SWarner Losh abi_ulong mmap_next_start = TASK_UNMAPPED_BASE; 25184778508Sblueswir1 252be04f210SWarner Losh /* 253be04f210SWarner Losh * Subroutine of mmap_find_vma, used when we have pre-allocated a chunk of guest 254be04f210SWarner Losh * address space. 25584778508Sblueswir1 */ 256be04f210SWarner Losh static abi_ulong mmap_find_vma_reserved(abi_ulong start, abi_ulong size, 257be04f210SWarner Losh abi_ulong alignment) 25884778508Sblueswir1 { 259f12294b5SRichard Henderson abi_ulong ret; 26084778508Sblueswir1 261f12294b5SRichard Henderson ret = page_find_range_empty(start, reserved_va, size, alignment); 262f12294b5SRichard Henderson if (ret == -1 && start > TARGET_PAGE_SIZE) { 263f12294b5SRichard Henderson /* Restart at the beginning of the address space. */ 264f12294b5SRichard Henderson ret = page_find_range_empty(TARGET_PAGE_SIZE, start - 1, 265f12294b5SRichard Henderson size, alignment); 26684778508Sblueswir1 } 267be04f210SWarner Losh 268f12294b5SRichard Henderson return ret; 26984778508Sblueswir1 } 27084778508Sblueswir1 271be04f210SWarner Losh /* 272be04f210SWarner Losh * Find and reserve a free memory area of size 'size'. The search 273be04f210SWarner Losh * starts at 'start'. 274be04f210SWarner Losh * It must be called with mmap_lock() held. 275be04f210SWarner Losh * Return -1 if error. 276be04f210SWarner Losh */ 277be04f210SWarner Losh static abi_ulong mmap_find_vma_aligned(abi_ulong start, abi_ulong size, 278be04f210SWarner Losh abi_ulong alignment) 279be04f210SWarner Losh { 280be04f210SWarner Losh void *ptr, *prev; 281be04f210SWarner Losh abi_ulong addr; 282be04f210SWarner Losh int flags; 283be04f210SWarner Losh int wrapped, repeat; 284be04f210SWarner Losh 285be04f210SWarner Losh /* If 'start' == 0, then a default start address is used. */ 286be04f210SWarner Losh if (start == 0) { 287be04f210SWarner Losh start = mmap_next_start; 288be04f210SWarner Losh } else { 289be04f210SWarner Losh start &= qemu_host_page_mask; 290be04f210SWarner Losh } 291be04f210SWarner Losh 292be04f210SWarner Losh size = HOST_PAGE_ALIGN(size); 293be04f210SWarner Losh 294be04f210SWarner Losh if (reserved_va) { 295be04f210SWarner Losh return mmap_find_vma_reserved(start, size, 2960f2f3247SWarner Losh (alignment != 0 ? 1 << alignment : 2970f2f3247SWarner Losh MAX(qemu_host_page_size, TARGET_PAGE_SIZE))); 298be04f210SWarner Losh } 299be04f210SWarner Losh 300be04f210SWarner Losh addr = start; 301be04f210SWarner Losh wrapped = repeat = 0; 302be04f210SWarner Losh prev = 0; 303953b69ccSWarner Losh flags = MAP_ANON | MAP_PRIVATE; 304be04f210SWarner Losh if (alignment != 0) { 305be04f210SWarner Losh flags |= MAP_ALIGNED(alignment); 306be04f210SWarner Losh } 307be04f210SWarner Losh 308be04f210SWarner Losh for (;; prev = ptr) { 309be04f210SWarner Losh /* 310be04f210SWarner Losh * Reserve needed memory area to avoid a race. 311be04f210SWarner Losh * It should be discarded using: 312be04f210SWarner Losh * - mmap() with MAP_FIXED flag 313be04f210SWarner Losh * - mremap() with MREMAP_FIXED flag 314be04f210SWarner Losh * - shmat() with SHM_REMAP flag 315be04f210SWarner Losh */ 316be04f210SWarner Losh ptr = mmap(g2h_untagged(addr), size, PROT_NONE, 317be04f210SWarner Losh flags, -1, 0); 318be04f210SWarner Losh 319be04f210SWarner Losh /* ENOMEM, if host address space has no memory */ 320be04f210SWarner Losh if (ptr == MAP_FAILED) { 321be04f210SWarner Losh return (abi_ulong)-1; 322be04f210SWarner Losh } 323be04f210SWarner Losh 324be04f210SWarner Losh /* 325be04f210SWarner Losh * Count the number of sequential returns of the same address. 326be04f210SWarner Losh * This is used to modify the search algorithm below. 327be04f210SWarner Losh */ 328be04f210SWarner Losh repeat = (ptr == prev ? repeat + 1 : 0); 329be04f210SWarner Losh 330be04f210SWarner Losh if (h2g_valid(ptr + size - 1)) { 331be04f210SWarner Losh addr = h2g(ptr); 332be04f210SWarner Losh 333be04f210SWarner Losh if ((addr & ~TARGET_PAGE_MASK) == 0) { 334be04f210SWarner Losh /* Success. */ 335be04f210SWarner Losh if (start == mmap_next_start && addr >= TASK_UNMAPPED_BASE) { 336be04f210SWarner Losh mmap_next_start = addr + size; 337be04f210SWarner Losh } 338be04f210SWarner Losh return addr; 339be04f210SWarner Losh } 340be04f210SWarner Losh 341be04f210SWarner Losh /* The address is not properly aligned for the target. */ 342be04f210SWarner Losh switch (repeat) { 343be04f210SWarner Losh case 0: 344be04f210SWarner Losh /* 345be04f210SWarner Losh * Assume the result that the kernel gave us is the 346be04f210SWarner Losh * first with enough free space, so start again at the 347be04f210SWarner Losh * next higher target page. 348be04f210SWarner Losh */ 349be04f210SWarner Losh addr = TARGET_PAGE_ALIGN(addr); 350be04f210SWarner Losh break; 351be04f210SWarner Losh case 1: 352be04f210SWarner Losh /* 353be04f210SWarner Losh * Sometimes the kernel decides to perform the allocation 354be04f210SWarner Losh * at the top end of memory instead. 355be04f210SWarner Losh */ 356be04f210SWarner Losh addr &= TARGET_PAGE_MASK; 357be04f210SWarner Losh break; 358be04f210SWarner Losh case 2: 359be04f210SWarner Losh /* Start over at low memory. */ 360be04f210SWarner Losh addr = 0; 361be04f210SWarner Losh break; 362be04f210SWarner Losh default: 363be04f210SWarner Losh /* Fail. This unaligned block must the last. */ 364be04f210SWarner Losh addr = -1; 365be04f210SWarner Losh break; 366be04f210SWarner Losh } 367be04f210SWarner Losh } else { 368be04f210SWarner Losh /* 369be04f210SWarner Losh * Since the result the kernel gave didn't fit, start 370be04f210SWarner Losh * again at low memory. If any repetition, fail. 371be04f210SWarner Losh */ 372be04f210SWarner Losh addr = (repeat ? -1 : 0); 373be04f210SWarner Losh } 374be04f210SWarner Losh 375be04f210SWarner Losh /* Unmap and try again. */ 376be04f210SWarner Losh munmap(ptr, size); 377be04f210SWarner Losh 378be04f210SWarner Losh /* ENOMEM if we checked the whole of the target address space. */ 379be04f210SWarner Losh if (addr == (abi_ulong)-1) { 380be04f210SWarner Losh return (abi_ulong)-1; 381be04f210SWarner Losh } else if (addr == 0) { 382be04f210SWarner Losh if (wrapped) { 383be04f210SWarner Losh return (abi_ulong)-1; 384be04f210SWarner Losh } 385be04f210SWarner Losh wrapped = 1; 386be04f210SWarner Losh /* 387be04f210SWarner Losh * Don't actually use 0 when wrapping, instead indicate 388be04f210SWarner Losh * that we'd truly like an allocation in low memory. 389be04f210SWarner Losh */ 390be04f210SWarner Losh addr = TARGET_PAGE_SIZE; 391be04f210SWarner Losh } else if (wrapped && addr >= start) { 392be04f210SWarner Losh return (abi_ulong)-1; 393be04f210SWarner Losh } 394be04f210SWarner Losh } 395be04f210SWarner Losh } 396be04f210SWarner Losh 397be04f210SWarner Losh abi_ulong mmap_find_vma(abi_ulong start, abi_ulong size) 398be04f210SWarner Losh { 399be04f210SWarner Losh return mmap_find_vma_aligned(start, size, 0); 400be04f210SWarner Losh } 401be04f210SWarner Losh 40284778508Sblueswir1 /* NOTE: all the constants are the HOST ones */ 40384778508Sblueswir1 abi_long target_mmap(abi_ulong start, abi_ulong len, int prot, 404be04f210SWarner Losh int flags, int fd, off_t offset) 40584778508Sblueswir1 { 40684778508Sblueswir1 abi_ulong ret, end, real_start, real_end, retaddr, host_offset, host_len; 40784778508Sblueswir1 40884778508Sblueswir1 mmap_lock(); 40945b8765eSWarner Losh if (qemu_loglevel_mask(CPU_LOG_PAGE)) { 41045b8765eSWarner Losh qemu_log("mmap: start=0x" TARGET_ABI_FMT_lx 4116a3b9bfdSWarner Losh " len=0x" TARGET_ABI_FMT_lx " prot=%c%c%c flags=", 41284778508Sblueswir1 start, len, 41384778508Sblueswir1 prot & PROT_READ ? 'r' : '-', 41484778508Sblueswir1 prot & PROT_WRITE ? 'w' : '-', 41584778508Sblueswir1 prot & PROT_EXEC ? 'x' : '-'); 4166a3b9bfdSWarner Losh if (flags & MAP_ALIGNMENT_MASK) { 41745b8765eSWarner Losh qemu_log("MAP_ALIGNED(%u) ", 41845b8765eSWarner Losh (flags & MAP_ALIGNMENT_MASK) >> MAP_ALIGNMENT_SHIFT); 41984778508Sblueswir1 } 4206a3b9bfdSWarner Losh if (flags & MAP_GUARD) { 42145b8765eSWarner Losh qemu_log("MAP_GUARD "); 4226a3b9bfdSWarner Losh } 4236a3b9bfdSWarner Losh if (flags & MAP_FIXED) { 42445b8765eSWarner Losh qemu_log("MAP_FIXED "); 4256a3b9bfdSWarner Losh } 426953b69ccSWarner Losh if (flags & MAP_ANON) { 42745b8765eSWarner Losh qemu_log("MAP_ANON "); 4286a3b9bfdSWarner Losh } 4296a3b9bfdSWarner Losh if (flags & MAP_EXCL) { 43045b8765eSWarner Losh qemu_log("MAP_EXCL "); 4316a3b9bfdSWarner Losh } 4326a3b9bfdSWarner Losh if (flags & MAP_PRIVATE) { 43345b8765eSWarner Losh qemu_log("MAP_PRIVATE "); 4346a3b9bfdSWarner Losh } 4356a3b9bfdSWarner Losh if (flags & MAP_SHARED) { 43645b8765eSWarner Losh qemu_log("MAP_SHARED "); 4376a3b9bfdSWarner Losh } 4386a3b9bfdSWarner Losh if (flags & MAP_NOCORE) { 43945b8765eSWarner Losh qemu_log("MAP_NOCORE "); 4406a3b9bfdSWarner Losh } 4416a3b9bfdSWarner Losh if (flags & MAP_STACK) { 44245b8765eSWarner Losh qemu_log("MAP_STACK "); 4436a3b9bfdSWarner Losh } 44445b8765eSWarner Losh qemu_log("fd=%d offset=0x%lx\n", fd, offset); 44584778508Sblueswir1 } 44684778508Sblueswir1 447953b69ccSWarner Losh if ((flags & MAP_ANON) && fd != -1) { 448be04f210SWarner Losh errno = EINVAL; 449be04f210SWarner Losh goto fail; 450be04f210SWarner Losh } 451be04f210SWarner Losh if (flags & MAP_STACK) { 452be04f210SWarner Losh if ((fd != -1) || ((prot & (PROT_READ | PROT_WRITE)) != 453be04f210SWarner Losh (PROT_READ | PROT_WRITE))) { 454be04f210SWarner Losh errno = EINVAL; 455be04f210SWarner Losh goto fail; 456be04f210SWarner Losh } 457be04f210SWarner Losh } 458be04f210SWarner Losh if ((flags & MAP_GUARD) && (prot != PROT_NONE || fd != -1 || 459be04f210SWarner Losh offset != 0 || (flags & (MAP_SHARED | MAP_PRIVATE | 460be04f210SWarner Losh /* MAP_PREFAULT | */ /* MAP_PREFAULT not in mman.h */ 461be04f210SWarner Losh MAP_PREFAULT_READ | MAP_ANON | MAP_STACK)) != 0)) { 462be04f210SWarner Losh errno = EINVAL; 463be04f210SWarner Losh goto fail; 464be04f210SWarner Losh } 465be04f210SWarner Losh 46684778508Sblueswir1 if (offset & ~TARGET_PAGE_MASK) { 46784778508Sblueswir1 errno = EINVAL; 46884778508Sblueswir1 goto fail; 46984778508Sblueswir1 } 47084778508Sblueswir1 471be04f210SWarner Losh if (len == 0) { 472be04f210SWarner Losh errno = EINVAL; 473be04f210SWarner Losh goto fail; 474be04f210SWarner Losh } 47514837a3fSWarner Losh 47614837a3fSWarner Losh /* Check for overflows */ 47714837a3fSWarner Losh len = TARGET_PAGE_ALIGN(len); 47814837a3fSWarner Losh if (len == 0) { 47914837a3fSWarner Losh errno = ENOMEM; 48014837a3fSWarner Losh goto fail; 48114837a3fSWarner Losh } 48214837a3fSWarner Losh 48384778508Sblueswir1 real_start = start & qemu_host_page_mask; 48484778508Sblueswir1 host_offset = offset & qemu_host_page_mask; 485be04f210SWarner Losh 486be04f210SWarner Losh /* 487be04f210SWarner Losh * If the user is asking for the kernel to find a location, do that 488be04f210SWarner Losh * before we truncate the length for mapping files below. 489be04f210SWarner Losh */ 490be04f210SWarner Losh if (!(flags & MAP_FIXED)) { 49184778508Sblueswir1 host_len = len + offset - host_offset; 49284778508Sblueswir1 host_len = HOST_PAGE_ALIGN(host_len); 493be04f210SWarner Losh if ((flags & MAP_ALIGNMENT_MASK) != 0) 494be04f210SWarner Losh start = mmap_find_vma_aligned(real_start, host_len, 495be04f210SWarner Losh (flags & MAP_ALIGNMENT_MASK) >> MAP_ALIGNMENT_SHIFT); 496be04f210SWarner Losh else 497be04f210SWarner Losh start = mmap_find_vma(real_start, host_len); 498be04f210SWarner Losh if (start == (abi_ulong)-1) { 49984778508Sblueswir1 errno = ENOMEM; 50084778508Sblueswir1 goto fail; 50184778508Sblueswir1 } 502be04f210SWarner Losh } 503be04f210SWarner Losh 504be04f210SWarner Losh /* 505be04f210SWarner Losh * When mapping files into a memory area larger than the file, accesses 506be04f210SWarner Losh * to pages beyond the file size will cause a SIGBUS. 507be04f210SWarner Losh * 508be04f210SWarner Losh * For example, if mmaping a file of 100 bytes on a host with 4K pages 509be04f210SWarner Losh * emulating a target with 8K pages, the target expects to be able to 510be04f210SWarner Losh * access the first 8K. But the host will trap us on any access beyond 511be04f210SWarner Losh * 4K. 512be04f210SWarner Losh * 513be04f210SWarner Losh * When emulating a target with a larger page-size than the hosts, we 514be04f210SWarner Losh * may need to truncate file maps at EOF and add extra anonymous pages 515be04f210SWarner Losh * up to the targets page boundary. 516be04f210SWarner Losh */ 517be04f210SWarner Losh 5188e3b0cbbSMarc-André Lureau if ((qemu_real_host_page_size() < qemu_host_page_size) && fd != -1) { 519be04f210SWarner Losh struct stat sb; 520be04f210SWarner Losh 521be04f210SWarner Losh if (fstat(fd, &sb) == -1) { 522be04f210SWarner Losh goto fail; 523be04f210SWarner Losh } 524be04f210SWarner Losh 525be04f210SWarner Losh /* Are we trying to create a map beyond EOF?. */ 526be04f210SWarner Losh if (offset + len > sb.st_size) { 527be04f210SWarner Losh /* 528be04f210SWarner Losh * If so, truncate the file map at eof aligned with 529be04f210SWarner Losh * the hosts real pagesize. Additional anonymous maps 530be04f210SWarner Losh * will be created beyond EOF. 531be04f210SWarner Losh */ 532be04f210SWarner Losh len = REAL_HOST_PAGE_ALIGN(sb.st_size - offset); 533be04f210SWarner Losh } 534be04f210SWarner Losh } 535be04f210SWarner Losh 536be04f210SWarner Losh if (!(flags & MAP_FIXED)) { 537be04f210SWarner Losh unsigned long host_start; 538be04f210SWarner Losh void *p; 539be04f210SWarner Losh 540be04f210SWarner Losh host_len = len + offset - host_offset; 541be04f210SWarner Losh host_len = HOST_PAGE_ALIGN(host_len); 542be04f210SWarner Losh 543be04f210SWarner Losh /* 544be04f210SWarner Losh * Note: we prefer to control the mapping address. It is 545be04f210SWarner Losh * especially important if qemu_host_page_size > 546be04f210SWarner Losh * qemu_real_host_page_size 547be04f210SWarner Losh */ 548be04f210SWarner Losh p = mmap(g2h_untagged(start), host_len, prot, 549953b69ccSWarner Losh flags | MAP_FIXED | ((fd != -1) ? MAP_ANON : 0), -1, 0); 55084778508Sblueswir1 if (p == MAP_FAILED) 55184778508Sblueswir1 goto fail; 55284778508Sblueswir1 /* update start so that it points to the file position at 'offset' */ 55384778508Sblueswir1 host_start = (unsigned long)p; 554be04f210SWarner Losh if (fd != -1) { 555be04f210SWarner Losh p = mmap(g2h_untagged(start), len, prot, 556be04f210SWarner Losh flags | MAP_FIXED, fd, host_offset); 557be04f210SWarner Losh if (p == MAP_FAILED) { 558be04f210SWarner Losh munmap(g2h_untagged(start), host_len); 559be04f210SWarner Losh goto fail; 560be04f210SWarner Losh } 56184778508Sblueswir1 host_start += offset - host_offset; 562be04f210SWarner Losh } 56384778508Sblueswir1 start = h2g(host_start); 56484778508Sblueswir1 } else { 56584778508Sblueswir1 if (start & ~TARGET_PAGE_MASK) { 56684778508Sblueswir1 errno = EINVAL; 56784778508Sblueswir1 goto fail; 56884778508Sblueswir1 } 56984778508Sblueswir1 end = start + len; 57084778508Sblueswir1 real_end = HOST_PAGE_ALIGN(end); 57184778508Sblueswir1 572be04f210SWarner Losh /* 573be04f210SWarner Losh * Test if requested memory area fits target address space 574be04f210SWarner Losh * It can fail only on 64-bit host with 32-bit target. 575be04f210SWarner Losh * On any other target/host host mmap() handles this error correctly. 576be04f210SWarner Losh */ 5770fc76b68SKyle Evans if (!guest_range_valid_untagged(start, len)) { 578be04f210SWarner Losh errno = EINVAL; 57984778508Sblueswir1 goto fail; 58084778508Sblueswir1 } 58184778508Sblueswir1 582be04f210SWarner Losh /* 583be04f210SWarner Losh * worst case: we cannot map the file because the offset is not 584be04f210SWarner Losh * aligned, so we read it 585be04f210SWarner Losh */ 586a6b2d060SWarner Losh if (fd != -1 && 58784778508Sblueswir1 (offset & ~qemu_host_page_mask) != (start & ~qemu_host_page_mask)) { 588be04f210SWarner Losh /* 589be04f210SWarner Losh * msync() won't work here, so we return an error if write is 590be04f210SWarner Losh * possible while it is a shared mapping 591be04f210SWarner Losh */ 5926c173b3cSblueswir1 if ((flags & TARGET_BSD_MAP_FLAGMASK) == MAP_SHARED && 59384778508Sblueswir1 (prot & PROT_WRITE)) { 59484778508Sblueswir1 errno = EINVAL; 59584778508Sblueswir1 goto fail; 59684778508Sblueswir1 } 59784778508Sblueswir1 retaddr = target_mmap(start, len, prot | PROT_WRITE, 59884778508Sblueswir1 MAP_FIXED | MAP_PRIVATE | MAP_ANON, 59984778508Sblueswir1 -1, 0); 60084778508Sblueswir1 if (retaddr == -1) 60184778508Sblueswir1 goto fail; 602*5b73b248SRichard Henderson if (!mmap_pread(fd, g2h_untagged(start), len, offset, false)) { 60326778ac3SMikaël Urankar goto fail; 60426778ac3SMikaël Urankar } 60584778508Sblueswir1 if (!(prot & PROT_WRITE)) { 60684778508Sblueswir1 ret = target_mprotect(start, len, prot); 60791a5addaSWarner Losh assert(ret == 0); 60884778508Sblueswir1 } 60984778508Sblueswir1 goto the_end; 61084778508Sblueswir1 } 61184778508Sblueswir1 6120fc76b68SKyle Evans /* Reject the mapping if any page within the range is mapped */ 6139c255cb5SRichard Henderson if ((flags & MAP_EXCL) && !page_check_range_empty(start, end - 1)) { 6140fc76b68SKyle Evans errno = EINVAL; 6150fc76b68SKyle Evans goto fail; 6160fc76b68SKyle Evans } 6170fc76b68SKyle Evans 61884778508Sblueswir1 /* handle the start of the mapping */ 61984778508Sblueswir1 if (start > real_start) { 62084778508Sblueswir1 if (real_end == real_start + qemu_host_page_size) { 62184778508Sblueswir1 /* one single host page */ 62284778508Sblueswir1 ret = mmap_frag(real_start, start, end, 62384778508Sblueswir1 prot, flags, fd, offset); 62484778508Sblueswir1 if (ret == -1) 62584778508Sblueswir1 goto fail; 62684778508Sblueswir1 goto the_end1; 62784778508Sblueswir1 } 62884778508Sblueswir1 ret = mmap_frag(real_start, start, real_start + qemu_host_page_size, 62984778508Sblueswir1 prot, flags, fd, offset); 63084778508Sblueswir1 if (ret == -1) 63184778508Sblueswir1 goto fail; 63284778508Sblueswir1 real_start += qemu_host_page_size; 63384778508Sblueswir1 } 63484778508Sblueswir1 /* handle the end of the mapping */ 63584778508Sblueswir1 if (end < real_end) { 63684778508Sblueswir1 ret = mmap_frag(real_end - qemu_host_page_size, 637be04f210SWarner Losh real_end - qemu_host_page_size, end, 63884778508Sblueswir1 prot, flags, fd, 63984778508Sblueswir1 offset + real_end - qemu_host_page_size - start); 64084778508Sblueswir1 if (ret == -1) 64184778508Sblueswir1 goto fail; 64284778508Sblueswir1 real_end -= qemu_host_page_size; 64384778508Sblueswir1 } 64484778508Sblueswir1 64584778508Sblueswir1 /* map the middle (easier) */ 64684778508Sblueswir1 if (real_start < real_end) { 64784778508Sblueswir1 void *p; 64884778508Sblueswir1 unsigned long offset1; 64984778508Sblueswir1 if (flags & MAP_ANON) 65084778508Sblueswir1 offset1 = 0; 65184778508Sblueswir1 else 65284778508Sblueswir1 offset1 = offset + real_start - start; 6533e8f1628SRichard Henderson p = mmap(g2h_untagged(real_start), real_end - real_start, 65484778508Sblueswir1 prot, flags, fd, offset1); 65584778508Sblueswir1 if (p == MAP_FAILED) 65684778508Sblueswir1 goto fail; 65784778508Sblueswir1 } 65884778508Sblueswir1 } 65984778508Sblueswir1 the_end1: 66049840a4aSRichard Henderson page_set_flags(start, start + len - 1, prot | PAGE_VALID); 66184778508Sblueswir1 the_end: 66284778508Sblueswir1 #ifdef DEBUG_MMAP 6636a3b9bfdSWarner Losh printf("ret=0x" TARGET_ABI_FMT_lx "\n", start); 66484778508Sblueswir1 page_dump(stdout); 66584778508Sblueswir1 printf("\n"); 66684778508Sblueswir1 #endif 66784778508Sblueswir1 mmap_unlock(); 66884778508Sblueswir1 return start; 66984778508Sblueswir1 fail: 67084778508Sblueswir1 mmap_unlock(); 67184778508Sblueswir1 return -1; 67284778508Sblueswir1 } 67384778508Sblueswir1 6744e00b7d8SStacey Son void mmap_reserve(abi_ulong start, abi_ulong size) 675be04f210SWarner Losh { 676be04f210SWarner Losh abi_ulong real_start; 677be04f210SWarner Losh abi_ulong real_end; 678be04f210SWarner Losh abi_ulong addr; 679be04f210SWarner Losh abi_ulong end; 680be04f210SWarner Losh int prot; 681be04f210SWarner Losh 682be04f210SWarner Losh real_start = start & qemu_host_page_mask; 683be04f210SWarner Losh real_end = HOST_PAGE_ALIGN(start + size); 684be04f210SWarner Losh end = start + size; 685be04f210SWarner Losh if (start > real_start) { 686be04f210SWarner Losh /* handle host page containing start */ 687be04f210SWarner Losh prot = 0; 688be04f210SWarner Losh for (addr = real_start; addr < start; addr += TARGET_PAGE_SIZE) { 689be04f210SWarner Losh prot |= page_get_flags(addr); 690be04f210SWarner Losh } 691be04f210SWarner Losh if (real_end == real_start + qemu_host_page_size) { 692be04f210SWarner Losh for (addr = end; addr < real_end; addr += TARGET_PAGE_SIZE) { 693be04f210SWarner Losh prot |= page_get_flags(addr); 694be04f210SWarner Losh } 695be04f210SWarner Losh end = real_end; 696be04f210SWarner Losh } 697be04f210SWarner Losh if (prot != 0) { 698be04f210SWarner Losh real_start += qemu_host_page_size; 699be04f210SWarner Losh } 700be04f210SWarner Losh } 701be04f210SWarner Losh if (end < real_end) { 702be04f210SWarner Losh prot = 0; 703be04f210SWarner Losh for (addr = end; addr < real_end; addr += TARGET_PAGE_SIZE) { 704be04f210SWarner Losh prot |= page_get_flags(addr); 705be04f210SWarner Losh } 706be04f210SWarner Losh if (prot != 0) { 707be04f210SWarner Losh real_end -= qemu_host_page_size; 708be04f210SWarner Losh } 709be04f210SWarner Losh } 710be04f210SWarner Losh if (real_start != real_end) { 711be04f210SWarner Losh mmap(g2h_untagged(real_start), real_end - real_start, PROT_NONE, 712953b69ccSWarner Losh MAP_FIXED | MAP_ANON | MAP_PRIVATE, -1, 0); 713be04f210SWarner Losh } 714be04f210SWarner Losh } 715be04f210SWarner Losh 71684778508Sblueswir1 int target_munmap(abi_ulong start, abi_ulong len) 71784778508Sblueswir1 { 71884778508Sblueswir1 abi_ulong end, real_start, real_end, addr; 71984778508Sblueswir1 int prot, ret; 72084778508Sblueswir1 72184778508Sblueswir1 #ifdef DEBUG_MMAP 7226a3b9bfdSWarner Losh printf("munmap: start=0x" TARGET_ABI_FMT_lx " len=0x" 7236a3b9bfdSWarner Losh TARGET_ABI_FMT_lx "\n", 7246a3b9bfdSWarner Losh start, len); 72584778508Sblueswir1 #endif 72684778508Sblueswir1 if (start & ~TARGET_PAGE_MASK) 72784778508Sblueswir1 return -EINVAL; 72884778508Sblueswir1 len = TARGET_PAGE_ALIGN(len); 72984778508Sblueswir1 if (len == 0) 73084778508Sblueswir1 return -EINVAL; 73184778508Sblueswir1 mmap_lock(); 73284778508Sblueswir1 end = start + len; 73384778508Sblueswir1 real_start = start & qemu_host_page_mask; 73484778508Sblueswir1 real_end = HOST_PAGE_ALIGN(end); 73584778508Sblueswir1 73684778508Sblueswir1 if (start > real_start) { 73784778508Sblueswir1 /* handle host page containing start */ 73884778508Sblueswir1 prot = 0; 73984778508Sblueswir1 for (addr = real_start; addr < start; addr += TARGET_PAGE_SIZE) { 74084778508Sblueswir1 prot |= page_get_flags(addr); 74184778508Sblueswir1 } 74284778508Sblueswir1 if (real_end == real_start + qemu_host_page_size) { 74384778508Sblueswir1 for (addr = end; addr < real_end; addr += TARGET_PAGE_SIZE) { 74484778508Sblueswir1 prot |= page_get_flags(addr); 74584778508Sblueswir1 } 74684778508Sblueswir1 end = real_end; 74784778508Sblueswir1 } 74884778508Sblueswir1 if (prot != 0) 74984778508Sblueswir1 real_start += qemu_host_page_size; 75084778508Sblueswir1 } 75184778508Sblueswir1 if (end < real_end) { 75284778508Sblueswir1 prot = 0; 75384778508Sblueswir1 for (addr = end; addr < real_end; addr += TARGET_PAGE_SIZE) { 75484778508Sblueswir1 prot |= page_get_flags(addr); 75584778508Sblueswir1 } 75684778508Sblueswir1 if (prot != 0) 75784778508Sblueswir1 real_end -= qemu_host_page_size; 75884778508Sblueswir1 } 75984778508Sblueswir1 76084778508Sblueswir1 ret = 0; 76184778508Sblueswir1 /* unmap what we can */ 76284778508Sblueswir1 if (real_start < real_end) { 763be04f210SWarner Losh if (reserved_va) { 764be04f210SWarner Losh mmap_reserve(real_start, real_end - real_start); 765be04f210SWarner Losh } else { 7663e8f1628SRichard Henderson ret = munmap(g2h_untagged(real_start), real_end - real_start); 76784778508Sblueswir1 } 768be04f210SWarner Losh } 76984778508Sblueswir1 770be04f210SWarner Losh if (ret == 0) { 77149840a4aSRichard Henderson page_set_flags(start, start + len - 1, 0); 772be04f210SWarner Losh } 77384778508Sblueswir1 mmap_unlock(); 77484778508Sblueswir1 return ret; 77584778508Sblueswir1 } 77684778508Sblueswir1 77784778508Sblueswir1 int target_msync(abi_ulong start, abi_ulong len, int flags) 77884778508Sblueswir1 { 77984778508Sblueswir1 abi_ulong end; 78084778508Sblueswir1 78184778508Sblueswir1 if (start & ~TARGET_PAGE_MASK) 78284778508Sblueswir1 return -EINVAL; 78384778508Sblueswir1 len = TARGET_PAGE_ALIGN(len); 78484778508Sblueswir1 end = start + len; 78584778508Sblueswir1 if (end < start) 78684778508Sblueswir1 return -EINVAL; 78784778508Sblueswir1 if (end == start) 78884778508Sblueswir1 return 0; 78984778508Sblueswir1 79084778508Sblueswir1 start &= qemu_host_page_mask; 7913e8f1628SRichard Henderson return msync(g2h_untagged(start), end - start, flags); 79284778508Sblueswir1 } 793