1 /* 2 * qemu bsd user main 3 * 4 * Copyright (c) 2003-2008 Fabrice Bellard 5 * Copyright (c) 2013-14 Stacey Son 6 * 7 * This program is free software; you can redistribute it and/or modify 8 * it under the terms of the GNU General Public License as published by 9 * the Free Software Foundation; either version 2 of the License, or 10 * (at your option) any later version. 11 * 12 * This program is distributed in the hope that it will be useful, 13 * but WITHOUT ANY WARRANTY; without even the implied warranty of 14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the 15 * GNU General Public License for more details. 16 * 17 * You should have received a copy of the GNU General Public License 18 * along with this program; if not, see <http://www.gnu.org/licenses/>. 19 */ 20 21 #include "qemu/osdep.h" 22 #include <sys/resource.h> 23 #include <sys/sysctl.h> 24 25 #include "qemu/help-texts.h" 26 #include "qemu/units.h" 27 #include "qemu/accel.h" 28 #include "qemu-version.h" 29 #include <machine/trap.h> 30 31 #include "qapi/error.h" 32 #include "qemu.h" 33 #include "qemu/config-file.h" 34 #include "qemu/error-report.h" 35 #include "qemu/path.h" 36 #include "qemu/help_option.h" 37 #include "qemu/module.h" 38 #include "exec/exec-all.h" 39 #include "tcg/startup.h" 40 #include "qemu/timer.h" 41 #include "qemu/envlist.h" 42 #include "qemu/cutils.h" 43 #include "exec/log.h" 44 #include "trace/control.h" 45 #include "crypto/init.h" 46 #include "qemu/guest-random.h" 47 #include "gdbstub/user.h" 48 49 #include "host-os.h" 50 #include "target_arch_cpu.h" 51 52 53 /* 54 * TODO: Remove these and rely only on qemu_real_host_page_size(). 55 */ 56 uintptr_t qemu_host_page_size; 57 intptr_t qemu_host_page_mask; 58 59 static bool opt_one_insn_per_tb; 60 uintptr_t guest_base; 61 bool have_guest_base; 62 /* 63 * When running 32-on-64 we should make sure we can fit all of the possible 64 * guest address space into a contiguous chunk of virtual host memory. 65 * 66 * This way we will never overlap with our own libraries or binaries or stack 67 * or anything else that QEMU maps. 68 * 69 * Many cpus reserve the high bit (or more than one for some 64-bit cpus) 70 * of the address for the kernel. Some cpus rely on this and user space 71 * uses the high bit(s) for pointer tagging and the like. For them, we 72 * must preserve the expected address space. 73 */ 74 #ifndef MAX_RESERVED_VA 75 # if HOST_LONG_BITS > TARGET_VIRT_ADDR_SPACE_BITS 76 # if TARGET_VIRT_ADDR_SPACE_BITS == 32 && \ 77 (TARGET_LONG_BITS == 32 || defined(TARGET_ABI32)) 78 # define MAX_RESERVED_VA 0xfffffffful 79 # else 80 # define MAX_RESERVED_VA ((1ul << TARGET_VIRT_ADDR_SPACE_BITS) - 1) 81 # endif 82 # else 83 # define MAX_RESERVED_VA 0 84 # endif 85 #endif 86 87 /* 88 * That said, reserving *too* much vm space via mmap can run into problems 89 * with rlimits, oom due to page table creation, etc. We will still try it, 90 * if directed by the command-line option, but not by default. 91 */ 92 #if HOST_LONG_BITS == 64 && TARGET_VIRT_ADDR_SPACE_BITS <= 32 93 unsigned long reserved_va = MAX_RESERVED_VA; 94 #else 95 unsigned long reserved_va; 96 #endif 97 98 const char *interp_prefix = CONFIG_QEMU_INTERP_PREFIX; 99 const char *qemu_uname_release; 100 char qemu_proc_pathname[PATH_MAX]; /* full path to exeutable */ 101 102 unsigned long target_maxtsiz = TARGET_MAXTSIZ; /* max text size */ 103 unsigned long target_dfldsiz = TARGET_DFLDSIZ; /* initial data size limit */ 104 unsigned long target_maxdsiz = TARGET_MAXDSIZ; /* max data size */ 105 unsigned long target_dflssiz = TARGET_DFLSSIZ; /* initial data size limit */ 106 unsigned long target_maxssiz = TARGET_MAXSSIZ; /* max stack size */ 107 unsigned long target_sgrowsiz = TARGET_SGROWSIZ; /* amount to grow stack */ 108 109 /* Helper routines for implementing atomic operations. */ 110 111 void fork_start(void) 112 { 113 start_exclusive(); 114 cpu_list_lock(); 115 mmap_fork_start(); 116 gdbserver_fork_start(); 117 } 118 119 void fork_end(pid_t pid) 120 { 121 bool child = pid == 0; 122 123 if (child) { 124 CPUState *cpu, *next_cpu; 125 /* 126 * Child processes created by fork() only have a single thread. Discard 127 * information about the parent threads. 128 */ 129 CPU_FOREACH_SAFE(cpu, next_cpu) { 130 if (cpu != thread_cpu) { 131 QTAILQ_REMOVE_RCU(&cpus_queue, cpu, node); 132 } 133 } 134 mmap_fork_end(child); 135 /* 136 * qemu_init_cpu_list() takes care of reinitializing the exclusive 137 * state, so we don't need to end_exclusive() here. 138 */ 139 qemu_init_cpu_list(); 140 get_task_state(thread_cpu)->ts_tid = qemu_get_thread_id(); 141 gdbserver_fork_end(thread_cpu, pid); 142 } else { 143 mmap_fork_end(child); 144 cpu_list_unlock(); 145 gdbserver_fork_end(thread_cpu, pid); 146 end_exclusive(); 147 } 148 } 149 150 void cpu_loop(CPUArchState *env) 151 { 152 target_cpu_loop(env); 153 } 154 155 static void usage(void) 156 { 157 printf("qemu-" TARGET_NAME " version " QEMU_FULL_VERSION 158 "\n" QEMU_COPYRIGHT "\n" 159 "usage: qemu-" TARGET_NAME " [options] program [arguments...]\n" 160 "BSD CPU emulator (compiled for %s emulation)\n" 161 "\n" 162 "Standard options:\n" 163 "-h print this help\n" 164 "-g port wait gdb connection to port\n" 165 "-L path set the elf interpreter prefix (default=%s)\n" 166 "-s size set the stack size in bytes (default=%ld)\n" 167 "-cpu model select CPU (-cpu help for list)\n" 168 "-drop-ld-preload drop LD_PRELOAD for target process\n" 169 "-E var=value sets/modifies targets environment variable(s)\n" 170 "-U var unsets targets environment variable(s)\n" 171 "-B address set guest_base address to address\n" 172 "\n" 173 "Debug options:\n" 174 "-d item1[,...] enable logging of specified items\n" 175 " (use '-d help' for a list of log items)\n" 176 "-D logfile write logs to 'logfile' (default stderr)\n" 177 "-one-insn-per-tb run with one guest instruction per emulated TB\n" 178 "-strace log system calls\n" 179 "-trace [[enable=]<pattern>][,events=<file>][,file=<file>]\n" 180 " specify tracing options\n" 181 "\n" 182 "Environment variables:\n" 183 "QEMU_STRACE Print system calls and arguments similar to the\n" 184 " 'strace' program. Enable by setting to any value.\n" 185 "You can use -E and -U options to set/unset environment variables\n" 186 "for target process. It is possible to provide several variables\n" 187 "by repeating the option. For example:\n" 188 " -E var1=val2 -E var2=val2 -U LD_PRELOAD -U LD_DEBUG\n" 189 "Note that if you provide several changes to single variable\n" 190 "last change will stay in effect.\n" 191 "\n" 192 QEMU_HELP_BOTTOM "\n" 193 , 194 TARGET_NAME, 195 interp_prefix, 196 target_dflssiz); 197 exit(1); 198 } 199 200 __thread CPUState *thread_cpu; 201 202 void stop_all_tasks(void) 203 { 204 /* 205 * We trust when using NPTL (pthreads) start_exclusive() handles thread 206 * stopping correctly. 207 */ 208 start_exclusive(); 209 } 210 211 bool qemu_cpu_is_self(CPUState *cpu) 212 { 213 return thread_cpu == cpu; 214 } 215 216 void qemu_cpu_kick(CPUState *cpu) 217 { 218 cpu_exit(cpu); 219 } 220 221 /* Assumes contents are already zeroed. */ 222 static void init_task_state(TaskState *ts) 223 { 224 ts->sigaltstack_used = (struct target_sigaltstack) { 225 .ss_sp = 0, 226 .ss_size = 0, 227 .ss_flags = TARGET_SS_DISABLE, 228 }; 229 } 230 231 void gemu_log(const char *fmt, ...) 232 { 233 va_list ap; 234 235 va_start(ap, fmt); 236 vfprintf(stderr, fmt, ap); 237 va_end(ap); 238 } 239 240 static void 241 adjust_ssize(void) 242 { 243 struct rlimit rl; 244 245 if (getrlimit(RLIMIT_STACK, &rl) != 0) { 246 return; 247 } 248 249 target_maxssiz = MIN(target_maxssiz, rl.rlim_max); 250 target_dflssiz = MIN(MAX(target_dflssiz, rl.rlim_cur), target_maxssiz); 251 252 rl.rlim_max = target_maxssiz; 253 rl.rlim_cur = target_dflssiz; 254 setrlimit(RLIMIT_STACK, &rl); 255 } 256 257 static void save_proc_pathname(char *argv0) 258 { 259 int mib[4]; 260 size_t len; 261 262 mib[0] = CTL_KERN; 263 mib[1] = KERN_PROC; 264 mib[2] = KERN_PROC_PATHNAME; 265 mib[3] = -1; 266 267 len = sizeof(qemu_proc_pathname); 268 if (sysctl(mib, 4, qemu_proc_pathname, &len, NULL, 0)) { 269 perror("sysctl"); 270 } 271 } 272 273 int main(int argc, char **argv) 274 { 275 const char *filename; 276 const char *cpu_model; 277 const char *cpu_type; 278 const char *log_file = NULL; 279 const char *log_mask = NULL; 280 const char *seed_optarg = NULL; 281 struct target_pt_regs regs1, *regs = ®s1; 282 struct image_info info1, *info = &info1; 283 struct bsd_binprm bprm; 284 TaskState *ts; 285 CPUArchState *env; 286 CPUState *cpu; 287 int optind, rv; 288 const char *r; 289 const char *gdbstub = NULL; 290 char **target_environ, **wrk; 291 envlist_t *envlist = NULL; 292 char *argv0 = NULL; 293 294 adjust_ssize(); 295 296 if (argc <= 1) { 297 usage(); 298 } 299 300 save_proc_pathname(argv[0]); 301 302 error_init(argv[0]); 303 module_call_init(MODULE_INIT_TRACE); 304 qemu_init_cpu_list(); 305 module_call_init(MODULE_INIT_QOM); 306 307 envlist = envlist_create(); 308 309 /* 310 * add current environment into the list 311 * envlist_setenv adds to the front of the list; to preserve environ 312 * order add from back to front 313 */ 314 for (wrk = environ; *wrk != NULL; wrk++) { 315 continue; 316 } 317 while (wrk != environ) { 318 wrk--; 319 (void) envlist_setenv(envlist, *wrk); 320 } 321 322 qemu_host_page_size = getpagesize(); 323 qemu_host_page_size = MAX(qemu_host_page_size, TARGET_PAGE_SIZE); 324 325 cpu_model = NULL; 326 327 qemu_add_opts(&qemu_trace_opts); 328 329 optind = 1; 330 for (;;) { 331 if (optind >= argc) { 332 break; 333 } 334 r = argv[optind]; 335 if (r[0] != '-') { 336 break; 337 } 338 optind++; 339 r++; 340 if (!strcmp(r, "-")) { 341 break; 342 } else if (!strcmp(r, "d")) { 343 if (optind >= argc) { 344 break; 345 } 346 log_mask = argv[optind++]; 347 } else if (!strcmp(r, "D")) { 348 if (optind >= argc) { 349 break; 350 } 351 log_file = argv[optind++]; 352 } else if (!strcmp(r, "E")) { 353 r = argv[optind++]; 354 if (envlist_setenv(envlist, r) != 0) { 355 usage(); 356 } 357 } else if (!strcmp(r, "ignore-environment")) { 358 envlist_free(envlist); 359 envlist = envlist_create(); 360 } else if (!strcmp(r, "U")) { 361 r = argv[optind++]; 362 if (envlist_unsetenv(envlist, r) != 0) { 363 usage(); 364 } 365 } else if (!strcmp(r, "s")) { 366 r = argv[optind++]; 367 rv = qemu_strtoul(r, &r, 0, &target_dflssiz); 368 if (rv < 0 || target_dflssiz <= 0) { 369 usage(); 370 } 371 if (*r == 'M') { 372 target_dflssiz *= 1024 * 1024; 373 } else if (*r == 'k' || *r == 'K') { 374 target_dflssiz *= 1024; 375 } 376 if (target_dflssiz > target_maxssiz) { 377 usage(); 378 } 379 } else if (!strcmp(r, "L")) { 380 interp_prefix = argv[optind++]; 381 } else if (!strcmp(r, "p")) { 382 unsigned size, want = qemu_real_host_page_size(); 383 384 r = argv[optind++]; 385 if (qemu_strtoui(r, NULL, 10, &size) || size != want) { 386 warn_report("Deprecated page size option cannot " 387 "change host page size (%u)", want); 388 } 389 } else if (!strcmp(r, "g")) { 390 gdbstub = g_strdup(argv[optind++]); 391 } else if (!strcmp(r, "r")) { 392 qemu_uname_release = argv[optind++]; 393 } else if (!strcmp(r, "cpu")) { 394 cpu_model = argv[optind++]; 395 if (is_help_option(cpu_model)) { 396 list_cpus(); 397 exit(1); 398 } 399 } else if (!strcmp(r, "B")) { 400 rv = qemu_strtoul(argv[optind++], NULL, 0, &guest_base); 401 if (rv < 0) { 402 usage(); 403 } 404 have_guest_base = true; 405 } else if (!strcmp(r, "drop-ld-preload")) { 406 (void) envlist_unsetenv(envlist, "LD_PRELOAD"); 407 } else if (!strcmp(r, "seed")) { 408 seed_optarg = optarg; 409 } else if (!strcmp(r, "one-insn-per-tb")) { 410 opt_one_insn_per_tb = true; 411 } else if (!strcmp(r, "strace")) { 412 do_strace = 1; 413 } else if (!strcmp(r, "trace")) { 414 trace_opt_parse(optarg); 415 } else if (!strcmp(r, "0")) { 416 argv0 = argv[optind++]; 417 } else { 418 usage(); 419 } 420 } 421 422 qemu_host_page_mask = -qemu_host_page_size; 423 424 /* init debug */ 425 { 426 int mask = 0; 427 if (log_mask) { 428 mask = qemu_str_to_log_mask(log_mask); 429 if (!mask) { 430 qemu_print_log_usage(stdout); 431 exit(1); 432 } 433 } 434 qemu_set_log_filename_flags(log_file, mask, &error_fatal); 435 } 436 437 if (optind >= argc) { 438 usage(); 439 } 440 filename = argv[optind]; 441 if (argv0) { 442 argv[optind] = argv0; 443 } 444 445 if (!trace_init_backends()) { 446 exit(1); 447 } 448 trace_init_file(); 449 450 /* Zero out regs */ 451 memset(regs, 0, sizeof(struct target_pt_regs)); 452 453 /* Zero bsd params */ 454 memset(&bprm, 0, sizeof(bprm)); 455 456 /* Zero out image_info */ 457 memset(info, 0, sizeof(struct image_info)); 458 459 /* Scan interp_prefix dir for replacement files. */ 460 init_paths(interp_prefix); 461 462 if (cpu_model == NULL) { 463 cpu_model = TARGET_DEFAULT_CPU_MODEL; 464 } 465 466 cpu_type = parse_cpu_option(cpu_model); 467 468 /* init tcg before creating CPUs and to get qemu_host_page_size */ 469 { 470 AccelState *accel = current_accel(); 471 AccelClass *ac = ACCEL_GET_CLASS(accel); 472 473 accel_init_interfaces(ac); 474 object_property_set_bool(OBJECT(accel), "one-insn-per-tb", 475 opt_one_insn_per_tb, &error_abort); 476 ac->init_machine(NULL); 477 } 478 cpu = cpu_create(cpu_type); 479 env = cpu_env(cpu); 480 cpu_reset(cpu); 481 thread_cpu = cpu; 482 483 if (getenv("QEMU_STRACE")) { 484 do_strace = 1; 485 } 486 487 target_environ = envlist_to_environ(envlist, NULL); 488 envlist_free(envlist); 489 490 { 491 Error *err = NULL; 492 if (seed_optarg != NULL) { 493 qemu_guest_random_seed_main(seed_optarg, &err); 494 } else { 495 qcrypto_init(&err); 496 } 497 if (err) { 498 error_reportf_err(err, "cannot initialize crypto: "); 499 exit(1); 500 } 501 } 502 503 /* 504 * Now that page sizes are configured we can do 505 * proper page alignment for guest_base. 506 */ 507 if (have_guest_base) { 508 if (guest_base & ~qemu_host_page_mask) { 509 error_report("Selected guest base not host page aligned"); 510 exit(1); 511 } 512 } 513 514 /* 515 * If reserving host virtual address space, do so now. 516 * Combined with '-B', ensure that the chosen range is free. 517 */ 518 if (reserved_va) { 519 void *p; 520 521 if (have_guest_base) { 522 p = mmap((void *)guest_base, reserved_va + 1, PROT_NONE, 523 MAP_ANON | MAP_PRIVATE | MAP_FIXED | MAP_EXCL, -1, 0); 524 } else { 525 p = mmap(NULL, reserved_va + 1, PROT_NONE, 526 MAP_ANON | MAP_PRIVATE, -1, 0); 527 } 528 if (p == MAP_FAILED) { 529 const char *err = strerror(errno); 530 char *sz = size_to_str(reserved_va + 1); 531 532 if (have_guest_base) { 533 error_report("Cannot allocate %s bytes at -B %p for guest " 534 "address space: %s", sz, (void *)guest_base, err); 535 } else { 536 error_report("Cannot allocate %s bytes for guest " 537 "address space: %s", sz, err); 538 } 539 exit(1); 540 } 541 guest_base = (uintptr_t)p; 542 have_guest_base = true; 543 544 /* Ensure that mmap_next_start is within range. */ 545 if (reserved_va <= mmap_next_start) { 546 mmap_next_start = (reserved_va / 4 * 3) 547 & TARGET_PAGE_MASK & qemu_host_page_mask; 548 } 549 } 550 551 if (loader_exec(filename, argv + optind, target_environ, regs, info, 552 &bprm) != 0) { 553 printf("Error loading %s\n", filename); 554 _exit(1); 555 } 556 557 for (wrk = target_environ; *wrk; wrk++) { 558 g_free(*wrk); 559 } 560 561 g_free(target_environ); 562 563 if (qemu_loglevel_mask(CPU_LOG_PAGE)) { 564 FILE *f = qemu_log_trylock(); 565 if (f) { 566 fprintf(f, "guest_base %p\n", (void *)guest_base); 567 fprintf(f, "page layout changed following binary load\n"); 568 page_dump(f); 569 570 fprintf(f, "end_code 0x" TARGET_ABI_FMT_lx "\n", 571 info->end_code); 572 fprintf(f, "start_code 0x" TARGET_ABI_FMT_lx "\n", 573 info->start_code); 574 fprintf(f, "start_data 0x" TARGET_ABI_FMT_lx "\n", 575 info->start_data); 576 fprintf(f, "end_data 0x" TARGET_ABI_FMT_lx "\n", 577 info->end_data); 578 fprintf(f, "start_stack 0x" TARGET_ABI_FMT_lx "\n", 579 info->start_stack); 580 fprintf(f, "brk 0x" TARGET_ABI_FMT_lx "\n", info->brk); 581 fprintf(f, "entry 0x" TARGET_ABI_FMT_lx "\n", info->entry); 582 583 qemu_log_unlock(f); 584 } 585 } 586 587 /* build Task State */ 588 ts = g_new0(TaskState, 1); 589 init_task_state(ts); 590 ts->info = info; 591 ts->bprm = &bprm; 592 cpu->opaque = ts; 593 594 target_set_brk(info->brk); 595 syscall_init(); 596 signal_init(); 597 598 /* 599 * Now that we've loaded the binary, GUEST_BASE is fixed. Delay 600 * generating the prologue until now so that the prologue can take 601 * the real value of GUEST_BASE into account. 602 */ 603 tcg_prologue_init(); 604 605 target_cpu_init(env, regs); 606 607 if (gdbstub) { 608 gdbserver_start(gdbstub); 609 gdb_handlesig(cpu, 0); 610 } 611 cpu_loop(env); 612 /* never exits */ 613 return 0; 614 } 615