1 // SPDX-License-Identifier: GPL-2.0-only 2 #include <linux/module.h> 3 #include <linux/sched.h> 4 #include <linux/ctype.h> 5 #include <linux/fd.h> 6 #include <linux/tty.h> 7 #include <linux/suspend.h> 8 #include <linux/root_dev.h> 9 #include <linux/security.h> 10 #include <linux/delay.h> 11 #include <linux/genhd.h> 12 #include <linux/mount.h> 13 #include <linux/device.h> 14 #include <linux/init.h> 15 #include <linux/fs.h> 16 #include <linux/initrd.h> 17 #include <linux/async.h> 18 #include <linux/fs_struct.h> 19 #include <linux/slab.h> 20 #include <linux/ramfs.h> 21 #include <linux/shmem_fs.h> 22 23 #include <linux/nfs_fs.h> 24 #include <linux/nfs_fs_sb.h> 25 #include <linux/nfs_mount.h> 26 #include <uapi/linux/mount.h> 27 28 #include "do_mounts.h" 29 30 int __initdata rd_doload; /* 1 = load RAM disk, 0 = don't load */ 31 32 int root_mountflags = MS_RDONLY | MS_SILENT; 33 static char * __initdata root_device_name; 34 static char __initdata saved_root_name[64]; 35 static int root_wait; 36 37 dev_t ROOT_DEV; 38 39 static int __init load_ramdisk(char *str) 40 { 41 rd_doload = simple_strtol(str,NULL,0) & 3; 42 return 1; 43 } 44 __setup("load_ramdisk=", load_ramdisk); 45 46 static int __init readonly(char *str) 47 { 48 if (*str) 49 return 0; 50 root_mountflags |= MS_RDONLY; 51 return 1; 52 } 53 54 static int __init readwrite(char *str) 55 { 56 if (*str) 57 return 0; 58 root_mountflags &= ~MS_RDONLY; 59 return 1; 60 } 61 62 __setup("ro", readonly); 63 __setup("rw", readwrite); 64 65 #ifdef CONFIG_BLOCK 66 struct uuidcmp { 67 const char *uuid; 68 int len; 69 }; 70 71 /** 72 * match_dev_by_uuid - callback for finding a partition using its uuid 73 * @dev: device passed in by the caller 74 * @data: opaque pointer to the desired struct uuidcmp to match 75 * 76 * Returns 1 if the device matches, and 0 otherwise. 77 */ 78 static int match_dev_by_uuid(struct device *dev, const void *data) 79 { 80 const struct uuidcmp *cmp = data; 81 struct hd_struct *part = dev_to_part(dev); 82 83 if (!part->info) 84 goto no_match; 85 86 if (strncasecmp(cmp->uuid, part->info->uuid, cmp->len)) 87 goto no_match; 88 89 return 1; 90 no_match: 91 return 0; 92 } 93 94 95 /** 96 * devt_from_partuuid - looks up the dev_t of a partition by its UUID 97 * @uuid_str: char array containing ascii UUID 98 * 99 * The function will return the first partition which contains a matching 100 * UUID value in its partition_meta_info struct. This does not search 101 * by filesystem UUIDs. 102 * 103 * If @uuid_str is followed by a "/PARTNROFF=%d", then the number will be 104 * extracted and used as an offset from the partition identified by the UUID. 105 * 106 * Returns the matching dev_t on success or 0 on failure. 107 */ 108 static dev_t devt_from_partuuid(const char *uuid_str) 109 { 110 dev_t res = 0; 111 struct uuidcmp cmp; 112 struct device *dev = NULL; 113 struct gendisk *disk; 114 struct hd_struct *part; 115 int offset = 0; 116 bool clear_root_wait = false; 117 char *slash; 118 119 cmp.uuid = uuid_str; 120 121 slash = strchr(uuid_str, '/'); 122 /* Check for optional partition number offset attributes. */ 123 if (slash) { 124 char c = 0; 125 /* Explicitly fail on poor PARTUUID syntax. */ 126 if (sscanf(slash + 1, 127 "PARTNROFF=%d%c", &offset, &c) != 1) { 128 clear_root_wait = true; 129 goto done; 130 } 131 cmp.len = slash - uuid_str; 132 } else { 133 cmp.len = strlen(uuid_str); 134 } 135 136 if (!cmp.len) { 137 clear_root_wait = true; 138 goto done; 139 } 140 141 dev = class_find_device(&block_class, NULL, &cmp, 142 &match_dev_by_uuid); 143 if (!dev) 144 goto done; 145 146 res = dev->devt; 147 148 /* Attempt to find the partition by offset. */ 149 if (!offset) 150 goto no_offset; 151 152 res = 0; 153 disk = part_to_disk(dev_to_part(dev)); 154 part = disk_get_part(disk, dev_to_part(dev)->partno + offset); 155 if (part) { 156 res = part_devt(part); 157 put_device(part_to_dev(part)); 158 } 159 160 no_offset: 161 put_device(dev); 162 done: 163 if (clear_root_wait) { 164 pr_err("VFS: PARTUUID= is invalid.\n" 165 "Expected PARTUUID=<valid-uuid-id>[/PARTNROFF=%%d]\n"); 166 if (root_wait) 167 pr_err("Disabling rootwait; root= is invalid.\n"); 168 root_wait = 0; 169 } 170 return res; 171 } 172 173 /** 174 * match_dev_by_label - callback for finding a partition using its label 175 * @dev: device passed in by the caller 176 * @data: opaque pointer to the label to match 177 * 178 * Returns 1 if the device matches, and 0 otherwise. 179 */ 180 static int match_dev_by_label(struct device *dev, const void *data) 181 { 182 const char *label = data; 183 struct hd_struct *part = dev_to_part(dev); 184 185 if (part->info && !strcmp(label, part->info->volname)) 186 return 1; 187 188 return 0; 189 } 190 #endif 191 192 /* 193 * Convert a name into device number. We accept the following variants: 194 * 195 * 1) <hex_major><hex_minor> device number in hexadecimal represents itself 196 * no leading 0x, for example b302. 197 * 2) /dev/nfs represents Root_NFS (0xff) 198 * 3) /dev/<disk_name> represents the device number of disk 199 * 4) /dev/<disk_name><decimal> represents the device number 200 * of partition - device number of disk plus the partition number 201 * 5) /dev/<disk_name>p<decimal> - same as the above, that form is 202 * used when disk name of partitioned disk ends on a digit. 203 * 6) PARTUUID=00112233-4455-6677-8899-AABBCCDDEEFF representing the 204 * unique id of a partition if the partition table provides it. 205 * The UUID may be either an EFI/GPT UUID, or refer to an MSDOS 206 * partition using the format SSSSSSSS-PP, where SSSSSSSS is a zero- 207 * filled hex representation of the 32-bit "NT disk signature", and PP 208 * is a zero-filled hex representation of the 1-based partition number. 209 * 7) PARTUUID=<UUID>/PARTNROFF=<int> to select a partition in relation to 210 * a partition with a known unique id. 211 * 8) <major>:<minor> major and minor number of the device separated by 212 * a colon. 213 * 9) PARTLABEL=<name> with name being the GPT partition label. 214 * MSDOS partitions do not support labels! 215 * 10) /dev/cifs represents Root_CIFS (0xfe) 216 * 217 * If name doesn't have fall into the categories above, we return (0,0). 218 * block_class is used to check if something is a disk name. If the disk 219 * name contains slashes, the device name has them replaced with 220 * bangs. 221 */ 222 223 dev_t name_to_dev_t(const char *name) 224 { 225 char s[32]; 226 char *p; 227 dev_t res = 0; 228 int part; 229 230 #ifdef CONFIG_BLOCK 231 if (strncmp(name, "PARTUUID=", 9) == 0) { 232 name += 9; 233 res = devt_from_partuuid(name); 234 if (!res) 235 goto fail; 236 goto done; 237 } else if (strncmp(name, "PARTLABEL=", 10) == 0) { 238 struct device *dev; 239 240 dev = class_find_device(&block_class, NULL, name + 10, 241 &match_dev_by_label); 242 if (!dev) 243 goto fail; 244 245 res = dev->devt; 246 put_device(dev); 247 goto done; 248 } 249 #endif 250 251 if (strncmp(name, "/dev/", 5) != 0) { 252 unsigned maj, min, offset; 253 char dummy; 254 255 if ((sscanf(name, "%u:%u%c", &maj, &min, &dummy) == 2) || 256 (sscanf(name, "%u:%u:%u:%c", &maj, &min, &offset, &dummy) == 3)) { 257 res = MKDEV(maj, min); 258 if (maj != MAJOR(res) || min != MINOR(res)) 259 goto fail; 260 } else { 261 res = new_decode_dev(simple_strtoul(name, &p, 16)); 262 if (*p) 263 goto fail; 264 } 265 goto done; 266 } 267 268 name += 5; 269 res = Root_NFS; 270 if (strcmp(name, "nfs") == 0) 271 goto done; 272 res = Root_CIFS; 273 if (strcmp(name, "cifs") == 0) 274 goto done; 275 res = Root_RAM0; 276 if (strcmp(name, "ram") == 0) 277 goto done; 278 279 if (strlen(name) > 31) 280 goto fail; 281 strcpy(s, name); 282 for (p = s; *p; p++) 283 if (*p == '/') 284 *p = '!'; 285 res = blk_lookup_devt(s, 0); 286 if (res) 287 goto done; 288 289 /* 290 * try non-existent, but valid partition, which may only exist 291 * after revalidating the disk, like partitioned md devices 292 */ 293 while (p > s && isdigit(p[-1])) 294 p--; 295 if (p == s || !*p || *p == '0') 296 goto fail; 297 298 /* try disk name without <part number> */ 299 part = simple_strtoul(p, NULL, 10); 300 *p = '\0'; 301 res = blk_lookup_devt(s, part); 302 if (res) 303 goto done; 304 305 /* try disk name without p<part number> */ 306 if (p < s + 2 || !isdigit(p[-2]) || p[-1] != 'p') 307 goto fail; 308 p[-1] = '\0'; 309 res = blk_lookup_devt(s, part); 310 if (res) 311 goto done; 312 313 fail: 314 return 0; 315 done: 316 return res; 317 } 318 EXPORT_SYMBOL_GPL(name_to_dev_t); 319 320 static int __init root_dev_setup(char *line) 321 { 322 strlcpy(saved_root_name, line, sizeof(saved_root_name)); 323 return 1; 324 } 325 326 __setup("root=", root_dev_setup); 327 328 static int __init rootwait_setup(char *str) 329 { 330 if (*str) 331 return 0; 332 root_wait = 1; 333 return 1; 334 } 335 336 __setup("rootwait", rootwait_setup); 337 338 static char * __initdata root_mount_data; 339 static int __init root_data_setup(char *str) 340 { 341 root_mount_data = str; 342 return 1; 343 } 344 345 static char * __initdata root_fs_names; 346 static int __init fs_names_setup(char *str) 347 { 348 root_fs_names = str; 349 return 1; 350 } 351 352 static unsigned int __initdata root_delay; 353 static int __init root_delay_setup(char *str) 354 { 355 root_delay = simple_strtoul(str, NULL, 0); 356 return 1; 357 } 358 359 __setup("rootflags=", root_data_setup); 360 __setup("rootfstype=", fs_names_setup); 361 __setup("rootdelay=", root_delay_setup); 362 363 static void __init get_fs_names(char *page) 364 { 365 char *s = page; 366 367 if (root_fs_names) { 368 strcpy(page, root_fs_names); 369 while (*s++) { 370 if (s[-1] == ',') 371 s[-1] = '\0'; 372 } 373 } else { 374 int len = get_filesystem_list(page); 375 char *p, *next; 376 377 page[len] = '\0'; 378 for (p = page-1; p; p = next) { 379 next = strchr(++p, '\n'); 380 if (*p++ != '\t') 381 continue; 382 while ((*s++ = *p++) != '\n') 383 ; 384 s[-1] = '\0'; 385 } 386 } 387 *s = '\0'; 388 } 389 390 static int __init do_mount_root(const char *name, const char *fs, 391 const int flags, const void *data) 392 { 393 struct super_block *s; 394 char *data_page; 395 struct page *p; 396 int ret; 397 398 /* do_mount() requires a full page as fifth argument */ 399 p = alloc_page(GFP_KERNEL); 400 if (!p) 401 return -ENOMEM; 402 403 data_page = page_address(p); 404 strncpy(data_page, data, PAGE_SIZE - 1); 405 406 ret = do_mount(name, "/root", fs, flags, data_page); 407 if (ret) 408 goto out; 409 410 ksys_chdir("/root"); 411 s = current->fs->pwd.dentry->d_sb; 412 ROOT_DEV = s->s_dev; 413 printk(KERN_INFO 414 "VFS: Mounted root (%s filesystem)%s on device %u:%u.\n", 415 s->s_type->name, 416 sb_rdonly(s) ? " readonly" : "", 417 MAJOR(ROOT_DEV), MINOR(ROOT_DEV)); 418 419 out: 420 put_page(p); 421 return ret; 422 } 423 424 void __init mount_block_root(char *name, int flags) 425 { 426 struct page *page = alloc_page(GFP_KERNEL); 427 char *fs_names = page_address(page); 428 char *p; 429 #ifdef CONFIG_BLOCK 430 char b[BDEVNAME_SIZE]; 431 #else 432 const char *b = name; 433 #endif 434 435 get_fs_names(fs_names); 436 retry: 437 for (p = fs_names; *p; p += strlen(p)+1) { 438 int err = do_mount_root(name, p, flags, root_mount_data); 439 switch (err) { 440 case 0: 441 goto out; 442 case -EACCES: 443 case -EINVAL: 444 continue; 445 } 446 /* 447 * Allow the user to distinguish between failed sys_open 448 * and bad superblock on root device. 449 * and give them a list of the available devices 450 */ 451 #ifdef CONFIG_BLOCK 452 __bdevname(ROOT_DEV, b); 453 #endif 454 printk("VFS: Cannot open root device \"%s\" or %s: error %d\n", 455 root_device_name, b, err); 456 printk("Please append a correct \"root=\" boot option; here are the available partitions:\n"); 457 458 printk_all_partitions(); 459 #ifdef CONFIG_DEBUG_BLOCK_EXT_DEVT 460 printk("DEBUG_BLOCK_EXT_DEVT is enabled, you need to specify " 461 "explicit textual name for \"root=\" boot option.\n"); 462 #endif 463 panic("VFS: Unable to mount root fs on %s", b); 464 } 465 if (!(flags & SB_RDONLY)) { 466 flags |= SB_RDONLY; 467 goto retry; 468 } 469 470 printk("List of all partitions:\n"); 471 printk_all_partitions(); 472 printk("No filesystem could mount root, tried: "); 473 for (p = fs_names; *p; p += strlen(p)+1) 474 printk(" %s", p); 475 printk("\n"); 476 #ifdef CONFIG_BLOCK 477 __bdevname(ROOT_DEV, b); 478 #endif 479 panic("VFS: Unable to mount root fs on %s", b); 480 out: 481 put_page(page); 482 } 483 484 #ifdef CONFIG_ROOT_NFS 485 486 #define NFSROOT_TIMEOUT_MIN 5 487 #define NFSROOT_TIMEOUT_MAX 30 488 #define NFSROOT_RETRY_MAX 5 489 490 static int __init mount_nfs_root(void) 491 { 492 char *root_dev, *root_data; 493 unsigned int timeout; 494 int try, err; 495 496 err = nfs_root_data(&root_dev, &root_data); 497 if (err != 0) 498 return 0; 499 500 /* 501 * The server or network may not be ready, so try several 502 * times. Stop after a few tries in case the client wants 503 * to fall back to other boot methods. 504 */ 505 timeout = NFSROOT_TIMEOUT_MIN; 506 for (try = 1; ; try++) { 507 err = do_mount_root(root_dev, "nfs", 508 root_mountflags, root_data); 509 if (err == 0) 510 return 1; 511 if (try > NFSROOT_RETRY_MAX) 512 break; 513 514 /* Wait, in case the server refused us immediately */ 515 ssleep(timeout); 516 timeout <<= 1; 517 if (timeout > NFSROOT_TIMEOUT_MAX) 518 timeout = NFSROOT_TIMEOUT_MAX; 519 } 520 return 0; 521 } 522 #endif 523 524 #ifdef CONFIG_CIFS_ROOT 525 526 extern int cifs_root_data(char **dev, char **opts); 527 528 #define CIFSROOT_TIMEOUT_MIN 5 529 #define CIFSROOT_TIMEOUT_MAX 30 530 #define CIFSROOT_RETRY_MAX 5 531 532 static int __init mount_cifs_root(void) 533 { 534 char *root_dev, *root_data; 535 unsigned int timeout; 536 int try, err; 537 538 err = cifs_root_data(&root_dev, &root_data); 539 if (err != 0) 540 return 0; 541 542 timeout = CIFSROOT_TIMEOUT_MIN; 543 for (try = 1; ; try++) { 544 err = do_mount_root(root_dev, "cifs", root_mountflags, 545 root_data); 546 if (err == 0) 547 return 1; 548 if (try > CIFSROOT_RETRY_MAX) 549 break; 550 551 ssleep(timeout); 552 timeout <<= 1; 553 if (timeout > CIFSROOT_TIMEOUT_MAX) 554 timeout = CIFSROOT_TIMEOUT_MAX; 555 } 556 return 0; 557 } 558 #endif 559 560 #if defined(CONFIG_BLK_DEV_RAM) || defined(CONFIG_BLK_DEV_FD) 561 void __init change_floppy(char *fmt, ...) 562 { 563 struct termios termios; 564 char buf[80]; 565 char c; 566 int fd; 567 va_list args; 568 va_start(args, fmt); 569 vsprintf(buf, fmt, args); 570 va_end(args); 571 fd = ksys_open("/dev/root", O_RDWR | O_NDELAY, 0); 572 if (fd >= 0) { 573 ksys_ioctl(fd, FDEJECT, 0); 574 ksys_close(fd); 575 } 576 printk(KERN_NOTICE "VFS: Insert %s and press ENTER\n", buf); 577 fd = ksys_open("/dev/console", O_RDWR, 0); 578 if (fd >= 0) { 579 ksys_ioctl(fd, TCGETS, (long)&termios); 580 termios.c_lflag &= ~ICANON; 581 ksys_ioctl(fd, TCSETSF, (long)&termios); 582 ksys_read(fd, &c, 1); 583 termios.c_lflag |= ICANON; 584 ksys_ioctl(fd, TCSETSF, (long)&termios); 585 ksys_close(fd); 586 } 587 } 588 #endif 589 590 void __init mount_root(void) 591 { 592 #ifdef CONFIG_ROOT_NFS 593 if (ROOT_DEV == Root_NFS) { 594 if (mount_nfs_root()) 595 return; 596 597 printk(KERN_ERR "VFS: Unable to mount root fs via NFS, trying floppy.\n"); 598 ROOT_DEV = Root_FD0; 599 } 600 #endif 601 #ifdef CONFIG_CIFS_ROOT 602 if (ROOT_DEV == Root_CIFS) { 603 if (mount_cifs_root()) 604 return; 605 606 printk(KERN_ERR "VFS: Unable to mount root fs via SMB, trying floppy.\n"); 607 ROOT_DEV = Root_FD0; 608 } 609 #endif 610 #ifdef CONFIG_BLK_DEV_FD 611 if (MAJOR(ROOT_DEV) == FLOPPY_MAJOR) { 612 /* rd_doload is 2 for a dual initrd/ramload setup */ 613 if (rd_doload==2) { 614 if (rd_load_disk(1)) { 615 ROOT_DEV = Root_RAM1; 616 root_device_name = NULL; 617 } 618 } else 619 change_floppy("root floppy"); 620 } 621 #endif 622 #ifdef CONFIG_BLOCK 623 { 624 int err = create_dev("/dev/root", ROOT_DEV); 625 626 if (err < 0) 627 pr_emerg("Failed to create /dev/root: %d\n", err); 628 mount_block_root("/dev/root", root_mountflags); 629 } 630 #endif 631 } 632 633 /* 634 * Prepare the namespace - decide what/where to mount, load ramdisks, etc. 635 */ 636 void __init prepare_namespace(void) 637 { 638 int is_floppy; 639 640 if (root_delay) { 641 printk(KERN_INFO "Waiting %d sec before mounting root device...\n", 642 root_delay); 643 ssleep(root_delay); 644 } 645 646 /* 647 * wait for the known devices to complete their probing 648 * 649 * Note: this is a potential source of long boot delays. 650 * For example, it is not atypical to wait 5 seconds here 651 * for the touchpad of a laptop to initialize. 652 */ 653 wait_for_device_probe(); 654 655 md_run_setup(); 656 657 if (saved_root_name[0]) { 658 root_device_name = saved_root_name; 659 if (!strncmp(root_device_name, "mtd", 3) || 660 !strncmp(root_device_name, "ubi", 3)) { 661 mount_block_root(root_device_name, root_mountflags); 662 goto out; 663 } 664 ROOT_DEV = name_to_dev_t(root_device_name); 665 if (strncmp(root_device_name, "/dev/", 5) == 0) 666 root_device_name += 5; 667 } 668 669 if (initrd_load()) 670 goto out; 671 672 /* wait for any asynchronous scanning to complete */ 673 if ((ROOT_DEV == 0) && root_wait) { 674 printk(KERN_INFO "Waiting for root device %s...\n", 675 saved_root_name); 676 while (driver_probe_done() != 0 || 677 (ROOT_DEV = name_to_dev_t(saved_root_name)) == 0) 678 msleep(5); 679 async_synchronize_full(); 680 } 681 682 is_floppy = MAJOR(ROOT_DEV) == FLOPPY_MAJOR; 683 684 if (is_floppy && rd_doload && rd_load_disk(0)) 685 ROOT_DEV = Root_RAM0; 686 687 mount_root(); 688 out: 689 devtmpfs_mount(); 690 do_mount(".", "/", NULL, MS_MOVE, NULL); 691 ksys_chroot("."); 692 } 693 694 static bool is_tmpfs; 695 static int rootfs_init_fs_context(struct fs_context *fc) 696 { 697 if (IS_ENABLED(CONFIG_TMPFS) && is_tmpfs) 698 return shmem_init_fs_context(fc); 699 700 return ramfs_init_fs_context(fc); 701 } 702 703 struct file_system_type rootfs_fs_type = { 704 .name = "rootfs", 705 .init_fs_context = rootfs_init_fs_context, 706 .kill_sb = kill_litter_super, 707 }; 708 709 void __init init_rootfs(void) 710 { 711 if (IS_ENABLED(CONFIG_TMPFS) && !saved_root_name[0] && 712 (!root_fs_names || strstr(root_fs_names, "tmpfs"))) 713 is_tmpfs = true; 714 } 715