/* SPDX-License-Identifier: LGPL-2.1-or-later */ #include #include #include #include #include #include #include #include "base-filesystem.h" #include "chase.h" #include "fd-util.h" #include "initrd-util.h" #include "log.h" #include "missing_syscall.h" #include "mkdir-label.h" #include "mount-util.h" #include "mountpoint-util.h" #include "path-util.h" #include "rm-rf.h" #include "stdio-util.h" #include "string-util.h" #include "strv.h" #include "switch-root.h" #include "user-util.h" int switch_root(const char *new_root, const char *old_root_after, /* path below the new root, where to place the old root after the transition; may be NULL to unmount it */ unsigned long mount_flags) { /* MS_MOVE or MS_BIND used for /proc/, /dev/, /run/, /sys/ */ _cleanup_close_ int old_root_fd = -EBADF, new_root_fd = -EBADF; _cleanup_free_ char *resolved_old_root_after = NULL; int r, istmp; assert(new_root); assert(IN_SET(mount_flags, MS_MOVE, MS_BIND)); if (path_equal(new_root, "/")) return 0; /* Check if we shall remove the contents of the old root */ old_root_fd = open("/", O_DIRECTORY|O_CLOEXEC); if (old_root_fd < 0) return log_error_errno(errno, "Failed to open root directory: %m"); istmp = fd_is_temporary_fs(old_root_fd); if (istmp < 0) return log_error_errno(istmp, "Failed to stat root directory: %m"); if (istmp > 0) log_debug("Root directory is on tmpfs, will do cleanup later."); new_root_fd = open(new_root, O_DIRECTORY|O_CLOEXEC); if (new_root_fd < 0) return log_error_errno(errno, "Failed to open target directory '%s': %m", new_root); if (old_root_after) { /* Determine where we shall place the old root after the transition */ r = chase(old_root_after, new_root, CHASE_PREFIX_ROOT|CHASE_NONEXISTENT, &resolved_old_root_after, NULL); if (r < 0) return log_error_errno(r, "Failed to resolve %s/%s: %m", new_root, old_root_after); if (r == 0) /* Doesn't exist yet. Let's create it */ (void) mkdir_p_label(resolved_old_root_after, 0755); } /* Work-around for kernel design: the kernel refuses MS_MOVE if any file systems are mounted * MS_SHARED. Hence remount them MS_PRIVATE here as a work-around. * * https://bugzilla.redhat.com/show_bug.cgi?id=847418 */ if (mount(NULL, "/", NULL, MS_REC|MS_PRIVATE, NULL) < 0) return log_error_errno(errno, "Failed to set \"/\" mount propagation to private: %m"); FOREACH_STRING(path, "/sys", "/dev", "/run", "/proc") { _cleanup_free_ char *chased = NULL; r = chase(path, new_root, CHASE_PREFIX_ROOT|CHASE_NONEXISTENT, &chased, NULL); if (r < 0) return log_error_errno(r, "Failed to resolve %s/%s: %m", new_root, path); if (r > 0) { /* Already exists. Let's see if it is a mount point already. */ r = path_is_mount_point(chased, NULL, 0); if (r < 0) return log_error_errno(r, "Failed to determine whether %s is a mount point: %m", chased); if (r > 0) /* If it is already mounted, then do nothing */ continue; } else /* Doesn't exist yet? */ (void) mkdir_p_label(chased, 0755); if (mount(path, chased, NULL, mount_flags, NULL) < 0) return log_error_errno(errno, "Failed to mount %s to %s: %m", path, chased); } /* Do not fail if base_filesystem_create() fails. Not all switch roots are like base_filesystem_create() wants * them to look like. They might even boot, if they are RO and don't have the FS layout. Just ignore the error * and switch_root() nevertheless. */ (void) base_filesystem_create_fd(new_root_fd, new_root, UID_INVALID, GID_INVALID); if (fchdir(new_root_fd) < 0) return log_error_errno(errno, "Failed to change directory to %s: %m", new_root); /* We first try a pivot_root() so that we can umount the old root dir. In many cases (i.e. where rootfs is /), * that's not possible however, and hence we simply overmount root */ if (resolved_old_root_after) r = RET_NERRNO(pivot_root(".", resolved_old_root_after)); else { r = RET_NERRNO(pivot_root(".", ".")); if (r >= 0) { /* Now unmount the upper of the two stacked file systems */ if (umount2(".", MNT_DETACH) < 0) return log_error_errno(errno, "Failed to unmount the old root: %m"); } } if (r < 0) { log_debug_errno(r, "Pivoting root file system failed, moving mounts instead: %m"); if (mount(".", "/", NULL, MS_MOVE, NULL) < 0) return log_error_errno(errno, "Failed to move %s to /: %m", new_root); if (chroot(".") < 0) return log_error_errno(errno, "Failed to change root: %m"); if (chdir(".") < 0) return log_error_errno(errno, "Failed to change directory: %m"); } if (istmp) { struct stat rb; if (fstat(old_root_fd, &rb) < 0) return log_error_errno(errno, "Failed to stat old root directory: %m"); /* Note: the below won't operate on non-memory file systems (i.e. only on tmpfs, ramfs), and * it will stop at mount boundaries */ (void) rm_rf_children(TAKE_FD(old_root_fd), 0, &rb); /* takes possession of the dir fd, even on failure */ } return 0; }