|  | /* Copyright (c) 2012 The Chromium OS Authors. All rights reserved. | 
|  | * Use of this source code is governed by a BSD-style license that can be | 
|  | * found in the LICENSE file. | 
|  | * | 
|  | * Implements root device discovery via sysfs with optional bells and whistles. | 
|  | */ | 
|  |  | 
|  | #include "rootdev.h" | 
|  |  | 
|  | #include <ctype.h> | 
|  | #include <dirent.h> | 
|  | #include <err.h> | 
|  | #include <errno.h> | 
|  | #include <fcntl.h> | 
|  | #include <stdbool.h> | 
|  | #include <stddef.h> | 
|  | #include <stdio.h> | 
|  | #include <stdlib.h> | 
|  | #include <string.h> | 
|  | #include <sys/ioctl.h> | 
|  | #include <sys/stat.h> | 
|  | #include <sys/sysmacros.h> | 
|  | #include <sys/types.h> | 
|  | #include <sys/vfs.h> | 
|  | #include <unistd.h> | 
|  | #include <linux/btrfs.h> | 
|  | #include <linux/magic.h> | 
|  |  | 
|  | /* | 
|  | * Limit prevents endless looping to find slave. | 
|  | * We currently have at most 2 levels, this allows | 
|  | * for future growth. | 
|  | */ | 
|  | #define MAX_SLAVE_DEPTH 8 | 
|  |  | 
|  | static const char *kDefaultSearchPath = "/sys/block"; | 
|  | static const char *kDefaultDevPath = "/dev"; | 
|  |  | 
|  | /* Encode the root device structuring here for Chromium OS */ | 
|  | static const char kActiveRoot[] = "/dev/ACTIVE_ROOT"; | 
|  | static const char kRootDev[] = "/dev/ROOT"; | 
|  | static const char kRootA[] = "/dev/ROOT0"; | 
|  | static const char kRootB[] = "/dev/ROOT1"; | 
|  |  | 
|  | struct part_config { | 
|  | const char *name; | 
|  | int offset; | 
|  | }; | 
|  |  | 
|  | #define CHROMEOS_PRIMARY_PARTITION 3 | 
|  | static const struct part_config kPrimaryPart[] = { { kRootA,    0 }, | 
|  | { kRootDev, -3 }, | 
|  | { kRootB,    2 } }; | 
|  | #define CHROMEOS_SECONDARY_PARTITION 5 | 
|  | static const struct part_config kSecondaryPart[] = { { kRootB,    0 }, | 
|  | { kRootDev, -5 }, | 
|  | { kRootA,   -2 } }; | 
|  |  | 
|  | /* The number of entries in a part_config so we could add RootC easily. */ | 
|  | static const int kPartitionEntries = 3; | 
|  |  | 
|  | /* Converts a file of %u:%u -> dev_t. */ | 
|  | static dev_t devt_from_file(const char *file) { | 
|  | char candidate[10];  /* TODO(wad) system-provided constant? */ | 
|  | ssize_t bytes = 0; | 
|  | unsigned int major_num = 0; | 
|  | unsigned int minor_num = 0; | 
|  | dev_t dev = 0; | 
|  | int fd = -1; | 
|  |  | 
|  | /* Never hang. Either get the data or return 0. */ | 
|  | fd = open(file, O_NONBLOCK | O_RDONLY); | 
|  | if (fd < 0) | 
|  | return 0; | 
|  | bytes = read(fd, candidate, sizeof(candidate)); | 
|  | close(fd); | 
|  |  | 
|  | /* 0:0 should be considered the minimum size. */ | 
|  | if (bytes < 3) | 
|  | return 0; | 
|  | candidate[bytes] = 0; | 
|  | if (sscanf(candidate, "%u:%u", &major_num, &minor_num) == 2) { | 
|  | /* candidate's size artificially limits the size of the converted | 
|  | * %u to safely convert to a signed int. */ | 
|  | dev = makedev(major_num, minor_num); | 
|  | } | 
|  | return dev; | 
|  | } | 
|  |  | 
|  | /* Walks sysfs and recurses into any directory/link that represents | 
|  | * a block device to find sub-devices (partitions) for dev. | 
|  | * If dev == 0, the name fo the first device in the directory will be returned. | 
|  | * Returns the device's name in "name" */ | 
|  | static int match_sysfs_device(char *name, size_t name_len, | 
|  | const char *basedir, dev_t *dev, int depth) { | 
|  | int found = -1; | 
|  | size_t basedir_len; | 
|  | DIR *dirp = NULL; | 
|  | struct dirent *entry = NULL; | 
|  | char *working_path = NULL; | 
|  | long working_path_size = 0; | 
|  |  | 
|  | if (!name || !name_len || !basedir || !dev) { | 
|  | warnx("match_sysfs_device: invalid arguments supplied"); | 
|  | return -1; | 
|  | } | 
|  | basedir_len = strlen(basedir); | 
|  | if (!basedir_len) { | 
|  | warnx("match_sysfs_device: basedir must not be empty"); | 
|  | return -1; | 
|  | } | 
|  |  | 
|  | errno = 0; | 
|  | dirp = opendir(basedir); | 
|  | if (!dirp) { | 
|  | /* Don't complain if the directory doesn't exist. */ | 
|  | if (errno != ENOENT) | 
|  | warn("match_sysfs_device:opendir(%s)", basedir); | 
|  | return found; | 
|  | } | 
|  |  | 
|  | /* Grab a platform appropriate path to work with. | 
|  | * Ideally, this won't vary under sys/block. */ | 
|  | working_path_size = pathconf(basedir, _PC_NAME_MAX) + 1; | 
|  | /* Fallback to PATH_MAX on any pathconf error. */ | 
|  | if (working_path_size < 0) | 
|  | working_path_size = PATH_MAX; | 
|  |  | 
|  | working_path = malloc(working_path_size); | 
|  | if (!working_path) { | 
|  | warn("malloc(dirent)"); | 
|  | closedir(dirp); | 
|  | return found; | 
|  | } | 
|  |  | 
|  | /* Allocate a properly sized entry. */ | 
|  | entry = malloc(offsetof(struct dirent, d_name) + working_path_size); | 
|  | if (!entry) { | 
|  | warn("malloc(dirent)"); | 
|  | free(working_path); | 
|  | closedir(dirp); | 
|  | return found; | 
|  | } | 
|  |  | 
|  | while ((entry = readdir(dirp))) { | 
|  | size_t candidate_len = strlen(entry->d_name); | 
|  | size_t path_len = 0; | 
|  | dev_t found_devt = 0; | 
|  | /* Ignore the usual */ | 
|  | if (!strcmp(entry->d_name, ".") || !strcmp(entry->d_name, "..")) | 
|  | continue; | 
|  | /* TODO(wad) determine how to best bubble up this case. */ | 
|  | if (candidate_len > name_len) | 
|  | continue; | 
|  | /* Only traverse directories or symlinks (to directories ideally) */ | 
|  | switch (entry->d_type) { | 
|  | case DT_UNKNOWN: | 
|  | case DT_DIR: | 
|  | case DT_LNK: | 
|  | break; | 
|  | default: | 
|  | continue; | 
|  | } | 
|  | /* Determine path to block device number */ | 
|  | path_len = snprintf(working_path, working_path_size, "%s/%s/dev", | 
|  | basedir, entry->d_name); | 
|  | /* Ignore if truncation occurs. */ | 
|  | if (path_len != candidate_len + basedir_len + 5) | 
|  | continue; | 
|  |  | 
|  | found_devt = devt_from_file(working_path); | 
|  | /* *dev == 0 is a wildcard. */ | 
|  | if (!*dev || found_devt == *dev) { | 
|  | snprintf(name, name_len, "%s", entry->d_name); | 
|  | *dev = found_devt; | 
|  | found = 1; | 
|  | break; | 
|  | } | 
|  |  | 
|  | /* Prevent infinite recursion on symlink loops by limiting depth. */ | 
|  | if (depth > 5) | 
|  | break; | 
|  |  | 
|  | /* Recurse one level for devices that may have a matching partition. */ | 
|  | if (major(found_devt) == major(*dev) && minor(*dev) > minor(found_devt)) { | 
|  | sprintf(working_path, "%s/%s", basedir, entry->d_name); | 
|  | found = match_sysfs_device(name, name_len, working_path, dev, depth + 1); | 
|  | if (found > 0) | 
|  | break; | 
|  | } | 
|  | } | 
|  |  | 
|  | free(working_path); | 
|  | closedir(dirp); | 
|  | return found; | 
|  | } | 
|  |  | 
|  | const char *rootdev_get_partition(const char *dst, size_t len) { | 
|  | const char *end = dst + strnlen(dst, len); | 
|  | const char *part = end - 1; | 
|  | if (!len) | 
|  | return NULL; | 
|  |  | 
|  | if (!isdigit(*part--)) | 
|  | return NULL; | 
|  |  | 
|  | while (part > dst && isdigit(*part)) part--; | 
|  | part++; | 
|  |  | 
|  | if (part >= end) | 
|  | return NULL; | 
|  |  | 
|  | return part; | 
|  | } | 
|  |  | 
|  | void rootdev_strip_partition(char *dst, size_t len) { | 
|  | char *part = (char *)rootdev_get_partition(dst, len); | 
|  | if (!part) | 
|  | return; | 
|  |  | 
|  | /* For devices matching dm-NN, the digits are not a partition. */ | 
|  | if (*(part - 1) == '-') | 
|  | return; | 
|  |  | 
|  | /* For devices that end with a digit, the kernel uses a 'p' | 
|  | * as a separator. E.g., mmcblk1p2 and loop0p1, but not loop0. */ | 
|  | if (*(part - 1) == 'p') { | 
|  | part--; | 
|  | if (strncmp(dst, "loop", 4) == 0 && dst + 3 == part) | 
|  | return; | 
|  | } | 
|  | *part = '\0'; | 
|  | } | 
|  |  | 
|  | int rootdev_symlink_active(const char *path) { | 
|  | int ret = 0; | 
|  | /* Don't overwrite an existing link. */ | 
|  | errno = 0; | 
|  | if ((symlink(path, kActiveRoot)) && errno != EEXIST) { | 
|  | warn("failed to symlink %s -> %s", kActiveRoot, path); | 
|  | ret = -1; | 
|  | } | 
|  | return ret; | 
|  | } | 
|  |  | 
|  | int rootdev_get_device(char *dst, size_t size, dev_t dev, | 
|  | const char *search) { | 
|  | struct stat active_root_statbuf; | 
|  |  | 
|  | if (search == NULL) | 
|  | search = kDefaultSearchPath; | 
|  |  | 
|  | /* Check if the -s symlink exists. */ | 
|  | if ((stat(kActiveRoot, &active_root_statbuf) == 0) && | 
|  | active_root_statbuf.st_rdev == dev) { | 
|  | /* Note, if the link is not fully qualified, this won't be | 
|  | * either. */ | 
|  | ssize_t len = readlink(kActiveRoot, dst, PATH_MAX); | 
|  | if (len > 0) { | 
|  | dst[len] = 0; | 
|  | return 0; | 
|  | } | 
|  | /* If readlink fails or is empty, fall through */ | 
|  | } | 
|  |  | 
|  | snprintf(dst, size, "%s", search); | 
|  | if (match_sysfs_device(dst, size, dst, &dev, 0) <= 0) { | 
|  | fprintf (stderr, "unable to find match\n"); | 
|  | return 1; | 
|  | } | 
|  |  | 
|  | return 0; | 
|  | } | 
|  |  | 
|  | /* | 
|  | * rootdev_get_device_slave returns results in slave which | 
|  | * may be the original device or the name of the slave. | 
|  | * | 
|  | * Because slave and device may point to the same data, | 
|  | * must be careful how they are handled because slave | 
|  | * is modified (can't use snprintf). | 
|  | */ | 
|  | void rootdev_get_device_slave(char *slave, size_t size, dev_t *dev, | 
|  | const char *device, const char *search) { | 
|  | char dst[PATH_MAX]; | 
|  | int len = 0; | 
|  | int i; | 
|  |  | 
|  | if (search == NULL) | 
|  | search = kDefaultSearchPath; | 
|  |  | 
|  | /* | 
|  | * With stacked device mappers, we have to chain through all the levels | 
|  | * and find the last device. For example, verity can be stacked on bootcache | 
|  | * that is stacked on a disk partition. | 
|  | */ | 
|  | if (slave != device) | 
|  | strncpy(slave, device, size); | 
|  | slave[size - 1] = '\0'; | 
|  | for (i = 0; i < MAX_SLAVE_DEPTH; i++) { | 
|  | len = snprintf(dst, sizeof(dst), "%s/%s/slaves", search, slave); | 
|  | if (len != strlen(device) + strlen(search) + 8) { | 
|  | warnx("rootdev_get_device_slave: device name too long"); | 
|  | return; | 
|  | } | 
|  | *dev = 0; | 
|  | if (match_sysfs_device(slave, size, dst, dev, 0) <= 0) { | 
|  | return; | 
|  | } | 
|  | } | 
|  | warnx("slave depth greater than %d at %s", i, slave); | 
|  | } | 
|  |  | 
|  | int rootdev_create_devices(const char *name, dev_t dev, bool symlink) { | 
|  | int ret = 0; | 
|  | unsigned int major_num = major(dev); | 
|  | unsigned int minor_num = minor(dev); | 
|  | int i; | 
|  | const struct part_config *config; | 
|  | const char *part_s = rootdev_get_partition(name, strlen(name)); | 
|  |  | 
|  | if (part_s == NULL) { | 
|  | warnx("create_devices: unable to determine partition"); | 
|  | return -1; | 
|  | } | 
|  |  | 
|  | switch (atoi(part_s)) { | 
|  | case CHROMEOS_PRIMARY_PARTITION: | 
|  | config = kPrimaryPart; | 
|  | break; | 
|  | case CHROMEOS_SECONDARY_PARTITION: | 
|  | config = kSecondaryPart; | 
|  | break; | 
|  | default: | 
|  | warnx("create_devices: unable to determine partition: %s", | 
|  | part_s); | 
|  | return -1; | 
|  | } | 
|  |  | 
|  | for (i = 0; i < kPartitionEntries; ++i) { | 
|  | dev = makedev(major_num, minor_num + config[i].offset); | 
|  | errno = 0; | 
|  | if (mknod(config[i].name, | 
|  | S_IFBLK | S_IRUSR | S_IWUSR | S_IRGRP | S_IROTH, | 
|  | dev) && errno != EEXIST) { | 
|  | warn("failed to create %s", config[i].name); | 
|  | return -1; | 
|  | } | 
|  | } | 
|  |  | 
|  | if (symlink) | 
|  | ret = rootdev_symlink_active(config[0].name); | 
|  | return ret; | 
|  | } | 
|  |  | 
|  | int rootdev_get_path(char *path, size_t size, const char *device, | 
|  | dev_t dev, const char *dev_path) { | 
|  | int path_len; | 
|  | struct stat dev_statbuf; | 
|  |  | 
|  | if (!dev_path) | 
|  | dev_path = kDefaultDevPath; | 
|  |  | 
|  | if (!path || !size || !device) | 
|  | return -1; | 
|  |  | 
|  | path_len = snprintf(path, size, "%s/%s", dev_path, device); | 
|  | if (path_len != strlen(dev_path) + 1 + strlen(device)) | 
|  | return -1; | 
|  |  | 
|  | if (stat(path, &dev_statbuf) != 0) | 
|  | return 1; | 
|  |  | 
|  | if (dev && dev != dev_statbuf.st_rdev) | 
|  | return 2; | 
|  |  | 
|  | return 0; | 
|  | } | 
|  |  | 
|  | static int get_rootdev_btrfs(char *path, size_t size, const char *mount_path) { | 
|  | const char *di_path; | 
|  |  | 
|  | /* Open the mount point path */ | 
|  | int fd = open(mount_path, O_RDONLY | O_CLOEXEC); | 
|  | if (fd == -1) { | 
|  | return -1; | 
|  | } | 
|  | /* Create space to hold the ioctl dev info. */ | 
|  | struct btrfs_ioctl_dev_info_args di_args; | 
|  | /* Since we use always use single device in chromebook rootfs, | 
|  | * the device id for this device is always 1. */ | 
|  | di_args.devid = 1; | 
|  | /* Read the ioctl device info (btrfs). */ | 
|  | if (ioctl(fd, BTRFS_IOC_DEV_INFO, &di_args) != 0) { | 
|  | close(fd); | 
|  | return -1; | 
|  | } | 
|  | close(fd); | 
|  |  | 
|  | di_path = (const char *)di_args.path; | 
|  | /* Try to access the device at di_args->path to verify its existence. */ | 
|  | if (access((char *)di_path, F_OK) != 0) { | 
|  | return -1; | 
|  | } | 
|  | if (strlen(di_path) >= size) | 
|  | return -1; | 
|  | strcpy(path, di_path); | 
|  | return 0; | 
|  | } | 
|  |  | 
|  | int rootdev_wrapper(char *path, size_t size, | 
|  | bool full, bool strip, | 
|  | dev_t *dev, | 
|  | const char *mount_path, | 
|  | const char *search, const char *dev_path) { | 
|  | int res = 0; | 
|  | char devname[PATH_MAX]; | 
|  | struct statfs mount_statfs; | 
|  |  | 
|  | if (!search) | 
|  | search = kDefaultSearchPath; | 
|  | if (!dev_path) | 
|  | dev_path = kDefaultDevPath; | 
|  | if (!dev) | 
|  | return -1; | 
|  | if (statfs(mount_path, &mount_statfs) == 0) { | 
|  | if (mount_statfs.f_type == BTRFS_SUPER_MAGIC) { | 
|  | /* BTRFS uses virtual device id which is different from actual | 
|  | * device id. So we zero-out dev_t indicating that dev_t is not | 
|  | * a valid device id. */ | 
|  | *dev = 0; | 
|  | return get_rootdev_btrfs(path, size, mount_path); | 
|  | } | 
|  | } | 
|  |  | 
|  | res = rootdev_get_device(devname, sizeof(devname), *dev, search); | 
|  | if (res != 0) | 
|  | return res; | 
|  |  | 
|  | if (full) | 
|  | rootdev_get_device_slave(devname, sizeof(devname), dev, devname, | 
|  | search); | 
|  |  | 
|  | /* TODO(wad) we should really just track the block dev, partition number, and | 
|  | *           dev path.  When we rewrite this, we can track all the sysfs info | 
|  | *           in the class. */ | 
|  | if (strip) { | 
|  | /* When we strip the partition, we don't want get_path to return non-zero | 
|  | * because of dev mismatch.  Passing in 0 tells it to not test. */ | 
|  | *dev = 0; | 
|  | rootdev_strip_partition(devname, size); | 
|  | } | 
|  |  | 
|  | res = rootdev_get_path(path, size, devname, *dev, dev_path); | 
|  |  | 
|  | return res; | 
|  | } | 
|  |  | 
|  | int rootdev(char *path, size_t size, bool full, bool strip) { | 
|  | struct stat root_statbuf; | 
|  | dev_t _root_dev, *root_dev = &_root_dev; | 
|  |  | 
|  | /* Yields the containing dev_t in st_dev. */ | 
|  | if (stat("/", &root_statbuf) != 0) | 
|  | return -1; | 
|  |  | 
|  | /* Some ABIs (like mips o32) are broken and the st_dev field isn't actually | 
|  | * a dev_t.  In that case, pass a pointer to a local dev_t who we took care | 
|  | * of truncating the value into.  On sane arches, gcc can optimize this to | 
|  | * the same code, so should only be a penalty when the ABI is broken. */ | 
|  | if (sizeof(root_statbuf.st_dev) == sizeof(*root_dev)) { | 
|  | /* Cast is OK since we verified size here. */ | 
|  | root_dev = (dev_t *)&root_statbuf.st_dev; | 
|  | } else { | 
|  | *root_dev = root_statbuf.st_dev; | 
|  | } | 
|  |  | 
|  | return rootdev_wrapper(path, | 
|  | size, | 
|  | full, | 
|  | strip, | 
|  | root_dev, | 
|  | "/", | 
|  | NULL,  /* default /sys dir */ | 
|  | NULL);  /* default /dev dir */ | 
|  | } |