#include #include #include #include #include #include #include #include #include //#define VFS_DEBUG static VFS* s_the; VFS& VFS::the() { ASSERT(s_the); return *s_the; } VFS::VFS() { #ifdef VFS_DEBUG kprintf("VFS: Constructing VFS\n"); #endif s_the = this; } VFS::~VFS() { } InodeIdentifier VFS::root_inode_id() const { ASSERT(m_root_inode); return m_root_inode->identifier(); } bool VFS::mount(Retained&& file_system, StringView path) { auto result = resolve_path(path, root_custody()); if (result.is_error()) { kprintf("VFS: mount can't resolve mount point '%s'\n", path.characters()); return false; } auto& inode = result.value()->inode(); kprintf("VFS: mounting %s{%p} at %s (inode: %u)\n", file_system->class_name(), file_system.ptr(), path.characters(), inode.index()); // FIXME: check that this is not already a mount point auto mount = make(*result.value(), move(file_system)); m_mounts.append(move(mount)); result.value()->did_mount_on({}); return true; } bool VFS::mount_root(Retained&& file_system) { if (m_root_inode) { kprintf("VFS: mount_root can't mount another root\n"); return false; } auto mount = make(nullptr, move(file_system)); auto root_inode_id = mount->guest().fs()->root_inode(); auto root_inode = mount->guest().fs()->get_inode(root_inode_id); if (!root_inode->is_directory()) { kprintf("VFS: root inode (%02u:%08u) for / is not a directory :(\n", root_inode_id.fsid(), root_inode_id.index()); return false; } m_root_inode = move(root_inode); kprintf("VFS: mounted root on %s{%p}\n", m_root_inode->fs().class_name(), &m_root_inode->fs()); m_mounts.append(move(mount)); return true; } auto VFS::find_mount_for_host(InodeIdentifier inode) -> Mount* { for (auto& mount : m_mounts) { if (mount->host() == inode) return mount.ptr(); } return nullptr; } auto VFS::find_mount_for_guest(InodeIdentifier inode) -> Mount* { for (auto& mount : m_mounts) { if (mount->guest() == inode) return mount.ptr(); } return nullptr; } bool VFS::is_vfs_root(InodeIdentifier inode) const { return inode == root_inode_id(); } void VFS::traverse_directory_inode(Inode& dir_inode, Function callback) { dir_inode.traverse_as_directory([&](const FS::DirectoryEntry& entry) { InodeIdentifier resolved_inode; if (auto mount = find_mount_for_host(entry.inode)) resolved_inode = mount->guest(); else resolved_inode = entry.inode; if (dir_inode.identifier().is_root_inode() && !is_vfs_root(dir_inode.identifier()) && !strcmp(entry.name, "..")) { auto mount = find_mount_for_guest(entry.inode); ASSERT(mount); resolved_inode = mount->host(); } callback(FS::DirectoryEntry(entry.name, entry.name_length, resolved_inode, entry.file_type)); return true; }); } KResult VFS::utime(StringView path, Custody& base, time_t atime, time_t mtime) { auto descriptor_or_error = VFS::the().open(move(path), 0, 0, base); if (descriptor_or_error.is_error()) return descriptor_or_error.error(); auto& inode = *descriptor_or_error.value()->inode(); if (inode.fs().is_readonly()) return KResult(-EROFS); if (inode.metadata().uid != current->process().euid()) return KResult(-EACCES); int error = inode.set_atime(atime); if (error) return KResult(error); error = inode.set_mtime(mtime); if (error) return KResult(error); return KSuccess; } KResult VFS::stat(StringView path, int options, Custody& base, struct stat& statbuf) { auto custody_or_error = resolve_path(path, base, nullptr, options); if (custody_or_error.is_error()) return custody_or_error.error(); return custody_or_error.value()->inode().metadata().stat(statbuf); } KResultOr> VFS::open(StringView path, int options, mode_t mode, Custody& base) { RetainPtr parent_custody; auto custody_or_error = resolve_path(path, base, &parent_custody, options); if (options & O_CREAT) { if (!parent_custody) return KResult(-ENOENT); if (custody_or_error.is_error()) { if (custody_or_error.error() != -ENOENT) return custody_or_error.error(); return create(path, options, mode, *parent_custody); } if (options & O_EXCL) return KResult(-EEXIST); } if (custody_or_error.is_error()) return custody_or_error.error(); auto& custody = *custody_or_error.value(); auto& inode = custody.inode(); auto metadata = inode.metadata(); bool should_truncate_file = false; // NOTE: Read permission is a bit weird, since O_RDONLY == 0, // so we check if (NOT write_only OR read_and_write) if (!(options & O_WRONLY) || (options & O_RDWR)) { if (!metadata.may_read(current->process())) return KResult(-EACCES); } if ((options & O_WRONLY) || (options & O_RDWR)) { if (!metadata.may_write(current->process())) return KResult(-EACCES); if (metadata.is_directory()) return KResult(-EISDIR); should_truncate_file = options & O_TRUNC; } if (metadata.is_device()) { auto it = m_devices.find(encoded_device(metadata.major_device, metadata.minor_device)); if (it == m_devices.end()) { return KResult(-ENODEV); } auto descriptor_or_error = (*it).value->open(options); if (descriptor_or_error.is_error()) return descriptor_or_error.error(); descriptor_or_error.value()->set_original_inode({}, inode); return descriptor_or_error; } if (should_truncate_file) inode.truncate(0); return FileDescription::create(custody); } KResult VFS::mknod(StringView path, mode_t mode, dev_t dev, Custody& base) { if (!is_regular_file(mode) && !is_block_device(mode) && !is_character_device(mode) && !is_fifo(mode) && !is_socket(mode)) return KResult(-EINVAL); RetainPtr parent_custody; auto existing_file_or_error = resolve_path(path, base, &parent_custody); if (!existing_file_or_error.is_error()) return KResult(-EEXIST); if (!parent_custody) return KResult(-ENOENT); if (existing_file_or_error.error() != -ENOENT) return existing_file_or_error.error(); auto& parent_inode = parent_custody->inode(); if (!parent_inode.metadata().may_write(current->process())) return KResult(-EACCES); FileSystemPath p(path); dbgprintf("VFS::mknod: '%s' mode=%o dev=%u in %u:%u\n", p.basename().characters(), mode, dev, parent_inode.fsid(), parent_inode.index()); int error; auto new_file = parent_inode.fs().create_inode(parent_inode.identifier(), p.basename(), mode, 0, dev, error); if (!new_file) return KResult(error); return KSuccess; } KResultOr> VFS::create(StringView path, int options, mode_t mode, Custody& parent_custody) { (void)options; if (!is_socket(mode) && !is_fifo(mode) && !is_block_device(mode) && !is_character_device(mode)) { // Turn it into a regular file. (This feels rather hackish.) mode |= 0100000; } auto& parent_inode = parent_custody.inode(); if (!parent_inode.metadata().may_write(current->process())) return KResult(-EACCES); FileSystemPath p(path); dbgprintf("VFS::create_file: '%s' in %u:%u\n", p.basename().characters(), parent_inode.fsid(), parent_inode.index()); int error; auto new_file = parent_inode.fs().create_inode(parent_inode.identifier(), p.basename(), mode, 0, 0, error); if (!new_file) return KResult(error); auto new_custody = Custody::create(&parent_custody, p.basename(), *new_file); return FileDescription::create(*new_custody); } KResult VFS::mkdir(StringView path, mode_t mode, Custody& base) { RetainPtr parent_custody; auto result = resolve_path(path, base, &parent_custody); if (!result.is_error()) return KResult(-EEXIST); if (!parent_custody) return KResult(-ENOENT); if (result.error() != -ENOENT) return result.error(); auto& parent_inode = parent_custody->inode(); if (!parent_inode.metadata().may_write(current->process())) return KResult(-EACCES); FileSystemPath p(path); dbgprintf("VFS::mkdir: '%s' in %u:%u\n", p.basename().characters(), parent_inode.fsid(), parent_inode.index()); int error; auto new_dir = parent_inode.fs().create_directory(parent_inode.identifier(), p.basename(), mode, error); if (new_dir) return KSuccess; return KResult(error); } KResult VFS::access(StringView path, int mode, Custody& base) { auto custody_or_error = resolve_path(path, base); if (custody_or_error.is_error()) return custody_or_error.error(); auto& custody = *custody_or_error.value(); auto& inode = custody.inode(); auto metadata = inode.metadata(); if (mode & R_OK) { if (!metadata.may_read(current->process())) return KResult(-EACCES); } if (mode & W_OK) { if (!metadata.may_write(current->process())) return KResult(-EACCES); } if (mode & X_OK) { if (!metadata.may_execute(current->process())) return KResult(-EACCES); } return KSuccess; } KResultOr> VFS::open_directory(StringView path, Custody& base) { auto inode_or_error = resolve_path(path, base); if (inode_or_error.is_error()) return inode_or_error.error(); auto& custody = *inode_or_error.value(); auto& inode = custody.inode(); if (!inode.is_directory()) return KResult(-ENOTDIR); if (!inode.metadata().may_execute(current->process())) return KResult(-EACCES); return custody; } KResult VFS::chmod(Inode& inode, mode_t mode) { if (inode.fs().is_readonly()) return KResult(-EROFS); if (current->process().euid() != inode.metadata().uid && !current->process().is_superuser()) return KResult(-EPERM); // Only change the permission bits. mode = (inode.mode() & ~04777u) | (mode & 04777u); return inode.chmod(mode); } KResult VFS::chmod(StringView path, mode_t mode, Custody& base) { auto custody_or_error = resolve_path(path, base); if (custody_or_error.is_error()) return custody_or_error.error(); auto& custody = *custody_or_error.value(); auto& inode = custody.inode(); return chmod(inode, mode); } KResult VFS::rename(StringView old_path, StringView new_path, Custody& base) { RetainPtr old_parent_custody; auto old_custody_or_error = resolve_path(old_path, base, &old_parent_custody); if (old_custody_or_error.is_error()) return old_custody_or_error.error(); auto& old_custody = *old_custody_or_error.value(); auto& old_inode = old_custody.inode(); RetainPtr new_parent_custody; auto new_custody_or_error = resolve_path(new_path, base, &new_parent_custody); if (new_custody_or_error.is_error()) { if (new_custody_or_error.error() != -ENOENT) return new_custody_or_error.error(); } auto& old_parent_inode = old_parent_custody->inode(); auto& new_parent_inode = new_parent_custody->inode(); if (!new_parent_inode.metadata().may_write(current->process())) return KResult(-EACCES); if (!old_parent_inode.metadata().may_write(current->process())) return KResult(-EACCES); if (old_parent_inode.metadata().is_sticky()) { if (!current->process().is_superuser() && old_inode.metadata().uid != current->process().euid()) return KResult(-EACCES); } auto new_basename = FileSystemPath(new_path).basename(); if (!new_custody_or_error.is_error()) { auto& new_custody = *new_custody_or_error.value(); auto& new_inode = new_custody.inode(); // FIXME: Is this really correct? Check what other systems do. if (&new_inode == &old_inode) return KSuccess; if (new_parent_inode.metadata().is_sticky()) { if (!current->process().is_superuser() && new_inode.metadata().uid != current->process().euid()) return KResult(-EACCES); } if (new_inode.is_directory() && !old_inode.is_directory()) return KResult(-EISDIR); auto result = new_parent_inode.remove_child(new_basename); if (result.is_error()) return result; new_custody.did_delete({}); } auto result = new_parent_inode.add_child(old_inode.identifier(), new_basename, old_inode.mode()); if (result.is_error()) return result; result = old_parent_inode.remove_child(FileSystemPath(old_path).basename()); if (result.is_error()) return result; old_custody.did_rename({}, new_basename); return KSuccess; } KResult VFS::chown(Inode& inode, uid_t a_uid, gid_t a_gid) { if (inode.fs().is_readonly()) return KResult(-EROFS); auto metadata = inode.metadata(); if (current->process().euid() != metadata.uid && !current->process().is_superuser()) return KResult(-EPERM); uid_t new_uid = metadata.uid; gid_t new_gid = metadata.gid; if (a_uid != (uid_t)-1) { if (current->process().euid() != a_uid && !current->process().is_superuser()) return KResult(-EPERM); new_uid = a_uid; } if (a_gid != (gid_t)-1) { if (!current->process().in_group(a_gid) && !current->process().is_superuser()) return KResult(-EPERM); new_gid = a_gid; } dbgprintf("VFS::chown(): inode %u:%u <- uid:%d, gid:%d\n", inode.fsid(), inode.index(), new_uid, new_gid); return inode.chown(new_uid, new_gid); } KResult VFS::chown(StringView path, uid_t a_uid, gid_t a_gid, Custody& base) { auto custody_or_error = resolve_path(path, base); if (custody_or_error.is_error()) return custody_or_error.error(); auto& custody = *custody_or_error.value(); auto& inode = custody.inode(); return chown(inode, a_uid, a_gid); } KResult VFS::link(StringView old_path, StringView new_path, Custody& base) { auto old_custody_or_error = resolve_path(old_path, base); if (old_custody_or_error.is_error()) return old_custody_or_error.error(); auto& old_custody = *old_custody_or_error.value(); auto& old_inode = old_custody.inode(); RetainPtr parent_custody; auto new_custody_or_error = resolve_path(new_path, base, &parent_custody); if (!new_custody_or_error.is_error()) return KResult(-EEXIST); if (!parent_custody) return KResult(-ENOENT); auto& parent_inode = parent_custody->inode(); if (parent_inode.fsid() != old_inode.fsid()) return KResult(-EXDEV); if (parent_inode.fs().is_readonly()) return KResult(-EROFS); if (!parent_inode.metadata().may_write(current->process())) return KResult(-EACCES); return parent_inode.add_child(old_inode.identifier(), FileSystemPath(new_path).basename(), old_inode.mode()); } KResult VFS::unlink(StringView path, Custody& base) { RetainPtr parent_custody; auto custody_or_error = resolve_path(path, base, &parent_custody); if (custody_or_error.is_error()) return custody_or_error.error(); auto& custody = *custody_or_error.value(); auto& inode = custody.inode(); if (inode.is_directory()) return KResult(-EISDIR); auto& parent_inode = parent_custody->inode(); if (!parent_inode.metadata().may_write(current->process())) return KResult(-EACCES); if (parent_inode.metadata().is_sticky()) { if (!current->process().is_superuser() && inode.metadata().uid != current->process().euid()) return KResult(-EACCES); } auto result = parent_inode.remove_child(FileSystemPath(path).basename()); if (result.is_error()) return result; custody.did_delete({}); return KSuccess; } KResult VFS::symlink(StringView target, StringView linkpath, Custody& base) { RetainPtr parent_custody; auto existing_custody_or_error = resolve_path(linkpath, base, &parent_custody); if (!existing_custody_or_error.is_error()) return KResult(-EEXIST); if (!parent_custody) return KResult(-ENOENT); if (existing_custody_or_error.error() != -ENOENT) return existing_custody_or_error.error(); auto& parent_inode = parent_custody->inode(); if (!parent_inode.metadata().may_write(current->process())) return KResult(-EACCES); FileSystemPath p(linkpath); dbgprintf("VFS::symlink: '%s' (-> '%s') in %u:%u\n", p.basename().characters(), target.characters(), parent_inode.fsid(), parent_inode.index()); int error; auto new_file = parent_inode.fs().create_inode(parent_inode.identifier(), p.basename(), 0120644, 0, 0, error); if (!new_file) return KResult(error); ssize_t nwritten = new_file->write_bytes(0, target.length(), (const byte*)target.characters(), nullptr); if (nwritten < 0) return KResult(nwritten); return KSuccess; } KResult VFS::rmdir(StringView path, Custody& base) { RetainPtr parent_custody; auto custody_or_error = resolve_path(path, base, &parent_custody); if (custody_or_error.is_error()) return KResult(custody_or_error.error()); auto& custody = *custody_or_error.value(); auto& inode = custody.inode(); if (inode.fs().is_readonly()) return KResult(-EROFS); // FIXME: We should return EINVAL if the last component of the path is "." // FIXME: We should return ENOTEMPTY if the last component of the path is ".." if (!inode.is_directory()) return KResult(-ENOTDIR); auto& parent_inode = parent_custody->inode(); if (!parent_inode.metadata().may_write(current->process())) return KResult(-EACCES); if (inode.directory_entry_count() != 2) return KResult(-ENOTEMPTY); auto result = inode.remove_child("."); if (result.is_error()) return result; result = inode.remove_child(".."); if (result.is_error()) return result; return parent_inode.remove_child(FileSystemPath(path).basename()); } RetainPtr VFS::get_inode(InodeIdentifier inode_id) { if (!inode_id.is_valid()) return nullptr; return inode_id.fs()->get_inode(inode_id); } VFS::Mount::Mount(RetainPtr&& host_custody, Retained&& guest_fs) : m_guest(guest_fs->root_inode()) , m_guest_fs(move(guest_fs)) , m_host_custody(move(host_custody)) { } String VFS::Mount::absolute_path() const { if (!m_host_custody) return "/"; return m_host_custody->absolute_path(); } InodeIdentifier VFS::Mount::host() const { if (!m_host_custody) return {}; return m_host_custody->inode().identifier(); } void VFS::register_device(Badge, Device& device) { m_devices.set(encoded_device(device.major(), device.minor()), &device); } void VFS::unregister_device(Badge, Device& device) { m_devices.remove(encoded_device(device.major(), device.minor())); } Device* VFS::get_device(unsigned major, unsigned minor) { auto it = m_devices.find(encoded_device(major, minor)); if (it == m_devices.end()) return nullptr; return (*it).value; } void VFS::for_each_mount(Function callback) const { for (auto& mount : m_mounts) { callback(*mount); } } void VFS::sync() { FS::sync(); } Custody& VFS::root_custody() { if (!m_root_custody) m_root_custody = Custody::create(nullptr, "", *m_root_inode); return *m_root_custody; } KResultOr> VFS::resolve_path(StringView path, Custody& base, RetainPtr* parent_custody, int options) { if (path.is_empty()) return KResult(-EINVAL); auto parts = path.split_view('/'); InodeIdentifier crumb_id; Vector, 32> custody_chain; if (path[0] == '/') { custody_chain.append(root_custody()); crumb_id = root_inode_id(); } else { for (auto* custody = &base; custody; custody = custody->parent()) { // FIXME: Prepending here is not efficient! Fix this. custody_chain.prepend(*custody); } crumb_id = base.inode().identifier(); } if (parent_custody) *parent_custody = custody_chain.last(); for (int i = 0; i < parts.size(); ++i) { bool inode_was_root_at_head_of_loop = crumb_id.is_root_inode(); auto& part = parts[i]; if (part.is_empty()) break; auto crumb_inode = get_inode(crumb_id); if (!crumb_inode) return KResult(-EIO); auto metadata = crumb_inode->metadata(); if (!metadata.is_directory()) return KResult(-ENOTDIR); if (!metadata.may_execute(current->process())) return KResult(-EACCES); auto current_parent = custody_chain.last(); crumb_id = crumb_inode->lookup(part); if (!crumb_id.is_valid()) return KResult(-ENOENT); if (auto mount = find_mount_for_host(crumb_id)) crumb_id = mount->guest(); if (inode_was_root_at_head_of_loop && crumb_id.is_root_inode() && !is_vfs_root(crumb_id) && part == "..") { auto mount = find_mount_for_guest(crumb_id); auto dir_inode = get_inode(mount->host()); ASSERT(dir_inode); crumb_id = dir_inode->lookup(".."); } crumb_inode = get_inode(crumb_id); ASSERT(crumb_inode); custody_chain.append(Custody::get_or_create(custody_chain.last().ptr(), part, *crumb_inode)); metadata = crumb_inode->metadata(); if (metadata.is_directory()) { if (i != parts.size() - 1) { if (parent_custody) *parent_custody = custody_chain.last(); } } if (metadata.is_symlink()) { if (i == parts.size() - 1) { if (options & O_NOFOLLOW) return KResult(-ELOOP); if (options & O_NOFOLLOW_NOERROR) return custody_chain.last(); } auto symlink_contents = crumb_inode->read_entire(); if (!symlink_contents) return KResult(-ENOENT); // FIXME: We should limit the recursion here and return -ELOOP if it goes to deep. auto symlink_target = resolve_path( StringView(symlink_contents.pointer(), symlink_contents.size()), *current_parent, parent_custody, options); if (symlink_target.is_error()) return symlink_target; bool have_more_parts = i + 1 < parts.size(); if (i + 1 == parts.size() - 1 && parts[i + 1].is_empty()) have_more_parts = false; if (!have_more_parts) return symlink_target; const char* remaining_path_chars = parts[i + 1].characters(); int remaining_path_length = path.length() - (remaining_path_chars - path.characters()); StringView remaining_path { remaining_path_chars, remaining_path_length }; return resolve_path(remaining_path, *symlink_target.value(), parent_custody, options); } } return custody_chain.last(); }