2020-01-18 11:38:21 +03:00
|
|
|
/*
|
2021-07-11 01:25:24 +03:00
|
|
|
* Copyright (c) 2018-2021, Andreas Kling <kling@serenityos.org>
|
2020-01-18 11:38:21 +03:00
|
|
|
*
|
2021-04-22 11:24:48 +03:00
|
|
|
* SPDX-License-Identifier: BSD-2-Clause
|
2020-01-18 11:38:21 +03:00
|
|
|
*/
|
|
|
|
|
2018-10-10 12:53:07 +03:00
|
|
|
#pragma once
|
|
|
|
|
2019-05-31 16:36:49 +03:00
|
|
|
#include <AK/Badge.h>
|
2021-11-08 02:51:39 +03:00
|
|
|
#include <AK/Error.h>
|
2019-05-28 12:53:16 +03:00
|
|
|
#include <AK/Function.h>
|
2018-10-10 12:53:07 +03:00
|
|
|
#include <AK/HashMap.h>
|
|
|
|
#include <AK/OwnPtr.h>
|
2022-08-20 00:03:24 +03:00
|
|
|
#include <AK/RefPtr.h>
|
|
|
|
#include <Kernel/FileSystem/FileBackedFileSystem.h>
|
2019-05-31 16:36:49 +03:00
|
|
|
#include <Kernel/FileSystem/FileSystem.h>
|
2022-12-15 12:42:40 +03:00
|
|
|
#include <Kernel/FileSystem/Initializer.h>
|
2019-05-31 16:36:49 +03:00
|
|
|
#include <Kernel/FileSystem/InodeIdentifier.h>
|
|
|
|
#include <Kernel/FileSystem/InodeMetadata.h>
|
2021-07-11 01:46:06 +03:00
|
|
|
#include <Kernel/FileSystem/Mount.h>
|
2022-12-15 12:42:40 +03:00
|
|
|
#include <Kernel/FileSystem/MountFile.h>
|
2021-08-06 15:11:45 +03:00
|
|
|
#include <Kernel/FileSystem/UnveilNode.h>
|
2021-07-11 12:49:16 +03:00
|
|
|
#include <Kernel/Forward.h>
|
2022-12-15 12:42:40 +03:00
|
|
|
#include <Kernel/Locking/MutexProtected.h>
|
2022-02-03 03:37:46 +03:00
|
|
|
#include <Kernel/Locking/SpinlockProtected.h>
|
2018-10-10 12:53:07 +03:00
|
|
|
|
2020-02-16 03:27:42 +03:00
|
|
|
namespace Kernel {
|
2020-01-21 15:34:39 +03:00
|
|
|
|
2021-08-14 20:46:18 +03:00
|
|
|
// Kernel internal options.
// Both values are single-bit masks (bit 29 and bit 30 of an int).
// NOTE(review): presumably these are OR-ed into the int `options` arguments of the
// VirtualFileSystem functions declared below, and the high bit positions were chosen to
// stay clear of the userspace O_* flags - confirm against the open() flag definitions.
|
|
|
|
// Bit 29.
// NOTE(review): the name suggests that a final symlink is not followed and that this is
// not reported as an error - confirm in the path resolver.
#define O_NOFOLLOW_NOERROR (1 << 29)
|
|
|
|
// Bit 30.
// NOTE(review): the name suggests an open performed internally on behalf of unlink - confirm.
#define O_UNLINK_INTERNAL (1 << 30)
|
|
|
|
|
2020-01-03 22:13:21 +03:00
|
|
|
// Plain aggregate pairing a user ID with a group ID.
// In this header it appears as the trailing Optional<UidAndGid> parameter of
// VirtualFileSystem::open() and VirtualFileSystem::create().
// NOTE(review): presumably the owner to assign to a newly created inode - confirm.
struct UidAndGid {
|
2021-08-28 23:11:16 +03:00
|
|
|
// User ID half of the pair.
UserID uid;
|
|
|
|
// Group ID half of the pair.
GroupID gid;
|
2020-01-03 22:13:21 +03:00
|
|
|
};
|
|
|
|
|
2022-10-01 15:24:56 +03:00
|
|
|
// Bit flags accepted by VirtualFileSystem::access().
// Each enumerator other than None is a distinct single bit, so values can be combined.
enum class AccessFlags {
|
|
|
|
// No flags set.
None = 0,
|
|
|
|
// Bit 0.
// NOTE(review): presumably selects effective rather than real IDs for the check - confirm.
EffectiveAccess = 1 << 0,
|
|
|
|
// Bit 1.
// NOTE(review): presumably the check applies to a symlink itself instead of its target - confirm.
DoNotFollowSymlinks = 1 << 1,
|
|
|
|
};
|
|
|
|
|
|
|
|
// NOTE(review): macro defined outside this file; by its name it supplies the bitwise
// operators for the scoped enum so that flags can be combined and tested - confirm.
AK_ENUM_BITWISE_OPERATORS(AccessFlags);
|
|
|
|
|
2021-07-11 01:25:24 +03:00
|
|
|
// Declares the kernel-side virtual file system: the mount operations, the path-based
// file operations (open, create, link, rename, ...), path resolution into Custody
// objects, and the lock-protected lists of mounts and file systems.
// A reference to an instance is handed out by the static the() accessor.
// NOTE(review): presumably a single global instance set up by initialize() - confirm in the .cpp.
class VirtualFileSystem {
|
2018-10-10 12:53:07 +03:00
|
|
|
public:
|
2021-12-21 18:11:19 +03:00
|
|
|
// NOTE(review): presumably the bound that the symlink_recursion_level parameter of the
// resolve_path functions is checked against - confirm in the .cpp.
// Required to be at least 8 by POSIX
|
|
|
|
// https://pubs.opengroup.org/onlinepubs/9699919799/basedefs/limits.h.html
|
|
|
|
static constexpr int symlink_recursion_limit = 8;
|
|
|
|
|
2020-08-25 04:35:19 +03:00
|
|
|
// Static setup entry point; takes no arguments and returns nothing.
static void initialize();
|
2021-07-11 01:25:24 +03:00
|
|
|
// Static accessor returning a VirtualFileSystem by reference.
static VirtualFileSystem& the();
|
2018-10-10 12:53:07 +03:00
|
|
|
|
2022-12-15 12:42:40 +03:00
|
|
|
// Looks up a FileSystemInitializer by file system type name.
// The pointer is wrapped in ErrorOr, so a failed lookup can be reported as an error.
// NOTE(review): which error is used for an unknown type is not visible here - confirm.
static ErrorOr<FileSystemInitializer const*> find_filesystem_type_initializer(StringView fs_type);
|
|
|
|
|
2021-07-11 01:25:24 +03:00
|
|
|
// Constructor and destructor are public even though a static accessor exists.
VirtualFileSystem();
|
|
|
|
~VirtualFileSystem();
|
2018-10-10 12:53:07 +03:00
|
|
|
|
2021-11-08 02:51:39 +03:00
|
|
|
// Mount management. Every operation below reports failure through ErrorOr<void>.
ErrorOr<void> mount_root(FileSystem&);
|
2022-12-15 12:42:40 +03:00
|
|
|
// NOTE(review): the OpenFileDescription is taken by raw pointer, which suggests it may be
// null for file systems that have no backing file - confirm.
ErrorOr<void> mount(MountFile&, OpenFileDescription*, Custody& mount_point, int flags);
|
2021-11-08 02:51:39 +03:00
|
|
|
ErrorOr<void> bind_mount(Custody& source, Custody& mount_point, int flags);
|
|
|
|
ErrorOr<void> remount(Custody& mount_point, int new_flags);
|
2022-08-20 00:03:24 +03:00
|
|
|
// Two ways to name what to unmount: by mount point Custody (here), or by guest Inode
// plus custody path (next overload).
ErrorOr<void> unmount(Custody& mount_point);
|
2023-06-17 19:17:00 +03:00
|
|
|
ErrorOr<void> unmount(Inode& guest_inode, StringView custody_path);
|
2021-11-08 02:51:39 +03:00
|
|
|
|
2023-03-06 21:29:25 +03:00
|
|
|
// Path-based operations. Each takes the caller Credentials, a StringView path and a
// Custody named base (or parent_custody for create).
// NOTE(review): presumably relative paths are resolved against that Custody - confirm.
// open() and create() each have an overload that additionally takes the Process.
// The trailing Optional<UidAndGid> defaults to empty in all four.
// NOTE(review): presumably the Process-less overloads use the current process - confirm.
ErrorOr<NonnullRefPtr<OpenFileDescription>> open(Credentials const&, StringView path, int options, mode_t mode, Custody& base, Optional<UidAndGid> = {});
|
|
|
|
ErrorOr<NonnullRefPtr<OpenFileDescription>> open(Process const&, Credentials const&, StringView path, int options, mode_t mode, Custody& base, Optional<UidAndGid> = {});
|
|
|
|
ErrorOr<NonnullRefPtr<OpenFileDescription>> create(Credentials const&, StringView path, int options, mode_t mode, Custody& parent_custody, Optional<UidAndGid> = {});
|
|
|
|
ErrorOr<NonnullRefPtr<OpenFileDescription>> create(Process const&, Credentials const&, StringView path, int options, mode_t mode, Custody& parent_custody, Optional<UidAndGid> = {});
|
2022-08-21 17:02:24 +03:00
|
|
|
ErrorOr<void> mkdir(Credentials const&, StringView path, mode_t mode, Custody& base);
|
|
|
|
ErrorOr<void> link(Credentials const&, StringView old_path, StringView new_path, Custody& base);
|
|
|
|
ErrorOr<void> unlink(Credentials const&, StringView path, Custody& base);
|
|
|
|
ErrorOr<void> symlink(Credentials const&, StringView target, StringView linkpath, Custody& base);
|
|
|
|
ErrorOr<void> rmdir(Credentials const&, StringView path, Custody& base);
|
|
|
|
// chmod and chown each exist in a path-based form and in a form operating directly on a
// Custody. Note that options defaults to 0 for chmod but has no default for chown.
ErrorOr<void> chmod(Credentials const&, StringView path, mode_t, Custody& base, int options = 0);
|
|
|
|
ErrorOr<void> chmod(Credentials const&, Custody&, mode_t);
|
|
|
|
ErrorOr<void> chown(Credentials const&, StringView path, UserID, GroupID, Custody& base, int options);
|
|
|
|
ErrorOr<void> chown(Credentials const&, Custody&, UserID, GroupID);
|
2022-10-01 15:24:56 +03:00
|
|
|
// Unlike its siblings, access() takes its flags as the AccessFlags enum rather than an int.
ErrorOr<void> access(Credentials const&, StringView path, int mode, Custody& base, AccessFlags);
|
2022-08-21 17:02:24 +03:00
|
|
|
// Returns the InodeMetadata by value on success.
ErrorOr<InodeMetadata> lookup_metadata(Credentials const&, StringView path, Custody& base, int options = 0);
|
|
|
|
// Timestamp updates: utime() takes time_t values, utimensat() takes timespec values and
// an options argument, and do_utimens() takes an already resolved Custody.
ErrorOr<void> utime(Credentials const&, StringView path, Custody& base, time_t atime, time_t mtime);
|
|
|
|
ErrorOr<void> utimensat(Credentials const&, StringView path, Custody& base, timespec const& atime, timespec const& mtime, int options = 0);
|
2023-04-08 11:37:15 +03:00
|
|
|
ErrorOr<void> do_utimens(Credentials const& credentials, Custody& custody, timespec const& atime, timespec const& mtime);
|
2022-10-01 14:42:25 +03:00
|
|
|
// rename() is the only path operation here with separate base custodies for the old and
// the new path.
ErrorOr<void> rename(Credentials const&, Custody& old_base, StringView oldpath, Custody& new_base, StringView newpath);
|
2022-08-21 17:02:24 +03:00
|
|
|
ErrorOr<void> mknod(Credentials const&, StringView path, mode_t, dev_t, Custody& base);
|
|
|
|
// Returns a Custody (not an OpenFileDescription) on success.
ErrorOr<NonnullRefPtr<Custody>> open_directory(Credentials const&, StringView path, Custody& base);
|
2018-10-10 12:53:07 +03:00
|
|
|
|
2022-04-01 20:58:27 +03:00
|
|
|
// Const member taking a callback that receives a Mount const& and returns ErrorOr<void>.
// NOTE(review): presumably iteration stops at the first error returned - confirm.
ErrorOr<void> for_each_mount(Function<ErrorOr<void>(Mount const&)>) const;
|
2018-10-26 19:43:25 +03:00
|
|
|
|
Kernel/FileSystem: Discard safely filesystems when unmounted last time
This commit reached that goal of "safely discarding" a filesystem by
doing the following:
1. Stop using the s_file_system_map HashMap as it was an unsafe measure
to access pointers of FileSystems. Instead, make sure to register all
FileSystems at the VFS layer, with an IntrusiveList, to avoid problems
related to OOM conditions.
2. Make sure to cleanly remove the DiskCache object from a BlockBased
filesystem, so the destructor of such object will not need to do that in
the destruction point.
3. For ext2 filesystems, don't cache the root inode at m_inode_cache
HashMap. The reason for this is that when unmounting an ext2 filesystem,
we lookup at the cache to see if there's a reference to a cached inode
and if that's the case, we fail with EBUSY. If we keep the m_root_inode
also being referenced at the m_inode_cache map, we have 2 references to
that object, which will lead to fail with EBUSY. Also, it's much simpler
to always ask for a root inode and get it immediately from m_root_inode,
instead of looking up the cache for that inode.
2022-08-20 09:28:02 +03:00
|
|
|
// Instance-level operations over the registered file systems; neither can report failure.
void sync_filesystems();
|
|
|
|
void lock_all_filesystems();
|
|
|
|
|
2021-07-11 01:26:17 +03:00
|
|
|
// Static, so callable without an instance in hand.
static void sync();
|
2018-12-20 02:39:29 +03:00
|
|
|
|
2022-08-21 02:04:35 +03:00
|
|
|
// Returns a NonnullRefPtr by value rather than a reference into m_root_custody.
NonnullRefPtr<Custody> root_custody();
|
2022-08-21 17:02:24 +03:00
|
|
|
// Path resolution. The three functions below share the same trailing parameters:
// out_parent (default nullptr), options (default 0) and symlink_recursion_level (default 0).
// NOTE(review): presumably out_parent, when non-null, receives the parent Custody of the
// resolved path - confirm in the .cpp.
ErrorOr<NonnullRefPtr<Custody>> resolve_path(Credentials const&, StringView path, NonnullRefPtr<Custody> base, RefPtr<Custody>* out_parent = nullptr, int options = 0, int symlink_recursion_level = 0);
|
2023-03-04 21:01:54 +03:00
|
|
|
ErrorOr<NonnullRefPtr<Custody>> resolve_path(Process const&, Credentials const&, StringView path, NonnullRefPtr<Custody> base, RefPtr<Custody>* out_parent = nullptr, int options = 0, int symlink_recursion_level = 0);
|
2022-08-21 17:02:24 +03:00
|
|
|
// NOTE(review): by its name this variant skips the unveil checks declared in the private
// section - confirm before calling it on a user-controlled path.
ErrorOr<NonnullRefPtr<Custody>> resolve_path_without_veil(Credentials const&, StringView path, NonnullRefPtr<Custody> base, RefPtr<Custody>* out_parent = nullptr, int options = 0, int symlink_recursion_level = 0);
|
2019-05-30 18:46:08 +03:00
|
|
|
|
2018-10-10 12:53:07 +03:00
|
|
|
private:
|
2021-09-07 14:39:11 +03:00
|
|
|
// Grants OpenFileDescription access to the private members below.
friend class OpenFileDescription;
|
2018-10-24 13:43:52 +03:00
|
|
|
|
2023-03-04 21:01:54 +03:00
|
|
|
// Unveil support. Returns a reference to an UnveilNode for the given process and path.
UnveilNode const& find_matching_unveiled_path(Process const&, StringView path);
|
|
|
|
// validate_path_against_process_veil has four overloads: by StringView path or by
// Custody, each with and without an explicit Process.
// NOTE(review): presumably the Process-less forms use the current process - confirm.
ErrorOr<void> validate_path_against_process_veil(Process const&, StringView path, int options);
|
|
|
|
ErrorOr<void> validate_path_against_process_veil(Process const& process, Custody const& custody, int options);
|
2021-11-08 02:51:39 +03:00
|
|
|
ErrorOr<void> validate_path_against_process_veil(Custody const& path, int options);
|
|
|
|
ErrorOr<void> validate_path_against_process_veil(StringView path, int options);
|
Kernel: Add a basic implementation of unveil()
This syscall is a complement to pledge() and adds the same sort of
incremental relinquishing of capabilities for filesystem access.
The first call to unveil() will "drop a veil" on the process, and from
now on, only unveiled parts of the filesystem are visible to it.
Each call to unveil() specifies a path to either a directory or a file
along with permissions for that path. The permissions are a combination
of the following:
- r: Read access (like the "rpath" promise)
- w: Write access (like the "wpath" promise)
- x: Execute access
- c: Create/remove access (like the "cpath" promise)
Attempts to open a path that has not been unveiled with fail with
ENOENT. If the unveiled path lacks sufficient permissions, it will fail
with EACCES.
Like pledge(), subsequent calls to unveil() with the same path can only
remove permissions, not add them.
Once you call unveil(nullptr, nullptr), the veil is locked, and it's no
longer possible to unveil any more paths for the process, ever.
This concept comes from OpenBSD, and their implementation does various
things differently, I'm sure. This is just a first implementation for
SerenityOS, and we'll keep improving on it as we go. :^)
2020-01-21 00:12:04 +03:00
|
|
|
|
2022-12-15 12:42:40 +03:00
|
|
|
// Private helper taking an already constructed FileSystem plus the mount point and flags.
ErrorOr<void> add_file_system_to_mount_table(FileSystem& file_system, Custody& mount_point, int flags);
|
|
|
|
|
2021-11-10 17:42:39 +03:00
|
|
|
// Takes a callback receiving a FileSystem::DirectoryEntryView const& and returning ErrorOr<void>.
ErrorOr<void> traverse_directory_inode(Inode&, Function<ErrorOr<void>(FileSystem::DirectoryEntryView const&)>);
|
2018-10-10 12:53:07 +03:00
|
|
|
|
2023-08-04 14:54:52 +03:00
|
|
|
// Static predicate over two custodies; needs no instance state.
static bool check_matching_absolute_path_hierarchy(Custody const& first_custody, Custody const& second_custody);
|
|
|
|
// Non-static predicate, so it may consult instance state.
// NOTE(review): presumably m_mounts - confirm.
bool mount_point_exists_at_custody(Custody& mount_point);
|
2022-08-10 18:50:23 +03:00
|
|
|
|
2023-08-04 22:57:25 +03:00
|
|
|
// The callback gets a mutable Mount& and returns nothing, while the function itself can fail.
// NOTE(review): presumably the error case is that no mount matches the custody - confirm.
ErrorOr<void> apply_to_mount_for_host_custody(Custody const& current_custody, Function<void(Mount&)>);
|
2018-10-10 12:53:07 +03:00
|
|
|
|
2023-03-07 14:25:00 +03:00
|
|
|
// Not wrapped in a lock-protected type, unlike the members that follow.
RefPtr<Inode> m_root_inode;
|
2021-08-16 02:40:19 +03:00
|
|
|
|
2022-11-09 13:39:58 +03:00
|
|
|
// Wrapped in SpinlockProtected with LockRank::None.
SpinlockProtected<RefPtr<Custody>, LockRank::None> m_root_custody {};
|
2022-08-21 02:04:35 +03:00
|
|
|
|
2022-11-09 13:39:58 +03:00
|
|
|
// Intrusive list of Mount objects linked through Mount::m_vfs_list_node, wrapped in
// SpinlockProtected with LockRank::None.
SpinlockProtected<IntrusiveList<&Mount::m_vfs_list_node>, LockRank::None> m_mounts {};
|
2022-12-15 12:42:40 +03:00
|
|
|
|
|
|
|
|
|
|
// NOTE: The FileBackedFileSystem list is protected by a mutex because we need to scan it
|
|
|
|
// to search for existing filesystems for already used block devices and therefore when doing
|
|
|
|
// that we could fail to find a filesystem so we need to create a new filesystem which might
|
|
|
|
// need to do disk access (i.e. taking Mutexes in other places) and then register that new filesystem
|
|
|
|
// in this list, to avoid TOCTOU bugs.
|
|
|
|
// Entries are linked through FileBackedFileSystem::m_file_backed_file_system_node.
MutexProtected<IntrusiveList<&FileBackedFileSystem::m_file_backed_file_system_node>> m_file_backed_file_systems_list {};
|
|
|
|
|
2022-11-09 13:39:58 +03:00
|
|
|
// Entries are linked through FileSystem::m_file_system_node. This is the only member in
// this class declared with LockRank::FileSystem.
SpinlockProtected<IntrusiveList<&FileSystem::m_file_system_node>, LockRank::FileSystem> m_file_systems_list {};
|
2018-10-10 12:53:07 +03:00
|
|
|
|
};
|
2020-02-16 03:27:42 +03:00
|
|
|
|
|
|
|
}
|