sapling/eden/fs/utils/PathFuncs.cpp
Xavier Deguillard 09f97fa27a store: diff should respect the mount case sensitivity
Summary:
During a diff operation, files that have a case change should not reported as
changed for case insensitive mount. This is a follow up to D29150552 (37ccaa9231) where the
TreeInode code was taught to ignore case changes for case insensitive mounts.

Reviewed By: kmancini

Differential Revision: D29952464

fbshipit-source-id: e5fa8eccc1c1984a680838fd8589a0278989d9d0
2021-07-29 11:29:42 -07:00

405 lines
12 KiB
C++

/*
* Copyright (c) Facebook, Inc. and its affiliates.
*
* This software may be used and distributed according to the terms of the
* GNU General Public License version 2.
*/
#include "eden/fs/utils/PathFuncs.h"
#include <boost/filesystem/operations.hpp>
#include <folly/Exception.h>
#include <folly/logging/xlog.h>
#include <folly/portability/Stdlib.h>
#include <optional>
#ifdef _WIN32
#include <folly/portability/Unistd.h>
#else
#include <unistd.h>
#endif
#ifdef __APPLE__
#include <mach-o/dyld.h> // @manual
#endif
using folly::Expected;
using folly::StringPiece;
namespace facebook {
namespace eden {
StringPiece dirname(StringPiece path) {
auto dirSeparator = detail::rfindPathSeparator(path);
if (dirSeparator != std::string::npos) {
return path.subpiece(0, dirSeparator);
}
return "";
}
StringPiece basename(StringPiece path) {
auto dirSeparator = detail::rfindPathSeparator(path);
if (dirSeparator != std::string::npos) {
path.advance(dirSeparator + 1);
return path;
}
return path;
}
AbsolutePath getcwd() {
char cwd[PATH_MAX];
if (!::getcwd(cwd, sizeof(cwd))) {
folly::throwSystemError("getcwd() failed");
}
return AbsolutePath{cwd};
}
namespace {
struct CanonicalData {
std::vector<StringPiece> components;
bool isAbsolute{false};
};
/**
* Parse path into a collection of path components such that:
* - "." (single dot) and "" (empty) components are discarded.
* - ".." component either destructively combines with the last
* parsed path component, or becomes the first component when
* the vector of previously extracted components is empty.
*/
CanonicalData canonicalPathData(StringPiece path) {
CanonicalData data;
const char* componentStart = path.begin();
auto processSlash = [&](const char* end) {
auto component = StringPiece{componentStart, end};
componentStart = end + 1;
if (component.empty()) {
// Ignore empty components (doubled slash characters)
// An empty component at the start of the string indicates an
// absolute path.
//
// (POSIX specifies that "//" at the start of a path is special, and has
// platform-specific behavior. We intentionally ignore that, and treat a
// leading "//" the same as a single leading "/".)
if (component.begin() == path.begin()) {
data.isAbsolute = true;
}
} else if (component == ".") {
// ignore this component
} else if (component == "..") {
if (data.components.empty()) {
if (!data.isAbsolute) {
// We have no choice but to add ".." to the start
data.components.push_back(component);
}
} else if (data.components.back() != "..") {
data.components.pop_back();
}
} else {
data.components.push_back(component);
}
};
for (const char* p = path.begin(); p != path.end(); ++p) {
if (detail::isDirSeparator(*p)) {
processSlash(p);
}
}
if (componentStart != path.end()) {
processSlash(path.end());
}
return data;
}
AbsolutePath canonicalPathImpl(
StringPiece path,
std::optional<AbsolutePathPiece> base) {
auto makeAbsolutePath = [](const std::vector<StringPiece>& parts) {
if (parts.empty()) {
return AbsolutePath{};
}
size_t length = 1; // reserve 1 byte for terminating '\0'
for (const auto& part : parts) {
length += part.size();
}
std::string value;
value.reserve(length);
for (const auto& part : parts) {
value.push_back('/');
value.append(part.begin(), part.end());
}
return AbsolutePath{std::move(value)};
};
auto canon = canonicalPathData(path);
if (canon.isAbsolute) {
return makeAbsolutePath(canon.components);
}
// Get the components from the base path
// For simplicity we are just re-using canonicalPathData() even though the
// base path is guaranteed to already be in canonical form.
CanonicalData baseCanon;
AbsolutePath cwd;
if (!base.has_value()) {
// canonicalPathData() returns StringPieces pointing to the input,
// so we have to store the cwd in a variable that will persist until the
// end of this function.
cwd = getcwd();
baseCanon = canonicalPathData(cwd.stringPiece());
} else {
baseCanon = canonicalPathData(base.value().stringPiece());
}
for (auto it = canon.components.begin(); it != canon.components.end(); ++it) {
// There may be leading ".." parts, so we have to deal with them here
if (*it == "..") {
if (!baseCanon.components.empty()) {
baseCanon.components.pop_back();
}
} else {
// Once we found a non-".." component, none of the rest can be "..",
// so add everything else and break out of the loop
baseCanon.components.insert(
baseCanon.components.end(), it, canon.components.end());
break;
}
}
return makeAbsolutePath(baseCanon.components);
}
} // namespace
AbsolutePath canonicalPath(folly::StringPiece path) {
// Pass in std::nullopt.
// canonicalPathImpl() will only call getcwd() if it is actually necessary.
return canonicalPathImpl(path, std::nullopt);
}
AbsolutePath canonicalPath(folly::StringPiece path, AbsolutePathPiece base) {
return canonicalPathImpl(path, std::optional<AbsolutePathPiece>{base});
}
folly::Expected<RelativePath, int> joinAndNormalize(
RelativePathPiece base,
folly::StringPiece path) {
if (path.startsWith(kDirSeparator)) {
return folly::makeUnexpected(EPERM);
}
const std::string joined = base.value().empty() ? path.str()
: path.empty() ? base.value().str()
: folly::to<std::string>(base, kDirSeparator, path);
const CanonicalData cdata{canonicalPathData(joined)};
const auto& parts{cdata.components};
XDCHECK(!cdata.isAbsolute);
if (!parts.empty() && parts[0] == "..") {
return folly::makeUnexpected(EXDEV);
} else {
return folly::makeExpected<int>(RelativePath{parts.begin(), parts.end()});
}
}
Expected<AbsolutePath, int> realpathExpected(const char* path) {
auto pathBuffer = ::realpath(path, nullptr);
if (!pathBuffer) {
return folly::makeUnexpected(errno);
}
SCOPE_EXIT {
free(pathBuffer);
};
return folly::makeExpected<int>(AbsolutePath{pathBuffer});
}
Expected<AbsolutePath, int> realpathExpected(StringPiece path) {
// The input may not be nul-terminated, so we have to construct a std::string
return realpath(path.str().c_str());
}
AbsolutePath realpath(const char* path) {
auto result = realpathExpected(path);
if (!result) {
folly::throwSystemErrorExplicit(
result.error(), "realpath(", path, ") failed");
}
return result.value();
}
AbsolutePath realpath(StringPiece path) {
// The input may not be nul-terminated, so we have to construct a std::string
return realpath(path.str().c_str());
}
AbsolutePath normalizeBestEffort(const char* path) {
auto result = realpathExpected(path);
if (result) {
return result.value();
}
return canonicalPathImpl(path, std::nullopt);
}
AbsolutePath normalizeBestEffort(folly::StringPiece path) {
return normalizeBestEffort(path.str().c_str());
}
std::pair<PathComponentPiece, RelativePathPiece> splitFirst(
RelativePathPiece path) {
auto piece = path.stringPiece();
auto dirSeparator = detail::findPathSeparator(piece);
if (dirSeparator != std::string::npos) {
return {
PathComponentPiece{
folly::StringPiece{piece.begin(), piece.begin() + dirSeparator}},
RelativePathPiece{
folly::StringPiece{piece.begin() + dirSeparator + 1, piece.end()}}};
} else {
return {PathComponentPiece{piece}, RelativePathPiece{}};
}
}
void validatePathComponentLength(PathComponentPiece name) {
if (name.value().size() > kMaxPathComponentLength) {
folly::throwSystemErrorExplicit(
ENAMETOOLONG, "path component too long: ", name);
}
}
bool ensureDirectoryExists(AbsolutePathPiece path) {
return boost::filesystem::create_directories(path.as_boost());
}
bool ensureDirectoryExists(
AbsolutePathPiece path,
boost::system::error_code& error) noexcept {
return boost::filesystem::create_directories(path.as_boost(), error);
}
bool removeRecursively(AbsolutePathPiece path) {
return boost::filesystem::remove_all(path.as_boost());
}
bool removeFileWithAbsolutePath(AbsolutePathPiece path) {
return boost::filesystem::remove(path.as_boost());
}
void renameWithAbsolutePath(
AbsolutePathPiece srcPath,
AbsolutePathPiece destPath) {
boost::filesystem::rename(srcPath.as_boost(), destPath.as_boost());
}
AbsolutePath expandUser(
folly::StringPiece path,
std::optional<folly::StringPiece> homeDir) {
if (!path.startsWith("~")) {
return canonicalPath(path);
}
if (path.size() > 1 && !path.startsWith("~/")) {
// path is not "~" and doesn't start with "~/".
// Most likely the input is something like "~user" which
// we don't support.
throw std::runtime_error(folly::to<std::string>(
"expandUser: can only ~-expand the current user. Input path was: `",
path,
"`"));
}
if (!homeDir) {
throw std::runtime_error(
"Unable to expand ~ in path because homeDir is not set");
}
if (homeDir->size() == 0) {
throw std::runtime_error(
"Unable to expand ~ in path because homeDir is the empty string");
}
if (path == "~") {
return canonicalPath(*homeDir);
}
// Otherwise: we know the path startsWith("~/") due to the
// checks made above, so we can skip the first 2 characters
// to build the expansion here.
auto expanded =
folly::to<std::string>(*homeDir, kDirSeparator, path.subpiece(2));
return canonicalPath(expanded);
}
AbsolutePath executablePath() {
#ifdef __linux__
// The maximum symlink limit is filesystem dependent, but many common Linux
// filesystems have a limit of 4096.
constexpr size_t pathMax = 4096;
std::array<char, pathMax> buf;
auto result = readlink("/proc/self/exe", buf.data(), buf.size());
folly::checkUnixError(result, "failed to read /proc/self/exe");
return AbsolutePath(
folly::StringPiece(buf.data(), static_cast<size_t>(result)));
#elif defined(__APPLE__)
std::vector<char> buf;
buf.resize(4096, 0);
uint32_t size = buf.size();
if (_NSGetExecutablePath(buf.data(), &size) != 0) {
buf.resize(size, 0);
if (_NSGetExecutablePath(buf.data(), &size) != 0) {
throw std::runtime_error("_NSGetExecutablePath failed");
}
}
// Note that on success, the size is not updated and we need to look
// for NUL termination
return AbsolutePath(folly::StringPiece(buf.data()));
#elif defined(_WIN32)
std::vector<WCHAR> buf;
buf.resize(4096);
auto res =
GetModuleFileNameW(NULL, buf.data(), static_cast<DWORD>(buf.size()));
while (res == buf.size()) {
buf.resize(buf.size() * 2);
res = GetModuleFileNameW(NULL, buf.data(), static_cast<DWORD>(buf.size()));
}
if (res == 0) {
auto err = GetLastError();
throw std::system_error(err, std::system_category(), "GetModuleFileNameW");
}
return AbsolutePath(std::wstring_view(buf.data(), static_cast<size_t>(res)));
#else
#error executablePath not implemented
#endif
}
CompareResult comparePathComponent(
PathComponentPiece left,
PathComponentPiece right,
CaseSensitivity caseSensitivity) {
if (caseSensitivity == CaseSensitivity::Insensitive) {
if (left.stringPiece().equals(
right.stringPiece(), folly::AsciiCaseInsensitive())) {
return CompareResult::EQUAL;
}
} else {
if (left == right) {
return CompareResult::EQUAL;
}
}
if (left < right) {
return CompareResult::BEFORE;
} else {
return CompareResult::AFTER;
}
}
} // namespace eden
} // namespace facebook