mirror of
https://github.com/privatevoid-net/nix-super.git
synced 2024-11-29 09:06:15 +02:00
Purify CanonPath
The core `CanonPath` constructors were using `absPath`, but `absPath` in some situations does IO, which is not appropriate. It turns out that these constructors avoided those situations, and thus were pure, but it was far from obvious that this was the case. To remedy the situation, abstract the core algorithm from `canonPath` so that it can be used separately in `CanonPath` without any IO. Now we know by construction that those constructors are pure. That leaves `CanonPath::fromCWD` as the only operation which uses IO / is impure. Add docs on it, and on `CanonPath` as a whole, explaining the situation. This is also necessary to support Windows paths on Windows without messing up `CanonPath`. But I think it is good even without that. Co-authored-by: Eelco Dolstra <edolstra@gmail.com> Co-authored-by: Robert Hensing <roberth@users.noreply.github.com>
This commit is contained in:
parent
d53c8901ef
commit
d17e1d9737
5 changed files with 155 additions and 57 deletions
|
@ -1,16 +1,25 @@
|
||||||
#include "canon-path.hh"
|
#include "canon-path.hh"
|
||||||
#include "file-system.hh"
|
#include "util.hh"
|
||||||
|
#include "file-path-impl.hh"
|
||||||
|
|
||||||
namespace nix {
|
namespace nix {
|
||||||
|
|
||||||
CanonPath CanonPath::root = CanonPath("/");
|
CanonPath CanonPath::root = CanonPath("/");
|
||||||
|
|
||||||
|
static std::string absPathPure(std::string_view path)
|
||||||
|
{
|
||||||
|
return canonPathInner(path, [](auto &, auto &){});
|
||||||
|
}
|
||||||
|
|
||||||
CanonPath::CanonPath(std::string_view raw)
|
CanonPath::CanonPath(std::string_view raw)
|
||||||
: path(absPath(raw, "/"))
|
: path(absPathPure(concatStrings("/", raw)))
|
||||||
{ }
|
{ }
|
||||||
|
|
||||||
CanonPath::CanonPath(std::string_view raw, const CanonPath & root)
|
CanonPath::CanonPath(std::string_view raw, const CanonPath & root)
|
||||||
: path(absPath(raw, root.abs()))
|
: path(absPathPure(
|
||||||
|
raw.size() > 0 && raw[0] == '/'
|
||||||
|
? raw
|
||||||
|
: concatStrings(root.abs(), "/", raw)))
|
||||||
{ }
|
{ }
|
||||||
|
|
||||||
CanonPath::CanonPath(const std::vector<std::string> & elems)
|
CanonPath::CanonPath(const std::vector<std::string> & elems)
|
||||||
|
|
|
@ -21,9 +21,21 @@ namespace nix {
|
||||||
*
|
*
|
||||||
* - There are no components equal to '.' or '..'.
|
* - There are no components equal to '.' or '..'.
|
||||||
*
|
*
|
||||||
* Note that the path does not need to correspond to an actually
|
* `CanonPath` are "virtual" Nix paths for abstract file system objects;
|
||||||
* existing path, and there is no guarantee that symlinks are
|
* they are always Unix-style paths, regardless of what OS Nix is
|
||||||
* resolved.
|
* running on. The `/` root doesn't denote the ambient host file system
|
||||||
|
* root, but some virtual FS root.
|
||||||
|
*
|
||||||
|
* @note It might be useful to compare `openat(some_fd, "foo/bar")` on
|
||||||
|
* Unix. `"foo/bar"` is a relative path because an absolute path would
|
||||||
|
* "override" the `some_fd` directory file descriptor and escape to the
|
||||||
|
* "system root". Conversely, Nix's abstract file operations *never* escape the
|
||||||
|
* designated virtual file system (i.e. `SourceAccessor` or
|
||||||
|
* `ParseSink`), so `CanonPath` does not need an absolute/relative
|
||||||
|
* distinction.
|
||||||
|
*
|
||||||
|
* @note The path does not need to correspond to an actually existing
|
||||||
|
* path, and the path may or may not have unresolved symlinks.
|
||||||
*/
|
*/
|
||||||
class CanonPath
|
class CanonPath
|
||||||
{
|
{
|
||||||
|
|
81
src/libutil/file-path-impl.hh
Normal file
81
src/libutil/file-path-impl.hh
Normal file
|
@ -0,0 +1,81 @@
|
||||||
|
#pragma once
|
||||||
|
/**
|
||||||
|
* @file
|
||||||
|
*
|
||||||
|
* Pure (no IO) infrastructure just for defining other path types;
|
||||||
|
* should not be used directly outside of utilities.
|
||||||
|
*/
|
||||||
|
#include <cassert>
#include <string>
#include <string_view>
|
||||||
|
|
||||||
|
namespace nix {
|
||||||
|
|
||||||
|
/**
 * Core pure path canonicalization algorithm.
 *
 * Collapses repeated and trailing slashes, drops `.` components, and
 * lets every `..` component remove the component before it (a `..`
 * with nothing before it is ignored). Leading slashes are skipped
 * rather than required, so the result always begins with `/`; checking
 * that the input is absolute is left to the caller.
 *
 * @param remaining
 *   The path to canonicalize. Must not be empty (checked with
 *   `assert`).
 *
 * @param hookComponent
 *   A callback which is passed two arguments,
 *   references to
 *
 *   1. the result so far
 *
 *   2. the remaining path to resolve
 *
 *   It is called once after each normal component (i.e. neither `.`
 *   nor `..`) has been appended to the result. This is a chance to
 *   modify those two paths in arbitrary way, e.g. if "result" points
 *   to a symlink.
 *
 * @return The canonical path, or `/` if no component is left.
 */
template<typename HookComponent>
std::string canonPathInner(
    std::string_view remaining,
    HookComponent && hookComponent)
{
    assert(remaining != "");

    std::string result;
    result.reserve(256);

    while (true) {

        /* Skip slashes. */
        while (!remaining.empty() && remaining[0] == '/')
            remaining.remove_prefix(1);

        if (remaining.empty()) break;

        /* The next component is everything up to the next separator;
           `substr` clamps `npos` to the end of the view, which covers
           the final component. */
        const auto nextComp = remaining.substr(0, remaining.find('/'));

        /* Ignore `.'. */
        if (nextComp == ".")
            remaining.remove_prefix(1);

        /* If `..', delete the last component. */
        else if (nextComp == "..") {
            if (!result.empty()) result.erase(result.rfind('/'));
            remaining.remove_prefix(2);
        }

        /* Normal component; copy it. */
        else {
            result += '/';
            result += nextComp;
            remaining.remove_prefix(nextComp.size());

            hookComponent(result, remaining);
        }
    }

    /* Nothing left (e.g. the input was only slashes, or every
       component was cancelled out): that is the root. */
    if (result.empty())
        result = "/";

    return result;
}
|
||||||
|
|
||||||
|
}
|
|
@ -1,5 +1,6 @@
|
||||||
#include "environment-variables.hh"
|
#include "environment-variables.hh"
|
||||||
#include "file-system.hh"
|
#include "file-system.hh"
|
||||||
|
#include "file-path-impl.hh"
|
||||||
#include "signals.hh"
|
#include "signals.hh"
|
||||||
#include "finally.hh"
|
#include "finally.hh"
|
||||||
#include "serialise.hh"
|
#include "serialise.hh"
|
||||||
|
@ -21,11 +22,18 @@ namespace fs = std::filesystem;
|
||||||
|
|
||||||
namespace nix {
|
namespace nix {
|
||||||
|
|
||||||
|
/** Treat the string as possibly an absolute path, by inspecting the start of it. Return whether it was probably intended to be absolute. */
|
||||||
|
static bool isAbsolute(PathView path)
|
||||||
|
{
|
||||||
|
return !path.empty() && path[0] == '/';
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
Path absPath(PathView path, std::optional<PathView> dir, bool resolveSymlinks)
|
Path absPath(PathView path, std::optional<PathView> dir, bool resolveSymlinks)
|
||||||
{
|
{
|
||||||
std::string scratch;
|
std::string scratch;
|
||||||
|
|
||||||
if (path.empty() || path[0] != '/') {
|
if (!isAbsolute(path)) {
|
||||||
// In this case we need to call `canonPath` on a newly-created
|
// In this case we need to call `canonPath` on a newly-created
|
||||||
// string. We set `scratch` to that string first, and then set
|
// string. We set `scratch` to that string first, and then set
|
||||||
// `path` to `scratch`. This ensures the newly-created string
|
// `path` to `scratch`. This ensures the newly-created string
|
||||||
|
@ -58,69 +66,39 @@ Path canonPath(PathView path, bool resolveSymlinks)
|
||||||
{
|
{
|
||||||
assert(path != "");
|
assert(path != "");
|
||||||
|
|
||||||
std::string s;
|
if (!isAbsolute(path))
|
||||||
s.reserve(256);
|
|
||||||
|
|
||||||
if (path[0] != '/')
|
|
||||||
throw Error("not an absolute path: '%1%'", path);
|
throw Error("not an absolute path: '%1%'", path);
|
||||||
|
|
||||||
|
/* This just exists because we cannot set the target of `remaining`
|
||||||
|
(the callback parameter) directly to a newly-constructed string,
|
||||||
|
since it is `std::string_view`. */
|
||||||
std::string temp;
|
std::string temp;
|
||||||
|
|
||||||
/* Count the number of times we follow a symlink and stop at some
|
/* Count the number of times we follow a symlink and stop at some
|
||||||
arbitrary (but high) limit to prevent infinite loops. */
|
arbitrary (but high) limit to prevent infinite loops. */
|
||||||
unsigned int followCount = 0, maxFollow = 1024;
|
unsigned int followCount = 0, maxFollow = 1024;
|
||||||
|
|
||||||
while (1) {
|
return canonPathInner(
|
||||||
|
path,
|
||||||
/* Skip slashes. */
|
[&followCount, &temp, maxFollow, resolveSymlinks]
|
||||||
while (!path.empty() && path[0] == '/') path.remove_prefix(1);
|
(std::string & result, std::string_view & remaining) {
|
||||||
if (path.empty()) break;
|
if (resolveSymlinks && isLink(result)) {
|
||||||
|
|
||||||
/* Ignore `.'. */
|
|
||||||
if (path == "." || path.substr(0, 2) == "./")
|
|
||||||
path.remove_prefix(1);
|
|
||||||
|
|
||||||
/* If `..', delete the last component. */
|
|
||||||
else if (path == ".." || path.substr(0, 3) == "../")
|
|
||||||
{
|
|
||||||
if (!s.empty()) s.erase(s.rfind('/'));
|
|
||||||
path.remove_prefix(2);
|
|
||||||
}
|
|
||||||
|
|
||||||
/* Normal component; copy it. */
|
|
||||||
else {
|
|
||||||
s += '/';
|
|
||||||
if (const auto slash = path.find('/'); slash == path.npos) {
|
|
||||||
s += path;
|
|
||||||
path = {};
|
|
||||||
} else {
|
|
||||||
s += path.substr(0, slash);
|
|
||||||
path = path.substr(slash);
|
|
||||||
}
|
|
||||||
|
|
||||||
/* If s points to a symlink, resolve it and continue from there */
|
|
||||||
if (resolveSymlinks && isLink(s)) {
|
|
||||||
if (++followCount >= maxFollow)
|
if (++followCount >= maxFollow)
|
||||||
throw Error("infinite symlink recursion in path '%1%'", path);
|
throw Error("infinite symlink recursion in path '%0%'", remaining);
|
||||||
temp = concatStrings(readLink(s), path);
|
remaining = (temp = concatStrings(readLink(result), remaining));
|
||||||
path = temp;
|
if (isAbsolute(remaining)) {
|
||||||
if (!temp.empty() && temp[0] == '/') {
|
/* restart for symlinks pointing to absolute path */
|
||||||
s.clear(); /* restart for symlinks pointing to absolute path */
|
result.clear();
|
||||||
} else {
|
} else {
|
||||||
s = dirOf(s);
|
result = dirOf(result);
|
||||||
if (s == "/") { // we don’t want trailing slashes here, which dirOf only produces if s = /
|
if (result == "/") {
|
||||||
s.clear();
|
/* we don’t want trailing slashes here, which `dirOf`
|
||||||
|
only produces if `result = /` */
|
||||||
|
result.clear();
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
});
|
||||||
}
|
|
||||||
|
|
||||||
if (s.empty()) {
|
|
||||||
s = "/";
|
|
||||||
}
|
|
||||||
|
|
||||||
return s;
|
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
|
|
|
@ -41,6 +41,24 @@ namespace nix {
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
TEST(CanonPath, from_existing) {
|
||||||
|
CanonPath p0("foo//bar/");
|
||||||
|
{
|
||||||
|
CanonPath p("/baz//quux/", p0);
|
||||||
|
ASSERT_EQ(p.abs(), "/baz/quux");
|
||||||
|
ASSERT_EQ(p.rel(), "baz/quux");
|
||||||
|
ASSERT_EQ(*p.baseName(), "quux");
|
||||||
|
ASSERT_EQ(*p.dirOf(), "/baz");
|
||||||
|
}
|
||||||
|
{
|
||||||
|
CanonPath p("baz//quux/", p0);
|
||||||
|
ASSERT_EQ(p.abs(), "/foo/bar/baz/quux");
|
||||||
|
ASSERT_EQ(p.rel(), "foo/bar/baz/quux");
|
||||||
|
ASSERT_EQ(*p.baseName(), "quux");
|
||||||
|
ASSERT_EQ(*p.dirOf(), "/foo/bar/baz");
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
TEST(CanonPath, pop) {
|
TEST(CanonPath, pop) {
|
||||||
CanonPath p("foo/bar/x");
|
CanonPath p("foo/bar/x");
|
||||||
ASSERT_EQ(p.abs(), "/foo/bar/x");
|
ASSERT_EQ(p.abs(), "/foo/bar/x");
|
||||||
|
|
Loading…
Reference in a new issue