2020-06-01 21:32:27 +00:00
|
|
|
|
#pragma once
|
2023-04-01 03:18:41 +00:00
|
|
|
|
///@file
|
2020-06-01 21:32:27 +00:00
|
|
|
|
|
2020-06-01 22:53:31 +00:00
|
|
|
|
#include <variant>
|
2020-06-01 21:32:27 +00:00
|
|
|
|
#include "hash.hh"
|
2020-10-07 13:52:20 +00:00
|
|
|
|
#include "path.hh"
|
2022-03-25 22:40:40 +00:00
|
|
|
|
#include "comparator.hh"
|
2020-06-01 21:32:27 +00:00
|
|
|
|
|
|
|
|
|
namespace nix {
|
|
|
|
|
|
2020-10-07 13:52:20 +00:00
|
|
|
|
/*
|
2020-10-13 03:30:14 +00:00
|
|
|
|
* Content addressing method
|
2020-10-07 13:52:20 +00:00
|
|
|
|
*/
|
|
|
|
|
|
2020-10-12 23:51:23 +00:00
|
|
|
|
/* We only have one way to hash text with references, so this is a single-value
|
|
|
|
|
type, mainly useful with std::variant.
|
|
|
|
|
*/
|
2023-03-30 20:28:53 +00:00
|
|
|
|
|
|
|
|
|
/**
 * The single way we can serialize "text" file system objects.
 *
 * Somewhat obscure, used by \ref Derivation derivations and
 * `builtins.toFile` currently.
 *
 * TextIngestionMethod is identical to FileIngestionMethod::Flat except
 * that the former may not have self-references and is tagged
 * `text:${algo}:${hash}` rather than `fixed:${algo}:${hash}`. The
 * contents of the store path are ingested and hashed identically, aside
 * from the slightly different tag and restriction on self-references.
 *
 * NOTE(review): this comment used to refer to
 * `FileIngestionMethod::Fixed`, which is not an enumerator of
 * `FileIngestionMethod`; `Flat` looks like what was meant -- confirm.
 *
 * Derives from `std::monostate`, so it carries no state and all values
 * compare equal.
 */
struct TextIngestionMethod : std::monostate { };
|
2020-10-12 23:51:23 +00:00
|
|
|
|
|
2023-03-25 23:12:44 +00:00
|
|
|
|
/**
 * An enumeration of the main ways we can serialize file system
 * objects.
 *
 * The enumerators are defined from `false` / `true`, so the underlying
 * values are 0 and 1.
 */
enum struct FileIngestionMethod : uint8_t {
    /**
     * Flat-file hashing. Directly ingests the contents of a single file.
     */
    Flat = false,
    /**
     * Recursive (or NAR) hashing. Serializes the file-system object in
     * Nix Archive format and ingests that.
     */
    Recursive = true
};
|
|
|
|
|
|
2023-03-30 20:28:53 +00:00
|
|
|
|
/**
|
|
|
|
|
* Compute the prefix to the hash algorithm which indicates how the
|
|
|
|
|
* files were ingested.
|
|
|
|
|
*/
|
2020-10-12 23:51:23 +00:00
|
|
|
|
std::string makeFileIngestionPrefix(FileIngestionMethod m);
|
|
|
|
|
|
2023-03-30 20:28:53 +00:00
|
|
|
|
/**
|
|
|
|
|
* An enumeration of all the ways we can serialize file system objects.
|
|
|
|
|
*
|
|
|
|
|
* Just the type of a content address. Combine with the hash itself, and
|
|
|
|
|
* we have a `ContentAddress` as defined below. Combine that, in turn,
|
|
|
|
|
* with info on references, and we have `ContentAddressWithReferences`,
|
|
|
|
|
* as defined further below.
|
|
|
|
|
*/
|
2023-03-30 21:12:49 +00:00
|
|
|
|
struct ContentAddressMethod
|
|
|
|
|
{
|
|
|
|
|
typedef std::variant<
|
2023-04-17 23:02:45 +00:00
|
|
|
|
TextIngestionMethod,
|
2023-04-01 20:40:32 +00:00
|
|
|
|
FileIngestionMethod
|
2023-03-30 21:12:49 +00:00
|
|
|
|
> Raw;
|
2020-10-12 23:51:23 +00:00
|
|
|
|
|
2023-03-30 21:12:49 +00:00
|
|
|
|
Raw raw;
|
2020-10-12 23:51:23 +00:00
|
|
|
|
|
2023-04-01 20:40:32 +00:00
|
|
|
|
GENERATE_CMP(ContentAddressMethod, me->raw);
|
2020-10-12 23:51:23 +00:00
|
|
|
|
|
2023-03-30 21:12:49 +00:00
|
|
|
|
/* The moral equivalent of `using Raw::Raw;` */
|
|
|
|
|
ContentAddressMethod(auto &&... arg)
|
|
|
|
|
: raw(std::forward<decltype(arg)>(arg)...)
|
|
|
|
|
{ }
|
2020-10-12 23:51:23 +00:00
|
|
|
|
|
|
|
|
|
|
2023-04-01 20:40:32 +00:00
|
|
|
|
/**
|
2023-05-09 16:45:51 +00:00
|
|
|
|
* Parse the prefix tag which indicates how the files
|
|
|
|
|
* were ingested, with the fixed output case not prefixed for back
|
2023-04-01 20:40:32 +00:00
|
|
|
|
* compat.
|
2023-05-09 17:05:38 +00:00
|
|
|
|
*
|
|
|
|
|
* @param [in] m A string that should begin with the prefix.
|
|
|
|
|
* @param [out] m The remainder of the string after the prefix.
|
2023-04-01 20:40:32 +00:00
|
|
|
|
*/
|
|
|
|
|
static ContentAddressMethod parsePrefix(std::string_view & m);
|
2020-10-12 23:51:23 +00:00
|
|
|
|
|
2023-05-09 17:05:38 +00:00
|
|
|
|
/**
|
|
|
|
|
* Render the prefix tag which indicates how the files wre ingested.
|
|
|
|
|
*
|
|
|
|
|
* The rough inverse of `parsePrefix()`.
|
|
|
|
|
*/
|
2023-04-01 20:40:32 +00:00
|
|
|
|
std::string renderPrefix() const;
|
|
|
|
|
|
|
|
|
|
/**
|
2023-05-09 17:05:38 +00:00
|
|
|
|
* Parse a content addressing method and hash type.
|
2023-04-01 20:40:32 +00:00
|
|
|
|
*/
|
|
|
|
|
static std::pair<ContentAddressMethod, HashType> parse(std::string_view rawCaMethod);
|
|
|
|
|
|
2023-05-09 17:05:38 +00:00
|
|
|
|
/**
|
|
|
|
|
* Render a content addressing method and hash type in a
|
|
|
|
|
* nicer way, prefixing both cases.
|
|
|
|
|
*
|
|
|
|
|
* The rough inverse of `parse()`.
|
|
|
|
|
*/
|
2023-04-01 20:40:32 +00:00
|
|
|
|
std::string render(HashType ht) const;
|
2023-03-30 21:12:49 +00:00
|
|
|
|
};
|
2020-10-12 23:51:23 +00:00
|
|
|
|
|
2020-10-07 13:52:20 +00:00
|
|
|
|
|
2020-10-13 03:30:14 +00:00
|
|
|
|
/*
|
|
|
|
|
* Mini content address
|
|
|
|
|
*/
|
2020-10-07 13:52:20 +00:00
|
|
|
|
|
2023-03-25 23:12:44 +00:00
|
|
|
|
/**
|
|
|
|
|
* Somewhat obscure, used by \ref Derivation derivations and
|
|
|
|
|
* `builtins.toFile` currently.
|
|
|
|
|
*/
|
2020-06-01 23:26:40 +00:00
|
|
|
|
struct TextHash {
|
2023-03-25 23:12:44 +00:00
|
|
|
|
/**
|
|
|
|
|
* Hash of the contents of the text/file.
|
|
|
|
|
*/
|
2020-06-01 23:26:40 +00:00
|
|
|
|
Hash hash;
|
2022-03-25 22:40:40 +00:00
|
|
|
|
|
|
|
|
|
GENERATE_CMP(TextHash, me->hash);
|
2020-06-01 23:26:40 +00:00
|
|
|
|
};
|
|
|
|
|
|
2023-03-25 23:12:44 +00:00
|
|
|
|
/**
|
2023-03-30 20:28:53 +00:00
|
|
|
|
* Used by most store objects that are content-addressed.
|
2023-03-25 23:12:44 +00:00
|
|
|
|
*/
|
2020-06-19 15:18:19 +00:00
|
|
|
|
struct FixedOutputHash {
|
2023-03-25 23:12:44 +00:00
|
|
|
|
/**
|
|
|
|
|
* How the file system objects are serialized
|
|
|
|
|
*/
|
2020-06-01 21:32:27 +00:00
|
|
|
|
FileIngestionMethod method;
|
2023-03-25 23:12:44 +00:00
|
|
|
|
/**
|
|
|
|
|
* Hash of that serialization
|
|
|
|
|
*/
|
2020-06-01 21:32:27 +00:00
|
|
|
|
Hash hash;
|
2023-03-25 23:12:44 +00:00
|
|
|
|
|
2020-06-01 21:32:27 +00:00
|
|
|
|
std::string printMethodAlgo() const;
|
2022-03-25 22:40:40 +00:00
|
|
|
|
|
|
|
|
|
GENERATE_CMP(FixedOutputHash, me->method, me->hash);
|
2020-06-01 21:32:27 +00:00
|
|
|
|
};
|
|
|
|
|
|
2023-03-25 23:12:44 +00:00
|
|
|
|
/**
|
|
|
|
|
* We've accumulated several types of content-addressed paths over the
|
|
|
|
|
* years; fixed-output derivations support multiple hash algorithms and
|
|
|
|
|
* serialisation methods (flat file vs NAR). Thus, ‘ca’ has one of the
|
|
|
|
|
* following forms:
|
|
|
|
|
*
|
|
|
|
|
* - ‘text:sha256:<sha256 hash of file contents>’: For paths
|
|
|
|
|
* computed by Store::makeTextPath() / Store::addTextToStore().
|
|
|
|
|
*
|
|
|
|
|
* - ‘fixed:<r?>:<ht>:<h>’: For paths computed by
|
|
|
|
|
* Store::makeFixedOutputPath() / Store::addToStore().
|
|
|
|
|
*/
|
2023-03-30 21:12:49 +00:00
|
|
|
|
struct ContentAddress
|
|
|
|
|
{
|
|
|
|
|
typedef std::variant<
|
|
|
|
|
TextHash,
|
|
|
|
|
FixedOutputHash
|
|
|
|
|
> Raw;
|
2020-06-01 22:53:31 +00:00
|
|
|
|
|
2023-03-30 21:12:49 +00:00
|
|
|
|
Raw raw;
|
2020-06-01 23:26:40 +00:00
|
|
|
|
|
2023-04-01 20:40:32 +00:00
|
|
|
|
GENERATE_CMP(ContentAddress, me->raw);
|
2020-06-01 23:26:40 +00:00
|
|
|
|
|
2023-03-30 21:12:49 +00:00
|
|
|
|
/* The moral equivalent of `using Raw::Raw;` */
|
|
|
|
|
ContentAddress(auto &&... arg)
|
|
|
|
|
: raw(std::forward<decltype(arg)>(arg)...)
|
|
|
|
|
{ }
|
2020-06-02 00:37:43 +00:00
|
|
|
|
|
2023-03-30 21:12:49 +00:00
|
|
|
|
/**
|
2023-04-19 18:13:30 +00:00
|
|
|
|
* Compute the content-addressability assertion
|
|
|
|
|
* (`ValidPathInfo::ca`) for paths created by
|
|
|
|
|
* `Store::makeFixedOutputPath()` / `Store::addToStore()`.
|
2023-03-30 21:12:49 +00:00
|
|
|
|
*/
|
|
|
|
|
std::string render() const;
|
2020-06-02 00:37:43 +00:00
|
|
|
|
|
2023-03-30 21:12:49 +00:00
|
|
|
|
static ContentAddress parse(std::string_view rawCa);
|
2020-06-02 00:37:43 +00:00
|
|
|
|
|
2023-03-30 21:12:49 +00:00
|
|
|
|
static std::optional<ContentAddress> parseOpt(std::string_view rawCaOpt);
|
2020-07-10 11:21:37 +00:00
|
|
|
|
|
2023-04-19 18:13:30 +00:00
|
|
|
|
/**
|
|
|
|
|
* Create a `ContentAddress` from 2 parts:
|
|
|
|
|
*
|
|
|
|
|
* @param method Way ingesting the file system data.
|
|
|
|
|
*
|
|
|
|
|
* @param hash Hash of ingested file system data.
|
|
|
|
|
*/
|
|
|
|
|
static ContentAddress fromParts(
|
2023-05-09 17:05:38 +00:00
|
|
|
|
ContentAddressMethod method, Hash hash) noexcept;
|
2023-04-19 18:13:30 +00:00
|
|
|
|
|
|
|
|
|
ContentAddressMethod getMethod() const;
|
|
|
|
|
|
2023-03-30 21:12:49 +00:00
|
|
|
|
const Hash & getHash() const;
|
2023-04-19 18:48:53 +00:00
|
|
|
|
|
|
|
|
|
std::string printMethodAlgo() const;
|
2023-03-30 21:12:49 +00:00
|
|
|
|
};
|
|
|
|
|
|
2023-05-09 17:05:38 +00:00
|
|
|
|
/**
|
|
|
|
|
* Render the `ContentAddress` if it exists to a string, return empty
|
|
|
|
|
* string otherwise.
|
|
|
|
|
*/
|
2023-03-30 21:12:49 +00:00
|
|
|
|
std::string renderContentAddress(std::optional<ContentAddress> ca);
|
2020-06-02 00:37:43 +00:00
|
|
|
|
|
2020-07-10 11:21:37 +00:00
|
|
|
|
|
2023-03-30 21:12:49 +00:00
|
|
|
|
/*
|
|
|
|
|
* Full content address
|
|
|
|
|
*
|
|
|
|
|
* See the schema for store paths in store-api.cc
|
|
|
|
|
*/
|
2020-09-17 15:15:05 +00:00
|
|
|
|
|
2023-03-30 20:28:53 +00:00
|
|
|
|
/**
|
|
|
|
|
* A set of references to other store objects.
|
|
|
|
|
*
|
|
|
|
|
* References to other store objects are tracked with store paths, self
|
|
|
|
|
* references however are tracked with a boolean.
|
2020-10-07 13:52:20 +00:00
|
|
|
|
*/
|
2023-01-14 21:38:43 +00:00
|
|
|
|
struct StoreReferences {
|
2023-03-30 20:28:53 +00:00
|
|
|
|
/**
|
|
|
|
|
* References to other store objects
|
|
|
|
|
*/
|
2023-01-14 21:38:43 +00:00
|
|
|
|
StorePathSet others;
|
2023-03-30 20:28:53 +00:00
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Reference to this store object
|
|
|
|
|
*/
|
2023-01-14 21:38:43 +00:00
|
|
|
|
bool self = false;
|
|
|
|
|
|
2023-03-30 20:28:53 +00:00
|
|
|
|
/**
|
|
|
|
|
* @return true iff no references, i.e. others is empty and self is
|
|
|
|
|
* false.
|
|
|
|
|
*/
|
2023-01-14 21:38:43 +00:00
|
|
|
|
bool empty() const;
|
2023-03-30 20:28:53 +00:00
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Returns the numbers of references, i.e. the size of others + 1
|
|
|
|
|
* iff self is true.
|
|
|
|
|
*/
|
2023-01-14 21:38:43 +00:00
|
|
|
|
size_t size() const;
|
|
|
|
|
|
|
|
|
|
GENERATE_CMP(StoreReferences, me->self, me->others);
|
|
|
|
|
};
|
2020-10-07 13:52:20 +00:00
|
|
|
|
|
|
|
|
|
// This matches the additional info that we need for makeTextPath
|
2023-02-28 17:13:43 +00:00
|
|
|
|
struct TextInfo {
|
|
|
|
|
TextHash hash;
|
2023-03-30 20:28:53 +00:00
|
|
|
|
/**
|
|
|
|
|
* References to other store objects only; self references
|
|
|
|
|
* disallowed
|
|
|
|
|
*/
|
2020-10-07 13:52:20 +00:00
|
|
|
|
StorePathSet references;
|
2022-03-25 22:40:40 +00:00
|
|
|
|
|
2023-02-28 17:13:43 +00:00
|
|
|
|
GENERATE_CMP(TextInfo, me->hash, me->references);
|
2020-10-07 13:52:20 +00:00
|
|
|
|
};
|
|
|
|
|
|
2023-02-28 17:13:43 +00:00
|
|
|
|
struct FixedOutputInfo {
|
|
|
|
|
FixedOutputHash hash;
|
2023-03-30 20:28:53 +00:00
|
|
|
|
/**
|
|
|
|
|
* References to other store objects or this one.
|
|
|
|
|
*/
|
2023-01-06 20:36:05 +00:00
|
|
|
|
StoreReferences references;
|
2022-03-25 22:40:40 +00:00
|
|
|
|
|
2023-02-28 17:13:43 +00:00
|
|
|
|
GENERATE_CMP(FixedOutputInfo, me->hash, me->references);
|
2020-10-07 13:52:20 +00:00
|
|
|
|
};
|
|
|
|
|
|
2023-03-25 23:12:44 +00:00
|
|
|
|
/**
|
|
|
|
|
* Ways of content addressing but not a complete ContentAddress.
|
|
|
|
|
*
|
|
|
|
|
* A ContentAddress without a Hash.
|
|
|
|
|
*/
|
2023-03-30 21:12:49 +00:00
|
|
|
|
struct ContentAddressWithReferences
|
|
|
|
|
{
|
|
|
|
|
typedef std::variant<
|
|
|
|
|
TextInfo,
|
|
|
|
|
FixedOutputInfo
|
|
|
|
|
> Raw;
|
2020-10-07 13:52:20 +00:00
|
|
|
|
|
2023-03-30 21:12:49 +00:00
|
|
|
|
Raw raw;
|
2020-10-07 13:52:20 +00:00
|
|
|
|
|
2023-04-01 20:40:32 +00:00
|
|
|
|
GENERATE_CMP(ContentAddressWithReferences, me->raw);
|
2020-10-12 23:51:23 +00:00
|
|
|
|
|
2023-03-30 21:12:49 +00:00
|
|
|
|
/* The moral equivalent of `using Raw::Raw;` */
|
|
|
|
|
ContentAddressWithReferences(auto &&... arg)
|
|
|
|
|
: raw(std::forward<decltype(arg)>(arg)...)
|
|
|
|
|
{ }
|
2020-10-12 23:51:23 +00:00
|
|
|
|
|
2023-03-30 21:12:49 +00:00
|
|
|
|
/**
|
2023-04-19 18:13:30 +00:00
|
|
|
|
* Create a `ContentAddressWithReferences` from a mere
|
2023-05-09 16:45:51 +00:00
|
|
|
|
* `ContentAddress`, by claiming no references.
|
2023-03-30 21:12:49 +00:00
|
|
|
|
*/
|
2023-05-09 16:45:51 +00:00
|
|
|
|
static ContentAddressWithReferences withoutRefs(const ContentAddress &) noexcept;
|
2023-04-01 20:40:32 +00:00
|
|
|
|
|
|
|
|
|
/**
|
2023-04-19 18:13:30 +00:00
|
|
|
|
* Create a `ContentAddressWithReferences` from 3 parts:
|
2023-04-01 20:40:32 +00:00
|
|
|
|
*
|
|
|
|
|
* @param method Way ingesting the file system data.
|
|
|
|
|
*
|
|
|
|
|
* @param hash Hash of ingested file system data.
|
|
|
|
|
*
|
|
|
|
|
* @param refs References to other store objects or oneself.
|
|
|
|
|
*
|
|
|
|
|
* Do note that not all combinations are supported.
|
|
|
|
|
*/
|
|
|
|
|
static ContentAddressWithReferences fromParts(
|
|
|
|
|
ContentAddressMethod method, Hash hash, StoreReferences refs);
|
|
|
|
|
|
|
|
|
|
ContentAddressMethod getMethod() const;
|
|
|
|
|
|
|
|
|
|
Hash getHash() const;
|
2023-03-30 21:12:49 +00:00
|
|
|
|
};
|
2020-10-12 23:51:23 +00:00
|
|
|
|
|
2020-06-01 21:32:27 +00:00
|
|
|
|
}
|