forked from lix-project/lix
Move ChunkedVector to its own header
This commit is contained in:
parent
8adaa6acb5
commit
7ca6fbc8ca
4 changed files with 70 additions and 59 deletions
|
@ -6,6 +6,7 @@
|
||||||
#include "value.hh"
|
#include "value.hh"
|
||||||
#include "symbol-table.hh"
|
#include "symbol-table.hh"
|
||||||
#include "error.hh"
|
#include "error.hh"
|
||||||
|
#include "chunked-vector.hh"
|
||||||
|
|
||||||
|
|
||||||
namespace nix {
|
namespace nix {
|
||||||
|
|
|
@ -5,6 +5,7 @@
|
||||||
#include <unordered_map>
|
#include <unordered_map>
|
||||||
|
|
||||||
#include "types.hh"
|
#include "types.hh"
|
||||||
|
#include "chunked-vector.hh"
|
||||||
|
|
||||||
namespace nix {
|
namespace nix {
|
||||||
|
|
||||||
|
|
68
src/libutil/chunked-vector.hh
Normal file
68
src/libutil/chunked-vector.hh
Normal file
|
@ -0,0 +1,68 @@
|
||||||
|
#pragma once
|
||||||
|
|
||||||
|
#include <bits/stdint-uintn.h>
|
||||||
|
#include <cstdlib>
|
||||||
|
#include <vector>
|
||||||
|
#include <limits>
|
||||||
|
|
||||||
|
namespace nix {
|
||||||
|
|
||||||
|
/* Provides an indexable, append-only container like vector<> with memory
   overhead guarantees like list<> by allocating storage in chunks of
   ChunkSize elements instead of using a contiguous memory allocation like
   vector<> does. Not using a single vector that is resized reduces memory
   overhead on large data sets by on average (growth factor)/2, mostly
   eliminates copies within the vector during resizing, and provides stable
   references to its elements.

   Indices and the element count are 32 bits wide; the process is aborted
   rather than letting the count wrap around. */
template<typename T, size_t ChunkSize>
class ChunkedVector {
    /* operator[] divides by ChunkSize, and the overflow guard in addChunk()
       computes max() - ChunkSize, so both bounds are required. */
    static_assert(ChunkSize > 0, "ChunkedVector: ChunkSize must be non-zero");
    static_assert(ChunkSize < std::numeric_limits<uint32_t>::max(),
        "ChunkedVector: ChunkSize must be smaller than the uint32_t index range");

private:
    /* Number of elements successfully stored so far. */
    uint32_t size_ = 0;
    /* Every chunk is reserved to ChunkSize up front and never holds more
       than ChunkSize elements, so chunks do not reallocate their storage. */
    std::vector<std::vector<T>> chunks;

    /* Appends a new, empty chunk with capacity for ChunkSize elements and
       returns a reference to it. Aborts if another full chunk could push
       the element count past the uint32_t range.

       keep this out of the ::add hot path */
    [[gnu::noinline]]
    auto & addChunk()
    {
        if (size_ >= std::numeric_limits<uint32_t>::max() - ChunkSize)
            abort();
        /* Reserve before publishing the chunk: if the allocation throws,
           `chunks` must not be left with a zero-capacity chunk that a
           later add() would grow by reallocation, which would break the
           stable-reference guarantee. */
        std::vector<T> chunk;
        chunk.reserve(ChunkSize);
        chunks.push_back(std::move(chunk));
        return chunks.back();
    }

public:
    /* Creates an empty container. `reserve` is the number of chunks (not
       elements) to pre-reserve bookkeeping space for; the first chunk is
       allocated immediately so that add() always finds a last chunk. */
    ChunkedVector(uint32_t reserve)
    {
        chunks.reserve(reserve);
        addChunk();
    }

    /* Returns the number of elements stored. */
    uint32_t size() const { return size_; }

    /* Appends `value` and returns a reference to the stored element
       together with its index. If storing the element throws, the
       container is left unchanged as far as size() and indexing are
       concerned. */
    std::pair<T &, uint32_t> add(T value)
    {
        const uint32_t idx = size_;
        auto & chunk = [&] () -> auto & {
            if (auto & back = chunks.back(); back.size() < ChunkSize)
                return back;
            return addChunk();
        }();
        auto & result = chunk.emplace_back(std::move(value));
        /* Count the element only once it is actually in place, so that an
           exception from the allocation or from T's move constructor
           cannot leave size() ahead of the stored elements. */
        size_ = idx + 1;
        return {result, idx};
    }

    /* Returns the element at index `idx`. No bounds checking is done;
       `idx` must be less than size(). */
    const T & operator[](uint32_t idx) const
    {
        return chunks[idx / ChunkSize][idx % ChunkSize];
    }

    /* Calls fn(element) for every stored element in insertion order. */
    template<typename Fn>
    void forEach(Fn fn) const
    {
        for (const auto & c : chunks)
            for (const auto & e : c)
                fn(e);
    }
};
|
||||||
|
}
|
|
@ -103,63 +103,4 @@ public:
|
||||||
Ptr operator->() const { return Ptr(**this); }
|
Ptr operator->() const { return Ptr(**this); }
|
||||||
};
|
};
|
||||||
|
|
||||||
/* Provides an indexable, append-only container like vector<> with memory
   overhead guarantees like list<> by allocating storage in chunks of
   ChunkSize elements instead of using a contiguous memory allocation like
   vector<> does. Not using a single vector that is resized reduces memory
   overhead on large data sets by on average (growth factor)/2, mostly
   eliminates copies within the vector during resizing, and provides stable
   references to its elements.

   Indices and the element count are 32 bits wide; the process is aborted
   rather than letting the count wrap around. */
template<typename T, size_t ChunkSize>
class ChunkedVector {
    /* operator[] divides by ChunkSize, and the overflow guard in addChunk()
       computes max() - ChunkSize, so both bounds are required. */
    static_assert(ChunkSize > 0, "ChunkedVector: ChunkSize must be non-zero");
    static_assert(ChunkSize < std::numeric_limits<uint32_t>::max(),
        "ChunkedVector: ChunkSize must be smaller than the uint32_t index range");

private:
    /* Number of elements successfully stored so far. */
    uint32_t size_ = 0;
    /* Every chunk is reserved to ChunkSize up front and never holds more
       than ChunkSize elements, so chunks do not reallocate their storage. */
    std::vector<std::vector<T>> chunks;

    /* Appends a new, empty chunk with capacity for ChunkSize elements and
       returns a reference to it. Aborts if another full chunk could push
       the element count past the uint32_t range.

       keep this out of the ::add hot path */
    [[gnu::noinline]]
    auto & addChunk()
    {
        if (size_ >= std::numeric_limits<uint32_t>::max() - ChunkSize)
            abort();
        /* Reserve before publishing the chunk: if the allocation throws,
           `chunks` must not be left with a zero-capacity chunk that a
           later add() would grow by reallocation, which would break the
           stable-reference guarantee. */
        std::vector<T> chunk;
        chunk.reserve(ChunkSize);
        chunks.push_back(std::move(chunk));
        return chunks.back();
    }

public:
    /* Creates an empty container. `reserve` is the number of chunks (not
       elements) to pre-reserve bookkeeping space for; the first chunk is
       allocated immediately so that add() always finds a last chunk. */
    ChunkedVector(uint32_t reserve)
    {
        chunks.reserve(reserve);
        addChunk();
    }

    /* Returns the number of elements stored. */
    uint32_t size() const { return size_; }

    /* Appends `value` and returns a reference to the stored element
       together with its index. If storing the element throws, the
       container is left unchanged as far as size() and indexing are
       concerned. */
    std::pair<T &, uint32_t> add(T value)
    {
        const uint32_t idx = size_;
        auto & chunk = [&] () -> auto & {
            if (auto & back = chunks.back(); back.size() < ChunkSize)
                return back;
            return addChunk();
        }();
        auto & result = chunk.emplace_back(std::move(value));
        /* Count the element only once it is actually in place, so that an
           exception from the allocation or from T's move constructor
           cannot leave size() ahead of the stored elements. */
        size_ = idx + 1;
        return {result, idx};
    }

    /* Returns the element at index `idx`. No bounds checking is done;
       `idx` must be less than size(). */
    const T & operator[](uint32_t idx) const
    {
        return chunks[idx / ChunkSize][idx % ChunkSize];
    }

    /* Calls fn(element) for every stored element in insertion order. */
    template<typename Fn>
    void forEach(Fn fn) const
    {
        for (const auto & c : chunks)
            for (const auto & e : c)
                fn(e);
    }
};
|
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
Loading…
Reference in a new issue