aboutsummaryrefslogtreecommitdiffstats
path: root/libyul/YulString.h
diff options
context:
space:
mode:
authorDaniel Kirchner <daniel@ekpyron.org>2018-11-10 03:21:26 +0800
committerDaniel Kirchner <daniel@ekpyron.org>2018-11-13 06:43:16 +0800
commit74557ceb0e520838d3e3a580cc30671a9c274ca7 (patch)
tree1015ebc5d46f250d314aaf80a849aaf0eae47882 /libyul/YulString.h
parent09f8ff27fc576dbbd05e31471bb39c00abe90563 (diff)
downloaddexon-solidity-74557ceb0e520838d3e3a580cc30671a9c274ca7.tar.gz
dexon-solidity-74557ceb0e520838d3e3a580cc30671a9c274ca7.tar.zst
dexon-solidity-74557ceb0e520838d3e3a580cc30671a9c274ca7.zip
Deterministic YulStringRepository using string hashes.
Diffstat (limited to 'libyul/YulString.h')
-rw-r--r--libyul/YulString.h93
1 files changed, 61 insertions, 32 deletions
diff --git a/libyul/YulString.h b/libyul/YulString.h
index a8015239..ad900a70 100644
--- a/libyul/YulString.h
+++ b/libyul/YulString.h
@@ -22,7 +22,7 @@
#include <boost/noncopyable.hpp>
-#include <map>
+#include <unordered_map>
#include <memory>
#include <vector>
#include <string>
@@ -32,72 +32,101 @@ namespace dev
namespace yul
{
+/// Repository for YulStrings.
+/// Owns the string data for all YulStrings, which can be referenced by a Handle.
+/// A Handle consists of an ID (that depends on the insertion order of YulStrings and is potentially
+/// non-deterministic) and a deterministic string hash.
class YulStringRepository: boost::noncopyable
{
public:
- YulStringRepository()
+ struct Handle
{
- reset();
- }
+ size_t id;
+ std::uint64_t hash;
+ };
+ YulStringRepository():
+ m_strings{std::make_shared<std::string>()},
+ m_hashToID{std::make_pair(emptyHash(), 0)}
+ {}
static YulStringRepository& instance()
{
static YulStringRepository inst;
return inst;
}
- size_t stringToId(std::string const& _string)
+ Handle stringToHandle(std::string const& _string)
{
if (_string.empty())
- return 0;
- size_t& id = m_ids[_string];
- if (id == 0)
- {
- m_strings.emplace_back(std::make_shared<std::string>(_string));
- id = m_strings.size() - 1;
- }
- return id;
- }
- std::string const& idToString(size_t _id) const
- {
- return *m_strings.at(_id);
+ return { 0, emptyHash() };
+ std::uint64_t h = hash(_string);
+ auto range = m_hashToID.equal_range(h);
+ for (auto it = range.first; it != range.second; ++it)
+ if (*m_strings[it->second] == _string)
+ return Handle{it->second, h};
+ m_strings.emplace_back(std::make_shared<std::string>(_string));
+ size_t id = m_strings.size() - 1;
+ m_hashToID.emplace_hint(range.second, std::make_pair(h, id));
+ return Handle{id, h};
}
+ std::string const& idToString(size_t _id) const { return *m_strings.at(_id); }
- void reset()
+ static std::uint64_t hash(std::string const& v)
{
- m_strings.clear();
- m_ids.clear();
- m_strings.emplace_back(std::make_shared<std::string>());
- m_ids[std::string{}] = 0;
- }
+ // FNV hash - can be replaced by a better one, e.g. xxhash64
+ std::uint64_t hash = emptyHash();
+ for (auto c: v)
+ {
+ hash *= 1099511628211u;
+ hash ^= c;
+ }
+ return hash;
+ }
+ static constexpr std::uint64_t emptyHash() { return 14695981039346656037u; }
private:
std::vector<std::shared_ptr<std::string>> m_strings;
- std::map<std::string, size_t> m_ids;
+ std::unordered_multimap<std::uint64_t, size_t> m_hashToID;
};
+/// Wrapper around handles into the YulString repository.
+/// Equality of two YulStrings is determined by comparing their ID.
+/// The <-operator depends on the string hash and is not consistent
+/// with string comparisons (however, it is still deterministic).
class YulString
{
public:
YulString() = default;
- explicit YulString(std::string const& _s): m_id(YulStringRepository::instance().stringToId(_s)) {}
+ explicit YulString(std::string const& _s): m_handle(YulStringRepository::instance().stringToHandle(_s)) {}
YulString(YulString const&) = default;
YulString(YulString&&) = default;
YulString& operator=(YulString const&) = default;
YulString& operator=(YulString&&) = default;
/// This is not consistent with the string <-operator!
- bool operator<(YulString const& _other) const { return m_id < _other.m_id; }
- bool operator==(YulString const& _other) const { return m_id == _other.m_id; }
- bool operator!=(YulString const& _other) const { return m_id != _other.m_id; }
+ /// First compares the string hashes. If they are equal
+ /// it checks for identical IDs (only identical strings have
+ /// identical IDs and identical strings do not compare as "less").
+ /// If the hashes are identical and the strings are distinct, it
+ /// falls back to string comparison.
+ bool operator<(YulString const& _other) const
+ {
+ if (m_handle.hash < _other.m_handle.hash) return true;
+ if (_other.m_handle.hash < m_handle.hash) return false;
+ if (m_handle.id == _other.m_handle.id) return false;
+ return str() < _other.str();
+ }
+ /// Equality is determined based on the string ID.
+ bool operator==(YulString const& _other) const { return m_handle.id == _other.m_handle.id; }
+ bool operator!=(YulString const& _other) const { return m_handle.id != _other.m_handle.id; }
- bool empty() const { return m_id == 0; }
+ bool empty() const { return m_handle.id == 0; }
std::string const& str() const
{
- return YulStringRepository::instance().idToString(m_id);
+ return YulStringRepository::instance().idToString(m_handle.id);
}
private:
- /// ID of the string. Assumes that the empty string has ID zero.
- size_t m_id = 0;
+ /// Handle of the string. Assumes that the empty string has ID zero.
+ YulStringRepository::Handle m_handle{ 0, YulStringRepository::emptyHash() };
};
}