aboutsummaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
authorchriseth <chris@ethereum.org>2018-11-13 07:07:55 +0800
committerGitHub <noreply@github.com>2018-11-13 07:07:55 +0800
commitb14eec5babb416edf49aa15d6b4765dd579da823 (patch)
tree66cdcbd42cb479cd4fbb088ebe35cd33af76edb1
parent4eaed37b96c219c0486a125fc34c916cdb729026 (diff)
parent74557ceb0e520838d3e3a580cc30671a9c274ca7 (diff)
downloaddexon-solidity-b14eec5babb416edf49aa15d6b4765dd579da823.tar
dexon-solidity-b14eec5babb416edf49aa15d6b4765dd579da823.tar.gz
dexon-solidity-b14eec5babb416edf49aa15d6b4765dd579da823.tar.bz2
dexon-solidity-b14eec5babb416edf49aa15d6b4765dd579da823.tar.lz
dexon-solidity-b14eec5babb416edf49aa15d6b4765dd579da823.tar.xz
dexon-solidity-b14eec5babb416edf49aa15d6b4765dd579da823.tar.zst
dexon-solidity-b14eec5babb416edf49aa15d6b4765dd579da823.zip
Merge pull request #5392 from ethereum/yulStringRepositoryHash
[Yul] Deterministic YulStringRepository using string hashes.
-rw-r--r--libsolidity/interface/CompilerStack.cpp1
-rw-r--r--libyul/YulString.h93
-rw-r--r--test/libyul/Inliner.cpp6
-rw-r--r--test/libyul/YulOptimizerTest.cpp2
-rw-r--r--test/libyul/yulOptimizerTests/fullInliner/multi_fun_callback.yul13
5 files changed, 71 insertions, 44 deletions
diff --git a/libsolidity/interface/CompilerStack.cpp b/libsolidity/interface/CompilerStack.cpp
index e0909eb3..7aa0faa7 100644
--- a/libsolidity/interface/CompilerStack.cpp
+++ b/libsolidity/interface/CompilerStack.cpp
@@ -106,7 +106,6 @@ void CompilerStack::reset(bool _keepSources)
m_stackState = Empty;
m_sources.clear();
}
- yul::YulStringRepository::instance().reset();
m_libraries.clear();
m_evmVersion = EVMVersion();
m_optimize = false;
diff --git a/libyul/YulString.h b/libyul/YulString.h
index a8015239..ad900a70 100644
--- a/libyul/YulString.h
+++ b/libyul/YulString.h
@@ -22,7 +22,7 @@
#include <boost/noncopyable.hpp>
-#include <map>
+#include <unordered_map>
#include <memory>
#include <vector>
#include <string>
@@ -32,72 +32,101 @@ namespace dev
namespace yul
{
+/// Repository for YulStrings.
+/// Owns the string data for all YulStrings, which can be referenced by a Handle.
+/// A Handle consists of an ID (that depends on the insertion order of YulStrings and is potentially
+/// non-deterministic) and a deterministic string hash.
class YulStringRepository: boost::noncopyable
{
public:
- YulStringRepository()
+ struct Handle
{
- reset();
- }
+ size_t id;
+ std::uint64_t hash;
+ };
+ YulStringRepository():
+ m_strings{std::make_shared<std::string>()},
+ m_hashToID{std::make_pair(emptyHash(), 0)}
+ {}
static YulStringRepository& instance()
{
static YulStringRepository inst;
return inst;
}
- size_t stringToId(std::string const& _string)
+ Handle stringToHandle(std::string const& _string)
{
if (_string.empty())
- return 0;
- size_t& id = m_ids[_string];
- if (id == 0)
- {
- m_strings.emplace_back(std::make_shared<std::string>(_string));
- id = m_strings.size() - 1;
- }
- return id;
- }
- std::string const& idToString(size_t _id) const
- {
- return *m_strings.at(_id);
+ return { 0, emptyHash() };
+ std::uint64_t h = hash(_string);
+ auto range = m_hashToID.equal_range(h);
+ for (auto it = range.first; it != range.second; ++it)
+ if (*m_strings[it->second] == _string)
+ return Handle{it->second, h};
+ m_strings.emplace_back(std::make_shared<std::string>(_string));
+ size_t id = m_strings.size() - 1;
+ m_hashToID.emplace_hint(range.second, std::make_pair(h, id));
+ return Handle{id, h};
}
+ std::string const& idToString(size_t _id) const { return *m_strings.at(_id); }
- void reset()
+ static std::uint64_t hash(std::string const& v)
{
- m_strings.clear();
- m_ids.clear();
- m_strings.emplace_back(std::make_shared<std::string>());
- m_ids[std::string{}] = 0;
- }
+ // FNV hash - can be replaced by a better one, e.g. xxhash64
+ std::uint64_t hash = emptyHash();
+ for (auto c: v)
+ {
+ hash *= 1099511628211u;
+ hash ^= c;
+ }
+ return hash;
+ }
+ static constexpr std::uint64_t emptyHash() { return 14695981039346656037u; }
private:
std::vector<std::shared_ptr<std::string>> m_strings;
- std::map<std::string, size_t> m_ids;
+ std::unordered_multimap<std::uint64_t, size_t> m_hashToID;
};
+/// Wrapper around handles into the YulString repository.
+/// Equality of two YulStrings is determined by comparing their ID.
+/// The <-operator depends on the string hash and is not consistent
+/// with string comparisons (however, it is still deterministic).
class YulString
{
public:
YulString() = default;
- explicit YulString(std::string const& _s): m_id(YulStringRepository::instance().stringToId(_s)) {}
+ explicit YulString(std::string const& _s): m_handle(YulStringRepository::instance().stringToHandle(_s)) {}
YulString(YulString const&) = default;
YulString(YulString&&) = default;
YulString& operator=(YulString const&) = default;
YulString& operator=(YulString&&) = default;
/// This is not consistent with the string <-operator!
- bool operator<(YulString const& _other) const { return m_id < _other.m_id; }
- bool operator==(YulString const& _other) const { return m_id == _other.m_id; }
- bool operator!=(YulString const& _other) const { return m_id != _other.m_id; }
+ /// First compares the string hashes. If they are equal
+ /// it checks for identical IDs (only identical strings have
+ /// identical IDs and identical strings do not compare as "less").
+ /// If the hashes are identical and the strings are distinct, it
+ /// falls back to string comparison.
+ bool operator<(YulString const& _other) const
+ {
+ if (m_handle.hash < _other.m_handle.hash) return true;
+ if (_other.m_handle.hash < m_handle.hash) return false;
+ if (m_handle.id == _other.m_handle.id) return false;
+ return str() < _other.str();
+ }
+ /// Equality is determined based on the string ID.
+ bool operator==(YulString const& _other) const { return m_handle.id == _other.m_handle.id; }
+ bool operator!=(YulString const& _other) const { return m_handle.id != _other.m_handle.id; }
- bool empty() const { return m_id == 0; }
+ bool empty() const { return m_handle.id == 0; }
std::string const& str() const
{
- return YulStringRepository::instance().idToString(m_id);
+ return YulStringRepository::instance().idToString(m_handle.id);
}
private:
- /// ID of the string. Assumes that the empty string has ID zero.
- size_t m_id = 0;
+ /// Handle of the string. Assumes that the empty string has ID zero.
+ YulStringRepository::Handle m_handle{ 0, YulStringRepository::emptyHash() };
};
}
diff --git a/test/libyul/Inliner.cpp b/test/libyul/Inliner.cpp
index 4ed52b47..66810298 100644
--- a/test/libyul/Inliner.cpp
+++ b/test/libyul/Inliner.cpp
@@ -71,7 +71,7 @@ BOOST_AUTO_TEST_CASE(simple)
BOOST_CHECK_EQUAL(inlinableFunctions("{"
"function g(a:u256) -> b:u256 { b := a }"
"function f() -> x:u256 { x := g(2:u256) }"
- "}"), "f,g");
+ "}"), "g,f");
}
BOOST_AUTO_TEST_CASE(simple_inside_structures)
@@ -82,7 +82,7 @@ BOOST_AUTO_TEST_CASE(simple_inside_structures)
"function g(a:u256) -> b:u256 { b := a }"
"function f() -> x:u256 { x := g(2:u256) }"
"}"
- "}"), "f,g");
+ "}"), "g,f");
BOOST_CHECK_EQUAL(inlinableFunctions("{"
"for {"
"function g(a:u256) -> b:u256 { b := a }"
@@ -92,7 +92,7 @@ BOOST_AUTO_TEST_CASE(simple_inside_structures)
"{"
"function h() -> y:u256 { y := 2:u256 }"
"}"
- "}"), "f,g,h");
+ "}"), "h,g,f");
}
BOOST_AUTO_TEST_CASE(negative)
diff --git a/test/libyul/YulOptimizerTest.cpp b/test/libyul/YulOptimizerTest.cpp
index 162b167c..03cd6446 100644
--- a/test/libyul/YulOptimizerTest.cpp
+++ b/test/libyul/YulOptimizerTest.cpp
@@ -90,8 +90,6 @@ YulOptimizerTest::YulOptimizerTest(string const& _filename)
bool YulOptimizerTest::run(ostream& _stream, string const& _linePrefix, bool const _formatted)
{
- yul::YulStringRepository::instance().reset();
-
assembly::AsmPrinter printer{m_yul};
shared_ptr<Block> ast;
shared_ptr<assembly::AsmAnalysisInfo> analysisInfo;
diff --git a/test/libyul/yulOptimizerTests/fullInliner/multi_fun_callback.yul b/test/libyul/yulOptimizerTests/fullInliner/multi_fun_callback.yul
index d09877de..19ac945e 100644
--- a/test/libyul/yulOptimizerTests/fullInliner/multi_fun_callback.yul
+++ b/test/libyul/yulOptimizerTests/fullInliner/multi_fun_callback.yul
@@ -41,18 +41,19 @@
// h_t := 2
// mstore(7, h_t)
// let g_x_1 := 10
-// f(1)
+// let g_f_x_8 := 1
+// mstore(0, g_f_x_8)
+// mstore(7, h())
+// g(10)
+// mstore(1, g_f_x_8)
// mstore(1, x)
// }
// function g(x_1)
// {
// let f_x_8 := 1
// mstore(0, f_x_8)
-// let f_h_t
-// f_h_t := 2
-// mstore(7, f_h_t)
-// let f_g_x_1 := 10
-// f(1)
+// mstore(7, h())
+// g(10)
// mstore(1, f_x_8)
// }
// function h() -> t