chriseth
10 years ago
12 changed files with 796 additions and 354 deletions
@ -0,0 +1,326 @@ |
|||
/*
|
|||
This file is part of cpp-ethereum. |
|||
|
|||
cpp-ethereum is free software: you can redistribute it and/or modify |
|||
it under the terms of the GNU General Public License as published by |
|||
the Free Software Foundation, either version 3 of the License, or |
|||
(at your option) any later version. |
|||
|
|||
cpp-ethereum is distributed in the hope that it will be useful, |
|||
but WITHOUT ANY WARRANTY; without even the implied warranty of |
|||
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
|||
GNU General Public License for more details. |
|||
|
|||
You should have received a copy of the GNU General Public License |
|||
along with cpp-ethereum. If not, see <http://www.gnu.org/licenses/>.
|
|||
*/ |
|||
/**
|
|||
* @file KnownState.cpp |
|||
* @author Christian <c@ethdev.com> |
|||
* @date 2015 |
|||
* Contains knowledge about the state of the virtual machine at a specific instruction. |
|||
*/ |
|||
|
|||
#include "KnownState.h" |
|||
#include <functional> |
|||
#include <libdevcrypto/SHA3.h> |
|||
#include <libevmasm/AssemblyItem.h> |
|||
|
|||
using namespace std; |
|||
using namespace dev; |
|||
using namespace dev::eth; |
|||
|
|||
ostream& KnownState::stream(ostream& _out) const |
|||
{ |
|||
auto streamExpressionClass = [this](ostream& _out, Id _id) |
|||
{ |
|||
auto const& expr = m_expressionClasses->representative(_id); |
|||
_out << " " << dec << _id << ": "; |
|||
if (!expr.item) |
|||
_out << " no item"; |
|||
else if (expr.item->type() == UndefinedItem) |
|||
_out << " unknown " << int(expr.item->data()); |
|||
else |
|||
_out << *expr.item; |
|||
if (expr.sequenceNumber) |
|||
_out << "@" << dec << expr.sequenceNumber; |
|||
_out << "("; |
|||
for (Id arg: expr.arguments) |
|||
_out << dec << arg << ","; |
|||
_out << ")" << endl; |
|||
}; |
|||
|
|||
_out << "=== State ===" << endl; |
|||
_out << "Stack height: " << dec << m_stackHeight << endl; |
|||
_out << "Equivalence classes: " << endl; |
|||
for (Id eqClass = 0; eqClass < m_expressionClasses->size(); ++eqClass) |
|||
streamExpressionClass(_out, eqClass); |
|||
|
|||
_out << "Stack: " << endl; |
|||
for (auto const& it: m_stackElements) |
|||
{ |
|||
_out << " " << dec << it.first << ": "; |
|||
streamExpressionClass(_out, it.second); |
|||
} |
|||
_out << "Storage: " << endl; |
|||
for (auto const& it: m_storageContent) |
|||
{ |
|||
_out << " "; |
|||
streamExpressionClass(_out, it.first); |
|||
_out << ": "; |
|||
streamExpressionClass(_out, it.second); |
|||
} |
|||
_out << "Memory: " << endl; |
|||
for (auto const& it: m_memoryContent) |
|||
{ |
|||
_out << " "; |
|||
streamExpressionClass(_out, it.first); |
|||
_out << ": "; |
|||
streamExpressionClass(_out, it.second); |
|||
} |
|||
|
|||
return _out; |
|||
} |
|||
|
|||
KnownState::StoreOperation KnownState::feedItem(AssemblyItem const& _item, bool _copyItem) |
|||
{ |
|||
StoreOperation op; |
|||
if (_item.type() == Tag) |
|||
{ |
|||
// can be ignored
|
|||
} |
|||
else if (_item.type() != Operation) |
|||
{ |
|||
assertThrow(_item.deposit() == 1, InvalidDeposit, ""); |
|||
setStackElement(++m_stackHeight, m_expressionClasses->find(_item, {}, _copyItem)); |
|||
} |
|||
else |
|||
{ |
|||
Instruction instruction = _item.instruction(); |
|||
InstructionInfo info = instructionInfo(instruction); |
|||
if (SemanticInformation::isDupInstruction(_item)) |
|||
setStackElement( |
|||
m_stackHeight + 1, |
|||
stackElement( |
|||
m_stackHeight - int(instruction) + int(Instruction::DUP1), |
|||
_item.getLocation() |
|||
) |
|||
); |
|||
else if (SemanticInformation::isSwapInstruction(_item)) |
|||
swapStackElements( |
|||
m_stackHeight, |
|||
m_stackHeight - 1 - int(instruction) + int(Instruction::SWAP1), |
|||
_item.getLocation() |
|||
); |
|||
else if (instruction != Instruction::POP) |
|||
{ |
|||
vector<Id> arguments(info.args); |
|||
for (int i = 0; i < info.args; ++i) |
|||
arguments[i] = stackElement(m_stackHeight - i, _item.getLocation()); |
|||
|
|||
if (_item.instruction() == Instruction::SSTORE) |
|||
op = storeInStorage(arguments[0], arguments[1], _item.getLocation()); |
|||
else if (_item.instruction() == Instruction::SLOAD) |
|||
setStackElement( |
|||
m_stackHeight + _item.deposit(), |
|||
loadFromStorage(arguments[0], _item.getLocation()) |
|||
); |
|||
else if (_item.instruction() == Instruction::MSTORE) |
|||
op = storeInMemory(arguments[0], arguments[1], _item.getLocation()); |
|||
else if (_item.instruction() == Instruction::MLOAD) |
|||
setStackElement( |
|||
m_stackHeight + _item.deposit(), |
|||
loadFromMemory(arguments[0], _item.getLocation()) |
|||
); |
|||
else if (_item.instruction() == Instruction::SHA3) |
|||
setStackElement( |
|||
m_stackHeight + _item.deposit(), |
|||
applySha3(arguments.at(0), arguments.at(1), _item.getLocation()) |
|||
); |
|||
else |
|||
{ |
|||
if (SemanticInformation::invalidatesMemory(_item.instruction())) |
|||
resetMemory(); |
|||
if (SemanticInformation::invalidatesStorage(_item.instruction())) |
|||
resetStorage(); |
|||
assertThrow(info.ret <= 1, InvalidDeposit, ""); |
|||
if (info.ret == 1) |
|||
setStackElement( |
|||
m_stackHeight + _item.deposit(), |
|||
m_expressionClasses->find(_item, arguments, _copyItem) |
|||
); |
|||
} |
|||
} |
|||
m_stackElements.erase( |
|||
m_stackElements.upper_bound(m_stackHeight + _item.deposit()), |
|||
m_stackElements.end() |
|||
); |
|||
m_stackHeight += _item.deposit(); |
|||
} |
|||
return op; |
|||
} |
|||
|
|||
void KnownState::reduceToCommonKnowledge(KnownState const& /*_other*/) |
|||
{ |
|||
//@todo
|
|||
*this = KnownState(m_expressionClasses); |
|||
} |
|||
|
|||
bool KnownState::operator==(const KnownState& _other) const |
|||
{ |
|||
//@todo
|
|||
return ( |
|||
m_stackElements.empty() && |
|||
_other.m_stackElements.empty() && |
|||
m_storageContent.empty() && |
|||
_other.m_storageContent.empty() && |
|||
m_memoryContent.empty() && |
|||
_other.m_memoryContent.empty() |
|||
); |
|||
} |
|||
|
|||
ExpressionClasses::Id KnownState::stackElement(int _stackHeight, SourceLocation const& _location) |
|||
{ |
|||
if (m_stackElements.count(_stackHeight)) |
|||
return m_stackElements.at(_stackHeight); |
|||
// Stack element not found (not assigned yet), create new unknown equivalence class.
|
|||
//@todo check that we do not infer incorrect equivalences when the stack is cleared partially
|
|||
//in between.
|
|||
return m_stackElements[_stackHeight] = initialStackElement(_stackHeight, _location); |
|||
} |
|||
|
|||
ExpressionClasses::Id KnownState::initialStackElement( |
|||
int _stackHeight, |
|||
SourceLocation const& _location |
|||
) |
|||
{ |
|||
// This is a special assembly item that refers to elements pre-existing on the initial stack.
|
|||
return m_expressionClasses->find(AssemblyItem(UndefinedItem, u256(_stackHeight), _location)); |
|||
} |
|||
|
|||
void KnownState::setStackElement(int _stackHeight, Id _class) |
|||
{ |
|||
m_stackElements[_stackHeight] = _class; |
|||
} |
|||
|
|||
void KnownState::swapStackElements( |
|||
int _stackHeightA, |
|||
int _stackHeightB, |
|||
SourceLocation const& _location |
|||
) |
|||
{ |
|||
assertThrow(_stackHeightA != _stackHeightB, OptimizerException, "Swap on same stack elements."); |
|||
// ensure they are created
|
|||
stackElement(_stackHeightA, _location); |
|||
stackElement(_stackHeightB, _location); |
|||
|
|||
swap(m_stackElements[_stackHeightA], m_stackElements[_stackHeightB]); |
|||
} |
|||
|
|||
KnownState::StoreOperation KnownState::storeInStorage( |
|||
Id _slot, |
|||
Id _value, |
|||
SourceLocation const& _location) |
|||
{ |
|||
if (m_storageContent.count(_slot) && m_storageContent[_slot] == _value) |
|||
// do not execute the storage if we know that the value is already there
|
|||
return StoreOperation(); |
|||
m_sequenceNumber++; |
|||
decltype(m_storageContent) storageContents; |
|||
// Copy over all values (i.e. retain knowledge about them) where we know that this store
|
|||
// operation will not destroy the knowledge. Specifically, we copy storage locations we know
|
|||
// are different from _slot or locations where we know that the stored value is equal to _value.
|
|||
for (auto const& storageItem: m_storageContent) |
|||
if (m_expressionClasses->knownToBeDifferent(storageItem.first, _slot) || storageItem.second == _value) |
|||
storageContents.insert(storageItem); |
|||
m_storageContent = move(storageContents); |
|||
|
|||
AssemblyItem item(Instruction::SSTORE, _location); |
|||
Id id = m_expressionClasses->find(item, {_slot, _value}, true, m_sequenceNumber); |
|||
StoreOperation operation(StoreOperation::Storage, _slot, m_sequenceNumber, id); |
|||
m_storageContent[_slot] = _value; |
|||
// increment a second time so that we get unique sequence numbers for writes
|
|||
m_sequenceNumber++; |
|||
|
|||
return operation; |
|||
} |
|||
|
|||
ExpressionClasses::Id KnownState::loadFromStorage(Id _slot, SourceLocation const& _location) |
|||
{ |
|||
if (m_storageContent.count(_slot)) |
|||
return m_storageContent.at(_slot); |
|||
|
|||
AssemblyItem item(Instruction::SLOAD, _location); |
|||
return m_storageContent[_slot] = m_expressionClasses->find(item, {_slot}, true, m_sequenceNumber); |
|||
} |
|||
|
|||
KnownState::StoreOperation KnownState::storeInMemory(Id _slot, Id _value, SourceLocation const& _location) |
|||
{ |
|||
if (m_memoryContent.count(_slot) && m_memoryContent[_slot] == _value) |
|||
// do not execute the store if we know that the value is already there
|
|||
return StoreOperation(); |
|||
m_sequenceNumber++; |
|||
decltype(m_memoryContent) memoryContents; |
|||
// copy over values at points where we know that they are different from _slot by at least 32
|
|||
for (auto const& memoryItem: m_memoryContent) |
|||
if (m_expressionClasses->knownToBeDifferentBy32(memoryItem.first, _slot)) |
|||
memoryContents.insert(memoryItem); |
|||
m_memoryContent = move(memoryContents); |
|||
|
|||
AssemblyItem item(Instruction::MSTORE, _location); |
|||
Id id = m_expressionClasses->find(item, {_slot, _value}, true, m_sequenceNumber); |
|||
StoreOperation operation(StoreOperation(StoreOperation::Memory, _slot, m_sequenceNumber, id)); |
|||
m_memoryContent[_slot] = _value; |
|||
// increment a second time so that we get unique sequence numbers for writes
|
|||
m_sequenceNumber++; |
|||
return operation; |
|||
} |
|||
|
|||
ExpressionClasses::Id KnownState::loadFromMemory(Id _slot, SourceLocation const& _location) |
|||
{ |
|||
if (m_memoryContent.count(_slot)) |
|||
return m_memoryContent.at(_slot); |
|||
|
|||
AssemblyItem item(Instruction::MLOAD, _location); |
|||
return m_memoryContent[_slot] = m_expressionClasses->find(item, {_slot}, true, m_sequenceNumber); |
|||
} |
|||
|
|||
KnownState::Id KnownState::applySha3( |
|||
Id _start, |
|||
Id _length, |
|||
SourceLocation const& _location |
|||
) |
|||
{ |
|||
AssemblyItem sha3Item(Instruction::SHA3, _location); |
|||
// Special logic if length is a short constant, otherwise we cannot tell.
|
|||
u256 const* l = m_expressionClasses->knownConstant(_length); |
|||
// unknown or too large length
|
|||
if (!l || *l > 128) |
|||
return m_expressionClasses->find(sha3Item, {_start, _length}, true, m_sequenceNumber); |
|||
|
|||
vector<Id> arguments; |
|||
for (u256 i = 0; i < *l; i += 32) |
|||
{ |
|||
Id slot = m_expressionClasses->find( |
|||
AssemblyItem(Instruction::ADD, _location), |
|||
{_start, m_expressionClasses->find(i)} |
|||
); |
|||
arguments.push_back(loadFromMemory(slot, _location)); |
|||
} |
|||
if (m_knownSha3Hashes.count(arguments)) |
|||
return m_knownSha3Hashes.at(arguments); |
|||
Id v; |
|||
// If all arguments are known constants, compute the sha3 here
|
|||
if (all_of(arguments.begin(), arguments.end(), [this](Id _a) { return !!m_expressionClasses->knownConstant(_a); })) |
|||
{ |
|||
bytes data; |
|||
for (Id a: arguments) |
|||
data += toBigEndian(*m_expressionClasses->knownConstant(a)); |
|||
data.resize(size_t(*l)); |
|||
v = m_expressionClasses->find(AssemblyItem(u256(sha3(data)), _location)); |
|||
} |
|||
else |
|||
v = m_expressionClasses->find(sha3Item, {_start, _length}, true, m_sequenceNumber); |
|||
return m_knownSha3Hashes[arguments] = v; |
|||
} |
|||
|
@ -0,0 +1,163 @@ |
|||
/*
|
|||
This file is part of cpp-ethereum. |
|||
|
|||
cpp-ethereum is free software: you can redistribute it and/or modify |
|||
it under the terms of the GNU General Public License as published by |
|||
the Free Software Foundation, either version 3 of the License, or |
|||
(at your option) any later version. |
|||
|
|||
cpp-ethereum is distributed in the hope that it will be useful, |
|||
but WITHOUT ANY WARRANTY; without even the implied warranty of |
|||
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
|||
GNU General Public License for more details. |
|||
|
|||
You should have received a copy of the GNU General Public License |
|||
along with cpp-ethereum. If not, see <http://www.gnu.org/licenses/>.
|
|||
*/ |
|||
/**
|
|||
* @file KnownState.h |
|||
* @author Christian <c@ethdev.com> |
|||
* @date 2015 |
|||
* Contains knowledge about the state of the virtual machine at a specific instruction. |
|||
*/ |
|||
|
|||
#pragma once |
|||
|
|||
#include <vector> |
|||
#include <map> |
|||
#include <set> |
|||
#include <tuple> |
|||
#include <memory> |
|||
#include <ostream> |
|||
#include <libdevcore/CommonIO.h> |
|||
#include <libdevcore/Exceptions.h> |
|||
#include <libevmasm/ExpressionClasses.h> |
|||
#include <libevmasm/SemanticInformation.h> |
|||
|
|||
namespace dev |
|||
{ |
|||
namespace eth |
|||
{ |
|||
|
|||
class AssemblyItem; |
|||
using AssemblyItems = std::vector<AssemblyItem>; |
|||
|
|||
/**
|
|||
* Class to infer and store knowledge about the state of the virtual machine at a specific |
|||
* instruction. |
|||
* |
|||
* The general workings are that for each assembly item that is fed, an equivalence class is |
|||
* derived from the operation and the equivalence class of its arguments. DUPi, SWAPi and some |
|||
* arithmetic instructions are used to infer equivalences while these classes are determined. |
|||
*/ |
|||
class KnownState |
|||
{ |
|||
public: |
|||
using Id = ExpressionClasses::Id; |
|||
struct StoreOperation |
|||
{ |
|||
enum Target { Invalid, Memory, Storage }; |
|||
StoreOperation(): target(Invalid), sequenceNumber(-1) {} |
|||
StoreOperation( |
|||
Target _target, |
|||
Id _slot, |
|||
unsigned _sequenceNumber, |
|||
Id _expression |
|||
): target(_target), slot(_slot), sequenceNumber(_sequenceNumber), expression(_expression) {} |
|||
bool isValid() const { return target != Invalid; } |
|||
Target target; |
|||
Id slot; |
|||
unsigned sequenceNumber; |
|||
Id expression; |
|||
}; |
|||
|
|||
explicit KnownState( |
|||
std::shared_ptr<ExpressionClasses> _expressionClasses = std::make_shared<ExpressionClasses>() |
|||
): m_expressionClasses(_expressionClasses) |
|||
{ |
|||
} |
|||
|
|||
/// Streams debugging information to @a _out.
|
|||
std::ostream& stream(std::ostream& _out) const; |
|||
|
|||
/// Feeds the item into the system for analysis.
|
|||
/// @returns a possible store operation
|
|||
StoreOperation feedItem(AssemblyItem const& _item, bool _copyItem = false); |
|||
|
|||
/// Resets any knowledge about storage.
|
|||
void resetStorage() { m_storageContent.clear(); } |
|||
/// Resets any knowledge about storage.
|
|||
void resetMemory() { m_memoryContent.clear(); } |
|||
/// Resets any knowledge about the current stack.
|
|||
void resetStack() { m_stackElements.clear(); m_stackHeight = 0; } |
|||
/// Resets any knowledge.
|
|||
void reset() { resetStorage(); resetMemory(); resetStack(); } |
|||
|
|||
/// Manually increments the storage and memory sequence number.
|
|||
void incrementSequenceNumber() { m_sequenceNumber += 2; } |
|||
|
|||
/// Replaces the state by the intersection with _other, i.e. only equal knowledge is retained.
|
|||
/// If the stack heighht is different, the smaller one is used and the stack is compared
|
|||
/// relatively.
|
|||
void reduceToCommonKnowledge(KnownState const& _other); |
|||
|
|||
/// @returns a shared pointer to a copy of this state.
|
|||
std::shared_ptr<KnownState> copy() const { return std::make_shared<KnownState>(*this); } |
|||
|
|||
/// @returns true if the knowledge about the state of both objects is (known to be) equal.
|
|||
bool operator==(KnownState const& _other) const; |
|||
|
|||
///@todo the sequence numbers in two copies of this class should never be the same.
|
|||
/// might be doable using two-dimensional sequence numbers, where the first value is incremented
|
|||
/// for each copy
|
|||
|
|||
/// Retrieves the current equivalence class fo the given stack element (or generates a new
|
|||
/// one if it does not exist yet).
|
|||
Id stackElement(int _stackHeight, SourceLocation const& _location); |
|||
/// @returns the equivalence class id of the special initial stack element at the given height.
|
|||
Id initialStackElement(int _stackHeight, SourceLocation const& _location); |
|||
|
|||
int stackHeight() const { return m_stackHeight; } |
|||
std::map<int, Id> const& stackElements() const { return m_stackElements; } |
|||
ExpressionClasses& expressionClasses() const { return *m_expressionClasses; } |
|||
|
|||
private: |
|||
/// Assigns a new equivalence class to the next sequence number of the given stack element.
|
|||
void setStackElement(int _stackHeight, Id _class); |
|||
/// Swaps the given stack elements in their next sequence number.
|
|||
void swapStackElements(int _stackHeightA, int _stackHeightB, SourceLocation const& _location); |
|||
|
|||
/// Increments the sequence number, deletes all storage information that might be overwritten
|
|||
/// and stores the new value at the given slot.
|
|||
/// @returns the store operation, which might be invalid if storage was not modified
|
|||
StoreOperation storeInStorage(Id _slot, Id _value, SourceLocation const& _location); |
|||
/// Retrieves the current value at the given slot in storage or creates a new special sload class.
|
|||
Id loadFromStorage(Id _slot, SourceLocation const& _location); |
|||
/// Increments the sequence number, deletes all memory information that might be overwritten
|
|||
/// and stores the new value at the given slot.
|
|||
/// @returns the store operation, which might be invalid if memory was not modified
|
|||
StoreOperation storeInMemory(Id _slot, Id _value, SourceLocation const& _location); |
|||
/// Retrieves the current value at the given slot in memory or creates a new special mload class.
|
|||
Id loadFromMemory(Id _slot, SourceLocation const& _location); |
|||
/// Finds or creates a new expression that applies the sha3 hash function to the contents in memory.
|
|||
Id applySha3(Id _start, Id _length, SourceLocation const& _location); |
|||
|
|||
/// Current stack height, can be negative.
|
|||
int m_stackHeight = 0; |
|||
/// Current stack layout, mapping stack height -> equivalence class
|
|||
std::map<int, Id> m_stackElements; |
|||
/// Current sequence number, this is incremented with each modification to storage or memory.
|
|||
unsigned m_sequenceNumber = 1; |
|||
/// Knowledge about storage content.
|
|||
std::map<Id, Id> m_storageContent; |
|||
/// Knowledge about memory content. Keys are memory addresses, note that the values overlap
|
|||
/// and are not contained here if they are not completely known.
|
|||
std::map<Id, Id> m_memoryContent; |
|||
/// Keeps record of all sha3 hashes that are computed.
|
|||
std::map<std::vector<Id>, Id> m_knownSha3Hashes; |
|||
/// Structure containing the classes of equivalent expressions.
|
|||
std::shared_ptr<ExpressionClasses> m_expressionClasses; |
|||
}; |
|||
|
|||
} |
|||
} |
Loading…
Reference in new issue