chriseth
10 years ago
6 changed files with 455 additions and 307 deletions
@ -0,0 +1,278 @@ |
|||||
|
/*
|
||||
|
This file is part of cpp-ethereum. |
||||
|
|
||||
|
cpp-ethereum is free software: you can redistribute it and/or modify |
||||
|
it under the terms of the GNU General Public License as published by |
||||
|
the Free Software Foundation, either version 3 of the License, or |
||||
|
(at your option) any later version. |
||||
|
|
||||
|
cpp-ethereum is distributed in the hope that it will be useful, |
||||
|
but WITHOUT ANY WARRANTY; without even the implied warranty of |
||||
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
||||
|
GNU General Public License for more details. |
||||
|
|
||||
|
You should have received a copy of the GNU General Public License |
||||
|
along with cpp-ethereum. If not, see <http://www.gnu.org/licenses/>.
|
||||
|
*/ |
||||
|
/**
|
||||
|
* @file KnownState.cpp |
||||
|
* @author Christian <c@ethdev.com> |
||||
|
* @date 2015 |
||||
|
* Contains knowledge about the state of the virtual machine at a specific instruction. |
||||
|
*/ |
||||
|
|
||||
|
#include "KnownState.h" |
||||
|
#include <functional> |
||||
|
#include <libdevcrypto/SHA3.h> |
||||
|
#include <libevmasm/AssemblyItem.h> |
||||
|
|
||||
|
using namespace std; |
||||
|
using namespace dev; |
||||
|
using namespace dev::eth; |
||||
|
|
||||
|
ostream& KnownState::stream( |
||||
|
ostream& _out, |
||||
|
map<int, Id> _initialStack, |
||||
|
map<int, Id> _targetStack |
||||
|
) const |
||||
|
{ |
||||
|
auto streamExpressionClass = [this](ostream& _out, Id _id) |
||||
|
{ |
||||
|
auto const& expr = m_expressionClasses->representative(_id); |
||||
|
_out << " " << dec << _id << ": " << *expr.item; |
||||
|
if (expr.sequenceNumber) |
||||
|
_out << "@" << dec << expr.sequenceNumber; |
||||
|
_out << "("; |
||||
|
for (Id arg: expr.arguments) |
||||
|
_out << dec << arg << ","; |
||||
|
_out << ")" << endl; |
||||
|
}; |
||||
|
|
||||
|
_out << "Optimizer analysis:" << endl; |
||||
|
_out << "Final stack height: " << dec << m_stackHeight << endl; |
||||
|
_out << "Equivalence classes: " << endl; |
||||
|
for (Id eqClass = 0; eqClass < m_expressionClasses->size(); ++eqClass) |
||||
|
streamExpressionClass(_out, eqClass); |
||||
|
|
||||
|
_out << "Initial stack: " << endl; |
||||
|
for (auto const& it: _initialStack) |
||||
|
{ |
||||
|
_out << " " << dec << it.first << ": "; |
||||
|
streamExpressionClass(_out, it.second); |
||||
|
} |
||||
|
_out << "Target stack: " << endl; |
||||
|
for (auto const& it: _targetStack) |
||||
|
{ |
||||
|
_out << " " << dec << it.first << ": "; |
||||
|
streamExpressionClass(_out, it.second); |
||||
|
} |
||||
|
|
||||
|
return _out; |
||||
|
} |
||||
|
|
||||
|
KnownState::StoreOperation KnownState::feedItem(AssemblyItem const& _item, bool _copyItem) |
||||
|
{ |
||||
|
StoreOperation op; |
||||
|
if (_item.type() != Operation) |
||||
|
{ |
||||
|
assertThrow(_item.deposit() == 1, InvalidDeposit, ""); |
||||
|
setStackElement(++m_stackHeight, m_expressionClasses->find(_item, {}, _copyItem)); |
||||
|
} |
||||
|
else |
||||
|
{ |
||||
|
Instruction instruction = _item.instruction(); |
||||
|
InstructionInfo info = instructionInfo(instruction); |
||||
|
if (SemanticInformation::isDupInstruction(_item)) |
||||
|
setStackElement( |
||||
|
m_stackHeight + 1, |
||||
|
stackElement( |
||||
|
m_stackHeight - int(instruction) + int(Instruction::DUP1), |
||||
|
_item.getLocation() |
||||
|
) |
||||
|
); |
||||
|
else if (SemanticInformation::isSwapInstruction(_item)) |
||||
|
swapStackElements( |
||||
|
m_stackHeight, |
||||
|
m_stackHeight - 1 - int(instruction) + int(Instruction::SWAP1), |
||||
|
_item.getLocation() |
||||
|
); |
||||
|
else if (instruction != Instruction::POP) |
||||
|
{ |
||||
|
vector<Id> arguments(info.args); |
||||
|
for (int i = 0; i < info.args; ++i) |
||||
|
arguments[i] = stackElement(m_stackHeight - i, _item.getLocation()); |
||||
|
if (_item.instruction() == Instruction::SSTORE) |
||||
|
op = storeInStorage(arguments[0], arguments[1], _item.getLocation()); |
||||
|
else if (_item.instruction() == Instruction::SLOAD) |
||||
|
setStackElement( |
||||
|
m_stackHeight + _item.deposit(), |
||||
|
loadFromStorage(arguments[0], _item.getLocation()) |
||||
|
); |
||||
|
else if (_item.instruction() == Instruction::MSTORE) |
||||
|
op = storeInMemory(arguments[0], arguments[1], _item.getLocation()); |
||||
|
else if (_item.instruction() == Instruction::MLOAD) |
||||
|
setStackElement( |
||||
|
m_stackHeight + _item.deposit(), |
||||
|
loadFromMemory(arguments[0], _item.getLocation()) |
||||
|
); |
||||
|
else if (_item.instruction() == Instruction::SHA3) |
||||
|
setStackElement( |
||||
|
m_stackHeight + _item.deposit(), |
||||
|
applySha3(arguments.at(0), arguments.at(1), _item.getLocation()) |
||||
|
); |
||||
|
else |
||||
|
setStackElement( |
||||
|
m_stackHeight + _item.deposit(), |
||||
|
m_expressionClasses->find(_item, arguments, _copyItem) |
||||
|
); |
||||
|
} |
||||
|
m_stackHeight += _item.deposit(); |
||||
|
} |
||||
|
return op; |
||||
|
} |
||||
|
|
||||
|
ExpressionClasses::Id KnownState::stackElement(int _stackHeight, SourceLocation const& _location) |
||||
|
{ |
||||
|
if (m_stackElements.count(_stackHeight)) |
||||
|
return m_stackElements.at(_stackHeight); |
||||
|
// Stack element not found (not assigned yet), create new equivalence class.
|
||||
|
return m_stackElements[_stackHeight] = initialStackElement(_stackHeight, _location); |
||||
|
} |
||||
|
|
||||
|
ExpressionClasses::Id KnownState::initialStackElement( |
||||
|
int _stackHeight, |
||||
|
SourceLocation const& _location |
||||
|
) |
||||
|
{ |
||||
|
assertThrow(_stackHeight <= 0, OptimizerException, "Initial stack element of positive height requested."); |
||||
|
assertThrow(_stackHeight > -16, StackTooDeepException, ""); |
||||
|
// This is a special assembly item that refers to elements pre-existing on the initial stack.
|
||||
|
return m_expressionClasses->find(AssemblyItem(dupInstruction(1 - _stackHeight), _location)); |
||||
|
} |
||||
|
|
||||
|
void KnownState::setStackElement(int _stackHeight, Id _class) |
||||
|
{ |
||||
|
m_stackElements[_stackHeight] = _class; |
||||
|
} |
||||
|
|
||||
|
void KnownState::swapStackElements( |
||||
|
int _stackHeightA, |
||||
|
int _stackHeightB, |
||||
|
SourceLocation const& _location |
||||
|
) |
||||
|
{ |
||||
|
assertThrow(_stackHeightA != _stackHeightB, OptimizerException, "Swap on same stack elements."); |
||||
|
// ensure they are created
|
||||
|
stackElement(_stackHeightA, _location); |
||||
|
stackElement(_stackHeightB, _location); |
||||
|
|
||||
|
swap(m_stackElements[_stackHeightA], m_stackElements[_stackHeightB]); |
||||
|
} |
||||
|
|
||||
|
KnownState::StoreOperation KnownState::storeInStorage( |
||||
|
Id _slot, |
||||
|
Id _value, |
||||
|
SourceLocation const& _location) |
||||
|
{ |
||||
|
if (m_storageContent.count(_slot) && m_storageContent[_slot] == _value) |
||||
|
// do not execute the storage if we know that the value is already there
|
||||
|
return StoreOperation(); |
||||
|
m_sequenceNumber++; |
||||
|
decltype(m_storageContent) storageContents; |
||||
|
// Copy over all values (i.e. retain knowledge about them) where we know that this store
|
||||
|
// operation will not destroy the knowledge. Specifically, we copy storage locations we know
|
||||
|
// are different from _slot or locations where we know that the stored value is equal to _value.
|
||||
|
for (auto const& storageItem: m_storageContent) |
||||
|
if (m_expressionClasses->knownToBeDifferent(storageItem.first, _slot) || storageItem.second == _value) |
||||
|
storageContents.insert(storageItem); |
||||
|
m_storageContent = move(storageContents); |
||||
|
|
||||
|
AssemblyItem item(Instruction::SSTORE, _location); |
||||
|
Id id = m_expressionClasses->find(item, {_slot, _value}, true, m_sequenceNumber); |
||||
|
StoreOperation operation(StoreOperation::Storage, _slot, m_sequenceNumber, id); |
||||
|
m_storageContent[_slot] = _value; |
||||
|
// increment a second time so that we get unique sequence numbers for writes
|
||||
|
m_sequenceNumber++; |
||||
|
|
||||
|
return operation; |
||||
|
} |
||||
|
|
||||
|
ExpressionClasses::Id KnownState::loadFromStorage(Id _slot, SourceLocation const& _location) |
||||
|
{ |
||||
|
if (m_storageContent.count(_slot)) |
||||
|
return m_storageContent.at(_slot); |
||||
|
|
||||
|
AssemblyItem item(Instruction::SLOAD, _location); |
||||
|
return m_storageContent[_slot] = m_expressionClasses->find(item, {_slot}, true, m_sequenceNumber); |
||||
|
} |
||||
|
|
||||
|
KnownState::StoreOperation KnownState::storeInMemory(Id _slot, Id _value, SourceLocation const& _location) |
||||
|
{ |
||||
|
if (m_memoryContent.count(_slot) && m_memoryContent[_slot] == _value) |
||||
|
// do not execute the store if we know that the value is already there
|
||||
|
return StoreOperation(); |
||||
|
m_sequenceNumber++; |
||||
|
decltype(m_memoryContent) memoryContents; |
||||
|
// copy over values at points where we know that they are different from _slot by at least 32
|
||||
|
for (auto const& memoryItem: m_memoryContent) |
||||
|
if (m_expressionClasses->knownToBeDifferentBy32(memoryItem.first, _slot)) |
||||
|
memoryContents.insert(memoryItem); |
||||
|
m_memoryContent = move(memoryContents); |
||||
|
|
||||
|
AssemblyItem item(Instruction::MSTORE, _location); |
||||
|
Id id = m_expressionClasses->find(item, {_slot, _value}, true, m_sequenceNumber); |
||||
|
StoreOperation operation(StoreOperation(StoreOperation::Memory, _slot, m_sequenceNumber, id)); |
||||
|
m_memoryContent[_slot] = _value; |
||||
|
// increment a second time so that we get unique sequence numbers for writes
|
||||
|
m_sequenceNumber++; |
||||
|
return operation; |
||||
|
} |
||||
|
|
||||
|
ExpressionClasses::Id KnownState::loadFromMemory(Id _slot, SourceLocation const& _location) |
||||
|
{ |
||||
|
if (m_memoryContent.count(_slot)) |
||||
|
return m_memoryContent.at(_slot); |
||||
|
|
||||
|
AssemblyItem item(Instruction::MLOAD, _location); |
||||
|
return m_memoryContent[_slot] = m_expressionClasses->find(item, {_slot}, true, m_sequenceNumber); |
||||
|
} |
||||
|
|
||||
|
KnownState::Id KnownState::applySha3( |
||||
|
Id _start, |
||||
|
Id _length, |
||||
|
SourceLocation const& _location |
||||
|
) |
||||
|
{ |
||||
|
AssemblyItem sha3Item(Instruction::SHA3, _location); |
||||
|
// Special logic if length is a short constant, otherwise we cannot tell.
|
||||
|
u256 const* l = m_expressionClasses->knownConstant(_length); |
||||
|
// unknown or too large length
|
||||
|
if (!l || *l > 128) |
||||
|
return m_expressionClasses->find(sha3Item, {_start, _length}, true, m_sequenceNumber); |
||||
|
|
||||
|
vector<Id> arguments; |
||||
|
for (u256 i = 0; i < *l; i += 32) |
||||
|
{ |
||||
|
Id slot = m_expressionClasses->find( |
||||
|
AssemblyItem(Instruction::ADD, _location), |
||||
|
{_start, m_expressionClasses->find(i)} |
||||
|
); |
||||
|
arguments.push_back(loadFromMemory(slot, _location)); |
||||
|
} |
||||
|
if (m_knownSha3Hashes.count(arguments)) |
||||
|
return m_knownSha3Hashes.at(arguments); |
||||
|
Id v; |
||||
|
// If all arguments are known constants, compute the sha3 here
|
||||
|
if (all_of(arguments.begin(), arguments.end(), [this](Id _a) { return !!m_expressionClasses->knownConstant(_a); })) |
||||
|
{ |
||||
|
bytes data; |
||||
|
for (Id a: arguments) |
||||
|
data += toBigEndian(*m_expressionClasses->knownConstant(a)); |
||||
|
data.resize(size_t(*l)); |
||||
|
v = m_expressionClasses->find(AssemblyItem(u256(sha3(data)), _location)); |
||||
|
} |
||||
|
else |
||||
|
v = m_expressionClasses->find(sha3Item, {_start, _length}, true, m_sequenceNumber); |
||||
|
return m_knownSha3Hashes[arguments] = v; |
||||
|
} |
||||
|
|
@ -0,0 +1,149 @@ |
|||||
|
/*
|
||||
|
This file is part of cpp-ethereum. |
||||
|
|
||||
|
cpp-ethereum is free software: you can redistribute it and/or modify |
||||
|
it under the terms of the GNU General Public License as published by |
||||
|
the Free Software Foundation, either version 3 of the License, or |
||||
|
(at your option) any later version. |
||||
|
|
||||
|
cpp-ethereum is distributed in the hope that it will be useful, |
||||
|
but WITHOUT ANY WARRANTY; without even the implied warranty of |
||||
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
||||
|
GNU General Public License for more details. |
||||
|
|
||||
|
You should have received a copy of the GNU General Public License |
||||
|
along with cpp-ethereum. If not, see <http://www.gnu.org/licenses/>.
|
||||
|
*/ |
||||
|
/**
|
||||
|
* @file KnownState.h |
||||
|
* @author Christian <c@ethdev.com> |
||||
|
* @date 2015 |
||||
|
* Contains knowledge about the state of the virtual machine at a specific instruction. |
||||
|
*/ |
||||
|
|
||||
|
#pragma once |
||||
|
|
||||
|
#include <vector> |
||||
|
#include <map> |
||||
|
#include <set> |
||||
|
#include <tuple> |
||||
|
#include <ostream> |
||||
|
#include <libdevcore/CommonIO.h> |
||||
|
#include <libdevcore/Exceptions.h> |
||||
|
#include <libevmasm/ExpressionClasses.h> |
||||
|
#include <libevmasm/SemanticInformation.h> |
||||
|
|
||||
|
namespace dev |
||||
|
{ |
||||
|
namespace eth |
||||
|
{ |
||||
|
|
||||
|
class AssemblyItem; |
||||
|
using AssemblyItems = std::vector<AssemblyItem>; |
||||
|
|
||||
|
/**
|
||||
|
* Class to infer and store knowledge about the state of the virtual machine at a specific |
||||
|
* instruction. |
||||
|
* |
||||
|
* The general workings are that for each assembly item that is fed, an equivalence class is |
||||
|
* derived from the operation and the equivalence class of its arguments. DUPi, SWAPi and some |
||||
|
* arithmetic instructions are used to infer equivalences while these classes are determined. |
||||
|
*/ |
||||
|
class KnownState |
||||
|
{ |
||||
|
public: |
||||
|
using Id = ExpressionClasses::Id; |
||||
|
struct StoreOperation |
||||
|
{ |
||||
|
enum Target { Invalid, Memory, Storage }; |
||||
|
StoreOperation(): target(Invalid), sequenceNumber(-1) {} |
||||
|
StoreOperation( |
||||
|
Target _target, |
||||
|
Id _slot, |
||||
|
unsigned _sequenceNumber, |
||||
|
Id _expression |
||||
|
): target(_target), slot(_slot), sequenceNumber(_sequenceNumber), expression(_expression) {} |
||||
|
bool isValid() const { return target != Invalid; } |
||||
|
Target target; |
||||
|
Id slot; |
||||
|
unsigned sequenceNumber; |
||||
|
Id expression; |
||||
|
}; |
||||
|
|
||||
|
KnownState(): m_expressionClasses(std::make_shared<ExpressionClasses>()) {} |
||||
|
|
||||
|
/// Streams debugging information to @a _out.
|
||||
|
std::ostream& stream( |
||||
|
std::ostream& _out, |
||||
|
std::map<int, Id> _initialStack = std::map<int, Id>(), |
||||
|
std::map<int, Id> _targetStack = std::map<int, Id>() |
||||
|
) const; |
||||
|
|
||||
|
/// Feeds the item into the system for analysis.
|
||||
|
/// @returns a possible store operation
|
||||
|
StoreOperation feedItem(AssemblyItem const& _item, bool _copyItem = false); |
||||
|
|
||||
|
/// Resets any knowledge about storage.
|
||||
|
void resetStorage() { m_storageContent.clear(); } |
||||
|
/// Resets any knowledge about storage.
|
||||
|
void resetMemory() { m_memoryContent.clear(); } |
||||
|
/// Resets any knowledge about the current stack.
|
||||
|
void resetStack() { m_stackElements.clear(); m_stackHeight = 0; } |
||||
|
/// Resets any knowledge.
|
||||
|
void reset() { resetStorage(); resetMemory(); resetStack(); } |
||||
|
|
||||
|
///@todo the sequence numbers in two copies of this class should never be the same.
|
||||
|
/// might be doable using two-dimensional sequence numbers, where the first value is incremented
|
||||
|
/// for each copy
|
||||
|
|
||||
|
/// Retrieves the current equivalence class fo the given stack element (or generates a new
|
||||
|
/// one if it does not exist yet).
|
||||
|
Id stackElement(int _stackHeight, SourceLocation const& _location); |
||||
|
/// @returns the equivalence class id of the special initial stack element at the given height
|
||||
|
/// (must not be positive).
|
||||
|
Id initialStackElement(int _stackHeight, SourceLocation const& _location); |
||||
|
|
||||
|
int stackHeight() const { return m_stackHeight; } |
||||
|
std::map<int, Id> const& stackElements() const { return m_stackElements; } |
||||
|
ExpressionClasses& expressionClasses() const { return *m_expressionClasses; } |
||||
|
|
||||
|
private: |
||||
|
/// Assigns a new equivalence class to the next sequence number of the given stack element.
|
||||
|
void setStackElement(int _stackHeight, Id _class); |
||||
|
/// Swaps the given stack elements in their next sequence number.
|
||||
|
void swapStackElements(int _stackHeightA, int _stackHeightB, SourceLocation const& _location); |
||||
|
|
||||
|
/// Increments the sequence number, deletes all storage information that might be overwritten
|
||||
|
/// and stores the new value at the given slot.
|
||||
|
/// @returns the store operation, which might be invalid if storage was not modified
|
||||
|
StoreOperation storeInStorage(Id _slot, Id _value, SourceLocation const& _location); |
||||
|
/// Retrieves the current value at the given slot in storage or creates a new special sload class.
|
||||
|
Id loadFromStorage(Id _slot, SourceLocation const& _location); |
||||
|
/// Increments the sequence number, deletes all memory information that might be overwritten
|
||||
|
/// and stores the new value at the given slot.
|
||||
|
/// @returns the store operation, which might be invalid if memory was not modified
|
||||
|
StoreOperation storeInMemory(Id _slot, Id _value, SourceLocation const& _location); |
||||
|
/// Retrieves the current value at the given slot in memory or creates a new special mload class.
|
||||
|
Id loadFromMemory(Id _slot, SourceLocation const& _location); |
||||
|
/// Finds or creates a new expression that applies the sha3 hash function to the contents in memory.
|
||||
|
Id applySha3(Id _start, Id _length, SourceLocation const& _location); |
||||
|
|
||||
|
/// Current stack height, can be negative.
|
||||
|
int m_stackHeight = 0; |
||||
|
/// Current stack layout, mapping stack height -> equivalence class
|
||||
|
std::map<int, Id> m_stackElements; |
||||
|
/// Current sequence number, this is incremented with each modification to storage or memory.
|
||||
|
unsigned m_sequenceNumber = 1; |
||||
|
/// Knowledge about storage content.
|
||||
|
std::map<Id, Id> m_storageContent; |
||||
|
/// Knowledge about memory content. Keys are memory addresses, note that the values overlap
|
||||
|
/// and are not contained here if they are not completely known.
|
||||
|
std::map<Id, Id> m_memoryContent; |
||||
|
/// Keeps record of all sha3 hashes that are computed.
|
||||
|
std::map<std::vector<Id>, Id> m_knownSha3Hashes; |
||||
|
/// Structure containing the classes of equivalent expressions.
|
||||
|
std::shared_ptr<ExpressionClasses> m_expressionClasses; |
||||
|
}; |
||||
|
|
||||
|
} |
||||
|
} |
Loading…
Reference in new issue