You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
435 lines
16 KiB
435 lines
16 KiB
/*
|
|
This file is part of cpp-ethereum.
|
|
|
|
cpp-ethereum is free software: you can redistribute it and/or modify
|
|
it under the terms of the GNU General Public License as published by
|
|
the Free Software Foundation, either version 3 of the License, or
|
|
(at your option) any later version.
|
|
|
|
cpp-ethereum is distributed in the hope that it will be useful,
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
GNU General Public License for more details.
|
|
|
|
You should have received a copy of the GNU General Public License
|
|
along with cpp-ethereum. If not, see <http://www.gnu.org/licenses/>.
|
|
*/
|
|
/** @file RLP.h
|
|
* @author Gav Wood <i@gavwood.com>
|
|
* @date 2014
|
|
*
|
|
* RLP (de-)serialisation.
|
|
*/
|
|
|
|
#pragma once
|
|
|
|
#include <vector>
|
|
#include <array>
|
|
#include <exception>
|
|
#include <iostream>
|
|
#include <iomanip>
|
|
#include "vector_ref.h"
|
|
#include "Common.h"
|
|
#include "Exceptions.h"
|
|
#include "FixedHash.h"
|
|
|
|
namespace dev
|
|
{
|
|
|
|
class RLP;
|
|
using RLPs = std::vector<RLP>;
|
|
|
|
template <class _T> struct intTraits { static const unsigned maxSize = sizeof(_T); };
|
|
template <> struct intTraits<u160> { static const unsigned maxSize = 20; };
|
|
template <> struct intTraits<u256> { static const unsigned maxSize = 32; };
|
|
template <> struct intTraits<bigint> { static const unsigned maxSize = ~(unsigned)0; };
|
|
|
|
static const byte c_rlpMaxLengthBytes = 8;
|
|
static const byte c_rlpDataImmLenStart = 0x80;
|
|
static const byte c_rlpListStart = 0xc0;
|
|
|
|
static const byte c_rlpDataImmLenCount = c_rlpListStart - c_rlpDataImmLenStart - c_rlpMaxLengthBytes;
|
|
static const byte c_rlpDataIndLenZero = c_rlpDataImmLenStart + c_rlpDataImmLenCount - 1;
|
|
static const byte c_rlpListImmLenCount = 256 - c_rlpListStart - c_rlpMaxLengthBytes;
|
|
static const byte c_rlpListIndLenZero = c_rlpListStart + c_rlpListImmLenCount - 1;
|
|
|
|
/**
|
|
* @brief Class for interpreting Recursive Linear-Prefix Data.
|
|
* @by Gav Wood, 2013
|
|
*
|
|
* Class for reading byte arrays of data in RLP format.
|
|
*/
|
|
class RLP
|
|
{
|
|
public:
|
|
/// Conversion flags
|
|
enum
|
|
{
|
|
AllowNonCanon = 1,
|
|
ThrowOnFail = 4,
|
|
FailIfTooBig = 8,
|
|
FailIfTooSmall = 16,
|
|
Strict = ThrowOnFail | FailIfTooBig,
|
|
VeryStrict = ThrowOnFail | FailIfTooBig | FailIfTooSmall,
|
|
LaisezFaire = AllowNonCanon
|
|
};
|
|
|
|
using Strictness = int;
|
|
|
|
/// Construct a null node.
|
|
RLP() {}
|
|
|
|
/// Construct a node of value given in the bytes.
|
|
explicit RLP(bytesConstRef _d, Strictness _s = VeryStrict);
|
|
|
|
/// Construct a node of value given in the bytes.
|
|
explicit RLP(bytes const& _d, Strictness _s = VeryStrict): RLP(&_d, _s) {}
|
|
|
|
/// Construct a node to read RLP data in the bytes given.
|
|
RLP(byte const* _b, unsigned _s, Strictness _st = VeryStrict): RLP(bytesConstRef(_b, _s), _st) {}
|
|
|
|
/// Construct a node to read RLP data in the string.
|
|
explicit RLP(std::string const& _s, Strictness _st = VeryStrict): RLP(bytesConstRef((byte const*)_s.data(), _s.size()), _st) {}
|
|
|
|
/// The bare data of the RLP.
|
|
bytesConstRef data() const { return m_data; }
|
|
|
|
/// @returns true if the RLP is non-null.
|
|
explicit operator bool() const { return !isNull(); }
|
|
|
|
/// No value.
|
|
bool isNull() const { return m_data.size() == 0; }
|
|
|
|
/// Contains a zero-length string or zero-length list.
|
|
bool isEmpty() const { return !isNull() && (m_data[0] == c_rlpDataImmLenStart || m_data[0] == c_rlpListStart); }
|
|
|
|
/// String value.
|
|
bool isData() const { return !isNull() && m_data[0] < c_rlpListStart; }
|
|
|
|
/// List value.
|
|
bool isList() const { return !isNull() && m_data[0] >= c_rlpListStart; }
|
|
|
|
/// Integer value. Must not have a leading zero.
|
|
bool isInt() const;
|
|
|
|
/// @returns the number of items in the list, or zero if it isn't a list.
|
|
unsigned itemCount() const { return isList() ? items() : 0; }
|
|
unsigned itemCountStrict() const { if (!isList()) BOOST_THROW_EXCEPTION(BadCast()); return items(); }
|
|
|
|
/// @returns the number of bytes in the data, or zero if it isn't data.
|
|
unsigned size() const { return isData() ? length() : 0; }
|
|
unsigned sizeStrict() const { if (!isData()) BOOST_THROW_EXCEPTION(BadCast()); return length(); }
|
|
|
|
/// Equality operators; does best-effort conversion and checks for equality.
|
|
bool operator==(char const* _s) const { return isData() && toString() == _s; }
|
|
bool operator!=(char const* _s) const { return isData() && toString() != _s; }
|
|
bool operator==(std::string const& _s) const { return isData() && toString() == _s; }
|
|
bool operator!=(std::string const& _s) const { return isData() && toString() != _s; }
|
|
template <unsigned _N> bool operator==(FixedHash<_N> const& _h) const { return isData() && toHash<_N>() == _h; }
|
|
template <unsigned _N> bool operator!=(FixedHash<_N> const& _s) const { return isData() && toHash<_N>() != _s; }
|
|
bool operator==(unsigned const& _i) const { return isInt() && toInt<unsigned>() == _i; }
|
|
bool operator!=(unsigned const& _i) const { return isInt() && toInt<unsigned>() != _i; }
|
|
bool operator==(u256 const& _i) const { return isInt() && toInt<u256>() == _i; }
|
|
bool operator!=(u256 const& _i) const { return isInt() && toInt<u256>() != _i; }
|
|
bool operator==(bigint const& _i) const { return isInt() && toInt<bigint>() == _i; }
|
|
bool operator!=(bigint const& _i) const { return isInt() && toInt<bigint>() != _i; }
|
|
|
|
/// Subscript operator.
|
|
/// @returns the list item @a _i if isList() and @a _i < listItems(), or RLP() otherwise.
|
|
/// @note if used to access items in ascending order, this is efficient.
|
|
RLP operator[](unsigned _i) const;
|
|
|
|
using element_type = RLP;
|
|
|
|
/// @brief Iterator class for iterating through items of RLP list.
|
|
class iterator
|
|
{
|
|
friend class RLP;
|
|
|
|
public:
|
|
using value_type = RLP;
|
|
using element_type = RLP;
|
|
|
|
iterator& operator++();
|
|
iterator operator++(int) { auto ret = *this; operator++(); return ret; }
|
|
RLP operator*() const { return RLP(m_lastItem); }
|
|
bool operator==(iterator const& _cmp) const { return m_lastItem == _cmp.m_lastItem; }
|
|
bool operator!=(iterator const& _cmp) const { return !operator==(_cmp); }
|
|
|
|
private:
|
|
iterator() {}
|
|
iterator(RLP const& _parent, bool _begin);
|
|
|
|
unsigned m_remaining = 0;
|
|
bytesConstRef m_lastItem;
|
|
};
|
|
|
|
/// @brief Iterator into beginning of sub-item list (valid only if we are a list).
|
|
iterator begin() const { return iterator(*this, true); }
|
|
|
|
/// @brief Iterator into end of sub-item list (valid only if we are a list).
|
|
iterator end() const { return iterator(*this, false); }
|
|
|
|
/// Best-effort conversion operators.
|
|
explicit operator std::string() const { return toString(); }
|
|
explicit operator bytes() const { return toBytes(); }
|
|
explicit operator RLPs() const { return toList(); }
|
|
explicit operator uint8_t() const { return toInt<uint8_t>(); }
|
|
explicit operator uint16_t() const { return toInt<uint16_t>(); }
|
|
explicit operator uint32_t() const { return toInt<uint32_t>(); }
|
|
explicit operator uint64_t() const { return toInt<uint64_t>(); }
|
|
explicit operator u160() const { return toInt<u160>(); }
|
|
explicit operator u256() const { return toInt<u256>(); }
|
|
explicit operator bigint() const { return toInt<bigint>(); }
|
|
template <unsigned _N> explicit operator FixedHash<_N>() const { return toHash<FixedHash<_N>>(); }
|
|
template <class T, class U> explicit operator std::pair<T, U>() const { return toPair<T, U>(); }
|
|
template <class T> explicit operator std::vector<T>() const { return toVector<T>(); }
|
|
template <class T> explicit operator std::set<T>() const { return toSet<T>(); }
|
|
template <class T, size_t N> explicit operator std::array<T, N>() const { return toArray<T, N>(); }
|
|
|
|
/// Converts to bytearray. @returns the empty byte array if not a string.
|
|
bytes toBytes() const { if (!isData()) return bytes(); return bytes(payload().data(), payload().data() + length()); }
|
|
/// Converts to bytearray. @returns the empty byte array if not a string.
|
|
bytesConstRef toBytesConstRef() const { if (!isData()) return bytesConstRef(); return payload().cropped(0, length()); }
|
|
/// Converts to string. @returns the empty string if not a string.
|
|
std::string toString() const { if (!isData()) return std::string(); return payload().cropped(0, length()).toString(); }
|
|
/// Converts to string. @throws BadCast if not a string.
|
|
std::string toStringStrict() const { if (!isData()) BOOST_THROW_EXCEPTION(BadCast()); return payload().cropped(0, length()).toString(); }
|
|
|
|
template <class T>
|
|
std::vector<T> toVector() const
|
|
{
|
|
std::vector<T> ret;
|
|
if (isList())
|
|
{
|
|
ret.reserve(itemCount());
|
|
for (auto const& i: *this)
|
|
{
|
|
ret.push_back((T)i);
|
|
}
|
|
}
|
|
return ret;
|
|
}
|
|
|
|
template <class T>
|
|
std::set<T> toSet() const
|
|
{
|
|
std::set<T> ret;
|
|
if (isList())
|
|
{
|
|
for (auto const& i: *this)
|
|
{
|
|
ret.insert((T)i);
|
|
}
|
|
}
|
|
return ret;
|
|
}
|
|
|
|
template <class T, class U>
|
|
std::pair<T, U> toPair() const
|
|
{
|
|
std::pair<T, U> ret;
|
|
if (isList())
|
|
{
|
|
ret.first = (T)(*this)[0];
|
|
ret.second = (U)(*this)[1];
|
|
}
|
|
return ret;
|
|
}
|
|
|
|
template <class T, size_t N>
|
|
std::array<T, N> toArray() const
|
|
{
|
|
if (itemCount() != N || !isList())
|
|
BOOST_THROW_EXCEPTION(BadCast());
|
|
std::array<T, N> ret;
|
|
for (unsigned i = 0; i < N; ++i)
|
|
{
|
|
ret[i] = (T)operator[](i);
|
|
}
|
|
return ret;
|
|
}
|
|
|
|
/// Converts to int of type given; if isString(), decodes as big-endian bytestream. @returns 0 if not an int or string.
|
|
template <class _T = unsigned> _T toInt(int _flags = Strict) const
|
|
{
|
|
requireGood();
|
|
if ((!isInt() && !(_flags & AllowNonCanon)) || isList() || isNull())
|
|
if (_flags & ThrowOnFail)
|
|
BOOST_THROW_EXCEPTION(BadCast());
|
|
else
|
|
return 0;
|
|
else {}
|
|
|
|
auto p = payload();
|
|
if (p.size() > intTraits<_T>::maxSize && (_flags & FailIfTooBig))
|
|
if (_flags & ThrowOnFail)
|
|
BOOST_THROW_EXCEPTION(BadCast());
|
|
else
|
|
return 0;
|
|
else {}
|
|
|
|
return fromBigEndian<_T>(p);
|
|
}
|
|
|
|
template <class _N> _N toHash(int _flags = Strict) const
|
|
{
|
|
requireGood();
|
|
if (!isData() || (length() > _N::size && (_flags & FailIfTooBig)) || (length() < _N::size && (_flags & FailIfTooSmall)))
|
|
if (_flags & ThrowOnFail)
|
|
BOOST_THROW_EXCEPTION(BadCast());
|
|
else
|
|
return _N();
|
|
else{}
|
|
|
|
_N ret;
|
|
size_t s = std::min((size_t)_N::size, (size_t)length());
|
|
memcpy(ret.data() + _N::size - s, payload().data(), s);
|
|
return ret;
|
|
}
|
|
|
|
/// Converts to RLPs collection object. Useful if you need random access to sub items or will iterate over multiple times.
|
|
RLPs toList() const;
|
|
|
|
/// @returns the data payload. Valid for all types.
|
|
bytesConstRef payload() const { auto l = length(); if (l > m_data.size()) throw BadRLP(); return m_data.cropped(payloadOffset(), l); }
|
|
|
|
/// @returns the theoretical size of this item.
|
|
/// @note Under normal circumstances, is equivalent to m_data.size() - use that unless you know it won't work.
|
|
unsigned actualSize() const;
|
|
|
|
private:
|
|
/// Disable construction from rvalue
|
|
explicit RLP(bytes const&&) {}
|
|
|
|
/// Throws if is non-canonical data (i.e. single byte done in two bytes that could be done in one).
|
|
void requireGood() const;
|
|
|
|
/// Single-byte data payload.
|
|
bool isSingleByte() const { return !isNull() && m_data[0] < c_rlpDataImmLenStart; }
|
|
|
|
/// @returns the bytes used to encode the length of the data. Valid for all types.
|
|
unsigned lengthSize() const { if (isData() && m_data[0] > c_rlpDataIndLenZero) return m_data[0] - c_rlpDataIndLenZero; if (isList() && m_data[0] > c_rlpListIndLenZero) return m_data[0] - c_rlpListIndLenZero; return 0; }
|
|
|
|
/// @returns the size in bytes of the payload, as given by the RLP as opposed to as inferred from m_data.
|
|
unsigned length() const;
|
|
|
|
/// @returns the number of bytes into the data that the payload starts.
|
|
unsigned payloadOffset() const { return isSingleByte() ? 0 : (1 + lengthSize()); }
|
|
|
|
/// @returns the number of data items.
|
|
unsigned items() const;
|
|
|
|
/// Our byte data.
|
|
bytesConstRef m_data;
|
|
|
|
/// The list-indexing cache.
|
|
mutable unsigned m_lastIndex = (unsigned)-1;
|
|
mutable unsigned m_lastEnd = 0;
|
|
mutable bytesConstRef m_lastItem;
|
|
};
|
|
|
|
/**
|
|
* @brief Class for writing to an RLP bytestream.
|
|
*/
|
|
class RLPStream
|
|
{
|
|
public:
|
|
/// Initializes empty RLPStream.
|
|
RLPStream() {}
|
|
|
|
/// Initializes the RLPStream as a list of @a _listItems items.
|
|
explicit RLPStream(unsigned _listItems) { appendList(_listItems); }
|
|
|
|
~RLPStream() {}
|
|
|
|
/// Append given datum to the byte stream.
|
|
RLPStream& append(unsigned _s) { return append(bigint(_s)); }
|
|
RLPStream& append(u160 _s) { return append(bigint(_s)); }
|
|
RLPStream& append(u256 _s) { return append(bigint(_s)); }
|
|
RLPStream& append(bigint _s);
|
|
RLPStream& append(bytesConstRef _s, bool _compact = false);
|
|
RLPStream& append(bytes const& _s) { return append(bytesConstRef(&_s)); }
|
|
RLPStream& append(std::string const& _s) { return append(bytesConstRef(_s)); }
|
|
RLPStream& append(char const* _s) { return append(std::string(_s)); }
|
|
template <unsigned N> RLPStream& append(FixedHash<N> _s, bool _compact = false, bool _allOrNothing = false) { return _allOrNothing && !_s ? append(bytesConstRef()) : append(_s.ref(), _compact); }
|
|
|
|
/// Appends an arbitrary RLP fragment - this *must* be a single item unless @a _itemCount is given.
|
|
RLPStream& append(RLP const& _rlp, unsigned _itemCount = 1) { return appendRaw(_rlp.data(), _itemCount); }
|
|
|
|
/// Appends a sequence of data to the stream as a list.
|
|
template <class _T> RLPStream& append(std::vector<_T> const& _s) { return appendVector(_s); }
|
|
template <class _T> RLPStream& appendVector(std::vector<_T> const& _s) { appendList(_s.size()); for (auto const& i: _s) append(i); return *this; }
|
|
template <class _T, size_t S> RLPStream& append(std::array<_T, S> const& _s) { appendList(_s.size()); for (auto const& i: _s) append(i); return *this; }
|
|
template <class _T> RLPStream& append(std::set<_T> const& _s) { appendList(_s.size()); for (auto const& i: _s) append(i); return *this; }
|
|
template <class T, class U> RLPStream& append(std::pair<T, U> const& _s) { appendList(2); append(_s.first); append(_s.second); return *this; }
|
|
|
|
/// Appends a list.
|
|
RLPStream& appendList(unsigned _items);
|
|
RLPStream& appendList(bytesConstRef _rlp);
|
|
RLPStream& appendList(bytes const& _rlp) { return appendList(&_rlp); }
|
|
RLPStream& appendList(RLPStream const& _s) { return appendList(&_s.out()); }
|
|
|
|
/// Appends raw (pre-serialised) RLP data. Use with caution.
|
|
RLPStream& appendRaw(bytesConstRef _rlp, unsigned _itemCount = 1);
|
|
RLPStream& appendRaw(bytes const& _rlp, unsigned _itemCount = 1) { return appendRaw(&_rlp, _itemCount); }
|
|
|
|
/// Shift operators for appending data items.
|
|
template <class T> RLPStream& operator<<(T _data) { return append(_data); }
|
|
|
|
/// Clear the output stream so far.
|
|
void clear() { m_out.clear(); m_listStack.clear(); }
|
|
|
|
/// Read the byte stream.
|
|
bytes const& out() const { if(!m_listStack.empty()) BOOST_THROW_EXCEPTION(RLPException() << errinfo_comment("listStack is not empty")); return m_out; }
|
|
|
|
/// Swap the contents of the output stream out for some other byte array.
|
|
void swapOut(bytes& _dest) { if(!m_listStack.empty()) BOOST_THROW_EXCEPTION(RLPException() << errinfo_comment("listStack is not empty")); swap(m_out, _dest); }
|
|
|
|
private:
|
|
void noteAppended(unsigned _itemCount = 1);
|
|
|
|
/// Push the node-type byte (using @a _base) along with the item count @a _count.
|
|
/// @arg _count is number of characters for strings, data-bytes for ints, or items for lists.
|
|
void pushCount(unsigned _count, byte _offset);
|
|
|
|
/// Push an integer as a raw big-endian byte-stream.
|
|
template <class _T> void pushInt(_T _i, unsigned _br)
|
|
{
|
|
m_out.resize(m_out.size() + _br);
|
|
byte* b = &m_out.back();
|
|
for (; _i; _i >>= 8)
|
|
*(b--) = (byte)_i;
|
|
}
|
|
|
|
/// Our output byte stream.
|
|
bytes m_out;
|
|
|
|
std::vector<std::pair<unsigned, unsigned>> m_listStack;
|
|
};
|
|
|
|
template <class _T> void rlpListAux(RLPStream& _out, _T _t) { _out << _t; }
|
|
template <class _T, class ... _Ts> void rlpListAux(RLPStream& _out, _T _t, _Ts ... _ts) { rlpListAux(_out << _t, _ts...); }
|
|
|
|
/// Export a single item in RLP format, returning a byte array.
|
|
template <class _T> bytes rlp(_T _t) { return (RLPStream() << _t).out(); }
|
|
|
|
/// Export a list of items in RLP format, returning a byte array.
|
|
inline bytes rlpList() { return RLPStream(0).out(); }
|
|
template <class ... _Ts> bytes rlpList(_Ts ... _ts)
|
|
{
|
|
RLPStream out(sizeof ...(_Ts));
|
|
rlpListAux(out, _ts...);
|
|
return out.out();
|
|
}
|
|
|
|
/// The empty string in RLP format.
|
|
extern bytes RLPNull;
|
|
|
|
/// The empty list in RLP format.
|
|
extern bytes RLPEmptyList;
|
|
|
|
/// Human readable version of RLP.
|
|
std::ostream& operator<<(std::ostream& _out, dev::RLP const& _d);
|
|
|
|
}
|
|
|