2010-08-29 16:58:15 +00:00
// Copyright (c) 2009-2010 Satoshi Nakamoto
2022-12-24 23:49:50 +00:00
// Copyright (c) 2009-2022 The Bitcoin Core developers
2014-10-31 11:34:30 +08:00
// Distributed under the MIT software license, see the accompanying
2012-05-18 22:02:28 +08:00
// file COPYING or http://www.opensource.org/licenses/mit-license.php.
2013-04-13 00:13:08 -05:00
2011-05-15 09:11:04 +02:00
# ifndef BITCOIN_SERIALIZE_H
# define BITCOIN_SERIALIZE_H
2010-08-29 16:58:15 +00:00
2020-07-11 05:12:43 +02:00
# include <attributes.h>
2017-11-10 13:57:53 +13:00
# include <compat/endian.h>
2015-03-27 13:19:49 +01:00
2013-04-13 00:13:08 -05:00
# include <algorithm>
2019-12-29 13:04:02 -08:00
# include <cstdint>
2020-02-17 20:53:50 +01:00
# include <cstring>
2013-04-13 00:13:08 -05:00
# include <ios>
2014-09-14 12:43:56 +02:00
# include <limits>
2010-08-29 16:58:15 +00:00
# include <map>
2016-11-10 10:54:14 -08:00
# include <memory>
2010-09-06 21:03:04 +00:00
# include <set>
2013-04-13 00:13:08 -05:00
# include <string>
# include <string.h>
# include <utility>
# include <vector>
2011-05-15 09:11:04 +02:00
2017-11-10 13:57:53 +13:00
# include <prevector.h>
2018-04-04 12:40:10 -07:00
# include <span.h>
2013-04-13 00:13:08 -05:00
2020-10-08 20:27:27 -07:00
/**
 * The maximum size of a serialized object in bytes or number of elements
 * (for eg vectors) when the size is encoded as CompactSize.
 *
 * 0x02000000 is 33,554,432. ReadCompactSize() throws when a decoded size
 * exceeds this value and range checking is enabled.
 */
static constexpr uint64_t MAX_SIZE = 0x02000000 ;
2010-08-29 16:58:15 +00:00
2017-09-06 11:25:03 -07:00
/**
 * Maximum amount of memory (in bytes) to allocate at once when deserializing vectors.
 * NOTE(review): the vector deserialization code that applies this limit is not in
 * this part of the file; confirm the exact batching behavior there.
 */
static const unsigned int MAX_VECTOR_ALLOCATE = 5000000 ;
2016-11-10 10:54:14 -08:00
/**
 * Dummy data type to identify deserializing constructors.
 *
 * By convention, a constructor of a type T with signature
 *
 *   template <typename Stream> T::T(deserialize_type, Stream& s)
 *
 * is a deserializing constructor, which builds the type by
 * deserializing it from s. If T contains const fields, this
 * is likely the only way to do so.
 *
 * `deserialize` is the ready-made tag value to pass as the first argument.
 */
struct deserialize_type { } ;
constexpr deserialize_type deserialize { } ;
2014-12-19 11:41:50 +01:00
/*
 * Lowest-level serialization and conversion.
 */
template < typename Stream > inline void ser_writedata8 ( Stream & s , uint8_t obj )
{
2022-01-02 11:31:25 +01:00
s . write ( AsBytes ( Span { & obj , 1 } ) ) ;
2014-12-19 11:41:50 +01:00
}
template < typename Stream > inline void ser_writedata16 ( Stream & s , uint16_t obj )
{
obj = htole16 ( obj ) ;
2022-01-02 11:31:25 +01:00
s . write ( AsBytes ( Span { & obj , 1 } ) ) ;
2014-12-19 11:41:50 +01:00
}
2018-04-08 09:39:05 -07:00
template < typename Stream > inline void ser_writedata16be ( Stream & s , uint16_t obj )
{
obj = htobe16 ( obj ) ;
2022-01-02 11:31:25 +01:00
s . write ( AsBytes ( Span { & obj , 1 } ) ) ;
2018-04-08 09:39:05 -07:00
}
2014-12-19 11:41:50 +01:00
template < typename Stream > inline void ser_writedata32 ( Stream & s , uint32_t obj )
{
obj = htole32 ( obj ) ;
2022-01-02 11:31:25 +01:00
s . write ( AsBytes ( Span { & obj , 1 } ) ) ;
2014-12-19 11:41:50 +01:00
}
2019-03-12 00:20:40 -07:00
template < typename Stream > inline void ser_writedata32be ( Stream & s , uint32_t obj )
{
obj = htobe32 ( obj ) ;
2022-01-02 11:31:25 +01:00
s . write ( AsBytes ( Span { & obj , 1 } ) ) ;
2019-03-12 00:20:40 -07:00
}
2014-12-19 11:41:50 +01:00
template < typename Stream > inline void ser_writedata64 ( Stream & s , uint64_t obj )
{
obj = htole64 ( obj ) ;
2022-01-02 11:31:25 +01:00
s . write ( AsBytes ( Span { & obj , 1 } ) ) ;
2014-12-19 11:41:50 +01:00
}
template < typename Stream > inline uint8_t ser_readdata8 ( Stream & s )
{
uint8_t obj ;
2022-01-02 11:31:25 +01:00
s . read ( AsWritableBytes ( Span { & obj , 1 } ) ) ;
2014-12-19 11:41:50 +01:00
return obj ;
}
template < typename Stream > inline uint16_t ser_readdata16 ( Stream & s )
{
uint16_t obj ;
2022-01-02 11:31:25 +01:00
s . read ( AsWritableBytes ( Span { & obj , 1 } ) ) ;
2014-12-19 11:41:50 +01:00
return le16toh ( obj ) ;
}
2018-04-08 09:39:05 -07:00
template < typename Stream > inline uint16_t ser_readdata16be ( Stream & s )
{
uint16_t obj ;
2022-01-02 11:31:25 +01:00
s . read ( AsWritableBytes ( Span { & obj , 1 } ) ) ;
2018-04-08 09:39:05 -07:00
return be16toh ( obj ) ;
}
2014-12-19 11:41:50 +01:00
template < typename Stream > inline uint32_t ser_readdata32 ( Stream & s )
{
uint32_t obj ;
2022-01-02 11:31:25 +01:00
s . read ( AsWritableBytes ( Span { & obj , 1 } ) ) ;
2014-12-19 11:41:50 +01:00
return le32toh ( obj ) ;
}
2019-03-12 00:20:40 -07:00
template < typename Stream > inline uint32_t ser_readdata32be ( Stream & s )
{
uint32_t obj ;
2022-01-02 11:31:25 +01:00
s . read ( AsWritableBytes ( Span { & obj , 1 } ) ) ;
2019-03-12 00:20:40 -07:00
return be32toh ( obj ) ;
}
2014-12-19 11:41:50 +01:00
template < typename Stream > inline uint64_t ser_readdata64 ( Stream & s )
{
uint64_t obj ;
2022-01-02 11:31:25 +01:00
s . read ( AsWritableBytes ( Span { & obj , 1 } ) ) ;
2014-12-19 11:41:50 +01:00
return le64toh ( obj ) ;
}
2010-08-29 16:58:15 +00:00
/////////////////////////////////////////////////////////////////
//
// Templates for serializing to anything that looks like a stream,
// i.e. anything that supports .read(Span<std::byte>) and .write(Span<const std::byte>)
//
2016-10-28 17:50:04 -07:00
// Forward declaration only: needed by the WriteCompactSize/WriteVarInt overload
// declarations below that take a CSizeComputer&. The class body is not in this part of the file.
class CSizeComputer ;
2010-08-29 16:58:15 +00:00
/** Serialization type flags. Each enumerator occupies its own bit (1, 2, 4). */
enum
{
    // primary actions
    SER_NETWORK = (1 << 0),
    SER_DISK    = (1 << 1),
    SER_GETHASH = (1 << 2),
};
2020-07-11 09:55:38 +02:00
/**
 * Convert any argument to a reference to X, maintaining constness.
 *
 * This can be used in serialization code to invoke a base class's
 * serialization routines.
 *
 * Example use:
 *   class Base { ... };
 *   class Child : public Base {
 *     int m_data;
 *   public:
 *     SERIALIZE_METHODS(Child, obj) {
 *       READWRITE(AsBase<Base>(obj), obj.m_data);
 *     }
 *   };
 *
 * static_cast cannot easily be used here, as the type of Obj will be const Child&
 * during serialization and Child& during deserialization. AsBase will convert to
 * const Base& and Base& appropriately.
 *
 * This overload handles the non-const case; compilation fails unless Out is a
 * base of (or the same class as) In.
 */
template <class Out, class In>
Out& AsBase(In& x)
{
    static_assert(std::is_base_of_v<Out, In>);
    return x;
}
/**
 * Const overload of AsBase: view a const In as a const reference to its base class Out.
 * Compilation fails unless Out is a base of (or the same class as) In.
 */
template <class Out, class In>
const Out& AsBase(const In& x)
{
    static_assert(std::is_base_of_v<Out, In>);
    return x;
}
2017-07-07 16:06:56 -07:00
2023-09-14 10:00:45 +10:00
// READWRITE(a, b, ...) forwards all of its arguments to ser_action.SerReadWriteMany(s, ...).
// The expansion names `s` and `ser_action`, so it is only usable where both are in scope,
// e.g. in the SerializationOps body opened by FORMATTER_METHODS.
# define READWRITE(...) (ser_action.SerReadWriteMany(s, __VA_ARGS__))
// SER_READ(obj, code) wraps `code` in a lambda taking (Stream& s, non-const Type& obj) and hands
// it to ser_action.SerRead(). Requires `Stream` and `Type` to be in scope as well.
// NOTE(review): presumably the lambda only runs when deserializing; the action types are
// not defined in this part of the file -- confirm there.
# define SER_READ(obj, code) ser_action.SerRead(s, obj, [&](Stream& s, typename std::remove_const<Type>::type& obj) { code; })
// SER_WRITE(obj, code) is the counterpart taking (Stream& s, const Type& obj), handed to
// ser_action.SerWrite(). NOTE(review): presumably only runs when serializing -- confirm.
# define SER_WRITE(obj, code) ser_action.SerWrite(s, obj, [&](Stream& s, const Type& obj) { code; })
2010-08-29 16:58:15 +00:00
2020-01-18 07:32:31 -08:00
/**
 * Implement the Ser and Unser methods needed for implementing a formatter (see Using below).
 *
 * Both Ser and Unser are delegated to a single static method SerializationOps, which is polymorphic
 * in the serialized/deserialized type (allowing it to be const when serializing, and non-const when
 * deserializing).
 *
 * Example use:
 *   struct FooFormatter {
 *     FORMATTER_METHODS(Class, obj) { READWRITE(obj.val1, VARINT(obj.val2)); }
 *   };
 * would define a class FooFormatter that defines a serialization of Class objects consisting
 * of serializing its val1 member using the default serialization, and its val2 member using
 * VARINT serialization. That FooFormatter can then be used in statements like
 * READWRITE(Using<FooFormatter>(obj.bla)).
 *
 * The macro ends with the SerializationOps signature, so the braces written after the
 * macro invocation become that function's body.
 */
#define FORMATTER_METHODS(cls, obj) \
    template <typename Stream> \
    static void Ser(Stream& s, const cls& obj) { SerializationOps(obj, s, ActionSerialize{}); } \
    template <typename Stream> \
    static void Unser(Stream& s, cls& obj) { SerializationOps(obj, s, ActionUnserialize{}); } \
    template <typename Stream, typename Type, typename Operation> \
    static void SerializationOps(Type& obj, Stream& s, Operation ser_action)
2020-01-18 07:32:31 -08:00
2020-07-11 05:12:43 +02:00
/**
 * Variant of FORMATTER_METHODS that supports a declared parameter type.
 *
 * If a formatter has a declared parameter type, it must be invoked directly or
 * indirectly with a parameter of that type. This permits making serialization
 * depend on run-time context in a type-safe way.
 *
 * Example use:
 *   struct BarParameter { bool fancy; ... };
 *   struct Bar { ... };
 *   struct FooFormatter {
 *     FORMATTER_METHODS_PARAMS(Bar, obj, BarParameter, param) {
 *       if (param.fancy) {
 *         READWRITE(VARINT(obj.value));
 *       } else {
 *         READWRITE(obj.value);
 *       }
 *     }
 *   };
 * which would then be invoked as
 *   READWRITE(WithParams(BarParameter{...}, Using<FooFormatter>(obj.foo)))
 *
 * WithParams(parameter, obj) can be invoked anywhere in the call stack; it is
 * passed down recursively into all serialization code, until another
 * WithParams overrides it.
 *
 * Parameters will be implicitly converted where appropriate. This means that
 * "parent" serialization code can use a parameter that derives from, or is
 * convertible to, a "child" formatter's parameter type.
 *
 * Compilation will fail in any context where serialization is invoked but
 * no parameter of a type convertible to BarParameter is provided.
 *
 * The generated Ser/Unser obtain the parameter by calling s.GetParams() on the
 * stream and pass it to SerializationOps as `const paramcls& paramobj`.
 */
# define FORMATTER_METHODS_PARAMS(cls, obj, paramcls, paramobj) \
template < typename Stream > \
static void Ser ( Stream & s , const cls & obj ) { SerializationOps ( obj , s , ActionSerialize { } , s . GetParams ( ) ) ; } \
template < typename Stream > \
static void Unser ( Stream & s , cls & obj ) { SerializationOps ( obj , s , ActionUnserialize { } , s . GetParams ( ) ) ; } \
template < typename Stream , typename Type , typename Operation > \
static void SerializationOps ( Type & obj , Stream & s , Operation ser_action , const paramcls & paramobj )
/**
 * Define the member functions Serialize(Stream&) const and Unserialize(Stream&) for
 * class cls by forwarding to the static Ser/Unser functions, which must be declared
 * in the same class (e.g. by FORMATTER_METHODS or FORMATTER_METHODS_PARAMS).
 *
 * The static_asserts compare decltype(*this) with cls, so using the macro with the
 * wrong class name is a compile error.
 */
#define BASE_SERIALIZE_METHODS(cls) \
    template <typename Stream> \
    void Serialize(Stream& s) const \
    { \
        static_assert(std::is_same<const cls&, decltype(*this)>::value, "Serialize type mismatch"); \
        Ser(s, *this); \
    } \
    template <typename Stream> \
    void Unserialize(Stream& s) \
    { \
        static_assert(std::is_same<cls&, decltype(*this)>::value, "Unserialize type mismatch"); \
        Unser(s, *this); \
    }
2017-07-07 15:48:13 -07:00
/**
 * Implement the Serialize and Unserialize methods by delegating to a single templated
 * static method that takes the to-be-(de)serialized object as a parameter. This approach
 * has the advantage that the constness of the object becomes a template parameter, and
 * thus allows a single implementation that sees the object as const for serializing
 * and non-const for deserializing, without casts.
 *
 * Expands to BASE_SERIALIZE_METHODS(cls) followed by FORMATTER_METHODS(cls, obj); the
 * braces written after the macro invocation become the SerializationOps body.
 */
#define SERIALIZE_METHODS(cls, obj) \
    BASE_SERIALIZE_METHODS(cls) \
    FORMATTER_METHODS(cls, obj)
2017-07-07 15:48:13 -07:00
2020-07-11 05:12:43 +02:00
/**
 * Variant of SERIALIZE_METHODS that supports a declared parameter type.
 *
 * See FORMATTER_METHODS_PARAMS for more information on parameters.
 *
 * Expands to BASE_SERIALIZE_METHODS(cls) followed by
 * FORMATTER_METHODS_PARAMS(cls, obj, paramcls, paramobj); the braces written after
 * the macro invocation become the SerializationOps body.
 */
# define SERIALIZE_METHODS_PARAMS(cls, obj, paramcls, paramobj) \
BASE_SERIALIZE_METHODS ( cls ) \
FORMATTER_METHODS_PARAMS ( cls , obj , paramcls , paramobj )
2023-06-21 10:13:08 +02:00
// clang-format off
2018-07-01 13:58:37 +00:00
# ifndef CHAR_EQUALS_INT8
2022-01-02 11:55:43 +01:00
template < typename Stream > void Serialize ( Stream & , char ) = delete ; // char serialization forbidden. Use uint8_t or int8_t
2018-07-01 13:58:37 +00:00
# endif
2023-06-30 12:00:20 +02:00
template < typename Stream > void Serialize ( Stream & s , std : : byte a ) { ser_writedata8 ( s , uint8_t ( a ) ) ; }
2016-10-28 16:29:17 -07:00
template < typename Stream > inline void Serialize ( Stream & s , int8_t a ) { ser_writedata8 ( s , a ) ; }
template < typename Stream > inline void Serialize ( Stream & s , uint8_t a ) { ser_writedata8 ( s , a ) ; }
template < typename Stream > inline void Serialize ( Stream & s , int16_t a ) { ser_writedata16 ( s , a ) ; }
template < typename Stream > inline void Serialize ( Stream & s , uint16_t a ) { ser_writedata16 ( s , a ) ; }
template < typename Stream > inline void Serialize ( Stream & s , int32_t a ) { ser_writedata32 ( s , a ) ; }
template < typename Stream > inline void Serialize ( Stream & s , uint32_t a ) { ser_writedata32 ( s , a ) ; }
template < typename Stream > inline void Serialize ( Stream & s , int64_t a ) { ser_writedata64 ( s , a ) ; }
template < typename Stream > inline void Serialize ( Stream & s , uint64_t a ) { ser_writedata64 ( s , a ) ; }
2022-01-02 11:31:25 +01:00
template < typename Stream , int N > inline void Serialize ( Stream & s , const char ( & a ) [ N ] ) { s . write ( MakeByteSpan ( a ) ) ; }
template < typename Stream , int N > inline void Serialize ( Stream & s , const unsigned char ( & a ) [ N ] ) { s . write ( MakeByteSpan ( a ) ) ; }
2023-06-21 10:13:08 +02:00
template < typename Stream , typename B > void Serialize ( Stream & s , Span < B > span ) { ( void ) /* force byte-type */ UCharCast ( span . data ( ) ) ; s . write ( AsBytes ( span ) ) ; }
2014-12-19 11:41:50 +01:00
2018-07-01 13:58:37 +00:00
# ifndef CHAR_EQUALS_INT8
2022-01-02 11:55:43 +01:00
template < typename Stream > void Unserialize ( Stream & , char ) = delete ; // char serialization forbidden. Use uint8_t or int8_t
2018-07-01 13:58:37 +00:00
# endif
2023-06-30 12:00:20 +02:00
template < typename Stream > void Unserialize ( Stream & s , std : : byte & a ) { a = std : : byte { ser_readdata8 ( s ) } ; }
2016-10-28 16:29:17 -07:00
template < typename Stream > inline void Unserialize ( Stream & s , int8_t & a ) { a = ser_readdata8 ( s ) ; }
template < typename Stream > inline void Unserialize ( Stream & s , uint8_t & a ) { a = ser_readdata8 ( s ) ; }
template < typename Stream > inline void Unserialize ( Stream & s , int16_t & a ) { a = ser_readdata16 ( s ) ; }
template < typename Stream > inline void Unserialize ( Stream & s , uint16_t & a ) { a = ser_readdata16 ( s ) ; }
template < typename Stream > inline void Unserialize ( Stream & s , int32_t & a ) { a = ser_readdata32 ( s ) ; }
template < typename Stream > inline void Unserialize ( Stream & s , uint32_t & a ) { a = ser_readdata32 ( s ) ; }
template < typename Stream > inline void Unserialize ( Stream & s , int64_t & a ) { a = ser_readdata64 ( s ) ; }
template < typename Stream > inline void Unserialize ( Stream & s , uint64_t & a ) { a = ser_readdata64 ( s ) ; }
2022-01-02 11:31:25 +01:00
template < typename Stream , int N > inline void Unserialize ( Stream & s , char ( & a ) [ N ] ) { s . read ( MakeWritableByteSpan ( a ) ) ; }
template < typename Stream , int N > inline void Unserialize ( Stream & s , unsigned char ( & a ) [ N ] ) { s . read ( MakeWritableByteSpan ( a ) ) ; }
2023-06-21 10:13:08 +02:00
template < typename Stream , typename B > void Unserialize ( Stream & s , Span < B > span ) { ( void ) /* force byte-type */ UCharCast ( span . data ( ) ) ; s . read ( AsWritableBytes ( span ) ) ; }
2010-08-29 16:58:15 +00:00
2021-05-31 14:57:32 +02:00
// bool is stored as one byte: written as 0 or 1, and any non-zero byte reads back as true.
template <typename Stream> inline void Serialize(Stream& s, bool a) { ser_writedata8(s, static_cast<uint8_t>(a)); }
template <typename Stream> inline void Unserialize(Stream& s, bool& a) { const uint8_t stored = ser_readdata8(s); a = (stored != 0); }
2023-06-21 10:13:08 +02:00
// clang-format on
2010-08-29 16:58:15 +00:00
2014-10-31 11:34:30 +08:00
/**
 * Compact Size
 * size <  253        -- 1 byte
 * size <= 0xFFFF     -- 3 bytes  (253 + 2 bytes)
 * size <= 0xFFFFFFFF -- 5 bytes  (254 + 4 bytes)
 * size >  0xFFFFFFFF -- 9 bytes  (255 + 8 bytes)
 *
 * @param nSize  the value to be encoded
 * @return the number of bytes WriteCompactSize() emits for nSize
 *
 * The thresholds use the fixed-width types that are actually written to the
 * stream (uint16_t / uint32_t) rather than `unsigned int`, whose width is not
 * guaranteed. Usable in constant expressions.
 */
constexpr inline unsigned int GetSizeOfCompactSize(uint64_t nSize)
{
    if (nSize < 253) return sizeof(unsigned char);
    else if (nSize <= std::numeric_limits<uint16_t>::max()) return sizeof(unsigned char) + sizeof(uint16_t);
    else if (nSize <= std::numeric_limits<uint32_t>::max()) return sizeof(unsigned char) + sizeof(uint32_t);
    else return sizeof(unsigned char) + sizeof(uint64_t);
}
2016-10-28 17:50:04 -07:00
// Declaration of the non-template overload for CSizeComputer; its definition is not in
// this part of the file. Declared ahead of the generic Stream template that follows.
inline void WriteCompactSize ( CSizeComputer & os , uint64_t nSize ) ;
2010-08-29 16:58:15 +00:00
/**
 * Encode nSize in CompactSize format and write it to os.
 *
 * Values below 253 are written as a single byte. Larger values are written as a
 * marker byte (253, 254 or 255) followed by the value as a little-endian
 * 16-, 32- or 64-bit integer respectively; the smallest width that fits is used.
 *
 * The 32-bit threshold is expressed with uint32_t so that it always matches the
 * 4 bytes written by ser_writedata32, independent of the width of `unsigned int`.
 */
template <typename Stream>
void WriteCompactSize(Stream& os, uint64_t nSize)
{
    if (nSize < 253)
    {
        ser_writedata8(os, static_cast<uint8_t>(nSize));
    }
    else if (nSize <= std::numeric_limits<uint16_t>::max())
    {
        ser_writedata8(os, 253);
        ser_writedata16(os, static_cast<uint16_t>(nSize));
    }
    else if (nSize <= std::numeric_limits<uint32_t>::max())
    {
        ser_writedata8(os, 254);
        ser_writedata32(os, static_cast<uint32_t>(nSize));
    }
    else
    {
        ser_writedata8(os, 255);
        ser_writedata64(os, nSize);
    }
}
2020-10-08 20:27:27 -07:00
/**
* Decode a CompactSize - encoded variable - length integer .
*
* As these are primarily used to encode the size of vector - like serializations , by default a range
* check is performed . When used as a generic number encoding , range_check should be set to false .
*/
2010-08-29 16:58:15 +00:00
template < typename Stream >
2020-10-08 20:27:27 -07:00
uint64_t ReadCompactSize ( Stream & is , bool range_check = true )
2010-08-29 16:58:15 +00:00
{
2014-12-19 11:41:50 +01:00
uint8_t chSize = ser_readdata8 ( is ) ;
2013-04-13 00:13:08 -05:00
uint64_t nSizeRet = 0 ;
2010-09-30 16:23:07 +00:00
if ( chSize < 253 )
2010-08-29 16:58:15 +00:00
{
nSizeRet = chSize ;
}
2010-09-30 16:23:07 +00:00
else if ( chSize = = 253 )
2010-08-29 16:58:15 +00:00
{
2014-12-19 11:41:50 +01:00
nSizeRet = ser_readdata16 ( is ) ;
Reject non-canonically-encoded sizes
The length of vectors, maps, sets, etc are serialized using
Write/ReadCompactSize -- which, unfortunately, do not use a
unique encoding.
So deserializing and then re-serializing a transaction (for example)
can give you different bits than you started with. That doesn't
cause any problems that we are aware of, but it is exactly the type
of subtle mismatch that can lead to exploits.
With this pull, reading a non-canonical CompactSize throws an
exception, which means nodes will ignore 'tx' or 'block' or
other messages that are not properly encoded.
Please check my logic... but this change is safe with respect to
causing a network split. Old clients that receive
non-canonically-encoded transactions or blocks deserialize
them into CTransaction/CBlock structures in memory, and then
re-serialize them before relaying them to peers.
And please check my logic with respect to causing a blockchain
split: there are no CompactSize fields in the block header, so
the block hash is always canonical. The merkle root in the block
header is computed on a vector<CTransaction>, so
any non-canonical encoding of the transactions in 'tx' or 'block'
messages is erased as they are read into memory by old clients,
and does not affect the block hash. And, as noted above, old
clients re-serialize (with canonical encoding) 'tx' and 'block'
messages before relaying to peers.
2013-08-07 12:21:34 +10:00
if ( nSizeRet < 253 )
throw std : : ios_base : : failure ( " non-canonical ReadCompactSize() " ) ;
2010-08-29 16:58:15 +00:00
}
2010-09-30 16:23:07 +00:00
else if ( chSize = = 254 )
2010-08-29 16:58:15 +00:00
{
2014-12-19 11:41:50 +01:00
nSizeRet = ser_readdata32 ( is ) ;
Reject non-canonically-encoded sizes
The length of vectors, maps, sets, etc are serialized using
Write/ReadCompactSize -- which, unfortunately, do not use a
unique encoding.
So deserializing and then re-serializing a transaction (for example)
can give you different bits than you started with. That doesn't
cause any problems that we are aware of, but it is exactly the type
of subtle mismatch that can lead to exploits.
With this pull, reading a non-canonical CompactSize throws an
exception, which means nodes will ignore 'tx' or 'block' or
other messages that are not properly encoded.
Please check my logic... but this change is safe with respect to
causing a network split. Old clients that receive
non-canonically-encoded transactions or blocks deserialize
them into CTransaction/CBlock structures in memory, and then
re-serialize them before relaying them to peers.
And please check my logic with respect to causing a blockchain
split: there are no CompactSize fields in the block header, so
the block hash is always canonical. The merkle root in the block
header is computed on a vector<CTransaction>, so
any non-canonical encoding of the transactions in 'tx' or 'block'
messages is erased as they are read into memory by old clients,
and does not affect the block hash. And, as noted above, old
clients re-serialize (with canonical encoding) 'tx' and 'block'
messages before relaying to peers.
2013-08-07 12:21:34 +10:00
if ( nSizeRet < 0x10000u )
throw std : : ios_base : : failure ( " non-canonical ReadCompactSize() " ) ;
2010-08-29 16:58:15 +00:00
}
else
{
2014-12-19 11:41:50 +01:00
nSizeRet = ser_readdata64 ( is ) ;
2014-09-28 18:22:44 -04:00
if ( nSizeRet < 0x100000000ULL )
Reject non-canonically-encoded sizes
The length of vectors, maps, sets, etc are serialized using
Write/ReadCompactSize -- which, unfortunately, do not use a
unique encoding.
So deserializing and then re-serializing a transaction (for example)
can give you different bits than you started with. That doesn't
cause any problems that we are aware of, but it is exactly the type
of subtle mismatch that can lead to exploits.
With this pull, reading a non-canonical CompactSize throws an
exception, which means nodes will ignore 'tx' or 'block' or
other messages that are not properly encoded.
Please check my logic... but this change is safe with respect to
causing a network split. Old clients that receive
non-canonically-encoded transactions or blocks deserialize
them into CTransaction/CBlock structures in memory, and then
re-serialize them before relaying them to peers.
And please check my logic with respect to causing a blockchain
split: there are no CompactSize fields in the block header, so
the block hash is always canonical. The merkle root in the block
header is computed on a vector<CTransaction>, so
any non-canonical encoding of the transactions in 'tx' or 'block'
messages is erased as they are read into memory by old clients,
and does not affect the block hash. And, as noted above, old
clients re-serialize (with canonical encoding) 'tx' and 'block'
messages before relaying to peers.
2013-08-07 12:21:34 +10:00
throw std : : ios_base : : failure ( " non-canonical ReadCompactSize() " ) ;
2010-08-29 16:58:15 +00:00
}
2020-10-08 20:27:27 -07:00
if ( range_check & & nSizeRet > MAX_SIZE ) {
2015-01-08 11:44:25 +01:00
throw std : : ios_base : : failure ( " ReadCompactSize(): size too large " ) ;
2020-10-08 20:27:27 -07:00
}
2010-08-29 16:58:15 +00:00
return nSizeRet ;
}
2014-10-31 11:34:30 +08:00
/**
 * Variable-length integers: bytes are a MSB base-128 encoding of the number.
 * The high bit in each byte signifies whether another digit follows. To make
 * sure the encoding is one-to-one, one is subtracted from all but the last digit.
 * Thus, the byte sequence a[] with length len, where all but the last byte
 * has bit 128 set, encodes the number:
 *
 *  (a[len-1] & 0x7F) + sum(i=1..len-1, 128^i*((a[len-i-1] & 0x7F)+1))
 *
 * Properties:
 * * Very small (0-127: 1 byte, 128-16511: 2 bytes, 16512-2113663: 3 bytes)
 * * Every integer has exactly one encoding
 * * Encoding does not depend on size of original integer type
 * * No redundancy: every (infinite) byte sequence corresponds to a list
 *   of encoded integers.
 *
 * 0:         [0x00]  256:        [0x81 0x00]
 * 1:         [0x01]  16383:      [0xFE 0x7F]
 * 127:       [0x7F]  16384:      [0xFF 0x00]
 * 128:  [0x80 0x00]  16511:      [0xFF 0x7F]
 * 255:  [0x80 0x7F]  65535: [0x82 0xFE 0x7F]
 * 2^32:           [0x8E 0xFE 0xFE 0xFF 0x00]
 */
2012-06-15 14:19:11 +02:00
2017-02-13 13:41:02 -05:00
/**
 * Mode for encoding VarInts.
 *
 * Currently there is no support for signed encodings. The default mode will not
 * compile with signed values, and the legacy "nonnegative signed" mode will
 * accept signed values, but improperly encode and decode them if they are
 * negative. In the future, the DEFAULT mode could be extended to support
 * negative numbers in a backwards compatible way, and additional modes could be
 * added to support different varint formats (e.g. zigzag encoding).
 */
enum class VarIntMode { DEFAULT , NONNEGATIVE_SIGNED } ;
/**
 * Compile-time check that integer type I is allowed with VarInt mode Mode:
 * DEFAULT requires an unsigned type, NONNEGATIVE_SIGNED requires a signed type.
 * Constructing an object of this type triggers the static_asserts.
 */
template <VarIntMode Mode, typename I>
struct CheckVarIntMode {
    constexpr CheckVarIntMode()
    {
        static_assert(Mode != VarIntMode::DEFAULT || std::is_unsigned<I>::value, "Unsigned type required with mode DEFAULT.");
        static_assert(Mode != VarIntMode::NONNEGATIVE_SIGNED || std::is_signed<I>::value, "Signed type required with mode NONNEGATIVE_SIGNED.");
    }
};
template < VarIntMode Mode , typename I >
2012-06-15 14:19:11 +02:00
inline unsigned int GetSizeOfVarInt ( I n )
{
2017-02-13 13:41:02 -05:00
CheckVarIntMode < Mode , I > ( ) ;
2012-06-15 14:19:11 +02:00
int nRet = 0 ;
while ( true ) {
nRet + + ;
if ( n < = 0x7F )
break ;
n = ( n > > 7 ) - 1 ;
}
return nRet ;
}
2016-10-28 17:50:04 -07:00
// Declaration of the WriteVarInt overload for CSizeComputer; its definition is not in
// this part of the file. Declared ahead of the generic Stream template that follows.
template < typename I >
inline void WriteVarInt ( CSizeComputer & os , I n ) ;
2017-02-13 13:41:02 -05:00
template < typename Stream , VarIntMode Mode , typename I >
2012-06-15 14:19:11 +02:00
void WriteVarInt ( Stream & os , I n )
{
2017-02-13 13:41:02 -05:00
CheckVarIntMode < Mode , I > ( ) ;
2012-06-15 14:19:11 +02:00
unsigned char tmp [ ( sizeof ( n ) * 8 + 6 ) / 7 ] ;
int len = 0 ;
while ( true ) {
tmp [ len ] = ( n & 0x7F ) | ( len ? 0x80 : 0x00 ) ;
if ( n < = 0x7F )
break ;
n = ( n > > 7 ) - 1 ;
len + + ;
}
do {
2014-12-19 11:41:50 +01:00
ser_writedata8 ( os , tmp [ len ] ) ;
2012-06-15 14:19:11 +02:00
} while ( len - - ) ;
}
2010-08-29 16:58:15 +00:00
2017-02-13 13:41:02 -05:00
template < typename Stream , VarIntMode Mode , typename I >
2012-06-15 14:19:11 +02:00
I ReadVarInt ( Stream & is )
{
2017-02-13 13:41:02 -05:00
CheckVarIntMode < Mode , I > ( ) ;
2012-06-15 14:19:11 +02:00
I n = 0 ;
while ( true ) {
2014-12-19 11:41:50 +01:00
unsigned char chData = ser_readdata8 ( is ) ;
2017-02-06 02:52:27 +00:00
if ( n > ( std : : numeric_limits < I > : : max ( ) > > 7 ) ) {
throw std : : ios_base : : failure ( " ReadVarInt(): size too large " ) ;
}
2012-06-15 14:19:11 +02:00
n = ( n < < 7 ) | ( chData & 0x7F ) ;
2017-02-06 02:52:27 +00:00
if ( chData & 0x80 ) {
if ( n = = std : : numeric_limits < I > : : max ( ) ) {
throw std : : ios_base : : failure ( " ReadVarInt(): size too large " ) ;
}
2012-06-15 14:19:11 +02:00
n + + ;
2017-02-06 02:52:27 +00:00
} else {
2012-06-15 14:19:11 +02:00
return n ;
2017-02-06 02:52:27 +00:00
}
2012-06-15 14:19:11 +02:00
}
}
2010-08-29 16:58:15 +00:00
2020-01-08 08:56:19 -08:00
/**
 * Simple wrapper class to serialize objects using a formatter; used by Using().
 *
 * T must be an lvalue reference type. The wrapper stores that reference and
 * forwards Serialize/Unserialize to a default-constructed Formatter's
 * Ser(stream, object) / Unser(stream, object).
 */
template <typename Formatter, typename T>
class Wrapper
{
    static_assert(std::is_lvalue_reference<T>::value, "Wrapper needs an lvalue reference type T");

protected:
    T m_object;

public:
    explicit Wrapper(T obj) : m_object(obj) {}
    template <typename Stream> void Serialize(Stream& s) const { Formatter().Ser(s, m_object); }
    template <typename Stream> void Unserialize(Stream& s) { Formatter().Unser(s, m_object); }
};
/** Cause serialization/deserialization of an object to be done using a specified formatter class.
 *
 * To use this, you need a class Formatter that has public functions Ser(stream, const object&) for
 * serialization, and Unser(stream, object&) for deserialization. Serialization routines (inside
 * READWRITE, or directly with << and >> operators), can then use Using<Formatter>(object).
 *
 * This works by constructing a Wrapper<Formatter, T>-wrapped version of object, where T is
 * const during serialization, and non-const during deserialization, which maintains const
 * correctness.
 */
template <typename Formatter, typename T>
static inline Wrapper<Formatter, T&> Using(T&& t) { return Wrapper<Formatter, T&>(t); }
2020-02-06 19:57:32 -08:00
// VARINT_MODE(obj, mode): (de)serialize obj in VarInt format using the given VarIntMode.
# define VARINT_MODE(obj, mode) Using<VarIntFormatter<mode>>(obj)
// VARINT(obj): same, with VarIntMode::DEFAULT (which requires an unsigned type).
# define VARINT(obj) Using<VarIntFormatter<VarIntMode::DEFAULT>>(obj)
2020-10-08 20:27:27 -07:00
// COMPACTSIZE(obj): (de)serialize obj in CompactSize format; the `true` template argument
// is CompactSizeFormatter's RangeCheck flag.
# define COMPACTSIZE(obj) Using<CompactSizeFormatter<true>>(obj)
2020-05-20 11:13:06 -07:00
// LIMITED_STRING(obj, n): (de)serialize obj through LimitedStringFormatter<n>.
// NOTE(review): that formatter is not defined in this part of the file; presumably n is a
// maximum string length -- confirm at its definition.
# define LIMITED_STRING(obj,n) Using<LimitedStringFormatter<n>>(obj)
2012-03-26 16:48:23 +02:00
2020-01-08 09:05:44 -08:00
/** Serialization wrapper class for integers in VarInt format. */
2020-02-06 19:57:32 -08:00
template < VarIntMode Mode >
2020-01-08 09:05:44 -08:00
struct VarIntFormatter
2012-06-15 14:19:11 +02:00
{
2020-01-08 09:05:44 -08:00
template < typename Stream , typename I > void Ser ( Stream & s , I v )
{
WriteVarInt < Stream , Mode , typename std : : remove_cv < I > : : type > ( s , v ) ;
2012-06-15 14:19:11 +02:00
}
2020-01-08 09:05:44 -08:00
template < typename Stream , typename I > void Unser ( Stream & s , I & v )
{
v = ReadVarInt < Stream , Mode , typename std : : remove_cv < I > : : type > ( s ) ;
2012-06-15 14:19:11 +02:00
}
} ;
2020-05-19 14:30:30 -07:00
/** Serialization wrapper class for custom integers and enums.
*
* It permits specifying the serialized size ( 1 to 8 bytes ) and endianness .
*
* Use the big endian mode for values that are stored in memory in native
* byte order , but serialized in big endian notation . This is only intended
* to implement serializers that are compatible with existing formats , and
* its use is not recommended for new data structures .
*/
2020-03-11 08:30:08 -07:00
template < int Bytes , bool BigEndian = false >
2020-02-15 19:48:42 -08:00
struct CustomUintFormatter
{
static_assert ( Bytes > 0 & & Bytes < = 8 , " CustomUintFormatter Bytes out of range " ) ;
static constexpr uint64_t MAX = 0xffffffffffffffff > > ( 8 * ( 8 - Bytes ) ) ;
template < typename Stream , typename I > void Ser ( Stream & s , I v )
{
if ( v < 0 | | v > MAX ) throw std : : ios_base : : failure ( " CustomUintFormatter value out of range " ) ;
2020-03-11 08:30:08 -07:00
if ( BigEndian ) {
uint64_t raw = htobe64 ( v ) ;
2023-06-26 12:12:20 -04:00
s . write ( AsBytes ( Span { & raw , 1 } ) . last ( Bytes ) ) ;
2020-03-11 08:30:08 -07:00
} else {
uint64_t raw = htole64 ( v ) ;
2023-06-26 12:12:20 -04:00
s . write ( AsBytes ( Span { & raw , 1 } ) . first ( Bytes ) ) ;
2020-03-11 08:30:08 -07:00
}
2020-02-15 19:48:42 -08:00
}
template < typename Stream , typename I > void Unser ( Stream & s , I & v )
{
2020-03-30 15:32:39 -07:00
using U = typename std : : conditional < std : : is_enum < I > : : value , std : : underlying_type < I > , std : : common_type < I > > : : type : : type ;
static_assert ( std : : numeric_limits < U > : : max ( ) > = MAX & & std : : numeric_limits < U > : : min ( ) < = 0 , " Assigned type too small " ) ;
2020-02-15 19:48:42 -08:00
uint64_t raw = 0 ;
2020-03-11 08:30:08 -07:00
if ( BigEndian ) {
2023-06-26 12:12:20 -04:00
s . read ( AsWritableBytes ( Span { & raw , 1 } ) . last ( Bytes ) ) ;
2020-03-30 15:32:39 -07:00
v = static_cast < I > ( be64toh ( raw ) ) ;
2020-03-11 08:30:08 -07:00
} else {
2023-06-26 12:12:20 -04:00
s . read ( AsWritableBytes ( Span { & raw , 1 } ) . first ( Bytes ) ) ;
2020-03-30 15:32:39 -07:00
v = static_cast < I > ( le64toh ( raw ) ) ;
2020-03-11 08:30:08 -07:00
}
2020-02-15 19:48:42 -08:00
}
} ;
2020-03-11 08:30:08 -07:00
/** Shorthand for a CustomUintFormatter of the given width with its BigEndian flag set to true. */
template < int Bytes > using BigEndianFormatter = CustomUintFormatter < Bytes , true > ;
2018-04-08 09:39:05 -07:00
2020-02-03 19:49:10 -08:00
/** Formatter for integers in CompactSize format. */
2020-10-08 20:27:27 -07:00
template < bool RangeCheck >
2020-02-03 19:49:10 -08:00
struct CompactSizeFormatter
2016-05-18 13:11:42 -07:00
{
2020-02-03 19:49:10 -08:00
template < typename Stream , typename I >
void Unser ( Stream & s , I & v )
{
2020-10-08 20:27:27 -07:00
uint64_t n = ReadCompactSize < Stream > ( s , RangeCheck ) ;
2020-02-03 19:49:10 -08:00
if ( n < std : : numeric_limits < I > : : min ( ) | | n > std : : numeric_limits < I > : : max ( ) ) {
throw std : : ios_base : : failure ( " CompactSize exceeds limit of type " ) ;
}
v = n ;
2016-05-18 13:11:42 -07:00
}
2020-02-03 19:49:10 -08:00
template < typename Stream , typename I >
void Ser ( Stream & s , I v )
{
static_assert ( std : : is_unsigned < I > : : value , " CompactSize only supported for unsigned integers " ) ;
static_assert ( std : : numeric_limits < I > : : max ( ) < = std : : numeric_limits < uint64_t > : : max ( ) , " CompactSize only supports 64-bit integers and below " ) ;
WriteCompactSize < Stream > ( s , v ) ;
2016-05-18 13:11:42 -07:00
}
} ;
2022-04-07 19:47:52 +02:00
/**
 * Formatter that (de)serializes a chrono time point as its tick count, using the
 * integer type U on the wire.
 *
 * With LOSSY == false the tick count is brace-converted to U, so a narrowing
 * conversion is diagnosed at compile time; with LOSSY == true a plain cast is used.
 */
template<typename U, bool LOSSY = false>
struct ChronoFormatter {
    /** Read a U from s and rebuild the time point from it. */
    template<typename Stream, typename Tp>
    void Unser(Stream& s, Tp& tp)
    {
        using Duration = typename Tp::duration;
        using Rep = typename Duration::rep;

        U raw;
        s >> raw;
        // Lossy deserialization does not make sense, so force Wnarrowing
        tp = Tp{Duration{Rep{raw}}};
    }

    /** Write the tick count of tp (time since epoch) to s as a U. */
    template<typename Stream, typename Tp>
    void Ser(Stream& s, Tp tp)
    {
        const auto ticks = tp.time_since_epoch().count();
        if constexpr (LOSSY) {
            s << U(ticks);
        } else {
            s << U{ticks};
        }
    }
};
/** Shorthand for a ChronoFormatter whose LOSSY flag is set to true. */
template < typename U >
using LossyChronoFormatter = ChronoFormatter < U , true > ;
2019-10-02 15:49:33 -04:00
/** Serializable wrapper that writes a fixed number in CompactSize format. */
class CompactSizeWriter
{
protected:
    uint64_t n; //!< The value written by Serialize()

public:
    explicit CompactSizeWriter(uint64_t n_in) : n{n_in} {}

    /** Write the stored value to s via WriteCompactSize. */
    template<typename Stream>
    void Serialize(Stream& s) const
    {
        WriteCompactSize<Stream>(s, n);
    }
};
2014-08-07 23:00:01 +02:00
template < size_t Limit >
2020-05-20 11:13:06 -07:00
struct LimitedStringFormatter
2014-08-07 23:00:01 +02:00
{
template < typename Stream >
2020-05-20 11:13:06 -07:00
void Unser ( Stream & s , std : : string & v )
2014-08-07 23:00:01 +02:00
{
size_t size = ReadCompactSize ( s ) ;
if ( size > Limit ) {
throw std : : ios_base : : failure ( " String length limit exceeded " ) ;
}
2020-05-20 11:13:06 -07:00
v . resize ( size ) ;
2022-01-02 11:31:25 +01:00
if ( size ! = 0 ) s . read ( MakeWritableByteSpan ( v ) ) ;
2014-08-07 23:00:01 +02:00
}
template < typename Stream >
2020-05-20 11:13:06 -07:00
void Ser ( Stream & s , const std : : string & v )
2014-08-07 23:00:01 +02:00
{
2020-05-20 11:13:06 -07:00
s < < v ;
2014-08-07 23:00:01 +02:00
}
} ;
2020-01-18 06:49:14 -08:00
/** Formatter to serialize/deserialize vector elements using another formatter
*
* Example :
* struct X {
* std : : vector < uint64_t > v ;
* SERIALIZE_METHODS ( X , obj ) { READWRITE ( Using < VectorFormatter < VarInt > > ( obj . v ) ) ; }
* } ;
* will define a struct that contains a vector of uint64_t , which is serialized
* as a vector of VarInt - encoded integers .
*
* V is not required to be an std : : vector type . It works for any class that
2020-02-15 19:09:09 -08:00
* exposes a value_type , size , reserve , emplace_back , back , and const iterators .
2020-01-18 06:49:14 -08:00
*/
template < class Formatter >
struct VectorFormatter
{
template < typename Stream , typename V >
void Ser ( Stream & s , const V & v )
{
2020-02-15 19:09:09 -08:00
Formatter formatter ;
2020-01-18 06:49:14 -08:00
WriteCompactSize ( s , v . size ( ) ) ;
for ( const typename V : : value_type & elem : v ) {
2020-02-15 19:09:09 -08:00
formatter . Ser ( s , elem ) ;
2020-01-18 06:49:14 -08:00
}
}
template < typename Stream , typename V >
void Unser ( Stream & s , V & v )
{
2020-02-15 19:09:09 -08:00
Formatter formatter ;
2020-01-18 06:49:14 -08:00
v . clear ( ) ;
size_t size = ReadCompactSize ( s ) ;
size_t allocated = 0 ;
while ( allocated < size ) {
// For DoS prevention, do not blindly allocate as much as the stream claims to contain.
// Instead, allocate in 5MiB batches, so that an attacker actually needs to provide
// X MiB of data to make us allocate X+5 Mib.
static_assert ( sizeof ( typename V : : value_type ) < = MAX_VECTOR_ALLOCATE , " Vector element size too large " ) ;
allocated = std : : min ( size , allocated + MAX_VECTOR_ALLOCATE / sizeof ( typename V : : value_type ) ) ;
v . reserve ( allocated ) ;
while ( v . size ( ) < allocated ) {
2020-02-15 19:09:09 -08:00
v . emplace_back ( ) ;
formatter . Unser ( s , v . back ( ) ) ;
2020-01-18 06:49:14 -08:00
}
}
} ;
} ;
2014-10-31 11:34:30 +08:00
/**
* Forward declarations
*/
2010-08-29 16:58:15 +00:00
2014-10-31 11:34:30 +08:00
/**
* string
*/
2016-10-28 16:29:17 -07:00
template < typename Stream , typename C > void Serialize ( Stream & os , const std : : basic_string < C > & str ) ;
template < typename Stream , typename C > void Unserialize ( Stream & is , std : : basic_string < C > & str ) ;
2010-08-29 16:58:15 +00:00
2015-10-29 07:11:24 +01:00
/**
* prevector
* prevectors of unsigned char are a special case and are intended to be serialized as a single opaque blob .
*/
2016-10-28 16:29:17 -07:00
template < typename Stream , unsigned int N , typename T > inline void Serialize ( Stream & os , const prevector < N , T > & v ) ;
template < typename Stream , unsigned int N , typename T > inline void Unserialize ( Stream & is , prevector < N , T > & v ) ;
2015-10-29 07:11:24 +01:00
2014-10-31 11:34:30 +08:00
/**
* vector
* vectors of unsigned char are a special case and are intended to be serialized as a single opaque blob .
*/
2016-10-28 16:29:17 -07:00
template < typename Stream , typename T , typename A > inline void Serialize ( Stream & os , const std : : vector < T , A > & v ) ;
template < typename Stream , typename T , typename A > inline void Unserialize ( Stream & is , std : : vector < T , A > & v ) ;
2010-08-29 16:58:15 +00:00
2014-10-31 11:34:30 +08:00
/**
* pair
*/
2016-10-28 16:29:17 -07:00
template < typename Stream , typename K , typename T > void Serialize ( Stream & os , const std : : pair < K , T > & item ) ;
template < typename Stream , typename K , typename T > void Unserialize ( Stream & is , std : : pair < K , T > & item ) ;
2010-08-29 16:58:15 +00:00
2014-10-31 11:34:30 +08:00
/**
* map
*/
2016-10-28 16:29:17 -07:00
template < typename Stream , typename K , typename T , typename Pred , typename A > void Serialize ( Stream & os , const std : : map < K , T , Pred , A > & m ) ;
template < typename Stream , typename K , typename T , typename Pred , typename A > void Unserialize ( Stream & is , std : : map < K , T , Pred , A > & m ) ;
2010-08-29 16:58:15 +00:00
2014-10-31 11:34:30 +08:00
/**
* set
*/
2016-10-28 16:29:17 -07:00
template < typename Stream , typename K , typename Pred , typename A > void Serialize ( Stream & os , const std : : set < K , Pred , A > & m ) ;
template < typename Stream , typename K , typename Pred , typename A > void Unserialize ( Stream & is , std : : set < K , Pred , A > & m ) ;
2010-08-29 16:58:15 +00:00
2016-11-10 10:54:14 -08:00
/**
* shared_ptr
*/
template < typename Stream , typename T > void Serialize ( Stream & os , const std : : shared_ptr < const T > & p ) ;
template < typename Stream , typename T > void Unserialize ( Stream & os , std : : shared_ptr < const T > & p ) ;
2010-08-29 16:58:15 +00:00
2016-11-10 10:54:14 -08:00
/**
* unique_ptr
*/
template < typename Stream , typename T > void Serialize ( Stream & os , const std : : unique_ptr < const T > & p ) ;
template < typename Stream , typename T > void Unserialize ( Stream & os , std : : unique_ptr < const T > & p ) ;
2010-08-29 16:58:15 +00:00
2014-10-31 11:34:30 +08:00
/**
 * Fallback used when no more specialized overload matches: delegate to the
 * object's own Serialize member function.
 */
template<typename Stream, typename T>
inline void Serialize(Stream& os, const T& a)
{
    a.Serialize(os);
}
/**
 * Fallback counterpart for reading: delegate to the object's own Unserialize
 * member function. The forwarding reference lets temporaries be passed as well.
 */
template<typename Stream, typename T>
inline void Unserialize(Stream& is, T&& a)
{
    a.Unserialize(is);
}
2020-01-29 10:44:52 -08:00
/** Default formatter. Serializes objects as themselves.
 *
 * The vector/prevector serialization code passes this to VectorFormatter
 * to enable reusing that logic. It shouldn't be needed elsewhere.
 */
struct DefaultFormatter
{
    /** Forward to the Serialize overload selected for T. */
    template<typename Stream, typename T>
    static void Ser(Stream& s, const T& t)
    {
        Serialize(s, t);
    }

    /** Forward to the Unserialize overload selected for T. */
    template<typename Stream, typename T>
    static void Unser(Stream& s, T& t)
    {
        Unserialize(s, t);
    }
};
2010-08-29 16:58:15 +00:00
2014-10-31 11:34:30 +08:00
/**
* string
*/
2010-08-29 16:58:15 +00:00
/** Write str as a CompactSize length followed by its raw bytes. */
template<typename Stream, typename C>
void Serialize(Stream& os, const std::basic_string<C>& str)
{
    WriteCompactSize(os, str.size());
    if (str.empty()) return; // length prefix only
    os.write(MakeByteSpan(str));
}
/** Read a CompactSize length, resize str to it and fill it with that many bytes from the stream. */
template<typename Stream, typename C>
void Unserialize(Stream& is, std::basic_string<C>& str)
{
    const unsigned int len = ReadCompactSize(is);
    str.resize(len);
    if (len == 0) return; // nothing follows the length prefix
    is.read(MakeWritableByteSpan(str));
}
2015-10-29 07:11:24 +01:00
/**
* prevector
*/
2023-08-02 19:49:40 +02:00
/**
 * Serialize a prevector. Element type unsigned char is written as one opaque
 * blob (CompactSize length + bytes); every other element type goes through
 * VectorFormatter<DefaultFormatter>.
 */
template<typename Stream, unsigned int N, typename T>
void Serialize(Stream& os, const prevector<N, T>& v)
{
    if constexpr (!std::is_same_v<T, unsigned char>) {
        Serialize(os, Using<VectorFormatter<DefaultFormatter>>(v));
    } else {
        WriteCompactSize(os, v.size());
        if (!v.empty()) {
            os.write(MakeByteSpan(v));
        }
    }
}
2023-08-02 19:51:55 +02:00
template < typename Stream , unsigned int N , typename T >
void Unserialize ( Stream & is , prevector < N , T > & v )
2015-10-29 07:11:24 +01:00
{
2023-08-02 19:51:55 +02:00
if constexpr ( std : : is_same_v < T , unsigned char > ) {
// Limit size per read so bogus size value won't cause out of memory
v . clear ( ) ;
unsigned int nSize = ReadCompactSize ( is ) ;
unsigned int i = 0 ;
while ( i < nSize ) {
unsigned int blk = std : : min ( nSize - i , ( unsigned int ) ( 1 + 4999999 / sizeof ( T ) ) ) ;
v . resize_uninitialized ( i + blk ) ;
is . read ( AsWritableBytes ( Span { & v [ i ] , blk } ) ) ;
i + = blk ;
}
} else {
Unserialize ( is , Using < VectorFormatter < DefaultFormatter > > ( v ) ) ;
2015-10-29 07:11:24 +01:00
}
}
2014-10-31 11:34:30 +08:00
/**
* vector
*/
2023-08-02 19:54:11 +02:00
template < typename Stream , typename T , typename A >
void Serialize ( Stream & os , const std : : vector < T , A > & v )
2010-08-29 16:58:15 +00:00
{
2023-08-02 19:54:11 +02:00
if constexpr ( std : : is_same_v < T , unsigned char > ) {
WriteCompactSize ( os , v . size ( ) ) ;
if ( ! v . empty ( ) )
os . write ( MakeByteSpan ( v ) ) ;
} else if constexpr ( std : : is_same_v < T , bool > ) {
// A special case for std::vector<bool>, as dereferencing
// std::vector<bool>::const_iterator does not result in a const bool&
// due to std::vector's special casing for bool arguments.
WriteCompactSize ( os , v . size ( ) ) ;
for ( bool elem : v ) {
: : Serialize ( os , elem ) ;
}
} else {
Serialize ( os , Using < VectorFormatter < DefaultFormatter > > ( v ) ) ;
2019-08-26 11:32:47 -07:00
}
}
2010-08-29 16:58:15 +00:00
2023-08-02 19:55:20 +02:00
template < typename Stream , typename T , typename A >
void Unserialize ( Stream & is , std : : vector < T , A > & v )
2010-08-29 16:58:15 +00:00
{
2023-08-02 19:55:20 +02:00
if constexpr ( std : : is_same_v < T , unsigned char > ) {
// Limit size per read so bogus size value won't cause out of memory
v . clear ( ) ;
unsigned int nSize = ReadCompactSize ( is ) ;
unsigned int i = 0 ;
while ( i < nSize ) {
unsigned int blk = std : : min ( nSize - i , ( unsigned int ) ( 1 + 4999999 / sizeof ( T ) ) ) ;
v . resize ( i + blk ) ;
is . read ( AsWritableBytes ( Span { & v [ i ] , blk } ) ) ;
i + = blk ;
}
} else {
Unserialize ( is , Using < VectorFormatter < DefaultFormatter > > ( v ) ) ;
2010-08-29 16:58:15 +00:00
}
}
2014-10-31 11:34:30 +08:00
/**
* pair
*/
2010-08-29 16:58:15 +00:00
/** Serialize a pair as its first member followed by its second member. */
template<typename Stream, typename K, typename T>
void Serialize(Stream& os, const std::pair<K, T>& item)
{
    const K& key = item.first;
    const T& value = item.second;
    Serialize(os, key);
    Serialize(os, value);
}
/** Deserialize a pair in place: first member, then second member. */
template<typename Stream, typename K, typename T>
void Unserialize(Stream& is, std::pair<K, T>& item)
{
    K& key = item.first;
    T& value = item.second;
    Unserialize(is, key);
    Unserialize(is, value);
}
2014-10-31 11:34:30 +08:00
/**
* map
*/
2010-08-29 16:58:15 +00:00
/** Serialize a map as a CompactSize entry count followed by every key/value pair in iteration order. */
template<typename Stream, typename K, typename T, typename Pred, typename A>
void Serialize(Stream& os, const std::map<K, T, Pred, A>& m)
{
    WriteCompactSize(os, m.size());
    for (const auto& kv : m) {
        Serialize(os, kv);
    }
}
/**
 * Replace the contents of m with the entries read from the stream: a
 * CompactSize entry count followed by that many key/value pairs.
 */
template<typename Stream, typename K, typename T, typename Pred, typename A>
void Unserialize(Stream& is, std::map<K, T, Pred, A>& m)
{
    m.clear();
    unsigned int nSize = ReadCompactSize(is);
    // The position returned by each insertion is used as the hint for the next one.
    auto hint = m.begin();
    for (unsigned int i = 0; i < nSize; ++i) {
        std::pair<K, T> item;
        Unserialize(is, item);
        // item is not used again, so hand it over instead of copying key and value.
        hint = m.insert(hint, std::move(item));
    }
}
2014-10-31 11:34:30 +08:00
/**
* set
*/
2010-08-29 16:58:15 +00:00
/** Serialize a set as a CompactSize element count followed by every key in iteration order. */
template<typename Stream, typename K, typename Pred, typename A>
void Serialize(Stream& os, const std::set<K, Pred, A>& m)
{
    WriteCompactSize(os, m.size());
    for (const K& key : m) {
        Serialize(os, key);
    }
}
/**
 * Replace the contents of m with the keys read from the stream: a CompactSize
 * element count followed by that many keys.
 */
template<typename Stream, typename K, typename Pred, typename A>
void Unserialize(Stream& is, std::set<K, Pred, A>& m)
{
    m.clear();
    unsigned int nSize = ReadCompactSize(is);
    // The position returned by each insertion is used as the hint for the next one.
    auto hint = m.begin();
    for (unsigned int i = 0; i < nSize; ++i) {
        K key;
        Unserialize(is, key);
        // key is not used again, so hand it over instead of copying it.
        hint = m.insert(hint, std::move(key));
    }
}
2016-11-10 10:54:14 -08:00
/**
* unique_ptr
*/
/** Serialize the object owned by p. p is dereferenced unconditionally, so it must not be null. */
template<typename Stream, typename T>
void Serialize(Stream& os, const std::unique_ptr<const T>& p)
{
    const T& pointee = *p;
    Serialize(os, pointee);
}
/**
 * Replace the object owned by p with a new one built by T's deserializing
 * constructor, T(deserialize, is).
 */
template<typename Stream, typename T>
void Unserialize(Stream& is, std::unique_ptr<const T>& p)
{
    // make_unique instead of a naked new, mirroring the make_shared used for shared_ptr.
    p = std::make_unique<const T>(deserialize, is);
}
/**
* shared_ptr
*/
/** Serialize the object p points to. p is dereferenced unconditionally, so it must not be null. */
template<typename Stream, typename T>
void Serialize(Stream& os, const std::shared_ptr<const T>& p)
{
    const T& pointee = *p;
    Serialize(os, pointee);
}
template < typename Stream , typename T >
void Unserialize ( Stream & is , std : : shared_ptr < const T > & p )
{
p = std : : make_shared < const T > ( deserialize , is ) ;
}
2023-09-14 10:00:45 +10:00
/**
* Support for ( un ) serializing many things at once
*/
template < typename Stream , typename . . . Args >
void SerializeMany ( Stream & s , const Args & . . . args )
{
( : : Serialize ( s , args ) , . . . ) ;
}
template < typename Stream , typename . . . Args >
inline void UnserializeMany ( Stream & s , Args & & . . . args )
{
( : : Unserialize ( s , args ) , . . . ) ;
}
2016-11-10 10:54:14 -08:00
2014-10-31 11:34:30 +08:00
/**
2023-01-31 14:18:42 +01:00
* Support for all macros providing or using the ser_action parameter of the SerializationOps method .
2014-10-31 11:34:30 +08:00
*/
2023-01-31 14:18:42 +01:00
struct ActionSerialize {
2023-09-14 10:00:45 +10:00
static constexpr bool ForRead ( ) { return false ; }
template < typename Stream , typename . . . Args >
static void SerReadWriteMany ( Stream & s , const Args & . . . args )
{
: : SerializeMany ( s , args . . . ) ;
}
template < typename Stream , typename Type , typename Fn >
static void SerRead ( Stream & s , Type & & , Fn & & )
{
}
template < typename Stream , typename Type , typename Fn >
static void SerWrite ( Stream & s , Type & & obj , Fn & & fn )
{
fn ( s , std : : forward < Type > ( obj ) ) ;
}
2014-08-21 00:49:32 +02:00
} ;
2023-01-31 14:18:42 +01:00
struct ActionUnserialize {
2023-09-14 10:00:45 +10:00
static constexpr bool ForRead ( ) { return true ; }
2010-08-29 16:58:15 +00:00
2023-09-14 10:00:45 +10:00
template < typename Stream , typename . . . Args >
static void SerReadWriteMany ( Stream & s , Args & & . . . args )
{
: : UnserializeMany ( s , args . . . ) ;
}
template < typename Stream , typename Type , typename Fn >
static void SerRead ( Stream & s , Type & & obj , Fn & & fn )
{
fn ( s , std : : forward < Type > ( obj ) ) ;
}
template < typename Stream , typename Type , typename Fn >
static void SerWrite ( Stream & s , Type & & , Fn & & )
{
}
} ;
2010-08-29 16:58:15 +00:00
2016-10-28 17:50:04 -07:00
/* ::GetSerializeSize implementations
*
* Computing the serialized size of objects is done through a special stream
* object of type CSizeComputer , which only records the number of bytes written
* to it .
*
* If your Serialize or SerializationOp method has non - trivial overhead for
* serialization , it may be worthwhile to implement a specialized version for
* CSizeComputer , which uses the s . seek ( ) method to record bytes that would
* be written instead .
*/
2014-07-10 20:16:58 +02:00
class CSizeComputer
{
protected :
2023-01-31 11:50:10 +00:00
size_t nSize { 0 } ;
2014-07-10 20:16:58 +02:00
2016-10-28 16:57:24 -07:00
const int nVersion ;
2014-07-10 20:16:58 +02:00
public :
2023-01-31 11:50:10 +00:00
explicit CSizeComputer ( int nVersionIn ) : nVersion ( nVersionIn ) { }
2014-07-10 20:16:58 +02:00
2022-01-02 11:31:25 +01:00
void write ( Span < const std : : byte > src )
2014-07-10 20:16:58 +02:00
{
2022-01-02 11:31:25 +01:00
this - > nSize + = src . size ( ) ;
2014-07-10 20:16:58 +02:00
}
2016-10-28 17:50:04 -07:00
/** Pretend _nSize bytes are written, without specifying them. */
void seek ( size_t _nSize )
{
this - > nSize + = _nSize ;
}
2014-07-10 20:16:58 +02:00
template < typename T >
CSizeComputer & operator < < ( const T & obj )
{
2016-10-28 16:29:17 -07:00
: : Serialize ( * this , obj ) ;
2014-07-10 20:16:58 +02:00
return ( * this ) ;
}
size_t size ( ) const {
return nSize ;
}
2016-10-28 16:29:17 -07:00
int GetVersion ( ) const { return nVersion ; }
2014-07-10 20:16:58 +02:00
} ;
2016-10-28 17:50:04 -07:00
/** Size-only overload: advance the counter by the encoded VarInt size of n instead of writing bytes. */
template<typename I>
inline void WriteVarInt(CSizeComputer& s, I n)
{
    const auto encoded_size = GetSizeOfVarInt<I>(n);
    s.seek(encoded_size);
}
/** Size-only overload: advance the counter by the encoded CompactSize size of nSize instead of writing bytes. */
inline void WriteCompactSize(CSizeComputer& s, uint64_t nSize)
{
    const auto encoded_size = GetSizeOfCompactSize(nSize);
    s.seek(encoded_size);
}
2016-10-28 16:51:33 -07:00
template < typename T >
2018-06-22 18:27:18 +00:00
size_t GetSerializeSize ( const T & t , int nVersion = 0 )
2016-10-28 16:51:33 -07:00
{
2018-06-22 18:27:18 +00:00
return ( CSizeComputer ( nVersion ) < < t ) . size ( ) ;
2016-10-28 16:51:33 -07:00
}
2018-06-14 19:48:30 -05:00
template < typename . . . T >
size_t GetSerializeSizeMany ( int nVersion , const T & . . . t )
2016-10-28 16:51:33 -07:00
{
2018-06-14 19:48:30 -05:00
CSizeComputer sc ( nVersion ) ;
2018-07-18 17:52:43 -07:00
SerializeMany ( sc , t . . . ) ;
return sc . size ( ) ;
}
2020-07-11 05:12:43 +02:00
/** Wrapper that overrides the GetParams() function of a stream (and hides GetVersion/GetType). */
template < typename Params , typename SubStream >
class ParamsStream
{
const Params & m_params ;
SubStream & m_substream ; // private to avoid leaking version/type into serialization code that shouldn't see it
public :
ParamsStream ( const Params & params LIFETIMEBOUND , SubStream & substream LIFETIMEBOUND ) : m_params { params } , m_substream { substream } { }
template < typename U > ParamsStream & operator < < ( const U & obj ) { : : Serialize ( * this , obj ) ; return * this ; }
template < typename U > ParamsStream & operator > > ( U & & obj ) { : : Unserialize ( * this , obj ) ; return * this ; }
void write ( Span < const std : : byte > src ) { m_substream . write ( src ) ; }
void read ( Span < std : : byte > dst ) { m_substream . read ( dst ) ; }
void ignore ( size_t num ) { m_substream . ignore ( num ) ; }
bool eof ( ) const { return m_substream . eof ( ) ; }
size_t size ( ) const { return m_substream . size ( ) ; }
const Params & GetParams ( ) const { return m_params ; }
int GetVersion ( ) = delete ; // Deprecated with Params usage
int GetType ( ) = delete ; // Deprecated with Params usage
} ;
/** Wrapper that serializes objects with the specified parameters. */
template < typename Params , typename T >
class ParamsWrapper
{
const Params & m_params ;
2023-09-14 10:05:23 +10:00
T & m_object ;
2020-07-11 05:12:43 +02:00
public :
2023-09-14 10:05:23 +10:00
explicit ParamsWrapper ( const Params & params , T & obj ) : m_params { params } , m_object { obj } { }
2020-07-11 05:12:43 +02:00
template < typename Stream >
void Serialize ( Stream & s ) const
{
ParamsStream ss { m_params , s } ;
: : Serialize ( ss , m_object ) ;
}
template < typename Stream >
void Unserialize ( Stream & s )
{
ParamsStream ss { m_params , s } ;
: : Unserialize ( ss , m_object ) ;
}
} ;
/**
* Return a wrapper around t that ( de ) serializes it with specified parameter params .
*
* See FORMATTER_METHODS_PARAMS for more information on serialization parameters .
*/
template < typename Params , typename T >
static auto WithParams ( const Params & params , T & & t )
{
2023-09-14 10:05:23 +10:00
return ParamsWrapper < Params , T > { params , t } ;
2020-07-11 05:12:43 +02:00
}
2014-08-28 22:21:03 +02:00
# endif // BITCOIN_SERIALIZE_H