docs/blockfilter_8cpp_source.html

 // Copyright (c) 2018 The Bitcoin Core developers
 // Distributed under the MIT software license, see the accompanying
 // file COPYING or http://www.opensource.org/licenses/mit-license.php.

 #include <blockfilter.h>
 #include <hash.h>
 #include <primitives/transaction.h>
 #include <script/script.h>
 #include <streams.h>

 // Serialization type handed to the stream objects in this file that read and
 // write the encoded filter bytes.
 static constexpr int GCS_SER_TYPE = SER_NETWORK;

 // Serialization version handed to those same stream objects.
 static constexpr int GCS_SER_VERSION = 0;

 // Golomb-Rice encode x with parameter P onto bitwriter: the quotient (x >> P)
 // is emitted in unary, followed by the low P bits of x as the remainder.
 template <typename OStream>
 static void GolombRiceEncode(BitStreamWriter<OStream>& bitwriter, uint8_t P, uint64_t x)
 {
     // Unary quotient: one 1-bit per unit, pushed out in chunks of at most
     // 64 bits per Write call, then a single terminating 0-bit.
     for (uint64_t ones_left = x >> P; ones_left > 0;) {
         const int chunk = ones_left > 64 ? 64 : static_cast<int>(ones_left);
         bitwriter.Write(~0ULL, chunk);
         ones_left -= chunk;
     }
     bitwriter.Write(0, 1);

     // Remainder: Write only emits the P least significant bits, so x can be
     // passed unmasked.
     bitwriter.Write(x, P);
 }

 // Decode one Golomb-Rice coded value with parameter P from bitreader and
 // return it. Inverse of GolombRiceEncode.
 template <typename IStream>
 static uint64_t GolombRiceDecode(BitStreamReader<IStream>& bitreader, uint8_t P)
 {
     // Unary quotient: count 1-bits up to (and consuming) the terminating 0-bit.
     uint64_t quotient = 0;
     for (; bitreader.Read(1) == 1; ++quotient) {
     }

     // The remainder occupies the next P bits.
     const uint64_t low_bits = bitreader.Read(P);

     return (quotient << P) + low_bits;
 }

 // Reduce x, assumed uniform over [0, 2^64), to a value uniform over [0, n)
 // without a modulo: the result is the high 64 bits of the 128-bit product
 // x * n.
 //
 // See: https://lemire.me/blog/2016/06/27/a-fast-alternative-to-the-modulo-reduction/
 static uint64_t MapIntoRange(uint64_t x, uint64_t n)
 {
 #ifdef __SIZEOF_INT128__
     // Native 128-bit arithmetic is available: widen, multiply, keep the top half.
     const unsigned __int128 product = static_cast<unsigned __int128>(x) * n;
     return static_cast<uint64_t>(product >> 64);
 #else
     // No 128-bit type: do schoolbook multiplication on 32-bit halves so that
     // no partial product overflows 64 bits.
     //
     // See: https://stackoverflow.com/a/26855440
     const uint64_t mask32 = 0xFFFFFFFF;

     const uint64_t x_top = x >> 32;
     const uint64_t x_bot = x & mask32;
     const uint64_t n_top = n >> 32;
     const uint64_t n_bot = n & mask32;

     const uint64_t top_top = x_top * n_top;
     const uint64_t top_bot = x_top * n_bot;
     const uint64_t bot_top = x_bot * n_top;
     const uint64_t bot_bot = x_bot * n_bot;

     // Carry out of bits 32..63 of the full product into the upper 64 bits.
     const uint64_t carry = ((bot_bot >> 32) + (bot_top & mask32) + (top_bot & mask32)) >> 32;

     return top_top + (bot_top >> 32) + (top_bot >> 32) + carry;
 #endif
 }

 uint64_t GCSFilter::HashToRange(const Element& element) const
 {
     uint64_t hash = CSipHasher(m_siphash_k0, m_siphash_k1)
         .Write(element.data(), element.size())
         .Finalize();
     return MapIntoRange(hash, m_F);
 }

 // Hash every element into the filter's range and return the hashes sorted in
 // ascending order. Duplicate hash values, if any, are kept.
 std::vector<uint64_t> GCSFilter::BuildHashedSet(const ElementSet& elements) const
 {
     // One output slot per input element, filled in iteration order.
     std::vector<uint64_t> hashes(elements.size());
     auto slot = hashes.begin();
     for (const Element& item : elements) {
         *slot = HashToRange(item);
         ++slot;
     }

     std::sort(hashes.begin(), hashes.end());
     return hashes;
 }

 // Construct an empty filter: store the SipHash key and the P / M parameters,
 // with zero elements (m_N) and an empty hash range (m_F).
 GCSFilter::GCSFilter(uint64_t siphash_k0, uint64_t siphash_k1, uint8_t P, uint32_t M)
     : m_siphash_k0(siphash_k0),
       m_siphash_k1(siphash_k1),
       m_P(P),
       m_M(M),
       m_N(0),
       m_F(0)
 {
 }

 // Construct a filter from already-encoded bytes, taking ownership of
 // encoded_filter. The element count N is read from the front of the data and
 // the whole payload is decoded once to validate it.
 //
 // Throws std::ios_base::failure if N does not fit in 32 bits or if data
 // remains after N values have been decoded.
 GCSFilter::GCSFilter(uint64_t siphash_k0, uint64_t siphash_k1, uint8_t P, uint32_t M,
                      std::vector<unsigned char> encoded_filter)
     : GCSFilter(siphash_k0, siphash_k1, P, M)
 {
     m_encoded = std::move(encoded_filter);

     VectorReader stream(GCS_SER_TYPE, GCS_SER_VERSION, m_encoded, 0);

     // Reject counts that would be truncated when stored in the 32-bit m_N.
     const uint64_t declared_count = ReadCompactSize(stream);
     const uint32_t narrowed_count = static_cast<uint32_t>(declared_count);
     if (narrowed_count != declared_count) {
         throw std::ios_base::failure("N must be <2^32");
     }
     m_N = narrowed_count;
     m_F = static_cast<uint64_t>(m_N) * static_cast<uint64_t>(m_M);

     // Decode exactly N values and discard them; this pass only checks that the
     // payload holds N elements and nothing more. Running out of data is
     // expected to surface as std::ios_base::failure from the stream reads.
     BitStreamReader<VectorReader> bitreader(stream);
     for (uint32_t remaining = m_N; remaining != 0; --remaining) {
         GolombRiceDecode(bitreader, m_P);
     }

     if (stream.empty()) {
         return;
     }
     throw std::ios_base::failure("encoded_filter contains excess data");
 }

 // Construct a filter by encoding a set of elements into m_encoded: the element
 // count N as a compact size, followed by the Golomb-Rice coded differences
 // between consecutive sorted element hashes.
 //
 // Throws std::invalid_argument if the number of elements does not fit in 32 bits.
 GCSFilter::GCSFilter(uint64_t siphash_k0, uint64_t siphash_k1, uint8_t P, uint32_t M,
                      const ElementSet& elements)
     : GCSFilter(siphash_k0, siphash_k1, P, M)
 {
     // Reject counts that would be truncated when stored in the 32-bit m_N.
     const size_t element_count = elements.size();
     const uint32_t narrowed_count = static_cast<uint32_t>(element_count);
     if (narrowed_count != element_count) {
         throw std::invalid_argument("N must be <2^32");
     }
     m_N = narrowed_count;
     // m_F must be set before hashing: HashToRange maps into [0, m_F).
     m_F = static_cast<uint64_t>(m_N) * static_cast<uint64_t>(m_M);

     CVectorWriter stream(GCS_SER_TYPE, GCS_SER_VERSION, m_encoded, 0);
     WriteCompactSize(stream, m_N);

     // An empty set is encoded as the count alone; no bit stream is opened.
     if (!elements.empty()) {
         BitStreamWriter<CVectorWriter> bitwriter(stream);

         const std::vector<uint64_t> sorted_hashes = BuildHashedSet(elements);
         uint64_t previous = 0;
         for (const uint64_t current : sorted_hashes) {
             // Hashes are ascending, so each difference is non-negative.
             GolombRiceEncode(bitwriter, m_P, current - previous);
             previous = current;
         }

         bitwriter.Flush();
     }
 }

 // Return true if any of the `size` query hashes in element_hashes equals a
 // value stored in the filter. The scan walks both sequences forward only, so
 // the query hashes must be in ascending order.
 bool GCSFilter::MatchInternal(const uint64_t* element_hashes, size_t size) const
 {
     VectorReader stream(GCS_SER_TYPE, GCS_SER_VERSION, m_encoded, 0);

     // Consume the element count at the front of the encoding; it has to agree
     // with the cached m_N.
     uint64_t N = ReadCompactSize(stream);
     assert(N == m_N);

     BitStreamReader<VectorReader> bitreader(stream);

     uint64_t filter_value = 0;
     size_t cursor = 0;
     for (uint32_t remaining = m_N; remaining != 0; --remaining) {
         // The filter stores differences; accumulate to recover the value.
         filter_value += GolombRiceDecode(bitreader, m_P);

         // Skip queries that are smaller than the current filter value.
         while (cursor != size && element_hashes[cursor] < filter_value) {
             ++cursor;
         }

         // Out of queries: nothing left that could match.
         if (cursor == size) {
             return false;
         }
         if (element_hashes[cursor] == filter_value) {
             return true;
         }
         // Otherwise the query is larger; advance to the next filter value.
     }

     return false;
 }

 // Check whether a single element may be in the set: hash it and run the
 // matcher over a one-entry query list.
 bool GCSFilter::Match(const Element& element) const
 {
     const uint64_t single_query[1] = {HashToRange(element)};
     return MatchInternal(single_query, 1);
 }

 // Check whether any of the given elements may be in the set: hash and sort
 // them, then run the matcher over the sorted query hashes.
 bool GCSFilter::MatchAny(const ElementSet& elements) const
 {
     const std::vector<uint64_t> sorted_queries = BuildHashedSet(elements);
     const uint64_t* const first_query = sorted_queries.data();
     return MatchInternal(first_query, sorted_queries.size());
 }

 // Collect the elements of a basic block filter: the scriptPubKey bytes of every
 // output created in the block (skipping empty scripts and scripts whose first
 // byte is OP_RETURN) plus the scriptPubKey bytes of every previous output
 // recorded in the block's undo data (skipping empty scripts).
 static GCSFilter::ElementSet BasicFilterElements(const CBlock& block,
                                                  const CBlockUndo& block_undo)
 {
     GCSFilter::ElementSet collected;

     // Scripts of the outputs created by this block's transactions.
     for (const CTransactionRef& tx_ref : block.vtx) {
         for (const CTxOut& output : tx_ref->vout) {
             const CScript& spk = output.scriptPubKey;
             if (!spk.empty() && !(spk[0] == OP_RETURN)) {
                 collected.emplace(spk.begin(), spk.end());
             }
         }
     }

     // Scripts of the previous outputs stored in the undo data.
     for (const CTxUndo& undo_entry : block_undo.vtxundo) {
         for (const Coin& spent_coin : undo_entry.vprevout) {
             const CScript& spk = spent_coin.out.scriptPubKey;
             if (!spk.empty()) {
                 collected.emplace(spk.begin(), spk.end());
             }
         }
     }

     return collected;
 }

 // Build the filter of the requested type for a block and its undo data. The
 // block hash is stored and its first two 64-bit words key the filter's hash.
 //
 // Throws std::invalid_argument for any filter type other than BASIC.
 BlockFilter::BlockFilter(BlockFilterType filter_type, const CBlock& block, const CBlockUndo& block_undo)
     : m_filter_type(filter_type), m_block_hash(block.GetHash())
 {
     // BASIC is the only filter type handled here.
     if (m_filter_type != BlockFilterType::BASIC) {
         throw std::invalid_argument("unknown filter_type");
     }

     m_filter = GCSFilter(m_block_hash.GetUint64(0), m_block_hash.GetUint64(1),
                          BASIC_FILTER_P, BASIC_FILTER_M,
                          BasicFilterElements(block, block_undo));
 }

 // Return the CHash256 digest of the encoded filter bytes.
 uint256 BlockFilter::GetHash() const
 {
     const std::vector<unsigned char>& encoded = GetEncodedFilter();

     uint256 digest;
     CHash256 hasher;
     hasher.Write(encoded.data(), encoded.size());
     hasher.Finalize(digest.begin());
     return digest;
 }

 // Return the filter header that chains onto prev_header: the CHash256 digest
 // of this filter's hash followed by prev_header.
 uint256 BlockFilter::ComputeHeader(const uint256& prev_header) const
 {
     const uint256 own_hash = GetHash();

     uint256 header;
     CHash256 hasher;
     hasher.Write(own_hash.begin(), own_hash.size());
     hasher.Write(prev_header.begin(), prev_header.size());
     hasher.Finalize(header.begin());
     return header;
 }
CTxUndo::vprevout
std::vector< Coin > vprevout
Definition: undo.h:72

BitStreamReader
Definition: streams.h:514

BASIC_FILTER_M
constexpr uint32_t BASIC_FILTER_M
Definition: blockfilter.h:77

CTxOut::scriptPubKey
CScript scriptPubKey
Definition: transaction.h:135

CSipHasher::Write
CSipHasher & Write(uint64_t data)
Hash a 64-bit integer worth of data. It is treated as if this was the little-endian interpretation of ...
Definition: hash.cpp:102

streams.h

Coin
A UTXO entry.
Definition: coins.h:29

CBlock
Definition: block.h:74

ReadCompactSize
uint64_t ReadCompactSize(Stream &is)
Definition: serialize.h:278

WriteCompactSize
void WriteCompactSize(CSizeComputer &os, uint64_t nSize)
Definition: serialize.h:975

CHash256::Write
CHash256 & Write(const unsigned char *data, size_t len)
Definition: hash.h:58

Coin::out
CTxOut out
unspent transaction output
Definition: coins.h:33

BlockFilter::BlockFilter
BlockFilter(BlockFilterType filter_type, const CBlock &block, const CBlockUndo &block_undo)
Definition: blockfilter.cpp:227

BASIC_FILTER_P
constexpr uint8_t BASIC_FILTER_P
Definition: blockfilter.h:76

GCSFilter::MatchAny
bool MatchAny(const ElementSet &elements) const
Checks if any of the given elements may be in the set.
Definition: blockfilter.cpp:197

BASIC
Definition: blockfilter.h:81

CHash256
A hasher class for Bitcoin's 256-bit hash (double SHA-256).
Definition: hash.h:46

BitStreamWriter
Definition: streams.h:557

GCSFilter::BuildHashedSet
std::vector< uint64_t > BuildHashedSet(const ElementSet &elements) const
Definition: blockfilter.cpp:87

BitStreamWriter::Write
void Write(uint64_t data, int nbits)
Write the nbits least significant bits of a 64-bit int to the output stream.
Definition: streams.h:582

BlockFilter::m_filter
GCSFilter m_filter
Definition: blockfilter.h:93

script.h

base_blob::begin
unsigned char * begin()
Definition: uint256.h:56

CTransactionRef
std::shared_ptr< const CTransaction > CTransactionRef
Definition: transaction.h:402

BlockFilter::GetHash
uint256 GetHash() const
Definition: blockfilter.cpp:242

GCSFilter::Match
bool Match(const Element &element) const
Checks if the element may be in the set.
Definition: blockfilter.cpp:191

GCSFilter::MatchInternal
bool MatchInternal(const uint64_t *sorted_element_hashes, size_t size) const
Helper method used to implement Match and MatchAny.
Definition: blockfilter.cpp:159

prevector::end
iterator end()
Definition: prevector.h:303

BlockFilterType
BlockFilterType
Definition: blockfilter.h:79

OP_RETURN
Definition: script.h:86

BlockFilter::GetEncodedFilter
const std::vector< unsigned char > & GetEncodedFilter() const
Definition: blockfilter.h:104

GCSFilter::GCSFilter
GCSFilter(uint64_t siphash_k0=0, uint64_t siphash_k1=0, uint8_t P=0, uint32_t M=0)
Constructs an empty filter.
Definition: blockfilter.cpp:98

VectorReader
Minimal stream for reading from an existing vector by reference.
Definition: streams.h:144

blockfilter.h

GCSFilter::HashToRange
uint64_t HashToRange(const Element &element) const
Hash a data element to an integer in the range [0, N * M).
Definition: blockfilter.cpp:79

CTxOut
An output of a transaction.
Definition: transaction.h:131

base_blob::size
unsigned int size() const
Definition: uint256.h:76

GCSFilter::m_siphash_k0
uint64_t m_siphash_k0
Definition: blockfilter.h:28

BitStreamReader::Read
uint64_t Read(int nbits)
Read the specified number of bits from the stream.
Definition: streams.h:534

GCSFilter
This implements a Golomb-coded set as defined in BIP 158.
Definition: blockfilter.h:21

BitStreamWriter::Flush
void Flush()
Flush any unwritten bits to the output stream, padding with 0's to the next byte boundary.
Definition: streams.h:602

GCSFilter::m_P
uint8_t m_P
Golomb-Rice coding parameter.
Definition: blockfilter.h:30

BlockFilter::ComputeHeader
uint256 ComputeHeader(const uint256 &prev_header) const
Definition: blockfilter.cpp:251

uint256
256-bit opaque blob.
Definition: uint256.h:122

CBlock::vtx
std::vector< CTransactionRef > vtx
Definition: block.h:78

CBlockUndo
Undo information for a CBlock.
Definition: undo.h:100

CScript
Serialized script, used inside transaction inputs and outputs.
Definition: script.h:384

CTxUndo
Undo information for a CTransaction.
Definition: undo.h:68

BlockFilter::m_filter_type
BlockFilterType m_filter_type
Definition: blockfilter.h:91

SER_NETWORK
Definition: serialize.h:164

prevector::empty
bool empty() const
Definition: prevector.h:297

CSipHasher
SipHash-2-4.
Definition: hash.h:247

BlockFilter::m_block_hash
uint256 m_block_hash
Definition: blockfilter.h:92

prevector::begin
iterator begin()
Definition: prevector.h:301

GCSFilter::Element
std::vector< unsigned char > Element
Definition: blockfilter.h:24

VectorReader::empty
bool empty() const
Definition: streams.h:190

CVectorWriter
Definition: streams.h:77

GCSFilter::m_N
uint32_t m_N
Number of elements in the filter.
Definition: blockfilter.h:32

hash.h

base_blob::GetUint64
uint64_t GetUint64(int pos) const
Definition: uint256.h:81

CBlockUndo::vtxundo
std::vector< CTxUndo > vtxundo
Definition: undo.h:103

GCSFilter::m_F
uint64_t m_F
Range of element hashes, F = N * M.
Definition: blockfilter.h:33

transaction.h

GCSFilter::m_M
uint32_t m_M
Inverse false positive rate.
Definition: blockfilter.h:31

GCSFilter::ElementSet
std::set< Element > ElementSet
Definition: blockfilter.h:25

GCSFilter::m_siphash_k1
uint64_t m_siphash_k1
Definition: blockfilter.h:29

GCSFilter::m_encoded
std::vector< unsigned char > m_encoded
Definition: blockfilter.h:34