/root/bitcoin/src/headerssync.h

Source (jump to first uncovered line)
// Copyright (c) 2022 The Bitcoin Core developers
// Distributed under the MIT software license, see the accompanying
// file COPYING or http://www.opensource.org/licenses/mit-license.php.

#ifndef BITCOIN_HEADERSSYNC_H
#define BITCOIN_HEADERSSYNC_H

#include <arith_uint256.h>
#include <chain.h>
#include <consensus/params.h>
#include <net.h> // For NodeId
#include <primitives/block.h>
#include <uint256.h>
#include <util/bitdeque.h>
#include <util/hasher.h>

#include <deque>
#include <vector>

// A compressed CBlockHeader, which leaves out the prevhash
struct CompressedHeader {
    // header
    int32_t nVersion{0};
    uint256 hashMerkleRoot;
    uint32_t nTime{0};
    uint32_t nBits{0};
    uint32_t nNonce{0};

    CompressedHeader()
    {
        hashMerkleRoot.SetNull();
    }

    CompressedHeader(const CBlockHeader& header)
    {
        nVersion = header.nVersion;
        hashMerkleRoot = header.hashMerkleRoot;
        nTime = header.nTime;
        nBits = header.nBits;
        nNonce = header.nNonce;
    }

    CBlockHeader GetFullHeader(const uint256& hash_prev_block) {
        CBlockHeader ret;
        ret.nVersion = nVersion;
        ret.hashPrevBlock = hash_prev_block;
        ret.hashMerkleRoot = hashMerkleRoot;
        ret.nTime = nTime;
        ret.nBits = nBits;
        ret.nNonce = nNonce;
        return ret;
    };
};

/** HeadersSyncState:
 *
 * We wish to download a peer's headers chain in a DoS-resistant way.
 *
 * The Bitcoin protocol does not offer an easy way to determine the work on a
 * peer's chain. Currently, we can query a peer's headers by using a GETHEADERS
 * message, and our peer can return a set of up to 2000 headers that connect to
 * something we know. If a peer's chain has more than 2000 blocks, then we need
 * a way to verify that the chain actually has enough work on it to be useful to
 * us -- by being above our anti-DoS minimum-chain-work threshold -- before we
 * commit to storing those headers in memory. Otherwise, it would be cheap for
 * an attacker to waste all our memory by serving us low-work headers
 * (particularly for a new node coming online for the first time).
 *
 * To prevent memory-DoS with low-work headers, while still always being
 * able to reorg to whatever the most-work chain is, we require that a chain
 * meet a work threshold before committing it to memory. We can do this by
 * downloading a peer's headers twice, whenever we are not sure that the chain
 * has sufficient work:
 *
 * - In the first download phase, called pre-synchronization, we can calculate
 * the work on the chain as we go (just by checking the nBits value on each
 * header, and validating the proof-of-work).
 *
 * - Once we have reached a header where the cumulative chain work is
 * sufficient, we switch to downloading the headers a second time, this time
 * processing them fully, and possibly storing them in memory.
 *
 * To prevent an attacker from using (eg) the honest chain to convince us that
 * they have a high-work chain, but then feeding us an alternate set of
 * low-difficulty headers in the second phase, we store commitments to the
 * chain we see in the first download phase that we check in the second phase,
 * as follows:
 *
 * - In phase 1 (presync), store 1 bit (using a salted hash function) for every
 * N headers that we see. With a reasonable choice of N, this uses relatively
 * little memory even for a very long chain.
 *
 * - In phase 2 (redownload), keep a lookahead buffer and only accept headers
 * from that buffer into the block index (permanent memory usage) once they
 * have some target number of verified commitments on top of them. With this
 * parametrization, we can achieve a given security target for potential
 * permanent memory usage, while choosing N to minimize memory use during the
 * sync (temporary, per-peer storage).
 */

/** State object for one headers sync using the download-twice mechanism.
 *
 * The sync is in one of the phases listed in State; callers feed received
 * headers to ProcessNextHeaders() and use NextHeadersRequestLocator() to
 * build the follow-up request. */
class HeadersSyncState {
public:
    ~HeadersSyncState() = default;

    enum class State {
        /** PRESYNC means the peer has not yet demonstrated their chain has
         * sufficient work and we're only building commitments to the chain they
         * serve us. */
        PRESYNC,
        /** REDOWNLOAD means the peer has given us a high-enough-work chain,
         * and now we're redownloading the headers we saw before and trying to
         * accept them */
        REDOWNLOAD,
        /** We're done syncing with this peer and can discard any remaining state */
        FINAL
    };

    /** Return the current state of our download */
    State GetState() const { return m_download_state; }

    /** Return the height reached during the PRESYNC phase
     * (the value of m_current_height). */
    int64_t GetPresyncHeight() const { return m_current_height; }

    /** Return the block timestamp (nTime) of the last header received during the PRESYNC phase. */
    uint32_t GetPresyncTime() const { return m_last_header_received.nTime; }

    /** Return the amount of work in the chain received during the PRESYNC phase
     * (a copy of m_current_chain_work). */
    arith_uint256 GetPresyncWork() const { return m_current_chain_work; }

    /** Construct a HeadersSyncState object representing a headers sync via this
     *  download-twice mechanism.
     *
     * id: node id (for logging)
     * consensus_params: parameters needed for difficulty adjustment validation
     * chain_start: best known fork point that the peer's headers branch from
     * minimum_required_work: amount of chain work required to accept the chain
     */
    HeadersSyncState(NodeId id, const Consensus::Params& consensus_params,
            const CBlockIndex* chain_start, const arith_uint256& minimum_required_work);

    /** Result data structure for ProcessNextHeaders. */
    struct ProcessingResult {
        /** Headers the caller can fully process and validate now. */
        std::vector<CBlockHeader> pow_validated_headers;
        /** False if an error was detected and the sync was aborted; true otherwise.
         * Defaults to false. */
        bool success{false};
        /** If true, the caller is suggested to send another getheaders message.
         * Defaults to false. */
        bool request_more{false};
    };

    /** Process a batch of headers, once a sync via this mechanism has started
     *
     * received_headers: headers that were received over the network for processing.
     *                   Assumes the caller has already verified the headers
     *                   are continuous, and has checked that each header
     *                   satisfies the proof-of-work target included in the
     *                   header (but not necessarily verified that the
     *                   proof-of-work target is correct and passes consensus
     *                   rules).
     * full_headers_message: true if the message was at max capacity,
     *                       indicating more headers may be available
     * ProcessingResult.pow_validated_headers: will be filled in with any
     *                       headers that the caller can fully process and
     *                       validate now (because these returned headers are
     *                       on a chain with sufficient work)
     * ProcessingResult.success: set to false if an error is detected and the sync is
     *                       aborted; true otherwise.
     * ProcessingResult.request_more: if true, the caller is suggested to call
     *                       NextHeadersRequestLocator and send a getheaders message using it.
     */
    ProcessingResult ProcessNextHeaders(const std::vector<CBlockHeader>&
            received_headers, bool full_headers_message);

    /** Build the locator for the next GETHEADERS message to our peer.
     *
     * This will return a locator appropriate for the current sync object, to continue the
     * synchronization phase it is in. The method is const and only returns the
     * locator; sending the message is left to the caller.
     */
    CBlockLocator NextHeadersRequestLocator() const;

protected:
    /** The (secret) offset on the heights for which to create commitments.
     *
     * m_header_commitments entries are created at any height h for which
     * (h % HEADER_COMMITMENT_PERIOD) == m_commit_offset.
     *
     * Declared protected (unlike the other data members), so derived classes
     * can read it. */
    const unsigned m_commit_offset;

private:
    /** Clear out all download state that might be in progress (freeing any used
     * memory), and mark this object as no longer usable.
     */
    void Finalize();

    /**
     *  Only called in PRESYNC.
     *  Validate the work on the headers we received from the network, and
     *  store commitments for later. Update overall state with successfully
     *  processed headers.
     *  On failure, this invokes Finalize() and returns false.
     */
    bool ValidateAndStoreHeadersCommitments(const std::vector<CBlockHeader>& headers);

    /** In PRESYNC, process and update state for a single header.
     * NOTE(review): the bool return presumably signals whether the header was
     * accepted -- confirm against the definition. */
    bool ValidateAndProcessSingleHeader(const CBlockHeader& current);

    /** In REDOWNLOAD, check a header's commitment (if applicable) and add to
     * buffer for later processing.
     * NOTE(review): the bool return presumably signals whether the header was
     * accepted -- confirm against the definition. */
    bool ValidateAndStoreRedownloadedHeader(const CBlockHeader& header);

    /** Return a set of headers that satisfy our proof-of-work threshold */
    std::vector<CBlockHeader> PopHeadersReadyForAcceptance();

    // Data members. Members are initialized in declaration order, so keep the
    // order stable when editing.
private:
    /** NodeId of the peer (used for log messages) */
    const NodeId m_id;

    /** We use the consensus params in our anti-DoS calculations.
     * Held by reference: the referenced object must outlive this
     * HeadersSyncState. */
    const Consensus::Params& m_consensus_params;

    /** Store the last block in our block index that the peer's chain builds from.
     * Raw pointer; the defaulted destructor does not delete it. */
    const CBlockIndex* m_chain_start{nullptr};

    /** Minimum work that we're looking for on this chain. */
    const arith_uint256 m_minimum_required_work;

    /** Work that we've seen so far on the peer's chain */
    arith_uint256 m_current_chain_work;

    /** m_hasher is a salted hasher for making our 1-bit commitments to headers we've seen. */
    const SaltedTxidHasher m_hasher;

    /** A queue of commitment bits, created during the 1st phase, and verified during the 2nd. */
    bitdeque<> m_header_commitments;

    /** m_max_commitments is a bound we calculate on how long an honest peer's chain could be,
     * given the MTP rule.
     *
     * Any peer giving us more headers than this will have its sync aborted. This serves as a
     * memory bound on m_header_commitments. */
    uint64_t m_max_commitments{0};

    /** Store the latest header received while in PRESYNC (initialized to m_chain_start) */
    CBlockHeader m_last_header_received;

    /** Height of m_last_header_received */
    int64_t m_current_height{0};

    /** During phase 2 (REDOWNLOAD), we buffer redownloaded headers in memory
     *  until enough commitments have been verified; those are stored in
     *  m_redownloaded_headers */
    std::deque<CompressedHeader> m_redownloaded_headers;

    /** Height of last header in m_redownloaded_headers */
    int64_t m_redownload_buffer_last_height{0};

    /** Hash of last header in m_redownloaded_headers (initialized to
     * m_chain_start). We have to cache it because we don't have hashPrevBlock
     * available in a CompressedHeader.
     */
    uint256 m_redownload_buffer_last_hash;

    /** The hashPrevBlock entry for the first header in m_redownloaded_headers.
     * We need this to reconstruct the full header when it's time for
     * processing.
     */
    uint256 m_redownload_buffer_first_prev_hash;

    /** The accumulated work on the redownloaded chain. */
    arith_uint256 m_redownload_chain_work;

    /** Set this to true once we encounter the target blockheader during phase
     * 2 (REDOWNLOAD). At this point, we can process and store all remaining
     * headers still in m_redownloaded_headers.
     */
    bool m_process_all_remaining_headers{false};

    /** Current state of our headers sync. Starts in PRESYNC. */
    State m_download_state{State::PRESYNC};
};

#endif // BITCOIN_HEADERSSYNC_H

Coverage Report

Created: 2025-02-21 14:37

Line	Count	Source (jump to first uncovered line)
1		// Copyright (c) 2022 The Bitcoin Core developers
2		// Distributed under the MIT software license, see the accompanying
3		// file COPYING or http://www.opensource.org/licenses/mit-license.php.
4
5		#ifndef BITCOIN_HEADERSSYNC_H
6		#define BITCOIN_HEADERSSYNC_H
7
8		#include <arith_uint256.h>
9		#include <chain.h>
10		#include <consensus/params.h>
11		#include <net.h> // For NodeId
12		#include <primitives/block.h>
13		#include <uint256.h>
14		#include <util/bitdeque.h>
15		#include <util/hasher.h>
16
17		#include <deque>
18		#include <vector>
19
20		// A compressed CBlockHeader, which leaves out the prevhash
21		struct CompressedHeader {
22		// header
23		int32_t nVersion{0};
24		uint256 hashMerkleRoot;
25		uint32_t nTime{0};
26		uint32_t nBits{0};
27		uint32_t nNonce{0};
28
29		CompressedHeader()
30	0	{
31	0	hashMerkleRoot.SetNull();
32	0	}
33
34		CompressedHeader(const CBlockHeader& header)
35	0	{
36	0	nVersion = header.nVersion;
37	0	hashMerkleRoot = header.hashMerkleRoot;
38	0	nTime = header.nTime;
39	0	nBits = header.nBits;
40	0	nNonce = header.nNonce;
41	0	}
42
43	0	CBlockHeader GetFullHeader(const uint256& hash_prev_block) {
44	0	CBlockHeader ret;
45	0	ret.nVersion = nVersion;
46	0	ret.hashPrevBlock = hash_prev_block;
47	0	ret.hashMerkleRoot = hashMerkleRoot;
48	0	ret.nTime = nTime;
49	0	ret.nBits = nBits;
50	0	ret.nNonce = nNonce;
51	0	return ret;
52	0	};
53		};
54
55		/** HeadersSyncState:
56		*
57		* We wish to download a peer's headers chain in a DoS-resistant way.
58		*
59		* The Bitcoin protocol does not offer an easy way to determine the work on a
60		* peer's chain. Currently, we can query a peer's headers by using a GETHEADERS
61		* message, and our peer can return a set of up to 2000 headers that connect to
62		* something we know. If a peer's chain has more than 2000 blocks, then we need
63		* a way to verify that the chain actually has enough work on it to be useful to
64		* us -- by being above our anti-DoS minimum-chain-work threshold -- before we
65		* commit to storing those headers in memory. Otherwise, it would be cheap for
66		* an attacker to waste all our memory by serving us low-work headers
67		* (particularly for a new node coming online for the first time).
68		*
69		* To prevent memory-DoS with low-work headers, while still always being
70		* able to reorg to whatever the most-work chain is, we require that a chain
71		* meet a work threshold before committing it to memory. We can do this by
72		* downloading a peer's headers twice, whenever we are not sure that the chain
73		* has sufficient work:
74		*
75		* - In the first download phase, called pre-synchronization, we can calculate
76		* the work on the chain as we go (just by checking the nBits value on each
77		* header, and validating the proof-of-work).
78		*
79		* - Once we have reached a header where the cumulative chain work is
80		* sufficient, we switch to downloading the headers a second time, this time
81		* processing them fully, and possibly storing them in memory.
82		*
83		* To prevent an attacker from using (eg) the honest chain to convince us that
84		* they have a high-work chain, but then feeding us an alternate set of
85		* low-difficulty headers in the second phase, we store commitments to the
86		* chain we see in the first download phase that we check in the second phase,
87		* as follows:
88		*
89		* - In phase 1 (presync), store 1 bit (using a salted hash function) for every
90		* N headers that we see. With a reasonable choice of N, this uses relatively
91		* little memory even for a very long chain.
92		*
93		* - In phase 2 (redownload), keep a lookahead buffer and only accept headers
94		* from that buffer into the block index (permanent memory usage) once they
95		* have some target number of verified commitments on top of them. With this
96		* parametrization, we can achieve a given security target for potential
97		* permanent memory usage, while choosing N to minimize memory use during the
98		* sync (temporary, per-peer storage).
99		*/
100
101		class HeadersSyncState {
102		public:
103	0	~HeadersSyncState() = default;
104
105		enum class State {
106		/** PRESYNC means the peer has not yet demonstrated their chain has
107		* sufficient work and we're only building commitments to the chain they
108		* serve us. */
109		PRESYNC,
110		/** REDOWNLOAD means the peer has given us a high-enough-work chain,
111		* and now we're redownloading the headers we saw before and trying to
112		* accept them */
113		REDOWNLOAD,
114		/** We're done syncing with this peer and can discard any remaining state */
115		FINAL
116		};
117
118		/** Return the current state of our download */
119	0	State GetState() const { return m_download_state; }
120
121		/** Return the height reached during the PRESYNC phase */
122	0	int64_t GetPresyncHeight() const { return m_current_height; }
123
124		/** Return the block timestamp of the last header received during the PRESYNC phase. */
125	0	uint32_t GetPresyncTime() const { return m_last_header_received.nTime; }
126
127		/** Return the amount of work in the chain received during the PRESYNC phase. */
128	0	arith_uint256 GetPresyncWork() const { return m_current_chain_work; }
129
130		/** Construct a HeadersSyncState object representing a headers sync via this
131		* download-twice mechanism).
132		*
133		* id: node id (for logging)
134		* consensus_params: parameters needed for difficulty adjustment validation
135		* chain_start: best known fork point that the peer's headers branch from
136		* minimum_required_work: amount of chain work required to accept the chain
137		*/
138		HeadersSyncState(NodeId id, const Consensus::Params& consensus_params,
139		const CBlockIndex* chain_start, const arith_uint256& minimum_required_work);
140
141		/** Result data structure for ProcessNextHeaders. */
142		struct ProcessingResult {
143		std::vector<CBlockHeader> pow_validated_headers;
144		bool success{false};
145		bool request_more{false};
146		};
147
148		/** Process a batch of headers, once a sync via this mechanism has started
149		*
150		* received_headers: headers that were received over the network for processing.
151		* Assumes the caller has already verified the headers
152		* are continuous, and has checked that each header
153		* satisfies the proof-of-work target included in the
154		* header (but not necessarily verified that the
155		* proof-of-work target is correct and passes consensus
156		* rules).
157		* full_headers_message: true if the message was at max capacity,
158		* indicating more headers may be available
159		* ProcessingResult.pow_validated_headers: will be filled in with any
160		* headers that the caller can fully process and
161		* validate now (because these returned headers are
162		* on a chain with sufficient work)
163		* ProcessingResult.success: set to false if an error is detected and the sync is
164		* aborted; true otherwise.
165		* ProcessingResult.request_more: if true, the caller is suggested to call
166		* NextHeadersRequestLocator and send a getheaders message using it.
167		*/
168		ProcessingResult ProcessNextHeaders(const std::vector<CBlockHeader>&
169		received_headers, bool full_headers_message);
170
171		/** Issue the next GETHEADERS message to our peer.
172		*
173		* This will return a locator appropriate for the current sync object, to continue the
174		* synchronization phase it is in.
175		*/
176		CBlockLocator NextHeadersRequestLocator() const;
177
178		protected:
179		/** The (secret) offset on the heights for which to create commitments.
180		*
181		* m_header_commitments entries are created at any height h for which
182		* (h % HEADER_COMMITMENT_PERIOD) == m_commit_offset. */
183		const unsigned m_commit_offset;
184
185		private:
186		/** Clear out all download state that might be in progress (freeing any used
187		* memory), and mark this object as no longer usable.
188		*/
189		void Finalize();
190
191		/**
192		* Only called in PRESYNC.
193		* Validate the work on the headers we received from the network, and
194		* store commitments for later. Update overall state with successfully
195		* processed headers.
196		* On failure, this invokes Finalize() and returns false.
197		*/
198		bool ValidateAndStoreHeadersCommitments(const std::vector<CBlockHeader>& headers);
199
200		/** In PRESYNC, process and update state for a single header */
201		bool ValidateAndProcessSingleHeader(const CBlockHeader& current);
202
203		/** In REDOWNLOAD, check a header's commitment (if applicable) and add to
204		* buffer for later processing */
205		bool ValidateAndStoreRedownloadedHeader(const CBlockHeader& header);
206
207		/** Return a set of headers that satisfy our proof-of-work threshold */
208		std::vector<CBlockHeader> PopHeadersReadyForAcceptance();
209
210		private:
211		/** NodeId of the peer (used for log messages) **/
212		const NodeId m_id;
213
214		/** We use the consensus params in our anti-DoS calculations */
215		const Consensus::Params& m_consensus_params;
216
217		/** Store the last block in our block index that the peer's chain builds from */
218		const CBlockIndex* m_chain_start{nullptr};
219
220		/** Minimum work that we're looking for on this chain. */
221		const arith_uint256 m_minimum_required_work;
222
223		/** Work that we've seen so far on the peer's chain */
224		arith_uint256 m_current_chain_work;
225
226		/** m_hasher is a salted hasher for making our 1-bit commitments to headers we've seen. */
227		const SaltedTxidHasher m_hasher;
228
229		/** A queue of commitment bits, created during the 1st phase, and verified during the 2nd. */
230		bitdeque<> m_header_commitments;
231
232		/** m_max_commitments is a bound we calculate on how long an honest peer's chain could be,
233		* given the MTP rule.
234		*
235		* Any peer giving us more headers than this will have its sync aborted. This serves as a
236		* memory bound on m_header_commitments. */
237		uint64_t m_max_commitments{0};
238
239		/** Store the latest header received while in PRESYNC (initialized to m_chain_start) */
240		CBlockHeader m_last_header_received;
241
242		/** Height of m_last_header_received */
243		int64_t m_current_height{0};
244
245		/** During phase 2 (REDOWNLOAD), we buffer redownloaded headers in memory
246		* until enough commitments have been verified; those are stored in
247		* m_redownloaded_headers */
248		std::deque<CompressedHeader> m_redownloaded_headers;
249
250		/** Height of last header in m_redownloaded_headers */
251		int64_t m_redownload_buffer_last_height{0};
252
253		/** Hash of last header in m_redownloaded_headers (initialized to
254		* m_chain_start). We have to cache it because we don't have hashPrevBlock
255		* available in a CompressedHeader.
256		*/
257		uint256 m_redownload_buffer_last_hash;
258
259		/** The hashPrevBlock entry for the first header in m_redownloaded_headers
260		* We need this to reconstruct the full header when it's time for
261		* processing.
262		*/
263		uint256 m_redownload_buffer_first_prev_hash;
264
265		/** The accumulated work on the redownloaded chain. */
266		arith_uint256 m_redownload_chain_work;
267
268		/** Set this to true once we encounter the target blockheader during phase
269		* 2 (REDOWNLOAD). At this point, we can process and store all remaining
270		* headers still in m_redownloaded_headers.
271		*/
272		bool m_process_all_remaining_headers{false};
273
274		/** Current state of our headers sync. */
275		State m_download_state{State::PRESYNC};
276		};
277
278		#endif // BITCOIN_HEADERSSYNC_H