/root/bitcoin/src/index/blockfilterindex.cpp

Source (jump to first uncovered line)
// Copyright (c) 2018-2022 The Bitcoin Core developers
// Distributed under the MIT software license, see the accompanying
// file COPYING or http://www.opensource.org/licenses/mit-license.php.

#include <map>

#include <clientversion.h>
#include <common/args.h>
#include <dbwrapper.h>
#include <hash.h>
#include <index/blockfilterindex.h>
#include <logging.h>
#include <node/blockstorage.h>
#include <undo.h>
#include <util/fs_helpers.h>
#include <validation.h>

/* The index database stores three items for each block: the disk location of the encoded filter,
 * its dSHA256 hash, and the header. Those belonging to blocks on the active chain are indexed by
 * height, and those belonging to blocks that have been reorganized out of the active chain are
 * indexed by block hash. This ensures that filter data for any block that becomes part of the
 * active chain can always be retrieved, alleviating timing concerns.
 *
 * The filters themselves are stored in flat files and referenced by the LevelDB entries. This
 * minimizes the amount of data written to LevelDB and keeps the database values constant size. The
 * disk location of the next block filter to be written (represented as a FlatFilePos) is stored
 * under the DB_FILTER_POS key.
 *
 * Keys for the height index have the type [DB_BLOCK_HEIGHT, uint32 (BE)]. The height is represented
 * as big-endian so that sequential reads of filters by height are fast.
 * Keys for the hash index have the type [DB_BLOCK_HASH, uint256].
 */
constexpr uint8_t DB_BLOCK_HASH{'s'};
constexpr uint8_t DB_BLOCK_HEIGHT{'t'};
constexpr uint8_t DB_FILTER_POS{'P'};

constexpr unsigned int MAX_FLTR_FILE_SIZE = 0x1000000; // 16 MiB
/** The pre-allocation chunk size for fltr?????.dat files */
constexpr unsigned int FLTR_FILE_CHUNK_SIZE = 0x100000; // 1 MiB
/** Maximum size of the cfheaders cache
 *  We have a limit to prevent a bug in filling this cache
 *  potentially turning into an OOM. At 2000 entries, this cache
 *  is big enough for a 2,000,000 length block chain, which
 *  we should be enough until ~2047. */
constexpr size_t CF_HEADERS_CACHE_MAX_SZ{2000};

namespace {

struct DBVal {
    uint256 hash;
    uint256 header;
    FlatFilePos pos;

    SERIALIZE_METHODS(DBVal, obj) { READWRITE(obj.hash, obj.header, obj.pos); }
};

struct DBHeightKey {
    int height;

    explicit DBHeightKey(int height_in) : height(height_in) {}

    template<typename Stream>
    void Serialize(Stream& s) const
    {
        ser_writedata8(s, DB_BLOCK_HEIGHT);
        ser_writedata32be(s, height);
    }

    template<typename Stream>
    void Unserialize(Stream& s)
    {
        const uint8_t prefix{ser_readdata8(s)};
        if (prefix != DB_BLOCK_HEIGHT) {
            throw std::ios_base::failure("Invalid format for block filter index DB height key");
        }
        height = ser_readdata32be(s);
    }
};

struct DBHashKey {
    uint256 hash;

    explicit DBHashKey(const uint256& hash_in) : hash(hash_in) {}

    SERIALIZE_METHODS(DBHashKey, obj) {
        uint8_t prefix{DB_BLOCK_HASH};
        READWRITE(prefix);
        if (prefix != DB_BLOCK_HASH) {
            throw std::ios_base::failure("Invalid format for block filter index DB hash key");
        }

        READWRITE(obj.hash);
    }
};

}; // namespace

static std::map<BlockFilterType, BlockFilterIndex> g_filter_indexes;

BlockFilterIndex::BlockFilterIndex(std::unique_ptr<interfaces::Chain> chain, BlockFilterType filter_type,
                                   size_t n_cache_size, bool f_memory, bool f_wipe)
    : BaseIndex(std::move(chain), BlockFilterTypeName(filter_type) + " block filter index")
    , m_filter_type(filter_type)
{
    const std::string& filter_name = BlockFilterTypeName(filter_type);
    if (filter_name.empty()) throw std::invalid_argument("unknown filter_type");

    fs::path path = gArgs.GetDataDirNet() / "indexes" / "blockfilter" / fs::u8path(filter_name);
    fs::create_directories(path);

    m_db = std::make_unique<BaseIndex::DB>(path / "db", n_cache_size, f_memory, f_wipe);
    m_filter_fileseq = std::make_unique<FlatFileSeq>(std::move(path), "fltr", FLTR_FILE_CHUNK_SIZE);
}

bool BlockFilterIndex::CustomInit(const std::optional<interfaces::BlockRef>& block)
{
    if (!m_db->Read(DB_FILTER_POS, m_next_filter_pos)) {
        // Check that the cause of the read failure is that the key does not exist. Any other errors
        // indicate database corruption or a disk failure, and starting the index would cause
        // further corruption.
        if (m_db->Exists(DB_FILTER_POS)) {
            LogError("%s: Cannot read current %s state; index may be corrupted\n",
                         __func__, GetName());
            return false;
        }

        // If the DB_FILTER_POS is not set, then initialize to the first location.
        m_next_filter_pos.nFile = 0;
        m_next_filter_pos.nPos = 0;
    }

    if (block) {
        auto op_last_header = ReadFilterHeader(block->height, block->hash);
        if (!op_last_header) {
            LogError("Cannot read last block filter header; index may be corrupted\n");
            return false;
        }
        m_last_header = *op_last_header;
    }

    return true;
}

bool BlockFilterIndex::CustomCommit(CDBBatch& batch)
{
    const FlatFilePos& pos = m_next_filter_pos;

    // Flush current filter file to disk.
    AutoFile file{m_filter_fileseq->Open(pos)};
    if (file.IsNull()) {
        LogError("%s: Failed to open filter file %d\n", __func__, pos.nFile);
        return false;
    }
    if (!file.Commit()) {
        LogError("%s: Failed to commit filter file %d\n", __func__, pos.nFile);
        return false;
    }

    batch.Write(DB_FILTER_POS, pos);
    return true;
}

bool BlockFilterIndex::ReadFilterFromDisk(const FlatFilePos& pos, const uint256& hash, BlockFilter& filter) const
{
    AutoFile filein{m_filter_fileseq->Open(pos, true)};
    if (filein.IsNull()) {
        return false;
    }

    // Check that the hash of the encoded_filter matches the one stored in the db.
    uint256 block_hash;
    std::vector<uint8_t> encoded_filter;
    try {
        filein >> block_hash >> encoded_filter;
        if (Hash(encoded_filter) != hash) {
            LogError("Checksum mismatch in filter decode.\n");
            return false;
        }
        filter = BlockFilter(GetFilterType(), block_hash, std::move(encoded_filter), /*skip_decode_check=*/true);
    }
    catch (const std::exception& e) {
        LogError("%s: Failed to deserialize block filter from disk: %s\n", __func__, e.what());
        return false;
    }

    return true;
}

size_t BlockFilterIndex::WriteFilterToDisk(FlatFilePos& pos, const BlockFilter& filter)
{
    assert(filter.GetFilterType() == GetFilterType());

    size_t data_size =
        GetSerializeSize(filter.GetBlockHash()) +
        GetSerializeSize(filter.GetEncodedFilter());

    // If writing the filter would overflow the file, flush and move to the next one.
    if (pos.nPos + data_size > MAX_FLTR_FILE_SIZE) {
        AutoFile last_file{m_filter_fileseq->Open(pos)};
        if (last_file.IsNull()) {
            LogPrintf("%s: Failed to open filter file %d\n", __func__, pos.nFile);
            return 0;
        }
        if (!last_file.Truncate(pos.nPos)) {
            LogPrintf("%s: Failed to truncate filter file %d\n", __func__, pos.nFile);
            return 0;
        }
        if (!last_file.Commit()) {
            LogPrintf("%s: Failed to commit filter file %d\n", __func__, pos.nFile);
            return 0;
        }

        pos.nFile++;
        pos.nPos = 0;
    }

    // Pre-allocate sufficient space for filter data.
    bool out_of_space;
    m_filter_fileseq->Allocate(pos, data_size, out_of_space);
    if (out_of_space) {
        LogPrintf("%s: out of disk space\n", __func__);
        return 0;
    }

    AutoFile fileout{m_filter_fileseq->Open(pos)};
    if (fileout.IsNull()) {
        LogPrintf("%s: Failed to open filter file %d\n", __func__, pos.nFile);
        return 0;
    }

    fileout << filter.GetBlockHash() << filter.GetEncodedFilter();
    return data_size;
}

std::optional<uint256> BlockFilterIndex::ReadFilterHeader(int height, const uint256& expected_block_hash)
{
    std::pair<uint256, DBVal> read_out;
    if (!m_db->Read(DBHeightKey(height), read_out)) {
        return std::nullopt;
    }

    if (read_out.first != expected_block_hash) {
        LogError("%s: previous block header belongs to unexpected block %s; expected %s\n",
                         __func__, read_out.first.ToString(), expected_block_hash.ToString());
        return std::nullopt;
    }

    return read_out.second.header;
}

bool BlockFilterIndex::CustomAppend(const interfaces::BlockInfo& block)
{
    CBlockUndo block_undo;

    if (block.height > 0) {
        // pindex variable gives indexing code access to node internals. It
        // will be removed in upcoming commit
        const CBlockIndex* pindex = WITH_LOCK(cs_main, return m_chainstate->m_blockman.LookupBlockIndex(block.hash));
        if (!m_chainstate->m_blockman.UndoReadFromDisk(block_undo, *pindex)) {
            return false;
        }
    }

    BlockFilter filter(m_filter_type, *Assert(block.data), block_undo);

    const uint256& header = filter.ComputeHeader(m_last_header);
    bool res = Write(filter, block.height, header);
    if (res) m_last_header = header; // update last header
    return res;
}

bool BlockFilterIndex::Write(const BlockFilter& filter, uint32_t block_height, const uint256& filter_header)
{
    size_t bytes_written = WriteFilterToDisk(m_next_filter_pos, filter);
    if (bytes_written == 0) return false;

    std::pair<uint256, DBVal> value;
    value.first = filter.GetBlockHash();
    value.second.hash = filter.GetHash();
    value.second.header = filter_header;
    value.second.pos = m_next_filter_pos;

    if (!m_db->Write(DBHeightKey(block_height), value)) {
        return false;
    }

    m_next_filter_pos.nPos += bytes_written;
    return true;
}

[[nodiscard]] static bool CopyHeightIndexToHashIndex(CDBIterator& db_it, CDBBatch& batch,
                                       const std::string& index_name,
                                       int start_height, int stop_height)
{
    DBHeightKey key(start_height);
    db_it.Seek(key);

    for (int height = start_height; height <= stop_height; ++height) {
        if (!db_it.GetKey(key) || key.height != height) {
            LogError("%s: unexpected key in %s: expected (%c, %d)\n",
                         __func__, index_name, DB_BLOCK_HEIGHT, height);
            return false;
        }

        std::pair<uint256, DBVal> value;
        if (!db_it.GetValue(value)) {
            LogError("%s: unable to read value in %s at key (%c, %d)\n",
                         __func__, index_name, DB_BLOCK_HEIGHT, height);
            return false;
        }

        batch.Write(DBHashKey(value.first), std::move(value.second));

        db_it.Next();
    }
    return true;
}

bool BlockFilterIndex::CustomRewind(const interfaces::BlockRef& current_tip, const interfaces::BlockRef& new_tip)
{
    CDBBatch batch(*m_db);
    std::unique_ptr<CDBIterator> db_it(m_db->NewIterator());

    // During a reorg, we need to copy all filters for blocks that are getting disconnected from the
    // height index to the hash index so we can still find them when the height index entries are
    // overwritten.
    if (!CopyHeightIndexToHashIndex(*db_it, batch, m_name, new_tip.height, current_tip.height)) {
        return false;
    }

    // The latest filter position gets written in Commit by the call to the BaseIndex::Rewind.
    // But since this creates new references to the filter, the position should get updated here
    // atomically as well in case Commit fails.
    batch.Write(DB_FILTER_POS, m_next_filter_pos);
    if (!m_db->WriteBatch(batch)) return false;

    // Update cached header
    m_last_header = *Assert(ReadFilterHeader(new_tip.height, new_tip.hash));
    return true;
}

static bool LookupOne(const CDBWrapper& db, const CBlockIndex* block_index, DBVal& result)
{
    // First check if the result is stored under the height index and the value there matches the
    // block hash. This should be the case if the block is on the active chain.
    std::pair<uint256, DBVal> read_out;
    if (!db.Read(DBHeightKey(block_index->nHeight), read_out)) {
        return false;
    }
    if (read_out.first == block_index->GetBlockHash()) {
        result = std::move(read_out.second);
        return true;
    }

    // If value at the height index corresponds to an different block, the result will be stored in
    // the hash index.
    return db.Read(DBHashKey(block_index->GetBlockHash()), result);
}

static bool LookupRange(CDBWrapper& db, const std::string& index_name, int start_height,
                        const CBlockIndex* stop_index, std::vector<DBVal>& results)
{
    if (start_height < 0) {
        LogError("%s: start height (%d) is negative\n", __func__, start_height);
        return false;
    }
    if (start_height > stop_index->nHeight) {
        LogError("%s: start height (%d) is greater than stop height (%d)\n",
                     __func__, start_height, stop_index->nHeight);
        return false;
    }

    size_t results_size = static_cast<size_t>(stop_index->nHeight - start_height + 1);
    std::vector<std::pair<uint256, DBVal>> values(results_size);

    DBHeightKey key(start_height);
    std::unique_ptr<CDBIterator> db_it(db.NewIterator());
    db_it->Seek(DBHeightKey(start_height));
    for (int height = start_height; height <= stop_index->nHeight; ++height) {
        if (!db_it->Valid() || !db_it->GetKey(key) || key.height != height) {
            return false;
        }

        size_t i = static_cast<size_t>(height - start_height);
        if (!db_it->GetValue(values[i])) {
            LogError("%s: unable to read value in %s at key (%c, %d)\n",
                         __func__, index_name, DB_BLOCK_HEIGHT, height);
            return false;
        }

        db_it->Next();
    }

    results.resize(results_size);

    // Iterate backwards through block indexes collecting results in order to access the block hash
    // of each entry in case we need to look it up in the hash index.
    for (const CBlockIndex* block_index = stop_index;
         block_index && block_index->nHeight >= start_height;
         block_index = block_index->pprev) {
        uint256 block_hash = block_index->GetBlockHash();

        size_t i = static_cast<size_t>(block_index->nHeight - start_height);
        if (block_hash == values[i].first) {
            results[i] = std::move(values[i].second);
            continue;
        }

        if (!db.Read(DBHashKey(block_hash), results[i])) {
            LogError("%s: unable to read value in %s at key (%c, %s)\n",
                         __func__, index_name, DB_BLOCK_HASH, block_hash.ToString());
            return false;
        }
    }

    return true;
}

bool BlockFilterIndex::LookupFilter(const CBlockIndex* block_index, BlockFilter& filter_out) const
{
    DBVal entry;
    if (!LookupOne(*m_db, block_index, entry)) {
        return false;
    }

    return ReadFilterFromDisk(entry.pos, entry.hash, filter_out);
}

bool BlockFilterIndex::LookupFilterHeader(const CBlockIndex* block_index, uint256& header_out)
{
    LOCK(m_cs_headers_cache);

    bool is_checkpoint{block_index->nHeight % CFCHECKPT_INTERVAL == 0};

    if (is_checkpoint) {
        // Try to find the block in the headers cache if this is a checkpoint height.
        auto header = m_headers_cache.find(block_index->GetBlockHash());
        if (header != m_headers_cache.end()) {
            header_out = header->second;
            return true;
        }
    }

    DBVal entry;
    if (!LookupOne(*m_db, block_index, entry)) {
        return false;
    }

    if (is_checkpoint &&
        m_headers_cache.size() < CF_HEADERS_CACHE_MAX_SZ) {
        // Add to the headers cache if this is a checkpoint height.
        m_headers_cache.emplace(block_index->GetBlockHash(), entry.header);
    }

    header_out = entry.header;
    return true;
}

bool BlockFilterIndex::LookupFilterRange(int start_height, const CBlockIndex* stop_index,
                                         std::vector<BlockFilter>& filters_out) const
{
    std::vector<DBVal> entries;
    if (!LookupRange(*m_db, m_name, start_height, stop_index, entries)) {
        return false;
    }

    filters_out.resize(entries.size());
    auto filter_pos_it = filters_out.begin();
    for (const auto& entry : entries) {
        if (!ReadFilterFromDisk(entry.pos, entry.hash, *filter_pos_it)) {
            return false;
        }
        ++filter_pos_it;
    }

    return true;
}

bool BlockFilterIndex::LookupFilterHashRange(int start_height, const CBlockIndex* stop_index,
                                             std::vector<uint256>& hashes_out) const

{
    std::vector<DBVal> entries;
    if (!LookupRange(*m_db, m_name, start_height, stop_index, entries)) {
        return false;
    }

    hashes_out.clear();
    hashes_out.reserve(entries.size());
    for (const auto& entry : entries) {
        hashes_out.push_back(entry.hash);
    }
    return true;
}

BlockFilterIndex* GetBlockFilterIndex(BlockFilterType filter_type)
{
    auto it = g_filter_indexes.find(filter_type);
    return it != g_filter_indexes.end() ? &it->second : nullptr;
}

void ForEachBlockFilterIndex(std::function<void (BlockFilterIndex&)> fn)
{
    for (auto& entry : g_filter_indexes) fn(entry.second);
}

bool InitBlockFilterIndex(std::function<std::unique_ptr<interfaces::Chain>()> make_chain, BlockFilterType filter_type,
                          size_t n_cache_size, bool f_memory, bool f_wipe)
{
    auto result = g_filter_indexes.emplace(std::piecewise_construct,
                                           std::forward_as_tuple(filter_type),
                                           std::forward_as_tuple(make_chain(), filter_type,
                                                                 n_cache_size, f_memory, f_wipe));
    return result.second;
}

bool DestroyBlockFilterIndex(BlockFilterType filter_type)
{
    return g_filter_indexes.erase(filter_type);
}

void DestroyAllBlockFilterIndexes()
{
    g_filter_indexes.clear();
}

Coverage Report

Created: 2024-10-21 15:10

Line	Count	Source (jump to first uncovered line)
1		// Copyright (c) 2018-2022 The Bitcoin Core developers
2		// Distributed under the MIT software license, see the accompanying
3		// file COPYING or http://www.opensource.org/licenses/mit-license.php.
4
5		#include <map>
6
7		#include <clientversion.h>
8		#include <common/args.h>
9		#include <dbwrapper.h>
10		#include <hash.h>
11		#include <index/blockfilterindex.h>
12		#include <logging.h>
13		#include <node/blockstorage.h>
14		#include <undo.h>
15		#include <util/fs_helpers.h>
16		#include <validation.h>
17
18		/* The index database stores three items for each block: the disk location of the encoded filter,
19		* its dSHA256 hash, and the header. Those belonging to blocks on the active chain are indexed by
20		* height, and those belonging to blocks that have been reorganized out of the active chain are
21		* indexed by block hash. This ensures that filter data for any block that becomes part of the
22		* active chain can always be retrieved, alleviating timing concerns.
23		*
24		* The filters themselves are stored in flat files and referenced by the LevelDB entries. This
25		* minimizes the amount of data written to LevelDB and keeps the database values constant size. The
26		* disk location of the next block filter to be written (represented as a FlatFilePos) is stored
27		* under the DB_FILTER_POS key.
28		*
29		* Keys for the height index have the type [DB_BLOCK_HEIGHT, uint32 (BE)]. The height is represented
30		* as big-endian so that sequential reads of filters by height are fast.
31		* Keys for the hash index have the type [DB_BLOCK_HASH, uint256].
32		*/
33		constexpr uint8_t DB_BLOCK_HASH{'s'};
34		constexpr uint8_t DB_BLOCK_HEIGHT{'t'};
35		constexpr uint8_t DB_FILTER_POS{'P'};
36
37		constexpr unsigned int MAX_FLTR_FILE_SIZE = 0x1000000; // 16 MiB
38		/** The pre-allocation chunk size for fltr?????.dat files */
39		constexpr unsigned int FLTR_FILE_CHUNK_SIZE = 0x100000; // 1 MiB
40		/** Maximum size of the cfheaders cache
41		* We have a limit to prevent a bug in filling this cache
42		* potentially turning into an OOM. At 2000 entries, this cache
43		* is big enough for a 2,000,000 length block chain, which
44		* we should be enough until ~2047. */
45		constexpr size_t CF_HEADERS_CACHE_MAX_SZ{2000};
46
47		namespace {
48
49		struct DBVal {
50		uint256 hash;
51		uint256 header;
52		FlatFilePos pos;
53
54	0	SERIALIZE_METHODS(DBVal, obj) { READWRITE(obj.hash, obj.header, obj.pos); } Unexecuted instantiation: blockfilterindex.cpp:_ZN12_GLOBAL__N_15DBVal16SerializationOpsI10DataStreamS0_17ActionUnserializeEEvRT0_RT_T1_ Unexecuted instantiation: blockfilterindex.cpp:_ZN12_GLOBAL__N_15DBVal16SerializationOpsI10DataStreamKS0_15ActionSerializeEEvRT0_RT_T1_
55		};
56
57		struct DBHeightKey {
58		int height;
59
60	0	explicit DBHeightKey(int height_in) : height(height_in) {}
61
62		template<typename Stream>
63		void Serialize(Stream& s) const
64	0	{
65	0	ser_writedata8(s, DB_BLOCK_HEIGHT);
66	0	ser_writedata32be(s, height);
67	0	}
68
69		template<typename Stream>
70		void Unserialize(Stream& s)
71	0	{
72	0	const uint8_t prefix{ser_readdata8(s)};
73	0	if (prefix != DB_BLOCK_HEIGHT) {
74	0	throw std::ios_base::failure("Invalid format for block filter index DB height key");
75	0	}
76	0	height = ser_readdata32be(s);
77	0	}
78		};
79
80		struct DBHashKey {
81		uint256 hash;
82
83	0	explicit DBHashKey(const uint256& hash_in) : hash(hash_in) {}
84
85	0	SERIALIZE_METHODS(DBHashKey, obj) {
86	0	uint8_t prefix{DB_BLOCK_HASH};
87	0	READWRITE(prefix);
88	0	if (prefix != DB_BLOCK_HASH) {
89	0	throw std::ios_base::failure("Invalid format for block filter index DB hash key");
90	0	}
91
92	0	READWRITE(obj.hash);
93	0	}
94		};
95
96		}; // namespace
97
98		static std::map<BlockFilterType, BlockFilterIndex> g_filter_indexes;
99
100		BlockFilterIndex::BlockFilterIndex(std::unique_ptr<interfaces::Chain> chain, BlockFilterType filter_type,
101		size_t n_cache_size, bool f_memory, bool f_wipe)
102	0	: BaseIndex(std::move(chain), BlockFilterTypeName(filter_type) + " block filter index")
103	0	, m_filter_type(filter_type)
104	0	{
105	0	const std::string& filter_name = BlockFilterTypeName(filter_type);
106	0	if (filter_name.empty()) throw std::invalid_argument("unknown filter_type");
107
108	0	fs::path path = gArgs.GetDataDirNet() / "indexes" / "blockfilter" / fs::u8path(filter_name);
109	0	fs::create_directories(path);
110
111	0	m_db = std::make_unique<BaseIndex::DB>(path / "db", n_cache_size, f_memory, f_wipe);
112	0	m_filter_fileseq = std::make_unique<FlatFileSeq>(std::move(path), "fltr", FLTR_FILE_CHUNK_SIZE);
113	0	}
114
115		bool BlockFilterIndex::CustomInit(const std::optional<interfaces::BlockRef>& block)
116	0	{
117	0	if (!m_db->Read(DB_FILTER_POS, m_next_filter_pos)) {
118		// Check that the cause of the read failure is that the key does not exist. Any other errors
119		// indicate database corruption or a disk failure, and starting the index would cause
120		// further corruption.
121	0	if (m_db->Exists(DB_FILTER_POS)) {
122	0	LogError("%s: Cannot read current %s state; index may be corrupted\n",
123	0	__func__, GetName());
124	0	return false;
125	0	}
126
127		// If the DB_FILTER_POS is not set, then initialize to the first location.
128	0	m_next_filter_pos.nFile = 0;
129	0	m_next_filter_pos.nPos = 0;
130	0	}
131
132	0	if (block) {
133	0	auto op_last_header = ReadFilterHeader(block->height, block->hash);
134	0	if (!op_last_header) {
135	0	LogError("Cannot read last block filter header; index may be corrupted\n");
136	0	return false;
137	0	}
138	0	m_last_header = *op_last_header;
139	0	}
140
141	0	return true;
142	0	}
143
144		bool BlockFilterIndex::CustomCommit(CDBBatch& batch)
145	0	{
146	0	const FlatFilePos& pos = m_next_filter_pos;
147
148		// Flush current filter file to disk.
149	0	AutoFile file{m_filter_fileseq->Open(pos)};
150	0	if (file.IsNull()) {
151	0	LogError("%s: Failed to open filter file %d\n", __func__, pos.nFile);
152	0	return false;
153	0	}
154	0	if (!file.Commit()) {
155	0	LogError("%s: Failed to commit filter file %d\n", __func__, pos.nFile);
156	0	return false;
157	0	}
158
159	0	batch.Write(DB_FILTER_POS, pos);
160	0	return true;
161	0	}
162
163		bool BlockFilterIndex::ReadFilterFromDisk(const FlatFilePos& pos, const uint256& hash, BlockFilter& filter) const
164	0	{
165	0	AutoFile filein{m_filter_fileseq->Open(pos, true)};
166	0	if (filein.IsNull()) {
167	0	return false;
168	0	}
169
170		// Check that the hash of the encoded_filter matches the one stored in the db.
171	0	uint256 block_hash;
172	0	std::vector<uint8_t> encoded_filter;
173	0	try {
174	0	filein >> block_hash >> encoded_filter;
175	0	if (Hash(encoded_filter) != hash) {
176	0	LogError("Checksum mismatch in filter decode.\n");
177	0	return false;
178	0	}
179	0	filter = BlockFilter(GetFilterType(), block_hash, std::move(encoded_filter), /skip_decode_check=/true);
180	0	}
181	0	catch (const std::exception& e) {
182	0	LogError("%s: Failed to deserialize block filter from disk: %s\n", __func__, e.what());
183	0	return false;
184	0	}
185
186	0	return true;
187	0	}
188
189		size_t BlockFilterIndex::WriteFilterToDisk(FlatFilePos& pos, const BlockFilter& filter)
190	0	{
191	0	assert(filter.GetFilterType() == GetFilterType());
192
193	0	size_t data_size =
194	0	GetSerializeSize(filter.GetBlockHash()) +
195	0	GetSerializeSize(filter.GetEncodedFilter());
196
197		// If writing the filter would overflow the file, flush and move to the next one.
198	0	if (pos.nPos + data_size > MAX_FLTR_FILE_SIZE) {
199	0	AutoFile last_file{m_filter_fileseq->Open(pos)};
200	0	if (last_file.IsNull()) {
201	0	LogPrintf("%s: Failed to open filter file %d\n", __func__, pos.nFile);
202	0	return 0;
203	0	}
204	0	if (!last_file.Truncate(pos.nPos)) {
205	0	LogPrintf("%s: Failed to truncate filter file %d\n", __func__, pos.nFile);
206	0	return 0;
207	0	}
208	0	if (!last_file.Commit()) {
209	0	LogPrintf("%s: Failed to commit filter file %d\n", __func__, pos.nFile);
210	0	return 0;
211	0	}
212
213	0	pos.nFile++;
214	0	pos.nPos = 0;
215	0	}
216
217		// Pre-allocate sufficient space for filter data.
218	0	bool out_of_space;
219	0	m_filter_fileseq->Allocate(pos, data_size, out_of_space);
220	0	if (out_of_space) {
221	0	LogPrintf("%s: out of disk space\n", __func__);
222	0	return 0;
223	0	}
224
225	0	AutoFile fileout{m_filter_fileseq->Open(pos)};
226	0	if (fileout.IsNull()) {
227	0	LogPrintf("%s: Failed to open filter file %d\n", __func__, pos.nFile);
228	0	return 0;
229	0	}
230
231	0	fileout << filter.GetBlockHash() << filter.GetEncodedFilter();
232	0	return data_size;
233	0	}
234
235		std::optional<uint256> BlockFilterIndex::ReadFilterHeader(int height, const uint256& expected_block_hash)
236	0	{
237	0	std::pair<uint256, DBVal> read_out;
238	0	if (!m_db->Read(DBHeightKey(height), read_out)) {
239	0	return std::nullopt;
240	0	}
241
242	0	if (read_out.first != expected_block_hash) {
243	0	LogError("%s: previous block header belongs to unexpected block %s; expected %s\n",
244	0	__func__, read_out.first.ToString(), expected_block_hash.ToString());
245	0	return std::nullopt;
246	0	}
247
248	0	return read_out.second.header;
249	0	}
250
251		bool BlockFilterIndex::CustomAppend(const interfaces::BlockInfo& block)
252	0	{
253	0	CBlockUndo block_undo;
254
255	0	if (block.height > 0) {
256		// pindex variable gives indexing code access to node internals. It
257		// will be removed in upcoming commit
258	0	const CBlockIndex* pindex = WITH_LOCK(cs_main, return m_chainstate->m_blockman.LookupBlockIndex(block.hash));
259	0	if (!m_chainstate->m_blockman.UndoReadFromDisk(block_undo, *pindex)) {
260	0	return false;
261	0	}
262	0	}
263
264	0	BlockFilter filter(m_filter_type, *Assert(block.data), block_undo);
265
266	0	const uint256& header = filter.ComputeHeader(m_last_header);
267	0	bool res = Write(filter, block.height, header);
268	0	if (res) m_last_header = header; // update last header
269	0	return res;
270	0	}
271
272		bool BlockFilterIndex::Write(const BlockFilter& filter, uint32_t block_height, const uint256& filter_header)
273	0	{
274	0	size_t bytes_written = WriteFilterToDisk(m_next_filter_pos, filter);
275	0	if (bytes_written == 0) return false;
276
277	0	std::pair<uint256, DBVal> value;
278	0	value.first = filter.GetBlockHash();
279	0	value.second.hash = filter.GetHash();
280	0	value.second.header = filter_header;
281	0	value.second.pos = m_next_filter_pos;
282
283	0	if (!m_db->Write(DBHeightKey(block_height), value)) {
284	0	return false;
285	0	}
286
287	0	m_next_filter_pos.nPos += bytes_written;
288	0	return true;
289	0	}
290
291		[[nodiscard]] static bool CopyHeightIndexToHashIndex(CDBIterator& db_it, CDBBatch& batch,
292		const std::string& index_name,
293		int start_height, int stop_height)
294	0	{
295	0	DBHeightKey key(start_height);
296	0	db_it.Seek(key);
297
298	0	for (int height = start_height; height <= stop_height; ++height) {
299	0	if (!db_it.GetKey(key) \|\| key.height != height) {
300	0	LogError("%s: unexpected key in %s: expected (%c, %d)\n",
301	0	__func__, index_name, DB_BLOCK_HEIGHT, height);
302	0	return false;
303	0	}
304
305	0	std::pair<uint256, DBVal> value;
306	0	if (!db_it.GetValue(value)) {
307	0	LogError("%s: unable to read value in %s at key (%c, %d)\n",
308	0	__func__, index_name, DB_BLOCK_HEIGHT, height);
309	0	return false;
310	0	}
311
312	0	batch.Write(DBHashKey(value.first), std::move(value.second));
313
314	0	db_it.Next();
315	0	}
316	0	return true;
317	0	}
318
319		bool BlockFilterIndex::CustomRewind(const interfaces::BlockRef& current_tip, const interfaces::BlockRef& new_tip)
320	0	{
321	0	CDBBatch batch(*m_db);
322	0	std::unique_ptr<CDBIterator> db_it(m_db->NewIterator());
323
324		// During a reorg, we need to copy all filters for blocks that are getting disconnected from the
325		// height index to the hash index so we can still find them when the height index entries are
326		// overwritten.
327	0	if (!CopyHeightIndexToHashIndex(*db_it, batch, m_name, new_tip.height, current_tip.height)) {
328	0	return false;
329	0	}
330
331		// The latest filter position gets written in Commit by the call to the BaseIndex::Rewind.
332		// But since this creates new references to the filter, the position should get updated here
333		// atomically as well in case Commit fails.
334	0	batch.Write(DB_FILTER_POS, m_next_filter_pos);
335	0	if (!m_db->WriteBatch(batch)) return false;
336
337		// Update cached header
338	0	m_last_header = *Assert(ReadFilterHeader(new_tip.height, new_tip.hash));
339	0	return true;
340	0	}
341
342		static bool LookupOne(const CDBWrapper& db, const CBlockIndex* block_index, DBVal& result)
343	0	{
344		// First check if the result is stored under the height index and the value there matches the
345		// block hash. This should be the case if the block is on the active chain.
346	0	std::pair<uint256, DBVal> read_out;
347	0	if (!db.Read(DBHeightKey(block_index->nHeight), read_out)) {
348	0	return false;
349	0	}
350	0	if (read_out.first == block_index->GetBlockHash()) {
351	0	result = std::move(read_out.second);
352	0	return true;
353	0	}
354
355		// If value at the height index corresponds to an different block, the result will be stored in
356		// the hash index.
357	0	return db.Read(DBHashKey(block_index->GetBlockHash()), result);
358	0	}
359
360		static bool LookupRange(CDBWrapper& db, const std::string& index_name, int start_height,
361		const CBlockIndex* stop_index, std::vector<DBVal>& results)
362	0	{
363	0	if (start_height < 0) {
364	0	LogError("%s: start height (%d) is negative\n", __func__, start_height);
365	0	return false;
366	0	}
367	0	if (start_height > stop_index->nHeight) {
368	0	LogError("%s: start height (%d) is greater than stop height (%d)\n",
369	0	__func__, start_height, stop_index->nHeight);
370	0	return false;
371	0	}
372
373	0	size_t results_size = static_cast<size_t>(stop_index->nHeight - start_height + 1);
374	0	std::vector<std::pair<uint256, DBVal>> values(results_size);
375
376	0	DBHeightKey key(start_height);
377	0	std::unique_ptr<CDBIterator> db_it(db.NewIterator());
378	0	db_it->Seek(DBHeightKey(start_height));
379	0	for (int height = start_height; height <= stop_index->nHeight; ++height) {
380	0	if (!db_it->Valid() \|\| !db_it->GetKey(key) \|\| key.height != height) {
381	0	return false;
382	0	}
383
384	0	size_t i = static_cast<size_t>(height - start_height);
385	0	if (!db_it->GetValue(values[i])) {
386	0	LogError("%s: unable to read value in %s at key (%c, %d)\n",
387	0	__func__, index_name, DB_BLOCK_HEIGHT, height);
388	0	return false;
389	0	}
390
391	0	db_it->Next();
392	0	}
393
394	0	results.resize(results_size);
395
396		// Iterate backwards through block indexes collecting results in order to access the block hash
397		// of each entry in case we need to look it up in the hash index.
398	0	for (const CBlockIndex* block_index = stop_index;
399	0	block_index && block_index->nHeight >= start_height;
400	0	block_index = block_index->pprev) {
401	0	uint256 block_hash = block_index->GetBlockHash();
402
403	0	size_t i = static_cast<size_t>(block_index->nHeight - start_height);
404	0	if (block_hash == values[i].first) {
405	0	results[i] = std::move(values[i].second);
406	0	continue;
407	0	}
408
409	0	if (!db.Read(DBHashKey(block_hash), results[i])) {
410	0	LogError("%s: unable to read value in %s at key (%c, %s)\n",
411	0	__func__, index_name, DB_BLOCK_HASH, block_hash.ToString());
412	0	return false;
413	0	}
414	0	}
415
416	0	return true;
417	0	}
418
419		bool BlockFilterIndex::LookupFilter(const CBlockIndex* block_index, BlockFilter& filter_out) const
420	0	{
421	0	DBVal entry;
422	0	if (!LookupOne(*m_db, block_index, entry)) {
423	0	return false;
424	0	}
425
426	0	return ReadFilterFromDisk(entry.pos, entry.hash, filter_out);
427	0	}
428
429		bool BlockFilterIndex::LookupFilterHeader(const CBlockIndex* block_index, uint256& header_out)
430	0	{
431	0	LOCK(m_cs_headers_cache);
432
433	0	bool is_checkpoint{block_index->nHeight % CFCHECKPT_INTERVAL == 0};
434
435	0	if (is_checkpoint) {
436		// Try to find the block in the headers cache if this is a checkpoint height.
437	0	auto header = m_headers_cache.find(block_index->GetBlockHash());
438	0	if (header != m_headers_cache.end()) {
439	0	header_out = header->second;
440	0	return true;
441	0	}
442	0	}
443
444	0	DBVal entry;
445	0	if (!LookupOne(*m_db, block_index, entry)) {
446	0	return false;
447	0	}
448
449	0	if (is_checkpoint &&
450	0	m_headers_cache.size() < CF_HEADERS_CACHE_MAX_SZ) {
451		// Add to the headers cache if this is a checkpoint height.
452	0	m_headers_cache.emplace(block_index->GetBlockHash(), entry.header);
453	0	}
454
455	0	header_out = entry.header;
456	0	return true;
457	0	}
458
459		bool BlockFilterIndex::LookupFilterRange(int start_height, const CBlockIndex* stop_index,
460		std::vector<BlockFilter>& filters_out) const
461	0	{
462	0	std::vector<DBVal> entries;
463	0	if (!LookupRange(*m_db, m_name, start_height, stop_index, entries)) {
464	0	return false;
465	0	}
466
467	0	filters_out.resize(entries.size());
468	0	auto filter_pos_it = filters_out.begin();
469	0	for (const auto& entry : entries) {
470	0	if (!ReadFilterFromDisk(entry.pos, entry.hash, *filter_pos_it)) {
471	0	return false;
472	0	}
473	0	++filter_pos_it;
474	0	}
475
476	0	return true;
477	0	}
478
479		bool BlockFilterIndex::LookupFilterHashRange(int start_height, const CBlockIndex* stop_index,
480		std::vector<uint256>& hashes_out) const
481
482	0	{
483	0	std::vector<DBVal> entries;
484	0	if (!LookupRange(*m_db, m_name, start_height, stop_index, entries)) {
485	0	return false;
486	0	}
487
488	0	hashes_out.clear();
489	0	hashes_out.reserve(entries.size());
490	0	for (const auto& entry : entries) {
491	0	hashes_out.push_back(entry.hash);
492	0	}
493	0	return true;
494	0	}
495
496		BlockFilterIndex* GetBlockFilterIndex(BlockFilterType filter_type)
497	0	{
498	0	auto it = g_filter_indexes.find(filter_type);
499	0	return it != g_filter_indexes.end() ? &it->second : nullptr;
500	0	}
501
502		void ForEachBlockFilterIndex(std::function<void (BlockFilterIndex&)> fn)
503	0	{
504	0	for (auto& entry : g_filter_indexes) fn(entry.second);
505	0	}
506
507		bool InitBlockFilterIndex(std::function<std::unique_ptr<interfaces::Chain>()> make_chain, BlockFilterType filter_type,
508		size_t n_cache_size, bool f_memory, bool f_wipe)
509	0	{
510	0	auto result = g_filter_indexes.emplace(std::piecewise_construct,
511	0	std::forward_as_tuple(filter_type),
512	0	std::forward_as_tuple(make_chain(), filter_type,
513	0	n_cache_size, f_memory, f_wipe));
514	0	return result.second;
515	0	}
516
517		bool DestroyBlockFilterIndex(BlockFilterType filter_type)
518	0	{
519	0	return g_filter_indexes.erase(filter_type);
520	0	}
521
522		void DestroyAllBlockFilterIndexes()
523	0	{
524	0	g_filter_indexes.clear();
525	0	}