/root/bitcoin/src/dbwrapper.cpp
Line | Count | Source (jump to first uncovered line) |
1 | | // Copyright (c) 2012-2022 The Bitcoin Core developers |
2 | | // Distributed under the MIT software license, see the accompanying |
3 | | // file COPYING or http://www.opensource.org/licenses/mit-license.php. |
4 | | |
5 | | #include <dbwrapper.h> |
6 | | |
7 | | #include <logging.h> |
8 | | #include <random.h> |
9 | | #include <serialize.h> |
10 | | #include <span.h> |
11 | | #include <streams.h> |
12 | | #include <util/fs.h> |
13 | | #include <util/fs_helpers.h> |
14 | | #include <util/strencodings.h> |
15 | | |
16 | | #include <algorithm> |
17 | | #include <cassert> |
18 | | #include <cstdarg> |
19 | | #include <cstdint> |
20 | | #include <cstdio> |
21 | | #include <leveldb/cache.h> |
22 | | #include <leveldb/db.h> |
23 | | #include <leveldb/env.h> |
24 | | #include <leveldb/filter_policy.h> |
25 | | #include <leveldb/helpers/memenv/memenv.h> |
26 | | #include <leveldb/iterator.h> |
27 | | #include <leveldb/options.h> |
28 | | #include <leveldb/slice.h> |
29 | | #include <leveldb/status.h> |
30 | | #include <leveldb/write_batch.h> |
31 | | #include <memory> |
32 | | #include <optional> |
33 | | #include <utility> |
34 | | |
35 | 0 | static auto CharCast(const std::byte* data) { return reinterpret_cast<const char*>(data); } |
36 | | |
37 | | bool DestroyDB(const std::string& path_str) |
38 | 0 | { |
39 | 0 | return leveldb::DestroyDB(path_str, {}).ok(); |
40 | 0 | } |
41 | | |
42 | | /** Handle database error by throwing dbwrapper_error exception. |
43 | | */ |
44 | | static void HandleError(const leveldb::Status& status) |
45 | 0 | { |
46 | 0 | if (status.ok()) |
47 | 0 | return; |
48 | 0 | const std::string errmsg = "Fatal LevelDB error: " + status.ToString(); |
49 | 0 | LogPrintf("%s\n", errmsg); |
50 | 0 | LogPrintf("You can use -debug=leveldb to get more complete diagnostic messages\n"); |
51 | 0 | throw dbwrapper_error(errmsg); |
52 | 0 | } |
53 | | |
54 | | class CBitcoinLevelDBLogger : public leveldb::Logger { |
55 | | public: |
56 | | // This code is adapted from posix_logger.h, which is why it is using vsprintf. |
57 | | // Please do not do this in normal code |
58 | 0 | void Logv(const char * format, va_list ap) override { |
59 | 0 | if (!LogAcceptCategory(BCLog::LEVELDB, BCLog::Level::Debug)) { |
60 | 0 | return; |
61 | 0 | } |
62 | 0 | char buffer[500]; |
63 | 0 | for (int iter = 0; iter < 2; iter++) { |
64 | 0 | char* base; |
65 | 0 | int bufsize; |
66 | 0 | if (iter == 0) { |
67 | 0 | bufsize = sizeof(buffer); |
68 | 0 | base = buffer; |
69 | 0 | } |
70 | 0 | else { |
71 | 0 | bufsize = 30000; |
72 | 0 | base = new char[bufsize]; |
73 | 0 | } |
74 | 0 | char* p = base; |
75 | 0 | char* limit = base + bufsize; |
76 | | |
77 | | // Print the message |
78 | 0 | if (p < limit) { |
79 | 0 | va_list backup_ap; |
80 | 0 | va_copy(backup_ap, ap); |
81 | | // Do not use vsnprintf elsewhere in bitcoin source code, see above. |
82 | 0 | p += vsnprintf(p, limit - p, format, backup_ap); |
83 | 0 | va_end(backup_ap); |
84 | 0 | } |
85 | | |
86 | | // Truncate to available space if necessary |
87 | 0 | if (p >= limit) { |
88 | 0 | if (iter == 0) { |
89 | 0 | continue; // Try again with larger buffer |
90 | 0 | } |
91 | 0 | else { |
92 | 0 | p = limit - 1; |
93 | 0 | } |
94 | 0 | } |
95 | | |
96 | | // Add newline if necessary |
97 | 0 | if (p == base || p[-1] != '\n') { |
98 | 0 | *p++ = '\n'; |
99 | 0 | } |
100 | |
|
101 | 0 | assert(p <= limit); |
102 | 0 | base[std::min(bufsize - 1, (int)(p - base))] = '\0'; |
103 | 0 | LogDebug(BCLog::LEVELDB, "%s\n", util::RemoveSuffixView(base, "\n")); |
104 | 0 | if (base != buffer) { |
105 | 0 | delete[] base; |
106 | 0 | } |
107 | 0 | break; |
108 | 0 | } |
109 | 0 | } |
110 | | }; |
111 | | |
112 | 0 | static void SetMaxOpenFiles(leveldb::Options *options) { |
113 | | // On most platforms the default setting of max_open_files (which is 1000) |
114 | | // is optimal. On Windows using a large file count is OK because the handles |
115 | | // do not interfere with select() loops. On 64-bit Unix hosts this value is |
116 | | // also OK, because up to that amount LevelDB will use an mmap |
117 | | // implementation that does not use extra file descriptors (the fds are |
118 | | // closed after being mmap'ed). |
119 | | // |
120 | | // Increasing the value beyond the default is dangerous because LevelDB will |
121 | | // fall back to a non-mmap implementation when the file count is too large. |
122 | | // On 32-bit Unix host we should decrease the value because the handles use |
123 | | // up real fds, and we want to avoid fd exhaustion issues. |
124 | | // |
125 | | // See PR #12495 for further discussion. |
126 | |
|
127 | 0 | int default_open_files = options->max_open_files; |
128 | 0 | #ifndef WIN32 |
129 | 0 | if (sizeof(void*) < 8) { |
130 | 0 | options->max_open_files = 64; |
131 | 0 | } |
132 | 0 | #endif |
133 | 0 | LogDebug(BCLog::LEVELDB, "LevelDB using max_open_files=%d (default=%d)\n", |
134 | 0 | options->max_open_files, default_open_files); |
135 | 0 | } |
136 | | |
137 | | static leveldb::Options GetOptions(size_t nCacheSize) |
138 | 0 | { |
139 | 0 | leveldb::Options options; |
140 | 0 | options.block_cache = leveldb::NewLRUCache(nCacheSize / 2); |
141 | 0 | options.write_buffer_size = nCacheSize / 4; // up to two write buffers may be held in memory simultaneously |
142 | 0 | options.filter_policy = leveldb::NewBloomFilterPolicy(10); |
143 | 0 | options.compression = leveldb::kNoCompression; |
144 | 0 | options.info_log = new CBitcoinLevelDBLogger(); |
145 | 0 | if (leveldb::kMajorVersion > 1 || (leveldb::kMajorVersion == 1 && leveldb::kMinorVersion >= 16)) { |
146 | | // LevelDB versions before 1.16 consider short writes to be corruption. Only trigger error |
147 | | // on corruption in later versions. |
148 | 0 | options.paranoid_checks = true; |
149 | 0 | } |
150 | 0 | SetMaxOpenFiles(&options); |
151 | 0 | return options; |
152 | 0 | } |
153 | | |
154 | | struct CDBBatch::WriteBatchImpl { |
155 | | leveldb::WriteBatch batch; |
156 | | }; |
157 | | |
158 | | CDBBatch::CDBBatch(const CDBWrapper& _parent) |
159 | 0 | : parent{_parent}, |
160 | 0 | m_impl_batch{std::make_unique<CDBBatch::WriteBatchImpl>()} {}; |
161 | | |
162 | 0 | CDBBatch::~CDBBatch() = default; |
163 | | |
164 | | void CDBBatch::Clear() |
165 | 0 | { |
166 | 0 | m_impl_batch->batch.Clear(); |
167 | 0 | size_estimate = 0; |
168 | 0 | } |
169 | | |
170 | | void CDBBatch::WriteImpl(Span<const std::byte> key, DataStream& ssValue) |
171 | 0 | { |
172 | 0 | leveldb::Slice slKey(CharCast(key.data()), key.size()); |
173 | 0 | ssValue.Xor(dbwrapper_private::GetObfuscateKey(parent)); |
174 | 0 | leveldb::Slice slValue(CharCast(ssValue.data()), ssValue.size()); |
175 | 0 | m_impl_batch->batch.Put(slKey, slValue); |
176 | | // LevelDB serializes writes as: |
177 | | // - byte: header |
178 | | // - varint: key length (1 byte up to 127B, 2 bytes up to 16383B, ...) |
179 | | // - byte[]: key |
180 | | // - varint: value length |
181 | | // - byte[]: value |
182 | | // The formula below assumes the key and value are both less than 16k. |
183 | 0 | size_estimate += 3 + (slKey.size() > 127) + slKey.size() + (slValue.size() > 127) + slValue.size(); |
184 | 0 | } |
185 | | |
186 | | void CDBBatch::EraseImpl(Span<const std::byte> key) |
187 | 0 | { |
188 | 0 | leveldb::Slice slKey(CharCast(key.data()), key.size()); |
189 | 0 | m_impl_batch->batch.Delete(slKey); |
190 | | // LevelDB serializes erases as: |
191 | | // - byte: header |
192 | | // - varint: key length |
193 | | // - byte[]: key |
194 | | // The formula below assumes the key is less than 16kB. |
195 | 0 | size_estimate += 2 + (slKey.size() > 127) + slKey.size(); |
196 | 0 | } |
197 | | |
198 | | struct LevelDBContext { |
199 | | //! custom environment this database is using (may be nullptr in case of default environment) |
200 | | leveldb::Env* penv; |
201 | | |
202 | | //! database options used |
203 | | leveldb::Options options; |
204 | | |
205 | | //! options used when reading from the database |
206 | | leveldb::ReadOptions readoptions; |
207 | | |
208 | | //! options used when iterating over values of the database |
209 | | leveldb::ReadOptions iteroptions; |
210 | | |
211 | | //! options used when writing to the database |
212 | | leveldb::WriteOptions writeoptions; |
213 | | |
214 | | //! options used when sync writing to the database |
215 | | leveldb::WriteOptions syncoptions; |
216 | | |
217 | | //! the database itself |
218 | | leveldb::DB* pdb; |
219 | | }; |
220 | | |
221 | | CDBWrapper::CDBWrapper(const DBParams& params) |
222 | 0 | : m_db_context{std::make_unique<LevelDBContext>()}, m_name{fs::PathToString(params.path.stem())}, m_path{params.path}, m_is_memory{params.memory_only} |
223 | 0 | { |
224 | 0 | DBContext().penv = nullptr; |
225 | 0 | DBContext().readoptions.verify_checksums = true; |
226 | 0 | DBContext().iteroptions.verify_checksums = true; |
227 | 0 | DBContext().iteroptions.fill_cache = false; |
228 | 0 | DBContext().syncoptions.sync = true; |
229 | 0 | DBContext().options = GetOptions(params.cache_bytes); |
230 | 0 | DBContext().options.create_if_missing = true; |
231 | 0 | if (params.memory_only) { |
232 | 0 | DBContext().penv = leveldb::NewMemEnv(leveldb::Env::Default()); |
233 | 0 | DBContext().options.env = DBContext().penv; |
234 | 0 | } else { |
235 | 0 | if (params.wipe_data) { |
236 | 0 | LogPrintf("Wiping LevelDB in %s\n", fs::PathToString(params.path)); |
237 | 0 | leveldb::Status result = leveldb::DestroyDB(fs::PathToString(params.path), DBContext().options); |
238 | 0 | HandleError(result); |
239 | 0 | } |
240 | 0 | TryCreateDirectories(params.path); |
241 | 0 | LogPrintf("Opening LevelDB in %s\n", fs::PathToString(params.path)); |
242 | 0 | } |
243 | | // PathToString() return value is safe to pass to leveldb open function, |
244 | | // because on POSIX leveldb passes the byte string directly to ::open(), and |
245 | | // on Windows it converts from UTF-8 to UTF-16 before calling ::CreateFileW |
246 | | // (see env_posix.cc and env_windows.cc). |
247 | 0 | leveldb::Status status = leveldb::DB::Open(DBContext().options, fs::PathToString(params.path), &DBContext().pdb); |
248 | 0 | HandleError(status); |
249 | 0 | LogPrintf("Opened LevelDB successfully\n"); |
250 | |
|
251 | 0 | if (params.options.force_compact) { |
252 | 0 | LogPrintf("Starting database compaction of %s\n", fs::PathToString(params.path)); |
253 | 0 | DBContext().pdb->CompactRange(nullptr, nullptr); |
254 | 0 | LogPrintf("Finished database compaction of %s\n", fs::PathToString(params.path)); |
255 | 0 | } |
256 | | |
257 | | // The base-case obfuscation key, which is a noop. |
258 | 0 | obfuscate_key = std::vector<unsigned char>(OBFUSCATE_KEY_NUM_BYTES, '\000'); |
259 | |
|
260 | 0 | bool key_exists = Read(OBFUSCATE_KEY_KEY, obfuscate_key); |
261 | |
|
262 | 0 | if (!key_exists && params.obfuscate && IsEmpty()) { |
263 | | // Initialize non-degenerate obfuscation if it won't upset |
264 | | // existing, non-obfuscated data. |
265 | 0 | std::vector<unsigned char> new_key = CreateObfuscateKey(); |
266 | | |
267 | | // Write `new_key` so we don't obfuscate the key with itself |
268 | 0 | Write(OBFUSCATE_KEY_KEY, new_key); |
269 | 0 | obfuscate_key = new_key; |
270 | |
|
271 | 0 | LogPrintf("Wrote new obfuscate key for %s: %s\n", fs::PathToString(params.path), HexStr(obfuscate_key)); |
272 | 0 | } |
273 | |
|
274 | 0 | LogPrintf("Using obfuscation key for %s: %s\n", fs::PathToString(params.path), HexStr(obfuscate_key)); |
275 | 0 | } |
276 | | |
277 | | CDBWrapper::~CDBWrapper() |
278 | 0 | { |
279 | 0 | delete DBContext().pdb; |
280 | 0 | DBContext().pdb = nullptr; |
281 | 0 | delete DBContext().options.filter_policy; |
282 | 0 | DBContext().options.filter_policy = nullptr; |
283 | 0 | delete DBContext().options.info_log; |
284 | 0 | DBContext().options.info_log = nullptr; |
285 | 0 | delete DBContext().options.block_cache; |
286 | 0 | DBContext().options.block_cache = nullptr; |
287 | 0 | delete DBContext().penv; |
288 | 0 | DBContext().options.env = nullptr; |
289 | 0 | } |
290 | | |
291 | | bool CDBWrapper::WriteBatch(CDBBatch& batch, bool fSync) |
292 | 0 | { |
293 | 0 | const bool log_memory = LogAcceptCategory(BCLog::LEVELDB, BCLog::Level::Debug); |
294 | 0 | double mem_before = 0; |
295 | 0 | if (log_memory) { |
296 | 0 | mem_before = DynamicMemoryUsage() / 1024.0 / 1024; |
297 | 0 | } |
298 | 0 | leveldb::Status status = DBContext().pdb->Write(fSync ? DBContext().syncoptions : DBContext().writeoptions, &batch.m_impl_batch->batch); |
299 | 0 | HandleError(status); |
300 | 0 | if (log_memory) { |
301 | 0 | double mem_after = DynamicMemoryUsage() / 1024.0 / 1024; |
302 | 0 | LogDebug(BCLog::LEVELDB, "WriteBatch memory usage: db=%s, before=%.1fMiB, after=%.1fMiB\n", |
303 | 0 | m_name, mem_before, mem_after); |
304 | 0 | } |
305 | 0 | return true; |
306 | 0 | } |
307 | | |
308 | | size_t CDBWrapper::DynamicMemoryUsage() const |
309 | 0 | { |
310 | 0 | std::string memory; |
311 | 0 | std::optional<size_t> parsed; |
312 | 0 | if (!DBContext().pdb->GetProperty("leveldb.approximate-memory-usage", &memory) || !(parsed = ToIntegral<size_t>(memory))) { |
313 | 0 | LogDebug(BCLog::LEVELDB, "Failed to get approximate-memory-usage property\n"); |
314 | 0 | return 0; |
315 | 0 | } |
316 | 0 | return parsed.value(); |
317 | 0 | } |
318 | | |
319 | | // Prefixed with null character to avoid collisions with other keys |
320 | | // |
321 | | // We must use a string constructor which specifies length so that we copy |
322 | | // past the null-terminator. |
323 | | const std::string CDBWrapper::OBFUSCATE_KEY_KEY("\000obfuscate_key", 14); |
324 | | |
325 | | const unsigned int CDBWrapper::OBFUSCATE_KEY_NUM_BYTES = 8; |
326 | | |
327 | | /** |
328 | | * Returns a string (consisting of 8 random bytes) suitable for use as an |
329 | | * obfuscating XOR key. |
330 | | */ |
331 | | std::vector<unsigned char> CDBWrapper::CreateObfuscateKey() const |
332 | 0 | { |
333 | 0 | std::vector<uint8_t> ret(OBFUSCATE_KEY_NUM_BYTES); |
334 | 0 | GetRandBytes(ret); |
335 | 0 | return ret; |
336 | 0 | } |
337 | | |
338 | | std::optional<std::string> CDBWrapper::ReadImpl(Span<const std::byte> key) const |
339 | 0 | { |
340 | 0 | leveldb::Slice slKey(CharCast(key.data()), key.size()); |
341 | 0 | std::string strValue; |
342 | 0 | leveldb::Status status = DBContext().pdb->Get(DBContext().readoptions, slKey, &strValue); |
343 | 0 | if (!status.ok()) { |
344 | 0 | if (status.IsNotFound()) |
345 | 0 | return std::nullopt; |
346 | 0 | LogPrintf("LevelDB read failure: %s\n", status.ToString()); |
347 | 0 | HandleError(status); |
348 | 0 | } |
349 | 0 | return strValue; |
350 | 0 | } |
351 | | |
352 | | bool CDBWrapper::ExistsImpl(Span<const std::byte> key) const |
353 | 0 | { |
354 | 0 | leveldb::Slice slKey(CharCast(key.data()), key.size()); |
355 | |
|
356 | 0 | std::string strValue; |
357 | 0 | leveldb::Status status = DBContext().pdb->Get(DBContext().readoptions, slKey, &strValue); |
358 | 0 | if (!status.ok()) { |
359 | 0 | if (status.IsNotFound()) |
360 | 0 | return false; |
361 | 0 | LogPrintf("LevelDB read failure: %s\n", status.ToString()); |
362 | 0 | HandleError(status); |
363 | 0 | } |
364 | 0 | return true; |
365 | 0 | } |
366 | | |
367 | | size_t CDBWrapper::EstimateSizeImpl(Span<const std::byte> key1, Span<const std::byte> key2) const |
368 | 0 | { |
369 | 0 | leveldb::Slice slKey1(CharCast(key1.data()), key1.size()); |
370 | 0 | leveldb::Slice slKey2(CharCast(key2.data()), key2.size()); |
371 | 0 | uint64_t size = 0; |
372 | 0 | leveldb::Range range(slKey1, slKey2); |
373 | 0 | DBContext().pdb->GetApproximateSizes(&range, 1, &size); |
374 | 0 | return size; |
375 | 0 | } |
376 | | |
377 | | bool CDBWrapper::IsEmpty() |
378 | 0 | { |
379 | 0 | std::unique_ptr<CDBIterator> it(NewIterator()); |
380 | 0 | it->SeekToFirst(); |
381 | 0 | return !(it->Valid()); |
382 | 0 | } |
383 | | |
384 | | struct CDBIterator::IteratorImpl { |
385 | | const std::unique_ptr<leveldb::Iterator> iter; |
386 | | |
387 | 0 | explicit IteratorImpl(leveldb::Iterator* _iter) : iter{_iter} {} |
388 | | }; |
389 | | |
390 | 0 | CDBIterator::CDBIterator(const CDBWrapper& _parent, std::unique_ptr<IteratorImpl> _piter) : parent(_parent), |
391 | 0 | m_impl_iter(std::move(_piter)) {} |
392 | | |
393 | | CDBIterator* CDBWrapper::NewIterator() |
394 | 0 | { |
395 | 0 | return new CDBIterator{*this, std::make_unique<CDBIterator::IteratorImpl>(DBContext().pdb->NewIterator(DBContext().iteroptions))}; |
396 | 0 | } |
397 | | |
398 | | void CDBIterator::SeekImpl(Span<const std::byte> key) |
399 | 0 | { |
400 | 0 | leveldb::Slice slKey(CharCast(key.data()), key.size()); |
401 | 0 | m_impl_iter->iter->Seek(slKey); |
402 | 0 | } |
403 | | |
404 | | Span<const std::byte> CDBIterator::GetKeyImpl() const |
405 | 0 | { |
406 | 0 | return MakeByteSpan(m_impl_iter->iter->key()); |
407 | 0 | } |
408 | | |
409 | | Span<const std::byte> CDBIterator::GetValueImpl() const |
410 | 0 | { |
411 | 0 | return MakeByteSpan(m_impl_iter->iter->value()); |
412 | 0 | } |
413 | | |
414 | 0 | CDBIterator::~CDBIterator() = default; |
415 | 0 | bool CDBIterator::Valid() const { return m_impl_iter->iter->Valid(); } |
416 | 0 | void CDBIterator::SeekToFirst() { m_impl_iter->iter->SeekToFirst(); } |
417 | 0 | void CDBIterator::Next() { m_impl_iter->iter->Next(); } |
418 | | |
419 | | namespace dbwrapper_private { |
420 | | |
421 | | const std::vector<unsigned char>& GetObfuscateKey(const CDBWrapper &w) |
422 | 0 | { |
423 | 0 | return w.obfuscate_key; |
424 | 0 | } |
425 | | |
426 | | } // namespace dbwrapper_private |