/root/bitcoin/src/leveldb/table/table.cc
| Line | Count | Source | 
| 1 |  | // Copyright (c) 2011 The LevelDB Authors. All rights reserved. | 
| 2 |  | // Use of this source code is governed by a BSD-style license that can be | 
| 3 |  | // found in the LICENSE file. See the AUTHORS file for names of contributors. | 
| 4 |  |  | 
| 5 |  | #include "leveldb/table.h" | 
| 6 |  |  | 
| 7 |  | #include "leveldb/cache.h" | 
| 8 |  | #include "leveldb/comparator.h" | 
| 9 |  | #include "leveldb/env.h" | 
| 10 |  | #include "leveldb/filter_policy.h" | 
| 11 |  | #include "leveldb/options.h" | 
| 12 |  | #include "table/block.h" | 
| 13 |  | #include "table/filter_block.h" | 
| 14 |  | #include "table/format.h" | 
| 15 |  | #include "table/two_level_iterator.h" | 
| 16 |  | #include "util/coding.h" | 
| 17 |  |  | 
| 18 |  | namespace leveldb { | 
| 19 |  |  | 
| 20 |  | struct Table::Rep { | 
| 21 | 0 |   ~Rep() { | 
| 22 | 0 |     delete filter; | 
| 23 | 0 |     delete[] filter_data; | 
| 24 | 0 |     delete index_block; | 
| 25 | 0 |   } | 
| 26 |  |  | 
| 27 |  |   Options options; | 
| 28 |  |   Status status; | 
| 29 |  |   RandomAccessFile* file; | 
| 30 |  |   uint64_t cache_id; | 
| 31 |  |   FilterBlockReader* filter; | 
| 32 |  |   const char* filter_data; | 
| 33 |  |  | 
| 34 |  |   BlockHandle metaindex_handle;  // Handle to metaindex_block: saved from footer | 
| 35 |  |   Block* index_block; | 
| 36 |  | }; | 
| 37 |  |  | 
| 38 |  | Status Table::Open(const Options& options, RandomAccessFile* file, | 
| 39 | 0 |                    uint64_t size, Table** table) { | 
| 40 | 0 |   *table = nullptr; | 
| 41 | 0 |   if (size < Footer::kEncodedLength) { | 
| 42 | 0 |     return Status::Corruption("file is too short to be an sstable"); | 
| 43 | 0 |   } | 
| 44 |  |  | 
| 45 | 0 |   char footer_space[Footer::kEncodedLength]; | 
| 46 | 0 |   Slice footer_input; | 
| 47 | 0 |   Status s = file->Read(size - Footer::kEncodedLength, Footer::kEncodedLength, | 
| 48 | 0 |                         &footer_input, footer_space); | 
| 49 | 0 |   if (!s.ok()) return s; | 
| 50 |  |  | 
| 51 | 0 |   Footer footer; | 
| 52 | 0 |   s = footer.DecodeFrom(&footer_input); | 
| 53 | 0 |   if (!s.ok()) return s; | 
| 54 |  |  | 
| 55 |  |   // Read the index block | 
| 56 | 0 |   BlockContents index_block_contents; | 
| 57 | 0 |   if (s.ok()) { | 
| 58 | 0 |     ReadOptions opt; | 
| 59 | 0 |     if (options.paranoid_checks) { | 
| 60 | 0 |       opt.verify_checksums = true; | 
| 61 | 0 |     } | 
| 62 | 0 |     s = ReadBlock(file, opt, footer.index_handle(), &index_block_contents); | 
| 63 | 0 |   } | 
| 64 |  | 
 | 
| 65 | 0 |   if (s.ok()) { | 
| 66 |  |     // We've successfully read the footer and the index block: we're | 
| 67 |  |     // ready to serve requests. | 
| 68 | 0 |     Block* index_block = new Block(index_block_contents); | 
| 69 | 0 |     Rep* rep = new Table::Rep; | 
| 70 | 0 |     rep->options = options; | 
| 71 | 0 |     rep->file = file; | 
| 72 | 0 |     rep->metaindex_handle = footer.metaindex_handle(); | 
| 73 | 0 |     rep->index_block = index_block; | 
| 74 | 0 |     rep->cache_id = (options.block_cache ? options.block_cache->NewId() : 0); | 
| 75 | 0 |     rep->filter_data = nullptr; | 
| 76 | 0 |     rep->filter = nullptr; | 
| 77 | 0 |     *table = new Table(rep); | 
| 78 | 0 |     (*table)->ReadMeta(footer); | 
| 79 | 0 |   } | 
| 80 |  | 
 | 
| 81 | 0 |   return s; | 
| 82 | 0 | } | 
| 83 |  |  | 
| 84 | 0 | void Table::ReadMeta(const Footer& footer) { | 
| 85 | 0 |   if (rep_->options.filter_policy == nullptr) { | 
| 86 | 0 |     return;  // Do not need any metadata | 
| 87 | 0 |   } | 
| 88 |  |  | 
| 89 |  |   // TODO(sanjay): Skip this if footer.metaindex_handle() size indicates | 
| 90 |  |   // it is an empty block. | 
| 91 | 0 |   ReadOptions opt; | 
| 92 | 0 |   if (rep_->options.paranoid_checks) { | 
| 93 | 0 |     opt.verify_checksums = true; | 
| 94 | 0 |   } | 
| 95 | 0 |   BlockContents contents; | 
| 96 | 0 |   if (!ReadBlock(rep_->file, opt, footer.metaindex_handle(), &contents).ok()) { | 
| 97 |  |     // Do not propagate errors since meta info is not needed for operation | 
| 98 | 0 |     return; | 
| 99 | 0 |   } | 
| 100 | 0 |   Block* meta = new Block(contents); | 
| 101 |  | 
 | 
| 102 | 0 |   Iterator* iter = meta->NewIterator(BytewiseComparator()); | 
| 103 | 0 |   std::string key = "filter."; | 
| 104 | 0 |   key.append(rep_->options.filter_policy->Name()); | 
| 105 | 0 |   iter->Seek(key); | 
| 106 | 0 |   if (iter->Valid() && iter->key() == Slice(key)) { | 
| 107 | 0 |     ReadFilter(iter->value()); | 
| 108 | 0 |   } | 
| 109 | 0 |   delete iter; | 
| 110 | 0 |   delete meta; | 
| 111 | 0 | } | 
| 112 |  |  | 
| 113 | 0 | void Table::ReadFilter(const Slice& filter_handle_value) { | 
| 114 | 0 |   Slice v = filter_handle_value; | 
| 115 | 0 |   BlockHandle filter_handle; | 
| 116 | 0 |   if (!filter_handle.DecodeFrom(&v).ok()) { | 
| 117 | 0 |     return; | 
| 118 | 0 |   } | 
| 119 |  |  | 
| 120 |  |   // We might want to unify with ReadBlock() if we start | 
| 121 |  |   // requiring checksum verification in Table::Open. | 
| 122 | 0 |   ReadOptions opt; | 
| 123 | 0 |   if (rep_->options.paranoid_checks) { | 
| 124 | 0 |     opt.verify_checksums = true; | 
| 125 | 0 |   } | 
| 126 | 0 |   BlockContents block; | 
| 127 | 0 |   if (!ReadBlock(rep_->file, opt, filter_handle, &block).ok()) { | 
| 128 | 0 |     return; | 
| 129 | 0 |   } | 
| 130 | 0 |   if (block.heap_allocated) { | 
| 131 | 0 |     rep_->filter_data = block.data.data();  // Will need to delete later | 
| 132 | 0 |   } | 
| 133 | 0 |   rep_->filter = new FilterBlockReader(rep_->options.filter_policy, block.data); | 
| 134 | 0 | } | 
| 135 |  |  | 
| 136 | 0 | Table::~Table() { delete rep_; } | 
| 137 |  |  | 
| 138 | 0 | static void DeleteBlock(void* arg, void* ignored) { | 
| 139 | 0 |   delete reinterpret_cast<Block*>(arg); | 
| 140 | 0 | } | 
| 141 |  |  | 
| 142 | 0 | static void DeleteCachedBlock(const Slice& key, void* value) { | 
| 143 | 0 |   Block* block = reinterpret_cast<Block*>(value); | 
| 144 | 0 |   delete block; | 
| 145 | 0 | } | 
| 146 |  |  | 
| 147 | 0 | static void ReleaseBlock(void* arg, void* h) { | 
| 148 | 0 |   Cache* cache = reinterpret_cast<Cache*>(arg); | 
| 149 | 0 |   Cache::Handle* handle = reinterpret_cast<Cache::Handle*>(h); | 
| 150 | 0 |   cache->Release(handle); | 
| 151 | 0 | } | 
| 152 |  |  | 
| 153 |  | // Convert an index iterator value (i.e., an encoded BlockHandle) | 
| 154 |  | // into an iterator over the contents of the corresponding block. | 
| 155 |  | Iterator* Table::BlockReader(void* arg, const ReadOptions& options, | 
| 156 | 0 |                              const Slice& index_value) { | 
| 157 | 0 |   Table* table = reinterpret_cast<Table*>(arg); | 
| 158 | 0 |   Cache* block_cache = table->rep_->options.block_cache; | 
| 159 | 0 |   Block* block = nullptr; | 
| 160 | 0 |   Cache::Handle* cache_handle = nullptr; | 
| 161 |  | 
 | 
| 162 | 0 |   BlockHandle handle; | 
| 163 | 0 |   Slice input = index_value; | 
| 164 | 0 |   Status s = handle.DecodeFrom(&input); | 
| 165 |  |   // We intentionally allow extra stuff in index_value so that we | 
| 166 |  |   // can add more features in the future. | 
| 167 |  | 
 | 
| 168 | 0 |   if (s.ok()) { | 
| 169 | 0 |     BlockContents contents; | 
| 170 | 0 |     if (block_cache != nullptr) { | 
| 171 | 0 |       char cache_key_buffer[16]; | 
| 172 | 0 |       EncodeFixed64(cache_key_buffer, table->rep_->cache_id); | 
| 173 | 0 |       EncodeFixed64(cache_key_buffer + 8, handle.offset()); | 
| 174 | 0 |       Slice key(cache_key_buffer, sizeof(cache_key_buffer)); | 
| 175 | 0 |       cache_handle = block_cache->Lookup(key); | 
| 176 | 0 |       if (cache_handle != nullptr) { | 
| 177 | 0 |         block = reinterpret_cast<Block*>(block_cache->Value(cache_handle)); | 
| 178 | 0 |       } else { | 
| 179 | 0 |         s = ReadBlock(table->rep_->file, options, handle, &contents); | 
| 180 | 0 |         if (s.ok()) { | 
| 181 | 0 |           block = new Block(contents); | 
| 182 | 0 |           if (contents.cachable && options.fill_cache) { | 
| 183 | 0 |             cache_handle = block_cache->Insert(key, block, block->size(), | 
| 184 | 0 |                                                &DeleteCachedBlock); | 
| 185 | 0 |           } | 
| 186 | 0 |         } | 
| 187 | 0 |       } | 
| 188 | 0 |     } else { | 
| 189 | 0 |       s = ReadBlock(table->rep_->file, options, handle, &contents); | 
| 190 | 0 |       if (s.ok()) { | 
| 191 | 0 |         block = new Block(contents); | 
| 192 | 0 |       } | 
| 193 | 0 |     } | 
| 194 | 0 |   } | 
| 195 |  | 
 | 
| 196 | 0 |   Iterator* iter; | 
| 197 | 0 |   if (block != nullptr) { | 
| 198 | 0 |     iter = block->NewIterator(table->rep_->options.comparator); | 
| 199 | 0 |     if (cache_handle == nullptr) { | 
| 200 | 0 |       iter->RegisterCleanup(&DeleteBlock, block, nullptr); | 
| 201 | 0 |     } else { | 
| 202 | 0 |       iter->RegisterCleanup(&ReleaseBlock, block_cache, cache_handle); | 
| 203 | 0 |     } | 
| 204 | 0 |   } else { | 
| 205 | 0 |     iter = NewErrorIterator(s); | 
| 206 | 0 |   } | 
| 207 | 0 |   return iter; | 
| 208 | 0 | } | 
| 209 |  |  | 
| 210 | 0 | Iterator* Table::NewIterator(const ReadOptions& options) const { | 
| 211 | 0 |   return NewTwoLevelIterator( | 
| 212 | 0 |       rep_->index_block->NewIterator(rep_->options.comparator), | 
| 213 | 0 |       &Table::BlockReader, const_cast<Table*>(this), options); | 
| 214 | 0 | } | 
| 215 |  |  | 
| 216 |  | Status Table::InternalGet(const ReadOptions& options, const Slice& k, void* arg, | 
| 217 |  |                           void (*handle_result)(void*, const Slice&, | 
| 218 | 0 |                                                 const Slice&)) { | 
| 219 | 0 |   Status s; | 
| 220 | 0 |   Iterator* iiter = rep_->index_block->NewIterator(rep_->options.comparator); | 
| 221 | 0 |   iiter->Seek(k); | 
| 222 | 0 |   if (iiter->Valid()) { | 
| 223 | 0 |     Slice handle_value = iiter->value(); | 
| 224 | 0 |     FilterBlockReader* filter = rep_->filter; | 
| 225 | 0 |     BlockHandle handle; | 
| 226 | 0 |     if (filter != nullptr && handle.DecodeFrom(&handle_value).ok() && | 
| 227 | 0 |         !filter->KeyMayMatch(handle.offset(), k)) { | 
| 228 |  |       // Not found | 
| 229 | 0 |     } else { | 
| 230 | 0 |       Iterator* block_iter = BlockReader(this, options, iiter->value()); | 
| 231 | 0 |       block_iter->Seek(k); | 
| 232 | 0 |       if (block_iter->Valid()) { | 
| 233 | 0 |         (*handle_result)(arg, block_iter->key(), block_iter->value()); | 
| 234 | 0 |       } | 
| 235 | 0 |       s = block_iter->status(); | 
| 236 | 0 |       delete block_iter; | 
| 237 | 0 |     } | 
| 238 | 0 |   } | 
| 239 | 0 |   if (s.ok()) { | 
| 240 | 0 |     s = iiter->status(); | 
| 241 | 0 |   } | 
| 242 | 0 |   delete iiter; | 
| 243 | 0 |   return s; | 
| 244 | 0 | } | 
| 245 |  |  | 
| 246 | 0 | uint64_t Table::ApproximateOffsetOf(const Slice& key) const { | 
| 247 | 0 |   Iterator* index_iter = | 
| 248 | 0 |       rep_->index_block->NewIterator(rep_->options.comparator); | 
| 249 | 0 |   index_iter->Seek(key); | 
| 250 | 0 |   uint64_t result; | 
| 251 | 0 |   if (index_iter->Valid()) { | 
| 252 | 0 |     BlockHandle handle; | 
| 253 | 0 |     Slice input = index_iter->value(); | 
| 254 | 0 |     Status s = handle.DecodeFrom(&input); | 
| 255 | 0 |     if (s.ok()) { | 
| 256 | 0 |       result = handle.offset(); | 
| 257 | 0 |     } else { | 
| 258 |  |       // Strange: we can't decode the block handle in the index block. | 
| 259 |  |       // We'll just return the offset of the metaindex block, which is | 
| 260 |  |       // close to the whole file size for this case. | 
| 261 | 0 |       result = rep_->metaindex_handle.offset(); | 
| 262 | 0 |     } | 
| 263 | 0 |   } else { | 
| 264 |  |     // key is past the last key in the file.  Approximate the offset | 
| 265 |  |     // by returning the offset of the metaindex block (which is | 
| 266 |  |     // right near the end of the file). | 
| 267 | 0 |     result = rep_->metaindex_handle.offset(); | 
| 268 | 0 |   } | 
| 269 | 0 |   delete index_iter; | 
| 270 | 0 |   return result; | 
| 271 | 0 | } | 
| 272 |  |  | 
| 273 |  | }  // namespace leveldb |