Coverage Report

Created: 2023-01-25 06:32

/src/leveldb/table/block.cc
Line
Count
Source (jump to first uncovered line)
1
// Copyright (c) 2011 The LevelDB Authors. All rights reserved.
2
// Use of this source code is governed by a BSD-style license that can be
3
// found in the LICENSE file. See the AUTHORS file for names of contributors.
4
//
5
// Decodes the blocks generated by block_builder.cc.
6
7
#include "table/block.h"
8
9
#include <algorithm>
10
#include <cstdint>
11
#include <vector>
12
13
#include "leveldb/comparator.h"
14
#include "table/format.h"
15
#include "util/coding.h"
16
#include "util/logging.h"
17
18
namespace leveldb {
19
20
3.15M
inline uint32_t Block::NumRestarts() const {
21
3.15M
  assert(size_ >= sizeof(uint32_t));
22
3.15M
  return DecodeFixed32(data_ + size_ - sizeof(uint32_t));
23
3.15M
}
24
25
Block::Block(const BlockContents& contents)
26
    : data_(contents.data.data()),
27
      size_(contents.data.size()),
28
978k
      owned_(contents.heap_allocated) {
29
978k
  if (size_ < sizeof(uint32_t)) {
30
0
    size_ = 0;  // Error marker
31
978k
  } else {
32
978k
    size_t max_restarts_allowed = (size_ - sizeof(uint32_t)) / sizeof(uint32_t);
33
978k
    if (NumRestarts() > max_restarts_allowed) {
34
      // The size is too small for NumRestarts()
35
0
      size_ = 0;
36
978k
    } else {
37
978k
      restart_offset_ = size_ - (1 + NumRestarts()) * sizeof(uint32_t);
38
978k
    }
39
978k
  }
40
978k
}
41
42
978k
Block::~Block() {
43
978k
  if (owned_) {
44
0
    delete[] data_;
45
0
  }
46
978k
}
47
48
// Helper routine: decode the next block entry starting at "p",
49
// storing the number of shared key bytes, non_shared key bytes,
50
// and the length of the value in "*shared", "*non_shared", and
51
// "*value_length", respectively.  Will not dereference past "limit".
52
//
53
// If any errors are detected, returns nullptr.  Otherwise, returns a
54
// pointer to the key delta (just past the three decoded values).
55
static inline const char* DecodeEntry(const char* p, const char* limit,
56
                                      uint32_t* shared, uint32_t* non_shared,
57
4.28M
                                      uint32_t* value_length) {
58
4.28M
  if (limit - p < 3) return nullptr;
59
4.28M
  *shared = reinterpret_cast<const uint8_t*>(p)[0];
60
4.28M
  *non_shared = reinterpret_cast<const uint8_t*>(p)[1];
61
4.28M
  *value_length = reinterpret_cast<const uint8_t*>(p)[2];
62
4.28M
  if ((*shared | *non_shared | *value_length) < 128) {
63
    // Fast path: all three values are encoded in one byte each
64
4.09M
    p += 3;
65
4.09M
  } else {
66
194k
    if ((p = GetVarint32Ptr(p, limit, shared)) == nullptr) return nullptr;
67
194k
    if ((p = GetVarint32Ptr(p, limit, non_shared)) == nullptr) return nullptr;
68
194k
    if ((p = GetVarint32Ptr(p, limit, value_length)) == nullptr) return nullptr;
69
194k
  }
70
71
4.28M
  if (static_cast<uint32_t>(limit - p) < (*non_shared + *value_length)) {
72
0
    return nullptr;
73
0
  }
74
4.28M
  return p;
75
4.28M
}
76
77
class Block::Iter : public Iterator {
78
 private:
79
  const Comparator* const comparator_;
80
  const char* const data_;       // underlying block contents
81
  uint32_t const restarts_;      // Offset of restart array (list of fixed32)
82
  uint32_t const num_restarts_;  // Number of uint32_t entries in restart array
83
84
  // current_ is offset in data_ of current entry.  >= restarts_ if !Valid
85
  uint32_t current_;
86
  uint32_t restart_index_;  // Index of restart block in which current_ falls
87
  std::string key_;
88
  Slice value_;
89
  Status status_;
90
91
196k
  inline int Compare(const Slice& a, const Slice& b) const {
92
196k
    return comparator_->Compare(a, b);
93
196k
  }
94
95
  // Return the offset in data_ just past the end of the current entry.
96
5.16M
  inline uint32_t NextEntryOffset() const {
97
5.16M
    return (value_.data() + value_.size()) - data_;
98
5.16M
  }
99
100
4.07M
  uint32_t GetRestartPoint(uint32_t index) {
101
4.07M
    assert(index < num_restarts_);
102
4.07M
    return DecodeFixed32(data_ + restarts_ + index * sizeof(uint32_t));
103
4.07M
  }
104
105
991k
  void SeekToRestartPoint(uint32_t index) {
106
991k
    key_.clear();
107
991k
    restart_index_ = index;
108
    // current_ will be fixed by ParseNextKey();
109
110
    // ParseNextKey() starts at the end of value_, so set value_ accordingly
111
991k
    uint32_t offset = GetRestartPoint(index);
112
991k
    value_ = Slice(data_ + offset, 0);
113
991k
  }
114
115
 public:
116
  Iter(const Comparator* comparator, const char* data, uint32_t restarts,
117
       uint32_t num_restarts)
118
      : comparator_(comparator),
119
        data_(data),
120
        restarts_(restarts),
121
        num_restarts_(num_restarts),
122
        current_(restarts_),
123
1.19M
        restart_index_(num_restarts_) {
124
1.19M
    assert(num_restarts_ > 0);
125
1.19M
  }
126
127
6.26M
  bool Valid() const override { return current_ < restarts_; }
128
954k
  Status status() const override { return status_; }
129
4.12M
  Slice key() const override {
130
4.12M
    assert(Valid());
131
4.12M
    return key_;
132
4.12M
  }
133
3.41M
  Slice value() const override {
134
3.41M
    assert(Valid());
135
3.41M
    return value_;
136
3.41M
  }
137
138
4.07M
  void Next() override {
139
4.07M
    assert(Valid());
140
4.07M
    ParseNextKey();
141
4.07M
  }
142
143
0
  void Prev() override {
144
0
    assert(Valid());
145
146
    // Scan backwards to a restart point before current_
147
0
    const uint32_t original = current_;
148
0
    while (GetRestartPoint(restart_index_) >= original) {
149
0
      if (restart_index_ == 0) {
150
        // No more entries
151
0
        current_ = restarts_;
152
0
        restart_index_ = num_restarts_;
153
0
        return;
154
0
      }
155
0
      restart_index_--;
156
0
    }
157
158
0
    SeekToRestartPoint(restart_index_);
159
0
    do {
160
      // Loop until end of current entry hits the start of original entry
161
0
    } while (ParseNextKey() && NextEntryOffset() < original);
162
0
  }
163
164
66.9k
  void Seek(const Slice& target) override {
165
    // Binary search in restart array to find the last restart point
166
    // with a key < target
167
66.9k
    uint32_t left = 0;
168
66.9k
    uint32_t right = num_restarts_ - 1;
169
66.9k
    int current_key_compare = 0;
170
171
66.9k
    if (Valid()) {
172
      // If we're already scanning, use the current position as a starting
173
      // point. This is beneficial if the key we're seeking to is ahead of the
174
      // current position.
175
0
      current_key_compare = Compare(key_, target);
176
0
      if (current_key_compare < 0) {
177
        // key_ is smaller than target
178
0
        left = restart_index_;
179
0
      } else if (current_key_compare > 0) {
180
0
        right = restart_index_;
181
0
      } else {
182
        // We're seeking to the key we're already at.
183
0
        return;
184
0
      }
185
0
    }
186
187
94.4k
    while (left < right) {
188
27.4k
      uint32_t mid = (left + right + 1) / 2;
189
27.4k
      uint32_t region_offset = GetRestartPoint(mid);
190
27.4k
      uint32_t shared, non_shared, value_length;
191
27.4k
      const char* key_ptr =
192
27.4k
          DecodeEntry(data_ + region_offset, data_ + restarts_, &shared,
193
27.4k
                      &non_shared, &value_length);
194
27.4k
      if (key_ptr == nullptr || (shared != 0)) {
195
0
        CorruptionError();
196
0
        return;
197
0
      }
198
27.4k
      Slice mid_key(key_ptr, non_shared);
199
27.4k
      if (Compare(mid_key, target) < 0) {
200
        // Key at "mid" is smaller than "target".  Therefore all
201
        // blocks before "mid" are uninteresting.
202
10.1k
        left = mid;
203
17.3k
      } else {
204
        // Key at "mid" is >= "target".  Therefore all blocks at or
205
        // after "mid" are uninteresting.
206
17.3k
        right = mid - 1;
207
17.3k
      }
208
27.4k
    }
209
210
    // We might be able to use our current position within the restart block.
211
    // This is true if we determined the key we desire is in the current block
212
    // and is after than the current key.
213
66.9k
    assert(current_key_compare == 0 || Valid());
214
66.9k
    bool skip_seek = left == restart_index_ && current_key_compare < 0;
215
66.9k
    if (!skip_seek) {
216
66.9k
      SeekToRestartPoint(left);
217
66.9k
    }
218
    // Linear search (within restart block) for first key >= target
219
168k
    while (true) {
220
168k
      if (!ParseNextKey()) {
221
215
        return;
222
215
      }
223
168k
      if (Compare(key_, target) >= 0) {
224
66.7k
        return;
225
66.7k
      }
226
168k
    }
227
66.9k
  }
228
229
924k
  void SeekToFirst() override {
230
924k
    SeekToRestartPoint(0);
231
924k
    ParseNextKey();
232
924k
  }
233
234
0
  void SeekToLast() override {
235
0
    SeekToRestartPoint(num_restarts_ - 1);
236
0
    while (ParseNextKey() && NextEntryOffset() < restarts_) {
237
      // Keep skipping
238
0
    }
239
0
  }
240
241
 private:
242
0
  void CorruptionError() {
243
0
    current_ = restarts_;
244
0
    restart_index_ = num_restarts_;
245
0
    status_ = Status::Corruption("bad entry in block");
246
0
    key_.clear();
247
0
    value_.clear();
248
0
  }
249
250
5.16M
  bool ParseNextKey() {
251
5.16M
    current_ = NextEntryOffset();
252
5.16M
    const char* p = data_ + current_;
253
5.16M
    const char* limit = data_ + restarts_;  // Restarts come right after data
254
5.16M
    if (p >= limit) {
255
      // No more entries to return.  Mark as invalid.
256
910k
      current_ = restarts_;
257
910k
      restart_index_ = num_restarts_;
258
910k
      return false;
259
910k
    }
260
261
    // Decode next entry
262
4.25M
    uint32_t shared, non_shared, value_length;
263
4.25M
    p = DecodeEntry(p, limit, &shared, &non_shared, &value_length);
264
4.25M
    if (p == nullptr || key_.size() < shared) {
265
0
      CorruptionError();
266
0
      return false;
267
4.25M
    } else {
268
4.25M
      key_.resize(shared);
269
4.25M
      key_.append(p, non_shared);
270
4.25M
      value_ = Slice(p + non_shared, value_length);
271
4.44M
      while (restart_index_ + 1 < num_restarts_ &&
272
4.44M
             GetRestartPoint(restart_index_ + 1) < current_) {
273
193k
        ++restart_index_;
274
193k
      }
275
4.25M
      return true;
276
4.25M
    }
277
4.25M
  }
278
};
279
280
1.19M
Iterator* Block::NewIterator(const Comparator* comparator) {
281
1.19M
  if (size_ < sizeof(uint32_t)) {
282
0
    return NewErrorIterator(Status::Corruption("bad block contents"));
283
0
  }
284
1.19M
  const uint32_t num_restarts = NumRestarts();
285
1.19M
  if (num_restarts == 0) {
286
0
    return NewEmptyIterator();
287
1.19M
  } else {
288
1.19M
    return new Iter(comparator, data_, restart_offset_, num_restarts);
289
1.19M
  }
290
1.19M
}
291
292
}  // namespace leveldb