Coverage Report

Created: 2026-05-30 06:41

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/leveldb/table/block.cc
Line
Count
Source
1
// Copyright (c) 2011 The LevelDB Authors. All rights reserved.
2
// Use of this source code is governed by a BSD-style license that can be
3
// found in the LICENSE file. See the AUTHORS file for names of contributors.
4
//
5
// Decodes the blocks generated by block_builder.cc.
6
7
#include "table/block.h"
8
9
#include <algorithm>
10
#include <cstdint>
11
#include <vector>
12
13
#include "leveldb/comparator.h"
14
#include "table/format.h"
15
#include "util/coding.h"
16
#include "util/logging.h"
17
18
namespace leveldb {
19
20
1.16k
inline uint32_t Block::NumRestarts() const {
21
1.16k
  assert(size_ >= sizeof(uint32_t));
22
1.16k
  return DecodeFixed32(data_ + size_ - sizeof(uint32_t));
23
1.16k
}
24
25
// Wraps "contents" as a block and locates its restart array.
//
// If the contents are too short to hold the trailing restart count, or the
// count claims more restart slots than the block has room for, size_ is set
// to 0 as an error marker and restart_offset_ is left unset.
Block::Block(const BlockContents& contents)
    : data_(contents.data.data()),
      size_(contents.data.size()),
      owned_(contents.heap_allocated) {
  if (size_ < sizeof(uint32_t)) {
    size_ = 0;  // Error marker: no room for the restart count itself
    return;
  }

  // Everything in front of the trailing count could, at most, be restart slots.
  const size_t restart_capacity =
      (size_ - sizeof(uint32_t)) / sizeof(uint32_t);
  const uint32_t restart_count = NumRestarts();
  if (restart_count > restart_capacity) {
    size_ = 0;  // Error marker: block is too small for the claimed count
    return;
  }

  // The restart array plus its count occupy the tail of the block.
  restart_offset_ = size_ - (1 + restart_count) * sizeof(uint32_t);
}
41
42
376
// Frees the block bytes, but only when this Block was flagged as owning them.
Block::~Block() {
  if (!owned_) {
    return;
  }
  delete[] data_;
}
47
48
// Helper routine: decode the next block entry starting at "p",
49
// storing the number of shared key bytes, non_shared key bytes,
50
// and the length of the value in "*shared", "*non_shared", and
51
// "*value_length", respectively.  Will not dereference past "limit".
52
//
53
// If any errors are detected, returns nullptr.  Otherwise, returns a
54
// pointer to the key delta (just past the three decoded values).
55
static inline const char* DecodeEntry(const char* p, const char* limit,
56
                                      uint32_t* shared, uint32_t* non_shared,
57
820
                                      uint32_t* value_length) {
58
820
  if (limit - p < 3) return nullptr;
59
820
  *shared = reinterpret_cast<const uint8_t*>(p)[0];
60
820
  *non_shared = reinterpret_cast<const uint8_t*>(p)[1];
61
820
  *value_length = reinterpret_cast<const uint8_t*>(p)[2];
62
820
  if ((*shared | *non_shared | *value_length) < 128) {
63
    // Fast path: all three values are encoded in one byte each
64
352
    p += 3;
65
468
  } else {
66
468
    if ((p = GetVarint32Ptr(p, limit, shared)) == nullptr) return nullptr;
67
468
    if ((p = GetVarint32Ptr(p, limit, non_shared)) == nullptr) return nullptr;
68
468
    if ((p = GetVarint32Ptr(p, limit, value_length)) == nullptr) return nullptr;
69
468
  }
70
71
820
  if (static_cast<uint32_t>(limit - p) < (*non_shared + *value_length)) {
72
0
    return nullptr;
73
0
  }
74
820
  return p;
75
820
}
76
77
// Iterator over the entries stored in one block.
//
// Keys are rebuilt incrementally: each entry supplies how many leading bytes
// it shares with the previous key plus the bytes that differ.  The restart
// array lists offsets from which decoding begins with an empty key.
class Block::Iter : public Iterator {
 private:
  const Comparator* const comparator_;
  const char* const data_;       // first byte of the block
  uint32_t const restarts_;      // offset in data_ of the restart array
  uint32_t const num_restarts_;  // number of fixed32 slots in that array

  // Offset in data_ of the entry the iterator is positioned on.  A value
  // >= restarts_ means the iterator is not Valid().
  uint32_t current_;
  uint32_t restart_index_;  // index of the restart region containing current_
  std::string key_;
  Slice value_;
  Status status_;

  // Orders two keys using the comparator supplied at construction.
  inline int Compare(const Slice& a, const Slice& b) const {
    return comparator_->Compare(a, b);
  }

  // Offset in data_ of the first byte after the current entry, i.e. the byte
  // just past the end of value_.
  inline uint32_t NextEntryOffset() const {
    const char* const value_end = value_.data() + value_.size();
    return value_end - data_;
  }

  // Reads slot "index" of the restart array.
  uint32_t GetRestartPoint(uint32_t index) {
    assert(index < num_restarts_);
    const char* const slot = data_ + restarts_ + index * sizeof(uint32_t);
    return DecodeFixed32(slot);
  }

  // Prepares the iterator so that the next ParseNextKey() call decodes the
  // entry at restart point "index".
  void SeekToRestartPoint(uint32_t index) {
    key_.clear();
    restart_index_ = index;
    // current_ is not touched here; ParseNextKey() recomputes it.  Because
    // ParseNextKey() resumes from the end of value_, an empty value_ placed at
    // the restart offset makes it begin decoding exactly there.
    value_ = Slice(data_ + GetRestartPoint(index), 0);
  }

 public:
  // Builds an iterator that starts out invalid (current_ == restarts_).
  // "restarts" is the offset of the restart array inside "data" and
  // "num_restarts" is its slot count, which must be non-zero.
  Iter(const Comparator* comparator, const char* data, uint32_t restarts,
       uint32_t num_restarts)
      : comparator_(comparator),
        data_(data),
        restarts_(restarts),
        num_restarts_(num_restarts),
        current_(restarts_),
        restart_index_(num_restarts_) {
    assert(num_restarts_ > 0);
  }

  bool Valid() const override { return current_ < restarts_; }

  Status status() const override { return status_; }

  Slice key() const override {
    assert(Valid());
    return key_;
  }

  Slice value() const override {
    assert(Valid());
    return value_;
  }

  // Advances to the following entry; the iterator becomes invalid once the
  // entry area is exhausted.
  void Next() override {
    assert(Valid());
    ParseNextKey();
  }

  // Steps back to the entry preceding the current one, or invalidates the
  // iterator if the current entry is the first.
  void Prev() override {
    assert(Valid());

    // Walk restart_index_ backwards until it names a restart point that lies
    // strictly before the entry we started on.
    const uint32_t start_offset = current_;
    for (; GetRestartPoint(restart_index_) >= start_offset; --restart_index_) {
      if (restart_index_ == 0) {
        // Nothing precedes the starting entry.
        current_ = restarts_;
        restart_index_ = num_restarts_;
        return;
      }
    }

    // Decode forward from that restart point, stopping on the entry whose end
    // meets the start of the entry we began on.
    SeekToRestartPoint(restart_index_);
    while (ParseNextKey() && NextEntryOffset() < start_offset) {
      // Keep decoding
    }
  }

  // Positions the iterator on the first entry whose key is >= target, or
  // leaves it invalid when there is no such entry.
  void Seek(const Slice& target) override {
    // [lo, hi] brackets the restart regions still under consideration while
    // searching for the last restart point whose key is < target.
    uint32_t lo = 0;
    uint32_t hi = num_restarts_ - 1;
    int cmp_with_current = 0;

    if (Valid()) {
      // An iterator that is already positioned can narrow the search range
      // using its own key, which pays off when the target lies ahead of it.
      cmp_with_current = Compare(key_, target);
      if (cmp_with_current == 0) {
        // Already sitting on the requested key.
        return;
      }
      if (cmp_with_current < 0) {
        lo = restart_index_;  // current key is smaller than target
      } else {
        hi = restart_index_;  // current key is larger than target
      }
    }

    while (lo < hi) {
      const uint32_t mid = (lo + hi + 1) / 2;
      const uint32_t region_offset = GetRestartPoint(mid);
      uint32_t shared = 0;
      uint32_t non_shared = 0;
      uint32_t value_length = 0;
      const char* const key_ptr =
          DecodeEntry(data_ + region_offset, data_ + restarts_, &shared,
                      &non_shared, &value_length);
      // The entry at a restart point must carry its whole key (shared == 0).
      if (key_ptr == nullptr || shared != 0) {
        CorruptionError();
        return;
      }
      if (Compare(Slice(key_ptr, non_shared), target) < 0) {
        // Key at "mid" is below "target": regions before "mid" are out.
        lo = mid;
      } else {
        // Key at "mid" is >= "target": regions at or after "mid" are out.
        hi = mid - 1;
      }
    }

    // If the search landed in the restart region we are already in, and the
    // current key is before the target, the linear scan can continue from the
    // current position instead of rewinding to the restart point.
    assert(cmp_with_current == 0 || Valid());
    const bool resume_in_place =
        (lo == restart_index_) && (cmp_with_current < 0);
    if (!resume_in_place) {
      SeekToRestartPoint(lo);
    }

    // Linear scan inside the restart region for the first key >= target.
    while (ParseNextKey() && Compare(key_, target) < 0) {
      // Keep scanning
    }
  }

  void SeekToFirst() override {
    SeekToRestartPoint(0);
    ParseNextKey();
  }

  // Starts at the last restart point and decodes forward until the current
  // entry ends where the restart array begins.
  void SeekToLast() override {
    SeekToRestartPoint(num_restarts_ - 1);
    do {
      // Keep skipping
    } while (ParseNextKey() && NextEntryOffset() < restarts_);
  }

 private:
  // Invalidates the iterator and records a corruption status.
  void CorruptionError() {
    current_ = restarts_;
    restart_index_ = num_restarts_;
    status_ = Status::Corruption("bad entry in block");
    key_.clear();
    value_.clear();
  }

  // Decodes the entry that follows the current one into key_ / value_.
  // Returns false, leaving the iterator invalid, when the entry area is
  // exhausted or the entry is malformed; the malformed case also sets status_.
  bool ParseNextKey() {
    current_ = NextEntryOffset();
    const char* cursor = data_ + current_;
    const char* const entries_end = data_ + restarts_;  // restart array follows
    if (cursor >= entries_end) {
      // Ran off the end of the entries: mark as invalid.
      current_ = restarts_;
      restart_index_ = num_restarts_;
      return false;
    }

    uint32_t shared = 0;
    uint32_t non_shared = 0;
    uint32_t value_length = 0;
    cursor =
        DecodeEntry(cursor, entries_end, &shared, &non_shared, &value_length);
    // An entry cannot share more bytes than the previous key has.
    if (cursor == nullptr || key_.size() < shared) {
      CorruptionError();
      return false;
    }

    // Keep the shared prefix of the previous key and append the new suffix.
    key_.resize(shared);
    key_.append(cursor, non_shared);
    value_ = Slice(cursor + non_shared, value_length);

    // Advance restart_index_ past every restart point that lies before
    // current_.
    while (restart_index_ + 1 < num_restarts_ &&
           GetRestartPoint(restart_index_ + 1) < current_) {
      ++restart_index_;
    }
    return true;
  }
};
279
280
414
// Creates an iterator over this block's entries, ordered by "comparator".
//
// Returns an error iterator carrying a Corruption status when the block is
// smaller than a restart count (which includes the size_ == 0 error marker
// set by the constructor), and an empty iterator when the block declares
// zero restart points.
Iterator* Block::NewIterator(const Comparator* comparator) {
  if (size_ < sizeof(uint32_t)) {
    return NewErrorIterator(Status::Corruption("bad block contents"));
  }

  const uint32_t restart_count = NumRestarts();
  if (restart_count == 0) {
    return NewEmptyIterator();
  }
  return new Iter(comparator, data_, restart_offset_, restart_count);
}
291
292
}  // namespace leveldb