Coverage Report

Created: 2025-07-23 06:38

/src/brunsli/c/dec/huffman_decode.cc
Line
Count
Source (jump to first uncovered line)
1
// Copyright (c) Google LLC 2019
2
//
3
// Use of this source code is governed by an MIT-style
4
// license that can be found in the LICENSE file or at
5
// https://opensource.org/licenses/MIT.
6
7
#include "./huffman_decode.h"
8
9
#include <cstring>  /* for memset */
10
#include <vector>
11
12
#include "../common/constants.h"
13
#include "../common/platform.h"
14
#include <brunsli/types.h>
15
#include "./bit_reader.h"
16
#include "./huffman_table.h"
17
18
namespace brunsli {
19
20
static const int kCodeLengthCodes = 18;
21
static const uint8_t kCodeLengthCodeOrder[kCodeLengthCodes] = {
22
    1, 2, 3, 4, 0, 5, 17, 6, 16, 7, 8, 9, 10, 11, 12, 13, 14, 15,
23
};
24
static const uint8_t kDefaultCodeLength = 8;
25
static const uint8_t kCodeLengthRepeatCode = 16;
26
27
bool ReadHuffmanCodeLengths(const uint8_t* code_length_code_lengths,
28
                           size_t num_symbols, uint8_t* code_lengths,
29
357
                           BrunsliBitReader* br) {
30
357
  size_t symbol = 0;
31
357
  uint8_t prev_code_len = kDefaultCodeLength;
32
357
  size_t repeat = 0;
33
357
  uint8_t repeat_code_len = 0;
34
357
  const int kFullSpace = 1 << 15;
35
357
  int space = kFullSpace;
36
357
  HuffmanCode table[32];
37
38
357
  uint16_t counts[16] = {0};
39
6.78k
  for (int i = 0; i < kCodeLengthCodes; ++i) {
40
6.42k
    ++counts[code_length_code_lengths[i]];
41
6.42k
  }
42
357
  if (!BuildHuffmanTable(table, 5, code_length_code_lengths, kCodeLengthCodes,
43
357
                         &counts[0])) {
44
0
    return false;
45
0
  }
46
47
9.99k
  while (symbol < num_symbols && space > 0) {
48
9.69k
    const HuffmanCode* p = table;
49
9.69k
    uint8_t code_len;
50
9.69k
    p += BrunsliBitReaderGet(br, 5);
51
9.69k
    BrunsliBitReaderDrop(br, p->bits);
52
9.69k
    code_len = (uint8_t)p->value;
53
9.69k
    if (code_len < kCodeLengthRepeatCode) {
54
8.48k
      repeat = 0;
55
8.48k
      code_lengths[symbol++] = code_len;
56
8.48k
      if (code_len != 0) {
57
6.54k
        prev_code_len = code_len;
58
6.54k
        space -= kFullSpace >> code_len;
59
6.54k
      }
60
8.48k
    } else {
61
1.20k
      uint32_t extra_bits = code_len - 14;  // >= 2
62
1.20k
      size_t old_repeat;
63
1.20k
      size_t repeat_delta;
64
1.20k
      uint8_t new_len = 0;
65
1.20k
      if (code_len == kCodeLengthRepeatCode) {
66
872
        new_len = prev_code_len;
67
872
      }
68
1.20k
      if (repeat_code_len != new_len) {
69
345
        repeat = 0;
70
345
        repeat_code_len = new_len;
71
345
      }
72
1.20k
      old_repeat = repeat;
73
1.20k
      if (repeat > 0) {  // >= 3
74
333
        repeat -= 2;
75
333
        repeat <<= extra_bits;
76
333
      }
77
1.20k
      repeat += BrunsliBitReaderRead(br, extra_bits) + 3u;
78
1.20k
      repeat_delta = repeat - old_repeat;
79
1.20k
      if (symbol + repeat_delta > num_symbols) {
80
50
        return false;
81
50
      }
82
1.15k
      memset(&code_lengths[symbol], repeat_code_len, (size_t)repeat_delta);
83
1.15k
      symbol += repeat_delta;
84
1.15k
      if (repeat_code_len != 0) {
85
853
        space -= static_cast<int>(repeat_delta * kFullSpace) >> repeat_code_len;
86
853
      }
87
1.15k
    }
88
9.69k
  }
89
307
  if (space != 0) {
90
102
    return false;
91
102
  }
92
205
  memset(&code_lengths[symbol], 0, (size_t)(num_symbols - symbol));
93
205
  return BrunsliBitReaderIsHealthy(br);
94
307
}
95
96
static BRUNSLI_INLINE bool ReadSimpleCode(uint16_t alphabet_size,
97
                                          BrunsliBitReader* br,
98
700
                                          HuffmanCode* table) {
99
700
  uint32_t max_bits =
100
700
      (alphabet_size > 1u) ? Log2FloorNonZero(alphabet_size - 1u) + 1 : 0;
101
102
700
  size_t num_symbols = BrunsliBitReaderRead(br, 2) + 1;
103
104
700
  uint16_t symbols[4] = {0};
105
1.77k
  for (size_t i = 0; i < num_symbols; ++i) {
106
1.10k
    uint16_t symbol = BrunsliBitReaderRead(br, max_bits);
107
1.10k
    if (symbol >= alphabet_size) {
108
30
      return false;
109
30
    }
110
1.07k
    symbols[i] = symbol;
111
1.07k
  }
112
113
972
  for (size_t i = 0; i < num_symbols - 1; ++i) {
114
865
    for (size_t j = i + 1; j < num_symbols; ++j) {
115
563
      if (symbols[i] == symbols[j]) return false;
116
563
    }
117
330
  }
118
119
  // 4 symbols have to option to encode.
120
642
  if (num_symbols == 4) num_symbols += BrunsliBitReaderRead(br, 1);
121
122
642
  const auto swap_symbols = [&symbols] (size_t i, size_t j) {
123
259
    uint16_t t = symbols[j];
124
259
    symbols[j] = symbols[i];
125
259
    symbols[i] = t;
126
259
  };
127
128
642
  size_t table_size = 1;
129
642
  switch (num_symbols) {
130
496
    case 1:
131
496
      table[0] = {0, symbols[0]};
132
496
      break;
133
64
    case 2:
134
64
      if (symbols[0] > symbols[1]) swap_symbols(0, 1);
135
64
      table[0] = {1, symbols[0]};
136
64
      table[1] = {1, symbols[1]};
137
64
      table_size = 2;
138
64
      break;
139
25
    case 3:
140
25
      if (symbols[1] > symbols[2]) swap_symbols(1, 2);
141
25
      table[0] = {1, symbols[0]};
142
25
      table[2] = {1, symbols[0]};
143
25
      table[1] = {2, symbols[1]};
144
25
      table[3] = {2, symbols[2]};
145
25
      table_size = 4;
146
25
      break;
147
48
    case 4: {
148
192
      for (size_t i = 0; i < 3; ++i) {
149
432
        for (size_t j = i + 1; j < 4; ++j) {
150
288
          if (symbols[i] > symbols[j]) swap_symbols(i, j);
151
288
        }
152
144
      }
153
48
      table[0] = {2, symbols[0]};
154
48
      table[2] = {2, symbols[1]};
155
48
      table[1] = {2, symbols[2]};
156
48
      table[3] = {2, symbols[3]};
157
48
      table_size = 4;
158
48
      break;
159
0
    }
160
9
    case 5: {
161
9
      if (symbols[2] > symbols[3]) swap_symbols(2, 3);
162
9
      table[0] = {1, symbols[0]};
163
9
      table[1] = {2, symbols[1]};
164
9
      table[2] = {1, symbols[0]};
165
9
      table[3] = {3, symbols[2]};
166
9
      table[4] = {1, symbols[0]};
167
9
      table[5] = {2, symbols[1]};
168
9
      table[6] = {1, symbols[0]};
169
9
      table[7] = {3, symbols[3]};
170
9
      table_size = 8;
171
9
      break;
172
0
    }
173
0
    default: {
174
      // Unreachable.
175
0
      return false;
176
0
    }
177
642
  }
178
179
642
  const uint32_t goal_size = 1u << kHuffmanTableBits;
180
5.54k
  while (table_size != goal_size) {
181
4.89k
    memcpy(&table[table_size], &table[0],
182
4.89k
           (size_t)table_size * sizeof(table[0]));
183
4.89k
    table_size <<= 1;
184
4.89k
  }
185
186
642
  return BrunsliBitReaderIsHealthy(br);
187
642
}
188
189
bool HuffmanDecodingData::ReadFromBitStream(
190
    size_t alphabet_size, BrunsliBitReader* br,
191
1.12k
    Arena<HuffmanCode>* arena) {
192
1.12k
  Arena<HuffmanCode> local_arena;
193
1.12k
  if (arena == nullptr) arena = &local_arena;
194
195
1.12k
  if (alphabet_size > (1 << kMaxHuffmanBits)) return false;
196
197
1.12k
  std::vector<uint8_t> code_lengths(alphabet_size, 0);
198
  /* simple_code_or_skip is used as follows:
199
     1 for simple code;
200
     0 for no skipping, 2 skips 2 code lengths, 3 skips 3 code lengths */
201
1.12k
  uint32_t simple_code_or_skip = BrunsliBitReaderRead(br, 2);
202
1.12k
  if (simple_code_or_skip == 1u) {
203
700
    table_.resize(1u << kHuffmanTableBits);
204
700
    return ReadSimpleCode(static_cast<uint16_t>(alphabet_size), br,
205
700
                          table_.data());
206
700
  }
207
208
425
  uint8_t code_length_code_lengths[kCodeLengthCodes] = {0};
209
425
  int space = 32;
210
425
  int num_codes = 0;
211
  /* Static Huffman code for the code length code lengths */
212
425
  static const HuffmanCode huff[16] = {
213
425
      {2, 0}, {2, 4}, {2, 3}, {3, 2}, {2, 0}, {2, 4}, {2, 3}, {4, 1},
214
425
      {2, 0}, {2, 4}, {2, 3}, {3, 2}, {2, 0}, {2, 4}, {2, 3}, {4, 5},
215
425
  };
216
5.43k
  for (size_t i = simple_code_or_skip; i < kCodeLengthCodes && space > 0; ++i) {
217
5.00k
    const int code_len_idx = kCodeLengthCodeOrder[i];
218
5.00k
    const HuffmanCode* p = huff;
219
5.00k
    uint8_t v;
220
5.00k
    p += BrunsliBitReaderGet(br, 4);
221
5.00k
    BrunsliBitReaderDrop(br, p->bits);
222
5.00k
    v = (uint8_t)p->value;
223
5.00k
    code_length_code_lengths[code_len_idx] = v;
224
5.00k
    if (v != 0) {
225
2.33k
      space -= (32u >> v);
226
2.33k
      ++num_codes;
227
2.33k
    }
228
5.00k
  }
229
425
  bool ok = (num_codes == 1 || space == 0) &&
230
425
       ReadHuffmanCodeLengths(code_length_code_lengths, alphabet_size,
231
357
                              &code_lengths[0], br);
232
233
425
  if (!ok || !BrunsliBitReaderIsHealthy(br)) return false;
234
190
  uint16_t counts[16] = {0};
235
21.5k
  for (size_t i = 0; i < alphabet_size; ++i) {
236
21.3k
    ++counts[code_lengths[i]];
237
21.3k
  }
238
190
  arena->reserve(alphabet_size + 376);
239
190
  uint32_t table_size =
240
190
      BuildHuffmanTable(arena->data(), kHuffmanTableBits, &code_lengths[0],
241
190
                        alphabet_size, &counts[0]);
242
190
  table_ = std::vector<HuffmanCode>(arena->data(), arena->data() + table_size);
243
190
  return (table_size > 0);
244
425
}
245
246
// Decodes the next Huffman coded symbol from the bit-stream.
247
965k
uint16_t HuffmanDecodingData::ReadSymbol(BrunsliBitReader* br) const {
248
965k
  uint32_t n_bits;
249
965k
  const HuffmanCode* table = table_.data();
250
965k
  table += BrunsliBitReaderGet(br, kHuffmanTableBits);
251
965k
  n_bits = table->bits;
252
965k
  if (n_bits > kHuffmanTableBits) {
253
736
    BrunsliBitReaderDrop(br, kHuffmanTableBits);
254
736
    n_bits -= kHuffmanTableBits;
255
736
    table += table->value;
256
736
    table += BrunsliBitReaderGet(br, n_bits);
257
736
  }
258
965k
  BrunsliBitReaderDrop(br, table->bits);
259
965k
  return table->value;
260
965k
}
261
262
}  // namespace brunsli