Coverage Report

Created: 2025-06-10 07:27

/src/ghostpdl/brotli/c/enc/block_splitter.c
Line
Count
Source (jump to first uncovered line)
1
/* Copyright 2013 Google Inc. All Rights Reserved.
2
3
   Distributed under MIT license.
4
   See file LICENSE for detail or copy at https://opensource.org/licenses/MIT
5
*/
6
7
/* Block split point selection utilities. */
8
9
#include "block_splitter.h"
10
11
#include <string.h>  /* memcpy, memset */
12
13
#include "../common/platform.h"
14
#include "bit_cost.h"
15
#include "cluster.h"
16
#include "command.h"
17
#include "fast_log.h"
18
#include "histogram.h"
19
#include "memory.h"
20
#include "quality.h"
21
22
#if defined(__cplusplus) || defined(c_plusplus)
23
extern "C" {
24
#endif
25
26
static const size_t kMaxLiteralHistograms = 100;
27
static const size_t kMaxCommandHistograms = 50;
28
static const double kLiteralBlockSwitchCost = 28.1;
29
static const double kCommandBlockSwitchCost = 13.5;
30
static const double kDistanceBlockSwitchCost = 14.6;
31
static const size_t kLiteralStrideLength = 70;
32
static const size_t kCommandStrideLength = 40;
33
static const size_t kDistanceStrideLength = 40;
34
static const size_t kSymbolsPerLiteralHistogram = 544;
35
static const size_t kSymbolsPerCommandHistogram = 530;
36
static const size_t kSymbolsPerDistanceHistogram = 544;
37
static const size_t kMinLengthForBlockSplitting = 128;
38
static const size_t kIterMulForRefining = 2;
39
static const size_t kMinItersForRefining = 100;
40
41
0
static size_t CountLiterals(const Command* cmds, const size_t num_commands) {
42
  /* Count how many we have. */
43
0
  size_t total_length = 0;
44
0
  size_t i;
45
0
  for (i = 0; i < num_commands; ++i) {
46
0
    total_length += cmds[i].insert_len_;
47
0
  }
48
0
  return total_length;
49
0
}
50
51
static void CopyLiteralsToByteArray(const Command* cmds,
52
                                    const size_t num_commands,
53
                                    const uint8_t* data,
54
                                    const size_t offset,
55
                                    const size_t mask,
56
0
                                    uint8_t* literals) {
57
0
  size_t pos = 0;
58
0
  size_t from_pos = offset & mask;
59
0
  size_t i;
60
0
  for (i = 0; i < num_commands; ++i) {
61
0
    size_t insert_len = cmds[i].insert_len_;
62
0
    if (from_pos + insert_len > mask) {
63
0
      size_t head_size = mask + 1 - from_pos;
64
0
      memcpy(literals + pos, data + from_pos, head_size);
65
0
      from_pos = 0;
66
0
      pos += head_size;
67
0
      insert_len -= head_size;
68
0
    }
69
0
    if (insert_len > 0) {
70
0
      memcpy(literals + pos, data + from_pos, insert_len);
71
0
      pos += insert_len;
72
0
    }
73
0
    from_pos = (from_pos + insert_len + CommandCopyLen(&cmds[i])) & mask;
74
0
  }
75
0
}
76
77
0
static BROTLI_INLINE uint32_t MyRand(uint32_t* seed) {
78
  /* Initial seed should be 7. In this case, loop length is (1 << 29). */
79
0
  *seed *= 16807U;
80
0
  return *seed;
81
0
}
82
83
0
static BROTLI_INLINE double BitCost(size_t count) {
84
0
  return count == 0 ? -2.0 : FastLog2(count);
85
0
}
86
87
0
#define HISTOGRAMS_PER_BATCH 64
88
0
#define CLUSTERS_PER_BATCH 16
89
90
0
#define FN(X) X ## Literal
91
#define DataType uint8_t
92
/* NOLINTNEXTLINE(build/include) */
93
#include "block_splitter_inc.h"
94
#undef DataType
95
#undef FN
96
97
0
#define FN(X) X ## Command
98
#define DataType uint16_t
99
/* NOLINTNEXTLINE(build/include) */
100
#include "block_splitter_inc.h"
101
#undef FN
102
103
0
#define FN(X) X ## Distance
104
/* NOLINTNEXTLINE(build/include) */
105
#include "block_splitter_inc.h"
106
#undef DataType
107
#undef FN
108
109
0
void BrotliInitBlockSplit(BlockSplit* self) {
110
0
  self->num_types = 0;
111
0
  self->num_blocks = 0;
112
0
  self->types = 0;
113
0
  self->lengths = 0;
114
0
  self->types_alloc_size = 0;
115
0
  self->lengths_alloc_size = 0;
116
0
}
117
118
0
void BrotliDestroyBlockSplit(MemoryManager* m, BlockSplit* self) {
119
0
  BROTLI_FREE(m, self->types);
120
0
  BROTLI_FREE(m, self->lengths);
121
0
}
122
123
/* Extracts literals, command distance and prefix codes, then applies
124
 * SplitByteVector to create partitioning. */
125
void BrotliSplitBlock(MemoryManager* m,
126
                      const Command* cmds,
127
                      const size_t num_commands,
128
                      const uint8_t* data,
129
                      const size_t pos,
130
                      const size_t mask,
131
                      const BrotliEncoderParams* params,
132
                      BlockSplit* literal_split,
133
                      BlockSplit* insert_and_copy_split,
134
0
                      BlockSplit* dist_split) {
135
0
  {
136
0
    size_t literals_count = CountLiterals(cmds, num_commands);
137
0
    uint8_t* literals = BROTLI_ALLOC(m, uint8_t, literals_count);
138
0
    if (BROTLI_IS_OOM(m) || BROTLI_IS_NULL(literals)) return;
139
    /* Create a continuous array of literals. */
140
0
    CopyLiteralsToByteArray(cmds, num_commands, data, pos, mask, literals);
141
    /* Create the block split on the array of literals.
142
     * Literal histograms can have alphabet size up to 256.
143
     * Though, to accomodate context modeling, less than half of maximum size
144
     * is allowed. */
145
0
    SplitByteVectorLiteral(
146
0
        m, literals, literals_count,
147
0
        kSymbolsPerLiteralHistogram, kMaxLiteralHistograms,
148
0
        kLiteralStrideLength, kLiteralBlockSwitchCost, params,
149
0
        literal_split);
150
0
    if (BROTLI_IS_OOM(m)) return;
151
0
    BROTLI_FREE(m, literals);
152
    /* NB: this might be a good place for injecting extra splitting without
153
     *     increasing encoder complexity; however, output parition would be less
154
     *     optimal than one produced with forced splitting inside
155
     *     SplitByteVector (FindBlocks / ClusterBlocks). */
156
0
  }
157
158
0
  {
159
    /* Compute prefix codes for commands. */
160
0
    uint16_t* insert_and_copy_codes = BROTLI_ALLOC(m, uint16_t, num_commands);
161
0
    size_t i;
162
0
    if (BROTLI_IS_OOM(m) || BROTLI_IS_NULL(insert_and_copy_codes)) return;
163
0
    for (i = 0; i < num_commands; ++i) {
164
0
      insert_and_copy_codes[i] = cmds[i].cmd_prefix_;
165
0
    }
166
    /* Create the block split on the array of command prefixes. */
167
0
    SplitByteVectorCommand(
168
0
        m, insert_and_copy_codes, num_commands,
169
0
        kSymbolsPerCommandHistogram, kMaxCommandHistograms,
170
0
        kCommandStrideLength, kCommandBlockSwitchCost, params,
171
0
        insert_and_copy_split);
172
0
    if (BROTLI_IS_OOM(m)) return;
173
    /* TODO(eustas): reuse for distances? */
174
0
    BROTLI_FREE(m, insert_and_copy_codes);
175
0
  }
176
177
0
  {
178
    /* Create a continuous array of distance prefixes. */
179
0
    uint16_t* distance_prefixes = BROTLI_ALLOC(m, uint16_t, num_commands);
180
0
    size_t j = 0;
181
0
    size_t i;
182
0
    if (BROTLI_IS_OOM(m) || BROTLI_IS_NULL(distance_prefixes)) return;
183
0
    for (i = 0; i < num_commands; ++i) {
184
0
      const Command* cmd = &cmds[i];
185
0
      if (CommandCopyLen(cmd) && cmd->cmd_prefix_ >= 128) {
186
0
        distance_prefixes[j++] = cmd->dist_prefix_ & 0x3FF;
187
0
      }
188
0
    }
189
    /* Create the block split on the array of distance prefixes. */
190
0
    SplitByteVectorDistance(
191
0
        m, distance_prefixes, j,
192
0
        kSymbolsPerDistanceHistogram, kMaxCommandHistograms,
193
0
        kDistanceStrideLength, kDistanceBlockSwitchCost, params,
194
0
        dist_split);
195
0
    if (BROTLI_IS_OOM(m)) return;
196
0
    BROTLI_FREE(m, distance_prefixes);
197
0
  }
198
0
}
199
200
#if defined(BROTLI_TEST)
201
size_t CountLiteralsForTest(const Command*, const size_t);
202
size_t CountLiteralsForTest(const Command* cmds, const size_t num_commands) {
203
  return CountLiterals(cmds, num_commands);
204
}
205
206
void CopyLiteralsToByteArrayForTest(const Command*,
207
    const size_t, const uint8_t*, const size_t, const size_t, uint8_t*);
208
void CopyLiteralsToByteArrayForTest(const Command* cmds,
209
    const size_t num_commands, const uint8_t* data, const size_t offset,
210
    const size_t mask, uint8_t* literals) {
211
  CopyLiteralsToByteArray(cmds, num_commands, data, offset, mask, literals);
212
}
213
#endif
214
215
#if defined(__cplusplus) || defined(c_plusplus)
216
}  /* extern "C" */
217
#endif