/src/ghostpdl/brotli/c/enc/block_splitter.c
Line | Count | Source (jump to first uncovered line) |
1 | | /* Copyright 2013 Google Inc. All Rights Reserved. |
2 | | |
3 | | Distributed under MIT license. |
4 | | See file LICENSE for detail or copy at https://opensource.org/licenses/MIT |
5 | | */ |
6 | | |
7 | | /* Block split point selection utilities. */ |
8 | | |
9 | | #include "block_splitter.h" |
10 | | |
11 | | #include <string.h> /* memcpy, memset */ |
12 | | |
13 | | #include "../common/platform.h" |
14 | | #include "bit_cost.h" |
15 | | #include "cluster.h" |
16 | | #include "command.h" |
17 | | #include "fast_log.h" |
18 | | #include "histogram.h" |
19 | | #include "memory.h" |
20 | | #include "quality.h" |
21 | | |
22 | | #if defined(__cplusplus) || defined(c_plusplus) |
23 | | extern "C" { |
24 | | #endif |
25 | | |
26 | | static const size_t kMaxLiteralHistograms = 100; |
27 | | static const size_t kMaxCommandHistograms = 50; |
28 | | static const double kLiteralBlockSwitchCost = 28.1; |
29 | | static const double kCommandBlockSwitchCost = 13.5; |
30 | | static const double kDistanceBlockSwitchCost = 14.6; |
31 | | static const size_t kLiteralStrideLength = 70; |
32 | | static const size_t kCommandStrideLength = 40; |
33 | | static const size_t kDistanceStrideLength = 40; |
34 | | static const size_t kSymbolsPerLiteralHistogram = 544; |
35 | | static const size_t kSymbolsPerCommandHistogram = 530; |
36 | | static const size_t kSymbolsPerDistanceHistogram = 544; |
37 | | static const size_t kMinLengthForBlockSplitting = 128; |
38 | | static const size_t kIterMulForRefining = 2; |
39 | | static const size_t kMinItersForRefining = 100; |
40 | | |
41 | 0 | static size_t CountLiterals(const Command* cmds, const size_t num_commands) { |
42 | | /* Count how many we have. */ |
43 | 0 | size_t total_length = 0; |
44 | 0 | size_t i; |
45 | 0 | for (i = 0; i < num_commands; ++i) { |
46 | 0 | total_length += cmds[i].insert_len_; |
47 | 0 | } |
48 | 0 | return total_length; |
49 | 0 | } |
50 | | |
51 | | static void CopyLiteralsToByteArray(const Command* cmds, |
52 | | const size_t num_commands, |
53 | | const uint8_t* data, |
54 | | const size_t offset, |
55 | | const size_t mask, |
56 | 0 | uint8_t* literals) { |
57 | 0 | size_t pos = 0; |
58 | 0 | size_t from_pos = offset & mask; |
59 | 0 | size_t i; |
60 | 0 | for (i = 0; i < num_commands; ++i) { |
61 | 0 | size_t insert_len = cmds[i].insert_len_; |
62 | 0 | if (from_pos + insert_len > mask) { |
63 | 0 | size_t head_size = mask + 1 - from_pos; |
64 | 0 | memcpy(literals + pos, data + from_pos, head_size); |
65 | 0 | from_pos = 0; |
66 | 0 | pos += head_size; |
67 | 0 | insert_len -= head_size; |
68 | 0 | } |
69 | 0 | if (insert_len > 0) { |
70 | 0 | memcpy(literals + pos, data + from_pos, insert_len); |
71 | 0 | pos += insert_len; |
72 | 0 | } |
73 | 0 | from_pos = (from_pos + insert_len + CommandCopyLen(&cmds[i])) & mask; |
74 | 0 | } |
75 | 0 | } |
76 | | |
77 | 0 | static BROTLI_INLINE uint32_t MyRand(uint32_t* seed) { |
78 | | /* Initial seed should be 7. In this case, loop length is (1 << 29). */ |
79 | 0 | *seed *= 16807U; |
80 | 0 | return *seed; |
81 | 0 | } |
82 | | |
83 | 0 | static BROTLI_INLINE double BitCost(size_t count) { |
84 | 0 | return count == 0 ? -2.0 : FastLog2(count); |
85 | 0 | } |
86 | | |
87 | 0 | #define HISTOGRAMS_PER_BATCH 64 |
88 | 0 | #define CLUSTERS_PER_BATCH 16 |
89 | | |
90 | 0 | #define FN(X) X ## Literal |
91 | | #define DataType uint8_t |
92 | | /* NOLINTNEXTLINE(build/include) */ |
93 | | #include "block_splitter_inc.h" |
94 | | #undef DataType |
95 | | #undef FN |
96 | | |
97 | 0 | #define FN(X) X ## Command |
98 | | #define DataType uint16_t |
99 | | /* NOLINTNEXTLINE(build/include) */ |
100 | | #include "block_splitter_inc.h" |
101 | | #undef FN |
102 | | |
103 | 0 | #define FN(X) X ## Distance |
104 | | /* NOLINTNEXTLINE(build/include) */ |
105 | | #include "block_splitter_inc.h" |
106 | | #undef DataType |
107 | | #undef FN |
108 | | |
109 | 0 | void BrotliInitBlockSplit(BlockSplit* self) { |
110 | 0 | self->num_types = 0; |
111 | 0 | self->num_blocks = 0; |
112 | 0 | self->types = 0; |
113 | 0 | self->lengths = 0; |
114 | 0 | self->types_alloc_size = 0; |
115 | 0 | self->lengths_alloc_size = 0; |
116 | 0 | } |
117 | | |
118 | 0 | void BrotliDestroyBlockSplit(MemoryManager* m, BlockSplit* self) { |
119 | 0 | BROTLI_FREE(m, self->types); |
120 | 0 | BROTLI_FREE(m, self->lengths); |
121 | 0 | } |
122 | | |
123 | | /* Extracts literals, command distance and prefix codes, then applies |
124 | | * SplitByteVector to create partitioning. */ |
125 | | void BrotliSplitBlock(MemoryManager* m, |
126 | | const Command* cmds, |
127 | | const size_t num_commands, |
128 | | const uint8_t* data, |
129 | | const size_t pos, |
130 | | const size_t mask, |
131 | | const BrotliEncoderParams* params, |
132 | | BlockSplit* literal_split, |
133 | | BlockSplit* insert_and_copy_split, |
134 | 0 | BlockSplit* dist_split) { |
135 | 0 | { |
136 | 0 | size_t literals_count = CountLiterals(cmds, num_commands); |
137 | 0 | uint8_t* literals = BROTLI_ALLOC(m, uint8_t, literals_count); |
138 | 0 | if (BROTLI_IS_OOM(m) || BROTLI_IS_NULL(literals)) return; |
139 | | /* Create a continuous array of literals. */ |
140 | 0 | CopyLiteralsToByteArray(cmds, num_commands, data, pos, mask, literals); |
141 | | /* Create the block split on the array of literals. |
142 | | * Literal histograms can have alphabet size up to 256. |
143 | | * Though, to accomodate context modeling, less than half of maximum size |
144 | | * is allowed. */ |
145 | 0 | SplitByteVectorLiteral( |
146 | 0 | m, literals, literals_count, |
147 | 0 | kSymbolsPerLiteralHistogram, kMaxLiteralHistograms, |
148 | 0 | kLiteralStrideLength, kLiteralBlockSwitchCost, params, |
149 | 0 | literal_split); |
150 | 0 | if (BROTLI_IS_OOM(m)) return; |
151 | 0 | BROTLI_FREE(m, literals); |
152 | | /* NB: this might be a good place for injecting extra splitting without |
153 | | * increasing encoder complexity; however, output parition would be less |
154 | | * optimal than one produced with forced splitting inside |
155 | | * SplitByteVector (FindBlocks / ClusterBlocks). */ |
156 | 0 | } |
157 | | |
158 | 0 | { |
159 | | /* Compute prefix codes for commands. */ |
160 | 0 | uint16_t* insert_and_copy_codes = BROTLI_ALLOC(m, uint16_t, num_commands); |
161 | 0 | size_t i; |
162 | 0 | if (BROTLI_IS_OOM(m) || BROTLI_IS_NULL(insert_and_copy_codes)) return; |
163 | 0 | for (i = 0; i < num_commands; ++i) { |
164 | 0 | insert_and_copy_codes[i] = cmds[i].cmd_prefix_; |
165 | 0 | } |
166 | | /* Create the block split on the array of command prefixes. */ |
167 | 0 | SplitByteVectorCommand( |
168 | 0 | m, insert_and_copy_codes, num_commands, |
169 | 0 | kSymbolsPerCommandHistogram, kMaxCommandHistograms, |
170 | 0 | kCommandStrideLength, kCommandBlockSwitchCost, params, |
171 | 0 | insert_and_copy_split); |
172 | 0 | if (BROTLI_IS_OOM(m)) return; |
173 | | /* TODO(eustas): reuse for distances? */ |
174 | 0 | BROTLI_FREE(m, insert_and_copy_codes); |
175 | 0 | } |
176 | | |
177 | 0 | { |
178 | | /* Create a continuous array of distance prefixes. */ |
179 | 0 | uint16_t* distance_prefixes = BROTLI_ALLOC(m, uint16_t, num_commands); |
180 | 0 | size_t j = 0; |
181 | 0 | size_t i; |
182 | 0 | if (BROTLI_IS_OOM(m) || BROTLI_IS_NULL(distance_prefixes)) return; |
183 | 0 | for (i = 0; i < num_commands; ++i) { |
184 | 0 | const Command* cmd = &cmds[i]; |
185 | 0 | if (CommandCopyLen(cmd) && cmd->cmd_prefix_ >= 128) { |
186 | 0 | distance_prefixes[j++] = cmd->dist_prefix_ & 0x3FF; |
187 | 0 | } |
188 | 0 | } |
189 | | /* Create the block split on the array of distance prefixes. */ |
190 | 0 | SplitByteVectorDistance( |
191 | 0 | m, distance_prefixes, j, |
192 | 0 | kSymbolsPerDistanceHistogram, kMaxCommandHistograms, |
193 | 0 | kDistanceStrideLength, kDistanceBlockSwitchCost, params, |
194 | 0 | dist_split); |
195 | 0 | if (BROTLI_IS_OOM(m)) return; |
196 | 0 | BROTLI_FREE(m, distance_prefixes); |
197 | 0 | } |
198 | 0 | } |
199 | | |
200 | | #if defined(BROTLI_TEST) |
201 | | size_t CountLiteralsForTest(const Command*, const size_t); |
202 | | size_t CountLiteralsForTest(const Command* cmds, const size_t num_commands) { |
203 | | return CountLiterals(cmds, num_commands); |
204 | | } |
205 | | |
206 | | void CopyLiteralsToByteArrayForTest(const Command*, |
207 | | const size_t, const uint8_t*, const size_t, const size_t, uint8_t*); |
208 | | void CopyLiteralsToByteArrayForTest(const Command* cmds, |
209 | | const size_t num_commands, const uint8_t* data, const size_t offset, |
210 | | const size_t mask, uint8_t* literals) { |
211 | | CopyLiteralsToByteArray(cmds, num_commands, data, offset, mask, literals); |
212 | | } |
213 | | #endif |
214 | | |
215 | | #if defined(__cplusplus) || defined(c_plusplus) |
216 | | } /* extern "C" */ |
217 | | #endif |