/src/c-blosc2/internal-complibs/zlib-ng-2.0.7/match_tpl.h
Line | Count | Source (jump to first uncovered line) |
1 | | |
2 | | #include "zbuild.h" |
3 | | #include "deflate.h" |
4 | | #include "functable.h" |
5 | | |
6 | | #ifndef MATCH_TPL_H |
7 | | #define MATCH_TPL_H |
8 | | |
9 | | #ifdef UNALIGNED_OK |
10 | | # ifdef UNALIGNED64_OK |
11 | | typedef uint64_t bestcmp_t; |
12 | | # else |
13 | | typedef uint32_t bestcmp_t; |
14 | | # endif |
15 | | #else |
16 | | typedef uint8_t bestcmp_t; |
17 | | #endif |
18 | | |
19 | 3.13M | #define EARLY_EXIT_TRIGGER_LEVEL 5 |
20 | | |
21 | | #endif |
22 | | |
23 | | /* Set match_start to the longest match starting at the given string and |
24 | | * return its length. Matches shorter or equal to prev_length are discarded, |
25 | | * in which case the result is equal to prev_length and match_start is garbage. |
26 | | * |
27 | | * IN assertions: cur_match is the head of the hash chain for the current |
28 | | * string (strstart) and its distance is <= MAX_DIST, and prev_length >=1 |
29 | | * OUT assertion: the match length is not greater than s->lookahead |
30 | | */ |
31 | 3.13M | Z_INTERNAL uint32_t LONGEST_MATCH(deflate_state *const s, Pos cur_match) { |
32 | 3.13M | unsigned int strstart = s->strstart; |
33 | 3.13M | const unsigned wmask = s->w_mask; |
34 | 3.13M | unsigned char *window = s->window; |
35 | 3.13M | unsigned char *scan = window + strstart; |
36 | 3.13M | Z_REGISTER unsigned char *mbase_start = window; |
37 | 3.13M | Z_REGISTER unsigned char *mbase_end; |
38 | 3.13M | const Pos *prev = s->prev; |
39 | 3.13M | Pos limit; |
40 | 3.13M | int32_t early_exit; |
41 | 3.13M | uint32_t chain_length, nice_match, best_len, offset; |
42 | 3.13M | uint32_t lookahead = s->lookahead; |
43 | 3.13M | bestcmp_t scan_end; |
44 | 3.13M | #ifndef UNALIGNED_OK |
45 | 3.13M | bestcmp_t scan_end0; |
46 | | #else |
47 | | bestcmp_t scan_start; |
48 | | #endif |
49 | | |
50 | 3.13M | #define GOTO_NEXT_CHAIN \ |
51 | 54.4M | if (--chain_length && (cur_match = prev[cur_match & wmask]) > limit) \ |
52 | 51.6M | continue; \ |
53 | 2.79M | return best_len; |
54 | | |
55 | | /* The code is optimized for MAX_MATCH-2 multiple of 16. */ |
56 | 3.13M | Assert(MAX_MATCH == 258, "Code too clever"); |
57 | | |
58 | 3.13M | best_len = s->prev_length ? s->prev_length : 1; |
59 | | |
60 | | /* Calculate read offset which should only extend an extra byte |
61 | | * to find the next best match length. |
62 | | */ |
63 | 3.13M | offset = best_len-1; |
64 | | #ifdef UNALIGNED_OK |
65 | | if (best_len >= sizeof(uint32_t)) { |
66 | | offset -= 2; |
67 | | #ifdef UNALIGNED64_OK |
68 | | if (best_len >= sizeof(uint64_t)) |
69 | | offset -= 4; |
70 | | #endif |
71 | | } |
72 | | #endif |
73 | | |
74 | 3.13M | scan_end = *(bestcmp_t *)(scan+offset); |
75 | 3.13M | #ifndef UNALIGNED_OK |
76 | 3.13M | scan_end0 = *(bestcmp_t *)(scan+offset+1); |
77 | | #else |
78 | | scan_start = *(bestcmp_t *)(scan); |
79 | | #endif |
80 | 3.13M | mbase_end = (mbase_start+offset); |
81 | | |
82 | | /* Do not waste too much time if we already have a good match */ |
83 | 3.13M | chain_length = s->max_chain_length; |
84 | 3.13M | early_exit = s->level < EARLY_EXIT_TRIGGER_LEVEL; |
85 | 3.13M | if (best_len >= s->good_match) |
86 | 36.4k | chain_length >>= 2; |
87 | 3.13M | nice_match = (uint32_t)s->nice_match; |
88 | | |
89 | | /* Stop when cur_match becomes <= limit. To simplify the code, |
90 | | * we prevent matches with the string of window index 0 |
91 | | */ |
92 | 3.13M | limit = strstart > MAX_DIST(s) ? (Pos)(strstart - MAX_DIST(s)) : 0; |
93 | | |
94 | 3.13M | Assert((unsigned long)strstart <= s->window_size - MIN_LOOKAHEAD, "need lookahead"); |
95 | 9.33M | for (;;) { |
96 | 9.33M | if (cur_match >= strstart) |
97 | 0 | break; |
98 | | |
99 | | /* Skip to next match if the match length cannot increase or if the match length is |
100 | | * less than 2. Note that the checks below for insufficient lookahead only occur |
101 | | * occasionally for performance reasons. |
102 | | * Therefore uninitialized memory will be accessed and conditional jumps will be made |
103 | | * that depend on those values. However the length of the match is limited to the |
104 | | * lookahead, so the output of deflate is not affected by the uninitialized values. |
105 | | */ |
106 | | #ifdef UNALIGNED_OK |
107 | | if (best_len < sizeof(uint32_t)) { |
108 | | for (;;) { |
109 | | if (*(uint16_t *)(mbase_end+cur_match) == (uint16_t)scan_end && |
110 | | *(uint16_t *)(mbase_start+cur_match) == (uint16_t)scan_start) |
111 | | break; |
112 | | GOTO_NEXT_CHAIN; |
113 | | } |
114 | | # ifdef UNALIGNED64_OK |
115 | | } else if (best_len >= sizeof(uint64_t)) { |
116 | | for (;;) { |
117 | | if (*(uint64_t *)(mbase_end+cur_match) == (uint64_t)scan_end && |
118 | | *(uint64_t *)(mbase_start+cur_match) == (uint64_t)scan_start) |
119 | | break; |
120 | | GOTO_NEXT_CHAIN; |
121 | | } |
122 | | # endif |
123 | | } else { |
124 | | for (;;) { |
125 | | if (*(uint32_t *)(mbase_end+cur_match) == (uint32_t)scan_end && |
126 | | *(uint32_t *)(mbase_start+cur_match) == (uint32_t)scan_start) |
127 | | break; |
128 | | GOTO_NEXT_CHAIN; |
129 | | } |
130 | | } |
131 | | #else |
132 | 54.7M | for (;;) { |
133 | 54.7M | if (mbase_end[cur_match] == scan_end && mbase_end[cur_match+1] == scan_end0 && |
134 | 54.7M | mbase_start[cur_match] == scan[0] && mbase_start[cur_match+1] == scan[1]) |
135 | 7.05M | break; |
136 | 47.7M | GOTO_NEXT_CHAIN; |
137 | 47.7M | } |
138 | 7.05M | #endif |
139 | 7.05M | uint32_t len = COMPARE256(scan+2, mbase_start+cur_match+2) + 2; |
140 | 7.05M | Assert(scan+len <= window+(unsigned)(s->window_size-1), "wild scan"); |
141 | | |
142 | 7.05M | if (len > best_len) { |
143 | 3.07M | s->match_start = cur_match; |
144 | | /* Do not look for matches beyond the end of the input. */ |
145 | 3.07M | if (len > lookahead) |
146 | 2.31k | return lookahead; |
147 | 3.06M | best_len = len; |
148 | 3.06M | if (best_len >= nice_match) |
149 | 294k | return best_len; |
150 | | |
151 | 2.77M | offset = best_len-1; |
152 | | #ifdef UNALIGNED_OK |
153 | | if (best_len >= sizeof(uint32_t)) { |
154 | | offset -= 2; |
155 | | #ifdef UNALIGNED64_OK |
156 | | if (best_len >= sizeof(uint64_t)) |
157 | | offset -= 4; |
158 | | #endif |
159 | | } |
160 | | #endif |
161 | 2.77M | scan_end = *(bestcmp_t *)(scan+offset); |
162 | 2.77M | #ifndef UNALIGNED_OK |
163 | 2.77M | scan_end0 = *(bestcmp_t *)(scan+offset+1); |
164 | 2.77M | #endif |
165 | 2.77M | mbase_end = (mbase_start+offset); |
166 | 3.97M | } else if (UNLIKELY(early_exit)) { |
167 | | /* The probability of finding a match later if we here is pretty low, so for |
168 | | * performance it's best to outright stop here for the lower compression levels |
169 | | */ |
170 | 41.2k | break; |
171 | 41.2k | } |
172 | 6.71M | GOTO_NEXT_CHAIN; |
173 | 6.71M | } |
174 | | |
175 | 41.2k | return best_len; |
176 | 3.13M | } |
177 | | |
178 | | #undef LONGEST_MATCH |
179 | | #undef COMPARE256 |
180 | | #undef COMPARE258 |