/src/zlib-ng/deflate_slow.c
Line | Count | Source |
1 | | /* deflate_slow.c -- compress data using the slow strategy of deflation algorithm |
2 | | * |
3 | | * Copyright (C) 1995-2024 Jean-loup Gailly and Mark Adler |
4 | | * For conditions of distribution and use, see copyright notice in zlib.h |
5 | | */ |
6 | | |
7 | | #include "zbuild.h" |
8 | | #include "deflate.h" |
9 | | #include "deflate_p.h" |
10 | | #include "functable.h" |
11 | | |
12 | | /* =========================================================================== |
13 | | * Same as deflate_medium, but achieves better compression. We use a lazy |
14 | | * evaluation for matches: a match is finally adopted only if there is |
15 | | * no better match at the next window position. Returns need_more when the lookahead is still short under Z_NO_FLUSH or when avail_out reaches 0 after a literal, finish_done after the Z_FINISH flush, and block_done otherwise. |
16 | | * NOTE(review): FLUSH_BLOCK and FLUSH_BLOCK_ONLY are macros defined outside this listing; FLUSH_BLOCK presumably can also return from this function early -- confirm against its definition. */ |
17 | 14.9k | Z_INTERNAL block_state deflate_slow(deflate_state *s, int flush) { |
18 | 14.9k | Pos hash_head; /* head of hash chain */ |
19 | 14.9k | int bflush; /* set if current block must be flushed */ |
20 | 14.9k | int64_t dist; /* strstart - hash_head, computed in signed 64-bit */ |
21 | 14.9k | uint32_t match_len; /* match length at the current position; STD_MIN_MATCH - 1 when there is none */ |
22 | 14.9k | match_func longest_match; /* match finder, selected once below and used for the whole call */ |
23 | | |
24 | 14.9k | if (s->max_chain_length <= 1024) /* chain length of 1024 or less uses longest_match, anything longer uses longest_match_slow */ |
25 | 6.34k | longest_match = FUNCTABLE_FPTR(longest_match); |
26 | 8.65k | else |
27 | 8.65k | longest_match = FUNCTABLE_FPTR(longest_match_slow); |
28 | | |
29 | | /* Process the input block. */ |
30 | 149M | for (;;) { |
31 | | /* Make sure that we always have enough lookahead, except |
32 | | * at the end of the input file. We need STD_MAX_MATCH bytes |
33 | | * for the next match, plus WANT_MIN_MATCH bytes to insert the |
34 | | * string following the next match. |
35 | | */ |
36 | 149M | if (s->lookahead < MIN_LOOKAHEAD) { |
37 | 540k | PREFIX(fill_window)(s); |
38 | 540k | if (UNLIKELY(s->lookahead < MIN_LOOKAHEAD && flush == Z_NO_FLUSH)) { |
39 | 3.07k | return need_more; |
40 | 3.07k | } |
41 | 537k | if (UNLIKELY(s->lookahead == 0)) |
42 | 11.7k | break; /* flush the current block */ |
43 | 537k | } |
44 | | |
45 | | /* Insert the string window[strstart .. strstart+2] in the |
46 | | * dictionary, and set hash_head to the head of the hash chain: |
47 | | */ |
48 | 149M | hash_head = 0; /* stays 0 when lookahead < WANT_MIN_MATCH; 0 is rejected by the hash_head != 0 test below */ |
49 | 149M | if (LIKELY(s->lookahead >= WANT_MIN_MATCH)) { |
50 | 149M | hash_head = s->quick_insert_string(s, s->strstart); |
51 | 149M | } |
52 | | |
53 | | /* Find the longest match, discarding those <= prev_length. |
54 | | */ |
55 | 149M | s->prev_match = (Pos)s->match_start; /* save the match start of the previous step before longest_match() overwrites match_start */ |
56 | 149M | match_len = STD_MIN_MATCH - 1; /* default: too short to be emitted as a match */ |
57 | 149M | dist = (int64_t)s->strstart - hash_head; |
58 | | |
59 | 149M | if (dist <= MAX_DIST(s) && dist > 0 && s->prev_length < s->max_lazy_match && hash_head != 0) { /* search only a candidate at distance 1..MAX_DIST(s), and only while the pending match is shorter than max_lazy_match */ |
60 | | /* To simplify the code, we prevent matches with the string |
61 | | * of window index 0 (in particular we have to avoid a match |
62 | | * of the string with itself at the start of the input file). |
63 | | */ |
64 | 63.7M | match_len = longest_match(s, hash_head); |
65 | | /* longest_match() sets match_start */ |
66 | | |
67 | 63.7M | if (match_len <= 5 && (s->strategy == Z_FILTERED)) { /* under Z_FILTERED, matches of length 5 or less are dropped */ |
68 | | /* If prev_match is also WANT_MIN_MATCH, match_start is garbage |
69 | | * but we will ignore the current match anyway. |
70 | | */ |
71 | 3.91M | match_len = STD_MIN_MATCH - 1; |
72 | 3.91M | } |
73 | 63.7M | } |
74 | | /* If there was a match at the previous step and the current |
75 | | * match is not better, output the previous match: |
76 | | */ |
77 | 149M | if (s->prev_length >= STD_MIN_MATCH && match_len <= s->prev_length) { |
78 | 11.3M | unsigned int max_insert = s->strstart + s->lookahead - STD_MIN_MATCH; |
79 | | /* Do not insert strings in hash table beyond this. */ |
80 | | |
81 | 11.3M | Assert((s->strstart-1) <= UINT16_MAX, "strstart-1 should fit in uint16_t"); |
82 | 11.3M | check_match(s, (Pos)(s->strstart - 1), s->prev_match, s->prev_length); |
83 | | |
84 | 11.3M | bflush = zng_tr_tally_dist(s, s->strstart -1 - s->prev_match, s->prev_length - STD_MIN_MATCH); /* emit the pending match, which starts at strstart-1 */ |
85 | | |
86 | | /* Insert in hash table all strings up to the end of the match. |
87 | | * strstart-1 and strstart are already inserted. If there is not |
88 | | * enough lookahead, the last two strings are not inserted in |
89 | | * the hash table. |
90 | | */ |
91 | 11.3M | s->prev_length -= 1; /* the first byte of the match (at strstart-1) was already consumed from lookahead on the previous step */ |
92 | 11.3M | s->lookahead -= s->prev_length; |
93 | | |
94 | 11.3M | unsigned int mov_fwd = s->prev_length - 1; /* original match length minus 2, since prev_length was decremented above */ |
95 | 11.3M | if (max_insert > s->strstart) { |
96 | 11.3M | unsigned int insert_cnt = mov_fwd; |
97 | 11.3M | if (UNLIKELY(insert_cnt > max_insert - s->strstart)) /* clamp the count to max_insert - strstart */ |
98 | 6.33k | insert_cnt = max_insert - s->strstart; |
99 | 11.3M | s->insert_string(s, s->strstart + 1, insert_cnt); |
100 | 11.3M | } |
101 | 11.3M | s->prev_length = 0; |
102 | 11.3M | s->match_available = 0; |
103 | 11.3M | s->strstart += mov_fwd + 1; /* advance to the first byte after the emitted match */ |
104 | | |
105 | 11.3M | if (UNLIKELY(bflush)) |
106 | 11.3M | FLUSH_BLOCK(s, 0); |
107 | | |
108 | 138M | } else if (s->match_available) { |
109 | | /* If there was no match at the previous position, output a |
110 | | * single literal. If there was a match but the current match |
111 | | * is longer, truncate the previous match to a single literal. |
112 | | */ |
113 | 127M | bflush = zng_tr_tally_lit(s, s->window[s->strstart-1]); /* the byte at strstart-1 goes out as a literal */ |
114 | 127M | if (UNLIKELY(bflush)) |
115 | 12.1k | FLUSH_BLOCK_ONLY(s, 0); |
116 | 127M | s->prev_length = match_len; /* the current match length becomes the pending one for the next step */ |
117 | 127M | s->strstart++; |
118 | 127M | s->lookahead--; |
119 | 127M | if (UNLIKELY(s->strm->avail_out == 0)) /* avail_out is 0: hand control back to the caller */ |
120 | 159 | return need_more; |
121 | 127M | } else { |
122 | | /* There is no previous match to compare with, wait for |
123 | | * the next step to decide. |
124 | | */ |
125 | 11.3M | s->prev_length = match_len; |
126 | 11.3M | s->match_available = 1; /* the byte just stepped over is now pending; the next iteration emits it as a literal or as the start of a match */ |
127 | 11.3M | s->strstart++; |
128 | 11.3M | s->lookahead--; |
129 | 11.3M | } |
130 | 149M | } |
131 | 11.7k | Assert(flush != Z_NO_FLUSH, "no flush?"); |
132 | 11.7k | if (UNLIKELY(s->match_available)) { /* a byte is still pending from the last iteration: emit it as a literal */ |
133 | 5.56k | Z_UNUSED(zng_tr_tally_lit(s, s->window[s->strstart-1])); |
134 | 5.56k | s->match_available = 0; |
135 | 5.56k | } |
136 | 11.7k | s->insert = s->strstart < (STD_MIN_MATCH - 1) ? s->strstart : (STD_MIN_MATCH - 1); /* min(strstart, STD_MIN_MATCH - 1) */ |
137 | 11.7k | if (UNLIKELY(flush == Z_FINISH)) { |
138 | 10.4k | FLUSH_BLOCK(s, 1); |
139 | 10.3k | return finish_done; |
140 | 10.4k | } |
141 | 1.30k | if (UNLIKELY(s->sym_next)) /* flush only when sym_next is non-zero */ |
142 | 1.30k | FLUSH_BLOCK(s, 0); |
143 | 1.30k | return block_done; |
144 | 1.30k | } |