/src/php-src/Zend/Optimizer/block_pass.c
Line | Count | Source |
1 | | /* |
2 | | +----------------------------------------------------------------------+ |
3 | | | Zend OPcache | |
4 | | +----------------------------------------------------------------------+ |
5 | | | Copyright © The PHP Group and Contributors. | |
6 | | +----------------------------------------------------------------------+ |
7 | | | This source file is subject to the Modified BSD License that is | |
8 | | | bundled with this package in the file LICENSE, and is available | |
9 | | | through the World Wide Web at <https://www.php.net/license/>. | |
10 | | | | |
11 | | | SPDX-License-Identifier: BSD-3-Clause | |
12 | | +----------------------------------------------------------------------+ |
13 | | | Authors: Andi Gutmans <andi@php.net> | |
14 | | | Zeev Suraski <zeev@php.net> | |
15 | | | Stanislav Malyshev <stas@zend.com> | |
16 | | | Dmitry Stogov <dmitry@php.net> | |
17 | | +----------------------------------------------------------------------+ |
18 | | */ |
19 | | |
20 | | #include "Optimizer/zend_optimizer.h" |
21 | | #include "Optimizer/zend_optimizer_internal.h" |
22 | | #include "zend_API.h" |
23 | | #include "zend_constants.h" |
24 | | #include "zend_execute.h" |
25 | | #include "zend_vm.h" |
26 | | #include "zend_bitset.h" |
27 | | #include "zend_cfg.h" |
28 | | #include "zend_dump.h" |
29 | | |
30 | | /* Checks if a constant (like "true") may be replaced by its value */ |
31 | | bool zend_optimizer_get_persistent_constant(zend_string *name, zval *result, bool copy) |
32 | 23.6k | { |
33 | 23.6k | const zend_constant *c = zend_hash_find_ptr(EG(zend_constants), name); |
34 | 23.6k | if (c) { |
35 | 42 | if ((ZEND_CONSTANT_FLAGS(c) & CONST_PERSISTENT) |
36 | 42 | && !(ZEND_CONSTANT_FLAGS(c) & CONST_DEPRECATED) |
37 | 0 | && (!(ZEND_CONSTANT_FLAGS(c) & CONST_NO_FILE_CACHE) |
38 | 0 | || !(CG(compiler_options) & ZEND_COMPILE_WITH_FILE_CACHE))) { |
39 | 0 | ZVAL_COPY_VALUE(result, &c->value); |
40 | 0 | if (copy) { |
41 | 0 | Z_TRY_ADDREF_P(result); |
42 | 0 | } |
43 | 0 | return true; |
44 | 42 | } else { |
45 | 42 | return false; |
46 | 42 | } |
47 | 42 | } |
48 | | |
49 | | /* Special constants null/true/false can always be substituted. */ |
50 | 23.6k | c = zend_get_special_const(ZSTR_VAL(name), ZSTR_LEN(name)); |
51 | 23.6k | if (c) { |
52 | 0 | ZVAL_COPY_VALUE(result, &c->value); |
53 | 0 | return true; |
54 | 0 | } |
55 | 23.6k | return false; |
56 | 23.6k | } |
57 | | |
58 | | /* Data dependencies macros */ |
59 | | |
/*
 * Both macros index the `Tsource` array that must be in scope at the point of
 * use, using VAR_NUM() of a variable operand as the slot number.
 *
 * VAR_SOURCE(op)       - lvalue for the slot selected by operand `op`.
 * SET_VAR_SOURCE(opline) - stores `opline` in the slot selected by its own
 *                        result operand.
 *
 * Parameters and the full expansions are parenthesized so that arguments which
 * are not primary expressions (e.g. `p + 1`) expand correctly.
 */
#define VAR_SOURCE(op) (Tsource[VAR_NUM((op).var)])
#define SET_VAR_SOURCE(opline) (Tsource[VAR_NUM((opline)->result.var)] = (opline))
62 | | |
63 | | static void strip_leading_nops(const zend_op_array *op_array, zend_basic_block *b) |
64 | 9.50k | { |
65 | 9.50k | const zend_op *opcodes = op_array->opcodes; |
66 | | |
67 | 11.7k | do { |
68 | 11.7k | b->start++; |
69 | 11.7k | b->len--; |
70 | 11.7k | } while (b->len > 0 && opcodes[b->start].opcode == ZEND_NOP); |
71 | 9.50k | } |
72 | | |
73 | | static void strip_nops(const zend_op_array *op_array, zend_basic_block *b) |
74 | 503k | { |
75 | 503k | uint32_t i, j; |
76 | | |
77 | 503k | if (b->len == 0) { |
78 | 1.05k | return; |
79 | 1.05k | } |
80 | | |
81 | 502k | if (op_array->opcodes[b->start].opcode == ZEND_NOP) { |
82 | 3.92k | strip_leading_nops(op_array, b); |
83 | 3.92k | } |
84 | | |
85 | 502k | if (b->len == 0) { |
86 | 316 | return; |
87 | 316 | } |
88 | | |
89 | | /* strip the inside NOPs */ |
90 | 502k | i = j = b->start + 1; |
91 | 3.10M | while (i < b->start + b->len) { |
92 | 2.60M | if (op_array->opcodes[i].opcode != ZEND_NOP) { |
93 | 2.57M | if (i != j) { |
94 | 65.9k | op_array->opcodes[j] = op_array->opcodes[i]; |
95 | 65.9k | } |
96 | 2.57M | j++; |
97 | 2.57M | } |
98 | 2.60M | i++; |
99 | 2.60M | } |
100 | 502k | b->len = j - b->start; |
101 | 529k | while (j < i) { |
102 | 27.1k | MAKE_NOP(op_array->opcodes + j); |
103 | 27.1k | j++; |
104 | 27.1k | } |
105 | 502k | } |
106 | | |
107 | 72 | static uint32_t get_const_switch_target(const zend_cfg *cfg, const zend_op_array *op_array, const zend_basic_block *block, zend_op *opline, const zval *val) { |
108 | 72 | HashTable *jumptable = Z_ARRVAL(ZEND_OP2_LITERAL(opline)); |
109 | 72 | zval *zv; |
110 | 72 | if ((opline->opcode == ZEND_SWITCH_LONG && Z_TYPE_P(val) != IS_LONG) |
111 | 72 | || (opline->opcode == ZEND_SWITCH_STRING && Z_TYPE_P(val) != IS_STRING)) { |
112 | | /* fallback to next block */ |
113 | 0 | return block->successors[block->successors_count - 1]; |
114 | 0 | } |
115 | 72 | if (opline->opcode == ZEND_MATCH && Z_TYPE_P(val) != IS_LONG && Z_TYPE_P(val) != IS_STRING) { |
116 | | /* always jump to the default arm */ |
117 | 16 | return block->successors[block->successors_count - 1]; |
118 | 16 | } |
119 | 56 | if (Z_TYPE_P(val) == IS_LONG) { |
120 | 28 | zv = zend_hash_index_find(jumptable, Z_LVAL_P(val)); |
121 | 28 | } else { |
122 | 28 | ZEND_ASSERT(Z_TYPE_P(val) == IS_STRING); |
123 | 28 | zv = zend_hash_find(jumptable, Z_STR_P(val)); |
124 | 28 | } |
125 | 56 | if (!zv) { |
126 | | /* default */ |
127 | 32 | return block->successors[block->successors_count - (opline->opcode == ZEND_MATCH ? 1 : 2)]; |
128 | 32 | } |
129 | 24 | return cfg->map[ZEND_OFFSET_TO_OPLINE_NUM(op_array, opline, Z_LVAL_P(zv))]; |
130 | 56 | } |
131 | | |
132 | | static void zend_optimize_block(zend_basic_block *block, zend_op_array *op_array, zend_bitset used_ext, zend_cfg *cfg, zend_op **Tsource, uint32_t *opt_count) |
133 | 503k | { |
134 | 503k | zend_op *opline, *src; |
135 | 503k | zend_op *end, *last_op = NULL; |
136 | | |
137 | 503k | if (block->len == 0) { |
138 | 260 | return; |
139 | 260 | } |
140 | | |
141 | 503k | if (op_array->opcodes[block->start].opcode == ZEND_NOP) { |
142 | | /* remove leading NOPs */ |
143 | 5.58k | strip_leading_nops(op_array, block); |
144 | 5.58k | } |
145 | | |
146 | 503k | opline = op_array->opcodes + block->start; |
147 | 503k | end = opline + block->len; |
148 | 3.61M | while (opline < end) { |
149 | | /* Constant Propagation: strip X = QM_ASSIGN(const) */ |
150 | 3.11M | if (opline->op1_type == IS_TMP_VAR && |
151 | 865k | opline->opcode != ZEND_FREE) { |
152 | 829k | src = VAR_SOURCE(opline->op1); |
153 | 829k | if (src && |
154 | 738k | src->opcode == ZEND_QM_ASSIGN && |
155 | 3.04k | src->op1_type == IS_CONST |
156 | 829k | ) { |
157 | 1.91k | znode_op op1 = opline->op1; |
158 | 1.91k | if (opline->opcode == ZEND_VERIFY_RETURN_TYPE) { |
159 | 2 | COPY_NODE(opline->result, opline->op1); |
160 | 2 | COPY_NODE(opline->op1, src->op1); |
161 | 2 | VAR_SOURCE(op1) = NULL; |
162 | 2 | MAKE_NOP(src); |
163 | 2 | ++(*opt_count); |
164 | 1.90k | } else { |
165 | 1.90k | zval c; |
166 | 1.90k | ZVAL_COPY(&c, &ZEND_OP1_LITERAL(src)); |
167 | 1.90k | if (opline->opcode != ZEND_CASE |
168 | 1.90k | && opline->opcode != ZEND_CASE_STRICT |
169 | 1.88k | && opline->opcode != ZEND_FETCH_LIST_R |
170 | 1.86k | && opline->opcode != ZEND_SWITCH_LONG |
171 | 1.86k | && opline->opcode != ZEND_SWITCH_STRING |
172 | 1.86k | && opline->opcode != ZEND_MATCH |
173 | 1.85k | && opline->opcode != ZEND_MATCH_ERROR |
174 | 1.85k | && zend_optimizer_update_op1_const(op_array, opline, &c)) { |
175 | 1.81k | VAR_SOURCE(op1) = NULL; |
176 | 1.81k | if (opline->opcode != ZEND_JMP_NULL |
177 | 1.80k | && !zend_bitset_in(used_ext, VAR_NUM(src->result.var)) |
178 | | /* FETCH_W with ZEND_FETCH_GLOBAL_LOCK does not free op1, which will be used again. */ |
179 | 1.28k | && !(opline->opcode == ZEND_FETCH_W && (opline->extended_value & ZEND_FETCH_GLOBAL_LOCK))) { |
180 | 1.28k | literal_dtor(&ZEND_OP1_LITERAL(src)); |
181 | 1.28k | MAKE_NOP(src); |
182 | 1.28k | } |
183 | 1.81k | ++(*opt_count); |
184 | 1.81k | } else { |
185 | 98 | zval_ptr_dtor_nogc(&c); |
186 | 98 | } |
187 | 1.90k | } |
188 | 1.91k | } |
189 | 829k | } |
190 | | |
191 | | /* Constant Propagation: strip X = QM_ASSIGN(const) */ |
192 | 3.11M | if (opline->op2_type == IS_TMP_VAR) { |
193 | 480k | src = VAR_SOURCE(opline->op2); |
194 | 480k | if (src && |
195 | 447k | src->opcode == ZEND_QM_ASSIGN && |
196 | 696 | src->op1_type == IS_CONST) { |
197 | | |
198 | 220 | znode_op op2 = opline->op2; |
199 | 220 | zval c; |
200 | | |
201 | 220 | ZVAL_COPY(&c, &ZEND_OP1_LITERAL(src)); |
202 | 220 | if (zend_optimizer_update_op2_const(op_array, opline, &c)) { |
203 | 210 | VAR_SOURCE(op2) = NULL; |
204 | 210 | if (!zend_bitset_in(used_ext, VAR_NUM(src->result.var))) { |
205 | 210 | literal_dtor(&ZEND_OP1_LITERAL(src)); |
206 | 210 | MAKE_NOP(src); |
207 | 210 | } |
208 | 210 | ++(*opt_count); |
209 | 210 | } else { |
210 | 10 | zval_ptr_dtor_nogc(&c); |
211 | 10 | } |
212 | 220 | } |
213 | 480k | } |
214 | | |
215 | 3.11M | switch (opline->opcode) { |
216 | 157k | case ZEND_ECHO: |
217 | 157k | if (opline->op1_type & (IS_TMP_VAR|IS_VAR)) { |
218 | 38.6k | src = VAR_SOURCE(opline->op1); |
219 | 38.6k | if (src && |
220 | 35.4k | src->opcode == ZEND_CAST && |
221 | 138 | src->extended_value == IS_STRING) { |
222 | | /* T = CAST(X, String), ECHO(T) => NOP, ECHO(X) */ |
223 | 82 | VAR_SOURCE(opline->op1) = NULL; |
224 | 82 | COPY_NODE(opline->op1, src->op1); |
225 | 82 | MAKE_NOP(src); |
226 | 82 | ++(*opt_count); |
227 | 82 | } |
228 | 119k | } else if (opline->op1_type == IS_CONST && |
229 | 117k | Z_TYPE(ZEND_OP1_LITERAL(opline)) != IS_DOUBLE) { |
230 | 117k | if (last_op == opline - 1) { |
231 | | /* compress consecutive ECHO's. |
232 | | * Float to string conversion may be affected by current |
233 | | * locale setting. |
234 | | */ |
235 | 5.05k | size_t l, old_len; |
236 | | |
237 | 5.05k | if (Z_TYPE(ZEND_OP1_LITERAL(opline)) != IS_STRING) { |
238 | 57 | convert_to_string(&ZEND_OP1_LITERAL(opline)); |
239 | 57 | } |
240 | 5.05k | if (Z_TYPE(ZEND_OP1_LITERAL(last_op)) != IS_STRING) { |
241 | 22 | convert_to_string(&ZEND_OP1_LITERAL(last_op)); |
242 | 22 | } |
243 | 5.05k | old_len = Z_STRLEN(ZEND_OP1_LITERAL(last_op)); |
244 | 5.05k | l = old_len + Z_STRLEN(ZEND_OP1_LITERAL(opline)); |
245 | 5.05k | if (!Z_REFCOUNTED(ZEND_OP1_LITERAL(last_op))) { |
246 | 1.72k | zend_string *tmp = zend_string_alloc(l, 0); |
247 | 1.72k | memcpy(ZSTR_VAL(tmp), Z_STRVAL(ZEND_OP1_LITERAL(last_op)), old_len); |
248 | 1.72k | Z_STR(ZEND_OP1_LITERAL(last_op)) = tmp; |
249 | 3.33k | } else { |
250 | 3.33k | Z_STR(ZEND_OP1_LITERAL(last_op)) = zend_string_extend(Z_STR(ZEND_OP1_LITERAL(last_op)), l, 0); |
251 | 3.33k | } |
252 | 5.05k | Z_TYPE_INFO(ZEND_OP1_LITERAL(last_op)) = IS_STRING_EX; |
253 | 5.05k | memcpy(Z_STRVAL(ZEND_OP1_LITERAL(last_op)) + old_len, Z_STRVAL(ZEND_OP1_LITERAL(opline)), Z_STRLEN(ZEND_OP1_LITERAL(opline))); |
254 | 5.05k | Z_STRVAL(ZEND_OP1_LITERAL(last_op))[l] = '\0'; |
255 | 5.05k | zval_ptr_dtor_nogc(&ZEND_OP1_LITERAL(opline)); |
256 | 5.05k | ZVAL_STR(&ZEND_OP1_LITERAL(opline), zend_new_interned_string(Z_STR(ZEND_OP1_LITERAL(last_op)))); |
257 | 5.05k | ZVAL_NULL(&ZEND_OP1_LITERAL(last_op)); |
258 | 5.05k | MAKE_NOP(last_op); |
259 | 5.05k | ++(*opt_count); |
260 | 5.05k | } |
261 | 117k | last_op = opline; |
262 | 117k | } |
263 | 157k | break; |
264 | | |
265 | 572 | case ZEND_MATCH_ERROR: |
266 | 572 | if (opline->op1_type & (IS_TMP_VAR|IS_VAR)) { |
267 | 182 | src = VAR_SOURCE(opline->op1); |
268 | 182 | VAR_SOURCE(opline->op1) = NULL; |
269 | 182 | } |
270 | 572 | break; |
271 | | |
272 | 35.6k | case ZEND_FREE: |
273 | | /* Note: Only remove the source if the source is local to this block. |
274 | | * If it's not local, then the other blocks successors must also eventually either FREE or consume the temporary, |
275 | | * hence removing the temporary is not safe in the general case, especially when other consumers are not FREE. |
276 | | * A FREE may not be removed without also removing the source's result, because otherwise that would cause a memory leak. */ |
277 | 35.6k | if (opline->extended_value == ZEND_FREE_VOID_CAST) { |
278 | | /* Keep the ZEND_FREE opcode alive. */ |
279 | 35.6k | } else if (opline->op1_type == IS_TMP_VAR) { |
280 | 35.2k | src = VAR_SOURCE(opline->op1); |
281 | 35.2k | if (src) { |
282 | 29.6k | switch (src->opcode) { |
283 | 31 | case ZEND_BOOL: |
284 | 262 | case ZEND_BOOL_NOT: |
285 | | /* T = BOOL(X), FREE(T) => T = BOOL(X) */ |
286 | | /* The remaining BOOL is removed by a separate optimization */ |
287 | | /* The source is a bool, no source removals take place, so this may be done non-locally. */ |
288 | 262 | VAR_SOURCE(opline->op1) = NULL; |
289 | 262 | MAKE_NOP(opline); |
290 | 262 | ++(*opt_count); |
291 | 262 | break; |
292 | 232 | case ZEND_QM_ASSIGN: |
293 | 232 | if (src < op_array->opcodes + block->start) { |
294 | 20 | break; |
295 | 20 | } |
296 | 212 | src->result_type = IS_UNUSED; |
297 | 212 | VAR_SOURCE(opline->op1) = NULL; |
298 | 212 | MAKE_NOP(opline); |
299 | 212 | ++(*opt_count); |
300 | 212 | if (src->op1_type & (IS_VAR|IS_TMP_VAR)) { |
301 | 86 | src->opcode = ZEND_FREE; |
302 | 126 | } else if (src->op1_type == IS_CONST) { |
303 | 118 | MAKE_NOP(src); |
304 | 118 | } else if (src->op1_type == IS_CV) { |
305 | 8 | src->opcode = ZEND_CHECK_VAR; |
306 | 8 | SET_UNUSED(src->result); |
307 | 8 | } |
308 | 212 | break; |
309 | 29.1k | default: |
310 | 29.1k | if (!zend_op_may_elide_result(src->opcode)) { |
311 | 26.5k | break; |
312 | 26.5k | } |
313 | 2.62k | if (src < op_array->opcodes + block->start) { |
314 | 4 | break; |
315 | 4 | } |
316 | 2.61k | src->result_type = IS_UNUSED; |
317 | 2.61k | VAR_SOURCE(opline->op1) = NULL; |
318 | 2.61k | MAKE_NOP(opline); |
319 | 2.61k | ++(*opt_count); |
320 | 2.61k | break; |
321 | 29.6k | } |
322 | 29.6k | } |
323 | 35.2k | } else if (opline->op1_type == IS_VAR) { |
324 | 302 | src = VAR_SOURCE(opline->op1); |
325 | | /* V = OP, FREE(V) => OP. NOP */ |
326 | 302 | if (src >= op_array->opcodes + block->start && |
327 | 12 | src->opcode != ZEND_FETCH_R && |
328 | 8 | src->opcode != ZEND_FETCH_STATIC_PROP_R && |
329 | 8 | src->opcode != ZEND_FETCH_DIM_R && |
330 | 8 | src->opcode != ZEND_FETCH_OBJ_R && |
331 | 4 | src->opcode != ZEND_NEW && |
332 | 4 | src->opcode != ZEND_FETCH_THIS) { |
333 | 4 | src->result_type = IS_UNUSED; |
334 | 4 | MAKE_NOP(opline); |
335 | 4 | ++(*opt_count); |
336 | 4 | if (src->opcode == ZEND_QM_ASSIGN) { |
337 | 0 | if (src->op1_type & (IS_VAR|IS_TMP_VAR)) { |
338 | 0 | src->opcode = ZEND_FREE; |
339 | 0 | } else { |
340 | 0 | MAKE_NOP(src); |
341 | 0 | } |
342 | 0 | } |
343 | 4 | } |
344 | 302 | } |
345 | 35.6k | break; |
346 | | |
347 | 35.6k | case ZEND_FETCH_LIST_R: |
348 | 2.10k | case ZEND_FETCH_LIST_W: |
349 | 2.10k | if (opline->op1_type & (IS_TMP_VAR|IS_VAR)) { |
350 | | /* LIST variable will be deleted later by FREE */ |
351 | 1.79k | Tsource[VAR_NUM(opline->op1.var)] = NULL; |
352 | 1.79k | } |
353 | 2.10k | break; |
354 | | |
355 | 10 | case ZEND_SWITCH_LONG: |
356 | 89 | case ZEND_SWITCH_STRING: |
357 | 377 | case ZEND_MATCH: |
358 | 377 | if (opline->op1_type & (IS_TMP_VAR|IS_VAR)) { |
359 | | /* SWITCH variable will be deleted later by FREE, so we can't optimize it */ |
360 | 109 | Tsource[VAR_NUM(opline->op1.var)] = NULL; |
361 | 109 | break; |
362 | 109 | } |
363 | 268 | if (opline->op1_type == IS_CONST) { |
364 | 72 | uint32_t target = get_const_switch_target(cfg, op_array, block, opline, &ZEND_OP1_LITERAL(opline)); |
365 | 72 | literal_dtor(&ZEND_OP1_LITERAL(opline)); |
366 | 72 | literal_dtor(&ZEND_OP2_LITERAL(opline)); |
367 | 72 | opline->opcode = ZEND_JMP; |
368 | 72 | opline->op1_type = IS_UNUSED; |
369 | 72 | opline->op2_type = IS_UNUSED; |
370 | 72 | block->successors_count = 1; |
371 | 72 | block->successors[0] = target; |
372 | 72 | } |
373 | 268 | break; |
374 | | |
375 | 0 | case ZEND_EXT_STMT: |
376 | 0 | if (opline->op1_type & (IS_TMP_VAR|IS_VAR)) { |
377 | | /* Variable will be deleted later by FREE, so we can't optimize it */ |
378 | 0 | Tsource[VAR_NUM(opline->op1.var)] = NULL; |
379 | 0 | break; |
380 | 0 | } |
381 | 0 | break; |
382 | | |
383 | 284 | case ZEND_CASE: |
384 | 626 | case ZEND_CASE_STRICT: |
385 | 4.19k | case ZEND_COPY_TMP: |
386 | 4.19k | if (opline->op1_type & (IS_TMP_VAR|IS_VAR)) { |
387 | | /* Variable will be deleted later by FREE, so we can't optimize it */ |
388 | 4.19k | Tsource[VAR_NUM(opline->op1.var)] = NULL; |
389 | 4.19k | break; |
390 | 4.19k | } |
391 | 0 | if (opline->op1_type == IS_CONST && |
392 | 0 | opline->op2_type == IS_CONST) { |
393 | 0 | goto optimize_constant_binary_op; |
394 | 0 | } |
395 | | /* |
396 | | * CASE(TRUE, X) => BOOL(X) |
397 | | * CASE(FALSE, X) => BOOL_NOT(X) |
398 | | */ |
399 | 0 | if (opline->op1_type == IS_CONST && |
400 | 0 | (Z_TYPE(ZEND_OP1_LITERAL(opline)) == IS_FALSE || |
401 | 0 | Z_TYPE(ZEND_OP1_LITERAL(opline)) == IS_TRUE)) { |
402 | | /* Optimization of comparison with "null" is not safe, |
403 | | * because ("0" == null) is not equal to !("0") |
404 | | */ |
405 | 0 | opline->opcode = |
406 | 0 | ((opline->opcode != ZEND_IS_NOT_EQUAL) == ((Z_TYPE(ZEND_OP1_LITERAL(opline))) == IS_TRUE)) ? |
407 | 0 | ZEND_BOOL : ZEND_BOOL_NOT; |
408 | 0 | COPY_NODE(opline->op1, opline->op2); |
409 | 0 | SET_UNUSED(opline->op2); |
410 | 0 | ++(*opt_count); |
411 | 0 | goto optimize_bool; |
412 | 0 | } else if (opline->op2_type == IS_CONST && |
413 | 0 | (Z_TYPE(ZEND_OP2_LITERAL(opline)) == IS_FALSE || |
414 | 0 | Z_TYPE(ZEND_OP2_LITERAL(opline)) == IS_TRUE)) { |
415 | | /* Optimization of comparison with "null" is not safe, |
416 | | * because ("0" == null) is not equal to !("0") |
417 | | */ |
418 | 0 | opline->opcode = |
419 | 0 | ((opline->opcode != ZEND_IS_NOT_EQUAL) == ((Z_TYPE(ZEND_OP2_LITERAL(opline))) == IS_TRUE)) ? |
420 | 0 | ZEND_BOOL : ZEND_BOOL_NOT; |
421 | 0 | SET_UNUSED(opline->op2); |
422 | 0 | ++(*opt_count); |
423 | 0 | goto optimize_bool; |
424 | 0 | } |
425 | 0 | break; |
426 | | |
427 | 22.5k | case ZEND_IS_EQUAL: |
428 | 26.6k | case ZEND_IS_NOT_EQUAL: |
429 | 26.6k | if (opline->op1_type == IS_CONST && |
430 | 0 | opline->op2_type == IS_CONST) { |
431 | 0 | goto optimize_constant_binary_op; |
432 | 0 | } |
433 | | /* IS_EQ(TRUE, X) => BOOL(X) |
434 | | * IS_EQ(FALSE, X) => BOOL_NOT(X) |
435 | | * IS_NOT_EQ(TRUE, X) => BOOL_NOT(X) |
436 | | * IS_NOT_EQ(FALSE, X) => BOOL(X) |
437 | | * Those optimizations are not safe if the other operand ends up being NAN |
438 | | * as BOOL/BOOL_NOT will warn, while IS_EQUAL/IS_NOT_EQUAL do not. |
439 | | */ |
440 | 26.6k | break; |
441 | 26.6k | case ZEND_IS_IDENTICAL: |
442 | 3.01k | if (opline->op1_type == IS_CONST && |
443 | 0 | opline->op2_type == IS_CONST) { |
444 | 0 | goto optimize_constant_binary_op; |
445 | 0 | } |
446 | | |
447 | 3.01k | if (opline->op1_type == IS_CONST && |
448 | 0 | (Z_TYPE(ZEND_OP1_LITERAL(opline)) <= IS_TRUE && Z_TYPE(ZEND_OP1_LITERAL(opline)) >= IS_NULL)) { |
449 | | /* IS_IDENTICAL(TRUE, T) => TYPE_CHECK(T, TRUE) |
450 | | * IS_IDENTICAL(FALSE, T) => TYPE_CHECK(T, FALSE) |
451 | | * IS_IDENTICAL(NULL, T) => TYPE_CHECK(T, NULL) |
452 | | */ |
453 | 0 | opline->opcode = ZEND_TYPE_CHECK; |
454 | 0 | opline->extended_value = (1 << Z_TYPE(ZEND_OP1_LITERAL(opline))); |
455 | 0 | COPY_NODE(opline->op1, opline->op2); |
456 | 0 | SET_UNUSED(opline->op2); |
457 | 0 | ++(*opt_count); |
458 | 0 | goto optimize_type_check; |
459 | 3.01k | } else if (opline->op2_type == IS_CONST && |
460 | 2.08k | (Z_TYPE(ZEND_OP2_LITERAL(opline)) <= IS_TRUE && Z_TYPE(ZEND_OP2_LITERAL(opline)) >= IS_NULL)) { |
461 | | /* IS_IDENTICAL(T, TRUE) => TYPE_CHECK(T, TRUE) |
462 | | * IS_IDENTICAL(T, FALSE) => TYPE_CHECK(T, FALSE) |
463 | | * IS_IDENTICAL(T, NULL) => TYPE_CHECK(T, NULL) |
464 | | */ |
465 | 138 | opline->opcode = ZEND_TYPE_CHECK; |
466 | 138 | opline->extended_value = (1 << Z_TYPE(ZEND_OP2_LITERAL(opline))); |
467 | 138 | SET_UNUSED(opline->op2); |
468 | 138 | ++(*opt_count); |
469 | 138 | goto optimize_type_check; |
470 | 138 | } |
471 | 2.87k | break; |
472 | 2.87k | case ZEND_TYPE_CHECK: |
473 | 1.71k | optimize_type_check: |
474 | 1.71k | if (opline->extended_value == (1 << IS_TRUE) || opline->extended_value == (1 << IS_FALSE)) { |
475 | 212 | if (opline->op1_type == IS_TMP_VAR && |
476 | 180 | !zend_bitset_in(used_ext, VAR_NUM(opline->op1.var))) { |
477 | 180 | src = VAR_SOURCE(opline->op1); |
478 | | |
479 | 180 | if (src) { |
480 | 180 | switch (src->opcode) { |
481 | 0 | case ZEND_BOOL: |
482 | 0 | case ZEND_BOOL_NOT: |
483 | | /* T = BOOL(X) + TYPE_CHECK(T, TRUE) -> BOOL(X), NOP |
484 | | * T = BOOL(X) + TYPE_CHECK(T, FALSE) -> BOOL_NOT(X), NOP |
485 | | * T = BOOL_NOT(X) + TYPE_CHECK(T, TRUE) -> BOOL_NOT(X), NOP |
486 | | * T = BOOL_NOT(X) + TYPE_CHECK(T, FALSE) -> BOOL(X), NOP |
487 | | */ |
488 | 0 | src->opcode = |
489 | 0 | ((src->opcode == ZEND_BOOL) == (opline->extended_value == (1 << IS_TRUE))) ? |
490 | 0 | ZEND_BOOL : ZEND_BOOL_NOT; |
491 | 0 | COPY_NODE(src->result, opline->result); |
492 | 0 | SET_VAR_SOURCE(src); |
493 | 0 | MAKE_NOP(opline); |
494 | 0 | ++(*opt_count); |
495 | 0 | break; |
496 | 180 | } |
497 | 180 | } |
498 | 180 | } |
499 | 212 | } |
500 | 1.71k | break; |
501 | | |
502 | 5.68k | case ZEND_BOOL: |
503 | 13.6k | case ZEND_BOOL_NOT: |
504 | 16.8k | optimize_bool: |
505 | 16.8k | if (opline->op1_type == IS_CONST) { |
506 | 1.65k | goto optimize_const_unary_op; |
507 | 1.65k | } |
508 | 15.1k | if (opline->op1_type == IS_TMP_VAR && |
509 | 12.9k | !zend_bitset_in(used_ext, VAR_NUM(opline->op1.var))) { |
510 | 12.3k | src = VAR_SOURCE(opline->op1); |
511 | 12.3k | if (src) { |
512 | 12.3k | switch (src->opcode) { |
513 | 1.77k | case ZEND_BOOL_NOT: |
514 | | /* T = BOOL_NOT(X) + BOOL(T) -> NOP, BOOL_NOT(X) */ |
515 | 1.77k | VAR_SOURCE(opline->op1) = NULL; |
516 | 1.77k | COPY_NODE(opline->op1, src->op1); |
517 | 1.77k | opline->opcode = (opline->opcode == ZEND_BOOL) ? ZEND_BOOL_NOT : ZEND_BOOL; |
518 | 1.77k | MAKE_NOP(src); |
519 | 1.77k | ++(*opt_count); |
520 | 1.77k | goto optimize_bool; |
521 | 1.34k | case ZEND_BOOL: |
522 | | /* T = BOOL(X) + BOOL(T) -> NOP, BOOL(X) */ |
523 | 1.34k | VAR_SOURCE(opline->op1) = NULL; |
524 | 1.34k | COPY_NODE(opline->op1, src->op1); |
525 | 1.34k | MAKE_NOP(src); |
526 | 1.34k | ++(*opt_count); |
527 | 1.34k | goto optimize_bool; |
528 | 237 | case ZEND_IS_EQUAL: |
529 | 237 | if (opline->opcode == ZEND_BOOL_NOT) { |
530 | 0 | src->opcode = ZEND_IS_NOT_EQUAL; |
531 | 0 | } |
532 | 237 | COPY_NODE(src->result, opline->result); |
533 | 237 | SET_VAR_SOURCE(src); |
534 | 237 | MAKE_NOP(opline); |
535 | 237 | ++(*opt_count); |
536 | 237 | break; |
537 | 180 | case ZEND_IS_NOT_EQUAL: |
538 | 180 | if (opline->opcode == ZEND_BOOL_NOT) { |
539 | 0 | src->opcode = ZEND_IS_EQUAL; |
540 | 0 | } |
541 | 180 | COPY_NODE(src->result, opline->result); |
542 | 180 | SET_VAR_SOURCE(src); |
543 | 180 | MAKE_NOP(opline); |
544 | 180 | ++(*opt_count); |
545 | 180 | break; |
546 | 225 | case ZEND_IS_IDENTICAL: |
547 | 225 | if (opline->opcode == ZEND_BOOL_NOT) { |
548 | 0 | src->opcode = ZEND_IS_NOT_IDENTICAL; |
549 | 0 | } |
550 | 225 | COPY_NODE(src->result, opline->result); |
551 | 225 | SET_VAR_SOURCE(src); |
552 | 225 | MAKE_NOP(opline); |
553 | 225 | ++(*opt_count); |
554 | 225 | break; |
555 | 126 | case ZEND_IS_NOT_IDENTICAL: |
556 | 126 | if (opline->opcode == ZEND_BOOL_NOT) { |
557 | 0 | src->opcode = ZEND_IS_IDENTICAL; |
558 | 0 | } |
559 | 126 | COPY_NODE(src->result, opline->result); |
560 | 126 | SET_VAR_SOURCE(src); |
561 | 126 | MAKE_NOP(opline); |
562 | 126 | ++(*opt_count); |
563 | 126 | break; |
564 | 156 | case ZEND_IS_SMALLER: |
565 | 156 | if (opline->opcode == ZEND_BOOL_NOT) { |
566 | 0 | uint8_t tmp_type; |
567 | 0 | uint32_t tmp; |
568 | |
|
569 | 0 | src->opcode = ZEND_IS_SMALLER_OR_EQUAL; |
570 | 0 | tmp_type = src->op1_type; |
571 | 0 | src->op1_type = src->op2_type; |
572 | 0 | src->op2_type = tmp_type; |
573 | 0 | tmp = src->op1.num; |
574 | 0 | src->op1.num = src->op2.num; |
575 | 0 | src->op2.num = tmp; |
576 | 0 | } |
577 | 156 | COPY_NODE(src->result, opline->result); |
578 | 156 | SET_VAR_SOURCE(src); |
579 | 156 | MAKE_NOP(opline); |
580 | 156 | ++(*opt_count); |
581 | 156 | break; |
582 | 436 | case ZEND_IS_SMALLER_OR_EQUAL: |
583 | 436 | if (opline->opcode == ZEND_BOOL_NOT) { |
584 | 0 | uint8_t tmp_type; |
585 | 0 | uint32_t tmp; |
586 | |
|
587 | 0 | src->opcode = ZEND_IS_SMALLER; |
588 | 0 | tmp_type = src->op1_type; |
589 | 0 | src->op1_type = src->op2_type; |
590 | 0 | src->op2_type = tmp_type; |
591 | 0 | tmp = src->op1.num; |
592 | 0 | src->op1.num = src->op2.num; |
593 | 0 | src->op2.num = tmp; |
594 | 0 | } |
595 | 436 | COPY_NODE(src->result, opline->result); |
596 | 436 | SET_VAR_SOURCE(src); |
597 | 436 | MAKE_NOP(opline); |
598 | 436 | ++(*opt_count); |
599 | 436 | break; |
600 | 6 | case ZEND_ISSET_ISEMPTY_CV: |
601 | 16 | case ZEND_ISSET_ISEMPTY_VAR: |
602 | 327 | case ZEND_ISSET_ISEMPTY_DIM_OBJ: |
603 | 375 | case ZEND_ISSET_ISEMPTY_PROP_OBJ: |
604 | 397 | case ZEND_ISSET_ISEMPTY_STATIC_PROP: |
605 | 448 | case ZEND_INSTANCEOF: |
606 | 662 | case ZEND_TYPE_CHECK: |
607 | 676 | case ZEND_DEFINED: |
608 | 676 | case ZEND_IN_ARRAY: |
609 | 716 | case ZEND_ARRAY_KEY_EXISTS: |
610 | 716 | if (opline->opcode == ZEND_BOOL_NOT) { |
611 | 465 | break; |
612 | 465 | } |
613 | 251 | COPY_NODE(src->result, opline->result); |
614 | 251 | SET_VAR_SOURCE(src); |
615 | 251 | MAKE_NOP(opline); |
616 | 251 | ++(*opt_count); |
617 | 251 | break; |
618 | 12.3k | } |
619 | 12.3k | } |
620 | 12.3k | } |
621 | 12.0k | break; |
622 | | |
623 | 29.7k | case ZEND_JMPZ: |
624 | 42.9k | case ZEND_JMPNZ: |
625 | 44.7k | while (1) { |
626 | 44.7k | if (opline->op1_type == IS_CONST) { |
627 | 617 | ++(*opt_count); |
628 | 617 | block->successors_count = 1; |
629 | 617 | if (zend_is_true(&ZEND_OP1_LITERAL(opline)) == |
630 | 617 | (opline->opcode == ZEND_JMPZ)) { |
631 | | |
632 | 248 | MAKE_NOP(opline); |
633 | 248 | block->successors[0] = block->successors[1]; |
634 | 248 | block->len--; |
635 | 248 | cfg->blocks[block->successors[0]].flags |= ZEND_BB_FOLLOW; |
636 | 248 | break; |
637 | 369 | } else { |
638 | 369 | zend_basic_block *next = cfg->blocks + block->successors[1]; |
639 | | |
640 | 369 | next->flags &= ~ZEND_BB_FOLLOW; |
641 | 369 | if (!(next->flags & (ZEND_BB_TARGET|ZEND_BB_PROTECTED))) { |
642 | 303 | next->flags &= ~ZEND_BB_REACHABLE; |
643 | 303 | } |
644 | 369 | opline->opcode = ZEND_JMP; |
645 | 369 | COPY_NODE(opline->op1, opline->op2); |
646 | 369 | break; |
647 | 369 | } |
648 | 44.1k | } else if (opline->op1_type == IS_TMP_VAR && |
649 | 41.8k | !zend_bitset_in(used_ext, VAR_NUM(opline->op1.var))) { |
650 | 41.3k | src = VAR_SOURCE(opline->op1); |
651 | 41.3k | if (src) { |
652 | 41.3k | if (src->opcode == ZEND_BOOL_NOT) { |
653 | 1.05k | VAR_SOURCE(opline->op1) = NULL; |
654 | 1.05k | COPY_NODE(opline->op1, src->op1); |
655 | | /* T = BOOL_NOT(X) + JMPZ(T) -> NOP, JMPNZ(X) */ |
656 | 1.05k | opline->opcode = INV_COND(opline->opcode); |
657 | 1.05k | MAKE_NOP(src); |
658 | 1.05k | ++(*opt_count); |
659 | 1.05k | continue; |
660 | 40.3k | } else if (src->opcode == ZEND_BOOL || |
661 | 39.5k | src->opcode == ZEND_QM_ASSIGN) { |
662 | 747 | VAR_SOURCE(opline->op1) = NULL; |
663 | 747 | COPY_NODE(opline->op1, src->op1); |
664 | 747 | MAKE_NOP(src); |
665 | 747 | ++(*opt_count); |
666 | 747 | continue; |
667 | 747 | } |
668 | 41.3k | } |
669 | 41.3k | } |
670 | 42.3k | break; |
671 | 44.7k | } |
672 | 42.9k | break; |
673 | | |
674 | 1.72k | case ZEND_JMPZ_EX: |
675 | 3.73k | case ZEND_JMPNZ_EX: |
676 | 4.12k | while (1) { |
677 | 4.12k | if (opline->op1_type == IS_CONST) { |
678 | 792 | bool is_jmpz_ex = opline->opcode == ZEND_JMPZ_EX; |
679 | 792 | if (zend_is_true(&ZEND_OP1_LITERAL(opline)) == is_jmpz_ex) { |
680 | | |
681 | 190 | ++(*opt_count); |
682 | 190 | opline->opcode = ZEND_QM_ASSIGN; |
683 | 190 | zval_ptr_dtor_nogc(&ZEND_OP1_LITERAL(opline)); |
684 | 190 | ZVAL_BOOL(&ZEND_OP1_LITERAL(opline), is_jmpz_ex); |
685 | 190 | opline->op2.num = 0; |
686 | 190 | block->successors_count = 1; |
687 | 190 | block->successors[0] = block->successors[1]; |
688 | 190 | cfg->blocks[block->successors[0]].flags |= ZEND_BB_FOLLOW; |
689 | 190 | break; |
690 | 190 | } |
691 | 3.33k | } else if (opline->op1_type == IS_TMP_VAR && |
692 | 3.24k | (!zend_bitset_in(used_ext, VAR_NUM(opline->op1.var)) || |
693 | 2.82k | opline->result.var == opline->op1.var)) { |
694 | 2.82k | src = VAR_SOURCE(opline->op1); |
695 | 2.82k | if (src) { |
696 | 2.44k | if (src->opcode == ZEND_BOOL || |
697 | 2.06k | src->opcode == ZEND_QM_ASSIGN) { |
698 | 385 | VAR_SOURCE(opline->op1) = NULL; |
699 | 385 | COPY_NODE(opline->op1, src->op1); |
700 | 385 | MAKE_NOP(src); |
701 | 385 | ++(*opt_count); |
702 | 385 | continue; |
703 | 385 | } |
704 | 2.44k | } |
705 | 2.82k | } |
706 | 3.54k | break; |
707 | 4.12k | } |
708 | 3.73k | break; |
709 | | |
710 | 61.3k | case ZEND_CONCAT: |
711 | 90.3k | case ZEND_FAST_CONCAT: |
712 | 90.3k | if (opline->op1_type == IS_CONST && |
713 | 23.7k | opline->op2_type == IS_CONST) { |
714 | 12 | goto optimize_constant_binary_op; |
715 | 12 | } |
716 | | |
717 | 90.3k | if (opline->op2_type == IS_CONST && |
718 | 39.4k | opline->op1_type == IS_TMP_VAR) { |
719 | | |
720 | 30.6k | src = VAR_SOURCE(opline->op1); |
721 | 30.6k | if (src && |
722 | 30.5k | (src->opcode == ZEND_CONCAT || |
723 | 26.1k | src->opcode == ZEND_FAST_CONCAT) && |
724 | 23.9k | src->op2_type == IS_CONST) { |
725 | | /* compress consecutive CONCATs */ |
726 | 1.29k | size_t l, old_len; |
727 | | |
728 | 1.29k | if (Z_TYPE(ZEND_OP2_LITERAL(opline)) != IS_STRING) { |
729 | 0 | convert_to_string(&ZEND_OP2_LITERAL(opline)); |
730 | 0 | } |
731 | 1.29k | if (Z_TYPE(ZEND_OP2_LITERAL(src)) != IS_STRING) { |
732 | 0 | convert_to_string(&ZEND_OP2_LITERAL(src)); |
733 | 0 | } |
734 | | |
735 | 1.29k | VAR_SOURCE(opline->op1) = NULL; |
736 | 1.29k | COPY_NODE(opline->op1, src->op1); |
737 | 1.29k | old_len = Z_STRLEN(ZEND_OP2_LITERAL(src)); |
738 | 1.29k | l = old_len + Z_STRLEN(ZEND_OP2_LITERAL(opline)); |
739 | 1.29k | if (!Z_REFCOUNTED(ZEND_OP2_LITERAL(src))) { |
740 | 556 | zend_string *tmp = zend_string_alloc(l, 0); |
741 | 556 | memcpy(ZSTR_VAL(tmp), Z_STRVAL(ZEND_OP2_LITERAL(src)), old_len); |
742 | 556 | Z_STR(ZEND_OP2_LITERAL(src)) = tmp; |
743 | 737 | } else { |
744 | 737 | Z_STR(ZEND_OP2_LITERAL(src)) = zend_string_extend(Z_STR(ZEND_OP2_LITERAL(src)), l, 0); |
745 | 737 | } |
746 | 1.29k | Z_TYPE_INFO(ZEND_OP2_LITERAL(src)) = IS_STRING_EX; |
747 | 1.29k | memcpy(Z_STRVAL(ZEND_OP2_LITERAL(src)) + old_len, Z_STRVAL(ZEND_OP2_LITERAL(opline)), Z_STRLEN(ZEND_OP2_LITERAL(opline))); |
748 | 1.29k | Z_STRVAL(ZEND_OP2_LITERAL(src))[l] = '\0'; |
749 | 1.29k | zval_ptr_dtor_str(&ZEND_OP2_LITERAL(opline)); |
750 | 1.29k | ZVAL_STR(&ZEND_OP2_LITERAL(opline), zend_new_interned_string(Z_STR(ZEND_OP2_LITERAL(src)))); |
751 | 1.29k | ZVAL_NULL(&ZEND_OP2_LITERAL(src)); |
752 | 1.29k | MAKE_NOP(src); |
753 | 1.29k | ++(*opt_count); |
754 | 1.29k | } |
755 | 30.6k | } |
756 | | |
757 | 90.3k | if (opline->op1_type & (IS_TMP_VAR|IS_VAR)) { |
758 | 37.3k | src = VAR_SOURCE(opline->op1); |
759 | 37.3k | if (src && |
760 | 36.9k | src->opcode == ZEND_CAST && |
761 | 151 | src->extended_value == IS_STRING && |
762 | 19 | src->op1_type != IS_CONST) { |
763 | | /* convert T1 = CAST(STRING, X), T2 = CONCAT(T1, Y) to T2 = CONCAT(X,Y) */ |
764 | 10 | VAR_SOURCE(opline->op1) = NULL; |
765 | 10 | COPY_NODE(opline->op1, src->op1); |
766 | 10 | MAKE_NOP(src); |
767 | 10 | ++(*opt_count); |
768 | 10 | } |
769 | 37.3k | } |
770 | 90.3k | if (opline->op2_type & (IS_TMP_VAR|IS_VAR)) { |
771 | 47.6k | src = VAR_SOURCE(opline->op2); |
772 | 47.6k | if (src && |
773 | 47.4k | src->opcode == ZEND_CAST && |
774 | 211 | src->extended_value == IS_STRING && |
775 | 99 | src->op1_type != IS_CONST) { |
776 | | /* convert T1 = CAST(STRING, X), T2 = CONCAT(Y, T1) to T2 = CONCAT(Y,X) */ |
777 | 61 | VAR_SOURCE(opline->op2) = NULL; |
778 | 61 | COPY_NODE(opline->op2, src->op1); |
779 | 61 | MAKE_NOP(src); |
780 | 61 | ++(*opt_count); |
781 | 61 | } |
782 | 47.6k | } |
783 | 90.3k | if (opline->op1_type == IS_CONST && |
784 | 23.7k | Z_TYPE(ZEND_OP1_LITERAL(opline)) == IS_STRING && |
785 | 23.7k | Z_STRLEN(ZEND_OP1_LITERAL(opline)) == 0) { |
786 | | /* convert CONCAT('', X) => CAST(STRING, X) */ |
787 | 12 | literal_dtor(&ZEND_OP1_LITERAL(opline)); |
788 | 12 | opline->opcode = ZEND_CAST; |
789 | 12 | opline->extended_value = IS_STRING; |
790 | 12 | COPY_NODE(opline->op1, opline->op2); |
791 | 12 | opline->op2_type = IS_UNUSED; |
792 | 12 | opline->op2.var = 0; |
793 | 12 | ++(*opt_count); |
794 | 90.3k | } else if (opline->op2_type == IS_CONST && |
795 | 39.4k | Z_TYPE(ZEND_OP2_LITERAL(opline)) == IS_STRING && |
796 | 39.4k | Z_STRLEN(ZEND_OP2_LITERAL(opline)) == 0) { |
797 | | /* convert CONCAT(X, '') => CAST(STRING, X) */ |
798 | 116 | literal_dtor(&ZEND_OP2_LITERAL(opline)); |
799 | 116 | opline->opcode = ZEND_CAST; |
800 | 116 | opline->extended_value = IS_STRING; |
801 | 116 | opline->op2_type = IS_UNUSED; |
802 | 116 | opline->op2.var = 0; |
803 | 116 | ++(*opt_count); |
804 | 90.2k | } else if (opline->opcode == ZEND_CONCAT && |
805 | 61.2k | (opline->op1_type == IS_CONST || |
806 | 48.4k | (opline->op1_type == IS_TMP_VAR && |
807 | 27.3k | VAR_SOURCE(opline->op1) && |
808 | 27.0k | (VAR_SOURCE(opline->op1)->opcode == ZEND_FAST_CONCAT || |
809 | 15.9k | VAR_SOURCE(opline->op1)->opcode == ZEND_ROPE_END || |
810 | 15.5k | VAR_SOURCE(opline->op1)->opcode == ZEND_FETCH_CONSTANT || |
811 | 14.2k | VAR_SOURCE(opline->op1)->opcode == ZEND_FETCH_CLASS_CONSTANT))) && |
812 | 25.5k | (opline->op2_type == IS_CONST || |
813 | 15.0k | (opline->op2_type == IS_TMP_VAR && |
814 | 14.6k | VAR_SOURCE(opline->op2) && |
815 | 14.5k | (VAR_SOURCE(opline->op2)->opcode == ZEND_FAST_CONCAT || |
816 | 14.4k | VAR_SOURCE(opline->op2)->opcode == ZEND_ROPE_END || |
817 | 4.66k | VAR_SOURCE(opline->op2)->opcode == ZEND_FETCH_CONSTANT || |
818 | 21.8k | VAR_SOURCE(opline->op2)->opcode == ZEND_FETCH_CLASS_CONSTANT)))) { |
819 | 21.8k | opline->opcode = ZEND_FAST_CONCAT; |
820 | 21.8k | ++(*opt_count); |
821 | 21.8k | } |
822 | 90.3k | break; |
823 | | |
824 | 10.0k | case ZEND_ADD: |
825 | 18.1k | case ZEND_SUB: |
826 | 28.2k | case ZEND_MUL: |
827 | 33.2k | case ZEND_DIV: |
828 | 37.4k | case ZEND_MOD: |
829 | 40.1k | case ZEND_SL: |
830 | 41.9k | case ZEND_SR: |
831 | 53.7k | case ZEND_IS_SMALLER: |
832 | 57.9k | case ZEND_IS_SMALLER_OR_EQUAL: |
833 | 58.8k | case ZEND_IS_NOT_IDENTICAL: |
834 | 60.7k | case ZEND_BOOL_XOR: |
835 | 62.6k | case ZEND_BW_OR: |
836 | 75.6k | case ZEND_BW_AND: |
837 | 85.9k | case ZEND_BW_XOR: |
838 | 85.9k | if (opline->op1_type == IS_CONST && |
839 | 15.9k | opline->op2_type == IS_CONST) { |
840 | | /* evaluate constant expressions */ |
841 | 10.6k | zval result; |
842 | | |
843 | 10.6k | optimize_constant_binary_op: |
844 | 10.6k | if (zend_optimizer_eval_binary_op(&result, opline->opcode, &ZEND_OP1_LITERAL(opline), &ZEND_OP2_LITERAL(opline)) == SUCCESS) { |
845 | 76 | literal_dtor(&ZEND_OP1_LITERAL(opline)); |
846 | 76 | literal_dtor(&ZEND_OP2_LITERAL(opline)); |
847 | 76 | opline->opcode = ZEND_QM_ASSIGN; |
848 | 76 | SET_UNUSED(opline->op2); |
849 | 76 | zend_optimizer_update_op1_const(op_array, opline, &result); |
850 | 76 | ++(*opt_count); |
851 | 76 | } |
852 | 10.6k | } |
853 | 85.9k | break; |
854 | | |
855 | 85.9k | case ZEND_BW_NOT: |
856 | 20.8k | if (opline->op1_type == IS_CONST) { |
857 | | /* evaluate constant unary ops */ |
858 | 119 | zval result; |
859 | | |
860 | 1.77k | optimize_const_unary_op: |
861 | 1.77k | if (zend_optimizer_eval_unary_op(&result, opline->opcode, &ZEND_OP1_LITERAL(opline)) == SUCCESS) { |
862 | 1.60k | literal_dtor(&ZEND_OP1_LITERAL(opline)); |
863 | 1.60k | opline->opcode = ZEND_QM_ASSIGN; |
864 | 1.60k | zend_optimizer_update_op1_const(op_array, opline, &result); |
865 | 1.60k | ++(*opt_count); |
866 | 1.60k | } |
867 | 1.77k | } |
868 | 22.5k | break; |
869 | | |
870 | 22.5k | case ZEND_CAST: |
871 | 3.87k | if (opline->op1_type == IS_CONST) { |
872 | | /* cast of constant operand */ |
873 | 450 | zval result; |
874 | | |
875 | 450 | if (zend_optimizer_eval_cast(&result, opline->extended_value, &ZEND_OP1_LITERAL(opline)) == SUCCESS) { |
876 | 4 | literal_dtor(&ZEND_OP1_LITERAL(opline)); |
877 | 4 | opline->opcode = ZEND_QM_ASSIGN; |
878 | 4 | opline->extended_value = 0; |
879 | 4 | zend_optimizer_update_op1_const(op_array, opline, &result); |
880 | 4 | ++(*opt_count); |
881 | 4 | } |
882 | 450 | } |
883 | 3.87k | break; |
884 | | |
885 | 3.20k | case ZEND_STRLEN: |
886 | 3.20k | if (opline->op1_type == IS_CONST) { |
887 | 20 | zval result; |
888 | | |
889 | 20 | if (zend_optimizer_eval_strlen(&result, &ZEND_OP1_LITERAL(opline)) == SUCCESS) { |
890 | 0 | literal_dtor(&ZEND_OP1_LITERAL(opline)); |
891 | 0 | opline->opcode = ZEND_QM_ASSIGN; |
892 | 0 | zend_optimizer_update_op1_const(op_array, opline, &result); |
893 | 0 | ++(*opt_count); |
894 | 0 | } |
895 | 20 | } |
896 | 3.20k | break; |
897 | | |
898 | 118k | case ZEND_RETURN: |
899 | 118k | if (opline->op1_type == IS_TMP_VAR) { |
900 | 7.53k | src = VAR_SOURCE(opline->op1); |
901 | 7.53k | if (src && src->opcode == ZEND_QM_ASSIGN) { |
902 | 35 | zend_op *op = src + 1; |
903 | 35 | bool optimize = true; |
904 | | |
905 | 35 | while (op < opline) { |
906 | 35 | if ((op->op1_type == opline->op1_type |
907 | 17 | && op->op1.var == opline->op1.var) |
908 | 18 | || (op->op2_type == opline->op1_type |
909 | 35 | && op->op2.var == opline->op1.var)) { |
910 | 35 | optimize = false; |
911 | 35 | break; |
912 | 35 | } |
913 | 0 | op++; |
914 | 0 | } |
915 | | |
916 | 35 | if (optimize) { |
917 | | /* T = QM_ASSIGN(X), RETURN(T) to NOP, RETURN(X) */ |
918 | 0 | VAR_SOURCE(opline->op1) = NULL; |
919 | 0 | COPY_NODE(opline->op1, src->op1); |
920 | 0 | MAKE_NOP(src); |
921 | 0 | ++(*opt_count); |
922 | 0 | } |
923 | 35 | } |
924 | 7.53k | } |
925 | 118k | break; |
926 | | |
927 | 18.9k | case ZEND_QM_ASSIGN: |
928 | 18.9k | if (opline->op1_type == opline->result_type && |
929 | 5.31k | opline->op1.var == opline->result.var) { |
930 | | /* strip T = QM_ASSIGN(T) */ |
931 | 0 | MAKE_NOP(opline); |
932 | 0 | ++(*opt_count); |
933 | 18.9k | } else if (opline->op1_type == IS_TMP_VAR && |
934 | 5.31k | opline->result_type == IS_TMP_VAR && |
935 | 5.31k | !zend_bitset_in(used_ext, VAR_NUM(opline->op1.var))) { |
936 | | /* T1 = ..., T2 = QM_ASSIGN(T1) to T2 = ..., NOP */ |
937 | 3.56k | src = VAR_SOURCE(opline->op1); |
938 | 3.56k | if (src && |
939 | 3.56k | src->opcode != ZEND_COPY_TMP && |
940 | | /* See gh20628_borked_live_range_calc.phpt. */ |
941 | 3.56k | src->opcode != ZEND_NEW && |
942 | 3.52k | src->opcode != ZEND_ADD_ARRAY_ELEMENT && |
943 | 3.52k | src->opcode != ZEND_ADD_ARRAY_UNPACK && |
944 | 3.52k | (src->opcode != ZEND_DECLARE_LAMBDA_FUNCTION || |
945 | 3.52k | src == opline -1)) { |
946 | 3.52k | src->result.var = opline->result.var; |
947 | 3.52k | VAR_SOURCE(opline->op1) = NULL; |
948 | 3.52k | VAR_SOURCE(opline->result) = src; |
949 | 3.52k | MAKE_NOP(opline); |
950 | 3.52k | ++(*opt_count); |
951 | 3.52k | } |
952 | 3.56k | } |
953 | 18.9k | break; |
954 | 3.11M | } |
955 | | |
956 | | /* get variable source */ |
957 | 3.11M | if (opline->result_type & (IS_VAR|IS_TMP_VAR)) { |
958 | 1.41M | SET_VAR_SOURCE(opline); |
959 | 1.41M | } |
960 | 3.11M | opline++; |
961 | 3.11M | } |
962 | 503k | } |
963 | | |
964 | | /* Rebuild plain (optimized) op_array from CFG */ |
/*
 * Replaces op_array->opcodes with a freshly allocated array that contains only
 * the oplines of blocks flagged ZEND_BB_REACHABLE or ZEND_BB_UNREACHABLE_FREE,
 * laid out in CFG block order. Along the way it:
 *   - strips a trailing JMP whose target is the next reachable block,
 *   - destroys the literals of blocks that are dropped,
 *   - rewrites each block's `start` to its offset in the new array,
 *   - re-points jump operands at the new start of the successor blocks,
 *   - compacts op_array->try_catch_array and translates its opline numbers,
 *   - refills cfg->map for the new layout.
 *
 * cfg      - control flow graph; blocks[].start/len and map[] are updated.
 * op_array - op array whose opcodes, last, try_catch_array and last_try_catch
 *            are rewritten.
 * ctx      - not referenced by this function.
 */
965 | | static void assemble_code_blocks(const zend_cfg *cfg, zend_op_array *op_array, zend_optimizer_ctx *ctx) |
966 | 94.6k | { |
967 | 94.6k | zend_basic_block *blocks = cfg->blocks; |
968 | 94.6k | const zend_basic_block *end = blocks + cfg->blocks_count; |
969 | 94.6k | zend_basic_block *b; |
970 | 94.6k | zend_op *new_opcodes; |
971 | 94.6k | zend_op *opline; |
972 | 94.6k | uint32_t len = 0; |
973 | | |
/* Pass 1: trim blocks and sum up the number of oplines that will be kept. */
974 | 481k | for (b = blocks; b < end; b++) { |
975 | 386k | if (b->len == 0) { |
976 | 27.6k | continue; |
977 | 27.6k | } |
978 | 359k | if (b->flags & (ZEND_BB_REACHABLE|ZEND_BB_UNREACHABLE_FREE)) { |
/* opline = last instruction of the block */
979 | 340k | opline = op_array->opcodes + b->start + b->len - 1; |
980 | 340k | if (opline->opcode == ZEND_JMP) { |
981 | 51.8k | const zend_basic_block *next = b + 1; |
982 | | |
/* locate the next block in layout order that is flagged reachable */
983 | 63.1k | while (next < end && !(next->flags & ZEND_BB_REACHABLE)) { |
984 | 11.3k | next++; |
985 | 11.3k | } |
986 | 51.8k | if (next < end && next == blocks + b->successors[0]) { |
987 | | /* JMP to the next block - strip it */ |
988 | 18 | MAKE_NOP(opline); |
989 | 18 | b->len--; |
990 | 18 | } |
991 | 288k | } else if (b->len == 1 && opline->opcode == ZEND_NOP) { |
992 | | /* skip empty block */ |
993 | 0 | b->len--; |
994 | 0 | } |
995 | 340k | len += b->len; |
996 | 340k | } else { |
997 | | /* this block will not be used, delete all constants there */ |
998 | 19.0k | const zend_op *op = op_array->opcodes + b->start; |
999 | 19.0k | const zend_op *last_op = op + b->len; |
1000 | 44.7k | for (; op < last_op; op++) { |
1001 | 25.6k | if (op->op1_type == IS_CONST) { |
1002 | 16.4k | literal_dtor(&ZEND_OP1_LITERAL(op)); |
1003 | 16.4k | } |
1004 | 25.6k | if (op->op2_type == IS_CONST) { |
1005 | 1.36k | literal_dtor(&ZEND_OP2_LITERAL(op)); |
1006 | 1.36k | } |
1007 | 25.6k | } |
1008 | 19.0k | } |
1009 | 359k | } |
1010 | | |
1011 | 94.6k | new_opcodes = emalloc(len * sizeof(zend_op)); |
1012 | 94.6k | opline = new_opcodes; |
1013 | | |
1014 | | /* Copy code of reachable blocks into a single buffer */ |
/* Pass 2: b->start is switched from an offset into the old array to an offset
 * into new_opcodes, so the copy source must be read before it is overwritten. */
1015 | 481k | for (b = blocks; b < end; b++) { |
1016 | 386k | if (b->flags & (ZEND_BB_REACHABLE|ZEND_BB_UNREACHABLE_FREE)) { |
1017 | 340k | memcpy(opline, op_array->opcodes + b->start, b->len * sizeof(zend_op)); |
1018 | 340k | b->start = opline - new_opcodes; |
1019 | 340k | opline += b->len; |
1020 | 340k | } |
1021 | 386k | } |
1022 | | |
1023 | | /* adjust jump targets */ |
/* The old opcode array is released here; from now on op_array refers to the
 * compacted copy. */
1024 | 94.6k | efree(op_array->opcodes); |
1025 | 94.6k | op_array->opcodes = new_opcodes; |
1026 | 94.6k | op_array->last = len; |
1027 | | |
/* Pass 3: for every non-empty reachable block, re-point the jump operand(s) of
 * its last opline at the new start of the corresponding successor block. */
1028 | 481k | for (b = blocks; b < end; b++) { |
1029 | 386k | if (!(b->flags & ZEND_BB_REACHABLE) || b->len == 0) { |
1030 | 46.7k | continue; |
1031 | 46.7k | } |
1032 | 340k | opline = op_array->opcodes + b->start + b->len - 1; |
1033 | 340k | switch (opline->opcode) { |
/* jump address stored in op1 */
1034 | 746 | case ZEND_FAST_CALL: |
1035 | 52.5k | case ZEND_JMP: |
1036 | 52.5k | ZEND_SET_OP_JMP_ADDR(opline, opline->op1, new_opcodes + blocks[b->successors[0]].start); |
1037 | 52.5k | break; |
/* jump address stored in op2 */
1038 | 18.0k | case ZEND_JMPZ: |
1039 | 29.1k | case ZEND_JMPNZ: |
1040 | 30.1k | case ZEND_JMPZ_EX: |
1041 | 31.2k | case ZEND_JMPNZ_EX: |
1042 | 44.0k | case ZEND_FE_RESET_R: |
1043 | 45.0k | case ZEND_FE_RESET_RW: |
1044 | 46.9k | case ZEND_JMP_SET: |
1045 | 50.9k | case ZEND_COALESCE: |
1046 | 52.4k | case ZEND_ASSERT_CHECK: |
1047 | 82.3k | case ZEND_JMP_NULL: |
1048 | 82.5k | case ZEND_BIND_INIT_STATIC_OR_JMP: |
1049 | 82.5k | case ZEND_JMP_FRAMELESS: |
1050 | 82.5k | ZEND_SET_OP_JMP_ADDR(opline, opline->op2, new_opcodes + blocks[b->successors[0]].start); |
1051 | 82.5k | break; |
1052 | 5.40k | case ZEND_CATCH: |
/* only a CATCH without the ZEND_LAST_CATCH flag has its op2 target rewritten */
1053 | 5.40k | if (!(opline->extended_value & ZEND_LAST_CATCH)) { |
1054 | 4.07k | ZEND_SET_OP_JMP_ADDR(opline, opline->op2, new_opcodes + blocks[b->successors[0]].start); |
1055 | 4.07k | } |
1056 | 5.40k | break; |
/* target stored in extended_value as an offset computed by ZEND_OPLINE_TO_OFFSET */
1057 | 12.8k | case ZEND_FE_FETCH_R: |
1058 | 13.7k | case ZEND_FE_FETCH_RW: |
1059 | 13.7k | opline->extended_value = ZEND_OPLINE_TO_OFFSET(opline, new_opcodes + blocks[b->successors[0]].start); |
1060 | 13.7k | break; |
1061 | 10 | case ZEND_SWITCH_LONG: |
1062 | 76 | case ZEND_SWITCH_STRING: |
1063 | 230 | case ZEND_MATCH: |
1064 | 230 | { |
1065 | 230 | const HashTable *jumptable = Z_ARRVAL(ZEND_OP2_LITERAL(opline)); |
1066 | 230 | zval *zv; |
1067 | 230 | uint32_t s = 0; |
1068 | 230 | ZEND_ASSERT(b->successors_count == (opline->opcode == ZEND_MATCH ? 1 : 2) + zend_hash_num_elements(jumptable)); |
1069 | | |
/* Jumptable values are rewritten in iteration order from successors[0..];
 * the successor that follows the table entries supplies extended_value. */
1070 | 2.04k | ZEND_HASH_FOREACH_VAL(jumptable, zv) { |
1071 | 2.04k | Z_LVAL_P(zv) = ZEND_OPLINE_TO_OFFSET(opline, new_opcodes + blocks[b->successors[s++]].start); |
1072 | 2.04k | } ZEND_HASH_FOREACH_END(); |
1073 | 230 | opline->extended_value = ZEND_OPLINE_TO_OFFSET(opline, new_opcodes + blocks[b->successors[s++]].start); |
1074 | 230 | break; |
1075 | 230 | } |
1076 | 340k | } |
1077 | 340k | } |
1078 | | |
1079 | | /* adjust exception jump targets & remove unused try_catch_array entries */ |
1080 | 94.6k | if (op_array->last_try_catch) { |
1081 | 18.9k | uint32_t i, j; |
1082 | 18.9k | uint32_t *map; |
1083 | 18.9k | ALLOCA_FLAG(use_heap); |
1084 | | |
/* map[i] is the new index of old try/catch entry i. Entries whose try_op block
 * is not reachable are dropped, and their map slot is never written. The table
 * is compacted in place: i reads, j writes, and j <= i always holds. */
1085 | 18.9k | map = (uint32_t *)do_alloca(sizeof(uint32_t) * op_array->last_try_catch, use_heap); |
1086 | 44.1k | for (i = 0, j = 0; i< op_array->last_try_catch; i++) { |
1087 | 25.2k | if (blocks[cfg->map[op_array->try_catch_array[i].try_op]].flags & ZEND_BB_REACHABLE) { |
1088 | 25.2k | map[i] = j; |
/* cfg->map still holds the old opline -> block mapping at this point, so it
 * translates the old opline numbers into the blocks' new start offsets */
1089 | 25.2k | op_array->try_catch_array[j].try_op = blocks[cfg->map[op_array->try_catch_array[i].try_op]].start; |
1090 | 25.2k | if (op_array->try_catch_array[i].catch_op) { |
1091 | 24.5k | op_array->try_catch_array[j].catch_op = blocks[cfg->map[op_array->try_catch_array[i].catch_op]].start; |
1092 | 24.5k | } else { |
1093 | 647 | op_array->try_catch_array[j].catch_op = 0; |
1094 | 647 | } |
1095 | 25.2k | if (op_array->try_catch_array[i].finally_op) { |
1096 | 788 | op_array->try_catch_array[j].finally_op = blocks[cfg->map[op_array->try_catch_array[i].finally_op]].start; |
1097 | 24.4k | } else { |
1098 | 24.4k | op_array->try_catch_array[j].finally_op = 0; |
1099 | 24.4k | } |
1100 | 25.2k | if (!op_array->try_catch_array[i].finally_end) { |
1101 | 24.4k | op_array->try_catch_array[j].finally_end = 0; |
1102 | 24.4k | } else { |
1103 | 788 | op_array->try_catch_array[j].finally_end = blocks[cfg->map[op_array->try_catch_array[i].finally_end]].start; |
1104 | 788 | } |
1105 | 25.2k | j++; |
1106 | 25.2k | } |
1107 | 25.2k | } |
/* i != j means at least one entry was dropped */
1108 | 18.9k | if (i != j) { |
1109 | 11 | op_array->last_try_catch = j; |
1110 | 11 | if (j == 0) { |
1111 | 7 | efree(op_array->try_catch_array); |
1112 | 7 | op_array->try_catch_array = NULL; |
1113 | 7 | } |
1114 | | |
/* FAST_RET stores a try/catch index in op2.num; translate it through map[].
 * NOTE(review): op2.num is bounded by j (the number of surviving entries),
 * while map[] is indexed by the pre-compaction index, which can be up to i - 1.
 * Confirm that "< j" rather than "< i" is the intended bound. */
1115 | 11 | if (op_array->fn_flags & ZEND_ACC_HAS_FINALLY_BLOCK) { |
1116 | 0 | zend_op *finally_opline = new_opcodes; |
1117 | 0 | const zend_op *last_finally_op = finally_opline + len; |
1118 | 0 | while (finally_opline < last_finally_op) { |
1119 | 0 | if (finally_opline->opcode == ZEND_FAST_RET && |
1120 | 0 | finally_opline->op2.num != (uint32_t)-1 && |
1121 | 0 | finally_opline->op2.num < j) { |
1122 | 0 | finally_opline->op2.num = map[finally_opline->op2.num]; |
1123 | 0 | } |
1124 | 0 | finally_opline++; |
1125 | 0 | } |
1126 | 0 | } |
1127 | 11 | } |
1128 | 18.9k | free_alloca(map, use_heap); |
1129 | 18.9k | } |
1130 | | |
1131 | | /* rebuild map (just for printing) */ |
/* Every slot up to the new opline count is reset to -1; only the first opline
 * of each kept block is then mapped to its block number. */
1132 | 94.6k | memset(cfg->map, -1, sizeof(int) * op_array->last); |
1133 | 481k | for (uint32_t n = 0; n < cfg->blocks_count; n++) { |
1134 | 386k | if (cfg->blocks[n].flags & (ZEND_BB_REACHABLE|ZEND_BB_UNREACHABLE_FREE)) { |
1135 | 340k | cfg->map[cfg->blocks[n].start] = n; |
1136 | 340k | } |
1137 | 386k | } |
1138 | 94.6k | } |
1139 | | |
1140 | | static zend_always_inline zend_basic_block *get_target_block(const zend_cfg *cfg, const zend_basic_block *block, int n, uint32_t *opt_count) |
1141 | 173k | { |
1142 | 173k | int b; |
1143 | 173k | zend_basic_block *target_block = cfg->blocks + block->successors[n]; |
1144 | | |
1145 | 173k | if (target_block->len == 0 && !(target_block->flags & ZEND_BB_PROTECTED)) { |
1146 | 222 | do { |
1147 | 222 | b = target_block->successors[0]; |
1148 | 222 | target_block = cfg->blocks + b; |
1149 | 222 | } while (target_block->len == 0 && !(target_block->flags & ZEND_BB_PROTECTED)); |
1150 | 154 | block->successors[n] = b; |
1151 | 154 | ++(*opt_count); |
1152 | 154 | } |
1153 | 173k | return target_block; |
1154 | 173k | } |
1155 | | |
1156 | | static zend_always_inline zend_basic_block *get_follow_block(const zend_cfg *cfg, const zend_basic_block *block, int n, uint32_t *opt_count) |
1157 | 45.8k | { |
1158 | 45.8k | int b; |
1159 | 45.8k | zend_basic_block *target_block = cfg->blocks + block->successors[n]; |
1160 | | |
1161 | 45.8k | if (target_block->len == 0 && !(target_block->flags & ZEND_BB_PROTECTED)) { |
1162 | 845 | do { |
1163 | 845 | b = target_block->successors[0]; |
1164 | 845 | target_block = cfg->blocks + b; |
1165 | 845 | } while (target_block->len == 0 && !(target_block->flags & ZEND_BB_PROTECTED)); |
1166 | 787 | block->successors[n] = b; |
1167 | 787 | ++(*opt_count); |
1168 | 787 | } |
1169 | 45.8k | return target_block; |
1170 | 45.8k | } |
1171 | | |
1172 | | static zend_always_inline zend_basic_block *get_next_block(const zend_cfg *cfg, zend_basic_block *block) |
1173 | 89.7k | { |
1174 | 89.7k | zend_basic_block *next_block = block + 1; |
1175 | 89.7k | const zend_basic_block *end = cfg->blocks + cfg->blocks_count; |
1176 | | |
1177 | 104k | while (1) { |
1178 | 104k | if (next_block == end) { |
1179 | 871 | return NULL; |
1180 | 104k | } else if (next_block->flags & ZEND_BB_REACHABLE) { |
1181 | 88.9k | break; |
1182 | 88.9k | } |
1183 | 15.1k | next_block++; |
1184 | 15.1k | } |
1185 | 88.9k | while (next_block->len == 0 && !(next_block->flags & (ZEND_BB_TARGET|ZEND_BB_PROTECTED))) { |
1186 | 67 | next_block = cfg->blocks + next_block->successors[0]; |
1187 | 67 | } |
1188 | 88.9k | return next_block; |
1189 | 89.7k | } |
1190 | | |
1191 | | |
/* "jmp_hitlist" records the jump targets already followed while a chain of
 * jumps is being shortened; it is used to avoid infinite loops during jmp
 * optimization.
 *
 * Returns true when `target` is among the first `jmp_hitlist_count` entries of
 * `jmp_hitlist`, false otherwise (including when the count is zero). */
static zend_always_inline bool in_hitlist(int target, const int *jmp_hitlist, int jmp_hitlist_count)
{
	int pos = 0;

	while (pos < jmp_hitlist_count) {
		if (jmp_hitlist[pos] == target) {
			return true;
		}
		pos++;
	}
	return false;
}
1204 | | |
/* Record `target` in the enclosing function's jmp_hitlist, or `break` out of
 * the innermost enclosing loop/switch when it was already recorded.
 * Expects `jmp_hitlist` and `jmp_hitlist_count` to be in scope at the use site.
 * `target` is evaluated more than once, so pass a plain variable. */
#define CHECK_LOOP(target) \
	if (EXPECTED(!in_hitlist((target), jmp_hitlist, jmp_hitlist_count))) { \
		jmp_hitlist[jmp_hitlist_count] = (target); \
		jmp_hitlist_count++; \
	} else { \
		break; \
	}
1211 | | |
/*
 * Optimizes the jump that terminates `block`, based on the opcode of the
 * block's last opline:
 *   - follows chains of single-opline target blocks and retargets
 *     block->successors[0] past them,
 *   - removes jumps whose target is the block that follows anyway,
 *   - replaces a JMP to a lone RETURN with the RETURN itself,
 *   - inverts a conditional jump that only skips an unconditional JMP.
 *
 * block       - block to optimize; successors, successors_count and len may change.
 * op_array    - op array owning the oplines; oplines are rewritten in place.
 * cfg         - control flow graph the block belongs to.
 * jmp_hitlist - caller-provided scratch array filled through CHECK_LOOP with
 *               the targets already followed (required capacity is not visible
 *               here - TODO confirm at the caller).
 * opt_count   - incremented for most rewrites applied.
 *
 * Note: CHECK_LOOP expands to code containing `break`, which leaves the
 * enclosing while loop when a target has been seen before.
 */
1212 | | static void zend_jmp_optimization(zend_basic_block *block, zend_op_array *op_array, const zend_cfg *cfg, int *jmp_hitlist, uint32_t *opt_count) |
1213 | 503k | { |
1214 | | /* last_op is the last opcode of the current block */ |
1215 | 503k | zend_basic_block *target_block, *follow_block, *next_block; |
1216 | 503k | zend_op *last_op, *target; |
1217 | 503k | int next, jmp_hitlist_count; |
1218 | | |
1219 | 503k | if (block->len == 0) { |
1220 | 1.36k | return; |
1221 | 1.36k | } |
1222 | | |
1223 | 502k | last_op = op_array->opcodes + block->start + block->len - 1; |
1224 | 502k | switch (last_op->opcode) { |
1225 | 88.8k | case ZEND_JMP: |
1226 | 88.8k | jmp_hitlist_count = 0; |
1227 | | |
/* follow JMP -> JMP chains as long as the target block is a single JMP */
1228 | 88.8k | target_block = get_target_block(cfg, block, 0, opt_count); |
1229 | 88.8k | while (target_block->len == 1) { |
1230 | 44.7k | target = op_array->opcodes + target_block->start; |
1231 | 44.7k | if (target->opcode == ZEND_JMP) { |
1232 | | /* JMP L, L: JMP L1 -> JMP L1 */ |
1233 | 64 | next = target_block->successors[0]; |
1234 | 44.7k | } else { |
1235 | 44.7k | break; |
1236 | 44.7k | } |
1237 | 64 | CHECK_LOOP(next); |
1238 | 37 | block->successors[0] = next; |
1239 | 37 | ++(*opt_count); |
1240 | 37 | target_block = get_target_block(cfg, block, 0, opt_count); |
1241 | 37 | } |
1242 | | |
1243 | 88.8k | next_block = get_next_block(cfg, block); |
1244 | 88.8k | if (target_block == next_block) { |
1245 | | /* JMP(next) -> NOP */ |
1246 | 931 | MAKE_NOP(last_op); |
1247 | 931 | ++(*opt_count); |
1248 | 931 | block->len--; |
1249 | 87.8k | } else if (target_block->len == 1) { |
1250 | 44.5k | target = op_array->opcodes + target_block->start; |
/* not applied when the function has a finally block */
1251 | 44.5k | if ((target->opcode == ZEND_RETURN || |
1252 | 44.3k | target->opcode == ZEND_RETURN_BY_REF || |
1253 | 44.3k | target->opcode == ZEND_GENERATOR_RETURN) && |
1254 | 307 | !(op_array->fn_flags & ZEND_ACC_HAS_FINALLY_BLOCK)) { |
1255 | | /* JMP L, L: RETURN to immediate RETURN */ |
1256 | 32 | *last_op = *target; |
/* the duplicated opline gets its own literal slot holding a copy of the
 * returned constant (presumably so each opline owns its literal - verify) */
1257 | 32 | if (last_op->op1_type == IS_CONST) { |
1258 | 32 | zval zv; |
1259 | 32 | ZVAL_COPY(&zv, &ZEND_OP1_LITERAL(last_op)); |
1260 | 32 | last_op->op1.constant = zend_optimizer_add_literal(op_array, &zv); |
1261 | 32 | } |
/* the block now ends in a return, so it has no successors */
1262 | 32 | block->successors_count = 0; |
1263 | 32 | ++(*opt_count); |
1264 | 32 | } |
1265 | 44.5k | } |
1266 | 88.8k | break; |
1267 | | |
1268 | 2.29k | case ZEND_JMP_SET: |
1269 | 7.77k | case ZEND_COALESCE: |
1270 | 38.1k | case ZEND_JMP_NULL: |
1271 | 38.1k | jmp_hitlist_count = 0; |
1272 | | |
1273 | 38.1k | target_block = get_target_block(cfg, block, 0, opt_count); |
1274 | 38.1k | while (target_block->len == 1) { |
1275 | 4.19k | target = op_array->opcodes + target_block->start; |
1276 | | |
1277 | 4.19k | if (target->opcode == ZEND_JMP) { |
1278 | | /* JMP_SET(X, L), L: JMP(L2) -> JMP_SET(X, L2) */ |
1279 | 38 | next = target_block->successors[0]; |
1280 | 38 | CHECK_LOOP(next); |
1281 | 38 | block->successors[0] = next; |
1282 | 38 | ++(*opt_count); |
1283 | 4.15k | } else { |
1284 | 4.15k | break; |
1285 | 4.15k | } |
1286 | 38 | target_block = get_target_block(cfg, block, 0, opt_count); |
1287 | 38 | } |
1288 | 38.1k | break; |
1289 | | |
1290 | 28.5k | case ZEND_JMPZ: |
1291 | 42.3k | case ZEND_JMPNZ: |
1292 | 42.3k | jmp_hitlist_count = 0; |
1293 | | |
/* successors[0] is the jump target, successors[1] the fall-through block */
1294 | 42.3k | target_block = get_target_block(cfg, block, 0, opt_count); |
1295 | 42.6k | while (target_block->len == 1) { |
1296 | 26.6k | target = op_array->opcodes + target_block->start; |
1297 | | |
1298 | 26.6k | if (target->opcode == ZEND_JMP) { |
1299 | | /* JMPZ(X, L), L: JMP(L2) -> JMPZ(X, L2) */ |
1300 | 102 | next = target_block->successors[0]; |
1301 | 26.5k | } else if (target->opcode == last_op->opcode && |
1302 | 840 | SAME_VAR(target->op1, last_op->op1)) { |
1303 | | /* JMPZ(X, L), L: JMPZ(X, L2) -> JMPZ(X, L2) */ |
1304 | 394 | next = target_block->successors[0]; |
1305 | 26.1k | } else if (target->opcode == INV_COND(last_op->opcode) && |
1306 | 182 | SAME_VAR(target->op1, last_op->op1)) { |
1307 | | /* JMPZ(X, L), L: JMPNZ(X, L2) -> JMPZ(X, L+1) */ |
1308 | 20 | next = target_block->successors[1]; |
1309 | 26.0k | } else { |
1310 | 26.0k | break; |
1311 | 26.0k | } |
1312 | 516 | CHECK_LOOP(next); |
1313 | 321 | block->successors[0] = next; |
1314 | 321 | ++(*opt_count); |
1315 | 321 | target_block = get_target_block(cfg, block, 0, opt_count); |
1316 | 321 | } |
1317 | | |
1318 | 42.3k | follow_block = get_follow_block(cfg, block, 1, opt_count); |
1319 | 42.3k | if (target_block == follow_block) { |
1320 | | /* L: JMP[N]Z(X, L+1) -> NOP or FREE(X) */ |
1321 | 555 | zend_optimizer_convert_to_free_op1(op_array, last_op); |
1322 | 555 | if (last_op->opcode == ZEND_NOP) { |
1323 | 0 | block->len--; |
1324 | 0 | } |
1325 | 555 | block->successors_count = 1; |
1326 | 555 | ++(*opt_count); |
1327 | 41.7k | } else if (follow_block->len == 1) { |
1328 | 9.17k | target = op_array->opcodes + follow_block->start; |
1329 | 9.17k | if (target->opcode == ZEND_JMP) { |
1330 | 1.13k | if (block->successors[0] == follow_block->successors[0]) { |
1331 | | /* JMPZ(X,L1), JMP(L1) -> NOP, JMP(L1) */ |
1332 | 191 | zend_optimizer_convert_to_free_op1(op_array, last_op); |
1333 | 191 | if (last_op->opcode == ZEND_NOP) { |
1334 | 0 | block->len--; |
1335 | 0 | } |
1336 | 191 | block->successors[0] = follow_block - cfg->blocks; |
1337 | 191 | block->successors_count = 1; |
1338 | 191 | ++(*opt_count); |
1339 | 191 | break; |
1340 | 948 | } else if (!(follow_block->flags & (ZEND_BB_TARGET | ZEND_BB_PROTECTED))) { |
1341 | 948 | next_block = get_next_block(cfg, follow_block); |
1342 | | |
1343 | 948 | if (target_block == next_block) { |
1344 | | /* JMPZ(X,L1) JMP(L2) L1: -> JMPNZ(X,L2) NOP*/ |
1345 | | |
/* NOTE(review): unlike the other rewrites in this function, this branch does
 * not increment *opt_count - confirm whether that is intentional. */
1346 | 353 | last_op->opcode = INV_COND(last_op->opcode); |
1347 | | |
1348 | 353 | block->successors[0] = follow_block->successors[0]; |
1349 | 353 | block->successors[1] = next_block - cfg->blocks; |
1350 | | |
/* the block holding the skipped JMP is emptied and marked unreachable */
1351 | 353 | follow_block->flags &= ~ZEND_BB_REACHABLE; |
1352 | 353 | MAKE_NOP(target); |
1353 | 353 | follow_block->len = 0; |
1354 | | |
1355 | 353 | next_block->flags |= ZEND_BB_FOLLOW; |
1356 | | |
1357 | 353 | break; |
1358 | 353 | } |
1359 | 948 | } |
1360 | 1.13k | } |
1361 | 9.17k | } |
1362 | 41.7k | break; |
1363 | | |
1364 | 41.7k | case ZEND_JMPNZ_EX: |
1365 | 3.54k | case ZEND_JMPZ_EX: |
1366 | 3.54k | jmp_hitlist_count = 0; |
1367 | | |
1368 | 3.54k | target_block = get_target_block(cfg, block, 0, opt_count); |
1369 | 3.55k | while (target_block->len == 1) { |
1370 | 1.45k | target = op_array->opcodes + target_block->start; |
1371 | | |
1372 | 1.45k | if (target->opcode == ZEND_JMP) { |
1373 | | /* T = JMPZ_EX(X, L), L: JMP(L2) -> T = JMPZ(X, L2) */ |
1374 | 0 | next = target_block->successors[0]; |
/* "opcode-3" presumably maps JMPZ_EX/JMPNZ_EX to JMPZ/JMPNZ and so depends on
 * the numeric opcode values - verify against the opcode definitions */
1375 | 1.45k | } else if (target->opcode == last_op->opcode-3 && |
1376 | 2 | (SAME_VAR(target->op1, last_op->result) || |
1377 | 2 | SAME_VAR(target->op1, last_op->op1))) { |
1378 | | /* T = JMPZ_EX(X, L1), L1: JMPZ({X|T}, L2) -> T = JMPZ_EX(X, L2) */ |
1379 | 2 | next = target_block->successors[0]; |
1380 | 1.45k | } else if (target->opcode == last_op->opcode && |
1381 | 0 | target->result.var == last_op->result.var && |
1382 | 0 | (SAME_VAR(target->op1, last_op->result) || |
1383 | 0 | SAME_VAR(target->op1, last_op->op1))) { |
1384 | | /* T = JMPZ_EX(X, L1), L1: T = JMPZ_EX({X|T}, L2) -> T = JMPZ_EX(X, L2) */ |
1385 | 0 | next = target_block->successors[0]; |
1386 | 1.45k | } else if (target->opcode == INV_EX_COND(last_op->opcode) && |
1387 | 2 | (SAME_VAR(target->op1, last_op->result) || |
1388 | 2 | SAME_VAR(target->op1, last_op->op1))) { |
1389 | | /* T = JMPZ_EX(X, L1), L1: JMPNZ({X|T1}, L2) -> T = JMPZ_EX(X, L1+1) */ |
1390 | 2 | next = target_block->successors[1]; |
1391 | 1.45k | } else if (target->opcode == INV_EX_COND_EX(last_op->opcode) && |
1392 | 32 | target->result.var == last_op->result.var && |
1393 | 24 | (SAME_VAR(target->op1, last_op->result) || |
1394 | 24 | SAME_VAR(target->op1, last_op->op1))) { |
1395 | | /* T = JMPZ_EX(X, L1), L1: T = JMPNZ_EX({X|T}, L2) -> T = JMPZ_EX(X, L1+1) */ |
1396 | 0 | next = target_block->successors[1]; |
1397 | 1.45k | } else if (target->opcode == ZEND_BOOL && |
1398 | 0 | (SAME_VAR(target->op1, last_op->result) || |
1399 | 0 | SAME_VAR(target->op1, last_op->op1))) { |
1400 | | /* convert Y = JMPZ_EX(X,L1), L1: Z = BOOL(Y) to |
1401 | | Z = JMPZ_EX(X,L1+1) */ |
1402 | | |
1403 | | /* NOTE: This optimization pattern is not safe, but works, */ |
1404 | | /* because result of JMPZ_EX instruction */ |
1405 | | /* is not used on the following path and */ |
1406 | | /* should be used once on the branch path. */ |
1407 | | /* */ |
1408 | | /* The pattern works well only if jumps processed in */ |
1409 | | /* direct order, otherwise it breaks JMPZ_EX */ |
1410 | | /* sequences too early. */ |
/* the result variable is rewritten before CHECK_LOOP runs, so it stays changed
 * even if CHECK_LOOP then breaks out of the loop */
1411 | 0 | last_op->result.var = target->result.var; |
1412 | 0 | next = target_block->successors[0]; |
1413 | 1.45k | } else { |
1414 | 1.45k | break; |
1415 | 1.45k | } |
1416 | 4 | CHECK_LOOP(next); |
1417 | 4 | block->successors[0] = next; |
1418 | 4 | ++(*opt_count); |
1419 | 4 | target_block = get_target_block(cfg, block, 0, opt_count); |
1420 | 4 | } |
1421 | | |
1422 | 3.54k | follow_block = get_follow_block(cfg, block, 1, opt_count); |
1423 | 3.54k | if (target_block == follow_block) { |
1424 | | /* L: T = JMP[N]Z_EX(X, L+1) -> T = BOOL(X) */ |
1425 | 0 | last_op->opcode = ZEND_BOOL; |
1426 | 0 | last_op->op2.num = 0; |
1427 | 0 | block->successors_count = 1; |
1428 | 0 | ++(*opt_count); |
/* this break is redundant with the one that follows the if */
1429 | 0 | break; |
1430 | 0 | } |
1431 | 3.54k | break; |
1432 | 502k | } |
1433 | 502k | } |
1434 | | |
1435 | | /* Global data dependencies */ |
1436 | | |
1437 | | /* Find a set of variables which are used outside of the block where they are |
1438 | | * defined. We won't apply some optimization patterns for such variables. */ |
1439 | | static void zend_t_usage(const zend_cfg *cfg, const zend_op_array *op_array, zend_bitset used_ext, zend_optimizer_ctx *ctx) |
1440 | 113k | { |
1441 | 113k | uint32_t n; |
1442 | 113k | zend_basic_block *block, *next_block; |
1443 | 113k | uint32_t var_num; |
1444 | 113k | uint32_t bitset_len; |
1445 | 113k | zend_bitset usage; |
1446 | 113k | zend_bitset defined_here; |
1447 | 113k | void *checkpoint; |
1448 | 113k | zend_op *opline, *end; |
1449 | | |
1450 | | |
1451 | 113k | if (op_array->T == 0) { |
1452 | | /* shortcut - if no Ts, nothing to do */ |
1453 | 14.0k | return; |
1454 | 14.0k | } |
1455 | | |
1456 | 99.8k | checkpoint = zend_arena_checkpoint(ctx->arena); |
1457 | 99.8k | bitset_len = zend_bitset_len(op_array->last_var + op_array->T); |
1458 | 99.8k | defined_here = zend_arena_alloc(&ctx->arena, bitset_len * ZEND_BITSET_ELM_SIZE); |
1459 | | |
1460 | 99.8k | zend_bitset_clear(defined_here, bitset_len); |
1461 | 537k | for (n = 1; n < cfg->blocks_count; n++) { |
1462 | 437k | block = cfg->blocks + n; |
1463 | | |
1464 | 437k | if (!(block->flags & ZEND_BB_REACHABLE)) { |
1465 | 47.1k | continue; |
1466 | 47.1k | } |
1467 | | |
1468 | 390k | opline = op_array->opcodes + block->start; |
1469 | 390k | end = opline + block->len; |
1470 | 390k | if (!(block->flags & ZEND_BB_FOLLOW) || |
1471 | 288k | (block->flags & ZEND_BB_TARGET)) { |
1472 | | /* Skip continuation of "extended" BB */ |
1473 | 208k | zend_bitset_clear(defined_here, bitset_len); |
1474 | 208k | } |
1475 | | |
1476 | 2.16M | while (opline<end) { |
1477 | 1.77M | if (opline->op1_type & (IS_VAR|IS_TMP_VAR)) { |
1478 | 523k | var_num = VAR_NUM(opline->op1.var); |
1479 | 523k | if (!zend_bitset_in(defined_here, var_num)) { |
1480 | 234k | zend_bitset_incl(used_ext, var_num); |
1481 | 234k | } |
1482 | 523k | } |
1483 | 1.77M | if (opline->op2_type == IS_VAR) { |
1484 | 895 | var_num = VAR_NUM(opline->op2.var); |
1485 | 895 | if (opline->opcode == ZEND_FE_FETCH_R || |
1486 | 895 | opline->opcode == ZEND_FE_FETCH_RW) { |
1487 | | /* these opcode use the op2 as result */ |
1488 | 22 | zend_bitset_incl(defined_here, var_num); |
1489 | 873 | } else if (!zend_bitset_in(defined_here, var_num)) { |
1490 | 2 | zend_bitset_incl(used_ext, var_num); |
1491 | 2 | } |
1492 | 1.77M | } else if (opline->op2_type == IS_TMP_VAR) { |
1493 | 326k | var_num = VAR_NUM(opline->op2.var); |
1494 | 326k | if (!zend_bitset_in(defined_here, var_num)) { |
1495 | 32.6k | zend_bitset_incl(used_ext, var_num); |
1496 | 32.6k | } |
1497 | 326k | } |
1498 | | |
1499 | 1.77M | if (opline->result_type == IS_VAR) { |
1500 | 11.4k | var_num = VAR_NUM(opline->result.var); |
1501 | 11.4k | zend_bitset_incl(defined_here, var_num); |
1502 | 1.76M | } else if (opline->result_type == IS_TMP_VAR) { |
1503 | 839k | var_num = VAR_NUM(opline->result.var); |
1504 | 839k | switch (opline->opcode) { |
1505 | 4.89k | case ZEND_ADD_ARRAY_ELEMENT: |
1506 | 4.94k | case ZEND_ADD_ARRAY_UNPACK: |
1507 | 217k | case ZEND_ROPE_ADD: |
1508 | | /* these opcodes use the result as argument */ |
1509 | 217k | if (!zend_bitset_in(defined_here, var_num)) { |
1510 | 168k | zend_bitset_incl(used_ext, var_num); |
1511 | 168k | } |
1512 | 217k | break; |
1513 | 622k | default : |
1514 | 622k | zend_bitset_incl(defined_here, var_num); |
1515 | 839k | } |
1516 | 839k | } |
1517 | 1.77M | opline++; |
1518 | 1.77M | } |
1519 | 390k | } |
1520 | | |
1521 | 99.8k | if (ctx->debug_level & ZEND_DUMP_BLOCK_PASS_VARS) { |
1522 | 0 | bool printed = false; |
1523 | 0 | uint32_t i; |
1524 | |
|
1525 | 0 | for (i = op_array->last_var; i< op_array->T; i++) { |
1526 | 0 | if (zend_bitset_in(used_ext, i)) { |
1527 | 0 | if (!printed) { |
1528 | 0 | fprintf(stderr, "NON-LOCAL-VARS: %d", i); |
1529 | 0 | printed = true; |
1530 | 0 | } else { |
1531 | 0 | fprintf(stderr, ", %d", i); |
1532 | 0 | } |
1533 | 0 | } |
1534 | 0 | } |
1535 | 0 | if (printed) { |
1536 | 0 | fprintf(stderr, "\n"); |
1537 | 0 | } |
1538 | 0 | } |
1539 | | |
1540 | 99.8k | usage = defined_here; |
1541 | 99.8k | next_block = NULL; |
1542 | 636k | for (n = cfg->blocks_count; n > 0;) { |
1543 | 537k | block = cfg->blocks + (--n); |
1544 | | |
1545 | 537k | if (!(block->flags & ZEND_BB_REACHABLE) || block->len == 0) { |
1546 | 47.3k | continue; |
1547 | 47.3k | } |
1548 | | |
1549 | 489k | end = op_array->opcodes + block->start; |
1550 | 489k | opline = end + block->len - 1; |
1551 | 489k | if (!next_block || |
1552 | 389k | !(next_block->flags & ZEND_BB_FOLLOW) || |
1553 | 308k | (next_block->flags & ZEND_BB_TARGET)) { |
1554 | | /* Skip continuation of "extended" BB */ |
1555 | 308k | zend_bitset_copy(usage, used_ext, bitset_len); |
1556 | 308k | } else if (block->successors_count > 1) { |
1557 | 119k | zend_bitset_union(usage, used_ext, bitset_len); |
1558 | 119k | } |
1559 | 489k | next_block = block; |
1560 | | |
1561 | 3.57M | while (opline >= end) { |
1562 | | /* usage checks */ |
1563 | 3.08M | if (opline->result_type & (IS_VAR|IS_TMP_VAR)) { |
1564 | 1.43M | if (!zend_bitset_in(usage, VAR_NUM(opline->result.var))) { |
1565 | 8.56k | switch (opline->opcode) { |
1566 | 0 | case ZEND_ASSIGN_OP: |
1567 | 0 | case ZEND_ASSIGN_DIM_OP: |
1568 | 0 | case ZEND_ASSIGN_OBJ_OP: |
1569 | 0 | case ZEND_ASSIGN_STATIC_PROP_OP: |
1570 | 0 | case ZEND_PRE_INC: |
1571 | 0 | case ZEND_PRE_DEC: |
1572 | 0 | case ZEND_ASSIGN: |
1573 | 0 | case ZEND_ASSIGN_REF: |
1574 | 0 | case ZEND_DO_FCALL: |
1575 | 0 | case ZEND_DO_ICALL: |
1576 | 0 | case ZEND_DO_UCALL: |
1577 | 0 | case ZEND_DO_FCALL_BY_NAME: |
1578 | 0 | opline->result_type = IS_UNUSED; |
1579 | 0 | break; |
1580 | 0 | case ZEND_POST_INC: |
1581 | 0 | case ZEND_POST_DEC: |
1582 | 0 | case ZEND_POST_INC_OBJ: |
1583 | 0 | case ZEND_POST_DEC_OBJ: |
1584 | 0 | case ZEND_POST_INC_STATIC_PROP: |
1585 | 0 | case ZEND_POST_DEC_STATIC_PROP: |
1586 | 0 | opline->opcode -= 2; |
1587 | 0 | opline->result_type = IS_UNUSED; |
1588 | 0 | break; |
1589 | 499 | case ZEND_QM_ASSIGN: |
1590 | 1.45k | case ZEND_BOOL: |
1591 | 4.51k | case ZEND_BOOL_NOT: |
1592 | 4.51k | zend_optimizer_convert_to_free_op1(op_array, opline); |
1593 | 4.51k | break; |
1594 | 1.87k | case ZEND_JMPZ_EX: |
1595 | 3.91k | case ZEND_JMPNZ_EX: |
1596 | 3.91k | opline->opcode -= 3; |
1597 | 3.91k | SET_UNUSED(opline->result); |
1598 | 3.91k | break; |
1599 | 0 | case ZEND_ADD_ARRAY_ELEMENT: |
1600 | 0 | case ZEND_ADD_ARRAY_UNPACK: |
1601 | 0 | case ZEND_ROPE_ADD: |
1602 | 0 | zend_bitset_incl(usage, VAR_NUM(opline->result.var)); |
1603 | 0 | break; |
1604 | 8.56k | } |
1605 | 1.42M | } else { |
1606 | 1.42M | switch (opline->opcode) { |
1607 | 42.5k | case ZEND_ADD_ARRAY_ELEMENT: |
1608 | 42.7k | case ZEND_ADD_ARRAY_UNPACK: |
1609 | 334k | case ZEND_ROPE_ADD: |
1610 | 334k | break; |
1611 | 1.08M | default: |
1612 | 1.08M | zend_bitset_excl(usage, VAR_NUM(opline->result.var)); |
1613 | 1.08M | break; |
1614 | 1.42M | } |
1615 | 1.42M | } |
1616 | 1.43M | } |
1617 | | |
1618 | 3.08M | if (opline->op2_type == IS_VAR) { |
1619 | 2.50k | switch (opline->opcode) { |
1620 | 0 | case ZEND_FE_FETCH_R: |
1621 | 22 | case ZEND_FE_FETCH_RW: |
1622 | 22 | zend_bitset_excl(usage, VAR_NUM(opline->op2.var)); |
1623 | 22 | break; |
1624 | 2.48k | default: |
1625 | 2.48k | zend_bitset_incl(usage, VAR_NUM(opline->op2.var)); |
1626 | 2.48k | break; |
1627 | 2.50k | } |
1628 | 3.08M | } else if (opline->op2_type == IS_TMP_VAR) { |
1629 | 480k | zend_bitset_incl(usage, VAR_NUM(opline->op2.var)); |
1630 | 480k | } |
1631 | | |
1632 | 3.08M | if (opline->op1_type & (IS_VAR|IS_TMP_VAR)) { |
1633 | 894k | zend_bitset_incl(usage, VAR_NUM(opline->op1.var)); |
1634 | 894k | } |
1635 | | |
1636 | 3.08M | opline--; |
1637 | 3.08M | } |
1638 | 489k | } |
1639 | | |
1640 | 99.8k | zend_arena_release(&ctx->arena, checkpoint); |
1641 | 99.8k | } |
1642 | | |
1643 | | static void zend_merge_blocks(const zend_op_array *op_array, const zend_cfg *cfg, uint32_t *opt_count) |
1644 | 113k | { |
1645 | 113k | zend_basic_block *b, *bb; |
1646 | 113k | zend_basic_block *prev = NULL; |
1647 | | |
1648 | 668k | for (uint32_t i = 0; i < cfg->blocks_count; i++) { |
1649 | 554k | b = cfg->blocks + i; |
1650 | 554k | if (b->flags & ZEND_BB_REACHABLE) { |
1651 | 501k | if ((b->flags & ZEND_BB_FOLLOW) && |
1652 | 287k | !(b->flags & (ZEND_BB_TARGET | ZEND_BB_PROTECTED)) && |
1653 | 141k | prev && prev->successors_count == 1 && prev->successors[0] == i) |
1654 | 24.7k | { |
1655 | 24.7k | zend_op *last_op = op_array->opcodes + prev->start + prev->len - 1; |
1656 | 24.7k | if (prev->len != 0 && last_op->opcode == ZEND_JMP) { |
1657 | 0 | MAKE_NOP(last_op); |
1658 | 0 | } |
1659 | | |
1660 | 27.6k | for (bb = prev + 1; bb != b; bb++) { |
1661 | 2.89k | zend_op *op = op_array->opcodes + bb->start; |
1662 | 2.89k | const zend_op *end = op + bb->len; |
1663 | 5.55k | while (op < end) { |
1664 | 2.65k | if (op->op1_type == IS_CONST) { |
1665 | 942 | literal_dtor(&ZEND_OP1_LITERAL(op)); |
1666 | 942 | } |
1667 | 2.65k | if (op->op2_type == IS_CONST) { |
1668 | 598 | literal_dtor(&ZEND_OP2_LITERAL(op)); |
1669 | 598 | } |
1670 | 2.65k | MAKE_NOP(op); |
1671 | 2.65k | op++; |
1672 | 2.65k | } |
1673 | | /* make block empty */ |
1674 | 2.89k | bb->len = 0; |
1675 | 2.89k | } |
1676 | | |
1677 | | /* re-link */ |
1678 | 24.7k | prev->flags |= (b->flags & ZEND_BB_EXIT); |
1679 | 24.7k | prev->len = b->start + b->len - prev->start; |
1680 | 24.7k | prev->successors_count = b->successors_count; |
1681 | 24.7k | if (b->successors != b->successors_storage) { |
1682 | 66 | prev->successors = b->successors; |
1683 | 66 | b->successors = b->successors_storage; |
1684 | 24.6k | } else { |
1685 | 24.6k | memcpy(prev->successors, b->successors, b->successors_count * sizeof(int)); |
1686 | 24.6k | } |
1687 | | |
1688 | | /* unlink & make block empty and unreachable */ |
1689 | 24.7k | b->flags = 0; |
1690 | 24.7k | b->len = 0; |
1691 | 24.7k | b->successors_count = 0; |
1692 | 24.7k | ++(*opt_count); |
1693 | 476k | } else { |
1694 | 476k | prev = b; |
1695 | 476k | } |
1696 | 501k | } |
1697 | 554k | } |
1698 | 113k | } |
1699 | | |
1700 | 114k | #define PASSES 3 |
1701 | | |
1702 | | void zend_optimize_cfg(zend_op_array *op_array, zend_optimizer_ctx *ctx) |
1703 | 94.6k | { |
1704 | 94.6k | zend_cfg cfg; |
1705 | 94.6k | zend_basic_block *blocks, *end, *b; |
1706 | 94.6k | int pass; |
1707 | 94.6k | uint32_t bitset_len; |
1708 | 94.6k | zend_bitset usage; |
1709 | 94.6k | void *checkpoint; |
1710 | 94.6k | zend_op **Tsource; |
1711 | 94.6k | uint32_t opt_count; |
1712 | 94.6k | int *jmp_hitlist; |
1713 | | |
1714 | | /* Build CFG */ |
1715 | 94.6k | checkpoint = zend_arena_checkpoint(ctx->arena); |
1716 | 94.6k | zend_build_cfg(&ctx->arena, op_array, 0, &cfg); |
1717 | | |
1718 | 94.6k | if (cfg.blocks_count * (op_array->last_var + op_array->T) > 64 * 1024 * 1024) { |
1719 | 0 | zend_arena_release(&ctx->arena, checkpoint); |
1720 | 0 | return; |
1721 | 0 | } |
1722 | | |
1723 | 94.6k | if (ctx->debug_level & ZEND_DUMP_BEFORE_BLOCK_PASS) { |
1724 | 0 | zend_dump_op_array(op_array, ZEND_DUMP_CFG, "before block pass", &cfg); |
1725 | 0 | } |
1726 | | |
1727 | 94.6k | bitset_len = zend_bitset_len(op_array->last_var + op_array->T); |
1728 | 94.6k | Tsource = zend_arena_calloc(&ctx->arena, op_array->last_var + op_array->T, sizeof(zend_op *)); |
1729 | 94.6k | usage = zend_arena_alloc(&ctx->arena, bitset_len * ZEND_BITSET_ELM_SIZE); |
1730 | 94.6k | jmp_hitlist = zend_arena_alloc(&ctx->arena, cfg.blocks_count * sizeof(int)); |
1731 | | |
1732 | 94.6k | blocks = cfg.blocks; |
1733 | 94.6k | end = blocks + cfg.blocks_count; |
1734 | 114k | for (pass = 0; pass < PASSES; pass++) { |
1735 | 113k | opt_count = 0; |
1736 | | |
1737 | | /* Compute data dependencies */ |
1738 | 113k | zend_bitset_clear(usage, bitset_len); |
1739 | 113k | zend_t_usage(&cfg, op_array, usage, ctx); |
1740 | | |
1741 | | /* optimize each basic block separately */ |
1742 | 668k | for (b = blocks; b < end; b++) { |
1743 | 554k | if (!(b->flags & ZEND_BB_REACHABLE)) { |
1744 | 50.6k | continue; |
1745 | 50.6k | } |
1746 | | /* we track data dependencies only inside a single basic block */ |
1747 | 503k | if (!(b->flags & ZEND_BB_FOLLOW) || |
1748 | 322k | (b->flags & ZEND_BB_TARGET)) { |
1749 | | /* Skip continuation of "extended" BB */ |
1750 | 322k | memset(Tsource, 0, (op_array->last_var + op_array->T) * sizeof(zend_op *)); |
1751 | 322k | } |
1752 | 503k | zend_optimize_block(b, op_array, usage, &cfg, Tsource, &opt_count); |
1753 | 503k | } |
1754 | | |
1755 | | /* Eliminate NOPs */ |
1756 | 668k | for (b = blocks; b < end; b++) { |
1757 | 554k | if (b->flags & ZEND_BB_UNREACHABLE_FREE) { |
1758 | | /* In unreachable_free blocks only preserve loop var frees. */ |
1759 | 96 | for (uint32_t i = b->start; i < b->start + b->len; i++) { |
1760 | 62 | zend_op *opline = &op_array->opcodes[i]; |
1761 | 62 | if (!zend_optimizer_is_loop_var_free(opline)) { |
1762 | 28 | MAKE_NOP(opline); |
1763 | 28 | } |
1764 | 62 | } |
1765 | 34 | } |
1766 | 554k | if (b->flags & (ZEND_BB_REACHABLE|ZEND_BB_UNREACHABLE_FREE)) { |
1767 | 503k | strip_nops(op_array, b); |
1768 | 503k | } |
1769 | 554k | } |
1770 | | |
1771 | 113k | opt_count = 0; |
1772 | | |
1773 | | /* Jump optimization for each block */ |
1774 | 668k | for (b = blocks; b < end; b++) { |
1775 | 554k | if (b->flags & ZEND_BB_REACHABLE) { |
1776 | 503k | zend_jmp_optimization(b, op_array, &cfg, jmp_hitlist, &opt_count); |
1777 | 503k | } |
1778 | 554k | } |
1779 | | |
1780 | | /* Eliminate unreachable basic blocks */ |
1781 | 113k | zend_cfg_remark_reachable_blocks(op_array, &cfg); |
1782 | | |
1783 | | /* Merge Blocks */ |
1784 | 113k | zend_merge_blocks(op_array, &cfg, &opt_count); |
1785 | | |
1786 | 113k | if (opt_count == 0) { |
1787 | 94.5k | break; |
1788 | 94.5k | } |
1789 | 113k | } |
1790 | | |
1791 | 94.6k | assemble_code_blocks(&cfg, op_array, ctx); |
1792 | | |
1793 | 94.6k | if (ctx->debug_level & ZEND_DUMP_AFTER_BLOCK_PASS) { |
1794 | 0 | zend_dump_op_array(op_array, ZEND_DUMP_CFG | ZEND_DUMP_HIDE_UNREACHABLE, "after block pass", &cfg); |
1795 | 0 | } |
1796 | | |
1797 | | /* Destroy CFG */ |
1798 | 94.6k | zend_arena_release(&ctx->arena, checkpoint); |
1799 | 94.6k | } |