/src/php-src/Zend/Optimizer/block_pass.c
Line | Count | Source |
1 | | /* |
2 | | +----------------------------------------------------------------------+ |
3 | | | Zend OPcache | |
4 | | +----------------------------------------------------------------------+ |
5 | | | Copyright (c) The PHP Group | |
6 | | +----------------------------------------------------------------------+ |
7 | | | This source file is subject to version 3.01 of the PHP license, | |
8 | | | that is bundled with this package in the file LICENSE, and is | |
9 | | | available through the world-wide-web at the following url: | |
10 | | | https://www.php.net/license/3_01.txt | |
11 | | | If you did not receive a copy of the PHP license and are unable to | |
12 | | | obtain it through the world-wide-web, please send a note to | |
13 | | | license@php.net so we can mail you a copy immediately. | |
14 | | +----------------------------------------------------------------------+ |
15 | | | Authors: Andi Gutmans <andi@php.net> | |
16 | | | Zeev Suraski <zeev@php.net> | |
17 | | | Stanislav Malyshev <stas@zend.com> | |
18 | | | Dmitry Stogov <dmitry@php.net> | |
19 | | +----------------------------------------------------------------------+ |
20 | | */ |
21 | | |
22 | | #include "Optimizer/zend_optimizer.h" |
23 | | #include "Optimizer/zend_optimizer_internal.h" |
24 | | #include "zend_API.h" |
25 | | #include "zend_constants.h" |
26 | | #include "zend_execute.h" |
27 | | #include "zend_vm.h" |
28 | | #include "zend_bitset.h" |
29 | | #include "zend_cfg.h" |
30 | | #include "zend_dump.h" |
31 | | |
32 | | /* Checks if a constant (like "true") may be replaced by its value */ |
33 | | bool zend_optimizer_get_persistent_constant(zend_string *name, zval *result, int copy) |
34 | 55.6k | { |
35 | 55.6k | zend_constant *c = zend_hash_find_ptr(EG(zend_constants), name); |
36 | 55.6k | if (c) { |
37 | 62 | if ((ZEND_CONSTANT_FLAGS(c) & CONST_PERSISTENT) |
38 | 62 | && !(ZEND_CONSTANT_FLAGS(c) & CONST_DEPRECATED) |
39 | 0 | && (!(ZEND_CONSTANT_FLAGS(c) & CONST_NO_FILE_CACHE) |
40 | 0 | || !(CG(compiler_options) & ZEND_COMPILE_WITH_FILE_CACHE))) { |
41 | 0 | ZVAL_COPY_VALUE(result, &c->value); |
42 | 0 | if (copy) { |
43 | 0 | Z_TRY_ADDREF_P(result); |
44 | 0 | } |
45 | 0 | return true; |
46 | 62 | } else { |
47 | 62 | return false; |
48 | 62 | } |
49 | 62 | } |
50 | | |
51 | | /* Special constants null/true/false can always be substituted. */ |
52 | 55.5k | c = zend_get_special_const(ZSTR_VAL(name), ZSTR_LEN(name)); |
53 | 55.5k | if (c) { |
54 | 0 | ZVAL_COPY_VALUE(result, &c->value); |
55 | 0 | return true; |
56 | 0 | } |
57 | 55.5k | return false; |
58 | 55.5k | } |
59 | | |
60 | | /* Data dependencies macros */ |
61 | | |
62 | 1.82M | #define VAR_SOURCE(op) Tsource[VAR_NUM(op.var)] |
63 | 1.65M | #define SET_VAR_SOURCE(opline) Tsource[VAR_NUM(opline->result.var)] = opline |
64 | | |
65 | | static void strip_leading_nops(zend_op_array *op_array, zend_basic_block *b) |
66 | 9.89k | { |
67 | 9.89k | zend_op *opcodes = op_array->opcodes; |
68 | | |
69 | 11.9k | do { |
70 | 11.9k | b->start++; |
71 | 11.9k | b->len--; |
72 | 11.9k | } while (b->len > 0 && opcodes[b->start].opcode == ZEND_NOP); |
73 | 9.89k | } |
74 | | |
75 | | static void strip_nops(zend_op_array *op_array, zend_basic_block *b) |
76 | 560k | { |
77 | 560k | uint32_t i, j; |
78 | | |
79 | 560k | if (b->len == 0) { |
80 | 1.11k | return; |
81 | 1.11k | } |
82 | | |
83 | 559k | if (op_array->opcodes[b->start].opcode == ZEND_NOP) { |
84 | 4.08k | strip_leading_nops(op_array, b); |
85 | 4.08k | } |
86 | | |
87 | 559k | if (b->len == 0) { |
88 | 360 | return; |
89 | 360 | } |
90 | | |
91 | | /* strip the inside NOPs */ |
92 | 559k | i = j = b->start + 1; |
93 | 3.52M | while (i < b->start + b->len) { |
94 | 2.96M | if (op_array->opcodes[i].opcode != ZEND_NOP) { |
95 | 2.93M | if (i != j) { |
96 | 59.6k | op_array->opcodes[j] = op_array->opcodes[i]; |
97 | 59.6k | } |
98 | 2.93M | j++; |
99 | 2.93M | } |
100 | 2.96M | i++; |
101 | 2.96M | } |
102 | 559k | b->len = j - b->start; |
103 | 591k | while (j < i) { |
104 | 32.2k | MAKE_NOP(op_array->opcodes + j); |
105 | 32.2k | j++; |
106 | 32.2k | } |
107 | 559k | } |
108 | | |
109 | 62 | static int get_const_switch_target(zend_cfg *cfg, zend_op_array *op_array, zend_basic_block *block, zend_op *opline, zval *val) { |
110 | 62 | HashTable *jumptable = Z_ARRVAL(ZEND_OP2_LITERAL(opline)); |
111 | 62 | zval *zv; |
112 | 62 | if ((opline->opcode == ZEND_SWITCH_LONG && Z_TYPE_P(val) != IS_LONG) |
113 | 62 | || (opline->opcode == ZEND_SWITCH_STRING && Z_TYPE_P(val) != IS_STRING)) { |
114 | | /* fallback to next block */ |
115 | 0 | return block->successors[block->successors_count - 1]; |
116 | 0 | } |
117 | 62 | if (opline->opcode == ZEND_MATCH && Z_TYPE_P(val) != IS_LONG && Z_TYPE_P(val) != IS_STRING) { |
118 | | /* always jump to the default arm */ |
119 | 12 | return block->successors[block->successors_count - 1]; |
120 | 12 | } |
121 | 50 | if (Z_TYPE_P(val) == IS_LONG) { |
122 | 26 | zv = zend_hash_index_find(jumptable, Z_LVAL_P(val)); |
123 | 26 | } else { |
124 | 24 | ZEND_ASSERT(Z_TYPE_P(val) == IS_STRING); |
125 | 24 | zv = zend_hash_find(jumptable, Z_STR_P(val)); |
126 | 24 | } |
127 | 50 | if (!zv) { |
128 | | /* default */ |
129 | 32 | return block->successors[block->successors_count - (opline->opcode == ZEND_MATCH ? 1 : 2)]; |
130 | 32 | } |
131 | 18 | return cfg->map[ZEND_OFFSET_TO_OPLINE_NUM(op_array, opline, Z_LVAL_P(zv))]; |
132 | 50 | } |
133 | | |
134 | | static void zend_optimize_block(zend_basic_block *block, zend_op_array *op_array, zend_bitset used_ext, zend_cfg *cfg, zend_op **Tsource, uint32_t *opt_count) |
135 | 560k | { |
136 | 560k | zend_op *opline, *src; |
137 | 560k | zend_op *end, *last_op = NULL; |
138 | | |
139 | 560k | if (block->len == 0) { |
140 | 236 | return; |
141 | 236 | } |
142 | | |
143 | 560k | if (op_array->opcodes[block->start].opcode == ZEND_NOP) { |
144 | | /* remove leading NOPs */ |
145 | 5.80k | strip_leading_nops(op_array, block); |
146 | 5.80k | } |
147 | | |
148 | 560k | opline = op_array->opcodes + block->start; |
149 | 560k | end = opline + block->len; |
150 | 4.09M | while (opline < end) { |
151 | | /* Constant Propagation: strip X = QM_ASSIGN(const) */ |
152 | 3.52M | if (opline->op1_type == IS_TMP_VAR && |
153 | 782k | opline->opcode != ZEND_FREE) { |
154 | 748k | src = VAR_SOURCE(opline->op1); |
155 | 748k | if (src && |
156 | 704k | src->opcode == ZEND_QM_ASSIGN && |
157 | 4.34k | src->op1_type == IS_CONST |
158 | 748k | ) { |
159 | 2.03k | znode_op op1 = opline->op1; |
160 | 2.03k | if (opline->opcode == ZEND_VERIFY_RETURN_TYPE) { |
161 | 2 | COPY_NODE(opline->result, opline->op1); |
162 | 2 | COPY_NODE(opline->op1, src->op1); |
163 | 2 | VAR_SOURCE(op1) = NULL; |
164 | 2 | MAKE_NOP(src); |
165 | 2 | ++(*opt_count); |
166 | 2.03k | } else { |
167 | 2.03k | zval c; |
168 | 2.03k | ZVAL_COPY(&c, &ZEND_OP1_LITERAL(src)); |
169 | 2.03k | if (opline->opcode != ZEND_CASE |
170 | 2.03k | && opline->opcode != ZEND_CASE_STRICT |
171 | 2.03k | && opline->opcode != ZEND_FETCH_LIST_R |
172 | 2.02k | && opline->opcode != ZEND_SWITCH_LONG |
173 | 2.02k | && opline->opcode != ZEND_SWITCH_STRING |
174 | 2.02k | && opline->opcode != ZEND_MATCH |
175 | 2.01k | && opline->opcode != ZEND_MATCH_ERROR |
176 | 2.01k | && zend_optimizer_update_op1_const(op_array, opline, &c)) { |
177 | 2.00k | VAR_SOURCE(op1) = NULL; |
178 | 2.00k | if (opline->opcode != ZEND_JMP_NULL |
179 | 2.00k | && !zend_bitset_in(used_ext, VAR_NUM(src->result.var))) { |
180 | 1.25k | literal_dtor(&ZEND_OP1_LITERAL(src)); |
181 | 1.25k | MAKE_NOP(src); |
182 | 1.25k | } |
183 | 2.00k | ++(*opt_count); |
184 | 2.00k | } else { |
185 | 22 | zval_ptr_dtor_nogc(&c); |
186 | 22 | } |
187 | 2.03k | } |
188 | 2.03k | } |
189 | 748k | } |
190 | | |
191 | | /* Constant Propagation: strip X = QM_ASSIGN(const) */ |
192 | 3.52M | if (opline->op2_type == IS_TMP_VAR) { |
193 | 544k | src = VAR_SOURCE(opline->op2); |
194 | 544k | if (src && |
195 | 511k | src->opcode == ZEND_QM_ASSIGN && |
196 | 116 | src->op1_type == IS_CONST) { |
197 | | |
198 | 88 | znode_op op2 = opline->op2; |
199 | 88 | zval c; |
200 | | |
201 | 88 | ZVAL_COPY(&c, &ZEND_OP1_LITERAL(src)); |
202 | 88 | if (zend_optimizer_update_op2_const(op_array, opline, &c)) { |
203 | 76 | VAR_SOURCE(op2) = NULL; |
204 | 76 | if (!zend_bitset_in(used_ext, VAR_NUM(src->result.var))) { |
205 | 76 | literal_dtor(&ZEND_OP1_LITERAL(src)); |
206 | 76 | MAKE_NOP(src); |
207 | 76 | } |
208 | 76 | ++(*opt_count); |
209 | 76 | } else { |
210 | 12 | zval_ptr_dtor_nogc(&c); |
211 | 12 | } |
212 | 88 | } |
213 | 544k | } |
214 | | |
215 | 3.52M | switch (opline->opcode) { |
216 | 169k | case ZEND_ECHO: |
217 | 169k | if (opline->op1_type & (IS_TMP_VAR|IS_VAR)) { |
218 | 35.0k | src = VAR_SOURCE(opline->op1); |
219 | 35.0k | if (src && |
220 | 34.6k | src->opcode == ZEND_CAST && |
221 | 135 | src->extended_value == IS_STRING) { |
222 | | /* T = CAST(X, String), ECHO(T) => NOP, ECHO(X) */ |
223 | 85 | VAR_SOURCE(opline->op1) = NULL; |
224 | 85 | COPY_NODE(opline->op1, src->op1); |
225 | 85 | MAKE_NOP(src); |
226 | 85 | ++(*opt_count); |
227 | 85 | } |
228 | 133k | } else if (opline->op1_type == IS_CONST && |
229 | 132k | Z_TYPE(ZEND_OP1_LITERAL(opline)) != IS_DOUBLE) { |
230 | 132k | if (last_op == opline - 1) { |
231 | | /* compress consecutive ECHO's. |
232 | | * Float to string conversion may be affected by current |
233 | | * locale setting. |
234 | | */ |
235 | 5.36k | size_t l, old_len; |
236 | | |
237 | 5.36k | if (Z_TYPE(ZEND_OP1_LITERAL(opline)) != IS_STRING) { |
238 | 60 | convert_to_string(&ZEND_OP1_LITERAL(opline)); |
239 | 60 | } |
240 | 5.36k | if (Z_TYPE(ZEND_OP1_LITERAL(last_op)) != IS_STRING) { |
241 | 35 | convert_to_string(&ZEND_OP1_LITERAL(last_op)); |
242 | 35 | } |
243 | 5.36k | old_len = Z_STRLEN(ZEND_OP1_LITERAL(last_op)); |
244 | 5.36k | l = old_len + Z_STRLEN(ZEND_OP1_LITERAL(opline)); |
245 | 5.36k | if (!Z_REFCOUNTED(ZEND_OP1_LITERAL(last_op))) { |
246 | 1.92k | zend_string *tmp = zend_string_alloc(l, 0); |
247 | 1.92k | memcpy(ZSTR_VAL(tmp), Z_STRVAL(ZEND_OP1_LITERAL(last_op)), old_len); |
248 | 1.92k | Z_STR(ZEND_OP1_LITERAL(last_op)) = tmp; |
249 | 3.43k | } else { |
250 | 3.43k | Z_STR(ZEND_OP1_LITERAL(last_op)) = zend_string_extend(Z_STR(ZEND_OP1_LITERAL(last_op)), l, 0); |
251 | 3.43k | } |
252 | 5.36k | Z_TYPE_INFO(ZEND_OP1_LITERAL(last_op)) = IS_STRING_EX; |
253 | 5.36k | memcpy(Z_STRVAL(ZEND_OP1_LITERAL(last_op)) + old_len, Z_STRVAL(ZEND_OP1_LITERAL(opline)), Z_STRLEN(ZEND_OP1_LITERAL(opline))); |
254 | 5.36k | Z_STRVAL(ZEND_OP1_LITERAL(last_op))[l] = '\0'; |
255 | 5.36k | zval_ptr_dtor_nogc(&ZEND_OP1_LITERAL(opline)); |
256 | 5.36k | ZVAL_STR(&ZEND_OP1_LITERAL(opline), zend_new_interned_string(Z_STR(ZEND_OP1_LITERAL(last_op)))); |
257 | 5.36k | ZVAL_NULL(&ZEND_OP1_LITERAL(last_op)); |
258 | 5.36k | MAKE_NOP(last_op); |
259 | 5.36k | ++(*opt_count); |
260 | 5.36k | } |
261 | 132k | last_op = opline; |
262 | 132k | } |
263 | 169k | break; |
264 | | |
265 | 538 | case ZEND_MATCH_ERROR: |
266 | 538 | if (opline->op1_type & (IS_TMP_VAR|IS_VAR)) { |
267 | 216 | src = VAR_SOURCE(opline->op1); |
268 | 216 | VAR_SOURCE(opline->op1) = NULL; |
269 | 216 | } |
270 | 538 | break; |
271 | | |
272 | 52.5k | case ZEND_FREE: |
273 | | /* Note: Only remove the source if the source is local to this block. |
274 | | * If it's not local, then the other blocks successors must also eventually either FREE or consume the temporary, |
275 | | * hence removing the temporary is not safe in the general case, especially when other consumers are not FREE. |
276 | | * A FREE may not be removed without also removing the source's result, because otherwise that would cause a memory leak. */ |
277 | 52.5k | if (opline->extended_value == ZEND_FREE_VOID_CAST) { |
278 | | /* Keep the ZEND_FREE opcode alive. */ |
279 | 52.4k | } else if (opline->op1_type == IS_TMP_VAR) { |
280 | 33.2k | src = VAR_SOURCE(opline->op1); |
281 | 33.2k | if (src) { |
282 | 29.6k | switch (src->opcode) { |
283 | 59 | case ZEND_BOOL: |
284 | 281 | case ZEND_BOOL_NOT: |
285 | | /* T = BOOL(X), FREE(T) => T = BOOL(X) */ |
286 | | /* The remaining BOOL is removed by a separate optimization */ |
287 | | /* The source is a bool, no source removals take place, so this may be done non-locally. */ |
288 | 281 | VAR_SOURCE(opline->op1) = NULL; |
289 | 281 | MAKE_NOP(opline); |
290 | 281 | ++(*opt_count); |
291 | 281 | break; |
292 | 920 | case ZEND_ASSIGN: |
293 | 930 | case ZEND_ASSIGN_DIM: |
294 | 937 | case ZEND_ASSIGN_OBJ: |
295 | 937 | case ZEND_ASSIGN_STATIC_PROP: |
296 | 1.29k | case ZEND_ASSIGN_OP: |
297 | 1.29k | case ZEND_ASSIGN_DIM_OP: |
298 | 1.30k | case ZEND_ASSIGN_OBJ_OP: |
299 | 1.30k | case ZEND_ASSIGN_STATIC_PROP_OP: |
300 | 1.30k | case ZEND_PRE_INC: |
301 | 1.30k | case ZEND_PRE_DEC: |
302 | 1.30k | case ZEND_PRE_INC_OBJ: |
303 | 1.30k | case ZEND_PRE_DEC_OBJ: |
304 | 1.30k | case ZEND_PRE_INC_STATIC_PROP: |
305 | 1.30k | case ZEND_PRE_DEC_STATIC_PROP: |
306 | 1.30k | if (src < op_array->opcodes + block->start) { |
307 | 0 | break; |
308 | 0 | } |
309 | 1.30k | src->result_type = IS_UNUSED; |
310 | 1.30k | VAR_SOURCE(opline->op1) = NULL; |
311 | 1.30k | MAKE_NOP(opline); |
312 | 1.30k | ++(*opt_count); |
313 | 1.30k | break; |
314 | 28.0k | default: |
315 | 28.0k | break; |
316 | 29.6k | } |
317 | 29.6k | } |
318 | 33.2k | } else if (opline->op1_type == IS_VAR) { |
319 | 19.1k | src = VAR_SOURCE(opline->op1); |
320 | | /* V = OP, FREE(V) => OP. NOP */ |
321 | 19.1k | if (src >= op_array->opcodes + block->start && |
322 | 18.2k | src->opcode != ZEND_FETCH_R && |
323 | 18.2k | src->opcode != ZEND_FETCH_STATIC_PROP_R && |
324 | 18.2k | src->opcode != ZEND_FETCH_DIM_R && |
325 | 18.2k | src->opcode != ZEND_FETCH_OBJ_R && |
326 | 18.1k | src->opcode != ZEND_NEW && |
327 | 1.25k | src->opcode != ZEND_FETCH_THIS) { |
328 | 1.25k | src->result_type = IS_UNUSED; |
329 | 1.25k | MAKE_NOP(opline); |
330 | 1.25k | ++(*opt_count); |
331 | 1.25k | if (src->opcode == ZEND_QM_ASSIGN) { |
332 | 32 | if (src->op1_type & (IS_VAR|IS_TMP_VAR)) { |
333 | 0 | src->opcode = ZEND_FREE; |
334 | 32 | } else { |
335 | 32 | MAKE_NOP(src); |
336 | 32 | } |
337 | 32 | } |
338 | 1.25k | } |
339 | 19.1k | } |
340 | 52.5k | break; |
341 | | |
342 | | #if 0 |
343 | | /* pre-evaluate functions: |
344 | | constant(x) |
345 | | function_exists(x) |
346 | | extension_loaded(x) |
347 | | BAD: interacts badly with Accelerator |
348 | | */ |
349 | | if((opline->op1_type & IS_VAR) && |
350 | | VAR_SOURCE(opline->op1) && VAR_SOURCE(opline->op1)->opcode == ZEND_DO_CF_FCALL && |
351 | | VAR_SOURCE(opline->op1)->extended_value == 1) { |
352 | | zend_op *fcall = VAR_SOURCE(opline->op1); |
353 | | zend_op *sv = fcall-1; |
354 | | if(sv >= block->start_opline && sv->opcode == ZEND_SEND_VAL && |
355 | | sv->op1_type == IS_CONST && Z_TYPE(OPLINE_OP1_LITERAL(sv)) == IS_STRING && |
356 | | Z_LVAL(OPLINE_OP2_LITERAL(sv)) == 1 |
357 | | ) { |
358 | | zval *arg = &OPLINE_OP1_LITERAL(sv); |
359 | | char *fname = FUNCTION_CACHE->funcs[Z_LVAL(ZEND_OP1_LITERAL(fcall))].function_name; |
360 | | size_t flen = FUNCTION_CACHE->funcs[Z_LVAL(ZEND_OP1_LITERAL(fcall))].name_len; |
361 | | if((flen == sizeof("function_exists")-1 && zend_binary_strcasecmp(fname, flen, "function_exists", sizeof("function_exists")-1) == 0) || |
362 | | (flen == sizeof("is_callable")-1 && zend_binary_strcasecmp(fname, flen, "is_callable", sizeof("is_callable")-1) == 0) |
363 | | ) { |
364 | | zend_function *function; |
365 | | if((function = zend_hash_find_ptr(EG(function_table), Z_STR_P(arg))) != NULL) { |
366 | | literal_dtor(arg); |
367 | | MAKE_NOP(sv); |
368 | | MAKE_NOP(fcall); |
369 | | LITERAL_BOOL(opline->op1, 1); |
370 | | opline->op1_type = IS_CONST; |
371 | | } |
372 | | } else if(flen == sizeof("constant")-1 && zend_binary_strcasecmp(fname, flen, "constant", sizeof("constant")-1) == 0) { |
373 | | zval c; |
374 | | if (zend_optimizer_get_persistent_constant(Z_STR_P(arg), &c, 1 ELS_CC)) { |
375 | | literal_dtor(arg); |
376 | | MAKE_NOP(sv); |
377 | | MAKE_NOP(fcall); |
378 | | ZEND_OP1_LITERAL(opline) = zend_optimizer_add_literal(op_array, &c); |
379 | | /* no copy ctor - get already copied it */ |
380 | | opline->op1_type = IS_CONST; |
381 | | } |
382 | | } else if(flen == sizeof("extension_loaded")-1 && zend_binary_strcasecmp(fname, flen, "extension_loaded", sizeof("extension_loaded")-1) == 0) { |
383 | | if(zend_hash_exists(&module_registry, Z_STR_P(arg))) { |
384 | | literal_dtor(arg); |
385 | | MAKE_NOP(sv); |
386 | | MAKE_NOP(fcall); |
387 | | LITERAL_BOOL(opline->op1, 1); |
388 | | opline->op1_type = IS_CONST; |
389 | | } |
390 | | } |
391 | | } |
392 | | } |
393 | | #endif |
394 | | |
395 | 52.5k | case ZEND_FETCH_LIST_R: |
396 | 1.86k | case ZEND_FETCH_LIST_W: |
397 | 1.86k | if (opline->op1_type & (IS_TMP_VAR|IS_VAR)) { |
398 | | /* LIST variable will be deleted later by FREE */ |
399 | 1.59k | Tsource[VAR_NUM(opline->op1.var)] = NULL; |
400 | 1.59k | } |
401 | 1.86k | break; |
402 | | |
403 | 8 | case ZEND_SWITCH_LONG: |
404 | 75 | case ZEND_SWITCH_STRING: |
405 | 389 | case ZEND_MATCH: |
406 | 389 | if (opline->op1_type & (IS_TMP_VAR|IS_VAR)) { |
407 | | /* SWITCH variable will be deleted later by FREE, so we can't optimize it */ |
408 | 125 | Tsource[VAR_NUM(opline->op1.var)] = NULL; |
409 | 125 | break; |
410 | 125 | } |
411 | 264 | if (opline->op1_type == IS_CONST) { |
412 | 62 | int target = get_const_switch_target(cfg, op_array, block, opline, &ZEND_OP1_LITERAL(opline)); |
413 | 62 | literal_dtor(&ZEND_OP1_LITERAL(opline)); |
414 | 62 | literal_dtor(&ZEND_OP2_LITERAL(opline)); |
415 | 62 | opline->opcode = ZEND_JMP; |
416 | 62 | opline->op1_type = IS_UNUSED; |
417 | 62 | opline->op2_type = IS_UNUSED; |
418 | 62 | block->successors_count = 1; |
419 | 62 | block->successors[0] = target; |
420 | 62 | } |
421 | 264 | break; |
422 | | |
423 | 0 | case ZEND_EXT_STMT: |
424 | 0 | if (opline->op1_type & (IS_TMP_VAR|IS_VAR)) { |
425 | | /* Variable will be deleted later by FREE, so we can't optimize it */ |
426 | 0 | Tsource[VAR_NUM(opline->op1.var)] = NULL; |
427 | 0 | break; |
428 | 0 | } |
429 | 0 | break; |
430 | | |
431 | 169 | case ZEND_CASE: |
432 | 409 | case ZEND_CASE_STRICT: |
433 | 895 | case ZEND_COPY_TMP: |
434 | 895 | if (opline->op1_type & (IS_TMP_VAR|IS_VAR)) { |
435 | | /* Variable will be deleted later by FREE, so we can't optimize it */ |
436 | 895 | Tsource[VAR_NUM(opline->op1.var)] = NULL; |
437 | 895 | break; |
438 | 895 | } |
439 | 0 | if (opline->op1_type == IS_CONST && |
440 | 0 | opline->op2_type == IS_CONST) { |
441 | 0 | goto optimize_constant_binary_op; |
442 | 0 | } |
443 | | /* |
444 | | * CASE(TRUE, X) => BOOL(X) |
445 | | * CASE(FALSE, X) => BOOL_NOT(X) |
446 | | */ |
447 | 0 | if (opline->op1_type == IS_CONST && |
448 | 0 | (Z_TYPE(ZEND_OP1_LITERAL(opline)) == IS_FALSE || |
449 | 0 | Z_TYPE(ZEND_OP1_LITERAL(opline)) == IS_TRUE)) { |
450 | | /* Optimization of comparison with "null" is not safe, |
451 | | * because ("0" == null) is not equal to !("0") |
452 | | */ |
453 | 0 | opline->opcode = |
454 | 0 | ((opline->opcode != ZEND_IS_NOT_EQUAL) == ((Z_TYPE(ZEND_OP1_LITERAL(opline))) == IS_TRUE)) ? |
455 | 0 | ZEND_BOOL : ZEND_BOOL_NOT; |
456 | 0 | COPY_NODE(opline->op1, opline->op2); |
457 | 0 | SET_UNUSED(opline->op2); |
458 | 0 | ++(*opt_count); |
459 | 0 | goto optimize_bool; |
460 | 0 | } else if (opline->op2_type == IS_CONST && |
461 | 0 | (Z_TYPE(ZEND_OP2_LITERAL(opline)) == IS_FALSE || |
462 | 0 | Z_TYPE(ZEND_OP2_LITERAL(opline)) == IS_TRUE)) { |
463 | | /* Optimization of comparison with "null" is not safe, |
464 | | * because ("0" == null) is not equal to !("0") |
465 | | */ |
466 | 0 | opline->opcode = |
467 | 0 | ((opline->opcode != ZEND_IS_NOT_EQUAL) == ((Z_TYPE(ZEND_OP2_LITERAL(opline))) == IS_TRUE)) ? |
468 | 0 | ZEND_BOOL : ZEND_BOOL_NOT; |
469 | 0 | SET_UNUSED(opline->op2); |
470 | 0 | ++(*opt_count); |
471 | 0 | goto optimize_bool; |
472 | 0 | } |
473 | 0 | break; |
474 | | |
475 | 22.9k | case ZEND_IS_EQUAL: |
476 | 25.8k | case ZEND_IS_NOT_EQUAL: |
477 | 25.8k | if (opline->op1_type == IS_CONST && |
478 | 0 | opline->op2_type == IS_CONST) { |
479 | 0 | goto optimize_constant_binary_op; |
480 | 0 | } |
481 | | /* IS_EQ(TRUE, X) => BOOL(X) |
482 | | * IS_EQ(FALSE, X) => BOOL_NOT(X) |
483 | | * IS_NOT_EQ(TRUE, X) => BOOL_NOT(X) |
484 | | * IS_NOT_EQ(FALSE, X) => BOOL(X) |
485 | | * Those optimizations are not safe if the other operand ends up being NAN |
486 | | * as BOOL/BOOL_NOT will warn, while IS_EQUAL/IS_NOT_EQUAL do not. |
487 | | */ |
488 | 25.8k | break; |
489 | 25.8k | case ZEND_IS_IDENTICAL: |
490 | 2.52k | if (opline->op1_type == IS_CONST && |
491 | 0 | opline->op2_type == IS_CONST) { |
492 | 0 | goto optimize_constant_binary_op; |
493 | 0 | } |
494 | | |
495 | 2.52k | if (opline->op1_type == IS_CONST && |
496 | 0 | (Z_TYPE(ZEND_OP1_LITERAL(opline)) <= IS_TRUE && Z_TYPE(ZEND_OP1_LITERAL(opline)) >= IS_NULL)) { |
497 | | /* IS_IDENTICAL(TRUE, T) => TYPE_CHECK(T, TRUE) |
498 | | * IS_IDENTICAL(FALSE, T) => TYPE_CHECK(T, FALSE) |
499 | | * IS_IDENTICAL(NULL, T) => TYPE_CHECK(T, NULL) |
500 | | */ |
501 | 0 | opline->opcode = ZEND_TYPE_CHECK; |
502 | 0 | opline->extended_value = (1 << Z_TYPE(ZEND_OP1_LITERAL(opline))); |
503 | 0 | COPY_NODE(opline->op1, opline->op2); |
504 | 0 | SET_UNUSED(opline->op2); |
505 | 0 | ++(*opt_count); |
506 | 0 | goto optimize_type_check; |
507 | 2.52k | } else if (opline->op2_type == IS_CONST && |
508 | 1.64k | (Z_TYPE(ZEND_OP2_LITERAL(opline)) <= IS_TRUE && Z_TYPE(ZEND_OP2_LITERAL(opline)) >= IS_NULL)) { |
509 | | /* IS_IDENTICAL(T, TRUE) => TYPE_CHECK(T, TRUE) |
510 | | * IS_IDENTICAL(T, FALSE) => TYPE_CHECK(T, FALSE) |
511 | | * IS_IDENTICAL(T, NULL) => TYPE_CHECK(T, NULL) |
512 | | */ |
513 | 102 | opline->opcode = ZEND_TYPE_CHECK; |
514 | 102 | opline->extended_value = (1 << Z_TYPE(ZEND_OP2_LITERAL(opline))); |
515 | 102 | SET_UNUSED(opline->op2); |
516 | 102 | ++(*opt_count); |
517 | 102 | goto optimize_type_check; |
518 | 102 | } |
519 | 2.41k | break; |
520 | 2.41k | case ZEND_TYPE_CHECK: |
521 | 1.39k | optimize_type_check: |
522 | 1.39k | if (opline->extended_value == (1 << IS_TRUE) || opline->extended_value == (1 << IS_FALSE)) { |
523 | 186 | if (opline->op1_type == IS_TMP_VAR && |
524 | 146 | !zend_bitset_in(used_ext, VAR_NUM(opline->op1.var))) { |
525 | 146 | src = VAR_SOURCE(opline->op1); |
526 | | |
527 | 146 | if (src) { |
528 | 146 | switch (src->opcode) { |
529 | 0 | case ZEND_BOOL: |
530 | 0 | case ZEND_BOOL_NOT: |
531 | | /* T = BOOL(X) + TYPE_CHECK(T, TRUE) -> BOOL(X), NOP |
532 | | * T = BOOL(X) + TYPE_CHECK(T, FALSE) -> BOOL_NOT(X), NOP |
533 | | * T = BOOL_NOT(X) + TYPE_CHECK(T, TRUE) -> BOOL_NOT(X), NOP |
534 | | * T = BOOL_NOT(X) + TYPE_CHECK(T, FALSE) -> BOOL(X), NOP |
535 | | */ |
536 | 0 | src->opcode = |
537 | 0 | ((src->opcode == ZEND_BOOL) == (opline->extended_value == (1 << IS_TRUE))) ? |
538 | 0 | ZEND_BOOL : ZEND_BOOL_NOT; |
539 | 0 | COPY_NODE(src->result, opline->result); |
540 | 0 | SET_VAR_SOURCE(src); |
541 | 0 | MAKE_NOP(opline); |
542 | 0 | ++(*opt_count); |
543 | 0 | break; |
544 | 146 | } |
545 | 146 | } |
546 | 146 | } |
547 | 186 | } |
548 | 1.39k | break; |
549 | | |
550 | 6.36k | case ZEND_BOOL: |
551 | 19.5k | case ZEND_BOOL_NOT: |
552 | 29.1k | optimize_bool: |
553 | 29.1k | if (opline->op1_type == IS_CONST) { |
554 | 2.29k | goto optimize_const_unary_op; |
555 | 2.29k | } |
556 | 26.8k | if (opline->op1_type == IS_TMP_VAR && |
557 | 24.1k | !zend_bitset_in(used_ext, VAR_NUM(opline->op1.var))) { |
558 | 23.3k | src = VAR_SOURCE(opline->op1); |
559 | 23.3k | if (src) { |
560 | 23.3k | switch (src->opcode) { |
561 | 4.95k | case ZEND_BOOL_NOT: |
562 | | /* T = BOOL_NOT(X) + BOOL(T) -> NOP, BOOL_NOT(X) */ |
563 | 4.95k | VAR_SOURCE(opline->op1) = NULL; |
564 | 4.95k | COPY_NODE(opline->op1, src->op1); |
565 | 4.95k | opline->opcode = (opline->opcode == ZEND_BOOL) ? ZEND_BOOL_NOT : ZEND_BOOL; |
566 | 4.95k | MAKE_NOP(src); |
567 | 4.95k | ++(*opt_count); |
568 | 4.95k | goto optimize_bool; |
569 | 4.69k | case ZEND_BOOL: |
570 | | /* T = BOOL(X) + BOOL(T) -> NOP, BOOL(X) */ |
571 | 4.69k | VAR_SOURCE(opline->op1) = NULL; |
572 | 4.69k | COPY_NODE(opline->op1, src->op1); |
573 | 4.69k | MAKE_NOP(src); |
574 | 4.69k | ++(*opt_count); |
575 | 4.69k | goto optimize_bool; |
576 | 214 | case ZEND_IS_EQUAL: |
577 | 214 | if (opline->opcode == ZEND_BOOL_NOT) { |
578 | 0 | src->opcode = ZEND_IS_NOT_EQUAL; |
579 | 0 | } |
580 | 214 | COPY_NODE(src->result, opline->result); |
581 | 214 | SET_VAR_SOURCE(src); |
582 | 214 | MAKE_NOP(opline); |
583 | 214 | ++(*opt_count); |
584 | 214 | break; |
585 | 170 | case ZEND_IS_NOT_EQUAL: |
586 | 170 | if (opline->opcode == ZEND_BOOL_NOT) { |
587 | 0 | src->opcode = ZEND_IS_EQUAL; |
588 | 0 | } |
589 | 170 | COPY_NODE(src->result, opline->result); |
590 | 170 | SET_VAR_SOURCE(src); |
591 | 170 | MAKE_NOP(opline); |
592 | 170 | ++(*opt_count); |
593 | 170 | break; |
594 | 185 | case ZEND_IS_IDENTICAL: |
595 | 185 | if (opline->opcode == ZEND_BOOL_NOT) { |
596 | 0 | src->opcode = ZEND_IS_NOT_IDENTICAL; |
597 | 0 | } |
598 | 185 | COPY_NODE(src->result, opline->result); |
599 | 185 | SET_VAR_SOURCE(src); |
600 | 185 | MAKE_NOP(opline); |
601 | 185 | ++(*opt_count); |
602 | 185 | break; |
603 | 62 | case ZEND_IS_NOT_IDENTICAL: |
604 | 62 | if (opline->opcode == ZEND_BOOL_NOT) { |
605 | 0 | src->opcode = ZEND_IS_IDENTICAL; |
606 | 0 | } |
607 | 62 | COPY_NODE(src->result, opline->result); |
608 | 62 | SET_VAR_SOURCE(src); |
609 | 62 | MAKE_NOP(opline); |
610 | 62 | ++(*opt_count); |
611 | 62 | break; |
612 | 130 | case ZEND_IS_SMALLER: |
613 | 130 | if (opline->opcode == ZEND_BOOL_NOT) { |
614 | 0 | uint8_t tmp_type; |
615 | 0 | uint32_t tmp; |
616 | |
|
617 | 0 | src->opcode = ZEND_IS_SMALLER_OR_EQUAL; |
618 | 0 | tmp_type = src->op1_type; |
619 | 0 | src->op1_type = src->op2_type; |
620 | 0 | src->op2_type = tmp_type; |
621 | 0 | tmp = src->op1.num; |
622 | 0 | src->op1.num = src->op2.num; |
623 | 0 | src->op2.num = tmp; |
624 | 0 | } |
625 | 130 | COPY_NODE(src->result, opline->result); |
626 | 130 | SET_VAR_SOURCE(src); |
627 | 130 | MAKE_NOP(opline); |
628 | 130 | ++(*opt_count); |
629 | 130 | break; |
630 | 247 | case ZEND_IS_SMALLER_OR_EQUAL: |
631 | 247 | if (opline->opcode == ZEND_BOOL_NOT) { |
632 | 0 | uint8_t tmp_type; |
633 | 0 | uint32_t tmp; |
634 | |
|
635 | 0 | src->opcode = ZEND_IS_SMALLER; |
636 | 0 | tmp_type = src->op1_type; |
637 | 0 | src->op1_type = src->op2_type; |
638 | 0 | src->op2_type = tmp_type; |
639 | 0 | tmp = src->op1.num; |
640 | 0 | src->op1.num = src->op2.num; |
641 | 0 | src->op2.num = tmp; |
642 | 0 | } |
643 | 247 | COPY_NODE(src->result, opline->result); |
644 | 247 | SET_VAR_SOURCE(src); |
645 | 247 | MAKE_NOP(opline); |
646 | 247 | ++(*opt_count); |
647 | 247 | break; |
648 | 10 | case ZEND_ISSET_ISEMPTY_CV: |
649 | 26 | case ZEND_ISSET_ISEMPTY_VAR: |
650 | 298 | case ZEND_ISSET_ISEMPTY_DIM_OBJ: |
651 | 352 | case ZEND_ISSET_ISEMPTY_PROP_OBJ: |
652 | 366 | case ZEND_ISSET_ISEMPTY_STATIC_PROP: |
653 | 401 | case ZEND_INSTANCEOF: |
654 | 528 | case ZEND_TYPE_CHECK: |
655 | 535 | case ZEND_DEFINED: |
656 | 535 | case ZEND_IN_ARRAY: |
657 | 563 | case ZEND_ARRAY_KEY_EXISTS: |
658 | 563 | if (opline->opcode == ZEND_BOOL_NOT) { |
659 | 419 | break; |
660 | 419 | } |
661 | 144 | COPY_NODE(src->result, opline->result); |
662 | 144 | SET_VAR_SOURCE(src); |
663 | 144 | MAKE_NOP(opline); |
664 | 144 | ++(*opt_count); |
665 | 144 | break; |
666 | 23.3k | } |
667 | 23.3k | } |
668 | 23.3k | } |
669 | 17.2k | break; |
670 | | |
671 | 28.9k | case ZEND_JMPZ: |
672 | 41.3k | case ZEND_JMPNZ: |
673 | 42.8k | while (1) { |
674 | 42.8k | if (opline->op1_type == IS_CONST) { |
675 | 788 | ++(*opt_count); |
676 | 788 | block->successors_count = 1; |
677 | 788 | if (zend_is_true(&ZEND_OP1_LITERAL(opline)) == |
678 | 788 | (opline->opcode == ZEND_JMPZ)) { |
679 | | |
680 | 358 | MAKE_NOP(opline); |
681 | 358 | block->successors[0] = block->successors[1]; |
682 | 358 | block->len--; |
683 | 358 | cfg->blocks[block->successors[0]].flags |= ZEND_BB_FOLLOW; |
684 | 358 | break; |
685 | 430 | } else { |
686 | 430 | zend_basic_block *next = cfg->blocks + block->successors[1]; |
687 | | |
688 | 430 | next->flags &= ~ZEND_BB_FOLLOW; |
689 | 430 | if (!(next->flags & (ZEND_BB_TARGET|ZEND_BB_PROTECTED))) { |
690 | 352 | next->flags &= ~ZEND_BB_REACHABLE; |
691 | 352 | } |
692 | 430 | opline->opcode = ZEND_JMP; |
693 | 430 | COPY_NODE(opline->op1, opline->op2); |
694 | 430 | break; |
695 | 430 | } |
696 | 42.0k | } else if (opline->op1_type == IS_TMP_VAR && |
697 | 39.2k | !zend_bitset_in(used_ext, VAR_NUM(opline->op1.var))) { |
698 | 38.4k | src = VAR_SOURCE(opline->op1); |
699 | 38.4k | if (src) { |
700 | 38.4k | if (src->opcode == ZEND_BOOL_NOT) { |
701 | 723 | VAR_SOURCE(opline->op1) = NULL; |
702 | 723 | COPY_NODE(opline->op1, src->op1); |
703 | | /* T = BOOL_NOT(X) + JMPZ(T) -> NOP, JMPNZ(X) */ |
704 | 723 | opline->opcode = INV_COND(opline->opcode); |
705 | 723 | MAKE_NOP(src); |
706 | 723 | ++(*opt_count); |
707 | 723 | continue; |
708 | 37.7k | } else if (src->opcode == ZEND_BOOL || |
709 | 36.9k | src->opcode == ZEND_QM_ASSIGN) { |
710 | 811 | VAR_SOURCE(opline->op1) = NULL; |
711 | 811 | COPY_NODE(opline->op1, src->op1); |
712 | 811 | MAKE_NOP(src); |
713 | 811 | ++(*opt_count); |
714 | 811 | continue; |
715 | 811 | } |
716 | 38.4k | } |
717 | 38.4k | } |
718 | 40.5k | break; |
719 | 42.8k | } |
720 | 41.3k | break; |
721 | | |
722 | 2.22k | case ZEND_JMPZ_EX: |
723 | 4.88k | case ZEND_JMPNZ_EX: |
724 | 5.47k | while (1) { |
725 | 5.47k | if (opline->op1_type == IS_CONST) { |
726 | 1.11k | bool is_jmpz_ex = opline->opcode == ZEND_JMPZ_EX; |
727 | 1.11k | if (zend_is_true(&ZEND_OP1_LITERAL(opline)) == is_jmpz_ex) { |
728 | | |
729 | 317 | ++(*opt_count); |
730 | 317 | opline->opcode = ZEND_QM_ASSIGN; |
731 | 317 | zval_ptr_dtor_nogc(&ZEND_OP1_LITERAL(opline)); |
732 | 317 | ZVAL_BOOL(&ZEND_OP1_LITERAL(opline), is_jmpz_ex); |
733 | 317 | opline->op2.num = 0; |
734 | 317 | block->successors_count = 1; |
735 | 317 | block->successors[0] = block->successors[1]; |
736 | 317 | cfg->blocks[block->successors[0]].flags |= ZEND_BB_FOLLOW; |
737 | 317 | break; |
738 | 317 | } |
739 | 4.36k | } else if (opline->op1_type == IS_TMP_VAR && |
740 | 4.06k | (!zend_bitset_in(used_ext, VAR_NUM(opline->op1.var)) || |
741 | 3.56k | opline->result.var == opline->op1.var)) { |
742 | 3.56k | src = VAR_SOURCE(opline->op1); |
743 | 3.56k | if (src) { |
744 | 3.09k | if (src->opcode == ZEND_BOOL || |
745 | 2.50k | src->opcode == ZEND_QM_ASSIGN) { |
746 | 595 | VAR_SOURCE(opline->op1) = NULL; |
747 | 595 | COPY_NODE(opline->op1, src->op1); |
748 | 595 | MAKE_NOP(src); |
749 | 595 | ++(*opt_count); |
750 | 595 | continue; |
751 | 595 | } |
752 | 3.09k | } |
753 | 3.56k | } |
754 | 4.56k | break; |
755 | 5.47k | } |
756 | 4.88k | break; |
757 | | |
758 | 73.9k | case ZEND_CONCAT: |
759 | 103k | case ZEND_FAST_CONCAT: |
760 | 103k | if (opline->op1_type == IS_CONST && |
761 | 24.6k | opline->op2_type == IS_CONST) { |
762 | 0 | goto optimize_constant_binary_op; |
763 | 0 | } |
764 | | |
765 | 103k | if (opline->op2_type == IS_CONST && |
766 | 38.9k | opline->op1_type == IS_TMP_VAR) { |
767 | | |
768 | 25.7k | src = VAR_SOURCE(opline->op1); |
769 | 25.7k | if (src && |
770 | 25.7k | (src->opcode == ZEND_CONCAT || |
771 | 21.2k | src->opcode == ZEND_FAST_CONCAT) && |
772 | 23.7k | src->op2_type == IS_CONST) { |
773 | | /* compress consecutive CONCATs */ |
774 | 953 | size_t l, old_len; |
775 | | |
776 | 953 | if (Z_TYPE(ZEND_OP2_LITERAL(opline)) != IS_STRING) { |
777 | 0 | convert_to_string(&ZEND_OP2_LITERAL(opline)); |
778 | 0 | } |
779 | 953 | if (Z_TYPE(ZEND_OP2_LITERAL(src)) != IS_STRING) { |
780 | 0 | convert_to_string(&ZEND_OP2_LITERAL(src)); |
781 | 0 | } |
782 | | |
783 | 953 | VAR_SOURCE(opline->op1) = NULL; |
784 | 953 | COPY_NODE(opline->op1, src->op1); |
785 | 953 | old_len = Z_STRLEN(ZEND_OP2_LITERAL(src)); |
786 | 953 | l = old_len + Z_STRLEN(ZEND_OP2_LITERAL(opline)); |
787 | 953 | if (!Z_REFCOUNTED(ZEND_OP2_LITERAL(src))) { |
788 | 274 | zend_string *tmp = zend_string_alloc(l, 0); |
789 | 274 | memcpy(ZSTR_VAL(tmp), Z_STRVAL(ZEND_OP2_LITERAL(src)), old_len); |
790 | 274 | Z_STR(ZEND_OP2_LITERAL(src)) = tmp; |
791 | 679 | } else { |
792 | 679 | Z_STR(ZEND_OP2_LITERAL(src)) = zend_string_extend(Z_STR(ZEND_OP2_LITERAL(src)), l, 0); |
793 | 679 | } |
794 | 953 | Z_TYPE_INFO(ZEND_OP2_LITERAL(src)) = IS_STRING_EX; |
795 | 953 | memcpy(Z_STRVAL(ZEND_OP2_LITERAL(src)) + old_len, Z_STRVAL(ZEND_OP2_LITERAL(opline)), Z_STRLEN(ZEND_OP2_LITERAL(opline))); |
796 | 953 | Z_STRVAL(ZEND_OP2_LITERAL(src))[l] = '\0'; |
797 | 953 | zval_ptr_dtor_str(&ZEND_OP2_LITERAL(opline)); |
798 | 953 | ZVAL_STR(&ZEND_OP2_LITERAL(opline), zend_new_interned_string(Z_STR(ZEND_OP2_LITERAL(src)))); |
799 | 953 | ZVAL_NULL(&ZEND_OP2_LITERAL(src)); |
800 | 953 | MAKE_NOP(src); |
801 | 953 | ++(*opt_count); |
802 | 953 | } |
803 | 25.7k | } |
804 | | |
805 | 103k | if (opline->op1_type & (IS_TMP_VAR|IS_VAR)) { |
806 | 40.2k | src = VAR_SOURCE(opline->op1); |
807 | 40.2k | if (src && |
808 | 39.9k | src->opcode == ZEND_CAST && |
809 | 12 | src->extended_value == IS_STRING && |
810 | 6 | src->op1_type != IS_CONST) { |
811 | | /* convert T1 = CAST(STRING, X), T2 = CONCAT(T1, Y) to T2 = CONCAT(X,Y) */ |
812 | 4 | VAR_SOURCE(opline->op1) = NULL; |
813 | 4 | COPY_NODE(opline->op1, src->op1); |
814 | 4 | MAKE_NOP(src); |
815 | 4 | ++(*opt_count); |
816 | 4 | } |
817 | 40.2k | } |
818 | 103k | if (opline->op2_type & (IS_TMP_VAR|IS_VAR)) { |
819 | 60.5k | src = VAR_SOURCE(opline->op2); |
820 | 60.5k | if (src && |
821 | 60.3k | src->opcode == ZEND_CAST && |
822 | 203 | src->extended_value == IS_STRING && |
823 | 103 | src->op1_type != IS_CONST) { |
824 | | /* convert T1 = CAST(STRING, X), T2 = CONCAT(Y, T1) to T2 = CONCAT(Y,X) */ |
825 | 15 | zend_op *src = VAR_SOURCE(opline->op2); |
826 | 15 | VAR_SOURCE(opline->op2) = NULL; |
827 | 15 | COPY_NODE(opline->op2, src->op1); |
828 | 15 | MAKE_NOP(src); |
829 | 15 | ++(*opt_count); |
830 | 15 | } |
831 | 60.5k | } |
832 | 103k | if (opline->op1_type == IS_CONST && |
833 | 24.6k | Z_TYPE(ZEND_OP1_LITERAL(opline)) == IS_STRING && |
834 | 24.6k | Z_STRLEN(ZEND_OP1_LITERAL(opline)) == 0) { |
835 | | /* convert CONCAT('', X) => CAST(STRING, X) */ |
836 | 14 | literal_dtor(&ZEND_OP1_LITERAL(opline)); |
837 | 14 | opline->opcode = ZEND_CAST; |
838 | 14 | opline->extended_value = IS_STRING; |
839 | 14 | COPY_NODE(opline->op1, opline->op2); |
840 | 14 | opline->op2_type = IS_UNUSED; |
841 | 14 | opline->op2.var = 0; |
842 | 14 | ++(*opt_count); |
843 | 103k | } else if (opline->op2_type == IS_CONST && |
844 | 38.9k | Z_TYPE(ZEND_OP2_LITERAL(opline)) == IS_STRING && |
845 | 38.9k | Z_STRLEN(ZEND_OP2_LITERAL(opline)) == 0) { |
846 | | /* convert CONCAT(X, '') => CAST(STRING, X) */ |
847 | 22 | literal_dtor(&ZEND_OP2_LITERAL(opline)); |
848 | 22 | opline->opcode = ZEND_CAST; |
849 | 22 | opline->extended_value = IS_STRING; |
850 | 22 | opline->op2_type = IS_UNUSED; |
851 | 22 | opline->op2.var = 0; |
852 | 22 | ++(*opt_count); |
853 | 103k | } else if (opline->opcode == ZEND_CONCAT && |
854 | 73.8k | (opline->op1_type == IS_CONST || |
855 | 60.9k | (opline->op1_type == IS_TMP_VAR && |
856 | 25.5k | VAR_SOURCE(opline->op1) && |
857 | 25.3k | (VAR_SOURCE(opline->op1)->opcode == ZEND_FAST_CONCAT || |
858 | 14.2k | VAR_SOURCE(opline->op1)->opcode == ZEND_ROPE_END || |
859 | 14.1k | VAR_SOURCE(opline->op1)->opcode == ZEND_FETCH_CONSTANT || |
860 | 11.2k | VAR_SOURCE(opline->op1)->opcode == ZEND_FETCH_CLASS_CONSTANT))) && |
861 | 27.0k | (opline->op2_type == IS_CONST || |
862 | 16.7k | (opline->op2_type == IS_TMP_VAR && |
863 | 14.6k | VAR_SOURCE(opline->op2) && |
864 | 14.6k | (VAR_SOURCE(opline->op2)->opcode == ZEND_FAST_CONCAT || |
865 | 14.6k | VAR_SOURCE(opline->op2)->opcode == ZEND_ROPE_END || |
866 | 4.90k | VAR_SOURCE(opline->op2)->opcode == ZEND_FETCH_CONSTANT || |
867 | 22.1k | VAR_SOURCE(opline->op2)->opcode == ZEND_FETCH_CLASS_CONSTANT)))) { |
868 | 22.1k | opline->opcode = ZEND_FAST_CONCAT; |
869 | 22.1k | ++(*opt_count); |
870 | 22.1k | } |
871 | 103k | break; |
872 | | |
873 | 11.4k | case ZEND_ADD: |
874 | 22.3k | case ZEND_SUB: |
875 | 32.9k | case ZEND_MUL: |
876 | 45.8k | case ZEND_DIV: |
877 | 50.4k | case ZEND_MOD: |
878 | 53.7k | case ZEND_SL: |
879 | 55.2k | case ZEND_SR: |
880 | 67.1k | case ZEND_IS_SMALLER: |
881 | 70.5k | case ZEND_IS_SMALLER_OR_EQUAL: |
882 | 71.2k | case ZEND_IS_NOT_IDENTICAL: |
883 | 73.6k | case ZEND_BOOL_XOR: |
884 | 75.5k | case ZEND_BW_OR: |
885 | 89.9k | case ZEND_BW_AND: |
886 | 100k | case ZEND_BW_XOR: |
887 | 100k | if (opline->op1_type == IS_CONST && |
888 | 16.7k | opline->op2_type == IS_CONST) { |
889 | | /* evaluate constant expressions */ |
890 | 11.9k | zval result; |
891 | | |
892 | 11.9k | optimize_constant_binary_op: |
893 | 11.9k | if (zend_optimizer_eval_binary_op(&result, opline->opcode, &ZEND_OP1_LITERAL(opline), &ZEND_OP2_LITERAL(opline)) == SUCCESS) { |
894 | 4 | literal_dtor(&ZEND_OP1_LITERAL(opline)); |
895 | 4 | literal_dtor(&ZEND_OP2_LITERAL(opline)); |
896 | 4 | opline->opcode = ZEND_QM_ASSIGN; |
897 | 4 | SET_UNUSED(opline->op2); |
898 | 4 | zend_optimizer_update_op1_const(op_array, opline, &result); |
899 | 4 | ++(*opt_count); |
900 | 4 | } |
901 | 11.9k | } |
902 | 100k | break; |
903 | | |
904 | 100k | case ZEND_BW_NOT: |
905 | 30.8k | if (opline->op1_type == IS_CONST) { |
906 | | /* evaluate constant unary ops */ |
907 | 242 | zval result; |
908 | | |
909 | 2.53k | optimize_const_unary_op: |
910 | 2.53k | if (zend_optimizer_eval_unary_op(&result, opline->opcode, &ZEND_OP1_LITERAL(opline)) == SUCCESS) { |
911 | 2.27k | literal_dtor(&ZEND_OP1_LITERAL(opline)); |
912 | 2.27k | opline->opcode = ZEND_QM_ASSIGN; |
913 | 2.27k | zend_optimizer_update_op1_const(op_array, opline, &result); |
914 | 2.27k | ++(*opt_count); |
915 | 2.27k | } |
916 | 2.53k | } |
917 | 33.1k | break; |
918 | | |
919 | 33.1k | case ZEND_CAST: |
920 | 3.01k | if (opline->op1_type == IS_CONST) { |
921 | | /* cast of constant operand */ |
922 | 387 | zval result; |
923 | | |
924 | 387 | if (zend_optimizer_eval_cast(&result, opline->extended_value, &ZEND_OP1_LITERAL(opline)) == SUCCESS) { |
925 | 4 | literal_dtor(&ZEND_OP1_LITERAL(opline)); |
926 | 4 | opline->opcode = ZEND_QM_ASSIGN; |
927 | 4 | opline->extended_value = 0; |
928 | 4 | zend_optimizer_update_op1_const(op_array, opline, &result); |
929 | 4 | ++(*opt_count); |
930 | 4 | } |
931 | 387 | } |
932 | 3.01k | break; |
933 | | |
934 | 418 | case ZEND_STRLEN: |
935 | 418 | if (opline->op1_type == IS_CONST) { |
936 | 18 | zval result; |
937 | | |
938 | 18 | if (zend_optimizer_eval_strlen(&result, &ZEND_OP1_LITERAL(opline)) == SUCCESS) { |
939 | 0 | literal_dtor(&ZEND_OP1_LITERAL(opline)); |
940 | 0 | opline->opcode = ZEND_QM_ASSIGN; |
941 | 0 | zend_optimizer_update_op1_const(op_array, opline, &result); |
942 | 0 | ++(*opt_count); |
943 | 0 | } |
944 | 18 | } |
945 | 418 | break; |
946 | | |
947 | 145k | case ZEND_RETURN: |
948 | 145k | if (opline->op1_type == IS_TMP_VAR) { |
949 | 4.01k | src = VAR_SOURCE(opline->op1); |
950 | 4.01k | if (src && src->opcode == ZEND_QM_ASSIGN) { |
951 | 144 | zend_op *op = src + 1; |
952 | 144 | bool optimize = true; |
953 | | |
954 | 144 | while (op < opline) { |
955 | 24 | if ((op->op1_type == opline->op1_type |
956 | 4 | && op->op1.var == opline->op1.var) |
957 | 20 | || (op->op2_type == opline->op1_type |
958 | 24 | && op->op2.var == opline->op1.var)) { |
959 | 24 | optimize = false; |
960 | 24 | break; |
961 | 24 | } |
962 | 0 | op++; |
963 | 0 | } |
964 | | |
965 | 144 | if (optimize) { |
966 | | /* T = QM_ASSIGN(X), RETURN(T) to NOP, RETURN(X) */ |
967 | 120 | VAR_SOURCE(opline->op1) = NULL; |
968 | 120 | COPY_NODE(opline->op1, src->op1); |
969 | 120 | MAKE_NOP(src); |
970 | 120 | ++(*opt_count); |
971 | 120 | } |
972 | 144 | } |
973 | 4.01k | } |
974 | 145k | break; |
975 | | |
976 | 18.6k | case ZEND_QM_ASSIGN: |
977 | 18.6k | if (opline->op1_type == opline->result_type && |
978 | 4.79k | opline->op1.var == opline->result.var) { |
979 | | /* strip T = QM_ASSIGN(T) */ |
980 | 0 | MAKE_NOP(opline); |
981 | 0 | ++(*opt_count); |
982 | 18.6k | } else if (opline->op1_type == IS_TMP_VAR && |
983 | 4.79k | opline->result_type == IS_TMP_VAR && |
984 | 4.79k | !zend_bitset_in(used_ext, VAR_NUM(opline->op1.var))) { |
985 | | /* T1 = ..., T2 = QM_ASSIGN(T1) to T2 = ..., NOP */ |
986 | 2.17k | src = VAR_SOURCE(opline->op1); |
987 | 2.17k | if (src && |
988 | 2.17k | src->opcode != ZEND_COPY_TMP && |
989 | 2.17k | src->opcode != ZEND_ADD_ARRAY_ELEMENT && |
990 | 2.17k | src->opcode != ZEND_ADD_ARRAY_UNPACK && |
991 | 2.17k | (src->opcode != ZEND_DECLARE_LAMBDA_FUNCTION || |
992 | 2.17k | src == opline -1)) { |
993 | 2.17k | src->result.var = opline->result.var; |
994 | 2.17k | VAR_SOURCE(opline->op1) = NULL; |
995 | 2.17k | VAR_SOURCE(opline->result) = src; |
996 | 2.17k | MAKE_NOP(opline); |
997 | 2.17k | ++(*opt_count); |
998 | 2.17k | } |
999 | 2.17k | } |
1000 | 18.6k | break; |
1001 | 3.52M | } |
1002 | | |
1003 | | /* get variable source */ |
1004 | 3.52M | if (opline->result_type & (IS_VAR|IS_TMP_VAR)) { |
1005 | 1.65M | SET_VAR_SOURCE(opline); |
1006 | 1.65M | } |
1007 | 3.52M | opline++; |
1008 | 3.52M | } |
1009 | 560k | } |
1010 | | |
1011 | | /* Rebuild plain (optimized) op_array from CFG */ |
1012 | | static void assemble_code_blocks(zend_cfg *cfg, zend_op_array *op_array, zend_optimizer_ctx *ctx) |
1013 | 102k | { |
1014 | 102k | zend_basic_block *blocks = cfg->blocks; |
1015 | 102k | zend_basic_block *end = blocks + cfg->blocks_count; |
1016 | 102k | zend_basic_block *b; |
1017 | 102k | zend_op *new_opcodes; |
1018 | 102k | zend_op *opline; |
1019 | 102k | uint32_t len = 0; |
1020 | | |
1021 | 514k | for (b = blocks; b < end; b++) { |
1022 | 411k | if (b->len == 0) { |
1023 | 35.6k | continue; |
1024 | 35.6k | } |
1025 | 376k | if (b->flags & (ZEND_BB_REACHABLE|ZEND_BB_UNREACHABLE_FREE)) { |
1026 | 360k | opline = op_array->opcodes + b->start + b->len - 1; |
1027 | 360k | if (opline->opcode == ZEND_JMP) { |
1028 | 51.1k | zend_basic_block *next = b + 1; |
1029 | | |
1030 | 62.2k | while (next < end && !(next->flags & ZEND_BB_REACHABLE)) { |
1031 | 11.0k | next++; |
1032 | 11.0k | } |
1033 | 51.1k | if (next < end && next == blocks + b->successors[0]) { |
1034 | | /* JMP to the next block - strip it */ |
1035 | 18 | MAKE_NOP(opline); |
1036 | 18 | b->len--; |
1037 | 18 | } |
1038 | 308k | } else if (b->len == 1 && opline->opcode == ZEND_NOP) { |
1039 | | /* skip empty block */ |
1040 | 0 | b->len--; |
1041 | 0 | } |
1042 | 360k | len += b->len; |
1043 | 360k | } else { |
1044 | | /* this block will not be used, delete all constants there */ |
1045 | 16.3k | zend_op *op = op_array->opcodes + b->start; |
1046 | 16.3k | zend_op *end = op + b->len; |
1047 | 37.4k | for (; op < end; op++) { |
1048 | 21.1k | if (op->op1_type == IS_CONST) { |
1049 | 14.7k | literal_dtor(&ZEND_OP1_LITERAL(op)); |
1050 | 14.7k | } |
1051 | 21.1k | if (op->op2_type == IS_CONST) { |
1052 | 635 | literal_dtor(&ZEND_OP2_LITERAL(op)); |
1053 | 635 | } |
1054 | 21.1k | } |
1055 | 16.3k | } |
1056 | 376k | } |
1057 | | |
1058 | 102k | new_opcodes = emalloc(len * sizeof(zend_op)); |
1059 | 102k | opline = new_opcodes; |
1060 | | |
1061 | | /* Copy code of reachable blocks into a single buffer */ |
1062 | 514k | for (b = blocks; b < end; b++) { |
1063 | 411k | if (b->flags & (ZEND_BB_REACHABLE|ZEND_BB_UNREACHABLE_FREE)) { |
1064 | 360k | memcpy(opline, op_array->opcodes + b->start, b->len * sizeof(zend_op)); |
1065 | 360k | b->start = opline - new_opcodes; |
1066 | 360k | opline += b->len; |
1067 | 360k | } |
1068 | 411k | } |
1069 | | |
1070 | | /* adjust jump targets */ |
1071 | 102k | efree(op_array->opcodes); |
1072 | 102k | op_array->opcodes = new_opcodes; |
1073 | 102k | op_array->last = len; |
1074 | | |
1075 | 514k | for (b = blocks; b < end; b++) { |
1076 | 411k | if (!(b->flags & ZEND_BB_REACHABLE) || b->len == 0) { |
1077 | 51.9k | continue; |
1078 | 51.9k | } |
1079 | 360k | opline = op_array->opcodes + b->start + b->len - 1; |
1080 | 360k | switch (opline->opcode) { |
1081 | 663 | case ZEND_FAST_CALL: |
1082 | 51.8k | case ZEND_JMP: |
1083 | 51.8k | ZEND_SET_OP_JMP_ADDR(opline, opline->op1, new_opcodes + blocks[b->successors[0]].start); |
1084 | 51.8k | break; |
1085 | 16.6k | case ZEND_JMPZ: |
1086 | 26.2k | case ZEND_JMPNZ: |
1087 | 27.5k | case ZEND_JMPZ_EX: |
1088 | 28.9k | case ZEND_JMPNZ_EX: |
1089 | 41.7k | case ZEND_FE_RESET_R: |
1090 | 42.5k | case ZEND_FE_RESET_RW: |
1091 | 43.9k | case ZEND_JMP_SET: |
1092 | 48.2k | case ZEND_COALESCE: |
1093 | 49.7k | case ZEND_ASSERT_CHECK: |
1094 | 81.5k | case ZEND_JMP_NULL: |
1095 | 81.7k | case ZEND_BIND_INIT_STATIC_OR_JMP: |
1096 | 81.7k | case ZEND_JMP_FRAMELESS: |
1097 | 81.7k | ZEND_SET_OP_JMP_ADDR(opline, opline->op2, new_opcodes + blocks[b->successors[0]].start); |
1098 | 81.7k | break; |
1099 | 5.62k | case ZEND_CATCH: |
1100 | 5.62k | if (!(opline->extended_value & ZEND_LAST_CATCH)) { |
1101 | 4.24k | ZEND_SET_OP_JMP_ADDR(opline, opline->op2, new_opcodes + blocks[b->successors[0]].start); |
1102 | 4.24k | } |
1103 | 5.62k | break; |
1104 | 12.8k | case ZEND_FE_FETCH_R: |
1105 | 13.5k | case ZEND_FE_FETCH_RW: |
1106 | 13.5k | opline->extended_value = ZEND_OPLINE_TO_OFFSET(opline, new_opcodes + blocks[b->successors[0]].start); |
1107 | 13.5k | break; |
1108 | 8 | case ZEND_SWITCH_LONG: |
1109 | 58 | case ZEND_SWITCH_STRING: |
1110 | 232 | case ZEND_MATCH: |
1111 | 232 | { |
1112 | 232 | HashTable *jumptable = Z_ARRVAL(ZEND_OP2_LITERAL(opline)); |
1113 | 232 | zval *zv; |
1114 | 232 | uint32_t s = 0; |
1115 | 232 | ZEND_ASSERT(b->successors_count == (opline->opcode == ZEND_MATCH ? 1 : 2) + zend_hash_num_elements(jumptable)); |
1116 | | |
1117 | 2.09k | ZEND_HASH_FOREACH_VAL(jumptable, zv) { |
1118 | 2.09k | Z_LVAL_P(zv) = ZEND_OPLINE_TO_OFFSET(opline, new_opcodes + blocks[b->successors[s++]].start); |
1119 | 2.09k | } ZEND_HASH_FOREACH_END(); |
1120 | 232 | opline->extended_value = ZEND_OPLINE_TO_OFFSET(opline, new_opcodes + blocks[b->successors[s++]].start); |
1121 | 232 | break; |
1122 | 232 | } |
1123 | 360k | } |
1124 | 360k | } |
1125 | | |
1126 | | /* adjust exception jump targets & remove unused try_catch_array entries */ |
1127 | 102k | if (op_array->last_try_catch) { |
1128 | 25.9k | int i, j; |
1129 | 25.9k | uint32_t *map; |
1130 | 25.9k | ALLOCA_FLAG(use_heap); |
1131 | | |
1132 | 25.9k | map = (uint32_t *)do_alloca(sizeof(uint32_t) * op_array->last_try_catch, use_heap); |
1133 | 58.3k | for (i = 0, j = 0; i< op_array->last_try_catch; i++) { |
1134 | 32.3k | if (blocks[cfg->map[op_array->try_catch_array[i].try_op]].flags & ZEND_BB_REACHABLE) { |
1135 | 32.3k | map[i] = j; |
1136 | 32.3k | op_array->try_catch_array[j].try_op = blocks[cfg->map[op_array->try_catch_array[i].try_op]].start; |
1137 | 32.3k | if (op_array->try_catch_array[i].catch_op) { |
1138 | 31.7k | op_array->try_catch_array[j].catch_op = blocks[cfg->map[op_array->try_catch_array[i].catch_op]].start; |
1139 | 31.7k | } else { |
1140 | 594 | op_array->try_catch_array[j].catch_op = 0; |
1141 | 594 | } |
1142 | 32.3k | if (op_array->try_catch_array[i].finally_op) { |
1143 | 739 | op_array->try_catch_array[j].finally_op = blocks[cfg->map[op_array->try_catch_array[i].finally_op]].start; |
1144 | 31.6k | } else { |
1145 | 31.6k | op_array->try_catch_array[j].finally_op = 0; |
1146 | 31.6k | } |
1147 | 32.3k | if (!op_array->try_catch_array[i].finally_end) { |
1148 | 31.6k | op_array->try_catch_array[j].finally_end = 0; |
1149 | 31.6k | } else { |
1150 | 739 | op_array->try_catch_array[j].finally_end = blocks[cfg->map[op_array->try_catch_array[i].finally_end]].start; |
1151 | 739 | } |
1152 | 32.3k | j++; |
1153 | 32.3k | } |
1154 | 32.3k | } |
1155 | 25.9k | if (i != j) { |
1156 | 9 | op_array->last_try_catch = j; |
1157 | 9 | if (j == 0) { |
1158 | 5 | efree(op_array->try_catch_array); |
1159 | 5 | op_array->try_catch_array = NULL; |
1160 | 5 | } |
1161 | | |
1162 | 9 | if (op_array->fn_flags & ZEND_ACC_HAS_FINALLY_BLOCK) { |
1163 | 0 | zend_op *opline = new_opcodes; |
1164 | 0 | zend_op *end = opline + len; |
1165 | 0 | while (opline < end) { |
1166 | 0 | if (opline->opcode == ZEND_FAST_RET && |
1167 | 0 | opline->op2.num != (uint32_t)-1 && |
1168 | 0 | opline->op2.num < (uint32_t)j) { |
1169 | 0 | opline->op2.num = map[opline->op2.num]; |
1170 | 0 | } |
1171 | 0 | opline++; |
1172 | 0 | } |
1173 | 0 | } |
1174 | 9 | } |
1175 | 25.9k | free_alloca(map, use_heap); |
1176 | 25.9k | } |
1177 | | |
1178 | | /* rebuild map (just for printing) */ |
1179 | 102k | memset(cfg->map, -1, sizeof(int) * op_array->last); |
1180 | 514k | for (int n = 0; n < cfg->blocks_count; n++) { |
1181 | 411k | if (cfg->blocks[n].flags & (ZEND_BB_REACHABLE|ZEND_BB_UNREACHABLE_FREE)) { |
1182 | 360k | cfg->map[cfg->blocks[n].start] = n; |
1183 | 360k | } |
1184 | 411k | } |
1185 | 102k | } |
1186 | | |
1187 | | static zend_always_inline zend_basic_block *get_target_block(const zend_cfg *cfg, zend_basic_block *block, int n, uint32_t *opt_count) |
1188 | 177k | { |
1189 | 177k | int b; |
1190 | 177k | zend_basic_block *target_block = cfg->blocks + block->successors[n]; |
1191 | | |
1192 | 177k | if (target_block->len == 0 && !(target_block->flags & ZEND_BB_PROTECTED)) { |
1193 | 186 | do { |
1194 | 186 | b = target_block->successors[0]; |
1195 | 186 | target_block = cfg->blocks + b; |
1196 | 186 | } while (target_block->len == 0 && !(target_block->flags & ZEND_BB_PROTECTED)); |
1197 | 146 | block->successors[n] = b; |
1198 | 146 | ++(*opt_count); |
1199 | 146 | } |
1200 | 177k | return target_block; |
1201 | 177k | } |
1202 | | |
1203 | | static zend_always_inline zend_basic_block *get_follow_block(const zend_cfg *cfg, zend_basic_block *block, int n, uint32_t *opt_count) |
1204 | 45.0k | { |
1205 | 45.0k | int b; |
1206 | 45.0k | zend_basic_block *target_block = cfg->blocks + block->successors[n]; |
1207 | | |
1208 | 45.0k | if (target_block->len == 0 && !(target_block->flags & ZEND_BB_PROTECTED)) { |
1209 | 1.01k | do { |
1210 | 1.01k | b = target_block->successors[0]; |
1211 | 1.01k | target_block = cfg->blocks + b; |
1212 | 1.01k | } while (target_block->len == 0 && !(target_block->flags & ZEND_BB_PROTECTED)); |
1213 | 913 | block->successors[n] = b; |
1214 | 913 | ++(*opt_count); |
1215 | 913 | } |
1216 | 45.0k | return target_block; |
1217 | 45.0k | } |
1218 | | |
1219 | | static zend_always_inline zend_basic_block *get_next_block(const zend_cfg *cfg, zend_basic_block *block) |
1220 | 91.6k | { |
1221 | 91.6k | zend_basic_block *next_block = block + 1; |
1222 | 91.6k | zend_basic_block *end = cfg->blocks + cfg->blocks_count; |
1223 | | |
1224 | 105k | while (1) { |
1225 | 105k | if (next_block == end) { |
1226 | 811 | return NULL; |
1227 | 105k | } else if (next_block->flags & ZEND_BB_REACHABLE) { |
1228 | 90.8k | break; |
1229 | 90.8k | } |
1230 | 14.3k | next_block++; |
1231 | 14.3k | } |
1232 | 90.9k | while (next_block->len == 0 && !(next_block->flags & ZEND_BB_PROTECTED)) { |
1233 | 95 | next_block = cfg->blocks + next_block->successors[0]; |
1234 | 95 | } |
1235 | 90.8k | return next_block; |
1236 | 91.6k | } |
1237 | | |
1238 | | |
1239 | | /* we use "jmp_hitlist" to avoid infinity loops during jmp optimization */ |
1240 | | static zend_always_inline bool in_hitlist(int target, int *jmp_hitlist, int jmp_hitlist_count) |
1241 | 650 | { |
1242 | 650 | int i; |
1243 | | |
1244 | 818 | for (i = 0; i < jmp_hitlist_count; i++) { |
1245 | 381 | if (jmp_hitlist[i] == target) { |
1246 | 213 | return 1; |
1247 | 213 | } |
1248 | 381 | } |
1249 | 437 | return 0; |
1250 | 650 | } |
1251 | | |
1252 | | #define CHECK_LOOP(target) \ |
1253 | 650 | if (EXPECTED(!in_hitlist(target, jmp_hitlist, jmp_hitlist_count))) { \ |
1254 | 437 | jmp_hitlist[jmp_hitlist_count++] = target; \ |
1255 | 437 | } else { \ |
1256 | 213 | break; \ |
1257 | 213 | } |
1258 | | |
1259 | | static void zend_jmp_optimization(zend_basic_block *block, zend_op_array *op_array, const zend_cfg *cfg, int *jmp_hitlist, uint32_t *opt_count) |
1260 | 560k | { |
1261 | | /* last_op is the last opcode of the current block */ |
1262 | 560k | zend_basic_block *target_block, *follow_block, *next_block; |
1263 | 560k | zend_op *last_op, *target; |
1264 | 560k | int next, jmp_hitlist_count; |
1265 | | |
1266 | 560k | if (block->len == 0) { |
1267 | 1.47k | return; |
1268 | 1.47k | } |
1269 | | |
1270 | 558k | last_op = op_array->opcodes + block->start + block->len - 1; |
1271 | 558k | switch (last_op->opcode) { |
1272 | 90.7k | case ZEND_JMP: |
1273 | 90.7k | jmp_hitlist_count = 0; |
1274 | | |
1275 | 90.7k | target_block = get_target_block(cfg, block, 0, opt_count); |
1276 | 90.8k | while (target_block->len == 1) { |
1277 | 46.2k | target = op_array->opcodes + target_block->start; |
1278 | 46.2k | if (target->opcode == ZEND_JMP) { |
1279 | | /* JMP L, L: JMP L1 -> JMP L1 */ |
1280 | 76 | next = target_block->successors[0]; |
1281 | 46.1k | } else { |
1282 | 46.1k | break; |
1283 | 46.1k | } |
1284 | 76 | CHECK_LOOP(next); |
1285 | 40 | block->successors[0] = next; |
1286 | 40 | ++(*opt_count); |
1287 | 40 | target_block = get_target_block(cfg, block, 0, opt_count); |
1288 | 40 | } |
1289 | | |
1290 | 90.7k | next_block = get_next_block(cfg, block); |
1291 | 90.7k | if (target_block == next_block) { |
1292 | | /* JMP(next) -> NOP */ |
1293 | 940 | MAKE_NOP(last_op); |
1294 | 940 | ++(*opt_count); |
1295 | 940 | block->len--; |
1296 | 89.8k | } else if (target_block->len == 1) { |
1297 | 45.9k | target = op_array->opcodes + target_block->start; |
1298 | 45.9k | if ((target->opcode == ZEND_RETURN || |
1299 | 45.7k | target->opcode == ZEND_RETURN_BY_REF || |
1300 | 45.7k | target->opcode == ZEND_GENERATOR_RETURN) && |
1301 | 328 | !(op_array->fn_flags & ZEND_ACC_HAS_FINALLY_BLOCK)) { |
1302 | | /* JMP L, L: RETURN to immediate RETURN */ |
1303 | 62 | *last_op = *target; |
1304 | 62 | if (last_op->op1_type == IS_CONST) { |
1305 | 62 | zval zv; |
1306 | 62 | ZVAL_COPY(&zv, &ZEND_OP1_LITERAL(last_op)); |
1307 | 62 | last_op->op1.constant = zend_optimizer_add_literal(op_array, &zv); |
1308 | 62 | } |
1309 | 62 | block->successors_count = 0; |
1310 | 62 | ++(*opt_count); |
1311 | 62 | } |
1312 | 45.9k | } |
1313 | 90.7k | break; |
1314 | | |
1315 | 1.91k | case ZEND_JMP_SET: |
1316 | 8.19k | case ZEND_COALESCE: |
1317 | 40.9k | case ZEND_JMP_NULL: |
1318 | 40.9k | jmp_hitlist_count = 0; |
1319 | | |
1320 | 40.9k | target_block = get_target_block(cfg, block, 0, opt_count); |
1321 | 40.9k | while (target_block->len == 1) { |
1322 | 5.03k | target = op_array->opcodes + target_block->start; |
1323 | | |
1324 | 5.03k | if (target->opcode == ZEND_JMP) { |
1325 | | /* JMP_SET(X, L), L: JMP(L2) -> JMP_SET(X, L2) */ |
1326 | 32 | next = target_block->successors[0]; |
1327 | 32 | CHECK_LOOP(next); |
1328 | 32 | block->successors[0] = next; |
1329 | 32 | ++(*opt_count); |
1330 | 5.00k | } else { |
1331 | 5.00k | break; |
1332 | 5.00k | } |
1333 | 32 | target_block = get_target_block(cfg, block, 0, opt_count); |
1334 | 32 | } |
1335 | 40.9k | break; |
1336 | | |
1337 | 27.8k | case ZEND_JMPZ: |
1338 | 40.5k | case ZEND_JMPNZ: |
1339 | 40.5k | jmp_hitlist_count = 0; |
1340 | | |
1341 | 40.5k | target_block = get_target_block(cfg, block, 0, opt_count); |
1342 | 40.8k | while (target_block->len == 1) { |
1343 | 26.1k | target = op_array->opcodes + target_block->start; |
1344 | | |
1345 | 26.1k | if (target->opcode == ZEND_JMP) { |
1346 | | /* JMPZ(X, L), L: JMP(L2) -> JMPZ(X, L2) */ |
1347 | 88 | next = target_block->successors[0]; |
1348 | 26.0k | } else if (target->opcode == last_op->opcode && |
1349 | 760 | SAME_VAR(target->op1, last_op->op1)) { |
1350 | | /* JMPZ(X, L), L: JMPZ(X, L2) -> JMPZ(X, L2) */ |
1351 | 430 | next = target_block->successors[0]; |
1352 | 25.6k | } else if (target->opcode == INV_COND(last_op->opcode) && |
1353 | 128 | SAME_VAR(target->op1, last_op->op1)) { |
1354 | | /* JMPZ(X, L), L: JMPNZ(X, L2) -> JMPZ(X, L+1) */ |
1355 | 24 | next = target_block->successors[1]; |
1356 | 25.6k | } else { |
1357 | 25.6k | break; |
1358 | 25.6k | } |
1359 | 542 | CHECK_LOOP(next); |
1360 | 365 | block->successors[0] = next; |
1361 | 365 | ++(*opt_count); |
1362 | 365 | target_block = get_target_block(cfg, block, 0, opt_count); |
1363 | 365 | } |
1364 | | |
1365 | 40.5k | follow_block = get_follow_block(cfg, block, 1, opt_count); |
1366 | 40.5k | if (target_block == follow_block) { |
1367 | | /* L: JMP[N]Z(X, L+1) -> NOP or FREE(X) */ |
1368 | 627 | zend_optimizer_convert_to_free_op1(op_array, last_op); |
1369 | 627 | if (last_op->opcode == ZEND_NOP) { |
1370 | 0 | block->len--; |
1371 | 0 | } |
1372 | 627 | block->successors_count = 1; |
1373 | 627 | ++(*opt_count); |
1374 | 39.9k | } else if (follow_block->len == 1) { |
1375 | 9.27k | target = op_array->opcodes + follow_block->start; |
1376 | 9.27k | if (target->opcode == ZEND_JMP) { |
1377 | 1.05k | if (block->successors[0] == follow_block->successors[0]) { |
1378 | | /* JMPZ(X,L1), JMP(L1) -> NOP, JMP(L1) */ |
1379 | 236 | zend_optimizer_convert_to_free_op1(op_array, last_op); |
1380 | 236 | if (last_op->opcode == ZEND_NOP) { |
1381 | 0 | block->len--; |
1382 | 0 | } |
1383 | 236 | block->successors[0] = follow_block - cfg->blocks; |
1384 | 236 | block->successors_count = 1; |
1385 | 236 | ++(*opt_count); |
1386 | 236 | break; |
1387 | 820 | } else if (!(follow_block->flags & (ZEND_BB_TARGET | ZEND_BB_PROTECTED))) { |
1388 | 820 | next_block = get_next_block(cfg, follow_block); |
1389 | | |
1390 | 820 | if (target_block == next_block) { |
1391 | | /* JMPZ(X,L1) JMP(L2) L1: -> JMPNZ(X,L2) NOP*/ |
1392 | | |
1393 | 424 | last_op->opcode = INV_COND(last_op->opcode); |
1394 | | |
1395 | 424 | block->successors[0] = follow_block->successors[0]; |
1396 | 424 | block->successors[1] = next_block - cfg->blocks; |
1397 | | |
1398 | 424 | follow_block->flags &= ~ZEND_BB_REACHABLE; |
1399 | 424 | MAKE_NOP(target); |
1400 | 424 | follow_block->len = 0; |
1401 | | |
1402 | 424 | next_block->flags |= ZEND_BB_FOLLOW; |
1403 | | |
1404 | 424 | break; |
1405 | 424 | } |
1406 | 820 | } |
1407 | 1.05k | } |
1408 | 9.27k | } |
1409 | 39.8k | break; |
1410 | | |
1411 | 39.8k | case ZEND_JMPNZ_EX: |
1412 | 4.56k | case ZEND_JMPZ_EX: |
1413 | 4.56k | jmp_hitlist_count = 0; |
1414 | | |
1415 | 4.56k | target_block = get_target_block(cfg, block, 0, opt_count); |
1416 | 4.56k | while (target_block->len == 1) { |
1417 | 1.75k | target = op_array->opcodes + target_block->start; |
1418 | | |
1419 | 1.75k | if (target->opcode == ZEND_JMP) { |
1420 | | /* T = JMPZ_EX(X, L), L: JMP(L2) -> T = JMPZ(X, L2) */ |
1421 | 0 | next = target_block->successors[0]; |
1422 | 1.75k | } else if (target->opcode == last_op->opcode-3 && |
1423 | 0 | (SAME_VAR(target->op1, last_op->result) || |
1424 | 0 | SAME_VAR(target->op1, last_op->op1))) { |
1425 | | /* T = JMPZ_EX(X, L1), L1: JMPZ({X|T}, L2) -> T = JMPZ_EX(X, L2) */ |
1426 | 0 | next = target_block->successors[0]; |
1427 | 1.75k | } else if (target->opcode == last_op->opcode && |
1428 | 0 | target->result.var == last_op->result.var && |
1429 | 0 | (SAME_VAR(target->op1, last_op->result) || |
1430 | 0 | SAME_VAR(target->op1, last_op->op1))) { |
1431 | | /* T = JMPZ_EX(X, L1), L1: T = JMPZ_EX({X|T}, L2) -> T = JMPZ_EX(X, L2) */ |
1432 | 0 | next = target_block->successors[0]; |
1433 | 1.75k | } else if (target->opcode == INV_EX_COND(last_op->opcode) && |
1434 | 0 | (SAME_VAR(target->op1, last_op->result) || |
1435 | 0 | SAME_VAR(target->op1, last_op->op1))) { |
1436 | | /* T = JMPZ_EX(X, L1), L1: JMPNZ({X|T1}, L2) -> T = JMPZ_EX(X, L1+1) */ |
1437 | 0 | next = target_block->successors[1]; |
1438 | 1.75k | } else if (target->opcode == INV_EX_COND_EX(last_op->opcode) && |
1439 | 128 | target->result.var == last_op->result.var && |
1440 | 120 | (SAME_VAR(target->op1, last_op->result) || |
1441 | 120 | SAME_VAR(target->op1, last_op->op1))) { |
1442 | | /* T = JMPZ_EX(X, L1), L1: T = JMPNZ_EX({X|T}, L2) -> T = JMPZ_EX(X, L1+1) */ |
1443 | 0 | next = target_block->successors[1]; |
1444 | 1.75k | } else if (target->opcode == ZEND_BOOL && |
1445 | 0 | (SAME_VAR(target->op1, last_op->result) || |
1446 | 0 | SAME_VAR(target->op1, last_op->op1))) { |
1447 | | /* convert Y = JMPZ_EX(X,L1), L1: Z = BOOL(Y) to |
1448 | | Z = JMPZ_EX(X,L1+1) */ |
1449 | | |
1450 | | /* NOTE: This optimization pattern is not safe, but works, */ |
1451 | | /* because result of JMPZ_EX instruction */ |
1452 | | /* is not used on the following path and */ |
1453 | | /* should be used once on the branch path. */ |
1454 | | /* */ |
1455 | | /* The pattern works well only if jumps processed in */ |
1456 | | /* direct order, otherwise it breaks JMPZ_EX */ |
1457 | | /* sequences too early. */ |
1458 | 0 | last_op->result.var = target->result.var; |
1459 | 0 | next = target_block->successors[0]; |
1460 | 1.75k | } else { |
1461 | 1.75k | break; |
1462 | 1.75k | } |
1463 | 0 | CHECK_LOOP(next); |
1464 | 0 | block->successors[0] = next; |
1465 | 0 | ++(*opt_count); |
1466 | 0 | target_block = get_target_block(cfg, block, 0, opt_count); |
1467 | 0 | } |
1468 | | |
1469 | 4.56k | follow_block = get_follow_block(cfg, block, 1, opt_count); |
1470 | 4.56k | if (target_block == follow_block) { |
1471 | | /* L: T = JMP[N]Z_EX(X, L+1) -> T = BOOL(X) */ |
1472 | 0 | last_op->opcode = ZEND_BOOL; |
1473 | 0 | last_op->op2.num = 0; |
1474 | 0 | block->successors_count = 1; |
1475 | 0 | ++(*opt_count); |
1476 | 0 | break; |
1477 | 0 | } |
1478 | 4.56k | break; |
1479 | 558k | } |
1480 | 558k | } |
1481 | | |
1482 | | /* Global data dependencies */ |
1483 | | |
1484 | | /* Find a set of variables which are used outside of the block where they are |
1485 | | * defined. We won't apply some optimization patterns for such variables. */ |
1486 | | static void zend_t_usage(zend_cfg *cfg, zend_op_array *op_array, zend_bitset used_ext, zend_optimizer_ctx *ctx) |
1487 | 129k | { |
1488 | 129k | int n; |
1489 | 129k | zend_basic_block *block, *next_block; |
1490 | 129k | uint32_t var_num; |
1491 | 129k | uint32_t bitset_len; |
1492 | 129k | zend_bitset usage; |
1493 | 129k | zend_bitset defined_here; |
1494 | 129k | void *checkpoint; |
1495 | 129k | zend_op *opline, *end; |
1496 | | |
1497 | | |
1498 | 129k | if (op_array->T == 0) { |
1499 | | /* shortcut - if no Ts, nothing to do */ |
1500 | 15.1k | return; |
1501 | 15.1k | } |
1502 | | |
1503 | 114k | checkpoint = zend_arena_checkpoint(ctx->arena); |
1504 | 114k | bitset_len = zend_bitset_len(op_array->last_var + op_array->T); |
1505 | 114k | defined_here = zend_arena_alloc(&ctx->arena, bitset_len * ZEND_BITSET_ELM_SIZE); |
1506 | | |
1507 | 114k | zend_bitset_clear(defined_here, bitset_len); |
1508 | 598k | for (n = 1; n < cfg->blocks_count; n++) { |
1509 | 484k | block = cfg->blocks + n; |
1510 | | |
1511 | 484k | if (!(block->flags & ZEND_BB_REACHABLE)) { |
1512 | 52.4k | continue; |
1513 | 52.4k | } |
1514 | | |
1515 | 431k | opline = op_array->opcodes + block->start; |
1516 | 431k | end = opline + block->len; |
1517 | 431k | if (!(block->flags & ZEND_BB_FOLLOW) || |
1518 | 317k | (block->flags & ZEND_BB_TARGET)) { |
1519 | | /* Skip continuation of "extended" BB */ |
1520 | 225k | zend_bitset_clear(defined_here, bitset_len); |
1521 | 225k | } |
1522 | | |
1523 | 2.39M | while (opline<end) { |
1524 | 1.96M | if (opline->op1_type & (IS_VAR|IS_TMP_VAR)) { |
1525 | 557k | var_num = VAR_NUM(opline->op1.var); |
1526 | 557k | if (!zend_bitset_in(defined_here, var_num)) { |
1527 | 246k | zend_bitset_incl(used_ext, var_num); |
1528 | 246k | } |
1529 | 557k | } |
1530 | 1.96M | if (opline->op2_type == IS_VAR) { |
1531 | 58.3k | var_num = VAR_NUM(opline->op2.var); |
1532 | 58.3k | if (opline->opcode == ZEND_FE_FETCH_R || |
1533 | 58.0k | opline->opcode == ZEND_FE_FETCH_RW) { |
1534 | | /* these opcode use the op2 as result */ |
1535 | 253 | zend_bitset_incl(defined_here, var_num); |
1536 | 58.0k | } else if (!zend_bitset_in(defined_here, var_num)) { |
1537 | 162 | zend_bitset_incl(used_ext, var_num); |
1538 | 162 | } |
1539 | 1.90M | } else if (opline->op2_type == IS_TMP_VAR) { |
1540 | 285k | var_num = VAR_NUM(opline->op2.var); |
1541 | 285k | if (!zend_bitset_in(defined_here, var_num)) { |
1542 | 33.2k | zend_bitset_incl(used_ext, var_num); |
1543 | 33.2k | } |
1544 | 285k | } |
1545 | | |
1546 | 1.96M | if (opline->result_type == IS_VAR) { |
1547 | 135k | var_num = VAR_NUM(opline->result.var); |
1548 | 135k | zend_bitset_incl(defined_here, var_num); |
1549 | 1.82M | } else if (opline->result_type == IS_TMP_VAR) { |
1550 | 771k | var_num = VAR_NUM(opline->result.var); |
1551 | 771k | switch (opline->opcode) { |
1552 | 4.18k | case ZEND_ADD_ARRAY_ELEMENT: |
1553 | 4.23k | case ZEND_ADD_ARRAY_UNPACK: |
1554 | 218k | case ZEND_ROPE_ADD: |
1555 | | /* these opcodes use the result as argument */ |
1556 | 218k | if (!zend_bitset_in(defined_here, var_num)) { |
1557 | 181k | zend_bitset_incl(used_ext, var_num); |
1558 | 181k | } |
1559 | 218k | break; |
1560 | 552k | default : |
1561 | 552k | zend_bitset_incl(defined_here, var_num); |
1562 | 771k | } |
1563 | 771k | } |
1564 | 1.96M | opline++; |
1565 | 1.96M | } |
1566 | 431k | } |
1567 | | |
1568 | 114k | if (ctx->debug_level & ZEND_DUMP_BLOCK_PASS_VARS) { |
1569 | 0 | bool printed = false; |
1570 | 0 | uint32_t i; |
1571 | |
|
1572 | 0 | for (i = op_array->last_var; i< op_array->T; i++) { |
1573 | 0 | if (zend_bitset_in(used_ext, i)) { |
1574 | 0 | if (!printed) { |
1575 | 0 | fprintf(stderr, "NON-LOCAL-VARS: %d", i); |
1576 | 0 | printed = true; |
1577 | 0 | } else { |
1578 | 0 | fprintf(stderr, ", %d", i); |
1579 | 0 | } |
1580 | 0 | } |
1581 | 0 | } |
1582 | 0 | if (printed) { |
1583 | 0 | fprintf(stderr, "\n"); |
1584 | 0 | } |
1585 | 0 | } |
1586 | | |
1587 | 114k | usage = defined_here; |
1588 | 114k | next_block = NULL; |
1589 | 712k | for (n = cfg->blocks_count; n > 0;) { |
1590 | 598k | block = cfg->blocks + (--n); |
1591 | | |
1592 | 598k | if (!(block->flags & ZEND_BB_REACHABLE) || block->len == 0) { |
1593 | 52.6k | continue; |
1594 | 52.6k | } |
1595 | | |
1596 | 545k | end = op_array->opcodes + block->start; |
1597 | 545k | opline = end + block->len - 1; |
1598 | 545k | if (!next_block || |
1599 | 431k | !(next_block->flags & ZEND_BB_FOLLOW) || |
1600 | 339k | (next_block->flags & ZEND_BB_TARGET)) { |
1601 | | /* Skip continuation of "extended" BB */ |
1602 | 339k | zend_bitset_copy(usage, used_ext, bitset_len); |
1603 | 339k | } else if (block->successors_count > 1) { |
1604 | 122k | zend_bitset_union(usage, used_ext, bitset_len); |
1605 | 122k | } |
1606 | 545k | next_block = block; |
1607 | | |
1608 | 4.04M | while (opline >= end) { |
1609 | | /* usage checks */ |
1610 | 3.50M | if (opline->result_type & (IS_VAR|IS_TMP_VAR)) { |
1611 | 1.66M | if (!zend_bitset_in(usage, VAR_NUM(opline->result.var))) { |
1612 | 8.65k | switch (opline->opcode) { |
1613 | 0 | case ZEND_ASSIGN_OP: |
1614 | 0 | case ZEND_ASSIGN_DIM_OP: |
1615 | 0 | case ZEND_ASSIGN_OBJ_OP: |
1616 | 0 | case ZEND_ASSIGN_STATIC_PROP_OP: |
1617 | 0 | case ZEND_PRE_INC: |
1618 | 0 | case ZEND_PRE_DEC: |
1619 | 0 | case ZEND_ASSIGN: |
1620 | 0 | case ZEND_ASSIGN_REF: |
1621 | 0 | case ZEND_DO_FCALL: |
1622 | 0 | case ZEND_DO_ICALL: |
1623 | 0 | case ZEND_DO_UCALL: |
1624 | 0 | case ZEND_DO_FCALL_BY_NAME: |
1625 | 0 | opline->result_type = IS_UNUSED; |
1626 | 0 | break; |
1627 | 0 | case ZEND_POST_INC: |
1628 | 0 | case ZEND_POST_DEC: |
1629 | 0 | case ZEND_POST_INC_OBJ: |
1630 | 0 | case ZEND_POST_DEC_OBJ: |
1631 | 0 | case ZEND_POST_INC_STATIC_PROP: |
1632 | 0 | case ZEND_POST_DEC_STATIC_PROP: |
1633 | 0 | opline->opcode -= 2; |
1634 | 0 | opline->result_type = IS_UNUSED; |
1635 | 0 | break; |
1636 | 744 | case ZEND_QM_ASSIGN: |
1637 | 1.83k | case ZEND_BOOL: |
1638 | 4.66k | case ZEND_BOOL_NOT: |
1639 | 4.66k | zend_optimizer_convert_to_free_op1(op_array, opline); |
1640 | 4.66k | break; |
1641 | 1.89k | case ZEND_JMPZ_EX: |
1642 | 3.89k | case ZEND_JMPNZ_EX: |
1643 | 3.89k | opline->opcode -= 3; |
1644 | 3.89k | SET_UNUSED(opline->result); |
1645 | 3.89k | break; |
1646 | 0 | case ZEND_ADD_ARRAY_ELEMENT: |
1647 | 0 | case ZEND_ADD_ARRAY_UNPACK: |
1648 | 0 | case ZEND_ROPE_ADD: |
1649 | 0 | zend_bitset_incl(usage, VAR_NUM(opline->result.var)); |
1650 | 0 | break; |
1651 | 8.65k | } |
1652 | 1.66M | } else { |
1653 | 1.66M | switch (opline->opcode) { |
1654 | 44.7k | case ZEND_ADD_ARRAY_ELEMENT: |
1655 | 44.9k | case ZEND_ADD_ARRAY_UNPACK: |
1656 | 334k | case ZEND_ROPE_ADD: |
1657 | 334k | break; |
1658 | 1.32M | default: |
1659 | 1.32M | zend_bitset_excl(usage, VAR_NUM(opline->result.var)); |
1660 | 1.32M | break; |
1661 | 1.66M | } |
1662 | 1.66M | } |
1663 | 1.66M | } |
1664 | | |
1665 | 3.50M | if (opline->op2_type == IS_VAR) { |
1666 | 92.3k | switch (opline->opcode) { |
1667 | 233 | case ZEND_FE_FETCH_R: |
1668 | 253 | case ZEND_FE_FETCH_RW: |
1669 | 253 | zend_bitset_excl(usage, VAR_NUM(opline->op2.var)); |
1670 | 253 | break; |
1671 | 92.0k | default: |
1672 | 92.0k | zend_bitset_incl(usage, VAR_NUM(opline->op2.var)); |
1673 | 92.0k | break; |
1674 | 92.3k | } |
1675 | 3.41M | } else if (opline->op2_type == IS_TMP_VAR) { |
1676 | 544k | zend_bitset_incl(usage, VAR_NUM(opline->op2.var)); |
1677 | 544k | } |
1678 | | |
1679 | 3.50M | if (opline->op1_type & (IS_VAR|IS_TMP_VAR)) { |
1680 | 965k | zend_bitset_incl(usage, VAR_NUM(opline->op1.var)); |
1681 | 965k | } |
1682 | | |
1683 | 3.50M | opline--; |
1684 | 3.50M | } |
1685 | 545k | } |
1686 | | |
1687 | 114k | zend_arena_release(&ctx->arena, checkpoint); |
1688 | 114k | } |
1689 | | |
1690 | | static void zend_merge_blocks(zend_op_array *op_array, zend_cfg *cfg, uint32_t *opt_count) |
1691 | 129k | { |
1692 | 129k | int i; |
1693 | 129k | zend_basic_block *b, *bb; |
1694 | 129k | zend_basic_block *prev = NULL; |
1695 | | |
1696 | 746k | for (i = 0; i < cfg->blocks_count; i++) { |
1697 | 616k | b = cfg->blocks + i; |
1698 | 616k | if (b->flags & ZEND_BB_REACHABLE) { |
1699 | 558k | if ((b->flags & ZEND_BB_FOLLOW) && |
1700 | 315k | !(b->flags & (ZEND_BB_TARGET | ZEND_BB_PROTECTED)) && |
1701 | 151k | prev && prev->successors_count == 1 && prev->successors[0] == i) |
1702 | 32.2k | { |
1703 | 32.2k | zend_op *last_op = op_array->opcodes + prev->start + prev->len - 1; |
1704 | 32.2k | if (prev->len != 0 && last_op->opcode == ZEND_JMP) { |
1705 | 0 | MAKE_NOP(last_op); |
1706 | 0 | } |
1707 | | |
1708 | 35.7k | for (bb = prev + 1; bb != b; bb++) { |
1709 | 3.45k | zend_op *op = op_array->opcodes + bb->start; |
1710 | 3.45k | zend_op *end = op + bb->len; |
1711 | 6.58k | while (op < end) { |
1712 | 3.12k | if (op->op1_type == IS_CONST) { |
1713 | 1.20k | literal_dtor(&ZEND_OP1_LITERAL(op)); |
1714 | 1.20k | } |
1715 | 3.12k | if (op->op2_type == IS_CONST) { |
1716 | 690 | literal_dtor(&ZEND_OP2_LITERAL(op)); |
1717 | 690 | } |
1718 | 3.12k | MAKE_NOP(op); |
1719 | 3.12k | op++; |
1720 | 3.12k | } |
1721 | | /* make block empty */ |
1722 | 3.45k | bb->len = 0; |
1723 | 3.45k | } |
1724 | | |
1725 | | /* re-link */ |
1726 | 32.2k | prev->flags |= (b->flags & ZEND_BB_EXIT); |
1727 | 32.2k | prev->len = b->start + b->len - prev->start; |
1728 | 32.2k | prev->successors_count = b->successors_count; |
1729 | 32.2k | if (b->successors != b->successors_storage) { |
1730 | 52 | prev->successors = b->successors; |
1731 | 52 | b->successors = b->successors_storage; |
1732 | 32.2k | } else { |
1733 | 32.2k | memcpy(prev->successors, b->successors, b->successors_count * sizeof(int)); |
1734 | 32.2k | } |
1735 | | |
1736 | | /* unlink & make block empty and unreachable */ |
1737 | 32.2k | b->flags = 0; |
1738 | 32.2k | b->len = 0; |
1739 | 32.2k | b->successors_count = 0; |
1740 | 32.2k | ++(*opt_count); |
1741 | 525k | } else { |
1742 | 525k | prev = b; |
1743 | 525k | } |
1744 | 558k | } |
1745 | 616k | } |
1746 | 129k | } |
1747 | | |
1748 | 129k | #define PASSES 3 |
1749 | | |
1750 | | void zend_optimize_cfg(zend_op_array *op_array, zend_optimizer_ctx *ctx) |
1751 | 102k | { |
1752 | 102k | zend_cfg cfg; |
1753 | 102k | zend_basic_block *blocks, *end, *b; |
1754 | 102k | int pass; |
1755 | 102k | uint32_t bitset_len; |
1756 | 102k | zend_bitset usage; |
1757 | 102k | void *checkpoint; |
1758 | 102k | zend_op **Tsource; |
1759 | 102k | uint32_t opt_count; |
1760 | 102k | int *jmp_hitlist; |
1761 | | |
1762 | | /* Build CFG */ |
1763 | 102k | checkpoint = zend_arena_checkpoint(ctx->arena); |
1764 | 102k | zend_build_cfg(&ctx->arena, op_array, 0, &cfg); |
1765 | | |
1766 | 102k | if (cfg.blocks_count * (op_array->last_var + op_array->T) > 64 * 1024 * 1024) { |
1767 | 0 | zend_arena_release(&ctx->arena, checkpoint); |
1768 | 0 | return; |
1769 | 0 | } |
1770 | | |
1771 | 102k | if (ctx->debug_level & ZEND_DUMP_BEFORE_BLOCK_PASS) { |
1772 | 0 | zend_dump_op_array(op_array, ZEND_DUMP_CFG, "before block pass", &cfg); |
1773 | 0 | } |
1774 | | |
1775 | 102k | bitset_len = zend_bitset_len(op_array->last_var + op_array->T); |
1776 | 102k | Tsource = zend_arena_calloc(&ctx->arena, op_array->last_var + op_array->T, sizeof(zend_op *)); |
1777 | 102k | usage = zend_arena_alloc(&ctx->arena, bitset_len * ZEND_BITSET_ELM_SIZE); |
1778 | 102k | jmp_hitlist = zend_arena_alloc(&ctx->arena, cfg.blocks_count * sizeof(int)); |
1779 | | |
1780 | 102k | blocks = cfg.blocks; |
1781 | 102k | end = blocks + cfg.blocks_count; |
1782 | 129k | for (pass = 0; pass < PASSES; pass++) { |
1783 | 129k | opt_count = 0; |
1784 | | |
1785 | | /* Compute data dependencies */ |
1786 | 129k | zend_bitset_clear(usage, bitset_len); |
1787 | 129k | zend_t_usage(&cfg, op_array, usage, ctx); |
1788 | | |
1789 | | /* optimize each basic block separately */ |
1790 | 746k | for (b = blocks; b < end; b++) { |
1791 | 616k | if (!(b->flags & ZEND_BB_REACHABLE)) { |
1792 | 55.9k | continue; |
1793 | 55.9k | } |
1794 | | /* we track data dependencies only inside a single basic block */ |
1795 | 560k | if (!(b->flags & ZEND_BB_FOLLOW) || |
1796 | 354k | (b->flags & ZEND_BB_TARGET)) { |
1797 | | /* Skip continuation of "extended" BB */ |
1798 | 354k | memset(Tsource, 0, (op_array->last_var + op_array->T) * sizeof(zend_op *)); |
1799 | 354k | } |
1800 | 560k | zend_optimize_block(b, op_array, usage, &cfg, Tsource, &opt_count); |
1801 | 560k | } |
1802 | | |
1803 | | /* Eliminate NOPs */ |
1804 | 746k | for (b = blocks; b < end; b++) { |
1805 | 616k | if (b->flags & ZEND_BB_UNREACHABLE_FREE) { |
1806 | | /* In unreachable_free blocks only preserve loop var frees. */ |
1807 | 104 | for (uint32_t i = b->start; i < b->start + b->len; i++) { |
1808 | 70 | zend_op *opline = &op_array->opcodes[i]; |
1809 | 70 | if (!zend_optimizer_is_loop_var_free(opline)) { |
1810 | 36 | MAKE_NOP(opline); |
1811 | 36 | } |
1812 | 70 | } |
1813 | 34 | } |
1814 | 616k | if (b->flags & (ZEND_BB_REACHABLE|ZEND_BB_UNREACHABLE_FREE)) { |
1815 | 560k | strip_nops(op_array, b); |
1816 | 560k | } |
1817 | 616k | } |
1818 | | |
1819 | 129k | opt_count = 0; |
1820 | | |
1821 | | /* Jump optimization for each block */ |
1822 | 746k | for (b = blocks; b < end; b++) { |
1823 | 616k | if (b->flags & ZEND_BB_REACHABLE) { |
1824 | 560k | zend_jmp_optimization(b, op_array, &cfg, jmp_hitlist, &opt_count); |
1825 | 560k | } |
1826 | 616k | } |
1827 | | |
1828 | | /* Eliminate unreachable basic blocks */ |
1829 | 129k | zend_cfg_remark_reachable_blocks(op_array, &cfg); |
1830 | | |
1831 | | /* Merge Blocks */ |
1832 | 129k | zend_merge_blocks(op_array, &cfg, &opt_count); |
1833 | | |
1834 | 129k | if (opt_count == 0) { |
1835 | 102k | break; |
1836 | 102k | } |
1837 | 129k | } |
1838 | | |
1839 | 102k | assemble_code_blocks(&cfg, op_array, ctx); |
1840 | | |
1841 | 102k | if (ctx->debug_level & ZEND_DUMP_AFTER_BLOCK_PASS) { |
1842 | 0 | zend_dump_op_array(op_array, ZEND_DUMP_CFG | ZEND_DUMP_HIDE_UNREACHABLE, "after block pass", &cfg); |
1843 | 0 | } |
1844 | | |
1845 | | /* Destroy CFG */ |
1846 | 102k | zend_arena_release(&ctx->arena, checkpoint); |
1847 | 102k | } |