/src/php-src/Zend/Optimizer/block_pass.c
Line | Count | Source |
1 | | /* |
2 | | +----------------------------------------------------------------------+ |
3 | | | Zend OPcache | |
4 | | +----------------------------------------------------------------------+ |
5 | | | Copyright (c) The PHP Group | |
6 | | +----------------------------------------------------------------------+ |
7 | | | This source file is subject to version 3.01 of the PHP license, | |
8 | | | that is bundled with this package in the file LICENSE, and is | |
9 | | | available through the world-wide-web at the following url: | |
10 | | | https://www.php.net/license/3_01.txt | |
11 | | | If you did not receive a copy of the PHP license and are unable to | |
12 | | | obtain it through the world-wide-web, please send a note to | |
13 | | | license@php.net so we can mail you a copy immediately. | |
14 | | +----------------------------------------------------------------------+ |
15 | | | Authors: Andi Gutmans <andi@php.net> | |
16 | | | Zeev Suraski <zeev@php.net> | |
17 | | | Stanislav Malyshev <stas@zend.com> | |
18 | | | Dmitry Stogov <dmitry@php.net> | |
19 | | +----------------------------------------------------------------------+ |
20 | | */ |
21 | | |
22 | | #include "Optimizer/zend_optimizer.h" |
23 | | #include "Optimizer/zend_optimizer_internal.h" |
24 | | #include "zend_API.h" |
25 | | #include "zend_constants.h" |
26 | | #include "zend_execute.h" |
27 | | #include "zend_vm.h" |
28 | | #include "zend_bitset.h" |
29 | | #include "zend_cfg.h" |
30 | | #include "zend_dump.h" |
31 | | |
32 | | /* Checks if a constant (like "true") may be replaced by its value */ |
33 | | bool zend_optimizer_get_persistent_constant(zend_string *name, zval *result, bool copy) |
34 | 65.3k | { |
35 | 65.3k | const zend_constant *c = zend_hash_find_ptr(EG(zend_constants), name); |
36 | 65.3k | if (c) { |
37 | 64 | if ((ZEND_CONSTANT_FLAGS(c) & CONST_PERSISTENT) |
38 | 64 | && !(ZEND_CONSTANT_FLAGS(c) & CONST_DEPRECATED) |
39 | 0 | && (!(ZEND_CONSTANT_FLAGS(c) & CONST_NO_FILE_CACHE) |
40 | 0 | || !(CG(compiler_options) & ZEND_COMPILE_WITH_FILE_CACHE))) { |
41 | 0 | ZVAL_COPY_VALUE(result, &c->value); |
42 | 0 | if (copy) { |
43 | 0 | Z_TRY_ADDREF_P(result); |
44 | 0 | } |
45 | 0 | return true; |
46 | 64 | } else { |
47 | 64 | return false; |
48 | 64 | } |
49 | 64 | } |
50 | | |
51 | | /* Special constants null/true/false can always be substituted. */ |
52 | 65.2k | c = zend_get_special_const(ZSTR_VAL(name), ZSTR_LEN(name)); |
53 | 65.2k | if (c) { |
54 | 0 | ZVAL_COPY_VALUE(result, &c->value); |
55 | 0 | return true; |
56 | 0 | } |
57 | 65.2k | return false; |
58 | 65.2k | } |
59 | | |
/* Data dependency macros.
 *
 * Both macros index a `Tsource` array that must be in scope at the point of
 * use; each slot holds the opline that defined the corresponding temporary.
 *
 * VAR_SOURCE(op)        - lvalue for the slot of operand `op` (a znode_op).
 * SET_VAR_SOURCE(opline) - records `opline` as the source of its own result.
 *
 * Arguments and the assignment expansion are parenthesized so that
 * non-trivial argument expressions (e.g. `*p` or `a ? b : c`) expand
 * correctly.
 */

#define VAR_SOURCE(op) Tsource[VAR_NUM((op).var)]
#define SET_VAR_SOURCE(opline) (Tsource[VAR_NUM((opline)->result.var)] = (opline))
64 | | |
65 | | static void strip_leading_nops(const zend_op_array *op_array, zend_basic_block *b) |
66 | 10.7k | { |
67 | 10.7k | const zend_op *opcodes = op_array->opcodes; |
68 | | |
69 | 12.8k | do { |
70 | 12.8k | b->start++; |
71 | 12.8k | b->len--; |
72 | 12.8k | } while (b->len > 0 && opcodes[b->start].opcode == ZEND_NOP); |
73 | 10.7k | } |
74 | | |
75 | | static void strip_nops(const zend_op_array *op_array, zend_basic_block *b) |
76 | 608k | { |
77 | 608k | uint32_t i, j; |
78 | | |
79 | 608k | if (b->len == 0) { |
80 | 1.23k | return; |
81 | 1.23k | } |
82 | | |
83 | 606k | if (op_array->opcodes[b->start].opcode == ZEND_NOP) { |
84 | 4.20k | strip_leading_nops(op_array, b); |
85 | 4.20k | } |
86 | | |
87 | 606k | if (b->len == 0) { |
88 | 348 | return; |
89 | 348 | } |
90 | | |
91 | | /* strip the inside NOPs */ |
92 | 606k | i = j = b->start + 1; |
93 | 3.85M | while (i < b->start + b->len) { |
94 | 3.24M | if (op_array->opcodes[i].opcode != ZEND_NOP) { |
95 | 3.21M | if (i != j) { |
96 | 62.3k | op_array->opcodes[j] = op_array->opcodes[i]; |
97 | 62.3k | } |
98 | 3.21M | j++; |
99 | 3.21M | } |
100 | 3.24M | i++; |
101 | 3.24M | } |
102 | 606k | b->len = j - b->start; |
103 | 639k | while (j < i) { |
104 | 32.7k | MAKE_NOP(op_array->opcodes + j); |
105 | 32.7k | j++; |
106 | 32.7k | } |
107 | 606k | } |
108 | | |
109 | 68 | static uint32_t get_const_switch_target(const zend_cfg *cfg, const zend_op_array *op_array, const zend_basic_block *block, zend_op *opline, const zval *val) { |
110 | 68 | HashTable *jumptable = Z_ARRVAL(ZEND_OP2_LITERAL(opline)); |
111 | 68 | zval *zv; |
112 | 68 | if ((opline->opcode == ZEND_SWITCH_LONG && Z_TYPE_P(val) != IS_LONG) |
113 | 68 | || (opline->opcode == ZEND_SWITCH_STRING && Z_TYPE_P(val) != IS_STRING)) { |
114 | | /* fallback to next block */ |
115 | 0 | return block->successors[block->successors_count - 1]; |
116 | 0 | } |
117 | 68 | if (opline->opcode == ZEND_MATCH && Z_TYPE_P(val) != IS_LONG && Z_TYPE_P(val) != IS_STRING) { |
118 | | /* always jump to the default arm */ |
119 | 12 | return block->successors[block->successors_count - 1]; |
120 | 12 | } |
121 | 56 | if (Z_TYPE_P(val) == IS_LONG) { |
122 | 28 | zv = zend_hash_index_find(jumptable, Z_LVAL_P(val)); |
123 | 28 | } else { |
124 | 28 | ZEND_ASSERT(Z_TYPE_P(val) == IS_STRING); |
125 | 28 | zv = zend_hash_find(jumptable, Z_STR_P(val)); |
126 | 28 | } |
127 | 56 | if (!zv) { |
128 | | /* default */ |
129 | 36 | return block->successors[block->successors_count - (opline->opcode == ZEND_MATCH ? 1 : 2)]; |
130 | 36 | } |
131 | 20 | return cfg->map[ZEND_OFFSET_TO_OPLINE_NUM(op_array, opline, Z_LVAL_P(zv))]; |
132 | 56 | } |
133 | | |
134 | | static void zend_optimize_block(zend_basic_block *block, zend_op_array *op_array, zend_bitset used_ext, zend_cfg *cfg, zend_op **Tsource, uint32_t *opt_count) |
135 | 608k | { |
136 | 608k | zend_op *opline, *src; |
137 | 608k | zend_op *end, *last_op = NULL; |
138 | | |
139 | 608k | if (block->len == 0) { |
140 | 248 | return; |
141 | 248 | } |
142 | | |
143 | 607k | if (op_array->opcodes[block->start].opcode == ZEND_NOP) { |
144 | | /* remove leading NOPs */ |
145 | 6.57k | strip_leading_nops(op_array, block); |
146 | 6.57k | } |
147 | | |
148 | 607k | opline = op_array->opcodes + block->start; |
149 | 607k | end = opline + block->len; |
150 | 4.46M | while (opline < end) { |
151 | | /* Constant Propagation: strip X = QM_ASSIGN(const) */ |
152 | 3.86M | if (opline->op1_type == IS_TMP_VAR && |
153 | 901k | opline->opcode != ZEND_FREE) { |
154 | 858k | src = VAR_SOURCE(opline->op1); |
155 | 858k | if (src && |
156 | 802k | src->opcode == ZEND_QM_ASSIGN && |
157 | 5.94k | src->op1_type == IS_CONST |
158 | 858k | ) { |
159 | 2.41k | znode_op op1 = opline->op1; |
160 | 2.41k | if (opline->opcode == ZEND_VERIFY_RETURN_TYPE) { |
161 | 2 | COPY_NODE(opline->result, opline->op1); |
162 | 2 | COPY_NODE(opline->op1, src->op1); |
163 | 2 | VAR_SOURCE(op1) = NULL; |
164 | 2 | MAKE_NOP(src); |
165 | 2 | ++(*opt_count); |
166 | 2.41k | } else { |
167 | 2.41k | zval c; |
168 | 2.41k | ZVAL_COPY(&c, &ZEND_OP1_LITERAL(src)); |
169 | 2.41k | if (opline->opcode != ZEND_CASE |
170 | 2.41k | && opline->opcode != ZEND_CASE_STRICT |
171 | 2.41k | && opline->opcode != ZEND_FETCH_LIST_R |
172 | 2.40k | && opline->opcode != ZEND_SWITCH_LONG |
173 | 2.40k | && opline->opcode != ZEND_SWITCH_STRING |
174 | 2.40k | && opline->opcode != ZEND_MATCH |
175 | 2.39k | && opline->opcode != ZEND_MATCH_ERROR |
176 | 2.39k | && zend_optimizer_update_op1_const(op_array, opline, &c)) { |
177 | 2.34k | VAR_SOURCE(op1) = NULL; |
178 | 2.34k | if (opline->opcode != ZEND_JMP_NULL |
179 | 2.33k | && !zend_bitset_in(used_ext, VAR_NUM(src->result.var))) { |
180 | 1.39k | literal_dtor(&ZEND_OP1_LITERAL(src)); |
181 | 1.39k | MAKE_NOP(src); |
182 | 1.39k | } |
183 | 2.34k | ++(*opt_count); |
184 | 2.34k | } else { |
185 | 68 | zval_ptr_dtor_nogc(&c); |
186 | 68 | } |
187 | 2.41k | } |
188 | 2.41k | } |
189 | 858k | } |
190 | | |
191 | | /* Constant Propagation: strip X = QM_ASSIGN(const) */ |
192 | 3.86M | if (opline->op2_type == IS_TMP_VAR) { |
193 | 627k | src = VAR_SOURCE(opline->op2); |
194 | 627k | if (src && |
195 | 583k | src->opcode == ZEND_QM_ASSIGN && |
196 | 126 | src->op1_type == IS_CONST) { |
197 | | |
198 | 98 | znode_op op2 = opline->op2; |
199 | 98 | zval c; |
200 | | |
201 | 98 | ZVAL_COPY(&c, &ZEND_OP1_LITERAL(src)); |
202 | 98 | if (zend_optimizer_update_op2_const(op_array, opline, &c)) { |
203 | 86 | VAR_SOURCE(op2) = NULL; |
204 | 86 | if (!zend_bitset_in(used_ext, VAR_NUM(src->result.var))) { |
205 | 86 | literal_dtor(&ZEND_OP1_LITERAL(src)); |
206 | 86 | MAKE_NOP(src); |
207 | 86 | } |
208 | 86 | ++(*opt_count); |
209 | 86 | } else { |
210 | 12 | zval_ptr_dtor_nogc(&c); |
211 | 12 | } |
212 | 98 | } |
213 | 627k | } |
214 | | |
215 | 3.86M | switch (opline->opcode) { |
216 | 186k | case ZEND_ECHO: |
217 | 186k | if (opline->op1_type & (IS_TMP_VAR|IS_VAR)) { |
218 | 39.7k | src = VAR_SOURCE(opline->op1); |
219 | 39.7k | if (src && |
220 | 36.7k | src->opcode == ZEND_CAST && |
221 | 136 | src->extended_value == IS_STRING) { |
222 | | /* T = CAST(X, String), ECHO(T) => NOP, ECHO(X) */ |
223 | 90 | VAR_SOURCE(opline->op1) = NULL; |
224 | 90 | COPY_NODE(opline->op1, src->op1); |
225 | 90 | MAKE_NOP(src); |
226 | 90 | ++(*opt_count); |
227 | 90 | } |
228 | 146k | } else if (opline->op1_type == IS_CONST && |
229 | 145k | Z_TYPE(ZEND_OP1_LITERAL(opline)) != IS_DOUBLE) { |
230 | 145k | if (last_op == opline - 1) { |
231 | | /* compress consecutive ECHO's. |
232 | | * Float to string conversion may be affected by current |
233 | | * locale setting. |
234 | | */ |
235 | 5.59k | size_t l, old_len; |
236 | | |
237 | 5.59k | if (Z_TYPE(ZEND_OP1_LITERAL(opline)) != IS_STRING) { |
238 | 58 | convert_to_string(&ZEND_OP1_LITERAL(opline)); |
239 | 58 | } |
240 | 5.59k | if (Z_TYPE(ZEND_OP1_LITERAL(last_op)) != IS_STRING) { |
241 | 35 | convert_to_string(&ZEND_OP1_LITERAL(last_op)); |
242 | 35 | } |
243 | 5.59k | old_len = Z_STRLEN(ZEND_OP1_LITERAL(last_op)); |
244 | 5.59k | l = old_len + Z_STRLEN(ZEND_OP1_LITERAL(opline)); |
245 | 5.59k | if (!Z_REFCOUNTED(ZEND_OP1_LITERAL(last_op))) { |
246 | 2.17k | zend_string *tmp = zend_string_alloc(l, 0); |
247 | 2.17k | memcpy(ZSTR_VAL(tmp), Z_STRVAL(ZEND_OP1_LITERAL(last_op)), old_len); |
248 | 2.17k | Z_STR(ZEND_OP1_LITERAL(last_op)) = tmp; |
249 | 3.41k | } else { |
250 | 3.41k | Z_STR(ZEND_OP1_LITERAL(last_op)) = zend_string_extend(Z_STR(ZEND_OP1_LITERAL(last_op)), l, 0); |
251 | 3.41k | } |
252 | 5.59k | Z_TYPE_INFO(ZEND_OP1_LITERAL(last_op)) = IS_STRING_EX; |
253 | 5.59k | memcpy(Z_STRVAL(ZEND_OP1_LITERAL(last_op)) + old_len, Z_STRVAL(ZEND_OP1_LITERAL(opline)), Z_STRLEN(ZEND_OP1_LITERAL(opline))); |
254 | 5.59k | Z_STRVAL(ZEND_OP1_LITERAL(last_op))[l] = '\0'; |
255 | 5.59k | zval_ptr_dtor_nogc(&ZEND_OP1_LITERAL(opline)); |
256 | 5.59k | ZVAL_STR(&ZEND_OP1_LITERAL(opline), zend_new_interned_string(Z_STR(ZEND_OP1_LITERAL(last_op)))); |
257 | 5.59k | ZVAL_NULL(&ZEND_OP1_LITERAL(last_op)); |
258 | 5.59k | MAKE_NOP(last_op); |
259 | 5.59k | ++(*opt_count); |
260 | 5.59k | } |
261 | 145k | last_op = opline; |
262 | 145k | } |
263 | 186k | break; |
264 | | |
265 | 572 | case ZEND_MATCH_ERROR: |
266 | 572 | if (opline->op1_type & (IS_TMP_VAR|IS_VAR)) { |
267 | 236 | src = VAR_SOURCE(opline->op1); |
268 | 236 | VAR_SOURCE(opline->op1) = NULL; |
269 | 236 | } |
270 | 572 | break; |
271 | | |
272 | 64.2k | case ZEND_FREE: |
273 | | /* Note: Only remove the source if the source is local to this block. |
274 | | * If it's not local, then the other blocks successors must also eventually either FREE or consume the temporary, |
275 | | * hence removing the temporary is not safe in the general case, especially when other consumers are not FREE. |
276 | | * A FREE may not be removed without also removing the source's result, because otherwise that would cause a memory leak. */ |
277 | 64.2k | if (opline->extended_value == ZEND_FREE_VOID_CAST) { |
278 | | /* Keep the ZEND_FREE opcode alive. */ |
279 | 64.1k | } else if (opline->op1_type == IS_TMP_VAR) { |
280 | 43.0k | src = VAR_SOURCE(opline->op1); |
281 | 43.0k | if (src) { |
282 | 37.3k | switch (src->opcode) { |
283 | 63 | case ZEND_BOOL: |
284 | 355 | case ZEND_BOOL_NOT: |
285 | | /* T = BOOL(X), FREE(T) => T = BOOL(X) */ |
286 | | /* The remaining BOOL is removed by a separate optimization */ |
287 | | /* The source is a bool, no source removals take place, so this may be done non-locally. */ |
288 | 355 | VAR_SOURCE(opline->op1) = NULL; |
289 | 355 | MAKE_NOP(opline); |
290 | 355 | ++(*opt_count); |
291 | 355 | break; |
292 | 959 | case ZEND_ASSIGN: |
293 | 966 | case ZEND_ASSIGN_DIM: |
294 | 971 | case ZEND_ASSIGN_OBJ: |
295 | 971 | case ZEND_ASSIGN_STATIC_PROP: |
296 | 1.36k | case ZEND_ASSIGN_OP: |
297 | 1.36k | case ZEND_ASSIGN_DIM_OP: |
298 | 1.37k | case ZEND_ASSIGN_OBJ_OP: |
299 | 1.37k | case ZEND_ASSIGN_STATIC_PROP_OP: |
300 | 1.37k | case ZEND_PRE_INC: |
301 | 1.37k | case ZEND_PRE_DEC: |
302 | 1.37k | case ZEND_PRE_INC_OBJ: |
303 | 1.37k | case ZEND_PRE_DEC_OBJ: |
304 | 1.37k | case ZEND_PRE_INC_STATIC_PROP: |
305 | 1.37k | case ZEND_PRE_DEC_STATIC_PROP: |
306 | 1.37k | if (src < op_array->opcodes + block->start) { |
307 | 0 | break; |
308 | 0 | } |
309 | 1.37k | src->result_type = IS_UNUSED; |
310 | 1.37k | VAR_SOURCE(opline->op1) = NULL; |
311 | 1.37k | MAKE_NOP(opline); |
312 | 1.37k | ++(*opt_count); |
313 | 1.37k | break; |
314 | 35.6k | default: |
315 | 35.6k | break; |
316 | 37.3k | } |
317 | 37.3k | } |
318 | 43.0k | } else if (opline->op1_type == IS_VAR) { |
319 | 21.0k | src = VAR_SOURCE(opline->op1); |
320 | | /* V = OP, FREE(V) => OP. NOP */ |
321 | 21.0k | if (src >= op_array->opcodes + block->start && |
322 | 20.0k | src->opcode != ZEND_FETCH_R && |
323 | 20.0k | src->opcode != ZEND_FETCH_STATIC_PROP_R && |
324 | 20.0k | src->opcode != ZEND_FETCH_DIM_R && |
325 | 20.0k | src->opcode != ZEND_FETCH_OBJ_R && |
326 | 20.0k | src->opcode != ZEND_NEW && |
327 | 1.40k | src->opcode != ZEND_FETCH_THIS) { |
328 | 1.40k | src->result_type = IS_UNUSED; |
329 | 1.40k | MAKE_NOP(opline); |
330 | 1.40k | ++(*opt_count); |
331 | 1.40k | if (src->opcode == ZEND_QM_ASSIGN) { |
332 | 32 | if (src->op1_type & (IS_VAR|IS_TMP_VAR)) { |
333 | 0 | src->opcode = ZEND_FREE; |
334 | 32 | } else { |
335 | 32 | MAKE_NOP(src); |
336 | 32 | } |
337 | 32 | } |
338 | 1.40k | } |
339 | 21.0k | } |
340 | 64.2k | break; |
341 | | |
342 | | #if 0 |
343 | | /* pre-evaluate functions: |
344 | | constant(x) |
345 | | function_exists(x) |
346 | | extension_loaded(x) |
347 | | BAD: interacts badly with Accelerator |
348 | | */ |
349 | | if((opline->op1_type & IS_VAR) && |
350 | | VAR_SOURCE(opline->op1) && VAR_SOURCE(opline->op1)->opcode == ZEND_DO_CF_FCALL && |
351 | | VAR_SOURCE(opline->op1)->extended_value == 1) { |
352 | | zend_op *fcall = VAR_SOURCE(opline->op1); |
353 | | zend_op *sv = fcall-1; |
354 | | if(sv >= block->start_opline && sv->opcode == ZEND_SEND_VAL && |
355 | | sv->op1_type == IS_CONST && Z_TYPE(OPLINE_OP1_LITERAL(sv)) == IS_STRING && |
356 | | Z_LVAL(OPLINE_OP2_LITERAL(sv)) == 1 |
357 | | ) { |
358 | | zval *arg = &OPLINE_OP1_LITERAL(sv); |
359 | | char *fname = FUNCTION_CACHE->funcs[Z_LVAL(ZEND_OP1_LITERAL(fcall))].function_name; |
360 | | size_t flen = FUNCTION_CACHE->funcs[Z_LVAL(ZEND_OP1_LITERAL(fcall))].name_len; |
361 | | if((flen == sizeof("function_exists")-1 && zend_binary_strcasecmp(fname, flen, "function_exists", sizeof("function_exists")-1) == 0) || |
362 | | (flen == sizeof("is_callable")-1 && zend_binary_strcasecmp(fname, flen, "is_callable", sizeof("is_callable")-1) == 0) |
363 | | ) { |
364 | | zend_function *function; |
365 | | if((function = zend_hash_find_ptr(EG(function_table), Z_STR_P(arg))) != NULL) { |
366 | | literal_dtor(arg); |
367 | | MAKE_NOP(sv); |
368 | | MAKE_NOP(fcall); |
369 | | LITERAL_BOOL(opline->op1, 1); |
370 | | opline->op1_type = IS_CONST; |
371 | | } |
372 | | } else if(flen == sizeof("constant")-1 && zend_binary_strcasecmp(fname, flen, "constant", sizeof("constant")-1) == 0) { |
373 | | zval c; |
374 | | if (zend_optimizer_get_persistent_constant(Z_STR_P(arg), &c, true ELS_CC)) { |
375 | | literal_dtor(arg); |
376 | | MAKE_NOP(sv); |
377 | | MAKE_NOP(fcall); |
378 | | ZEND_OP1_LITERAL(opline) = zend_optimizer_add_literal(op_array, &c); |
379 | | /* no copy ctor - get already copied it */ |
380 | | opline->op1_type = IS_CONST; |
381 | | } |
382 | | } else if(flen == sizeof("extension_loaded")-1 && zend_binary_strcasecmp(fname, flen, "extension_loaded", sizeof("extension_loaded")-1) == 0) { |
383 | | if(zend_hash_exists(&module_registry, Z_STR_P(arg))) { |
384 | | literal_dtor(arg); |
385 | | MAKE_NOP(sv); |
386 | | MAKE_NOP(fcall); |
387 | | LITERAL_BOOL(opline->op1, 1); |
388 | | opline->op1_type = IS_CONST; |
389 | | } |
390 | | } |
391 | | } |
392 | | } |
393 | | #endif |
394 | | |
395 | 64.2k | case ZEND_FETCH_LIST_R: |
396 | 1.98k | case ZEND_FETCH_LIST_W: |
397 | 1.98k | if (opline->op1_type & (IS_TMP_VAR|IS_VAR)) { |
398 | | /* LIST variable will be deleted later by FREE */ |
399 | 1.68k | Tsource[VAR_NUM(opline->op1.var)] = NULL; |
400 | 1.68k | } |
401 | 1.98k | break; |
402 | | |
403 | 8 | case ZEND_SWITCH_LONG: |
404 | 79 | case ZEND_SWITCH_STRING: |
405 | 393 | case ZEND_MATCH: |
406 | 393 | if (opline->op1_type & (IS_TMP_VAR|IS_VAR)) { |
407 | | /* SWITCH variable will be deleted later by FREE, so we can't optimize it */ |
408 | 137 | Tsource[VAR_NUM(opline->op1.var)] = NULL; |
409 | 137 | break; |
410 | 137 | } |
411 | 256 | if (opline->op1_type == IS_CONST) { |
412 | 68 | uint32_t target = get_const_switch_target(cfg, op_array, block, opline, &ZEND_OP1_LITERAL(opline)); |
413 | 68 | literal_dtor(&ZEND_OP1_LITERAL(opline)); |
414 | 68 | literal_dtor(&ZEND_OP2_LITERAL(opline)); |
415 | 68 | opline->opcode = ZEND_JMP; |
416 | 68 | opline->op1_type = IS_UNUSED; |
417 | 68 | opline->op2_type = IS_UNUSED; |
418 | 68 | block->successors_count = 1; |
419 | 68 | block->successors[0] = target; |
420 | 68 | } |
421 | 256 | break; |
422 | | |
423 | 0 | case ZEND_EXT_STMT: |
424 | 0 | if (opline->op1_type & (IS_TMP_VAR|IS_VAR)) { |
425 | | /* Variable will be deleted later by FREE, so we can't optimize it */ |
426 | 0 | Tsource[VAR_NUM(opline->op1.var)] = NULL; |
427 | 0 | break; |
428 | 0 | } |
429 | 0 | break; |
430 | | |
431 | 173 | case ZEND_CASE: |
432 | 421 | case ZEND_CASE_STRICT: |
433 | 5.28k | case ZEND_COPY_TMP: |
434 | 5.28k | if (opline->op1_type & (IS_TMP_VAR|IS_VAR)) { |
435 | | /* Variable will be deleted later by FREE, so we can't optimize it */ |
436 | 5.28k | Tsource[VAR_NUM(opline->op1.var)] = NULL; |
437 | 5.28k | break; |
438 | 5.28k | } |
439 | 0 | if (opline->op1_type == IS_CONST && |
440 | 0 | opline->op2_type == IS_CONST) { |
441 | 0 | goto optimize_constant_binary_op; |
442 | 0 | } |
443 | | /* |
444 | | * CASE(TRUE, X) => BOOL(X) |
445 | | * CASE(FALSE, X) => BOOL_NOT(X) |
446 | | */ |
447 | 0 | if (opline->op1_type == IS_CONST && |
448 | 0 | (Z_TYPE(ZEND_OP1_LITERAL(opline)) == IS_FALSE || |
449 | 0 | Z_TYPE(ZEND_OP1_LITERAL(opline)) == IS_TRUE)) { |
450 | | /* Optimization of comparison with "null" is not safe, |
451 | | * because ("0" == null) is not equal to !("0") |
452 | | */ |
453 | 0 | opline->opcode = |
454 | 0 | ((opline->opcode != ZEND_IS_NOT_EQUAL) == ((Z_TYPE(ZEND_OP1_LITERAL(opline))) == IS_TRUE)) ? |
455 | 0 | ZEND_BOOL : ZEND_BOOL_NOT; |
456 | 0 | COPY_NODE(opline->op1, opline->op2); |
457 | 0 | SET_UNUSED(opline->op2); |
458 | 0 | ++(*opt_count); |
459 | 0 | goto optimize_bool; |
460 | 0 | } else if (opline->op2_type == IS_CONST && |
461 | 0 | (Z_TYPE(ZEND_OP2_LITERAL(opline)) == IS_FALSE || |
462 | 0 | Z_TYPE(ZEND_OP2_LITERAL(opline)) == IS_TRUE)) { |
463 | | /* Optimization of comparison with "null" is not safe, |
464 | | * because ("0" == null) is not equal to !("0") |
465 | | */ |
466 | 0 | opline->opcode = |
467 | 0 | ((opline->opcode != ZEND_IS_NOT_EQUAL) == ((Z_TYPE(ZEND_OP2_LITERAL(opline))) == IS_TRUE)) ? |
468 | 0 | ZEND_BOOL : ZEND_BOOL_NOT; |
469 | 0 | SET_UNUSED(opline->op2); |
470 | 0 | ++(*opt_count); |
471 | 0 | goto optimize_bool; |
472 | 0 | } |
473 | 0 | break; |
474 | | |
475 | 25.6k | case ZEND_IS_EQUAL: |
476 | 28.9k | case ZEND_IS_NOT_EQUAL: |
477 | 28.9k | if (opline->op1_type == IS_CONST && |
478 | 0 | opline->op2_type == IS_CONST) { |
479 | 0 | goto optimize_constant_binary_op; |
480 | 0 | } |
481 | | /* IS_EQ(TRUE, X) => BOOL(X) |
482 | | * IS_EQ(FALSE, X) => BOOL_NOT(X) |
483 | | * IS_NOT_EQ(TRUE, X) => BOOL_NOT(X) |
484 | | * IS_NOT_EQ(FALSE, X) => BOOL(X) |
485 | | * Those optimizations are not safe if the other operand ends up being NAN |
486 | | * as BOOL/BOOL_NOT will warn, while IS_EQUAL/IS_NOT_EQUAL do not. |
487 | | */ |
488 | 28.9k | break; |
489 | 28.9k | case ZEND_IS_IDENTICAL: |
490 | 2.70k | if (opline->op1_type == IS_CONST && |
491 | 0 | opline->op2_type == IS_CONST) { |
492 | 0 | goto optimize_constant_binary_op; |
493 | 0 | } |
494 | | |
495 | 2.70k | if (opline->op1_type == IS_CONST && |
496 | 0 | (Z_TYPE(ZEND_OP1_LITERAL(opline)) <= IS_TRUE && Z_TYPE(ZEND_OP1_LITERAL(opline)) >= IS_NULL)) { |
497 | | /* IS_IDENTICAL(TRUE, T) => TYPE_CHECK(T, TRUE) |
498 | | * IS_IDENTICAL(FALSE, T) => TYPE_CHECK(T, FALSE) |
499 | | * IS_IDENTICAL(NULL, T) => TYPE_CHECK(T, NULL) |
500 | | */ |
501 | 0 | opline->opcode = ZEND_TYPE_CHECK; |
502 | 0 | opline->extended_value = (1 << Z_TYPE(ZEND_OP1_LITERAL(opline))); |
503 | 0 | COPY_NODE(opline->op1, opline->op2); |
504 | 0 | SET_UNUSED(opline->op2); |
505 | 0 | ++(*opt_count); |
506 | 0 | goto optimize_type_check; |
507 | 2.70k | } else if (opline->op2_type == IS_CONST && |
508 | 1.77k | (Z_TYPE(ZEND_OP2_LITERAL(opline)) <= IS_TRUE && Z_TYPE(ZEND_OP2_LITERAL(opline)) >= IS_NULL)) { |
509 | | /* IS_IDENTICAL(T, TRUE) => TYPE_CHECK(T, TRUE) |
510 | | * IS_IDENTICAL(T, FALSE) => TYPE_CHECK(T, FALSE) |
511 | | * IS_IDENTICAL(T, NULL) => TYPE_CHECK(T, NULL) |
512 | | */ |
513 | 118 | opline->opcode = ZEND_TYPE_CHECK; |
514 | 118 | opline->extended_value = (1 << Z_TYPE(ZEND_OP2_LITERAL(opline))); |
515 | 118 | SET_UNUSED(opline->op2); |
516 | 118 | ++(*opt_count); |
517 | 118 | goto optimize_type_check; |
518 | 118 | } |
519 | 2.58k | break; |
520 | 2.58k | case ZEND_TYPE_CHECK: |
521 | 1.47k | optimize_type_check: |
522 | 1.47k | if (opline->extended_value == (1 << IS_TRUE) || opline->extended_value == (1 << IS_FALSE)) { |
523 | 244 | if (opline->op1_type == IS_TMP_VAR && |
524 | 198 | !zend_bitset_in(used_ext, VAR_NUM(opline->op1.var))) { |
525 | 198 | src = VAR_SOURCE(opline->op1); |
526 | | |
527 | 198 | if (src) { |
528 | 198 | switch (src->opcode) { |
529 | 0 | case ZEND_BOOL: |
530 | 0 | case ZEND_BOOL_NOT: |
531 | | /* T = BOOL(X) + TYPE_CHECK(T, TRUE) -> BOOL(X), NOP |
532 | | * T = BOOL(X) + TYPE_CHECK(T, FALSE) -> BOOL_NOT(X), NOP |
533 | | * T = BOOL_NOT(X) + TYPE_CHECK(T, TRUE) -> BOOL_NOT(X), NOP |
534 | | * T = BOOL_NOT(X) + TYPE_CHECK(T, FALSE) -> BOOL(X), NOP |
535 | | */ |
536 | 0 | src->opcode = |
537 | 0 | ((src->opcode == ZEND_BOOL) == (opline->extended_value == (1 << IS_TRUE))) ? |
538 | 0 | ZEND_BOOL : ZEND_BOOL_NOT; |
539 | 0 | COPY_NODE(src->result, opline->result); |
540 | 0 | SET_VAR_SOURCE(src); |
541 | 0 | MAKE_NOP(opline); |
542 | 0 | ++(*opt_count); |
543 | 0 | break; |
544 | 198 | } |
545 | 198 | } |
546 | 198 | } |
547 | 244 | } |
548 | 1.47k | break; |
549 | | |
550 | 7.55k | case ZEND_BOOL: |
551 | 19.9k | case ZEND_BOOL_NOT: |
552 | 28.1k | optimize_bool: |
553 | 28.1k | if (opline->op1_type == IS_CONST) { |
554 | 2.61k | goto optimize_const_unary_op; |
555 | 2.61k | } |
556 | 25.5k | if (opline->op1_type == IS_TMP_VAR && |
557 | 22.3k | !zend_bitset_in(used_ext, VAR_NUM(opline->op1.var))) { |
558 | 21.4k | src = VAR_SOURCE(opline->op1); |
559 | 21.4k | if (src) { |
560 | 21.4k | switch (src->opcode) { |
561 | 4.29k | case ZEND_BOOL_NOT: |
562 | | /* T = BOOL_NOT(X) + BOOL(T) -> NOP, BOOL_NOT(X) */ |
563 | 4.29k | VAR_SOURCE(opline->op1) = NULL; |
564 | 4.29k | COPY_NODE(opline->op1, src->op1); |
565 | 4.29k | opline->opcode = (opline->opcode == ZEND_BOOL) ? ZEND_BOOL_NOT : ZEND_BOOL; |
566 | 4.29k | MAKE_NOP(src); |
567 | 4.29k | ++(*opt_count); |
568 | 4.29k | goto optimize_bool; |
569 | 3.96k | case ZEND_BOOL: |
570 | | /* T = BOOL(X) + BOOL(T) -> NOP, BOOL(X) */ |
571 | 3.96k | VAR_SOURCE(opline->op1) = NULL; |
572 | 3.96k | COPY_NODE(opline->op1, src->op1); |
573 | 3.96k | MAKE_NOP(src); |
574 | 3.96k | ++(*opt_count); |
575 | 3.96k | goto optimize_bool; |
576 | 245 | case ZEND_IS_EQUAL: |
577 | 245 | if (opline->opcode == ZEND_BOOL_NOT) { |
578 | 0 | src->opcode = ZEND_IS_NOT_EQUAL; |
579 | 0 | } |
580 | 245 | COPY_NODE(src->result, opline->result); |
581 | 245 | SET_VAR_SOURCE(src); |
582 | 245 | MAKE_NOP(opline); |
583 | 245 | ++(*opt_count); |
584 | 245 | break; |
585 | 200 | case ZEND_IS_NOT_EQUAL: |
586 | 200 | if (opline->opcode == ZEND_BOOL_NOT) { |
587 | 0 | src->opcode = ZEND_IS_EQUAL; |
588 | 0 | } |
589 | 200 | COPY_NODE(src->result, opline->result); |
590 | 200 | SET_VAR_SOURCE(src); |
591 | 200 | MAKE_NOP(opline); |
592 | 200 | ++(*opt_count); |
593 | 200 | break; |
594 | 197 | case ZEND_IS_IDENTICAL: |
595 | 197 | if (opline->opcode == ZEND_BOOL_NOT) { |
596 | 0 | src->opcode = ZEND_IS_NOT_IDENTICAL; |
597 | 0 | } |
598 | 197 | COPY_NODE(src->result, opline->result); |
599 | 197 | SET_VAR_SOURCE(src); |
600 | 197 | MAKE_NOP(opline); |
601 | 197 | ++(*opt_count); |
602 | 197 | break; |
603 | 71 | case ZEND_IS_NOT_IDENTICAL: |
604 | 71 | if (opline->opcode == ZEND_BOOL_NOT) { |
605 | 0 | src->opcode = ZEND_IS_IDENTICAL; |
606 | 0 | } |
607 | 71 | COPY_NODE(src->result, opline->result); |
608 | 71 | SET_VAR_SOURCE(src); |
609 | 71 | MAKE_NOP(opline); |
610 | 71 | ++(*opt_count); |
611 | 71 | break; |
612 | 172 | case ZEND_IS_SMALLER: |
613 | 172 | if (opline->opcode == ZEND_BOOL_NOT) { |
614 | 0 | uint8_t tmp_type; |
615 | 0 | uint32_t tmp; |
616 | |
|
617 | 0 | src->opcode = ZEND_IS_SMALLER_OR_EQUAL; |
618 | 0 | tmp_type = src->op1_type; |
619 | 0 | src->op1_type = src->op2_type; |
620 | 0 | src->op2_type = tmp_type; |
621 | 0 | tmp = src->op1.num; |
622 | 0 | src->op1.num = src->op2.num; |
623 | 0 | src->op2.num = tmp; |
624 | 0 | } |
625 | 172 | COPY_NODE(src->result, opline->result); |
626 | 172 | SET_VAR_SOURCE(src); |
627 | 172 | MAKE_NOP(opline); |
628 | 172 | ++(*opt_count); |
629 | 172 | break; |
630 | 273 | case ZEND_IS_SMALLER_OR_EQUAL: |
631 | 273 | if (opline->opcode == ZEND_BOOL_NOT) { |
632 | 0 | uint8_t tmp_type; |
633 | 0 | uint32_t tmp; |
634 | |
|
635 | 0 | src->opcode = ZEND_IS_SMALLER; |
636 | 0 | tmp_type = src->op1_type; |
637 | 0 | src->op1_type = src->op2_type; |
638 | 0 | src->op2_type = tmp_type; |
639 | 0 | tmp = src->op1.num; |
640 | 0 | src->op1.num = src->op2.num; |
641 | 0 | src->op2.num = tmp; |
642 | 0 | } |
643 | 273 | COPY_NODE(src->result, opline->result); |
644 | 273 | SET_VAR_SOURCE(src); |
645 | 273 | MAKE_NOP(opline); |
646 | 273 | ++(*opt_count); |
647 | 273 | break; |
648 | 10 | case ZEND_ISSET_ISEMPTY_CV: |
649 | 28 | case ZEND_ISSET_ISEMPTY_VAR: |
650 | 309 | case ZEND_ISSET_ISEMPTY_DIM_OBJ: |
651 | 373 | case ZEND_ISSET_ISEMPTY_PROP_OBJ: |
652 | 387 | case ZEND_ISSET_ISEMPTY_STATIC_PROP: |
653 | 428 | case ZEND_INSTANCEOF: |
654 | 557 | case ZEND_TYPE_CHECK: |
655 | 564 | case ZEND_DEFINED: |
656 | 564 | case ZEND_IN_ARRAY: |
657 | 594 | case ZEND_ARRAY_KEY_EXISTS: |
658 | 594 | if (opline->opcode == ZEND_BOOL_NOT) { |
659 | 445 | break; |
660 | 445 | } |
661 | 149 | COPY_NODE(src->result, opline->result); |
662 | 149 | SET_VAR_SOURCE(src); |
663 | 149 | MAKE_NOP(opline); |
664 | 149 | ++(*opt_count); |
665 | 149 | break; |
666 | 21.4k | } |
667 | 21.4k | } |
668 | 21.4k | } |
669 | 17.2k | break; |
670 | | |
671 | 31.6k | case ZEND_JMPZ: |
672 | 43.8k | case ZEND_JMPNZ: |
673 | 45.7k | while (1) { |
674 | 45.7k | if (opline->op1_type == IS_CONST) { |
675 | 792 | ++(*opt_count); |
676 | 792 | block->successors_count = 1; |
677 | 792 | if (zend_is_true(&ZEND_OP1_LITERAL(opline)) == |
678 | 792 | (opline->opcode == ZEND_JMPZ)) { |
679 | | |
680 | 364 | MAKE_NOP(opline); |
681 | 364 | block->successors[0] = block->successors[1]; |
682 | 364 | block->len--; |
683 | 364 | cfg->blocks[block->successors[0]].flags |= ZEND_BB_FOLLOW; |
684 | 364 | break; |
685 | 428 | } else { |
686 | 428 | zend_basic_block *next = cfg->blocks + block->successors[1]; |
687 | | |
688 | 428 | next->flags &= ~ZEND_BB_FOLLOW; |
689 | 428 | if (!(next->flags & (ZEND_BB_TARGET|ZEND_BB_PROTECTED))) { |
690 | 364 | next->flags &= ~ZEND_BB_REACHABLE; |
691 | 364 | } |
692 | 428 | opline->opcode = ZEND_JMP; |
693 | 428 | COPY_NODE(opline->op1, opline->op2); |
694 | 428 | break; |
695 | 428 | } |
696 | 44.9k | } else if (opline->op1_type == IS_TMP_VAR && |
697 | 41.8k | !zend_bitset_in(used_ext, VAR_NUM(opline->op1.var))) { |
698 | 41.0k | src = VAR_SOURCE(opline->op1); |
699 | 41.0k | if (src) { |
700 | 41.0k | if (src->opcode == ZEND_BOOL_NOT) { |
701 | 739 | VAR_SOURCE(opline->op1) = NULL; |
702 | 739 | COPY_NODE(opline->op1, src->op1); |
703 | | /* T = BOOL_NOT(X) + JMPZ(T) -> NOP, JMPNZ(X) */ |
704 | 739 | opline->opcode = INV_COND(opline->opcode); |
705 | 739 | MAKE_NOP(src); |
706 | 739 | ++(*opt_count); |
707 | 739 | continue; |
708 | 40.3k | } else if (src->opcode == ZEND_BOOL || |
709 | 39.2k | src->opcode == ZEND_QM_ASSIGN) { |
710 | 1.08k | VAR_SOURCE(opline->op1) = NULL; |
711 | 1.08k | COPY_NODE(opline->op1, src->op1); |
712 | 1.08k | MAKE_NOP(src); |
713 | 1.08k | ++(*opt_count); |
714 | 1.08k | continue; |
715 | 1.08k | } |
716 | 41.0k | } |
717 | 41.0k | } |
718 | 43.0k | break; |
719 | 45.7k | } |
720 | 43.8k | break; |
721 | | |
722 | 2.85k | case ZEND_JMPZ_EX: |
723 | 5.85k | case ZEND_JMPNZ_EX: |
724 | 6.61k | while (1) { |
725 | 6.61k | if (opline->op1_type == IS_CONST) { |
726 | 1.37k | bool is_jmpz_ex = opline->opcode == ZEND_JMPZ_EX; |
727 | 1.37k | if (zend_is_true(&ZEND_OP1_LITERAL(opline)) == is_jmpz_ex) { |
728 | | |
729 | 377 | ++(*opt_count); |
730 | 377 | opline->opcode = ZEND_QM_ASSIGN; |
731 | 377 | zval_ptr_dtor_nogc(&ZEND_OP1_LITERAL(opline)); |
732 | 377 | ZVAL_BOOL(&ZEND_OP1_LITERAL(opline), is_jmpz_ex); |
733 | 377 | opline->op2.num = 0; |
734 | 377 | block->successors_count = 1; |
735 | 377 | block->successors[0] = block->successors[1]; |
736 | 377 | cfg->blocks[block->successors[0]].flags |= ZEND_BB_FOLLOW; |
737 | 377 | break; |
738 | 377 | } |
739 | 5.24k | } else if (opline->op1_type == IS_TMP_VAR && |
740 | 4.94k | (!zend_bitset_in(used_ext, VAR_NUM(opline->op1.var)) || |
741 | 4.30k | opline->result.var == opline->op1.var)) { |
742 | 4.30k | src = VAR_SOURCE(opline->op1); |
743 | 4.30k | if (src) { |
744 | 3.70k | if (src->opcode == ZEND_BOOL || |
745 | 2.94k | src->opcode == ZEND_QM_ASSIGN) { |
746 | 761 | VAR_SOURCE(opline->op1) = NULL; |
747 | 761 | COPY_NODE(opline->op1, src->op1); |
748 | 761 | MAKE_NOP(src); |
749 | 761 | ++(*opt_count); |
750 | 761 | continue; |
751 | 761 | } |
752 | 3.70k | } |
753 | 4.30k | } |
754 | 5.48k | break; |
755 | 6.61k | } |
756 | 5.85k | break; |
757 | | |
758 | 83.4k | case ZEND_CONCAT: |
759 | 115k | case ZEND_FAST_CONCAT: |
760 | 115k | if (opline->op1_type == IS_CONST && |
761 | 26.5k | opline->op2_type == IS_CONST) { |
762 | 0 | goto optimize_constant_binary_op; |
763 | 0 | } |
764 | | |
765 | 115k | if (opline->op2_type == IS_CONST && |
766 | 43.6k | opline->op1_type == IS_TMP_VAR) { |
767 | | |
768 | 29.2k | src = VAR_SOURCE(opline->op1); |
769 | 29.2k | if (src && |
770 | 29.1k | (src->opcode == ZEND_CONCAT || |
771 | 24.2k | src->opcode == ZEND_FAST_CONCAT) && |
772 | 27.2k | src->op2_type == IS_CONST) { |
773 | | /* compress consecutive CONCATs */ |
774 | 1.08k | size_t l, old_len; |
775 | | |
776 | 1.08k | if (Z_TYPE(ZEND_OP2_LITERAL(opline)) != IS_STRING) { |
777 | 0 | convert_to_string(&ZEND_OP2_LITERAL(opline)); |
778 | 0 | } |
779 | 1.08k | if (Z_TYPE(ZEND_OP2_LITERAL(src)) != IS_STRING) { |
780 | 0 | convert_to_string(&ZEND_OP2_LITERAL(src)); |
781 | 0 | } |
782 | | |
783 | 1.08k | VAR_SOURCE(opline->op1) = NULL; |
784 | 1.08k | COPY_NODE(opline->op1, src->op1); |
785 | 1.08k | old_len = Z_STRLEN(ZEND_OP2_LITERAL(src)); |
786 | 1.08k | l = old_len + Z_STRLEN(ZEND_OP2_LITERAL(opline)); |
787 | 1.08k | if (!Z_REFCOUNTED(ZEND_OP2_LITERAL(src))) { |
788 | 320 | zend_string *tmp = zend_string_alloc(l, 0); |
789 | 320 | memcpy(ZSTR_VAL(tmp), Z_STRVAL(ZEND_OP2_LITERAL(src)), old_len); |
790 | 320 | Z_STR(ZEND_OP2_LITERAL(src)) = tmp; |
791 | 763 | } else { |
792 | 763 | Z_STR(ZEND_OP2_LITERAL(src)) = zend_string_extend(Z_STR(ZEND_OP2_LITERAL(src)), l, 0); |
793 | 763 | } |
794 | 1.08k | Z_TYPE_INFO(ZEND_OP2_LITERAL(src)) = IS_STRING_EX; |
795 | 1.08k | memcpy(Z_STRVAL(ZEND_OP2_LITERAL(src)) + old_len, Z_STRVAL(ZEND_OP2_LITERAL(opline)), Z_STRLEN(ZEND_OP2_LITERAL(opline))); |
796 | 1.08k | Z_STRVAL(ZEND_OP2_LITERAL(src))[l] = '\0'; |
797 | 1.08k | zval_ptr_dtor_str(&ZEND_OP2_LITERAL(opline)); |
798 | 1.08k | ZVAL_STR(&ZEND_OP2_LITERAL(opline), zend_new_interned_string(Z_STR(ZEND_OP2_LITERAL(src)))); |
799 | 1.08k | ZVAL_NULL(&ZEND_OP2_LITERAL(src)); |
800 | 1.08k | MAKE_NOP(src); |
801 | 1.08k | ++(*opt_count); |
802 | 1.08k | } |
803 | 29.2k | } |
804 | | |
805 | 115k | if (opline->op1_type & (IS_TMP_VAR|IS_VAR)) { |
806 | 45.4k | src = VAR_SOURCE(opline->op1); |
807 | 45.4k | if (src && |
808 | 45.1k | src->opcode == ZEND_CAST && |
809 | 151 | src->extended_value == IS_STRING && |
810 | 5 | src->op1_type != IS_CONST) { |
811 | | /* convert T1 = CAST(STRING, X), T2 = CONCAT(T1, Y) to T2 = CONCAT(X,Y) */ |
812 | 3 | VAR_SOURCE(opline->op1) = NULL; |
813 | 3 | COPY_NODE(opline->op1, src->op1); |
814 | 3 | MAKE_NOP(src); |
815 | 3 | ++(*opt_count); |
816 | 3 | } |
817 | 45.4k | } |
818 | 115k | if (opline->op2_type & (IS_TMP_VAR|IS_VAR)) { |
819 | 69.6k | src = VAR_SOURCE(opline->op2); |
820 | 69.6k | if (src && |
821 | 69.4k | src->opcode == ZEND_CAST && |
822 | 156 | src->extended_value == IS_STRING && |
823 | 64 | src->op1_type != IS_CONST) { |
824 | | /* convert T1 = CAST(STRING, X), T2 = CONCAT(Y, T1) to T2 = CONCAT(Y,X) */ |
825 | 16 | VAR_SOURCE(opline->op2) = NULL; |
826 | 16 | COPY_NODE(opline->op2, src->op1); |
827 | 16 | MAKE_NOP(src); |
828 | 16 | ++(*opt_count); |
829 | 16 | } |
830 | 69.6k | } |
831 | 115k | if (opline->op1_type == IS_CONST && |
832 | 26.5k | Z_TYPE(ZEND_OP1_LITERAL(opline)) == IS_STRING && |
833 | 26.5k | Z_STRLEN(ZEND_OP1_LITERAL(opline)) == 0) { |
834 | | /* convert CONCAT('', X) => CAST(STRING, X) */ |
835 | 13 | literal_dtor(&ZEND_OP1_LITERAL(opline)); |
836 | 13 | opline->opcode = ZEND_CAST; |
837 | 13 | opline->extended_value = IS_STRING; |
838 | 13 | COPY_NODE(opline->op1, opline->op2); |
839 | 13 | opline->op2_type = IS_UNUSED; |
840 | 13 | opline->op2.var = 0; |
841 | 13 | ++(*opt_count); |
842 | 115k | } else if (opline->op2_type == IS_CONST && |
843 | 43.6k | Z_TYPE(ZEND_OP2_LITERAL(opline)) == IS_STRING && |
844 | 43.6k | Z_STRLEN(ZEND_OP2_LITERAL(opline)) == 0) { |
845 | | /* convert CONCAT(X, '') => CAST(STRING, X) */ |
846 | 22 | literal_dtor(&ZEND_OP2_LITERAL(opline)); |
847 | 22 | opline->opcode = ZEND_CAST; |
848 | 22 | opline->extended_value = IS_STRING; |
849 | 22 | opline->op2_type = IS_UNUSED; |
850 | 22 | opline->op2.var = 0; |
851 | 22 | ++(*opt_count); |
852 | 115k | } else if (opline->opcode == ZEND_CONCAT && |
853 | 83.3k | (opline->op1_type == IS_CONST || |
854 | 68.6k | (opline->op1_type == IS_TMP_VAR && |
855 | 28.8k | VAR_SOURCE(opline->op1) && |
856 | 28.5k | (VAR_SOURCE(opline->op1)->opcode == ZEND_FAST_CONCAT || |
857 | 15.7k | VAR_SOURCE(opline->op1)->opcode == ZEND_ROPE_END || |
858 | 15.6k | VAR_SOURCE(opline->op1)->opcode == ZEND_FETCH_CONSTANT || |
859 | 11.9k | VAR_SOURCE(opline->op1)->opcode == ZEND_FETCH_CLASS_CONSTANT))) && |
860 | 31.3k | (opline->op2_type == IS_CONST || |
861 | 19.6k | (opline->op2_type == IS_TMP_VAR && |
862 | 17.2k | VAR_SOURCE(opline->op2) && |
863 | 17.2k | (VAR_SOURCE(opline->op2)->opcode == ZEND_FAST_CONCAT || |
864 | 17.2k | VAR_SOURCE(opline->op2)->opcode == ZEND_ROPE_END || |
865 | 6.03k | VAR_SOURCE(opline->op2)->opcode == ZEND_FETCH_CONSTANT || |
866 | 25.7k | VAR_SOURCE(opline->op2)->opcode == ZEND_FETCH_CLASS_CONSTANT)))) { |
867 | 25.7k | opline->opcode = ZEND_FAST_CONCAT; |
868 | 25.7k | ++(*opt_count); |
869 | 25.7k | } |
870 | 115k | break; |
871 | | |
872 | 13.1k | case ZEND_ADD: |
873 | 24.8k | case ZEND_SUB: |
874 | 36.1k | case ZEND_MUL: |
875 | 48.8k | case ZEND_DIV: |
876 | 54.2k | case ZEND_MOD: |
877 | 58.7k | case ZEND_SL: |
878 | 60.5k | case ZEND_SR: |
879 | 71.2k | case ZEND_IS_SMALLER: |
880 | 75.0k | case ZEND_IS_SMALLER_OR_EQUAL: |
881 | 75.7k | case ZEND_IS_NOT_IDENTICAL: |
882 | 78.6k | case ZEND_BOOL_XOR: |
883 | 80.9k | case ZEND_BW_OR: |
884 | 97.1k | case ZEND_BW_AND: |
885 | 109k | case ZEND_BW_XOR: |
886 | 109k | if (opline->op1_type == IS_CONST && |
887 | 19.3k | opline->op2_type == IS_CONST) { |
888 | | /* evaluate constant expressions */ |
889 | 14.0k | zval result; |
890 | | |
891 | 14.0k | optimize_constant_binary_op: |
892 | 14.0k | if (zend_optimizer_eval_binary_op(&result, opline->opcode, &ZEND_OP1_LITERAL(opline), &ZEND_OP2_LITERAL(opline)) == SUCCESS) { |
893 | 8 | literal_dtor(&ZEND_OP1_LITERAL(opline)); |
894 | 8 | literal_dtor(&ZEND_OP2_LITERAL(opline)); |
895 | 8 | opline->opcode = ZEND_QM_ASSIGN; |
896 | 8 | SET_UNUSED(opline->op2); |
897 | 8 | zend_optimizer_update_op1_const(op_array, opline, &result); |
898 | 8 | ++(*opt_count); |
899 | 8 | } |
900 | 14.0k | } |
901 | 109k | break; |
902 | | |
903 | 109k | case ZEND_BW_NOT: |
904 | 23.5k | if (opline->op1_type == IS_CONST) { |
905 | | /* evaluate constant unary ops */ |
906 | 253 | zval result; |
907 | | |
908 | 2.86k | optimize_const_unary_op: |
909 | 2.86k | if (zend_optimizer_eval_unary_op(&result, opline->opcode, &ZEND_OP1_LITERAL(opline)) == SUCCESS) { |
910 | 2.59k | literal_dtor(&ZEND_OP1_LITERAL(opline)); |
911 | 2.59k | opline->opcode = ZEND_QM_ASSIGN; |
912 | 2.59k | zend_optimizer_update_op1_const(op_array, opline, &result); |
913 | 2.59k | ++(*opt_count); |
914 | 2.59k | } |
915 | 2.86k | } |
916 | 26.1k | break; |
917 | | |
918 | 26.1k | case ZEND_CAST: |
919 | 3.44k | if (opline->op1_type == IS_CONST) { |
920 | | /* cast of constant operand */ |
921 | 344 | zval result; |
922 | | |
923 | 344 | if (zend_optimizer_eval_cast(&result, opline->extended_value, &ZEND_OP1_LITERAL(opline)) == SUCCESS) { |
924 | 4 | literal_dtor(&ZEND_OP1_LITERAL(opline)); |
925 | 4 | opline->opcode = ZEND_QM_ASSIGN; |
926 | 4 | opline->extended_value = 0; |
927 | 4 | zend_optimizer_update_op1_const(op_array, opline, &result); |
928 | 4 | ++(*opt_count); |
929 | 4 | } |
930 | 344 | } |
931 | 3.44k | break; |
932 | | |
933 | 2.95k | case ZEND_STRLEN: |
934 | 2.95k | if (opline->op1_type == IS_CONST) { |
935 | 20 | zval result; |
936 | | |
937 | 20 | if (zend_optimizer_eval_strlen(&result, &ZEND_OP1_LITERAL(opline)) == SUCCESS) { |
938 | 0 | literal_dtor(&ZEND_OP1_LITERAL(opline)); |
939 | 0 | opline->opcode = ZEND_QM_ASSIGN; |
940 | 0 | zend_optimizer_update_op1_const(op_array, opline, &result); |
941 | 0 | ++(*opt_count); |
942 | 0 | } |
943 | 20 | } |
944 | 2.95k | break; |
945 | | |
946 | 152k | case ZEND_RETURN: |
947 | 152k | if (opline->op1_type == IS_TMP_VAR) { |
948 | 4.20k | src = VAR_SOURCE(opline->op1); |
949 | 4.20k | if (src && src->opcode == ZEND_QM_ASSIGN) { |
950 | 184 | zend_op *op = src + 1; |
951 | 184 | bool optimize = true; |
952 | | |
953 | 184 | while (op < opline) { |
954 | 24 | if ((op->op1_type == opline->op1_type |
955 | 4 | && op->op1.var == opline->op1.var) |
956 | 20 | || (op->op2_type == opline->op1_type |
957 | 24 | && op->op2.var == opline->op1.var)) { |
958 | 24 | optimize = false; |
959 | 24 | break; |
960 | 24 | } |
961 | 0 | op++; |
962 | 0 | } |
963 | | |
964 | 184 | if (optimize) { |
965 | | /* T = QM_ASSIGN(X), RETURN(T) to NOP, RETURN(X) */ |
966 | 160 | VAR_SOURCE(opline->op1) = NULL; |
967 | 160 | COPY_NODE(opline->op1, src->op1); |
968 | 160 | MAKE_NOP(src); |
969 | 160 | ++(*opt_count); |
970 | 160 | } |
971 | 184 | } |
972 | 4.20k | } |
973 | 152k | break; |
974 | | |
975 | 20.6k | case ZEND_QM_ASSIGN: |
976 | 20.6k | if (opline->op1_type == opline->result_type && |
977 | 5.08k | opline->op1.var == opline->result.var) { |
978 | | /* strip T = QM_ASSIGN(T) */ |
979 | 0 | MAKE_NOP(opline); |
980 | 0 | ++(*opt_count); |
981 | 20.6k | } else if (opline->op1_type == IS_TMP_VAR && |
982 | 5.08k | opline->result_type == IS_TMP_VAR && |
983 | 5.08k | !zend_bitset_in(used_ext, VAR_NUM(opline->op1.var))) { |
984 | | /* T1 = ..., T2 = QM_ASSIGN(T1) to T2 = ..., NOP */ |
985 | 2.52k | src = VAR_SOURCE(opline->op1); |
986 | 2.52k | if (src && |
987 | 2.52k | src->opcode != ZEND_COPY_TMP && |
988 | 2.52k | src->opcode != ZEND_ADD_ARRAY_ELEMENT && |
989 | 2.52k | src->opcode != ZEND_ADD_ARRAY_UNPACK && |
990 | 2.52k | (src->opcode != ZEND_DECLARE_LAMBDA_FUNCTION || |
991 | 2.52k | src == opline -1)) { |
992 | 2.52k | src->result.var = opline->result.var; |
993 | 2.52k | VAR_SOURCE(opline->op1) = NULL; |
994 | 2.52k | VAR_SOURCE(opline->result) = src; |
995 | 2.52k | MAKE_NOP(opline); |
996 | 2.52k | ++(*opt_count); |
997 | 2.52k | } |
998 | 2.52k | } |
999 | 20.6k | break; |
1000 | 3.86M | } |
1001 | | |
1002 | | /* get variable source */ |
1003 | 3.86M | if (opline->result_type & (IS_VAR|IS_TMP_VAR)) { |
1004 | 1.87M | SET_VAR_SOURCE(opline); |
1005 | 1.87M | } |
1006 | 3.86M | opline++; |
1007 | 3.86M | } |
1008 | 607k | } |
1009 | | |
1010 | | /* Rebuild plain (optimized) op_array from CFG */ |
1011 | | static void assemble_code_blocks(const zend_cfg *cfg, zend_op_array *op_array, zend_optimizer_ctx *ctx) |
1012 | 106k | { |
1013 | 106k | zend_basic_block *blocks = cfg->blocks; |
1014 | 106k | const zend_basic_block *end = blocks + cfg->blocks_count; |
1015 | 106k | zend_basic_block *b; |
1016 | 106k | zend_op *new_opcodes; |
1017 | 106k | zend_op *opline; |
1018 | 106k | uint32_t len = 0; |
1019 | | |
1020 | 555k | for (b = blocks; b < end; b++) { |
1021 | 448k | if (b->len == 0) { |
1022 | 38.0k | continue; |
1023 | 38.0k | } |
1024 | 410k | if (b->flags & (ZEND_BB_REACHABLE|ZEND_BB_UNREACHABLE_FREE)) { |
1025 | 394k | opline = op_array->opcodes + b->start + b->len - 1; |
1026 | 394k | if (opline->opcode == ZEND_JMP) { |
1027 | 54.6k | const zend_basic_block *next = b + 1; |
1028 | | |
1029 | 66.9k | while (next < end && !(next->flags & ZEND_BB_REACHABLE)) { |
1030 | 12.3k | next++; |
1031 | 12.3k | } |
1032 | 54.6k | if (next < end && next == blocks + b->successors[0]) { |
1033 | | /* JMP to the next block - strip it */ |
1034 | 12 | MAKE_NOP(opline); |
1035 | 12 | b->len--; |
1036 | 12 | } |
1037 | 339k | } else if (b->len == 1 && opline->opcode == ZEND_NOP) { |
1038 | | /* skip empty block */ |
1039 | 0 | b->len--; |
1040 | 0 | } |
1041 | 394k | len += b->len; |
1042 | 394k | } else { |
1043 | | /* this block will not be used, delete all constants there */ |
1044 | 16.6k | const zend_op *op = op_array->opcodes + b->start; |
1045 | 16.6k | const zend_op *last_op = op + b->len; |
1046 | 38.2k | for (; op < last_op; op++) { |
1047 | 21.5k | if (op->op1_type == IS_CONST) { |
1048 | 14.9k | literal_dtor(&ZEND_OP1_LITERAL(op)); |
1049 | 14.9k | } |
1050 | 21.5k | if (op->op2_type == IS_CONST) { |
1051 | 648 | literal_dtor(&ZEND_OP2_LITERAL(op)); |
1052 | 648 | } |
1053 | 21.5k | } |
1054 | 16.6k | } |
1055 | 410k | } |
1056 | | |
1057 | 106k | new_opcodes = emalloc(len * sizeof(zend_op)); |
1058 | 106k | opline = new_opcodes; |
1059 | | |
1060 | | /* Copy code of reachable blocks into a single buffer */ |
1061 | 555k | for (b = blocks; b < end; b++) { |
1062 | 448k | if (b->flags & (ZEND_BB_REACHABLE|ZEND_BB_UNREACHABLE_FREE)) { |
1063 | 394k | memcpy(opline, op_array->opcodes + b->start, b->len * sizeof(zend_op)); |
1064 | 394k | b->start = opline - new_opcodes; |
1065 | 394k | opline += b->len; |
1066 | 394k | } |
1067 | 448k | } |
1068 | | |
1069 | | /* adjust jump targets */ |
1070 | 106k | efree(op_array->opcodes); |
1071 | 106k | op_array->opcodes = new_opcodes; |
1072 | 106k | op_array->last = len; |
1073 | | |
1074 | 555k | for (b = blocks; b < end; b++) { |
1075 | 448k | if (!(b->flags & ZEND_BB_REACHABLE) || b->len == 0) { |
1076 | 54.6k | continue; |
1077 | 54.6k | } |
1078 | 394k | opline = op_array->opcodes + b->start + b->len - 1; |
1079 | 394k | switch (opline->opcode) { |
1080 | 645 | case ZEND_FAST_CALL: |
1081 | 55.2k | case ZEND_JMP: |
1082 | 55.2k | ZEND_SET_OP_JMP_ADDR(opline, opline->op1, new_opcodes + blocks[b->successors[0]].start); |
1083 | 55.2k | break; |
1084 | 18.1k | case ZEND_JMPZ: |
1085 | 27.9k | case ZEND_JMPNZ: |
1086 | 29.6k | case ZEND_JMPZ_EX: |
1087 | 31.2k | case ZEND_JMPNZ_EX: |
1088 | 45.3k | case ZEND_FE_RESET_R: |
1089 | 46.1k | case ZEND_FE_RESET_RW: |
1090 | 47.5k | case ZEND_JMP_SET: |
1091 | 52.2k | case ZEND_COALESCE: |
1092 | 53.6k | case ZEND_ASSERT_CHECK: |
1093 | 94.3k | case ZEND_JMP_NULL: |
1094 | 94.5k | case ZEND_BIND_INIT_STATIC_OR_JMP: |
1095 | 94.5k | case ZEND_JMP_FRAMELESS: |
1096 | 94.5k | ZEND_SET_OP_JMP_ADDR(opline, opline->op2, new_opcodes + blocks[b->successors[0]].start); |
1097 | 94.5k | break; |
1098 | 6.39k | case ZEND_CATCH: |
1099 | 6.39k | if (!(opline->extended_value & ZEND_LAST_CATCH)) { |
1100 | 4.89k | ZEND_SET_OP_JMP_ADDR(opline, opline->op2, new_opcodes + blocks[b->successors[0]].start); |
1101 | 4.89k | } |
1102 | 6.39k | break; |
1103 | 14.1k | case ZEND_FE_FETCH_R: |
1104 | 14.9k | case ZEND_FE_FETCH_RW: |
1105 | 14.9k | opline->extended_value = ZEND_OPLINE_TO_OFFSET(opline, new_opcodes + blocks[b->successors[0]].start); |
1106 | 14.9k | break; |
1107 | 8 | case ZEND_SWITCH_LONG: |
1108 | 63 | case ZEND_SWITCH_STRING: |
1109 | 237 | case ZEND_MATCH: |
1110 | 237 | { |
1111 | 237 | const HashTable *jumptable = Z_ARRVAL(ZEND_OP2_LITERAL(opline)); |
1112 | 237 | zval *zv; |
1113 | 237 | uint32_t s = 0; |
1114 | 237 | ZEND_ASSERT(b->successors_count == (opline->opcode == ZEND_MATCH ? 1 : 2) + zend_hash_num_elements(jumptable)); |
1115 | | |
1116 | 2.17k | ZEND_HASH_FOREACH_VAL(jumptable, zv) { |
1117 | 2.17k | Z_LVAL_P(zv) = ZEND_OPLINE_TO_OFFSET(opline, new_opcodes + blocks[b->successors[s++]].start); |
1118 | 2.17k | } ZEND_HASH_FOREACH_END(); |
1119 | 237 | opline->extended_value = ZEND_OPLINE_TO_OFFSET(opline, new_opcodes + blocks[b->successors[s++]].start); |
1120 | 237 | break; |
1121 | 237 | } |
1122 | 394k | } |
1123 | 394k | } |
1124 | | |
1125 | | /* adjust exception jump targets & remove unused try_catch_array entries */ |
1126 | 106k | if (op_array->last_try_catch) { |
1127 | 27.9k | uint32_t i, j; |
1128 | 27.9k | uint32_t *map; |
1129 | 27.9k | ALLOCA_FLAG(use_heap); |
1130 | | |
1131 | 27.9k | map = (uint32_t *)do_alloca(sizeof(uint32_t) * op_array->last_try_catch, use_heap); |
1132 | 62.5k | for (i = 0, j = 0; i< op_array->last_try_catch; i++) { |
1133 | 34.6k | if (blocks[cfg->map[op_array->try_catch_array[i].try_op]].flags & ZEND_BB_REACHABLE) { |
1134 | 34.6k | map[i] = j; |
1135 | 34.6k | op_array->try_catch_array[j].try_op = blocks[cfg->map[op_array->try_catch_array[i].try_op]].start; |
1136 | 34.6k | if (op_array->try_catch_array[i].catch_op) { |
1137 | 34.0k | op_array->try_catch_array[j].catch_op = blocks[cfg->map[op_array->try_catch_array[i].catch_op]].start; |
1138 | 34.0k | } else { |
1139 | 586 | op_array->try_catch_array[j].catch_op = 0; |
1140 | 586 | } |
1141 | 34.6k | if (op_array->try_catch_array[i].finally_op) { |
1142 | 725 | op_array->try_catch_array[j].finally_op = blocks[cfg->map[op_array->try_catch_array[i].finally_op]].start; |
1143 | 33.8k | } else { |
1144 | 33.8k | op_array->try_catch_array[j].finally_op = 0; |
1145 | 33.8k | } |
1146 | 34.6k | if (!op_array->try_catch_array[i].finally_end) { |
1147 | 33.8k | op_array->try_catch_array[j].finally_end = 0; |
1148 | 33.8k | } else { |
1149 | 725 | op_array->try_catch_array[j].finally_end = blocks[cfg->map[op_array->try_catch_array[i].finally_end]].start; |
1150 | 725 | } |
1151 | 34.6k | j++; |
1152 | 34.6k | } |
1153 | 34.6k | } |
1154 | 27.9k | if (i != j) { |
1155 | 10 | op_array->last_try_catch = j; |
1156 | 10 | if (j == 0) { |
1157 | 6 | efree(op_array->try_catch_array); |
1158 | 6 | op_array->try_catch_array = NULL; |
1159 | 6 | } |
1160 | | |
1161 | 10 | if (op_array->fn_flags & ZEND_ACC_HAS_FINALLY_BLOCK) { |
1162 | 0 | zend_op *finally_opline = new_opcodes; |
1163 | 0 | const zend_op *last_finally_op = finally_opline + len; |
1164 | 0 | while (finally_opline < last_finally_op) { |
1165 | 0 | if (finally_opline->opcode == ZEND_FAST_RET && |
1166 | 0 | finally_opline->op2.num != (uint32_t)-1 && |
1167 | 0 | finally_opline->op2.num < j) { |
1168 | 0 | finally_opline->op2.num = map[finally_opline->op2.num]; |
1169 | 0 | } |
1170 | 0 | finally_opline++; |
1171 | 0 | } |
1172 | 0 | } |
1173 | 10 | } |
1174 | 27.9k | free_alloca(map, use_heap); |
1175 | 27.9k | } |
1176 | | |
1177 | | /* rebuild map (just for printing) */ |
1178 | 106k | memset(cfg->map, -1, sizeof(int) * op_array->last); |
1179 | 555k | for (int n = 0; n < cfg->blocks_count; n++) { |
1180 | 448k | if (cfg->blocks[n].flags & (ZEND_BB_REACHABLE|ZEND_BB_UNREACHABLE_FREE)) { |
1181 | 394k | cfg->map[cfg->blocks[n].start] = n; |
1182 | 394k | } |
1183 | 448k | } |
1184 | 106k | } |
1185 | | |
1186 | | static zend_always_inline zend_basic_block *get_target_block(const zend_cfg *cfg, const zend_basic_block *block, int n, uint32_t *opt_count) |
1187 | 195k | { |
1188 | 195k | int b; |
1189 | 195k | zend_basic_block *target_block = cfg->blocks + block->successors[n]; |
1190 | | |
1191 | 195k | if (target_block->len == 0 && !(target_block->flags & ZEND_BB_PROTECTED)) { |
1192 | 204 | do { |
1193 | 204 | b = target_block->successors[0]; |
1194 | 204 | target_block = cfg->blocks + b; |
1195 | 204 | } while (target_block->len == 0 && !(target_block->flags & ZEND_BB_PROTECTED)); |
1196 | 148 | block->successors[n] = b; |
1197 | 148 | ++(*opt_count); |
1198 | 148 | } |
1199 | 195k | return target_block; |
1200 | 195k | } |
1201 | | |
1202 | | static zend_always_inline zend_basic_block *get_follow_block(const zend_cfg *cfg, const zend_basic_block *block, int n, uint32_t *opt_count) |
1203 | 48.5k | { |
1204 | 48.5k | int b; |
1205 | 48.5k | zend_basic_block *target_block = cfg->blocks + block->successors[n]; |
1206 | | |
1207 | 48.5k | if (target_block->len == 0 && !(target_block->flags & ZEND_BB_PROTECTED)) { |
1208 | 1.08k | do { |
1209 | 1.08k | b = target_block->successors[0]; |
1210 | 1.08k | target_block = cfg->blocks + b; |
1211 | 1.08k | } while (target_block->len == 0 && !(target_block->flags & ZEND_BB_PROTECTED)); |
1212 | 981 | block->successors[n] = b; |
1213 | 981 | ++(*opt_count); |
1214 | 981 | } |
1215 | 48.5k | return target_block; |
1216 | 48.5k | } |
1217 | | |
1218 | | static zend_always_inline zend_basic_block *get_next_block(const zend_cfg *cfg, zend_basic_block *block) |
1219 | 97.4k | { |
1220 | 97.4k | zend_basic_block *next_block = block + 1; |
1221 | 97.4k | const zend_basic_block *end = cfg->blocks + cfg->blocks_count; |
1222 | | |
1223 | 113k | while (1) { |
1224 | 113k | if (next_block == end) { |
1225 | 889 | return NULL; |
1226 | 112k | } else if (next_block->flags & ZEND_BB_REACHABLE) { |
1227 | 96.5k | break; |
1228 | 96.5k | } |
1229 | 15.8k | next_block++; |
1230 | 15.8k | } |
1231 | 96.6k | while (next_block->len == 0 && !(next_block->flags & ZEND_BB_PROTECTED)) { |
1232 | 97 | next_block = cfg->blocks + next_block->successors[0]; |
1233 | 97 | } |
1234 | 96.5k | return next_block; |
1235 | 97.4k | } |
1236 | | |
1237 | | |
1238 | | /* we use "jmp_hitlist" to avoid infinity loops during jmp optimization */ |
1239 | | static zend_always_inline bool in_hitlist(int target, const int *jmp_hitlist, int jmp_hitlist_count) |
1240 | 686 | { |
1241 | 686 | int i; |
1242 | | |
1243 | 854 | for (i = 0; i < jmp_hitlist_count; i++) { |
1244 | 393 | if (jmp_hitlist[i] == target) { |
1245 | 225 | return 1; |
1246 | 225 | } |
1247 | 393 | } |
1248 | 461 | return 0; |
1249 | 686 | } |
1250 | | |
/* Loop guard for jump threading. Must be expanded directly inside a loop and
 * relies on the locals "jmp_hitlist" and "jmp_hitlist_count" being in scope:
 * if "target" was already recorded the enclosing loop is left via break,
 * otherwise "target" is appended to the hitlist. "target" is evaluated more
 * than once, so it must be free of side effects. */
#define CHECK_LOOP(target) \
	if (UNEXPECTED(in_hitlist((target), jmp_hitlist, jmp_hitlist_count))) { \
		break; \
	} else { \
		jmp_hitlist[jmp_hitlist_count++] = (target); \
	}
1257 | | |
1258 | | static void zend_jmp_optimization(zend_basic_block *block, zend_op_array *op_array, const zend_cfg *cfg, int *jmp_hitlist, uint32_t *opt_count) |
1259 | 607k | { |
1260 | | /* last_op is the last opcode of the current block */ |
1261 | 607k | zend_basic_block *target_block, *follow_block, *next_block; |
1262 | 607k | zend_op *last_op, *target; |
1263 | 607k | int next, jmp_hitlist_count; |
1264 | | |
1265 | 607k | if (block->len == 0) { |
1266 | 1.58k | return; |
1267 | 1.58k | } |
1268 | | |
1269 | 606k | last_op = op_array->opcodes + block->start + block->len - 1; |
1270 | 606k | switch (last_op->opcode) { |
1271 | 96.6k | case ZEND_JMP: |
1272 | 96.6k | jmp_hitlist_count = 0; |
1273 | | |
1274 | 96.6k | target_block = get_target_block(cfg, block, 0, opt_count); |
1275 | 96.7k | while (target_block->len == 1) { |
1276 | 51.4k | target = op_array->opcodes + target_block->start; |
1277 | 51.4k | if (target->opcode == ZEND_JMP) { |
1278 | | /* JMP L, L: JMP L1 -> JMP L1 */ |
1279 | 86 | next = target_block->successors[0]; |
1280 | 51.3k | } else { |
1281 | 51.3k | break; |
1282 | 51.3k | } |
1283 | 86 | CHECK_LOOP(next); |
1284 | 47 | block->successors[0] = next; |
1285 | 47 | ++(*opt_count); |
1286 | 47 | target_block = get_target_block(cfg, block, 0, opt_count); |
1287 | 47 | } |
1288 | | |
1289 | 96.6k | next_block = get_next_block(cfg, block); |
1290 | 96.6k | if (target_block == next_block) { |
1291 | | /* JMP(next) -> NOP */ |
1292 | 987 | MAKE_NOP(last_op); |
1293 | 987 | ++(*opt_count); |
1294 | 987 | block->len--; |
1295 | 95.6k | } else if (target_block->len == 1) { |
1296 | 51.1k | target = op_array->opcodes + target_block->start; |
1297 | 51.1k | if ((target->opcode == ZEND_RETURN || |
1298 | 50.9k | target->opcode == ZEND_RETURN_BY_REF || |
1299 | 50.9k | target->opcode == ZEND_GENERATOR_RETURN) && |
1300 | 320 | !(op_array->fn_flags & ZEND_ACC_HAS_FINALLY_BLOCK)) { |
1301 | | /* JMP L, L: RETURN to immediate RETURN */ |
1302 | 52 | *last_op = *target; |
1303 | 52 | if (last_op->op1_type == IS_CONST) { |
1304 | 52 | zval zv; |
1305 | 52 | ZVAL_COPY(&zv, &ZEND_OP1_LITERAL(last_op)); |
1306 | 52 | last_op->op1.constant = zend_optimizer_add_literal(op_array, &zv); |
1307 | 52 | } |
1308 | 52 | block->successors_count = 0; |
1309 | 52 | ++(*opt_count); |
1310 | 52 | } |
1311 | 51.1k | } |
1312 | 96.6k | break; |
1313 | | |
1314 | 2.00k | case ZEND_JMP_SET: |
1315 | 8.64k | case ZEND_COALESCE: |
1316 | 50.0k | case ZEND_JMP_NULL: |
1317 | 50.0k | jmp_hitlist_count = 0; |
1318 | | |
1319 | 50.0k | target_block = get_target_block(cfg, block, 0, opt_count); |
1320 | 50.0k | while (target_block->len == 1) { |
1321 | 5.21k | target = op_array->opcodes + target_block->start; |
1322 | | |
1323 | 5.21k | if (target->opcode == ZEND_JMP) { |
1324 | | /* JMP_SET(X, L), L: JMP(L2) -> JMP_SET(X, L2) */ |
1325 | 32 | next = target_block->successors[0]; |
1326 | 32 | CHECK_LOOP(next); |
1327 | 32 | block->successors[0] = next; |
1328 | 32 | ++(*opt_count); |
1329 | 5.17k | } else { |
1330 | 5.17k | break; |
1331 | 5.17k | } |
1332 | 32 | target_block = get_target_block(cfg, block, 0, opt_count); |
1333 | 32 | } |
1334 | 50.0k | break; |
1335 | | |
1336 | 30.6k | case ZEND_JMPZ: |
1337 | 43.0k | case ZEND_JMPNZ: |
1338 | 43.0k | jmp_hitlist_count = 0; |
1339 | | |
1340 | 43.0k | target_block = get_target_block(cfg, block, 0, opt_count); |
1341 | 43.4k | while (target_block->len == 1) { |
1342 | 29.0k | target = op_array->opcodes + target_block->start; |
1343 | | |
1344 | 29.0k | if (target->opcode == ZEND_JMP) { |
1345 | | /* JMPZ(X, L), L: JMP(L2) -> JMPZ(X, L2) */ |
1346 | 84 | next = target_block->successors[0]; |
1347 | 28.9k | } else if (target->opcode == last_op->opcode && |
1348 | 804 | SAME_VAR(target->op1, last_op->op1)) { |
1349 | | /* JMPZ(X, L), L: JMPZ(X, L2) -> JMPZ(X, L2) */ |
1350 | 454 | next = target_block->successors[0]; |
1351 | 28.4k | } else if (target->opcode == INV_COND(last_op->opcode) && |
1352 | 135 | SAME_VAR(target->op1, last_op->op1)) { |
1353 | | /* JMPZ(X, L), L: JMPNZ(X, L2) -> JMPZ(X, L+1) */ |
1354 | 30 | next = target_block->successors[1]; |
1355 | 28.4k | } else { |
1356 | 28.4k | break; |
1357 | 28.4k | } |
1358 | 568 | CHECK_LOOP(next); |
1359 | 382 | block->successors[0] = next; |
1360 | 382 | ++(*opt_count); |
1361 | 382 | target_block = get_target_block(cfg, block, 0, opt_count); |
1362 | 382 | } |
1363 | | |
1364 | 43.0k | follow_block = get_follow_block(cfg, block, 1, opt_count); |
1365 | 43.0k | if (target_block == follow_block) { |
1366 | | /* L: JMP[N]Z(X, L+1) -> NOP or FREE(X) */ |
1367 | 724 | zend_optimizer_convert_to_free_op1(op_array, last_op); |
1368 | 724 | if (last_op->opcode == ZEND_NOP) { |
1369 | 0 | block->len--; |
1370 | 0 | } |
1371 | 724 | block->successors_count = 1; |
1372 | 724 | ++(*opt_count); |
1373 | 42.3k | } else if (follow_block->len == 1) { |
1374 | 8.58k | target = op_array->opcodes + follow_block->start; |
1375 | 8.58k | if (target->opcode == ZEND_JMP) { |
1376 | 1.06k | if (block->successors[0] == follow_block->successors[0]) { |
1377 | | /* JMPZ(X,L1), JMP(L1) -> NOP, JMP(L1) */ |
1378 | 236 | zend_optimizer_convert_to_free_op1(op_array, last_op); |
1379 | 236 | if (last_op->opcode == ZEND_NOP) { |
1380 | 0 | block->len--; |
1381 | 0 | } |
1382 | 236 | block->successors[0] = follow_block - cfg->blocks; |
1383 | 236 | block->successors_count = 1; |
1384 | 236 | ++(*opt_count); |
1385 | 236 | break; |
1386 | 826 | } else if (!(follow_block->flags & (ZEND_BB_TARGET | ZEND_BB_PROTECTED))) { |
1387 | 826 | next_block = get_next_block(cfg, follow_block); |
1388 | | |
1389 | 826 | if (target_block == next_block) { |
1390 | | /* JMPZ(X,L1) JMP(L2) L1: -> JMPNZ(X,L2) NOP*/ |
1391 | | |
1392 | 424 | last_op->opcode = INV_COND(last_op->opcode); |
1393 | | |
1394 | 424 | block->successors[0] = follow_block->successors[0]; |
1395 | 424 | block->successors[1] = next_block - cfg->blocks; |
1396 | | |
1397 | 424 | follow_block->flags &= ~ZEND_BB_REACHABLE; |
1398 | 424 | MAKE_NOP(target); |
1399 | 424 | follow_block->len = 0; |
1400 | | |
1401 | 424 | next_block->flags |= ZEND_BB_FOLLOW; |
1402 | | |
1403 | 424 | break; |
1404 | 424 | } |
1405 | 826 | } |
1406 | 1.06k | } |
1407 | 8.58k | } |
1408 | 42.4k | break; |
1409 | | |
1410 | 42.4k | case ZEND_JMPNZ_EX: |
1411 | 5.48k | case ZEND_JMPZ_EX: |
1412 | 5.48k | jmp_hitlist_count = 0; |
1413 | | |
1414 | 5.48k | target_block = get_target_block(cfg, block, 0, opt_count); |
1415 | 5.48k | while (target_block->len == 1) { |
1416 | 2.01k | target = op_array->opcodes + target_block->start; |
1417 | | |
1418 | 2.01k | if (target->opcode == ZEND_JMP) { |
1419 | | /* T = JMPZ_EX(X, L), L: JMP(L2) -> T = JMPZ(X, L2) */ |
1420 | 0 | next = target_block->successors[0]; |
1421 | 2.01k | } else if (target->opcode == last_op->opcode-3 && |
1422 | 0 | (SAME_VAR(target->op1, last_op->result) || |
1423 | 0 | SAME_VAR(target->op1, last_op->op1))) { |
1424 | | /* T = JMPZ_EX(X, L1), L1: JMPZ({X|T}, L2) -> T = JMPZ_EX(X, L2) */ |
1425 | 0 | next = target_block->successors[0]; |
1426 | 2.01k | } else if (target->opcode == last_op->opcode && |
1427 | 0 | target->result.var == last_op->result.var && |
1428 | 0 | (SAME_VAR(target->op1, last_op->result) || |
1429 | 0 | SAME_VAR(target->op1, last_op->op1))) { |
1430 | | /* T = JMPZ_EX(X, L1), L1: T = JMPZ_EX({X|T}, L2) -> T = JMPZ_EX(X, L2) */ |
1431 | 0 | next = target_block->successors[0]; |
1432 | 2.01k | } else if (target->opcode == INV_EX_COND(last_op->opcode) && |
1433 | 0 | (SAME_VAR(target->op1, last_op->result) || |
1434 | 0 | SAME_VAR(target->op1, last_op->op1))) { |
1435 | | /* T = JMPZ_EX(X, L1), L1: JMPNZ({X|T1}, L2) -> T = JMPZ_EX(X, L1+1) */ |
1436 | 0 | next = target_block->successors[1]; |
1437 | 2.01k | } else if (target->opcode == INV_EX_COND_EX(last_op->opcode) && |
1438 | 158 | target->result.var == last_op->result.var && |
1439 | 150 | (SAME_VAR(target->op1, last_op->result) || |
1440 | 150 | SAME_VAR(target->op1, last_op->op1))) { |
1441 | | /* T = JMPZ_EX(X, L1), L1: T = JMPNZ_EX({X|T}, L2) -> T = JMPZ_EX(X, L1+1) */ |
1442 | 0 | next = target_block->successors[1]; |
1443 | 2.01k | } else if (target->opcode == ZEND_BOOL && |
1444 | 0 | (SAME_VAR(target->op1, last_op->result) || |
1445 | 0 | SAME_VAR(target->op1, last_op->op1))) { |
1446 | | /* convert Y = JMPZ_EX(X,L1), L1: Z = BOOL(Y) to |
1447 | | Z = JMPZ_EX(X,L1+1) */ |
1448 | | |
1449 | | /* NOTE: This optimization pattern is not safe, but works, */ |
1450 | | /* because result of JMPZ_EX instruction */ |
1451 | | /* is not used on the following path and */ |
1452 | | /* should be used once on the branch path. */ |
1453 | | /* */ |
1454 | | /* The pattern works well only if jumps processed in */ |
1455 | | /* direct order, otherwise it breaks JMPZ_EX */ |
1456 | | /* sequences too early. */ |
1457 | 0 | last_op->result.var = target->result.var; |
1458 | 0 | next = target_block->successors[0]; |
1459 | 2.01k | } else { |
1460 | 2.01k | break; |
1461 | 2.01k | } |
1462 | 0 | CHECK_LOOP(next); |
1463 | 0 | block->successors[0] = next; |
1464 | 0 | ++(*opt_count); |
1465 | 0 | target_block = get_target_block(cfg, block, 0, opt_count); |
1466 | 0 | } |
1467 | | |
1468 | 5.48k | follow_block = get_follow_block(cfg, block, 1, opt_count); |
1469 | 5.48k | if (target_block == follow_block) { |
1470 | | /* L: T = JMP[N]Z_EX(X, L+1) -> T = BOOL(X) */ |
1471 | 0 | last_op->opcode = ZEND_BOOL; |
1472 | 0 | last_op->op2.num = 0; |
1473 | 0 | block->successors_count = 1; |
1474 | 0 | ++(*opt_count); |
1475 | 0 | break; |
1476 | 0 | } |
1477 | 5.48k | break; |
1478 | 606k | } |
1479 | 606k | } |
1480 | | |
1481 | | /* Global data dependencies */ |
1482 | | |
1483 | | /* Find a set of variables which are used outside of the block where they are |
1484 | | * defined. We won't apply some optimization patterns for such variables. */ |
1485 | | static void zend_t_usage(const zend_cfg *cfg, const zend_op_array *op_array, zend_bitset used_ext, zend_optimizer_ctx *ctx) |
1486 | 134k | { |
1487 | 134k | int n; |
1488 | 134k | zend_basic_block *block, *next_block; |
1489 | 134k | uint32_t var_num; |
1490 | 134k | uint32_t bitset_len; |
1491 | 134k | zend_bitset usage; |
1492 | 134k | zend_bitset defined_here; |
1493 | 134k | void *checkpoint; |
1494 | 134k | zend_op *opline, *end; |
1495 | | |
1496 | | |
1497 | 134k | if (op_array->T == 0) { |
1498 | | /* shortcut - if no Ts, nothing to do */ |
1499 | 15.2k | return; |
1500 | 15.2k | } |
1501 | | |
1502 | 119k | checkpoint = zend_arena_checkpoint(ctx->arena); |
1503 | 119k | bitset_len = zend_bitset_len(op_array->last_var + op_array->T); |
1504 | 119k | defined_here = zend_arena_alloc(&ctx->arena, bitset_len * ZEND_BITSET_ELM_SIZE); |
1505 | | |
1506 | 119k | zend_bitset_clear(defined_here, bitset_len); |
1507 | 648k | for (n = 1; n < cfg->blocks_count; n++) { |
1508 | 529k | block = cfg->blocks + n; |
1509 | | |
1510 | 529k | if (!(block->flags & ZEND_BB_REACHABLE)) { |
1511 | 55.3k | continue; |
1512 | 55.3k | } |
1513 | | |
1514 | 473k | opline = op_array->opcodes + block->start; |
1515 | 473k | end = opline + block->len; |
1516 | 473k | if (!(block->flags & ZEND_BB_FOLLOW) || |
1517 | 351k | (block->flags & ZEND_BB_TARGET)) { |
1518 | | /* Skip continuation of "extended" BB */ |
1519 | 244k | zend_bitset_clear(defined_here, bitset_len); |
1520 | 244k | } |
1521 | | |
1522 | 2.64M | while (opline<end) { |
1523 | 2.17M | if (opline->op1_type & (IS_VAR|IS_TMP_VAR)) { |
1524 | 653k | var_num = VAR_NUM(opline->op1.var); |
1525 | 653k | if (!zend_bitset_in(defined_here, var_num)) { |
1526 | 307k | zend_bitset_incl(used_ext, var_num); |
1527 | 307k | } |
1528 | 653k | } |
1529 | 2.17M | if (opline->op2_type == IS_VAR) { |
1530 | 62.8k | var_num = VAR_NUM(opline->op2.var); |
1531 | 62.8k | if (opline->opcode == ZEND_FE_FETCH_R || |
1532 | 62.6k | opline->opcode == ZEND_FE_FETCH_RW) { |
1533 | | /* these opcode use the op2 as result */ |
1534 | 259 | zend_bitset_incl(defined_here, var_num); |
1535 | 62.6k | } else if (!zend_bitset_in(defined_here, var_num)) { |
1536 | 158 | zend_bitset_incl(used_ext, var_num); |
1537 | 158 | } |
1538 | 2.10M | } else if (opline->op2_type == IS_TMP_VAR) { |
1539 | 327k | var_num = VAR_NUM(opline->op2.var); |
1540 | 327k | if (!zend_bitset_in(defined_here, var_num)) { |
1541 | 44.3k | zend_bitset_incl(used_ext, var_num); |
1542 | 44.3k | } |
1543 | 327k | } |
1544 | | |
1545 | 2.17M | if (opline->result_type == IS_VAR) { |
1546 | 145k | var_num = VAR_NUM(opline->result.var); |
1547 | 145k | zend_bitset_incl(defined_here, var_num); |
1548 | 2.02M | } else if (opline->result_type == IS_TMP_VAR) { |
1549 | 904k | var_num = VAR_NUM(opline->result.var); |
1550 | 904k | switch (opline->opcode) { |
1551 | 4.52k | case ZEND_ADD_ARRAY_ELEMENT: |
1552 | 4.57k | case ZEND_ADD_ARRAY_UNPACK: |
1553 | 283k | case ZEND_ROPE_ADD: |
1554 | | /* these opcodes use the result as argument */ |
1555 | 283k | if (!zend_bitset_in(defined_here, var_num)) { |
1556 | 234k | zend_bitset_incl(used_ext, var_num); |
1557 | 234k | } |
1558 | 283k | break; |
1559 | 620k | default : |
1560 | 620k | zend_bitset_incl(defined_here, var_num); |
1561 | 904k | } |
1562 | 904k | } |
1563 | 2.17M | opline++; |
1564 | 2.17M | } |
1565 | 473k | } |
1566 | | |
1567 | 119k | if (ctx->debug_level & ZEND_DUMP_BLOCK_PASS_VARS) { |
1568 | 0 | bool printed = false; |
1569 | 0 | uint32_t i; |
1570 | |
|
1571 | 0 | for (i = op_array->last_var; i< op_array->T; i++) { |
1572 | 0 | if (zend_bitset_in(used_ext, i)) { |
1573 | 0 | if (!printed) { |
1574 | 0 | fprintf(stderr, "NON-LOCAL-VARS: %d", i); |
1575 | 0 | printed = true; |
1576 | 0 | } else { |
1577 | 0 | fprintf(stderr, ", %d", i); |
1578 | 0 | } |
1579 | 0 | } |
1580 | 0 | } |
1581 | 0 | if (printed) { |
1582 | 0 | fprintf(stderr, "\n"); |
1583 | 0 | } |
1584 | 0 | } |
1585 | | |
1586 | 119k | usage = defined_here; |
1587 | 119k | next_block = NULL; |
1588 | 768k | for (n = cfg->blocks_count; n > 0;) { |
1589 | 648k | block = cfg->blocks + (--n); |
1590 | | |
1591 | 648k | if (!(block->flags & ZEND_BB_REACHABLE) || block->len == 0) { |
1592 | 55.5k | continue; |
1593 | 55.5k | } |
1594 | | |
1595 | 592k | end = op_array->opcodes + block->start; |
1596 | 592k | opline = end + block->len - 1; |
1597 | 592k | if (!next_block || |
1598 | 473k | !(next_block->flags & ZEND_BB_FOLLOW) || |
1599 | 364k | (next_block->flags & ZEND_BB_TARGET)) { |
1600 | | /* Skip continuation of "extended" BB */ |
1601 | 364k | zend_bitset_copy(usage, used_ext, bitset_len); |
1602 | 364k | } else if (block->successors_count > 1) { |
1603 | 138k | zend_bitset_union(usage, used_ext, bitset_len); |
1604 | 138k | } |
1605 | 592k | next_block = block; |
1606 | | |
1607 | 4.42M | while (opline >= end) { |
1608 | | /* usage checks */ |
1609 | 3.83M | if (opline->result_type & (IS_VAR|IS_TMP_VAR)) { |
1610 | 1.89M | if (!zend_bitset_in(usage, VAR_NUM(opline->result.var))) { |
1611 | 9.54k | switch (opline->opcode) { |
1612 | 0 | case ZEND_ASSIGN_OP: |
1613 | 0 | case ZEND_ASSIGN_DIM_OP: |
1614 | 0 | case ZEND_ASSIGN_OBJ_OP: |
1615 | 0 | case ZEND_ASSIGN_STATIC_PROP_OP: |
1616 | 0 | case ZEND_PRE_INC: |
1617 | 0 | case ZEND_PRE_DEC: |
1618 | 0 | case ZEND_ASSIGN: |
1619 | 0 | case ZEND_ASSIGN_REF: |
1620 | 0 | case ZEND_DO_FCALL: |
1621 | 0 | case ZEND_DO_ICALL: |
1622 | 0 | case ZEND_DO_UCALL: |
1623 | 0 | case ZEND_DO_FCALL_BY_NAME: |
1624 | 0 | opline->result_type = IS_UNUSED; |
1625 | 0 | break; |
1626 | 0 | case ZEND_POST_INC: |
1627 | 0 | case ZEND_POST_DEC: |
1628 | 0 | case ZEND_POST_INC_OBJ: |
1629 | 0 | case ZEND_POST_DEC_OBJ: |
1630 | 0 | case ZEND_POST_INC_STATIC_PROP: |
1631 | 0 | case ZEND_POST_DEC_STATIC_PROP: |
1632 | 0 | opline->opcode -= 2; |
1633 | 0 | opline->result_type = IS_UNUSED; |
1634 | 0 | break; |
1635 | 902 | case ZEND_QM_ASSIGN: |
1636 | 2.06k | case ZEND_BOOL: |
1637 | 5.13k | case ZEND_BOOL_NOT: |
1638 | 5.13k | zend_optimizer_convert_to_free_op1(op_array, opline); |
1639 | 5.13k | break; |
1640 | 1.96k | case ZEND_JMPZ_EX: |
1641 | 4.31k | case ZEND_JMPNZ_EX: |
1642 | 4.31k | opline->opcode -= 3; |
1643 | 4.31k | SET_UNUSED(opline->result); |
1644 | 4.31k | break; |
1645 | 0 | case ZEND_ADD_ARRAY_ELEMENT: |
1646 | 0 | case ZEND_ADD_ARRAY_UNPACK: |
1647 | 0 | case ZEND_ROPE_ADD: |
1648 | 0 | zend_bitset_incl(usage, VAR_NUM(opline->result.var)); |
1649 | 0 | break; |
1650 | 9.54k | } |
1651 | 1.88M | } else { |
1652 | 1.88M | switch (opline->opcode) { |
1653 | 48.0k | case ZEND_ADD_ARRAY_ELEMENT: |
1654 | 48.3k | case ZEND_ADD_ARRAY_UNPACK: |
1655 | 406k | case ZEND_ROPE_ADD: |
1656 | 406k | break; |
1657 | 1.47M | default: |
1658 | 1.47M | zend_bitset_excl(usage, VAR_NUM(opline->result.var)); |
1659 | 1.47M | break; |
1660 | 1.88M | } |
1661 | 1.88M | } |
1662 | 1.89M | } |
1663 | | |
1664 | 3.83M | if (opline->op2_type == IS_VAR) { |
1665 | 96.8k | switch (opline->opcode) { |
1666 | 239 | case ZEND_FE_FETCH_R: |
1667 | 259 | case ZEND_FE_FETCH_RW: |
1668 | 259 | zend_bitset_excl(usage, VAR_NUM(opline->op2.var)); |
1669 | 259 | break; |
1670 | 96.5k | default: |
1671 | 96.5k | zend_bitset_incl(usage, VAR_NUM(opline->op2.var)); |
1672 | 96.5k | break; |
1673 | 96.8k | } |
1674 | 3.73M | } else if (opline->op2_type == IS_TMP_VAR) { |
1675 | 627k | zend_bitset_incl(usage, VAR_NUM(opline->op2.var)); |
1676 | 627k | } |
1677 | | |
1678 | 3.83M | if (opline->op1_type & (IS_VAR|IS_TMP_VAR)) { |
1679 | 1.09M | zend_bitset_incl(usage, VAR_NUM(opline->op1.var)); |
1680 | 1.09M | } |
1681 | | |
1682 | 3.83M | opline--; |
1683 | 3.83M | } |
1684 | 592k | } |
1685 | | |
1686 | 119k | zend_arena_release(&ctx->arena, checkpoint); |
1687 | 119k | } |
1688 | | |
1689 | | static void zend_merge_blocks(const zend_op_array *op_array, const zend_cfg *cfg, uint32_t *opt_count) |
1690 | 134k | { |
1691 | 134k | int i; |
1692 | 134k | zend_basic_block *b, *bb; |
1693 | 134k | zend_basic_block *prev = NULL; |
1694 | | |
1695 | 801k | for (i = 0; i < cfg->blocks_count; i++) { |
1696 | 667k | b = cfg->blocks + i; |
1697 | 667k | if (b->flags & ZEND_BB_REACHABLE) { |
1698 | 605k | if ((b->flags & ZEND_BB_FOLLOW) && |
1699 | 350k | !(b->flags & (ZEND_BB_TARGET | ZEND_BB_PROTECTED)) && |
1700 | 170k | prev && prev->successors_count == 1 && prev->successors[0] == i) |
1701 | 34.5k | { |
1702 | 34.5k | zend_op *last_op = op_array->opcodes + prev->start + prev->len - 1; |
1703 | 34.5k | if (prev->len != 0 && last_op->opcode == ZEND_JMP) { |
1704 | 0 | MAKE_NOP(last_op); |
1705 | 0 | } |
1706 | | |
1707 | 38.2k | for (bb = prev + 1; bb != b; bb++) { |
1708 | 3.72k | zend_op *op = op_array->opcodes + bb->start; |
1709 | 3.72k | const zend_op *end = op + bb->len; |
1710 | 6.77k | while (op < end) { |
1711 | 3.05k | if (op->op1_type == IS_CONST) { |
1712 | 1.25k | literal_dtor(&ZEND_OP1_LITERAL(op)); |
1713 | 1.25k | } |
1714 | 3.05k | if (op->op2_type == IS_CONST) { |
1715 | 650 | literal_dtor(&ZEND_OP2_LITERAL(op)); |
1716 | 650 | } |
1717 | 3.05k | MAKE_NOP(op); |
1718 | 3.05k | op++; |
1719 | 3.05k | } |
1720 | | /* make block empty */ |
1721 | 3.72k | bb->len = 0; |
1722 | 3.72k | } |
1723 | | |
1724 | | /* re-link */ |
1725 | 34.5k | prev->flags |= (b->flags & ZEND_BB_EXIT); |
1726 | 34.5k | prev->len = b->start + b->len - prev->start; |
1727 | 34.5k | prev->successors_count = b->successors_count; |
1728 | 34.5k | if (b->successors != b->successors_storage) { |
1729 | 50 | prev->successors = b->successors; |
1730 | 50 | b->successors = b->successors_storage; |
1731 | 34.4k | } else { |
1732 | 34.4k | memcpy(prev->successors, b->successors, b->successors_count * sizeof(int)); |
1733 | 34.4k | } |
1734 | | |
1735 | | /* unlink & make block empty and unreachable */ |
1736 | 34.5k | b->flags = 0; |
1737 | 34.5k | b->len = 0; |
1738 | 34.5k | b->successors_count = 0; |
1739 | 34.5k | ++(*opt_count); |
1740 | 571k | } else { |
1741 | 571k | prev = b; |
1742 | 571k | } |
1743 | 605k | } |
1744 | 667k | } |
1745 | 134k | } |
1746 | | |
1747 | 134k | #define PASSES 3 |
1748 | | |
1749 | | void zend_optimize_cfg(zend_op_array *op_array, zend_optimizer_ctx *ctx) |
1750 | 106k | { |
1751 | 106k | zend_cfg cfg; |
1752 | 106k | zend_basic_block *blocks, *end, *b; |
1753 | 106k | int pass; |
1754 | 106k | uint32_t bitset_len; |
1755 | 106k | zend_bitset usage; |
1756 | 106k | void *checkpoint; |
1757 | 106k | zend_op **Tsource; |
1758 | 106k | uint32_t opt_count; |
1759 | 106k | int *jmp_hitlist; |
1760 | | |
1761 | | /* Build CFG */ |
1762 | 106k | checkpoint = zend_arena_checkpoint(ctx->arena); |
1763 | 106k | zend_build_cfg(&ctx->arena, op_array, 0, &cfg); |
1764 | | |
1765 | 106k | if (cfg.blocks_count * (op_array->last_var + op_array->T) > 64 * 1024 * 1024) { |
1766 | 0 | zend_arena_release(&ctx->arena, checkpoint); |
1767 | 0 | return; |
1768 | 0 | } |
1769 | | |
1770 | 106k | if (ctx->debug_level & ZEND_DUMP_BEFORE_BLOCK_PASS) { |
1771 | 0 | zend_dump_op_array(op_array, ZEND_DUMP_CFG, "before block pass", &cfg); |
1772 | 0 | } |
1773 | | |
1774 | 106k | bitset_len = zend_bitset_len(op_array->last_var + op_array->T); |
1775 | 106k | Tsource = zend_arena_calloc(&ctx->arena, op_array->last_var + op_array->T, sizeof(zend_op *)); |
1776 | 106k | usage = zend_arena_alloc(&ctx->arena, bitset_len * ZEND_BITSET_ELM_SIZE); |
1777 | 106k | jmp_hitlist = zend_arena_alloc(&ctx->arena, cfg.blocks_count * sizeof(int)); |
1778 | | |
1779 | 106k | blocks = cfg.blocks; |
1780 | 106k | end = blocks + cfg.blocks_count; |
1781 | 134k | for (pass = 0; pass < PASSES; pass++) { |
1782 | 134k | opt_count = 0; |
1783 | | |
1784 | | /* Compute data dependencies */ |
1785 | 134k | zend_bitset_clear(usage, bitset_len); |
1786 | 134k | zend_t_usage(&cfg, op_array, usage, ctx); |
1787 | | |
1788 | | /* optimize each basic block separately */ |
1789 | 801k | for (b = blocks; b < end; b++) { |
1790 | 667k | if (!(b->flags & ZEND_BB_REACHABLE)) { |
1791 | 58.8k | continue; |
1792 | 58.8k | } |
1793 | | /* we track data dependencies only inside a single basic block */ |
1794 | 608k | if (!(b->flags & ZEND_BB_FOLLOW) || |
1795 | 379k | (b->flags & ZEND_BB_TARGET)) { |
1796 | | /* Skip continuation of "extended" BB */ |
1797 | 379k | memset(Tsource, 0, (op_array->last_var + op_array->T) * sizeof(zend_op *)); |
1798 | 379k | } |
1799 | 608k | zend_optimize_block(b, op_array, usage, &cfg, Tsource, &opt_count); |
1800 | 608k | } |
1801 | | |
1802 | | /* Eliminate NOPs */ |
1803 | 801k | for (b = blocks; b < end; b++) { |
1804 | 667k | if (b->flags & ZEND_BB_UNREACHABLE_FREE) { |
1805 | | /* In unreachable_free blocks only preserve loop var frees. */ |
1806 | 94 | for (uint32_t i = b->start; i < b->start + b->len; i++) { |
1807 | 64 | zend_op *opline = &op_array->opcodes[i]; |
1808 | 64 | if (!zend_optimizer_is_loop_var_free(opline)) { |
1809 | 34 | MAKE_NOP(opline); |
1810 | 34 | } |
1811 | 64 | } |
1812 | 30 | } |
1813 | 667k | if (b->flags & (ZEND_BB_REACHABLE|ZEND_BB_UNREACHABLE_FREE)) { |
1814 | 608k | strip_nops(op_array, b); |
1815 | 608k | } |
1816 | 667k | } |
1817 | | |
1818 | 134k | opt_count = 0; |
1819 | | |
1820 | | /* Jump optimization for each block */ |
1821 | 801k | for (b = blocks; b < end; b++) { |
1822 | 667k | if (b->flags & ZEND_BB_REACHABLE) { |
1823 | 607k | zend_jmp_optimization(b, op_array, &cfg, jmp_hitlist, &opt_count); |
1824 | 607k | } |
1825 | 667k | } |
1826 | | |
1827 | | /* Eliminate unreachable basic blocks */ |
1828 | 134k | zend_cfg_remark_reachable_blocks(op_array, &cfg); |
1829 | | |
1830 | | /* Merge Blocks */ |
1831 | 134k | zend_merge_blocks(op_array, &cfg, &opt_count); |
1832 | | |
1833 | 134k | if (opt_count == 0) { |
1834 | 106k | break; |
1835 | 106k | } |
1836 | 134k | } |
1837 | | |
1838 | 106k | assemble_code_blocks(&cfg, op_array, ctx); |
1839 | | |
1840 | 106k | if (ctx->debug_level & ZEND_DUMP_AFTER_BLOCK_PASS) { |
1841 | 0 | zend_dump_op_array(op_array, ZEND_DUMP_CFG | ZEND_DUMP_HIDE_UNREACHABLE, "after block pass", &cfg); |
1842 | 0 | } |
1843 | | |
1844 | | /* Destroy CFG */ |
1845 | 106k | zend_arena_release(&ctx->arena, checkpoint); |
1846 | 106k | } |