/src/php-src/Zend/Optimizer/zend_cfg.c
Line | Count | Source |
1 | | /* |
2 | | +----------------------------------------------------------------------+ |
3 | | | Zend Engine, CFG - Control Flow Graph | |
4 | | +----------------------------------------------------------------------+ |
5 | | | Copyright (c) The PHP Group | |
6 | | +----------------------------------------------------------------------+ |
7 | | | This source file is subject to version 3.01 of the PHP license, | |
8 | | | that is bundled with this package in the file LICENSE, and is | |
9 | | | available through the world-wide-web at the following url: | |
10 | | | https://www.php.net/license/3_01.txt | |
11 | | | If you did not receive a copy of the PHP license and are unable to | |
12 | | | obtain it through the world-wide-web, please send a note to | |
13 | | | license@php.net so we can mail you a copy immediately. | |
14 | | +----------------------------------------------------------------------+ |
15 | | | Authors: Dmitry Stogov <dmitry@php.net> | |
16 | | +----------------------------------------------------------------------+ |
17 | | */ |
18 | | |
19 | | #include "zend_compile.h" |
20 | | #include "zend_cfg.h" |
21 | | #include "zend_func_info.h" |
22 | | #include "zend_worklist.h" |
23 | | #include "zend_optimizer.h" |
24 | | #include "zend_optimizer_internal.h" |
25 | | #include "zend_sort.h" |
26 | | |
27 | | static void zend_mark_reachable(zend_op *opcodes, zend_cfg *cfg, zend_basic_block *b) /* {{{ */ |
28 | 202k | { |
29 | 202k | zend_basic_block *blocks = cfg->blocks; |
30 | | |
31 | 202k | zend_worklist work; |
32 | 202k | ALLOCA_FLAG(list_use_heap) |
33 | 202k | ZEND_WORKLIST_ALLOCA(&work, cfg->blocks_count, list_use_heap); |
34 | | |
35 | 202k | zend_worklist_push(&work, b - cfg->blocks); |
36 | | |
37 | 831k | while (zend_worklist_len(&work)) { |
38 | 628k | int i; |
39 | 628k | b = cfg->blocks + zend_worklist_pop(&work); |
40 | | |
41 | 628k | b->flags |= ZEND_BB_REACHABLE; |
42 | 628k | if (b->successors_count == 0) { |
43 | 172k | b->flags |= ZEND_BB_EXIT; |
44 | 172k | continue; |
45 | 172k | } |
46 | | |
47 | 1.09M | for (i = 0; i < b->successors_count; i++) { |
48 | 639k | zend_basic_block *succ = blocks + b->successors[i]; |
49 | | |
50 | 639k | if (b->len != 0) { |
51 | 638k | uint8_t opcode = opcodes[b->start + b->len - 1].opcode; |
52 | 638k | if (opcode == ZEND_MATCH) { |
53 | 1.44k | succ->flags |= ZEND_BB_TARGET; |
54 | 637k | } else if (opcode == ZEND_SWITCH_LONG || opcode == ZEND_SWITCH_STRING) { |
55 | 665 | if (i == b->successors_count - 1) { |
56 | 135 | succ->flags |= ZEND_BB_FOLLOW | ZEND_BB_TARGET; |
57 | 530 | } else { |
58 | 530 | succ->flags |= ZEND_BB_TARGET; |
59 | 530 | } |
60 | 636k | } else if (b->successors_count == 1) { |
61 | 272k | if (opcode == ZEND_JMP) { |
62 | 76.1k | succ->flags |= ZEND_BB_TARGET; |
63 | 196k | } else { |
64 | 196k | succ->flags |= ZEND_BB_FOLLOW; |
65 | | |
66 | 196k | if ((cfg->flags & ZEND_CFG_STACKLESS)) { |
67 | 0 | if (opcode == ZEND_INCLUDE_OR_EVAL || |
68 | 0 | opcode == ZEND_GENERATOR_CREATE || |
69 | 0 | opcode == ZEND_YIELD || |
70 | 0 | opcode == ZEND_YIELD_FROM || |
71 | 0 | opcode == ZEND_DO_FCALL || |
72 | 0 | opcode == ZEND_DO_UCALL || |
73 | 0 | opcode == ZEND_DO_FCALL_BY_NAME) { |
74 | 0 | succ->flags |= ZEND_BB_ENTRY; |
75 | 0 | } |
76 | 0 | } |
77 | 196k | if ((cfg->flags & ZEND_CFG_RECV_ENTRY)) { |
78 | 0 | if (opcode == ZEND_RECV || |
79 | 0 | opcode == ZEND_RECV_INIT) { |
80 | 0 | succ->flags |= ZEND_BB_RECV_ENTRY; |
81 | 0 | } |
82 | 0 | } |
83 | 196k | } |
84 | 363k | } else { |
85 | 363k | ZEND_ASSERT(b->successors_count == 2); |
86 | 363k | if (i == 0) { |
87 | 181k | succ->flags |= ZEND_BB_TARGET; |
88 | 181k | } else { |
89 | 181k | succ->flags |= ZEND_BB_FOLLOW; |
90 | 181k | } |
91 | 363k | } |
92 | 638k | } else { |
93 | 415 | succ->flags |= ZEND_BB_FOLLOW; |
94 | 415 | } |
95 | | |
96 | | /* Check reachability of successor */ |
97 | 639k | if (!(succ->flags & ZEND_BB_REACHABLE)) { |
98 | 545k | zend_worklist_push(&work, succ - cfg->blocks); |
99 | 545k | } |
100 | 639k | } |
101 | 455k | } |
102 | | |
103 | 202k | ZEND_WORKLIST_FREE_ALLOCA(&work, list_use_heap); |
104 | 202k | } |
105 | | /* }}} */ |
106 | | |
107 | | static void zend_mark_reachable_blocks(const zend_op_array *op_array, zend_cfg *cfg, int start) /* {{{ */ |
108 | 154k | { |
109 | 154k | zend_basic_block *blocks = cfg->blocks; |
110 | | |
111 | 154k | blocks[start].flags = ZEND_BB_START; |
112 | 154k | zend_mark_reachable(op_array->opcodes, cfg, blocks + start); |
113 | | |
114 | 154k | if (op_array->last_try_catch) { |
115 | 38.5k | zend_basic_block *b; |
116 | 38.5k | int j, changed; |
117 | 38.5k | uint32_t *block_map = cfg->map; |
118 | | |
119 | 76.8k | do { |
120 | 76.8k | changed = 0; |
121 | | |
122 | | /* Add exception paths */ |
123 | 173k | for (j = 0; j < op_array->last_try_catch; j++) { |
124 | | |
125 | | /* check for jumps into the middle of try block */ |
126 | 96.7k | b = blocks + block_map[op_array->try_catch_array[j].try_op]; |
127 | 96.7k | if (!(b->flags & ZEND_BB_REACHABLE)) { |
128 | 30 | zend_basic_block *end; |
129 | | |
130 | 30 | if (op_array->try_catch_array[j].catch_op) { |
131 | 30 | end = blocks + block_map[op_array->try_catch_array[j].catch_op]; |
132 | 70 | while (b != end) { |
133 | 46 | if (b->flags & ZEND_BB_REACHABLE) { |
134 | 6 | op_array->try_catch_array[j].try_op = b->start; |
135 | 6 | break; |
136 | 6 | } |
137 | 40 | b++; |
138 | 40 | } |
139 | 30 | } |
140 | 30 | b = blocks + block_map[op_array->try_catch_array[j].try_op]; |
141 | 30 | if (!(b->flags & ZEND_BB_REACHABLE)) { |
142 | 24 | if (op_array->try_catch_array[j].finally_op) { |
143 | 6 | end = blocks + block_map[op_array->try_catch_array[j].finally_op]; |
144 | 22 | while (b != end) { |
145 | 22 | if (b->flags & ZEND_BB_REACHABLE) { |
146 | | /* In case we get here, there is no live try block but there is a live finally block. |
147 | | * If we do have catch_op set, we need to set it to the first catch block to satisfy |
148 | | * the constraint try_op <= catch_op <= finally_op */ |
149 | 6 | op_array->try_catch_array[j].try_op = |
150 | 6 | op_array->try_catch_array[j].catch_op ? op_array->try_catch_array[j].catch_op : b->start; |
151 | 6 | changed = 1; |
152 | 6 | zend_mark_reachable(op_array->opcodes, cfg, blocks + block_map[op_array->try_catch_array[j].try_op]); |
153 | 6 | break; |
154 | 6 | } |
155 | 16 | b++; |
156 | 16 | } |
157 | 6 | } |
158 | 24 | } |
159 | 30 | } |
160 | | |
161 | 96.7k | b = blocks + block_map[op_array->try_catch_array[j].try_op]; |
162 | 96.7k | if (b->flags & ZEND_BB_REACHABLE) { |
163 | 96.7k | b->flags |= ZEND_BB_TRY; |
164 | 96.7k | if (op_array->try_catch_array[j].catch_op) { |
165 | 95.6k | b = blocks + block_map[op_array->try_catch_array[j].catch_op]; |
166 | 95.6k | b->flags |= ZEND_BB_CATCH; |
167 | 95.6k | if (!(b->flags & ZEND_BB_REACHABLE)) { |
168 | 47.8k | changed = 1; |
169 | 47.8k | zend_mark_reachable(op_array->opcodes, cfg, b); |
170 | 47.8k | } |
171 | 95.6k | } |
172 | 96.7k | if (op_array->try_catch_array[j].finally_op) { |
173 | 1.49k | b = blocks + block_map[op_array->try_catch_array[j].finally_op]; |
174 | 1.49k | b->flags |= ZEND_BB_FINALLY; |
175 | 1.49k | if (!(b->flags & ZEND_BB_REACHABLE)) { |
176 | 176 | changed = 1; |
177 | 176 | zend_mark_reachable(op_array->opcodes, cfg, b); |
178 | 176 | } |
179 | 1.49k | } |
180 | 96.7k | if (op_array->try_catch_array[j].finally_end) { |
181 | 1.49k | b = blocks + block_map[op_array->try_catch_array[j].finally_end]; |
182 | 1.49k | b->flags |= ZEND_BB_FINALLY_END; |
183 | 1.49k | if (!(b->flags & ZEND_BB_REACHABLE)) { |
184 | 256 | changed = 1; |
185 | 256 | zend_mark_reachable(op_array->opcodes, cfg, b); |
186 | 256 | } |
187 | 1.49k | } |
188 | 96.7k | } else { |
189 | 18 | if (op_array->try_catch_array[j].catch_op) { |
190 | 18 | ZEND_ASSERT(!(blocks[block_map[op_array->try_catch_array[j].catch_op]].flags & ZEND_BB_REACHABLE)); |
191 | 18 | } |
192 | 18 | if (op_array->try_catch_array[j].finally_op) { |
193 | 0 | ZEND_ASSERT(!(blocks[block_map[op_array->try_catch_array[j].finally_op]].flags & ZEND_BB_REACHABLE)); |
194 | 0 | } |
195 | 18 | if (op_array->try_catch_array[j].finally_end) { |
196 | 0 | ZEND_ASSERT(!(blocks[block_map[op_array->try_catch_array[j].finally_end]].flags & ZEND_BB_REACHABLE)); |
197 | 0 | } |
198 | 18 | } |
199 | 96.7k | } |
200 | 76.8k | } while (changed); |
201 | 38.5k | } |
202 | | |
203 | 154k | if (cfg->flags & ZEND_FUNC_FREE_LOOP_VAR) { |
204 | 19.4k | zend_basic_block *b; |
205 | 19.4k | int j; |
206 | 19.4k | uint32_t *block_map = cfg->map; |
207 | | |
208 | | /* Mark blocks that are unreachable, but free a loop var created in a reachable block. */ |
209 | 241k | for (b = blocks; b < blocks + cfg->blocks_count; b++) { |
210 | 221k | if (b->flags & ZEND_BB_REACHABLE) { |
211 | 214k | continue; |
212 | 214k | } |
213 | | |
214 | 8.68k | for (j = b->start; j < b->start + b->len; j++) { |
215 | 1.45k | zend_op *opline = &op_array->opcodes[j]; |
216 | 1.45k | if (zend_optimizer_is_loop_var_free(opline)) { |
217 | 40 | zend_op *def_opline = zend_optimizer_get_loop_var_def(op_array, opline); |
218 | 40 | if (def_opline) { |
219 | 40 | uint32_t def_block = block_map[def_opline - op_array->opcodes]; |
220 | 40 | if (blocks[def_block].flags & ZEND_BB_REACHABLE) { |
221 | 32 | b->flags |= ZEND_BB_UNREACHABLE_FREE; |
222 | 32 | break; |
223 | 32 | } |
224 | 40 | } |
225 | 40 | } |
226 | 1.45k | } |
227 | 7.26k | } |
228 | 19.4k | } |
229 | 154k | } |
230 | | /* }}} */ |
231 | | |
232 | | void zend_cfg_remark_reachable_blocks(const zend_op_array *op_array, zend_cfg *cfg) /* {{{ */ |
233 | 64.5k | { |
234 | 64.5k | zend_basic_block *blocks = cfg->blocks; |
235 | 64.5k | int i; |
236 | 64.5k | int start = 0; |
237 | | |
238 | 64.5k | for (i = 0; i < cfg->blocks_count; i++) { |
239 | 64.5k | if (blocks[i].flags & ZEND_BB_REACHABLE) { |
240 | 64.5k | start = i; |
241 | 64.5k | i++; |
242 | 64.5k | break; |
243 | 64.5k | } |
244 | 64.5k | } |
245 | | |
246 | | /* clear all flags */ |
247 | 389k | for (i = 0; i < cfg->blocks_count; i++) { |
248 | 325k | blocks[i].flags = 0; |
249 | 325k | } |
250 | | |
251 | 64.5k | zend_mark_reachable_blocks(op_array, cfg, start); |
252 | 64.5k | } |
253 | | /* }}} */ |
254 | | |
255 | 340k | static void initialize_block(zend_basic_block *block) { |
256 | 340k | block->flags = 0; |
257 | 340k | block->successors = block->successors_storage; |
258 | 340k | block->successors_count = 0; |
259 | 340k | block->predecessors_count = 0; |
260 | 340k | block->predecessor_offset = -1; |
261 | 340k | block->idom = -1; |
262 | 340k | block->loop_header = -1; |
263 | 340k | block->level = -1; |
264 | 340k | block->children = -1; |
265 | 340k | block->next_child = -1; |
266 | 340k | } |
267 | | |
268 | 427k | #define BB_START(i) do { \ |
269 | 427k | if (!block_map[i]) { blocks_count++;} \ |
270 | 427k | block_map[i]++; \ |
271 | 427k | } while (0) |
272 | | |
273 | | ZEND_API void zend_build_cfg(zend_arena **arena, const zend_op_array *op_array, uint32_t build_flags, zend_cfg *cfg) /* {{{ */ |
274 | 89.8k | { |
275 | 89.8k | uint32_t flags = 0; |
276 | 89.8k | uint32_t i; |
277 | 89.8k | uint32_t *block_map; |
278 | 89.8k | zend_function *fn; |
279 | 89.8k | int blocks_count = 0; |
280 | 89.8k | zend_basic_block *blocks; |
281 | 89.8k | zval *zv; |
282 | 89.8k | bool extra_entry_block = false; |
283 | | |
284 | 89.8k | cfg->flags = build_flags & (ZEND_CFG_STACKLESS|ZEND_CFG_RECV_ENTRY); |
285 | | |
286 | 89.8k | cfg->map = block_map = zend_arena_calloc(arena, op_array->last, sizeof(uint32_t)); |
287 | | |
288 | | /* Build CFG, Step 1: Find basic blocks starts, calculate number of blocks */ |
289 | 89.8k | BB_START(0); |
290 | 2.30M | for (i = 0; i < op_array->last; i++) { |
291 | 2.21M | zend_op *opline = op_array->opcodes + i; |
292 | 2.21M | switch (opline->opcode) { |
293 | 19.9k | case ZEND_RECV: |
294 | 22.9k | case ZEND_RECV_INIT: |
295 | 22.9k | if (build_flags & ZEND_CFG_RECV_ENTRY) { |
296 | 0 | BB_START(i + 1); |
297 | 0 | } |
298 | 22.9k | break; |
299 | 98.0k | case ZEND_RETURN: |
300 | 99.2k | case ZEND_RETURN_BY_REF: |
301 | 101k | case ZEND_GENERATOR_RETURN: |
302 | 101k | case ZEND_VERIFY_NEVER_TYPE: |
303 | 101k | if (i + 1 < op_array->last) { |
304 | 12.3k | BB_START(i + 1); |
305 | 12.3k | } |
306 | 101k | break; |
307 | 318 | case ZEND_MATCH_ERROR: |
308 | 2.18k | case ZEND_THROW: |
309 | | /* Don't treat THROW as terminator if it's used in expression context, |
310 | | * as we may lose live ranges when eliminating unreachable code. */ |
311 | 2.18k | if (opline->extended_value != ZEND_THROW_IS_EXPR && i + 1 < op_array->last) { |
312 | 1.40k | BB_START(i + 1); |
313 | 1.40k | } |
314 | 2.18k | break; |
315 | 4.54k | case ZEND_INCLUDE_OR_EVAL: |
316 | 4.54k | flags |= ZEND_FUNC_INDIRECT_VAR_ACCESS; |
317 | 4.54k | ZEND_FALLTHROUGH; |
318 | 6.22k | case ZEND_GENERATOR_CREATE: |
319 | 8.02k | case ZEND_YIELD: |
320 | 8.48k | case ZEND_YIELD_FROM: |
321 | 8.48k | if (build_flags & ZEND_CFG_STACKLESS) { |
322 | 0 | BB_START(i + 1); |
323 | 0 | } |
324 | 8.48k | break; |
325 | 178k | case ZEND_DO_FCALL: |
326 | 187k | case ZEND_DO_UCALL: |
327 | 187k | case ZEND_DO_FCALL_BY_NAME: |
328 | 187k | flags |= ZEND_FUNC_HAS_CALLS; |
329 | 187k | if (build_flags & ZEND_CFG_STACKLESS) { |
330 | 0 | BB_START(i + 1); |
331 | 0 | } |
332 | 187k | break; |
333 | 0 | case ZEND_DO_ICALL: |
334 | 0 | flags |= ZEND_FUNC_HAS_CALLS; |
335 | 0 | break; |
336 | 90.7k | case ZEND_INIT_FCALL: |
337 | 93.2k | case ZEND_INIT_NS_FCALL_BY_NAME: |
338 | 93.2k | zv = CRT_CONSTANT(opline->op2); |
339 | 93.2k | if (opline->opcode == ZEND_INIT_NS_FCALL_BY_NAME) { |
340 | | /* The third literal is the lowercased unqualified name */ |
341 | 2.59k | zv += 2; |
342 | 2.59k | } |
343 | 93.2k | if ((fn = zend_hash_find_ptr(EG(function_table), Z_STR_P(zv))) != NULL) { |
344 | 75.0k | if (fn->type == ZEND_INTERNAL_FUNCTION) { |
345 | 75.0k | flags |= zend_optimizer_classify_function( |
346 | 75.0k | Z_STR_P(zv), opline->extended_value); |
347 | 75.0k | } |
348 | 75.0k | } |
349 | 93.2k | break; |
350 | 475 | case ZEND_FAST_CALL: |
351 | 475 | BB_START(OP_JMP_ADDR(opline, opline->op1) - op_array->opcodes); |
352 | 475 | BB_START(i + 1); |
353 | 475 | break; |
354 | 363 | case ZEND_FAST_RET: |
355 | 363 | if (i + 1 < op_array->last) { |
356 | 363 | BB_START(i + 1); |
357 | 363 | } |
358 | 363 | break; |
359 | 32.5k | case ZEND_JMP: |
360 | 32.5k | BB_START(OP_JMP_ADDR(opline, opline->op1) - op_array->opcodes); |
361 | 32.5k | if (i + 1 < op_array->last) { |
362 | 32.1k | BB_START(i + 1); |
363 | 32.1k | } |
364 | 32.5k | break; |
365 | 11.5k | case ZEND_JMPZ: |
366 | 18.8k | case ZEND_JMPNZ: |
367 | 21.8k | case ZEND_JMPZ_EX: |
368 | 24.2k | case ZEND_JMPNZ_EX: |
369 | 25.7k | case ZEND_JMP_SET: |
370 | 29.3k | case ZEND_COALESCE: |
371 | 30.4k | case ZEND_ASSERT_CHECK: |
372 | 80.2k | case ZEND_JMP_NULL: |
373 | 80.4k | case ZEND_BIND_INIT_STATIC_OR_JMP: |
374 | 80.4k | case ZEND_JMP_FRAMELESS: |
375 | 80.4k | BB_START(OP_JMP_ADDR(opline, opline->op2) - op_array->opcodes); |
376 | 80.4k | BB_START(i + 1); |
377 | 80.4k | break; |
378 | 18.1k | case ZEND_CATCH: |
379 | 18.1k | if (!(opline->extended_value & ZEND_LAST_CATCH)) { |
380 | 2.19k | BB_START(OP_JMP_ADDR(opline, opline->op2) - op_array->opcodes); |
381 | 2.19k | } |
382 | 18.1k | BB_START(i + 1); |
383 | 18.1k | break; |
384 | 7.70k | case ZEND_FE_FETCH_R: |
385 | 8.43k | case ZEND_FE_FETCH_RW: |
386 | 8.43k | BB_START(ZEND_OFFSET_TO_OPLINE_NUM(op_array, opline, opline->extended_value)); |
387 | 8.43k | BB_START(i + 1); |
388 | 8.43k | break; |
389 | 7.70k | case ZEND_FE_RESET_R: |
390 | 8.43k | case ZEND_FE_RESET_RW: |
391 | 8.43k | BB_START(OP_JMP_ADDR(opline, opline->op2) - op_array->opcodes); |
392 | 8.43k | BB_START(i + 1); |
393 | 8.43k | break; |
394 | 8 | case ZEND_SWITCH_LONG: |
395 | 82 | case ZEND_SWITCH_STRING: |
396 | 258 | case ZEND_MATCH: |
397 | 258 | { |
398 | 258 | HashTable *jumptable = Z_ARRVAL_P(CRT_CONSTANT(opline->op2)); |
399 | 258 | zval *zv; |
400 | 2.39k | ZEND_HASH_FOREACH_VAL(jumptable, zv) { |
401 | 2.39k | BB_START(ZEND_OFFSET_TO_OPLINE_NUM(op_array, opline, Z_LVAL_P(zv))); |
402 | 2.39k | } ZEND_HASH_FOREACH_END(); |
403 | 258 | BB_START(ZEND_OFFSET_TO_OPLINE_NUM(op_array, opline, opline->extended_value)); |
404 | 258 | BB_START(i + 1); |
405 | 258 | break; |
406 | 82 | } |
407 | 2.16k | case ZEND_FETCH_R: |
408 | 3.51k | case ZEND_FETCH_W: |
409 | 4.46k | case ZEND_FETCH_RW: |
410 | 4.48k | case ZEND_FETCH_FUNC_ARG: |
411 | 4.52k | case ZEND_FETCH_IS: |
412 | 4.56k | case ZEND_FETCH_UNSET: |
413 | 4.72k | case ZEND_UNSET_VAR: |
414 | 4.93k | case ZEND_ISSET_ISEMPTY_VAR: |
415 | 4.93k | if (opline->extended_value & ZEND_FETCH_LOCAL) { |
416 | 3.83k | flags |= ZEND_FUNC_INDIRECT_VAR_ACCESS; |
417 | 3.83k | } else if ((opline->extended_value & (ZEND_FETCH_GLOBAL | ZEND_FETCH_GLOBAL_LOCK)) && |
418 | 1.09k | !op_array->function_name) { |
419 | 430 | flags |= ZEND_FUNC_INDIRECT_VAR_ACCESS; |
420 | 430 | } |
421 | 4.93k | break; |
422 | 106 | case ZEND_FUNC_GET_ARGS: |
423 | 106 | flags |= ZEND_FUNC_VARARG; |
424 | 106 | break; |
425 | 0 | case ZEND_EXT_STMT: |
426 | 0 | flags |= ZEND_FUNC_HAS_EXTENDED_STMT; |
427 | 0 | break; |
428 | 0 | case ZEND_EXT_FCALL_BEGIN: |
429 | 0 | case ZEND_EXT_FCALL_END: |
430 | 0 | flags |= ZEND_FUNC_HAS_EXTENDED_FCALL; |
431 | 0 | break; |
432 | 52.1k | case ZEND_FREE: |
433 | 60.7k | case ZEND_FE_FREE: |
434 | 60.7k | if (zend_optimizer_is_loop_var_free(opline) |
435 | 8.70k | && ((opline-1)->opcode != ZEND_MATCH_ERROR |
436 | 8.67k | || (opline-1)->extended_value != ZEND_THROW_IS_EXPR)) { |
437 | 8.67k | BB_START(i); |
438 | 8.67k | flags |= ZEND_FUNC_FREE_LOOP_VAR; |
439 | 8.67k | } |
440 | 60.7k | break; |
441 | 2.21M | } |
442 | 2.21M | } |
443 | | |
444 | | /* If the entry block has predecessors, we may need to split it */ |
445 | 89.8k | if ((build_flags & ZEND_CFG_NO_ENTRY_PREDECESSORS) |
446 | 38.4k | && op_array->last > 0 && block_map[0] > 1) { |
447 | 67 | extra_entry_block = true; |
448 | 67 | } |
449 | | |
450 | 89.8k | if (op_array->last_try_catch) { |
451 | 29.2k | for (uint32_t j = 0; j < op_array->last_try_catch; j++) { |
452 | 16.2k | BB_START(op_array->try_catch_array[j].try_op); |
453 | 16.2k | if (op_array->try_catch_array[j].catch_op) { |
454 | 15.9k | BB_START(op_array->try_catch_array[j].catch_op); |
455 | 15.9k | } |
456 | 16.2k | if (op_array->try_catch_array[j].finally_op) { |
457 | 363 | BB_START(op_array->try_catch_array[j].finally_op); |
458 | 363 | } |
459 | 16.2k | if (op_array->try_catch_array[j].finally_end) { |
460 | 363 | BB_START(op_array->try_catch_array[j].finally_end); |
461 | 363 | } |
462 | 16.2k | } |
463 | 12.9k | } |
464 | | |
465 | 89.8k | blocks_count += extra_entry_block; |
466 | 89.8k | cfg->blocks_count = blocks_count; |
467 | | |
468 | | /* Build CFG, Step 2: Build Array of Basic Blocks */ |
469 | 89.8k | cfg->blocks = blocks = zend_arena_calloc(arena, sizeof(zend_basic_block), blocks_count); |
470 | | |
471 | 89.8k | blocks_count = -1; |
472 | | |
473 | 89.8k | if (extra_entry_block) { |
474 | 67 | initialize_block(&blocks[0]); |
475 | 67 | blocks[0].start = 0; |
476 | 67 | blocks[0].len = 0; |
477 | 67 | blocks_count++; |
478 | 67 | } |
479 | | |
480 | 2.30M | for (i = 0; i < op_array->last; i++) { |
481 | 2.21M | if (block_map[i]) { |
482 | 340k | if (blocks_count >= 0) { |
483 | 250k | blocks[blocks_count].len = i - blocks[blocks_count].start; |
484 | 250k | } |
485 | 340k | blocks_count++; |
486 | 340k | initialize_block(&blocks[blocks_count]); |
487 | 340k | blocks[blocks_count].start = i; |
488 | 340k | } |
489 | 2.21M | block_map[i] = blocks_count; |
490 | 2.21M | } |
491 | | |
492 | 89.8k | blocks[blocks_count].len = i - blocks[blocks_count].start; |
493 | 89.8k | blocks_count++; |
494 | | |
495 | | /* Build CFG, Step 3: Calculate successors */ |
496 | 430k | for (int j = 0; j < blocks_count; j++) { |
497 | 340k | zend_basic_block *block = &blocks[j]; |
498 | 340k | zend_op *opline; |
499 | 340k | if (block->len == 0) { |
500 | 67 | block->successors_count = 1; |
501 | 67 | block->successors[0] = j + 1; |
502 | 67 | continue; |
503 | 67 | } |
504 | | |
505 | 340k | opline = op_array->opcodes + block->start + block->len - 1; |
506 | 340k | switch (opline->opcode) { |
507 | 363 | case ZEND_FAST_RET: |
508 | 98.4k | case ZEND_RETURN: |
509 | 99.6k | case ZEND_RETURN_BY_REF: |
510 | 101k | case ZEND_GENERATOR_RETURN: |
511 | 103k | case ZEND_THROW: |
512 | 103k | case ZEND_MATCH_ERROR: |
513 | 103k | case ZEND_VERIFY_NEVER_TYPE: |
514 | 103k | break; |
515 | 32.5k | case ZEND_JMP: |
516 | 32.5k | block->successors_count = 1; |
517 | 32.5k | block->successors[0] = block_map[OP_JMP_ADDR(opline, opline->op1) - op_array->opcodes]; |
518 | 32.5k | break; |
519 | 11.5k | case ZEND_JMPZ: |
520 | 18.8k | case ZEND_JMPNZ: |
521 | 21.8k | case ZEND_JMPZ_EX: |
522 | 24.2k | case ZEND_JMPNZ_EX: |
523 | 25.7k | case ZEND_JMP_SET: |
524 | 29.3k | case ZEND_COALESCE: |
525 | 30.4k | case ZEND_ASSERT_CHECK: |
526 | 80.2k | case ZEND_JMP_NULL: |
527 | 80.4k | case ZEND_BIND_INIT_STATIC_OR_JMP: |
528 | 80.4k | case ZEND_JMP_FRAMELESS: |
529 | 80.4k | block->successors_count = 2; |
530 | 80.4k | block->successors[0] = block_map[OP_JMP_ADDR(opline, opline->op2) - op_array->opcodes]; |
531 | 80.4k | block->successors[1] = j + 1; |
532 | 80.4k | break; |
533 | 18.1k | case ZEND_CATCH: |
534 | 18.1k | if (!(opline->extended_value & ZEND_LAST_CATCH)) { |
535 | 2.19k | block->successors_count = 2; |
536 | 2.19k | block->successors[0] = block_map[OP_JMP_ADDR(opline, opline->op2) - op_array->opcodes]; |
537 | 2.19k | block->successors[1] = j + 1; |
538 | 15.9k | } else { |
539 | 15.9k | block->successors_count = 1; |
540 | 15.9k | block->successors[0] = j + 1; |
541 | 15.9k | } |
542 | 18.1k | break; |
543 | 7.70k | case ZEND_FE_FETCH_R: |
544 | 8.43k | case ZEND_FE_FETCH_RW: |
545 | 8.43k | block->successors_count = 2; |
546 | 8.43k | block->successors[0] = block_map[ZEND_OFFSET_TO_OPLINE_NUM(op_array, opline, opline->extended_value)]; |
547 | 8.43k | block->successors[1] = j + 1; |
548 | 8.43k | break; |
549 | 7.70k | case ZEND_FE_RESET_R: |
550 | 8.43k | case ZEND_FE_RESET_RW: |
551 | 8.43k | block->successors_count = 2; |
552 | 8.43k | block->successors[0] = block_map[OP_JMP_ADDR(opline, opline->op2) - op_array->opcodes]; |
553 | 8.43k | block->successors[1] = j + 1; |
554 | 8.43k | break; |
555 | 475 | case ZEND_FAST_CALL: |
556 | 475 | block->successors_count = 2; |
557 | 475 | block->successors[0] = block_map[OP_JMP_ADDR(opline, opline->op1) - op_array->opcodes]; |
558 | 475 | block->successors[1] = j + 1; |
559 | 475 | break; |
560 | 8 | case ZEND_SWITCH_LONG: |
561 | 82 | case ZEND_SWITCH_STRING: |
562 | 258 | case ZEND_MATCH: |
563 | 258 | { |
564 | 258 | HashTable *jumptable = Z_ARRVAL_P(CRT_CONSTANT(opline->op2)); |
565 | 258 | zval *zv; |
566 | 258 | uint32_t s = 0; |
567 | | |
568 | 258 | block->successors_count = (opline->opcode == ZEND_MATCH ? 1 : 2) + zend_hash_num_elements(jumptable); |
569 | 258 | block->successors = zend_arena_calloc(arena, block->successors_count, sizeof(int)); |
570 | | |
571 | 2.39k | ZEND_HASH_FOREACH_VAL(jumptable, zv) { |
572 | 2.39k | block->successors[s++] = block_map[ZEND_OFFSET_TO_OPLINE_NUM(op_array, opline, Z_LVAL_P(zv))]; |
573 | 2.39k | } ZEND_HASH_FOREACH_END(); |
574 | | |
575 | 258 | block->successors[s++] = block_map[ZEND_OFFSET_TO_OPLINE_NUM(op_array, opline, opline->extended_value)]; |
576 | 258 | if (opline->opcode != ZEND_MATCH) { |
577 | 82 | block->successors[s++] = j + 1; |
578 | 82 | } |
579 | 258 | break; |
580 | 82 | } |
581 | 88.1k | default: |
582 | 88.1k | block->successors_count = 1; |
583 | 88.1k | block->successors[0] = j + 1; |
584 | 88.1k | break; |
585 | 340k | } |
586 | 340k | } |
587 | | |
588 | | /* Build CFG, Step 4, Mark Reachable Basic Blocks */ |
589 | 89.8k | cfg->flags |= flags; |
590 | 89.8k | zend_mark_reachable_blocks(op_array, cfg, 0); |
591 | 89.8k | } |
592 | | /* }}} */ |
593 | | |
594 | | ZEND_API void zend_cfg_build_predecessors(zend_arena **arena, zend_cfg *cfg) /* {{{ */ |
595 | 37.0k | { |
596 | 37.0k | int j, s, edges; |
597 | 37.0k | zend_basic_block *b; |
598 | 37.0k | zend_basic_block *blocks = cfg->blocks; |
599 | 37.0k | zend_basic_block *end = blocks + cfg->blocks_count; |
600 | 37.0k | int *predecessors; |
601 | | |
602 | 37.0k | edges = 0; |
603 | 152k | for (b = blocks; b < end; b++) { |
604 | 115k | b->predecessors_count = 0; |
605 | 115k | } |
606 | 152k | for (b = blocks; b < end; b++) { |
607 | 115k | if (!(b->flags & ZEND_BB_REACHABLE)) { |
608 | 10 | b->successors_count = 0; |
609 | 10 | b->predecessors_count = 0; |
610 | 115k | } else { |
611 | 233k | for (s = 0; s < b->successors_count; s++) { |
612 | 117k | edges++; |
613 | 117k | blocks[b->successors[s]].predecessors_count++; |
614 | 117k | } |
615 | 115k | } |
616 | 115k | } |
617 | | |
618 | 37.0k | cfg->edges_count = edges; |
619 | 37.0k | cfg->predecessors = predecessors = (int*)zend_arena_calloc(arena, sizeof(int), edges); |
620 | | |
621 | 37.0k | edges = 0; |
622 | 152k | for (b = blocks; b < end; b++) { |
623 | 115k | if (b->flags & ZEND_BB_REACHABLE) { |
624 | 115k | b->predecessor_offset = edges; |
625 | 115k | edges += b->predecessors_count; |
626 | 115k | b->predecessors_count = 0; |
627 | 115k | } |
628 | 115k | } |
629 | | |
630 | 152k | for (j = 0; j < cfg->blocks_count; j++) { |
631 | 115k | if (blocks[j].flags & ZEND_BB_REACHABLE) { |
632 | | /* SWITCH_STRING/LONG may have few identical successors */ |
633 | 233k | for (s = 0; s < blocks[j].successors_count; s++) { |
634 | 117k | int duplicate = 0; |
635 | 117k | int p; |
636 | | |
637 | 158k | for (p = 0; p < s; p++) { |
638 | 40.9k | if (blocks[j].successors[p] == blocks[j].successors[s]) { |
639 | 93 | duplicate = 1; |
640 | 93 | break; |
641 | 93 | } |
642 | 40.9k | } |
643 | 117k | if (!duplicate) { |
644 | 117k | zend_basic_block *b = blocks + blocks[j].successors[s]; |
645 | | |
646 | 117k | predecessors[b->predecessor_offset + b->predecessors_count] = j; |
647 | 117k | b->predecessors_count++; |
648 | 117k | } |
649 | 117k | } |
650 | 115k | } |
651 | 115k | } |
652 | 37.0k | } |
653 | | /* }}} */ |
654 | | |
655 | | /* Computes a postorder numbering of the CFG */ |
656 | | static void compute_postnum_recursive( |
657 | | int *postnum, int *cur, const zend_cfg *cfg, int block_num) /* {{{ */ |
658 | 122k | { |
659 | 122k | int s; |
660 | 122k | zend_basic_block *block = &cfg->blocks[block_num]; |
661 | 122k | if (postnum[block_num] != -1) { |
662 | 38.7k | return; |
663 | 38.7k | } |
664 | | |
665 | 84.1k | postnum[block_num] = -2; /* Marker for "currently visiting" */ |
666 | 201k | for (s = 0; s < block->successors_count; s++) { |
667 | 117k | compute_postnum_recursive(postnum, cur, cfg, block->successors[s]); |
668 | 117k | } |
669 | 84.1k | postnum[block_num] = (*cur)++; |
670 | 84.1k | } |
671 | | /* }}} */ |
672 | | |
673 | | /* Computes dominator tree using algorithm from "A Simple, Fast Dominance Algorithm" by |
674 | | * Cooper, Harvey and Kennedy. */ |
675 | | ZEND_API void zend_cfg_compute_dominators_tree(const zend_op_array *op_array, zend_cfg *cfg) /* {{{ */ |
676 | 37.0k | { |
677 | 37.0k | zend_basic_block *blocks = cfg->blocks; |
678 | 37.0k | int blocks_count = cfg->blocks_count; |
679 | 37.0k | int j, k, changed; |
680 | | |
681 | 37.0k | if (cfg->blocks_count == 1) { |
682 | 31.4k | blocks[0].level = 0; |
683 | 31.4k | return; |
684 | 31.4k | } |
685 | | |
686 | 5.55k | ALLOCA_FLAG(use_heap) |
687 | 5.55k | int *postnum = do_alloca(sizeof(int) * cfg->blocks_count, use_heap); |
688 | 5.55k | memset(postnum, -1, sizeof(int) * cfg->blocks_count); |
689 | 5.55k | j = 0; |
690 | 5.55k | compute_postnum_recursive(postnum, &j, cfg, 0); |
691 | | |
692 | | /* FIXME: move declarations */ |
693 | 5.55k | blocks[0].idom = 0; |
694 | 13.3k | do { |
695 | 13.3k | changed = 0; |
696 | | /* Iterating in RPO here would converge faster */ |
697 | 190k | for (j = 1; j < blocks_count; j++) { |
698 | 176k | int idom = -1; |
699 | | |
700 | 176k | if ((blocks[j].flags & ZEND_BB_REACHABLE) == 0) { |
701 | 18 | continue; |
702 | 18 | } |
703 | 438k | for (k = 0; k < blocks[j].predecessors_count; k++) { |
704 | 261k | int pred = cfg->predecessors[blocks[j].predecessor_offset + k]; |
705 | | |
706 | 261k | if (blocks[pred].idom >= 0) { |
707 | 242k | if (idom < 0) { |
708 | 165k | idom = pred; |
709 | 165k | } else { |
710 | 153k | while (idom != pred) { |
711 | 196k | while (postnum[pred] < postnum[idom]) pred = blocks[pred].idom; |
712 | 81.1k | while (postnum[idom] < postnum[pred]) idom = blocks[idom].idom; |
713 | 76.7k | } |
714 | 76.5k | } |
715 | 242k | } |
716 | 261k | } |
717 | | |
718 | 176k | if (idom >= 0 && blocks[j].idom != idom) { |
719 | 78.6k | blocks[j].idom = idom; |
720 | 78.6k | changed = 1; |
721 | 78.6k | } |
722 | 176k | } |
723 | 13.3k | } while (changed); |
724 | 5.55k | blocks[0].idom = -1; |
725 | | |
726 | 84.1k | for (j = 1; j < blocks_count; j++) { |
727 | 78.6k | if ((blocks[j].flags & ZEND_BB_REACHABLE) == 0) { |
728 | 10 | continue; |
729 | 10 | } |
730 | 78.6k | if (blocks[j].idom >= 0) { |
731 | | /* Sort by block number to traverse children in pre-order */ |
732 | 78.6k | if (blocks[blocks[j].idom].children < 0 || |
733 | 41.4k | j < blocks[blocks[j].idom].children) { |
734 | 41.4k | blocks[j].next_child = blocks[blocks[j].idom].children; |
735 | 41.4k | blocks[blocks[j].idom].children = j; |
736 | 41.4k | } else { |
737 | 37.1k | int k = blocks[blocks[j].idom].children; |
738 | 40.6k | while (blocks[k].next_child >=0 && j > blocks[k].next_child) { |
739 | 3.44k | k = blocks[k].next_child; |
740 | 3.44k | } |
741 | 37.1k | blocks[j].next_child = blocks[k].next_child; |
742 | 37.1k | blocks[k].next_child = j; |
743 | 37.1k | } |
744 | 78.6k | } |
745 | 78.6k | } |
746 | | |
747 | 89.7k | for (j = 0; j < blocks_count; j++) { |
748 | 84.1k | int idom = blocks[j].idom, level = 0; |
749 | 84.1k | if ((blocks[j].flags & ZEND_BB_REACHABLE) == 0) { |
750 | 10 | continue; |
751 | 10 | } |
752 | 86.5k | while (idom >= 0) { |
753 | 80.9k | level++; |
754 | 80.9k | if (blocks[idom].level >= 0) { |
755 | 78.6k | level += blocks[idom].level; |
756 | 78.6k | break; |
757 | 78.6k | } else { |
758 | 2.36k | idom = blocks[idom].idom; |
759 | 2.36k | } |
760 | 80.9k | } |
761 | 84.1k | blocks[j].level = level; |
762 | 84.1k | } |
763 | | |
764 | 5.55k | free_alloca(postnum, use_heap); |
765 | 5.55k | } |
766 | | /* }}} */ |
767 | | |
768 | | static bool dominates(zend_basic_block *blocks, int a, int b) /* {{{ */ |
769 | 40.3k | { |
770 | 63.7k | while (blocks[b].level > blocks[a].level) { |
771 | 23.4k | b = blocks[b].idom; |
772 | 23.4k | } |
773 | 40.3k | return a == b; |
774 | 40.3k | } |
775 | | /* }}} */ |
776 | | |
777 | | ZEND_API void zend_cfg_identify_loops(const zend_op_array *op_array, zend_cfg *cfg) /* {{{ */ |
778 | 37.0k | { |
779 | 37.0k | int i, j, k, n; |
780 | 37.0k | int time; |
781 | 37.0k | zend_basic_block *blocks = cfg->blocks; |
782 | 37.0k | int *entry_times, *exit_times; |
783 | 37.0k | zend_worklist work; |
784 | 37.0k | int flag = ZEND_FUNC_NO_LOOPS; |
785 | 37.0k | int *sorted_blocks; |
786 | 37.0k | ALLOCA_FLAG(list_use_heap) |
787 | 37.0k | ALLOCA_FLAG(tree_use_heap) |
788 | | |
789 | 37.0k | if (cfg->blocks_count == 1) { |
790 | 31.4k | cfg->flags |= flag; |
791 | 31.4k | return; |
792 | 31.4k | } |
793 | | |
794 | 5.55k | ZEND_WORKLIST_ALLOCA(&work, cfg->blocks_count, list_use_heap); |
795 | | |
796 | | /* We don't materialize the DJ spanning tree explicitly, as we are only interested in ancestor |
797 | | * queries. These are implemented by checking entry/exit times of the DFS search. */ |
798 | 5.55k | entry_times = do_alloca(3 * sizeof(int) * cfg->blocks_count, tree_use_heap); |
799 | 5.55k | exit_times = entry_times + cfg->blocks_count; |
800 | 5.55k | sorted_blocks = exit_times + cfg->blocks_count; |
801 | 5.55k | memset(entry_times, -1, 2 * sizeof(int) * cfg->blocks_count); |
802 | | |
803 | 5.55k | zend_worklist_push(&work, 0); |
804 | 5.55k | time = 0; |
805 | 89.7k | while (zend_worklist_len(&work)) { |
806 | 162k | next: |
807 | 162k | i = zend_worklist_peek(&work); |
808 | 162k | if (entry_times[i] == -1) { |
809 | 84.1k | entry_times[i] = time++; |
810 | 84.1k | } |
811 | | /* Visit blocks immediately dominated by i. */ |
812 | 248k | for (j = blocks[i].children; j >= 0; j = blocks[j].next_child) { |
813 | 131k | if (zend_worklist_push(&work, j)) { |
814 | 46.2k | goto next; |
815 | 46.2k | } |
816 | 131k | } |
817 | | /* Visit join edges. */ |
818 | 234k | for (j = 0; j < blocks[i].successors_count; j++) { |
819 | 149k | int succ = blocks[i].successors[j]; |
820 | 149k | if (blocks[succ].idom == i) { |
821 | 76.9k | continue; |
822 | 76.9k | } else if (zend_worklist_push(&work, succ)) { |
823 | 32.3k | goto next; |
824 | 32.3k | } |
825 | 149k | } |
826 | 84.1k | exit_times[i] = time++; |
827 | 84.1k | zend_worklist_pop(&work); |
828 | 84.1k | } |
829 | | |
830 | | /* Sort blocks by level, which is the opposite order in which we want to process them */ |
831 | 5.55k | sorted_blocks[0] = 0; |
832 | 5.55k | j = 0; |
833 | 5.55k | n = 1; |
834 | 50.6k | while (j != n) { |
835 | 45.0k | i = j; |
836 | 45.0k | j = n; |
837 | 129k | for (; i < j; i++) { |
838 | 84.1k | int child; |
839 | 162k | for (child = blocks[sorted_blocks[i]].children; child >= 0; child = blocks[child].next_child) { |
840 | 78.6k | sorted_blocks[n++] = child; |
841 | 78.6k | } |
842 | 84.1k | } |
843 | 45.0k | } |
844 | | |
845 | | /* Identify loops. See Sreedhar et al, "Identifying Loops Using DJ Graphs". */ |
846 | 89.7k | while (n > 0) { |
847 | 84.1k | i = sorted_blocks[--n]; |
848 | | |
849 | 84.1k | if (blocks[i].predecessors_count < 2) { |
850 | | /* loop header has at least two input edges */ |
851 | 47.4k | continue; |
852 | 47.4k | } |
853 | | |
854 | 112k | for (j = 0; j < blocks[i].predecessors_count; j++) { |
855 | 75.3k | int pred = cfg->predecessors[blocks[i].predecessor_offset + j]; |
856 | | |
857 | | /* A join edge is one for which the predecessor does not |
858 | | immediately dominate the successor. */ |
859 | 75.3k | if (blocks[i].idom == pred) { |
860 | 34.9k | continue; |
861 | 34.9k | } |
862 | | |
863 | | /* In a loop back-edge (back-join edge), the successor dominates |
864 | | the predecessor. */ |
865 | 40.3k | if (dominates(blocks, i, pred)) { |
866 | 4.72k | blocks[i].flags |= ZEND_BB_LOOP_HEADER; |
867 | 4.72k | flag &= ~ZEND_FUNC_NO_LOOPS; |
868 | 4.72k | if (!zend_worklist_len(&work)) { |
869 | 4.33k | zend_bitset_clear(work.visited, zend_bitset_len(cfg->blocks_count)); |
870 | 4.33k | } |
871 | 4.72k | zend_worklist_push(&work, pred); |
872 | 35.6k | } else { |
873 | | /* Otherwise it's a cross-join edge. See if it's a branch |
874 | | to an ancestor on the DJ spanning tree. */ |
875 | 35.6k | if (entry_times[pred] > entry_times[i] && exit_times[pred] < exit_times[i]) { |
876 | 0 | blocks[i].flags |= ZEND_BB_IRREDUCIBLE_LOOP; |
877 | 0 | flag |= ZEND_FUNC_IRREDUCIBLE; |
878 | 0 | flag &= ~ZEND_FUNC_NO_LOOPS; |
879 | 0 | } |
880 | 35.6k | } |
881 | 40.3k | } |
882 | 58.3k | while (zend_worklist_len(&work)) { |
883 | 21.6k | j = zend_worklist_pop(&work); |
884 | 22.8k | while (blocks[j].loop_header >= 0) { |
885 | 1.16k | j = blocks[j].loop_header; |
886 | 1.16k | } |
887 | 21.6k | if (j != i) { |
888 | 16.7k | if (blocks[j].idom < 0 && j != 0) { |
889 | | /* Ignore blocks that are unreachable or only abnormally reachable. */ |
890 | 0 | continue; |
891 | 0 | } |
892 | 16.7k | blocks[j].loop_header = i; |
893 | 39.7k | for (k = 0; k < blocks[j].predecessors_count; k++) { |
894 | 22.9k | zend_worklist_push(&work, cfg->predecessors[blocks[j].predecessor_offset + k]); |
895 | 22.9k | } |
896 | 16.7k | } |
897 | 21.6k | } |
898 | 36.6k | } |
899 | | |
900 | 5.55k | free_alloca(entry_times, tree_use_heap); |
901 | 5.55k | ZEND_WORKLIST_FREE_ALLOCA(&work, list_use_heap); |
902 | | |
903 | 5.55k | cfg->flags |= flag; |
904 | 5.55k | } |
905 | | /* }}} */ |