Coverage Report

Created: 2025-12-14 06:09

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/php-src/Zend/Optimizer/dce.c
Line
Count
Source
1
/*
2
   +----------------------------------------------------------------------+
3
   | Zend Engine, DCE - Dead Code Elimination                             |
4
   +----------------------------------------------------------------------+
5
   | Copyright (c) The PHP Group                                          |
6
   +----------------------------------------------------------------------+
7
   | This source file is subject to version 3.01 of the PHP license,      |
8
   | that is bundled with this package in the file LICENSE, and is        |
9
   | available through the world-wide-web at the following url:           |
10
   | https://www.php.net/license/3_01.txt                                 |
11
   | If you did not receive a copy of the PHP license and are unable to   |
12
   | obtain it through the world-wide-web, please send a note to          |
13
   | license@php.net so we can mail you a copy immediately.               |
14
   +----------------------------------------------------------------------+
15
   | Authors: Nikita Popov <nikic@php.net>                                |
16
   |          Dmitry Stogov <dmitry@php.net>                              |
17
   +----------------------------------------------------------------------+
18
*/
19
20
#include "Optimizer/zend_optimizer_internal.h"
21
#include "Optimizer/zend_inference.h"
22
#include "Optimizer/zend_ssa.h"
23
#include "Optimizer/zend_func_info.h"
24
#include "Optimizer/zend_call_graph.h"
25
#include "zend_bitset.h"
26
27
/* This pass implements a form of dead code elimination (DCE). The algorithm optimistically assumes
28
 * that all instructions and phis are dead. Instructions with immediate side-effects are then marked
29
 * as live. We then recursively (using a worklist) propagate liveness to the instructions that def
30
 * the used operands.
31
 *
32
 * Notes:
33
 *  * This pass does not perform unreachable code elimination. This happens as part of the SCCP
34
 *    pass.
35
 *  * The DCE is performed without taking control-dependence into account, i.e. all conditional
36
 *    branches are assumed to be live. It's possible to take control-dependence into account using
37
 *    the DCE algorithm described by Cytron et al., however it requires the construction of a
38
 *    postdominator tree and of postdominance frontiers, which does not seem worthwhile at this
39
 *    point.
40
 *  * We separate intrinsic side-effects from potential side-effects in the form of notices thrown
41
 *    by the instruction (in case we want to make this configurable). See may_have_side_effects() and
42
 *    zend_may_throw().
43
 *  * We often cannot DCE assignments and unsets while guaranteeing that dtors run in the same
44
 *    order. There is an optimization option to allow reordering of dtor effects.
45
 *  * The algorithm is able to eliminate dead modifications of non-escaping arrays
46
 *    and objects as well as dead array and object allocations.
47
 */
48
49
/* Working state shared by the helpers of a single DCE run over one op_array. */
typedef struct {
50
  /* SSA form of the function being processed. */
  zend_ssa *ssa;
51
  /* The function whose opcodes are being eliminated. */
  zend_op_array *op_array;
52
  /* Bit i set: instruction op_array->opcodes[i] is currently considered dead. */
  zend_bitset instr_dead;
53
  /* Bit v set: the phi defining SSA variable v is currently considered dead. */
  zend_bitset phi_dead;
54
  /* Instructions (by opcode index) whose operands still have to be marked live. */
  zend_bitset instr_worklist;
55
  /* Phis (by SSA variable number) whose sources still have to be marked live. */
  zend_bitset phi_worklist;
56
  /* Phis (by SSA variable number) that have a "no-val" use; they are kept alive in a
   * separate step after instruction elimination. */
  zend_bitset phi_worklist_no_val;
57
  /* Length, in zend_ulong words, of the instruction-indexed bitsets. */
  uint32_t instr_worklist_len;
58
  /* Length, in zend_ulong words, of the SSA-variable-indexed bitsets. */
  uint32_t phi_worklist_len;
59
  /* When set, eliminations that may change the point at which a destructor runs are
   * allowed. */
  unsigned reorder_dtor_effects : 1;
60
} context;
61
62
16.9k
/* Returns true when a modification of a variable has to be treated as a side effect:
 * either the write is not tracked by SSA (def < 0), or the SSA variable being
 * overwritten (use) may be a reference.
 *
 * use: SSA variable number read/overwritten by the instruction.
 * def: SSA variable number defined by the instruction, or a negative value if none. */
static inline bool is_bad_mod(const zend_ssa *ssa, int use, int def) {
63
16.9k
  if (def < 0) {
64
    /* This modification is not tracked by SSA, assume the worst */
65
3.11k
    return true;
66
3.11k
  }
67
13.8k
  if (ssa->var_info[use].type & MAY_BE_REF) {
68
    /* Modification of reference may have side-effect */
69
5.95k
    return true;
70
5.95k
  }
71
7.85k
  return false;
72
13.8k
}
73
74
/* Decides whether `opline` has an effect other than producing its result, in which case
 * DCE must keep it even when the result is unused. Opcodes that are not listed are
 * conservatively reported as having side effects. Whether the instruction may throw is
 * not considered here; the caller checks zend_may_throw() separately.
 *
 * ssa_op:               SSA operand information belonging to opline.
 * reorder_dtor_effects: when false, assignments whose removal might change when a
 *                       destructor runs are also reported as having side effects. */
static inline bool may_have_side_effects(
75
    const zend_op_array *op_array, const zend_ssa *ssa,
76
    const zend_op *opline, const zend_ssa_op *ssa_op,
77
384k
    bool reorder_dtor_effects) {
78
384k
  switch (opline->opcode) {
79
1.64k
    case ZEND_NOP:
80
1.69k
    case ZEND_IS_IDENTICAL:
81
1.71k
    case ZEND_IS_NOT_IDENTICAL:
82
3.15k
    case ZEND_QM_ASSIGN:
83
5.08k
    case ZEND_FE_FREE:
84
5.15k
    case ZEND_TYPE_CHECK:
85
5.16k
    case ZEND_DEFINED:
86
5.68k
    case ZEND_ADD:
87
5.93k
    case ZEND_SUB:
88
6.37k
    case ZEND_MUL:
89
6.38k
    case ZEND_POW:
90
6.45k
    case ZEND_BW_OR:
91
6.95k
    case ZEND_BW_AND:
92
7.15k
    case ZEND_BW_XOR:
93
8.53k
    case ZEND_CONCAT:
94
8.61k
    case ZEND_FAST_CONCAT:
95
8.73k
    case ZEND_DIV:
96
8.96k
    case ZEND_MOD:
97
9.36k
    case ZEND_BOOL_XOR:
98
9.92k
    case ZEND_BOOL:
99
10.1k
    case ZEND_BOOL_NOT:
100
10.3k
    case ZEND_BW_NOT:
101
10.8k
    case ZEND_SL:
102
10.9k
    case ZEND_SR:
103
11.1k
    case ZEND_IS_EQUAL:
104
11.4k
    case ZEND_IS_NOT_EQUAL:
105
12.5k
    case ZEND_IS_SMALLER:
106
12.5k
    case ZEND_IS_SMALLER_OR_EQUAL:
107
12.5k
    case ZEND_CASE:
108
12.5k
    case ZEND_CASE_STRICT:
109
12.6k
    case ZEND_CAST:
110
12.6k
    case ZEND_ROPE_INIT:
111
12.6k
    case ZEND_ROPE_ADD:
112
12.6k
    case ZEND_INIT_ARRAY:
113
12.6k
    case ZEND_SPACESHIP:
114
13.2k
    case ZEND_STRLEN:
115
13.3k
    case ZEND_COUNT:
116
13.3k
    case ZEND_GET_TYPE:
117
13.3k
    case ZEND_ISSET_ISEMPTY_THIS:
118
13.3k
    case ZEND_ISSET_ISEMPTY_DIM_OBJ:
119
13.5k
    case ZEND_FETCH_DIM_IS:
120
13.5k
    case ZEND_ISSET_ISEMPTY_CV:
121
13.5k
    case ZEND_ISSET_ISEMPTY_VAR:
122
13.5k
    case ZEND_FETCH_IS:
123
13.5k
    case ZEND_IN_ARRAY:
124
13.5k
    case ZEND_FUNC_NUM_ARGS:
125
13.5k
    case ZEND_FUNC_GET_ARGS:
126
13.5k
    case ZEND_ARRAY_KEY_EXISTS:
127
14.0k
    case ZEND_COPY_TMP:
128
      /* No side effects */
129
14.0k
      return false;
130
12.1k
    case ZEND_FREE:
131
12.1k
      /* Only a FREE flagged as a void cast is treated as a side effect. */
      return opline->extended_value == ZEND_FREE_VOID_CAST;
132
42
    case ZEND_ADD_ARRAY_ELEMENT:
133
      /* TODO: We can't free two vars. Keep instruction alive. <?php [0, "$a" => "$b"]; */
134
42
      if ((opline->op1_type & (IS_VAR|IS_TMP_VAR)) && (opline->op2_type & (IS_VAR|IS_TMP_VAR))) {
135
0
        return true;
136
0
      }
137
42
      return false;
138
125
    case ZEND_ROPE_END:
139
      /* TODO: Rope dce optimization, see #76446 */
140
125
      return true;
141
7.36k
    case ZEND_JMP:
142
10.8k
    case ZEND_JMPZ:
143
15.3k
    case ZEND_JMPNZ:
144
15.7k
    case ZEND_JMPZ_EX:
145
16.0k
    case ZEND_JMPNZ_EX:
146
16.3k
    case ZEND_JMP_SET:
147
16.5k
    case ZEND_COALESCE:
148
17.0k
    case ZEND_ASSERT_CHECK:
149
18.9k
    case ZEND_JMP_NULL:
150
19.0k
    case ZEND_BIND_INIT_STATIC_OR_JMP:
151
19.0k
    case ZEND_JMP_FRAMELESS:
152
      /* For our purposes, jumps and branches are side effects. */
153
19.0k
      return true;
154
0
    case ZEND_BEGIN_SILENCE:
155
69.7k
    case ZEND_END_SILENCE:
156
89.0k
    case ZEND_ECHO:
157
89.0k
    case ZEND_INCLUDE_OR_EVAL:
158
89.9k
    case ZEND_THROW:
159
90.0k
    case ZEND_MATCH_ERROR:
160
90.0k
    case ZEND_EXT_STMT:
161
90.0k
    case ZEND_EXT_FCALL_BEGIN:
162
90.0k
    case ZEND_EXT_FCALL_END:
163
90.1k
    case ZEND_TICKS:
164
90.8k
    case ZEND_YIELD:
165
90.8k
    case ZEND_YIELD_FROM:
166
90.8k
    case ZEND_VERIFY_NEVER_TYPE:
167
      /* Intrinsic side effects */
168
90.8k
      return true;
169
47.0k
    case ZEND_DO_FCALL:
170
47.1k
    case ZEND_DO_FCALL_BY_NAME:
171
47.1k
    case ZEND_DO_ICALL:
172
49.9k
    case ZEND_DO_UCALL:
173
49.9k
    case ZEND_FRAMELESS_ICALL_0:
174
49.9k
    case ZEND_FRAMELESS_ICALL_1:
175
49.9k
    case ZEND_FRAMELESS_ICALL_2:
176
49.9k
    case ZEND_FRAMELESS_ICALL_3:
177
      /* For now assume all calls have side effects */
178
49.9k
      return true;
179
3.98k
    case ZEND_RECV:
180
4.57k
    case ZEND_RECV_INIT:
181
      /* Even though RECV_INIT can be side-effect free, these cannot be simply dropped
182
       * due to the prologue skipping code. */
183
4.57k
      return true;
184
451
    case ZEND_ASSIGN_REF:
185
451
      return true;
186
9.79k
    case ZEND_ASSIGN:
187
9.79k
    {
188
9.79k
      if (is_bad_mod(ssa, ssa_op->op1_use, ssa_op->op1_def)) {
189
4.55k
        return true;
190
4.55k
      }
191
5.24k
      if (!reorder_dtor_effects) {
192
5.24k
        /* Keep the assignment if the assigned value is not a constant, may have a
         * destructor and is not known to be non-escaping. */
        if (opline->op2_type != IS_CONST
193
1.80k
          && (OP2_INFO() & MAY_HAVE_DTOR)
194
534
          && ssa->vars[ssa_op->op2_use].escape_state != ESCAPE_STATE_NO_ESCAPE) {
195
          /* DCE might shorten lifetime */
196
446
          return true;
197
446
        }
198
5.24k
      }
199
4.79k
      return false;
200
5.24k
    }
201
63
    case ZEND_UNSET_VAR:
202
63
      return true;
203
636
    case ZEND_UNSET_CV:
204
636
    {
205
636
      uint32_t t1 = OP1_INFO();
206
636
      if (t1 & MAY_BE_REF) {
207
        /* We don't consider uses as the LHS of an assignment as real uses during DCE, so
208
         * an unset may be considered dead even if there is a later assignment to the
209
         * variable. Removing the unset in this case would not be correct if the variable
210
         * is a reference, because unset breaks references. */
211
596
        return true;
212
596
      }
213
40
      return false;
214
636
    }
215
1.88k
    case ZEND_PRE_INC:
216
2.05k
    case ZEND_POST_INC:
217
2.12k
    case ZEND_PRE_DEC:
218
2.23k
    case ZEND_POST_DEC:
219
2.23k
      return is_bad_mod(ssa, ssa_op->op1_use, ssa_op->op1_def);
220
540
    case ZEND_ASSIGN_OP:
221
540
      /* op1_def is only used as an index when is_bad_mod() returned false, i.e. when it
       * is non-negative. */
      return is_bad_mod(ssa, ssa_op->op1_use, ssa_op->op1_def)
222
370
        || ssa->vars[ssa_op->op1_def].escape_state != ESCAPE_STATE_NO_ESCAPE;
223
1.68k
    case ZEND_ASSIGN_DIM:
224
4.25k
    case ZEND_ASSIGN_OBJ:
225
4.25k
      if (is_bad_mod(ssa, ssa_op->op1_use, ssa_op->op1_def)
226
3.99k
        || ssa->vars[ssa_op->op1_def].escape_state != ESCAPE_STATE_NO_ESCAPE) {
227
3.99k
        return true;
228
3.99k
      }
229
265
      if (!reorder_dtor_effects) {
230
265
        /* Step to the following instruction -- presumably the ZEND_OP_DATA carrying the
         * assigned value (TODO confirm). The operand check below applies to it. */
        opline++;
231
265
        ssa_op++;
232
265
        if (opline->op1_type != IS_CONST
233
186
          && (OP1_INFO() & MAY_HAVE_DTOR)) {
234
          /* DCE might shorten lifetime */
235
51
          return true;
236
51
        }
237
265
      }
238
214
      return false;
239
72
    case ZEND_PRE_INC_OBJ:
240
90
    case ZEND_PRE_DEC_OBJ:
241
94
    case ZEND_POST_INC_OBJ:
242
94
    case ZEND_POST_DEC_OBJ:
243
94
      if (is_bad_mod(ssa, ssa_op->op1_use, ssa_op->op1_def)
244
94
        || ssa->vars[ssa_op->op1_def].escape_state != ESCAPE_STATE_NO_ESCAPE) {
245
94
        return true;
246
94
      }
247
0
      return false;
248
239
    case ZEND_BIND_STATIC:
249
239
      if (op_array->static_variables) {
250
        /* Implicit and Explicit bind static is effectively prologue of closure so
251
           report it has side effects like RECV, RECV_INIT; This allows us to
252
           reflect on the closure and discover used variable at runtime */
253
239
        if ((opline->extended_value & (ZEND_BIND_IMPLICIT|ZEND_BIND_EXPLICIT))) {
254
111
          return true;
255
111
        }
256
        /* Modifies static variables which are observable through reflection */
257
128
        if ((opline->extended_value & ZEND_BIND_REF) && opline->op2_type != IS_UNUSED) {
258
88
          return true;
259
88
        }
260
128
      }
261
40
      return false;
262
36
    case ZEND_CHECK_VAR:
263
36
      /* Only has an effect if the variable may be undefined. */
      return (OP1_INFO() & MAY_BE_UNDEF) != 0;
264
2
    case ZEND_FE_RESET_R:
265
2
    case ZEND_FE_RESET_RW:
266
      /* Model as not having side-effects -- let the side-effect be introduced by
267
       * FE_FETCH if the array is not known to be non-empty. */
268
2
      return (OP1_INFO() & MAY_BE_ANY) != MAY_BE_ARRAY;
269
175k
    default:
270
      /* For everything we didn't handle, assume a side-effect */
271
175k
      return true;
272
384k
  }
273
384k
}
274
275
773k
/* Queues the definition of SSA variable var_num for liveness processing. If the variable
 * is defined by an instruction, that instruction is added to instr_worklist; otherwise,
 * if it is defined by a phi, the variable is added to phi_worklist. Variables without
 * either kind of definition are ignored.
 *
 * check: when non-zero, the definition is only queued while it is still marked dead. */
static zend_always_inline void add_to_worklists(const context *ctx, int var_num, int check) {
276
773k
  const zend_ssa_var *var = &ctx->ssa->vars[var_num];
277
773k
  if (var->definition >= 0) {
278
581k
    if (!check || zend_bitset_in(ctx->instr_dead, var->definition)) {
279
538k
      zend_bitset_incl(ctx->instr_worklist, var->definition);
280
538k
    }
281
581k
  } else if (var->definition_phi) {
282
140k
    if (!check || zend_bitset_in(ctx->phi_dead, var_num)) {
283
90.1k
      zend_bitset_incl(ctx->phi_worklist, var_num);
284
90.1k
    }
285
140k
  }
286
773k
}
287
288
20.1k
/* Records a "no-val" use of SSA variable var_num: if the variable is defined by a phi
 * that is still marked dead, it is added to phi_worklist_no_val. Variables that are not
 * phi-defined, or whose phi is already live, are ignored. */
static inline void add_to_phi_worklist_no_val(const context *ctx, int var_num) {
289
20.1k
  const zend_ssa_var *var = &ctx->ssa->vars[var_num];
290
20.1k
  if (var->definition_phi && zend_bitset_in(ctx->phi_dead, var_num)) {
291
3.07k
    zend_bitset_incl(ctx->phi_worklist_no_val, var_num);
292
3.07k
  }
293
20.1k
}
294
295
860k
/* Queues the definitions of every SSA variable used by opline (result_use, op1_use and
 * op2_use, each only if present). An op1/op2 use that zend_ssa_is_no_val_use() classifies
 * as "no-val" is recorded on phi_worklist_no_val instead of the regular worklists, with
 * two exceptions that are treated as regular uses: op1 of ZEND_ASSIGN and op2 of
 * ZEND_FE_FETCH_R when the used variable may be a reference.
 *
 * check: forwarded to add_to_worklists(). */
static zend_always_inline void add_operands_to_worklists(const context *ctx, const zend_op *opline, const zend_ssa_op *ssa_op, const zend_ssa *ssa, int check) {
296
860k
  if (ssa_op->result_use >= 0) {
297
9.27k
    add_to_worklists(ctx, ssa_op->result_use, check);
298
9.27k
  }
299
860k
  if (ssa_op->op1_use >= 0) {
300
489k
    if (!zend_ssa_is_no_val_use(opline, ssa_op, ssa_op->op1_use)
301
33.9k
     || (opline->opcode == ZEND_ASSIGN
302
475k
      && (ssa->var_info[ssa_op->op1_use].type & MAY_BE_REF) != 0)) {
303
475k
      add_to_worklists(ctx, ssa_op->op1_use, check);
304
475k
    } else {
305
14.1k
      add_to_phi_worklist_no_val(ctx, ssa_op->op1_use);
306
14.1k
    }
307
489k
  }
308
860k
  if (ssa_op->op2_use >= 0) {
309
150k
    if (!zend_ssa_is_no_val_use(opline, ssa_op, ssa_op->op2_use)
310
1.78k
     || (opline->opcode == ZEND_FE_FETCH_R
311
149k
      && (ssa->var_info[ssa_op->op2_use].type & MAY_BE_REF) != 0)) {
312
149k
      add_to_worklists(ctx, ssa_op->op2_use, check);
313
149k
    } else {
314
908
      add_to_phi_worklist_no_val(ctx, ssa_op->op2_use);
315
908
    }
316
150k
  }
317
860k
}
318
319
78.7k
/* Queues the definition of every source operand of phi via add_to_worklists().
 *
 * check: forwarded to add_to_worklists(). */
static zend_always_inline void add_phi_sources_to_worklists(const context *ctx, zend_ssa_phi *phi, int check) {
320
78.7k
  /* Not referenced directly below; presumably required by the FOREACH_PHI_SOURCE macro
   * (TODO confirm). */
  const zend_ssa *ssa = ctx->ssa;
321
78.7k
  int source;
322
356k
  FOREACH_PHI_SOURCE(phi, source) {
323
356k
    add_to_worklists(ctx, source, check);
324
356k
  } FOREACH_PHI_SOURCE_END();
325
78.7k
}
326
327
10.2k
/* Returns whether SSA variable var_num is currently considered dead. For a phi-defined
 * variable this is its phi_dead bit; for an instruction-defined variable it is the
 * instr_dead bit of the defining instruction; a variable without a definition is dead
 * unless its number is below op_array->last_var. */
static inline bool is_var_dead(const context *ctx, int var_num) {
328
10.2k
  const zend_ssa_var *var = &ctx->ssa->vars[var_num];
329
10.2k
  if (var->definition_phi) {
330
586
    return zend_bitset_in(ctx->phi_dead, var_num);
331
9.68k
  } else if (var->definition >= 0) {
332
5.39k
    return zend_bitset_in(ctx->instr_dead, var->definition);
333
5.39k
  } else {
334
    /* Variable has no definition, so either the definition has already been removed (var is
335
     * dead) or this is one of the implicit variables at the start of the function (for our
336
     * purposes live) */
337
4.29k
    return var_num >= ctx->op_array->last_var;
338
4.29k
  }
339
10.2k
}
340
341
// Sometimes we can mark the var as EXT_UNUSED
342
4.49k
/* Tries to stop the instruction that defines free_var from producing a result, so that
 * no FREE is needed once the consuming instruction `opline` is removed.
 *
 * This only succeeds when use_chain is negative, free_var is the result of its defining
 * instruction, it has no phi uses, the head of its use chain is opline, and the defining
 * opcode is one of those listed in the switch. On success the defining instruction's
 * result is set to IS_UNUSED and the SSA definition links are cleared.
 *
 * free_var:  SSA variable consumed by opline.
 * use_chain: the use-chain link the caller stored for this operand (presumably the next
 *            use after opline -- TODO confirm); a non-negative value aborts.
 * Returns true if the definition was removed, false otherwise. */
static bool try_remove_var_def(const context *ctx, int free_var, int use_chain, const zend_op *opline) {
343
4.49k
  if (use_chain >= 0) {
344
568
    return false;
345
568
  }
346
3.93k
  zend_ssa_var *var = &ctx->ssa->vars[free_var];
347
3.93k
  int def = var->definition;
348
349
3.93k
  if (def >= 0) {
350
3.81k
    zend_ssa_op *def_op = &ctx->ssa->ops[def];
351
352
3.81k
    if (def_op->result_def == free_var
353
3.81k
        && var->phi_use_chain == NULL
354
3.81k
        && var->use_chain == (opline - ctx->op_array->opcodes)) {
355
3.72k
      zend_op *def_opline = &ctx->op_array->opcodes[def];
356
357
3.72k
      switch (def_opline->opcode) {
358
75
        case ZEND_ASSIGN:
359
75
        case ZEND_ASSIGN_REF:
360
80
        case ZEND_ASSIGN_DIM:
361
80
        case ZEND_ASSIGN_OBJ:
362
80
        case ZEND_ASSIGN_OBJ_REF:
363
80
        case ZEND_ASSIGN_STATIC_PROP:
364
80
        case ZEND_ASSIGN_STATIC_PROP_REF:
365
116
        case ZEND_ASSIGN_OP:
366
122
        case ZEND_ASSIGN_DIM_OP:
367
122
        case ZEND_ASSIGN_OBJ_OP:
368
122
        case ZEND_ASSIGN_STATIC_PROP_OP:
369
122
        case ZEND_PRE_INC:
370
122
        case ZEND_PRE_DEC:
371
122
        case ZEND_PRE_INC_OBJ:
372
122
        case ZEND_PRE_DEC_OBJ:
373
122
        case ZEND_DO_ICALL:
374
123
        case ZEND_DO_UCALL:
375
123
        case ZEND_DO_FCALL_BY_NAME:
376
405
        case ZEND_DO_FCALL:
377
405
        case ZEND_INCLUDE_OR_EVAL:
378
405
        case ZEND_YIELD:
379
405
        case ZEND_YIELD_FROM:
380
405
        case ZEND_ASSERT_CHECK:
381
405
          /* Drop the result operand and unlink the SSA definition in both directions. */
          def_opline->result_type = IS_UNUSED;
382
405
          def_opline->result.var = 0;
383
405
          def_op->result_def = -1;
384
405
          var->definition = -1;
385
405
          return true;
386
3.32k
        default:
387
3.32k
          break;
388
3.72k
      }
389
3.72k
    }
390
3.81k
  }
391
3.52k
  return false;
392
3.93k
}
393
394
27.0k
/* Returns whether the type mask includes string, array, object, resource or reference. */
static zend_always_inline bool may_be_refcounted(uint32_t type) {
395
27.0k
  return (type & (MAY_BE_STRING|MAY_BE_ARRAY|MAY_BE_OBJECT|MAY_BE_RESOURCE|MAY_BE_REF)) != 0;
396
27.0k
}
397
398
11.5k
/* Returns true if opline is a ZEND_FREE or ZEND_FE_FREE whose operand is still live, in
 * which case the instruction must not be removed. A ZEND_FREE whose operand has type
 * information and cannot be refcounted yields false regardless of liveness. All other
 * opcodes yield false. */
static inline bool is_free_of_live_var(const context *ctx, const zend_op *opline, const zend_ssa_op *ssa_op) {
399
11.5k
  switch (opline->opcode) {
400
4.26k
    case ZEND_FREE:
401
      /* It is always safe to remove FREEs of non-refcounted values, even if they are live. */
402
4.26k
      if ((ctx->ssa->var_info[ssa_op->op1_use].type & (MAY_BE_REF|MAY_BE_ANY|MAY_BE_UNDEF)) != 0
403
4.21k
       && !may_be_refcounted(ctx->ssa->var_info[ssa_op->op1_use].type)) {
404
3.22k
        return false;
405
3.22k
      }
406
1.04k
      ZEND_FALLTHROUGH;
407
1.51k
    case ZEND_FE_FREE:
408
1.51k
      return !is_var_dead(ctx, ssa_op->op1_use);
409
6.84k
    default:
410
6.84k
      return false;
411
11.5k
  }
412
11.5k
}
413
414
/* Returns whether the instruction has been DCEd */
415
13.2k
/* Eliminates one instruction that was marked dead.
 *
 * NOPs and FREE/FE_FREE of a still-live variable are left untouched. If the instruction
 * consumes a live VAR/TMP operand whose definition cannot be changed to "result unused"
 * and whose value may be refcounted, the instruction is rewritten into a ZEND_FREE of
 * that operand instead of being removed. If both operands would need such a FREE, the
 * instruction is marked live again and kept.
 *
 * Returns true only if the instruction was removed outright; false if it was kept or
 * replaced by a ZEND_FREE. */
static bool dce_instr(const context *ctx, zend_op *opline, zend_ssa_op *ssa_op) {
416
13.2k
  const zend_ssa *ssa = ctx->ssa;
417
13.2k
  /* SSA variable that has to be freed in place of the removed instruction, or -1. */
  int free_var = -1;
418
13.2k
  /* Operand type of free_var; only assigned and read when free_var >= 0. */
  uint8_t free_var_type;
419
420
13.2k
  if (opline->opcode == ZEND_NOP) {
421
1.64k
    return false;
422
1.64k
  }
423
424
  /* We mark FREEs as dead, but they're only really dead if the destroyed var is dead */
425
11.5k
  if (is_free_of_live_var(ctx, opline, ssa_op)) {
426
1.10k
    return false;
427
1.10k
  }
428
429
10.4k
  if ((opline->op1_type & (IS_VAR|IS_TMP_VAR)) && !is_var_dead(ctx, ssa_op->op1_use)) {
430
3.43k
    if (!try_remove_var_def(ctx, ssa_op->op1_use, ssa_op->op1_use_chain, opline)) {
431
3.40k
      if (may_be_refcounted(ssa->var_info[ssa_op->op1_use].type)
432
822
          && opline->opcode != ZEND_CASE
433
822
          && opline->opcode != ZEND_CASE_STRICT
434
822
          && opline->opcode != ZEND_COPY_TMP) {
435
254
        free_var = ssa_op->op1_use;
436
254
        free_var_type = opline->op1_type;
437
254
      }
438
3.40k
    }
439
3.43k
  }
440
10.4k
  if ((opline->op2_type & (IS_VAR|IS_TMP_VAR)) && !is_var_dead(ctx, ssa_op->op2_use)) {
441
1.06k
    if (!try_remove_var_def(ctx, ssa_op->op2_use, ssa_op->op2_use_chain, opline)) {
442
693
      if (may_be_refcounted(ssa->var_info[ssa_op->op2_use].type)) {
443
326
        if (free_var >= 0) {
444
          // TODO: We can't free two vars. Keep instruction alive.
445
158
          zend_bitset_excl(ctx->instr_dead, opline - ctx->op_array->opcodes);
446
158
          return false;
447
158
        }
448
168
        free_var = ssa_op->op2_use;
449
168
        free_var_type = opline->op2_type;
450
168
      }
451
693
    }
452
1.06k
  }
453
454
10.3k
  zend_ssa_rename_defs_of_instr(ctx->ssa, ssa_op);
455
10.3k
  zend_ssa_remove_instr(ctx->ssa, opline, ssa_op);
456
457
10.3k
  if (free_var >= 0) {
458
264
    /* Reuse the instruction slot as a FREE of the live operand and put this instruction
     * at the head of that variable's use chain. */
    opline->opcode = ZEND_FREE;
459
264
    opline->op1.var = EX_NUM_TO_VAR(ssa->vars[free_var].var);
460
264
    opline->op1_type = free_var_type;
461
462
264
    ssa_op->op1_use = free_var;
463
264
    ssa_op->op1_use_chain = ssa->vars[free_var].use_chain;
464
264
    ssa->vars[free_var].use_chain = ssa_op - ssa->ops;
465
264
    return false;
466
264
  }
467
10.0k
  return true;
468
10.3k
}
469
470
45.9k
/* Returns the single SSA variable that all sources of phi agree on, ignoring sources
 * that are the phi's own result (phi->ssa_var). Returns -1 if two sources differ or if
 * every source is the phi itself. */
static inline int get_common_phi_source(const zend_ssa *ssa, zend_ssa_phi *phi) {
471
45.9k
  int common_source = -1;
472
45.9k
  int source;
473
230k
  FOREACH_PHI_SOURCE(phi, source) {
474
230k
    if (source == phi->ssa_var) {
475
615
      continue;
476
615
    }
477
91.8k
    if (common_source == -1) {
478
45.9k
      common_source = source;
479
45.9k
    } else if (common_source != source) {
480
45.6k
      return -1;
481
45.6k
    }
482
91.8k
  } FOREACH_PHI_SOURCE_END();
483
484
  /* If all sources are phi->ssa_var this phi must be in an unreachable cycle.
485
   * We can't easily drop the phi in that case, as we don't have something to replace it with.
486
   * Ideally SCCP would eliminate the whole cycle. */
487
393
  return common_source;
488
45.9k
}
489
490
66.5k
/* Removes phi if it is trivial. For a regular phi (phi->pi < 0) whose sources all
 * resolve to one common variable, every use of the phi's result is renamed to that
 * variable and the phi is removed. Pi nodes are currently left untouched; the code that
 * would handle them is commented out. */
static void try_remove_trivial_phi(const context *ctx, zend_ssa_phi *phi) {
491
66.5k
  zend_ssa *ssa = ctx->ssa;
492
66.5k
  if (phi->pi < 0) {
493
    /* Phi assignment with identical source operands */
494
45.9k
    int common_source = get_common_phi_source(ssa, phi);
495
45.9k
    if (common_source >= 0) {
496
393
      zend_ssa_rename_var_uses(ssa, phi->ssa_var, common_source, 1);
497
393
      zend_ssa_remove_phi(ssa, phi);
498
393
    }
499
45.9k
  } else {
500
    /* Pi assignment that is only used in Phi/Pi assignments */
501
    // TODO What if we want to rerun type inference after DCE? Maybe separate this?
502
    /*ZEND_ASSERT(phi->sources[0] != -1);
503
    if (ssa->vars[phi->ssa_var].use_chain < 0) {
504
      zend_ssa_rename_var_uses_keep_types(ssa, phi->ssa_var, phi->sources[0], 1);
505
      zend_ssa_remove_phi(ssa, phi);
506
    }*/
507
20.5k
  }
508
66.5k
}
509
510
0
/* Returns true if the instruction defines (through op1_def, op2_def or result_def) an
 * SSA variable whose underlying variable number is below op_array->num_args. The caller
 * only consults this for functions flagged ZEND_FUNC_VARARG. */
static inline bool may_break_varargs(const zend_op_array *op_array, const zend_ssa *ssa, const zend_ssa_op *ssa_op) {
511
0
  if (ssa_op->op1_def >= 0
512
0
      && ssa->vars[ssa_op->op1_def].var < op_array->num_args) {
513
0
    return true;
514
0
  }
515
0
  if (ssa_op->op2_def >= 0
516
0
      && ssa->vars[ssa_op->op2_def].var < op_array->num_args) {
517
0
    return true;
518
0
  }
519
0
  if (ssa_op->result_def >= 0
520
0
      && ssa->vars[ssa_op->result_def].var < op_array->num_args) {
521
0
    return true;
522
0
  }
523
0
  return false;
524
0
}
525
526
14.9k
/* Returns true for ZEND_ADD_ARRAY_ELEMENT with an unused op2. The caller uses this to
 * disregard a positive zend_may_throw() answer for such an instruction, so that it can
 * still be considered for elimination. */
static inline bool may_throw_dce_exception(const zend_op *opline) {
527
14.9k
  return opline->opcode == ZEND_ADD_ARRAY_ELEMENT && opline->op2_type == IS_UNUSED;
528
14.9k
}
529
530
38.3k
/* Runs dead code elimination on op_array using its SSA form.
 *
 * Steps:
 *  1. Allocate the worklists and "dead" bitsets from the optimizer arena.
 *  2. Keep non-CV phis whose value may be refcounted and queue their sources.
 *  3. Walk all reachable blocks backwards and classify each instruction as live (it has
 *     side effects, may throw, or may affect varargs) or dead.
 *  4. Propagate liveness to the definitions of all used operands.
 *  5. Eliminate the instructions that are still marked dead.
 *  6. Keep phis whose result has a "no-val" use, then remove dead and trivial phis.
 *
 * op_array:             function to optimize; its opcodes are modified in place.
 * optimizer_ctx:        provides the arena for temporary bitsets; the arena is restored
 *                       to its checkpoint before returning.
 * ssa:                  SSA form of op_array; updated in place.
 * reorder_dtor_effects: forwarded to may_have_side_effects().
 * Returns the number of instructions for which dce_instr() reported full removal. */
int dce_optimize_op_array(zend_op_array *op_array, zend_optimizer_ctx *optimizer_ctx, zend_ssa *ssa, bool reorder_dtor_effects) {
531
38.3k
  int i;
532
38.3k
  zend_ssa_phi *phi;
533
38.3k
  int removed_ops = 0;
534
535
  /* DCE of CV operations that changes arguments may affect vararg functions. */
536
38.3k
  bool has_varargs = (ssa->cfg.flags & ZEND_FUNC_VARARG) != 0;
537
538
38.3k
  context ctx;
539
38.3k
  ctx.ssa = ssa;
540
38.3k
  ctx.op_array = op_array;
541
38.3k
  ctx.reorder_dtor_effects = reorder_dtor_effects;
542
543
38.3k
  void *checkpoint = zend_arena_checkpoint(optimizer_ctx->arena);
544
  /* We have no dedicated phi vector, so we use the whole ssa var vector instead */
545
38.3k
  ctx.instr_worklist_len = zend_bitset_len(op_array->last);
546
38.3k
  ctx.instr_worklist = zend_arena_calloc(&optimizer_ctx->arena, ctx.instr_worklist_len, sizeof(zend_ulong));
547
38.3k
  ctx.phi_worklist_len = zend_bitset_len(ssa->vars_count);
548
38.3k
  ctx.phi_worklist = zend_arena_calloc(&optimizer_ctx->arena, ctx.phi_worklist_len, sizeof(zend_ulong));
549
38.3k
  ctx.phi_worklist_no_val = zend_arena_calloc(&optimizer_ctx->arena, ctx.phi_worklist_len, sizeof(zend_ulong));
550
551
  /* Optimistically assume all instructions and phis to be dead */
552
38.3k
  ctx.instr_dead = zend_arena_calloc(&optimizer_ctx->arena, ctx.instr_worklist_len, sizeof(zend_ulong));
553
38.3k
  ctx.phi_dead = zend_arena_alloc(&optimizer_ctx->arena, ctx.phi_worklist_len * sizeof(zend_ulong));
554
38.3k
  memset(ctx.phi_dead, 0xff, sizeof(zend_ulong) * ctx.phi_worklist_len);
555
556
  /* Mark non-CV phis as live. Even if the result is unused, we generally cannot remove one
557
   * of the producing instructions, as it combines producing the result with control flow.
558
   * This can be made more precise if there are any cases where this is not the case. */
559
215k
  FOREACH_PHI(phi) {
560
215k
    if (phi->var >= op_array->last_var
561
18.7k
        && may_be_refcounted(ssa->var_info[phi->ssa_var].type)) {
562
15.0k
      zend_bitset_excl(ctx.phi_dead, phi->ssa_var);
563
15.0k
      add_phi_sources_to_worklists(&ctx, phi, 0);
564
15.0k
    }
565
215k
  } FOREACH_PHI_END();
566
567
  /* Mark reachable instructions without side effects as dead */
568
38.3k
  int b = ssa->cfg.blocks_count;
569
145k
  while (b > 0) {
570
106k
    /* Index of a ZEND_OP_DATA seen directly after the instruction visited next (the
     * walk is backwards), or -1 if there is none. */
    int op_data = -1;
571
572
106k
    b--;
573
106k
    const zend_basic_block *block = &ssa->cfg.blocks[b];
574
106k
    if (!(block->flags & ZEND_BB_REACHABLE)) {
575
5.20k
      continue;
576
5.20k
    }
577
101k
    i = block->start + block->len;
578
974k
    while (i > block->start) {
579
873k
      i--;
580
581
873k
      if (op_array->opcodes[i].opcode == ZEND_OP_DATA) {
582
9.53k
        op_data = i;
583
9.53k
        continue;
584
9.53k
      }
585
586
863k
      if (zend_bitset_in(ctx.instr_worklist, i)) {
587
479k
        /* Already known to be live because a later instruction or a phi uses its
         * result: just queue its operands. */
        zend_bitset_excl(ctx.instr_worklist, i);
588
479k
        add_operands_to_worklists(&ctx, &op_array->opcodes[i], &ssa->ops[i], ssa, 0);
589
479k
        if (op_data >= 0) {
590
4.14k
          add_operands_to_worklists(&ctx, &op_array->opcodes[op_data], &ssa->ops[op_data], ssa, 0);
591
4.14k
        }
592
479k
      } else if (may_have_side_effects(op_array, ssa, &op_array->opcodes[i], &ssa->ops[i], ctx.reorder_dtor_effects)
593
32.6k
          || (zend_may_throw(&op_array->opcodes[i], &ssa->ops[i], op_array, ssa)
594
14.9k
            && !may_throw_dce_exception(&op_array->opcodes[i]))
595
366k
          || (has_varargs && may_break_varargs(op_array, ssa, &ssa->ops[i]))) {
596
366k
        /* A ZEND_NEW directly followed by ZEND_DO_FCALL whose result does not escape is
         * optimistically marked dead together with that call. */
        if (op_array->opcodes[i].opcode == ZEND_NEW
597
40
            && op_array->opcodes[i+1].opcode == ZEND_DO_FCALL
598
40
            && ssa->ops[i].result_def >= 0
599
40
            && ssa->vars[ssa->ops[i].result_def].escape_state == ESCAPE_STATE_NO_ESCAPE) {
600
38
          zend_bitset_incl(ctx.instr_dead, i);
601
38
          zend_bitset_incl(ctx.instr_dead, i+1);
602
366k
        } else {
603
366k
          add_operands_to_worklists(&ctx, &op_array->opcodes[i], &ssa->ops[i], ssa, 0);
604
366k
          if (op_data >= 0) {
605
5.35k
            add_operands_to_worklists(&ctx, &op_array->opcodes[op_data], &ssa->ops[op_data], ssa, 0);
606
5.35k
          }
607
366k
        }
608
366k
      } else {
609
17.7k
        zend_bitset_incl(ctx.instr_dead, i);
610
17.7k
        if (op_data >= 0) {
611
37
          zend_bitset_incl(ctx.instr_dead, op_data);
612
37
        }
613
17.7k
      }
614
863k
      op_data = -1;
615
863k
    }
616
101k
  }
617
618
  /* Propagate liveness backwards to all definitions of used vars */
619
45.1k
  while (!zend_bitset_empty(ctx.instr_worklist, ctx.instr_worklist_len)
620
43.8k
      || !zend_bitset_empty(ctx.phi_worklist, ctx.phi_worklist_len)) {
621
11.3k
    while ((i = zend_bitset_pop_first(ctx.instr_worklist, ctx.instr_worklist_len)) >= 0) {
622
4.61k
      zend_bitset_excl(ctx.instr_dead, i);
623
4.61k
      add_operands_to_worklists(&ctx, &op_array->opcodes[i], &ssa->ops[i], ssa, 1);
624
4.61k
      /* Only look at the following instruction if there is one: i itself is always a
       * valid index here, so the bound has to be checked for i + 1. */
      if ((uint32_t)i + 1 < op_array->last
625
4.61k
       && (op_array->opcodes[i+1].opcode == ZEND_OP_DATA
626
4.58k
        || (op_array->opcodes[i].opcode == ZEND_NEW
627
32
         && op_array->opcodes[i+1].opcode == ZEND_DO_FCALL))) {
628
32
        zend_bitset_excl(ctx.instr_dead, i+1);
629
32
        add_operands_to_worklists(&ctx, &op_array->opcodes[i+1], &ssa->ops[i+1], ssa, 1);
630
32
      }
631
4.61k
    }
632
70.4k
    while ((i = zend_bitset_pop_first(ctx.phi_worklist, ctx.phi_worklist_len)) >= 0) {
633
63.6k
      zend_bitset_excl(ctx.phi_dead, i);
634
63.6k
      zend_bitset_excl(ctx.phi_worklist_no_val, i);
635
63.6k
      add_phi_sources_to_worklists(&ctx, ssa->vars[i].definition_phi, 1);
636
63.6k
    }
637
6.76k
  }
638
639
  /* Eliminate dead instructions */
640
178k
  ZEND_BITSET_FOREACH(ctx.instr_dead, ctx.instr_worklist_len, i) {
641
13.2k
    removed_ops += dce_instr(&ctx, &op_array->opcodes[i], &ssa->ops[i]);
642
13.2k
  } ZEND_BITSET_FOREACH_END();
643
644
  /* Improper uses don't count as "uses" for the purpose of instruction elimination,
645
   * but we have to retain phis defining them.
646
   * Propagate this information backwards, marking any phi with an improperly used
647
   * target as non-dead. */
648
40.9k
  while ((i = zend_bitset_pop_first(ctx.phi_worklist_no_val, ctx.phi_worklist_len)) >= 0) {
649
2.61k
    zend_ssa_phi *phi = ssa->vars[i].definition_phi;
650
2.61k
    int source;
651
2.61k
    zend_bitset_excl(ctx.phi_dead, i);
652
12.7k
    FOREACH_PHI_SOURCE(phi, source) {
653
12.7k
      add_to_phi_worklist_no_val(&ctx, source);
654
12.7k
    } FOREACH_PHI_SOURCE_END();
655
2.61k
  }
656
657
  /* Now collect the actually dead phis */
658
215k
  FOREACH_PHI(phi) {
659
215k
    if (zend_bitset_in(ctx.phi_dead, phi->ssa_var)) {
660
3.53k
      zend_ssa_remove_uses_of_var(ssa, phi->ssa_var);
661
3.53k
      zend_ssa_remove_phi(ssa, phi);
662
66.5k
    } else {
663
      /* Remove trivial phis (phis with identical source operands) */
664
66.5k
      try_remove_trivial_phi(&ctx, phi);
665
66.5k
    }
666
215k
  } FOREACH_PHI_END();
667
668
38.3k
  zend_arena_release(&optimizer_ctx->arena, checkpoint);
669
670
38.3k
  return removed_ops;
671
38.3k
}