Coverage Report

Created: 2025-10-13 06:15

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/cpython3/Python/assemble.c
Line
Count
Source
1
#include "Python.h"
2
#include "pycore_code.h"            // write_location_entry_start()
3
#include "pycore_compile.h"
4
#include "pycore_instruction_sequence.h"
5
#include "pycore_opcode_utils.h"    // IS_BACKWARDS_JUMP_OPCODE
6
#include "pycore_opcode_metadata.h" // is_pseudo_target, _PyOpcode_Caches
7
#include "pycore_symtable.h"        // _Py_SourceLocation
8
9
#include <stdbool.h>
10
11
37.2k
#define DEFAULT_CODE_SIZE 128
12
37.2k
#define DEFAULT_LNOTAB_SIZE 16
13
37.2k
#define DEFAULT_CNOTAB_SIZE 32
14
15
#undef SUCCESS
16
#undef ERROR
17
5.15M
#define SUCCESS 0
18
37.2k
#define ERROR -1
19
20
#define RETURN_IF_ERROR(X)  \
21
5.39M
    if ((X) < 0) {          \
22
0
        return ERROR;       \
23
0
    }
24
25
typedef _Py_SourceLocation location;
26
typedef _PyInstruction instruction;
27
typedef _PyInstructionSequence instr_sequence;
28
29
static inline bool
30
same_location(location a, location b)
31
6.10M
{
32
6.10M
    return a.lineno == b.lineno &&
33
2.85M
           a.end_lineno == b.end_lineno &&
34
2.84M
           a.col_offset == b.col_offset &&
35
1.58M
           a.end_col_offset == b.end_col_offset;
36
6.10M
}
37
38
static int
39
instr_size(instruction *instr)
40
20.1M
{
41
20.1M
    int opcode = instr->i_opcode;
42
20.1M
    int oparg = instr->i_oparg;
43
20.1M
    assert(!IS_PSEUDO_INSTR(opcode));
44
20.1M
    assert(OPCODE_HAS_ARG(opcode) || oparg == 0);
45
20.1M
    int extended_args = (0xFFFFFF < oparg) + (0xFFFF < oparg) + (0xFF < oparg);
46
20.1M
    int caches = _PyOpcode_Caches[opcode];
47
20.1M
    return extended_args + 1 + caches;
48
20.1M
}
49
50
struct assembler {
51
    PyObject *a_bytecode;  /* bytes containing bytecode */
52
    int a_offset;              /* offset into bytecode */
53
    PyObject *a_except_table;  /* bytes containing exception table */
54
    int a_except_table_off;    /* offset into exception table */
55
    /* Location Info */
56
    int a_lineno;          /* lineno of last emitted instruction */
57
    PyObject* a_linetable; /* bytes containing location info */
58
    int a_location_off;    /* offset of last written location info frame */
59
};
60
61
static int
62
assemble_init(struct assembler *a, int firstlineno)
63
37.2k
{
64
37.2k
    memset(a, 0, sizeof(struct assembler));
65
37.2k
    a->a_lineno = firstlineno;
66
37.2k
    a->a_linetable = NULL;
67
37.2k
    a->a_location_off = 0;
68
37.2k
    a->a_except_table = NULL;
69
37.2k
    a->a_bytecode = PyBytes_FromStringAndSize(NULL, DEFAULT_CODE_SIZE);
70
37.2k
    if (a->a_bytecode == NULL) {
71
0
        goto error;
72
0
    }
73
37.2k
    a->a_linetable = PyBytes_FromStringAndSize(NULL, DEFAULT_CNOTAB_SIZE);
74
37.2k
    if (a->a_linetable == NULL) {
75
0
        goto error;
76
0
    }
77
37.2k
    a->a_except_table = PyBytes_FromStringAndSize(NULL, DEFAULT_LNOTAB_SIZE);
78
37.2k
    if (a->a_except_table == NULL) {
79
0
        goto error;
80
0
    }
81
37.2k
    return SUCCESS;
82
0
error:
83
0
    Py_XDECREF(a->a_bytecode);
84
0
    Py_XDECREF(a->a_linetable);
85
0
    Py_XDECREF(a->a_except_table);
86
0
    return ERROR;
87
37.2k
}
88
89
static void
90
assemble_free(struct assembler *a)
91
37.2k
{
92
37.2k
    Py_XDECREF(a->a_bytecode);
93
37.2k
    Py_XDECREF(a->a_linetable);
94
37.2k
    Py_XDECREF(a->a_except_table);
95
37.2k
}
96
97
static inline void
98
464k
write_except_byte(struct assembler *a, int byte) {
99
464k
    unsigned char *p = (unsigned char *) PyBytes_AS_STRING(a->a_except_table);
100
464k
    p[a->a_except_table_off++] = byte;
101
464k
}
102
103
182k
#define CONTINUATION_BIT 64
104
105
static void
106
assemble_emit_exception_table_item(struct assembler *a, int value, int msb)
107
281k
{
108
281k
    assert ((msb | 128) == 128);
109
281k
    assert(value >= 0 && value < (1 << 30));
110
281k
    if (value >= 1 << 24) {
111
0
        write_except_byte(a, (value >> 24) | CONTINUATION_BIT | msb);
112
0
        msb = 0;
113
0
    }
114
281k
    if (value >= 1 << 18) {
115
0
        write_except_byte(a, ((value >> 18)&0x3f) | CONTINUATION_BIT | msb);
116
0
        msb = 0;
117
0
    }
118
281k
    if (value >= 1 << 12) {
119
49.3k
        write_except_byte(a, ((value >> 12)&0x3f) | CONTINUATION_BIT | msb);
120
49.3k
        msb = 0;
121
49.3k
    }
122
281k
    if (value >= 1 << 6) {
123
132k
        write_except_byte(a, ((value >> 6)&0x3f) | CONTINUATION_BIT | msb);
124
132k
        msb = 0;
125
132k
    }
126
281k
    write_except_byte(a, (value&0x3f) | msb);
127
281k
}
128
129
/* See InternalDocs/exception_handling.md for details of layout */
130
70.4k
#define MAX_SIZE_OF_ENTRY 20
131
132
static int
133
assemble_emit_exception_table_entry(struct assembler *a, int start, int end,
134
                                    int handler_offset,
135
                                    _PyExceptHandlerInfo *handler)
136
70.4k
{
137
70.4k
    Py_ssize_t len = PyBytes_GET_SIZE(a->a_except_table);
138
70.4k
    if (a->a_except_table_off + MAX_SIZE_OF_ENTRY >= len) {
139
6.68k
        RETURN_IF_ERROR(_PyBytes_Resize(&a->a_except_table, len * 2));
140
6.68k
    }
141
70.4k
    int size = end-start;
142
70.4k
    assert(end > start);
143
70.4k
    int target = handler_offset;
144
70.4k
    int depth = handler->h_startdepth - 1;
145
70.4k
    if (handler->h_preserve_lasti > 0) {
146
53.0k
        depth -= 1;
147
53.0k
    }
148
70.4k
    assert(depth >= 0);
149
70.4k
    int depth_lasti = (depth<<1) | handler->h_preserve_lasti;
150
70.4k
    assemble_emit_exception_table_item(a, start, (1<<7));
151
70.4k
    assemble_emit_exception_table_item(a, size, 0);
152
70.4k
    assemble_emit_exception_table_item(a, target, 0);
153
70.4k
    assemble_emit_exception_table_item(a, depth_lasti, 0);
154
70.4k
    return SUCCESS;
155
70.4k
}
156
157
static int
158
assemble_exception_table(struct assembler *a, instr_sequence *instrs)
159
37.2k
{
160
37.2k
    int ioffset = 0;
161
37.2k
    _PyExceptHandlerInfo handler;
162
37.2k
    handler.h_label = -1;
163
37.2k
    handler.h_startdepth = -1;
164
37.2k
    handler.h_preserve_lasti = -1;
165
37.2k
    int start = -1;
166
3.09M
    for (int i = 0; i < instrs->s_used; i++) {
167
3.05M
        instruction *instr = &instrs->s_instrs[i];
168
3.05M
        if (instr->i_except_handler_info.h_label != handler.h_label) {
169
102k
            if (handler.h_label >= 0) {
170
70.4k
                int handler_offset = instrs->s_instrs[handler.h_label].i_offset;
171
70.4k
                RETURN_IF_ERROR(
172
70.4k
                    assemble_emit_exception_table_entry(a, start, ioffset,
173
70.4k
                                                        handler_offset,
174
70.4k
                                                        &handler));
175
70.4k
            }
176
102k
            start = ioffset;
177
102k
            handler = instr->i_except_handler_info;
178
102k
        }
179
3.05M
        ioffset += instr_size(instr);
180
3.05M
    }
181
37.2k
    if (handler.h_label >= 0) {
182
0
        int handler_offset = instrs->s_instrs[handler.h_label].i_offset;
183
0
        RETURN_IF_ERROR(assemble_emit_exception_table_entry(a, start, ioffset,
184
0
                                                            handler_offset,
185
0
                                                            &handler));
186
0
    }
187
37.2k
    return SUCCESS;
188
37.2k
}
189
190
191
/* Code location emitting code. See locations.md for a description of the format. */
192
193
#define MSB 0x80
194
195
static void
196
write_location_byte(struct assembler* a, int val)
197
650k
{
198
650k
    PyBytes_AS_STRING(a->a_linetable)[a->a_location_off] = val&255;
199
650k
    a->a_location_off++;
200
650k
}
201
202
203
static uint8_t *
204
location_pointer(struct assembler* a)
205
6.57M
{
206
6.57M
    return (uint8_t *)PyBytes_AS_STRING(a->a_linetable) +
207
6.57M
        a->a_location_off;
208
6.57M
}
209
210
static void
211
write_location_first_byte(struct assembler* a, int code, int length)
212
1.70M
{
213
1.70M
    a->a_location_off += write_location_entry_start(
214
1.70M
        location_pointer(a), code, length);
215
1.70M
}
216
217
static void
218
write_location_varint(struct assembler* a, unsigned int val)
219
3.65M
{
220
3.65M
    uint8_t *ptr = location_pointer(a);
221
3.65M
    a->a_location_off += write_varint(ptr, val);
222
3.65M
}
223
224
225
static void
226
write_location_signed_varint(struct assembler* a, int val)
227
1.21M
{
228
1.21M
    uint8_t *ptr = location_pointer(a);
229
1.21M
    a->a_location_off += write_signed_varint(ptr, val);
230
1.21M
}
231
232
static void
233
write_location_info_short_form(struct assembler* a, int length, int column, int end_column)
234
268k
{
235
268k
    assert(length > 0 &&  length <= 8);
236
268k
    int column_low_bits = column & 7;
237
268k
    int column_group = column >> 3;
238
268k
    assert(column < 80);
239
268k
    assert(end_column >= column);
240
268k
    assert(end_column - column < 16);
241
268k
    write_location_first_byte(a, PY_CODE_LOCATION_INFO_SHORT0 + column_group, length);
242
268k
    write_location_byte(a, (column_low_bits << 4) | (end_column - column));
243
268k
}
244
245
static void
246
write_location_info_oneline_form(struct assembler* a, int length, int line_delta, int column, int end_column)
247
190k
{
248
190k
    assert(length > 0 &&  length <= 8);
249
190k
    assert(line_delta >= 0 && line_delta < 3);
250
190k
    assert(column < 128);
251
190k
    assert(end_column < 128);
252
190k
    write_location_first_byte(a, PY_CODE_LOCATION_INFO_ONE_LINE0 + line_delta, length);
253
190k
    write_location_byte(a, column);
254
190k
    write_location_byte(a, end_column);
255
190k
}
256
257
static void
258
write_location_info_long_form(struct assembler* a, location loc, int length)
259
1.21M
{
260
1.21M
    assert(length > 0 &&  length <= 8);
261
1.21M
    write_location_first_byte(a, PY_CODE_LOCATION_INFO_LONG, length);
262
1.21M
    write_location_signed_varint(a, loc.lineno - a->a_lineno);
263
1.21M
    assert(loc.end_lineno >= loc.lineno);
264
1.21M
    write_location_varint(a, loc.end_lineno - loc.lineno);
265
1.21M
    write_location_varint(a, loc.col_offset + 1);
266
1.21M
    write_location_varint(a, loc.end_col_offset + 1);
267
1.21M
}
268
269
static void
270
write_location_info_none(struct assembler* a, int length)
271
27.1k
{
272
27.1k
    write_location_first_byte(a, PY_CODE_LOCATION_INFO_NONE, length);
273
27.1k
}
274
275
static void
276
write_location_info_no_column(struct assembler* a, int length, int line_delta)
277
2.22k
{
278
2.22k
    write_location_first_byte(a, PY_CODE_LOCATION_INFO_NO_COLUMNS, length);
279
2.22k
    write_location_signed_varint(a, line_delta);
280
2.22k
}
281
282
1.70M
#define THEORETICAL_MAX_ENTRY_SIZE 25 /* 1 + 6 + 6 + 6 + 6 */
283
284
285
static int
286
write_location_info_entry(struct assembler* a, location loc, int isize)
287
1.70M
{
288
1.70M
    Py_ssize_t len = PyBytes_GET_SIZE(a->a_linetable);
289
1.70M
    if (a->a_location_off + THEORETICAL_MAX_ENTRY_SIZE >= len) {
290
41.4k
        assert(len > THEORETICAL_MAX_ENTRY_SIZE);
291
41.4k
        RETURN_IF_ERROR(_PyBytes_Resize(&a->a_linetable, len*2));
292
41.4k
    }
293
1.70M
    if (loc.lineno == NO_LOCATION.lineno) {
294
27.1k
        write_location_info_none(a, isize);
295
27.1k
        return SUCCESS;
296
27.1k
    }
297
1.67M
    int line_delta = loc.lineno - a->a_lineno;
298
1.67M
    int column = loc.col_offset;
299
1.67M
    int end_column = loc.end_col_offset;
300
1.67M
    if (column < 0 || end_column < 0) {
301
2.22k
        if (loc.end_lineno == loc.lineno || loc.end_lineno < 0) {
302
2.22k
            write_location_info_no_column(a, isize, line_delta);
303
2.22k
            a->a_lineno = loc.lineno;
304
2.22k
            return SUCCESS;
305
2.22k
        }
306
2.22k
    }
307
1.67M
    else if (loc.end_lineno == loc.lineno) {
308
1.61M
        if (line_delta == 0 && column < 80 && end_column - column < 16 && end_column >= column) {
309
268k
            write_location_info_short_form(a, isize, column, end_column);
310
268k
            return SUCCESS;
311
268k
        }
312
1.34M
        if (line_delta >= 0 && line_delta < 3 && column < 128 && end_column < 128) {
313
190k
            write_location_info_oneline_form(a, isize, line_delta, column, end_column);
314
190k
            a->a_lineno = loc.lineno;
315
190k
            return SUCCESS;
316
190k
        }
317
1.34M
    }
318
1.21M
    write_location_info_long_form(a, loc, isize);
319
1.21M
    a->a_lineno = loc.lineno;
320
1.21M
    return SUCCESS;
321
1.67M
}
322
323
static int
324
assemble_emit_location(struct assembler* a, location loc, int isize)
325
1.56M
{
326
1.56M
    if (isize == 0) {
327
26.3k
        return SUCCESS;
328
26.3k
    }
329
1.70M
    while (isize > 8) {
330
171k
        RETURN_IF_ERROR(write_location_info_entry(a, loc, 8));
331
171k
        isize -= 8;
332
171k
    }
333
1.53M
    return write_location_info_entry(a, loc, isize);
334
1.53M
}
335
336
static int
337
assemble_location_info(struct assembler *a, instr_sequence *instrs,
338
                       int firstlineno)
339
37.2k
{
340
37.2k
    a->a_lineno = firstlineno;
341
37.2k
    location loc = NO_LOCATION;
342
3.09M
    for (int i = instrs->s_used-1; i >= 0; i--) {
343
3.05M
        instruction *instr = &instrs->s_instrs[i];
344
3.05M
        if (same_location(instr->i_loc, NEXT_LOCATION)) {
345
1.33k
            if (IS_TERMINATOR_OPCODE(instr->i_opcode)) {
346
61
                instr->i_loc = NO_LOCATION;
347
61
            }
348
1.27k
            else {
349
1.27k
                assert(i < instrs->s_used-1);
350
1.27k
                instr->i_loc = instr[1].i_loc;
351
1.27k
            }
352
1.33k
        }
353
3.05M
    }
354
37.2k
    int size = 0;
355
3.09M
    for (int i = 0; i < instrs->s_used; i++) {
356
3.05M
        instruction *instr = &instrs->s_instrs[i];
357
3.05M
        if (!same_location(loc, instr->i_loc)) {
358
1.52M
                RETURN_IF_ERROR(assemble_emit_location(a, loc, size));
359
1.52M
                loc = instr->i_loc;
360
1.52M
                size = 0;
361
1.52M
        }
362
3.05M
        size += instr_size(instr);
363
3.05M
    }
364
37.2k
    RETURN_IF_ERROR(assemble_emit_location(a, loc, size));
365
37.2k
    return SUCCESS;
366
37.2k
}
367
368
static void
369
write_instr(_Py_CODEUNIT *codestr, instruction *instr, int ilen)
370
3.05M
{
371
3.05M
    int opcode = instr->i_opcode;
372
3.05M
    assert(!IS_PSEUDO_INSTR(opcode));
373
3.05M
    int oparg = instr->i_oparg;
374
3.05M
    assert(OPCODE_HAS_ARG(opcode) || oparg == 0);
375
3.05M
    int caches = _PyOpcode_Caches[opcode];
376
3.05M
    switch (ilen - caches) {
377
0
        case 4:
378
0
            codestr->op.code = EXTENDED_ARG;
379
0
            codestr->op.arg = (oparg >> 24) & 0xFF;
380
0
            codestr++;
381
0
            _Py_FALLTHROUGH;
382
15.9k
        case 3:
383
15.9k
            codestr->op.code = EXTENDED_ARG;
384
15.9k
            codestr->op.arg = (oparg >> 16) & 0xFF;
385
15.9k
            codestr++;
386
15.9k
            _Py_FALLTHROUGH;
387
117k
        case 2:
388
117k
            codestr->op.code = EXTENDED_ARG;
389
117k
            codestr->op.arg = (oparg >> 8) & 0xFF;
390
117k
            codestr++;
391
117k
            _Py_FALLTHROUGH;
392
3.05M
        case 1:
393
3.05M
            codestr->op.code = opcode;
394
3.05M
            codestr->op.arg = oparg & 0xFF;
395
3.05M
            codestr++;
396
3.05M
            break;
397
0
        default:
398
0
            Py_UNREACHABLE();
399
3.05M
    }
400
5.69M
    while (caches--) {
401
2.63M
        codestr->op.code = CACHE;
402
2.63M
        codestr->op.arg = 0;
403
2.63M
        codestr++;
404
2.63M
    }
405
3.05M
}
406
407
/* assemble_emit_instr()
408
   Extend the bytecode with a new instruction.
409
   Update lnotab if necessary.
410
*/
411
412
static int
413
assemble_emit_instr(struct assembler *a, instruction *instr)
414
3.05M
{
415
3.05M
    Py_ssize_t len = PyBytes_GET_SIZE(a->a_bytecode);
416
3.05M
    _Py_CODEUNIT *code;
417
418
3.05M
    int size = instr_size(instr);
419
3.05M
    if (a->a_offset + size >= len / (int)sizeof(_Py_CODEUNIT)) {
420
15.0k
        if (len > PY_SSIZE_T_MAX / 2) {
421
0
            return ERROR;
422
0
        }
423
15.0k
        RETURN_IF_ERROR(_PyBytes_Resize(&a->a_bytecode, len * 2));
424
15.0k
    }
425
3.05M
    code = (_Py_CODEUNIT *)PyBytes_AS_STRING(a->a_bytecode) + a->a_offset;
426
3.05M
    a->a_offset += size;
427
3.05M
    write_instr(code, instr, size);
428
3.05M
    return SUCCESS;
429
3.05M
}
430
431
static int
432
assemble_emit(struct assembler *a, instr_sequence *instrs,
433
              int first_lineno, PyObject *const_cache)
434
37.2k
{
435
37.2k
    RETURN_IF_ERROR(assemble_init(a, first_lineno));
436
437
3.09M
    for (int i = 0; i < instrs->s_used; i++) {
438
3.05M
        instruction *instr = &instrs->s_instrs[i];
439
3.05M
        RETURN_IF_ERROR(assemble_emit_instr(a, instr));
440
3.05M
    }
441
442
37.2k
    RETURN_IF_ERROR(assemble_location_info(a, instrs, a->a_lineno));
443
444
37.2k
    RETURN_IF_ERROR(assemble_exception_table(a, instrs));
445
446
37.2k
    RETURN_IF_ERROR(_PyBytes_Resize(&a->a_except_table, a->a_except_table_off));
447
37.2k
    RETURN_IF_ERROR(_PyCompile_ConstCacheMergeOne(const_cache, &a->a_except_table));
448
449
37.2k
    RETURN_IF_ERROR(_PyBytes_Resize(&a->a_linetable, a->a_location_off));
450
37.2k
    RETURN_IF_ERROR(_PyCompile_ConstCacheMergeOne(const_cache, &a->a_linetable));
451
452
37.2k
    RETURN_IF_ERROR(_PyBytes_Resize(&a->a_bytecode, a->a_offset * sizeof(_Py_CODEUNIT)));
453
37.2k
    RETURN_IF_ERROR(_PyCompile_ConstCacheMergeOne(const_cache, &a->a_bytecode));
454
37.2k
    return SUCCESS;
455
37.2k
}
456
457
static PyObject *
458
dict_keys_inorder(PyObject *dict, Py_ssize_t offset)
459
37.2k
{
460
37.2k
    PyObject *tuple, *k, *v;
461
37.2k
    Py_ssize_t pos = 0, size = PyDict_GET_SIZE(dict);
462
463
37.2k
    tuple = PyTuple_New(size);
464
37.2k
    if (tuple == NULL)
465
0
        return NULL;
466
158k
    while (PyDict_Next(dict, &pos, &k, &v)) {
467
121k
        Py_ssize_t i = PyLong_AsSsize_t(v);
468
121k
        if (i == -1 && PyErr_Occurred()) {
469
0
            Py_DECREF(tuple);
470
0
            return NULL;
471
0
        }
472
121k
        assert((i - offset) < size);
473
121k
        assert((i - offset) >= 0);
474
121k
        PyTuple_SET_ITEM(tuple, i - offset, Py_NewRef(k));
475
121k
    }
476
37.2k
    return tuple;
477
37.2k
}
478
479
// This is in codeobject.c.
480
extern void _Py_set_localsplus_info(int, PyObject *, unsigned char,
481
                                   PyObject *, PyObject *);
482
483
static int
484
compute_localsplus_info(_PyCompile_CodeUnitMetadata *umd, int nlocalsplus,
485
                        int flags, PyObject *names, PyObject *kinds)
486
37.2k
{
487
37.2k
    PyObject *k, *v;
488
37.2k
    Py_ssize_t pos = 0;
489
490
    // Set the locals kinds.  Arg vars fill the first portion of the list.
491
37.2k
    struct {
492
37.2k
        int count;
493
37.2k
        _PyLocals_Kind kind;
494
37.2k
    }  argvarkinds[6] = {
495
37.2k
        {(int)umd->u_posonlyargcount, CO_FAST_ARG_POS},
496
37.2k
        {(int)umd->u_argcount, CO_FAST_ARG_POS | CO_FAST_ARG_KW},
497
37.2k
        {(int)umd->u_kwonlyargcount, CO_FAST_ARG_KW},
498
37.2k
        {!!(flags & CO_VARARGS), CO_FAST_ARG_VAR | CO_FAST_ARG_POS},
499
37.2k
        {!!(flags & CO_VARKEYWORDS), CO_FAST_ARG_VAR | CO_FAST_ARG_KW},
500
37.2k
        {-1, 0},  // the remaining local vars
501
37.2k
    };
502
37.2k
    int max = 0;
503
260k
    for (int i = 0; i < 6; i++) {
504
223k
        max = argvarkinds[i].count < 0
505
223k
            ? INT_MAX
506
223k
            : max + argvarkinds[i].count;
507
289k
        while (pos < max && PyDict_Next(umd->u_varnames, &pos, &k, &v)) {
508
65.8k
            int offset = PyLong_AsInt(v);
509
65.8k
            if (offset == -1 && PyErr_Occurred()) {
510
0
                return ERROR;
511
0
            }
512
65.8k
            assert(offset >= 0);
513
65.8k
            assert(offset < nlocalsplus);
514
515
65.8k
            _PyLocals_Kind kind = CO_FAST_LOCAL | argvarkinds[i].kind;
516
517
65.8k
            int has_key = PyDict_Contains(umd->u_fasthidden, k);
518
65.8k
            RETURN_IF_ERROR(has_key);
519
65.8k
            if (has_key) {
520
1.86k
                kind |= CO_FAST_HIDDEN;
521
1.86k
            }
522
523
65.8k
            has_key = PyDict_Contains(umd->u_cellvars, k);
524
65.8k
            RETURN_IF_ERROR(has_key);
525
65.8k
            if (has_key) {
526
442
                kind |= CO_FAST_CELL;
527
442
            }
528
529
65.8k
            _Py_set_localsplus_info(offset, k, kind, names, kinds);
530
65.8k
        }
531
223k
    }
532
37.2k
    int nlocals = (int)PyDict_GET_SIZE(umd->u_varnames);
533
534
    // This counter mirrors the fix done in fix_cell_offsets().
535
37.2k
    int numdropped = 0, cellvar_offset = -1;
536
37.2k
    pos = 0;
537
43.6k
    while (PyDict_Next(umd->u_cellvars, &pos, &k, &v)) {
538
6.40k
        int has_name = PyDict_Contains(umd->u_varnames, k);
539
6.40k
        RETURN_IF_ERROR(has_name);
540
6.40k
        if (has_name) {
541
            // Skip cells that are already covered by locals.
542
442
            numdropped += 1;
543
442
            continue;
544
442
        }
545
546
5.96k
        cellvar_offset = PyLong_AsInt(v);
547
5.96k
        if (cellvar_offset == -1 && PyErr_Occurred()) {
548
0
            return ERROR;
549
0
        }
550
5.96k
        assert(cellvar_offset >= 0);
551
5.96k
        cellvar_offset += nlocals - numdropped;
552
5.96k
        assert(cellvar_offset < nlocalsplus);
553
5.96k
        _Py_set_localsplus_info(cellvar_offset, k, CO_FAST_CELL, names, kinds);
554
5.96k
    }
555
556
37.2k
    pos = 0;
557
44.4k
    while (PyDict_Next(umd->u_freevars, &pos, &k, &v)) {
558
7.24k
        int offset = PyLong_AsInt(v);
559
7.24k
        if (offset == -1 && PyErr_Occurred()) {
560
0
            return ERROR;
561
0
        }
562
7.24k
        assert(offset >= 0);
563
7.24k
        offset += nlocals - numdropped;
564
7.24k
        assert(offset < nlocalsplus);
565
        /* XXX If the assertion below fails it is most likely because a freevar
566
           was added to u_freevars with the wrong index due to not taking into
567
           account cellvars already present, see gh-128632. */
568
7.24k
        assert(offset > cellvar_offset);
569
7.24k
        _Py_set_localsplus_info(offset, k, CO_FAST_FREE, names, kinds);
570
7.24k
    }
571
37.2k
    return SUCCESS;
572
37.2k
}
573
574
static PyCodeObject *
575
makecode(_PyCompile_CodeUnitMetadata *umd, struct assembler *a, PyObject *const_cache,
576
         PyObject *constslist, int maxdepth, int nlocalsplus, int code_flags,
577
         PyObject *filename)
578
37.2k
{
579
37.2k
    PyCodeObject *co = NULL;
580
37.2k
    PyObject *names = NULL;
581
37.2k
    PyObject *consts = NULL;
582
37.2k
    PyObject *localsplusnames = NULL;
583
37.2k
    PyObject *localspluskinds = NULL;
584
37.2k
    names = dict_keys_inorder(umd->u_names, 0);
585
37.2k
    if (!names) {
586
0
        goto error;
587
0
    }
588
37.2k
    if (_PyCompile_ConstCacheMergeOne(const_cache, &names) < 0) {
589
0
        goto error;
590
0
    }
591
592
37.2k
    consts = PyList_AsTuple(constslist); /* PyCode_New requires a tuple */
593
37.2k
    if (consts == NULL) {
594
0
        goto error;
595
0
    }
596
37.2k
    if (_PyCompile_ConstCacheMergeOne(const_cache, &consts) < 0) {
597
0
        goto error;
598
0
    }
599
600
37.2k
    assert(umd->u_posonlyargcount < INT_MAX);
601
37.2k
    assert(umd->u_argcount < INT_MAX);
602
37.2k
    assert(umd->u_kwonlyargcount < INT_MAX);
603
37.2k
    int posonlyargcount = (int)umd->u_posonlyargcount;
604
37.2k
    int posorkwargcount = (int)umd->u_argcount;
605
37.2k
    assert(INT_MAX - posonlyargcount - posorkwargcount > 0);
606
37.2k
    int kwonlyargcount = (int)umd->u_kwonlyargcount;
607
608
37.2k
    localsplusnames = PyTuple_New(nlocalsplus);
609
37.2k
    if (localsplusnames == NULL) {
610
0
        goto error;
611
0
    }
612
37.2k
    localspluskinds = PyBytes_FromStringAndSize(NULL, nlocalsplus);
613
37.2k
    if (localspluskinds == NULL) {
614
0
        goto error;
615
0
    }
616
37.2k
    if (compute_localsplus_info(
617
37.2k
            umd, nlocalsplus, code_flags,
618
37.2k
            localsplusnames, localspluskinds) == ERROR)
619
0
    {
620
0
        goto error;
621
0
    }
622
623
37.2k
    struct _PyCodeConstructor con = {
624
37.2k
        .filename = filename,
625
37.2k
        .name = umd->u_name,
626
37.2k
        .qualname = umd->u_qualname ? umd->u_qualname : umd->u_name,
627
37.2k
        .flags = code_flags,
628
629
37.2k
        .code = a->a_bytecode,
630
37.2k
        .firstlineno = umd->u_firstlineno,
631
37.2k
        .linetable = a->a_linetable,
632
633
37.2k
        .consts = consts,
634
37.2k
        .names = names,
635
636
37.2k
        .localsplusnames = localsplusnames,
637
37.2k
        .localspluskinds = localspluskinds,
638
639
37.2k
        .argcount = posonlyargcount + posorkwargcount,
640
37.2k
        .posonlyargcount = posonlyargcount,
641
37.2k
        .kwonlyargcount = kwonlyargcount,
642
643
37.2k
        .stacksize = maxdepth,
644
645
37.2k
        .exceptiontable = a->a_except_table,
646
37.2k
    };
647
648
37.2k
   if (_PyCode_Validate(&con) < 0) {
649
0
        goto error;
650
0
    }
651
652
37.2k
    if (_PyCompile_ConstCacheMergeOne(const_cache, &localsplusnames) < 0) {
653
0
        goto error;
654
0
    }
655
37.2k
    con.localsplusnames = localsplusnames;
656
657
37.2k
    co = _PyCode_New(&con);
658
37.2k
    if (co == NULL) {
659
0
        goto error;
660
0
    }
661
662
37.2k
error:
663
37.2k
    Py_XDECREF(names);
664
37.2k
    Py_XDECREF(consts);
665
37.2k
    Py_XDECREF(localsplusnames);
666
37.2k
    Py_XDECREF(localspluskinds);
667
37.2k
    return co;
668
37.2k
}
669
670
671
// The offset (in code units) of the END_SEND from the SEND in the `yield from` sequence.
672
2.50k
#define END_SEND_OFFSET 5
673
674
static int
675
resolve_jump_offsets(instr_sequence *instrs)
676
37.2k
{
677
    /* Compute the size of each instruction and fixup jump args.
678
     * Replace instruction index with position in bytecode.
679
     */
680
681
3.09M
    for (int i = 0; i < instrs->s_used; i++) {
682
3.05M
        instruction *instr = &instrs->s_instrs[i];
683
3.05M
        if (OPCODE_HAS_JUMP(instr->i_opcode)) {
684
177k
            instr->i_target = instr->i_oparg;
685
177k
        }
686
3.05M
    }
687
688
37.2k
    int extended_arg_recompile;
689
690
38.6k
    do {
691
38.6k
        int totsize = 0;
692
5.31M
        for (int i = 0; i < instrs->s_used; i++) {
693
5.27M
            instruction *instr = &instrs->s_instrs[i];
694
5.27M
            instr->i_offset = totsize;
695
5.27M
            int isize = instr_size(instr);
696
5.27M
            totsize += isize;
697
5.27M
        }
698
38.6k
        extended_arg_recompile = 0;
699
700
38.6k
        int offset = 0;
701
5.31M
        for (int i = 0; i < instrs->s_used; i++) {
702
5.27M
            instruction *instr = &instrs->s_instrs[i];
703
5.27M
            int isize = instr_size(instr);
704
            /* jump offsets are computed relative to
705
             * the instruction pointer after fetching
706
             * the jump instruction.
707
             */
708
5.27M
            offset += isize;
709
5.27M
            if (OPCODE_HAS_JUMP(instr->i_opcode)) {
710
401k
                instruction *target = &instrs->s_instrs[instr->i_target];
711
401k
                instr->i_oparg = target->i_offset;
712
401k
                if (instr->i_opcode == END_ASYNC_FOR) {
713
                    // sys.monitoring needs to be able to find the matching END_SEND
714
                    // but the target is the SEND, so we adjust it here.
715
2.50k
                    instr->i_oparg = offset - instr->i_oparg - END_SEND_OFFSET;
716
2.50k
                }
717
398k
                else if (instr->i_oparg < offset) {
718
40.6k
                    assert(IS_BACKWARDS_JUMP_OPCODE(instr->i_opcode));
719
40.6k
                    instr->i_oparg = offset - instr->i_oparg;
720
40.6k
                }
721
357k
                else {
722
357k
                    assert(!IS_BACKWARDS_JUMP_OPCODE(instr->i_opcode));
723
357k
                    instr->i_oparg = instr->i_oparg - offset;
724
357k
                }
725
401k
                if (instr_size(instr) != isize) {
726
81.6k
                    extended_arg_recompile = 1;
727
81.6k
                }
728
401k
            }
729
5.27M
        }
730
    /* XXX: This is an awful hack that could hurt performance, but
731
        on the bright side it should work until we come up
732
        with a better solution.
733
734
        The issue is that in the first loop instr_size() is
735
        called, and it requires i_oparg be set appropriately.
736
        There is a bootstrap problem because i_oparg is
737
        calculated in the second loop above.
738
739
        So we loop until we stop seeing new EXTENDED_ARGs.
740
        The only EXTENDED_ARGs that could be popping up are
741
        ones in jump instructions.  So this should converge
742
        fairly quickly.
743
    */
744
38.6k
    } while (extended_arg_recompile);
745
37.2k
    return SUCCESS;
746
37.2k
}
747
748
static int
749
resolve_unconditional_jumps(instr_sequence *instrs)
750
37.2k
{
751
    /* Resolve directions of unconditional jumps */
752
753
3.09M
    for (int i = 0; i < instrs->s_used; i++) {
754
3.05M
        instruction *instr = &instrs->s_instrs[i];
755
3.05M
        bool is_forward = (instr->i_oparg > i);
756
3.05M
        switch(instr->i_opcode) {
757
9.45k
            case JUMP:
758
9.45k
                assert(is_pseudo_target(JUMP, JUMP_FORWARD));
759
9.45k
                assert(is_pseudo_target(JUMP, JUMP_BACKWARD));
760
9.45k
                instr->i_opcode = is_forward ? JUMP_FORWARD : JUMP_BACKWARD;
761
9.45k
                break;
762
24.0k
            case JUMP_NO_INTERRUPT:
763
24.0k
                assert(is_pseudo_target(JUMP_NO_INTERRUPT, JUMP_FORWARD));
764
24.0k
                assert(is_pseudo_target(JUMP_NO_INTERRUPT, JUMP_BACKWARD_NO_INTERRUPT));
765
24.0k
                instr->i_opcode = is_forward ?
766
14.2k
                    JUMP_FORWARD : JUMP_BACKWARD_NO_INTERRUPT;
767
24.0k
                break;
768
3.02M
            default:
769
3.02M
                if (OPCODE_HAS_JUMP(instr->i_opcode) &&
770
143k
                    IS_PSEUDO_INSTR(instr->i_opcode)) {
771
0
                    Py_UNREACHABLE();
772
0
                }
773
3.05M
        }
774
3.05M
    }
775
37.2k
    return SUCCESS;
776
37.2k
}
777
778
PyCodeObject *
779
_PyAssemble_MakeCodeObject(_PyCompile_CodeUnitMetadata *umd, PyObject *const_cache,
780
                           PyObject *consts, int maxdepth, instr_sequence *instrs,
781
                           int nlocalsplus, int code_flags, PyObject *filename)
782
37.2k
{
783
37.2k
    if (_PyInstructionSequence_ApplyLabelMap(instrs) < 0) {
784
0
        return NULL;
785
0
    }
786
37.2k
    if (resolve_unconditional_jumps(instrs) < 0) {
787
0
        return NULL;
788
0
    }
789
37.2k
    if (resolve_jump_offsets(instrs) < 0) {
790
0
        return NULL;
791
0
    }
792
37.2k
    PyCodeObject *co = NULL;
793
794
37.2k
    struct assembler a;
795
37.2k
    int res = assemble_emit(&a, instrs, umd->u_firstlineno, const_cache);
796
37.2k
    if (res == SUCCESS) {
797
37.2k
        co = makecode(umd, &a, const_cache, consts, maxdepth, nlocalsplus,
798
37.2k
                      code_flags, filename);
799
37.2k
    }
800
37.2k
    assemble_free(&a);
801
37.2k
    return co;
802
37.2k
}