Coverage Report

Created: 2025-08-24 07:03

/src/cpython/Objects/listobject.c
Line
Count
Source (jump to first uncovered line)
1
/* List object implementation */
2
3
#include "Python.h"
4
#include "pycore_abstract.h"      // _PyIndex_Check()
5
#include "pycore_ceval.h"         // _PyEval_GetBuiltin()
6
#include "pycore_critical_section.h"  // _Py_CRITICAL_SECTION_ASSERT_OBJECT_LOCKED()
7
#include "pycore_dict.h"          // _PyDictViewObject
8
#include "pycore_freelist.h"      // _Py_FREELIST_FREE(), _Py_FREELIST_POP()
9
#include "pycore_pyatomic_ft_wrappers.h"
10
#include "pycore_interp.h"        // PyInterpreterState.list
11
#include "pycore_list.h"          // struct _Py_list_freelist, _PyListIterObject
12
#include "pycore_long.h"          // _PyLong_DigitCount
13
#include "pycore_modsupport.h"    // _PyArg_NoKwnames()
14
#include "pycore_object.h"        // _PyObject_GC_TRACK(), _PyDebugAllocatorStats()
15
#include "pycore_stackref.h"      // _Py_TryIncrefCompareStackRef()
16
#include "pycore_tuple.h"         // _PyTuple_FromArray()
17
#include "pycore_typeobject.h"    // _Py_TYPE_VERSION_LIST
18
#include "pycore_setobject.h"     // _PySet_NextEntry()
19
#include <stddef.h>
20
21
/*[clinic input]
22
class list "PyListObject *" "&PyList_Type"
23
[clinic start generated code]*/
24
/*[clinic end generated code: output=da39a3ee5e6b4b0d input=f9b222678f9f71e0]*/
25
26
#include "clinic/listobject.c.h"
27
28
_Py_DECLARE_STR(list_err, "list index out of range");
29
30
#ifdef Py_GIL_DISABLED
31
typedef struct {
32
    Py_ssize_t allocated;
33
    PyObject *ob_item[];
34
} _PyListArray;
35
36
static _PyListArray *
37
list_allocate_array(size_t capacity)
38
{
39
    if (capacity > PY_SSIZE_T_MAX/sizeof(PyObject*) - 1) {
40
        return NULL;
41
    }
42
    _PyListArray *array = PyMem_Malloc(sizeof(_PyListArray) + capacity * sizeof(PyObject *));
43
    if (array == NULL) {
44
        return NULL;
45
    }
46
    array->allocated = capacity;
47
    return array;
48
}
49
50
static Py_ssize_t
51
list_capacity(PyObject **items)
52
{
53
    _PyListArray *array = _Py_CONTAINER_OF(items, _PyListArray, ob_item);
54
    return array->allocated;
55
}
56
#endif
57
58
static void
59
free_list_items(PyObject** items, bool use_qsbr)
60
124M
{
61
#ifdef Py_GIL_DISABLED
62
    _PyListArray *array = _Py_CONTAINER_OF(items, _PyListArray, ob_item);
63
    if (use_qsbr) {
64
        size_t size = sizeof(_PyListArray) + array->allocated * sizeof(PyObject *);
65
        _PyMem_FreeDelayed(array, size);
66
    }
67
    else {
68
        PyMem_Free(array);
69
    }
70
#else
71
124M
    PyMem_Free(items);
72
124M
#endif
73
124M
}
74
75
static void
76
ensure_shared_on_resize(PyListObject *self)
77
91.3M
{
78
#ifdef Py_GIL_DISABLED
79
    // We can't use _Py_CRITICAL_SECTION_ASSERT_OBJECT_LOCKED here because
80
    // the `CALL_LIST_APPEND` bytecode handler may lock the list without
81
    // a critical section.
82
    assert(Py_REFCNT(self) == 1 || PyMutex_IsLocked(&_PyObject_CAST(self)->ob_mutex));
83
84
    // Ensure that the list array is freed using QSBR if we are not the
85
    // owning thread.
86
    if (!_Py_IsOwnedByCurrentThread((PyObject *)self) &&
87
        !_PyObject_GC_IS_SHARED(self))
88
    {
89
        _PyObject_GC_SET_SHARED(self);
90
    }
91
#endif
92
91.3M
}
93
94
/* Ensure ob_item has room for at least newsize elements, and set
95
 * ob_size to newsize.  If newsize > ob_size on entry, the content
96
 * of the new slots at exit is undefined heap trash; it's the caller's
97
 * responsibility to overwrite them with sane values.
98
 * The number of allocated elements may grow, shrink, or stay the same.
99
 * Failure is impossible if newsize <= self.allocated on entry, although
100
 * that partly relies on an assumption that the system realloc() never
101
 * fails when passed a number of bytes <= the number of bytes last
102
 * allocated (the C standard doesn't guarantee this, but it's hard to
103
 * imagine a realloc implementation where it wouldn't be true).
104
 * Note that self->ob_item may change, and even if newsize is less
105
 * than ob_size on entry.
106
 */
107
static int
108
list_resize(PyListObject *self, Py_ssize_t newsize)
109
110M
{
110
110M
    size_t new_allocated, target_bytes;
111
110M
    Py_ssize_t allocated = self->allocated;
112
113
    /* Bypass realloc() when a previous overallocation is large enough
114
       to accommodate the newsize.  If the newsize falls lower than half
115
       the allocated size, then proceed with the realloc() to shrink the list.
116
    */
117
110M
    if (allocated >= newsize && newsize >= (allocated >> 1)) {
118
19.1M
        assert(self->ob_item != NULL || newsize == 0);
119
19.1M
        Py_SET_SIZE(self, newsize);
120
19.1M
        return 0;
121
19.1M
    }
122
123
    /* This over-allocates proportional to the list size, making room
124
     * for additional growth.  The over-allocation is mild, but is
125
     * enough to give linear-time amortized behavior over a long
126
     * sequence of appends() in the presence of a poorly-performing
127
     * system realloc().
128
     * Add padding to make the allocated size multiple of 4.
129
     * The growth pattern is:  0, 4, 8, 16, 24, 32, 40, 52, 64, 76, ...
130
     * Note: new_allocated won't overflow because the largest possible value
131
     *       is PY_SSIZE_T_MAX * (9 / 8) + 6 which always fits in a size_t.
132
     */
133
91.3M
    new_allocated = ((size_t)newsize + (newsize >> 3) + 6) & ~(size_t)3;
134
    /* Do not overallocate if the new size is closer to overallocated size
135
     * than to the old size.
136
     */
137
91.3M
    if (newsize - Py_SIZE(self) > (Py_ssize_t)(new_allocated - newsize))
138
9.95k
        new_allocated = ((size_t)newsize + 3) & ~(size_t)3;
139
140
91.3M
    if (newsize == 0)
141
2.33k
        new_allocated = 0;
142
143
91.3M
    ensure_shared_on_resize(self);
144
145
#ifdef Py_GIL_DISABLED
146
    _PyListArray *array = list_allocate_array(new_allocated);
147
    if (array == NULL) {
148
        PyErr_NoMemory();
149
        return -1;
150
    }
151
    PyObject **old_items = self->ob_item;
152
    if (self->ob_item) {
153
        if (new_allocated < (size_t)allocated) {
154
            target_bytes = new_allocated * sizeof(PyObject*);
155
        }
156
        else {
157
            target_bytes = allocated * sizeof(PyObject*);
158
        }
159
        memcpy(array->ob_item, self->ob_item, target_bytes);
160
    }
161
    if (new_allocated > (size_t)allocated) {
162
        memset(array->ob_item + allocated, 0, sizeof(PyObject *) * (new_allocated - allocated));
163
    }
164
     _Py_atomic_store_ptr_release(&self->ob_item, &array->ob_item);
165
    self->allocated = new_allocated;
166
    Py_SET_SIZE(self, newsize);
167
    if (old_items != NULL) {
168
        free_list_items(old_items, _PyObject_GC_IS_SHARED(self));
169
    }
170
#else
171
91.3M
    PyObject **items;
172
91.3M
    if (new_allocated <= (size_t)PY_SSIZE_T_MAX / sizeof(PyObject *)) {
173
91.3M
        target_bytes = new_allocated * sizeof(PyObject *);
174
91.3M
        items = (PyObject **)PyMem_Realloc(self->ob_item, target_bytes);
175
91.3M
    }
176
0
    else {
177
        // integer overflow
178
0
        items = NULL;
179
0
    }
180
91.3M
    if (items == NULL) {
181
0
        PyErr_NoMemory();
182
0
        return -1;
183
0
    }
184
91.3M
    self->ob_item = items;
185
91.3M
    Py_SET_SIZE(self, newsize);
186
91.3M
    self->allocated = new_allocated;
187
91.3M
#endif
188
91.3M
    return 0;
189
91.3M
}
190
191
static int
192
list_preallocate_exact(PyListObject *self, Py_ssize_t size)
193
6.22M
{
194
6.22M
    PyObject **items;
195
6.22M
    assert(self->ob_item == NULL);
196
6.22M
    assert(size > 0);
197
198
    /* Since the Python memory allocator has granularity of 16 bytes on 64-bit
199
     * platforms (8 on 32-bit), there is no benefit of allocating space for
200
     * the odd number of items, and there is no drawback of rounding the
201
     * allocated size up to the nearest even number.
202
     */
203
6.22M
    size = (size + 1) & ~(size_t)1;
204
#ifdef Py_GIL_DISABLED
205
    _PyListArray *array = list_allocate_array(size);
206
    if (array == NULL) {
207
        PyErr_NoMemory();
208
        return -1;
209
    }
210
    items = array->ob_item;
211
    memset(items, 0, size * sizeof(PyObject *));
212
#else
213
6.22M
    items = PyMem_New(PyObject*, size);
214
6.22M
    if (items == NULL) {
215
0
        PyErr_NoMemory();
216
0
        return -1;
217
0
    }
218
6.22M
#endif
219
6.22M
    FT_ATOMIC_STORE_PTR_RELEASE(self->ob_item, items);
220
6.22M
    self->allocated = size;
221
6.22M
    return 0;
222
6.22M
}
223
224
/* Print summary info about the state of the optimized allocator */
225
void
226
_PyList_DebugMallocStats(FILE *out)
227
0
{
228
0
    _PyDebugAllocatorStats(out,
229
0
                           "free PyListObject",
230
0
                            _Py_FREELIST_SIZE(lists),
231
0
                           sizeof(PyListObject));
232
0
}
233
234
PyObject *
235
PyList_New(Py_ssize_t size)
236
289M
{
237
289M
    if (size < 0) {
238
0
        PyErr_BadInternalCall();
239
0
        return NULL;
240
0
    }
241
242
289M
    PyListObject *op = _Py_FREELIST_POP(PyListObject, lists);
243
289M
    if (op == NULL) {
244
32.1M
        op = PyObject_GC_New(PyListObject, &PyList_Type);
245
32.1M
        if (op == NULL) {
246
0
            return NULL;
247
0
        }
248
32.1M
    }
249
289M
    if (size <= 0) {
250
242M
        op->ob_item = NULL;
251
242M
    }
252
46.9M
    else {
253
#ifdef Py_GIL_DISABLED
254
        _PyListArray *array = list_allocate_array(size);
255
        if (array == NULL) {
256
            Py_DECREF(op);
257
            return PyErr_NoMemory();
258
        }
259
        memset(&array->ob_item, 0, size * sizeof(PyObject *));
260
        op->ob_item = array->ob_item;
261
#else
262
46.9M
        op->ob_item = (PyObject **) PyMem_Calloc(size, sizeof(PyObject *));
263
46.9M
#endif
264
46.9M
        if (op->ob_item == NULL) {
265
0
            Py_DECREF(op);
266
0
            return PyErr_NoMemory();
267
0
        }
268
46.9M
    }
269
289M
    Py_SET_SIZE(op, size);
270
289M
    op->allocated = size;
271
289M
    _PyObject_GC_TRACK(op);
272
289M
    return (PyObject *) op;
273
289M
}
274
275
static PyObject *
276
list_new_prealloc(Py_ssize_t size)
277
13.6M
{
278
13.6M
    assert(size > 0);
279
13.6M
    PyListObject *op = (PyListObject *) PyList_New(0);
280
13.6M
    if (op == NULL) {
281
0
        return NULL;
282
0
    }
283
13.6M
    assert(op->ob_item == NULL);
284
#ifdef Py_GIL_DISABLED
285
    _PyListArray *array = list_allocate_array(size);
286
    if (array == NULL) {
287
        Py_DECREF(op);
288
        return PyErr_NoMemory();
289
    }
290
    op->ob_item = array->ob_item;
291
#else
292
13.6M
    op->ob_item = PyMem_New(PyObject *, size);
293
13.6M
    if (op->ob_item == NULL) {
294
0
        Py_DECREF(op);
295
0
        return PyErr_NoMemory();
296
0
    }
297
13.6M
#endif
298
13.6M
    op->allocated = size;
299
13.6M
    return (PyObject *) op;
300
13.6M
}
301
302
Py_ssize_t
303
PyList_Size(PyObject *op)
304
89.8k
{
305
89.8k
    if (!PyList_Check(op)) {
306
0
        PyErr_BadInternalCall();
307
0
        return -1;
308
0
    }
309
89.8k
    else {
310
89.8k
        return PyList_GET_SIZE(op);
311
89.8k
    }
312
89.8k
}
313
314
static inline int
315
valid_index(Py_ssize_t i, Py_ssize_t limit)
316
223M
{
317
    /* The cast to size_t lets us use just a single comparison
318
       to check whether i is in the range: 0 <= i < limit.
319
320
       See:  Section 14.2 "Bounds Checking" in the Agner Fog
321
       optimization manual found at:
322
       https://www.agner.org/optimize/optimizing_cpp.pdf
323
    */
324
223M
    return (size_t) i < (size_t) limit;
325
223M
}
326
327
#ifdef Py_GIL_DISABLED
328
329
static PyObject *
330
list_item_impl(PyListObject *self, Py_ssize_t idx)
331
{
332
    PyObject *item = NULL;
333
    Py_BEGIN_CRITICAL_SECTION(self);
334
    if (!_PyObject_GC_IS_SHARED(self)) {
335
        _PyObject_GC_SET_SHARED(self);
336
    }
337
    Py_ssize_t size = Py_SIZE(self);
338
    if (!valid_index(idx, size)) {
339
        goto exit;
340
    }
341
    item = _Py_NewRefWithLock(self->ob_item[idx]);
342
exit:
343
    Py_END_CRITICAL_SECTION();
344
    return item;
345
}
346
347
static inline PyObject*
348
list_get_item_ref(PyListObject *op, Py_ssize_t i)
349
{
350
    if (!_Py_IsOwnedByCurrentThread((PyObject *)op) && !_PyObject_GC_IS_SHARED(op)) {
351
        return list_item_impl(op, i);
352
    }
353
    // Need atomic operation for the getting size.
354
    Py_ssize_t size = PyList_GET_SIZE(op);
355
    if (!valid_index(i, size)) {
356
        return NULL;
357
    }
358
    PyObject **ob_item = _Py_atomic_load_ptr(&op->ob_item);
359
    if (ob_item == NULL) {
360
        return NULL;
361
    }
362
    Py_ssize_t cap = list_capacity(ob_item);
363
    assert(cap != -1);
364
    if (!valid_index(i, cap)) {
365
        return NULL;
366
    }
367
    PyObject *item = _Py_TryXGetRef(&ob_item[i]);
368
    if (item == NULL) {
369
        return list_item_impl(op, i);
370
    }
371
    return item;
372
}
373
#else
374
static inline PyObject*
375
list_get_item_ref(PyListObject *op, Py_ssize_t i)
376
170M
{
377
170M
    if (!valid_index(i, Py_SIZE(op))) {
378
33.1M
        return NULL;
379
33.1M
    }
380
137M
    return Py_NewRef(PyList_GET_ITEM(op, i));
381
170M
}
382
#endif
383
384
PyObject *
385
PyList_GetItem(PyObject *op, Py_ssize_t i)
386
584
{
387
584
    if (!PyList_Check(op)) {
388
0
        PyErr_BadInternalCall();
389
0
        return NULL;
390
0
    }
391
584
    if (!valid_index(i, Py_SIZE(op))) {
392
0
        _Py_DECLARE_STR(list_err, "list index out of range");
393
0
        PyErr_SetObject(PyExc_IndexError, &_Py_STR(list_err));
394
0
        return NULL;
395
0
    }
396
584
    return ((PyListObject *)op) -> ob_item[i];
397
584
}
398
399
PyObject *
400
PyList_GetItemRef(PyObject *op, Py_ssize_t i)
401
83.2k
{
402
83.2k
    if (!PyList_Check(op)) {
403
0
        PyErr_SetString(PyExc_TypeError, "expected a list");
404
0
        return NULL;
405
0
    }
406
83.2k
    PyObject *item = list_get_item_ref((PyListObject *)op, i);
407
83.2k
    if (item == NULL) {
408
0
        _Py_DECLARE_STR(list_err, "list index out of range");
409
0
        PyErr_SetObject(PyExc_IndexError, &_Py_STR(list_err));
410
0
        return NULL;
411
0
    }
412
83.2k
    return item;
413
83.2k
}
414
415
PyObject *
416
_PyList_GetItemRef(PyListObject *list, Py_ssize_t i)
417
1.85k
{
418
1.85k
    return list_get_item_ref(list, i);
419
1.85k
}
420
421
#ifdef Py_GIL_DISABLED
422
int
423
_PyList_GetItemRefNoLock(PyListObject *list, Py_ssize_t i, _PyStackRef *result)
424
{
425
    assert(_Py_IsOwnedByCurrentThread((PyObject *)list) ||
426
           _PyObject_GC_IS_SHARED(list));
427
    if (!valid_index(i, PyList_GET_SIZE(list))) {
428
        return 0;
429
    }
430
    PyObject **ob_item = _Py_atomic_load_ptr(&list->ob_item);
431
    if (ob_item == NULL) {
432
        return 0;
433
    }
434
    Py_ssize_t cap = list_capacity(ob_item);
435
    assert(cap != -1);
436
    if (!valid_index(i, cap)) {
437
        return 0;
438
    }
439
    PyObject *obj = _Py_atomic_load_ptr(&ob_item[i]);
440
    if (obj == NULL || !_Py_TryIncrefCompareStackRef(&ob_item[i], obj, result)) {
441
        return -1;
442
    }
443
    return 1;
444
}
445
#endif
446
447
int
448
PyList_SetItem(PyObject *op, Py_ssize_t i,
449
               PyObject *newitem)
450
22.2k
{
451
22.2k
    if (!PyList_Check(op)) {
452
0
        Py_XDECREF(newitem);
453
0
        PyErr_BadInternalCall();
454
0
        return -1;
455
0
    }
456
22.2k
    int ret;
457
22.2k
    PyListObject *self = ((PyListObject *)op);
458
22.2k
    Py_BEGIN_CRITICAL_SECTION(self);
459
22.2k
    if (!valid_index(i, Py_SIZE(self))) {
460
0
        Py_XDECREF(newitem);
461
0
        PyErr_SetString(PyExc_IndexError,
462
0
                        "list assignment index out of range");
463
0
        ret = -1;
464
0
        goto end;
465
0
    }
466
22.2k
    PyObject *tmp = self->ob_item[i];
467
22.2k
    FT_ATOMIC_STORE_PTR_RELEASE(self->ob_item[i], newitem);
468
22.2k
    Py_XDECREF(tmp);
469
22.2k
    ret = 0;
470
22.2k
end:;
471
22.2k
    Py_END_CRITICAL_SECTION();
472
22.2k
    return ret;
473
22.2k
}
474
475
static int
476
ins1(PyListObject *self, Py_ssize_t where, PyObject *v)
477
76
{
478
76
    Py_ssize_t i, n = Py_SIZE(self);
479
76
    PyObject **items;
480
76
    if (v == NULL) {
481
0
        PyErr_BadInternalCall();
482
0
        return -1;
483
0
    }
484
485
76
    assert((size_t)n + 1 < PY_SSIZE_T_MAX);
486
76
    if (list_resize(self, n+1) < 0)
487
0
        return -1;
488
489
76
    if (where < 0) {
490
0
        where += n;
491
0
        if (where < 0)
492
0
            where = 0;
493
0
    }
494
76
    if (where > n)
495
0
        where = n;
496
76
    items = self->ob_item;
497
462
    for (i = n; --i >= where; )
498
386
        FT_ATOMIC_STORE_PTR_RELAXED(items[i+1], items[i]);
499
76
    FT_ATOMIC_STORE_PTR_RELEASE(items[where], Py_NewRef(v));
500
76
    return 0;
501
76
}
502
503
int
504
PyList_Insert(PyObject *op, Py_ssize_t where, PyObject *newitem)
505
16
{
506
16
    if (!PyList_Check(op)) {
507
0
        PyErr_BadInternalCall();
508
0
        return -1;
509
0
    }
510
16
    PyListObject *self = (PyListObject *)op;
511
16
    int err;
512
16
    Py_BEGIN_CRITICAL_SECTION(self);
513
16
    err = ins1(self, where, newitem);
514
16
    Py_END_CRITICAL_SECTION();
515
16
    return err;
516
16
}
517
518
/* internal, used by _PyList_AppendTakeRef */
519
int
520
_PyList_AppendTakeRefListResize(PyListObject *self, PyObject *newitem)
521
65.9M
{
522
65.9M
    Py_ssize_t len = Py_SIZE(self);
523
65.9M
    assert(self->allocated == -1 || self->allocated == len);
524
65.9M
    if (list_resize(self, len + 1) < 0) {
525
0
        Py_DECREF(newitem);
526
0
        return -1;
527
0
    }
528
65.9M
    FT_ATOMIC_STORE_PTR_RELEASE(self->ob_item[len], newitem);
529
65.9M
    return 0;
530
65.9M
}
531
532
int
533
PyList_Append(PyObject *op, PyObject *newitem)
534
160M
{
535
160M
    if (PyList_Check(op) && (newitem != NULL)) {
536
160M
        int ret;
537
160M
        Py_BEGIN_CRITICAL_SECTION(op);
538
160M
        ret = _PyList_AppendTakeRef((PyListObject *)op, Py_NewRef(newitem));
539
160M
        Py_END_CRITICAL_SECTION();
540
160M
        return ret;
541
160M
    }
542
0
    PyErr_BadInternalCall();
543
0
    return -1;
544
160M
}
545
546
/* Methods */
547
548
static void
549
list_dealloc(PyObject *self)
550
309M
{
551
309M
    PyListObject *op = (PyListObject *)self;
552
309M
    Py_ssize_t i;
553
309M
    PyObject_GC_UnTrack(op);
554
309M
    if (op->ob_item != NULL) {
555
        /* Do it backwards, for Christian Tismer.
556
           There's a simple test case where somehow this reduces
557
           thrashing when a *very* large list is created and
558
           immediately deleted. */
559
109M
        i = Py_SIZE(op);
560
1.55G
        while (--i >= 0) {
561
1.44G
            Py_XDECREF(op->ob_item[i]);
562
1.44G
        }
563
109M
        free_list_items(op->ob_item, false);
564
109M
        op->ob_item = NULL;
565
109M
    }
566
309M
    if (PyList_CheckExact(op)) {
567
298M
        _Py_FREELIST_FREE(lists, op, PyObject_GC_Del);
568
298M
    }
569
11.1M
    else {
570
11.1M
        PyObject_GC_Del(op);
571
11.1M
    }
572
309M
}
573
574
static PyObject *
575
list_repr_impl(PyListObject *v)
576
3.75M
{
577
3.75M
    int res = Py_ReprEnter((PyObject*)v);
578
3.75M
    if (res != 0) {
579
0
        return (res > 0 ? PyUnicode_FromString("[...]") : NULL);
580
0
    }
581
582
    /* "[" + "1" + ", 2" * (len - 1) + "]" */
583
3.75M
    Py_ssize_t prealloc = 1 + 1 + (2 + 1) * (Py_SIZE(v) - 1) + 1;
584
3.75M
    PyUnicodeWriter *writer = PyUnicodeWriter_Create(prealloc);
585
3.75M
    PyObject *item = NULL;
586
3.75M
    if (writer == NULL) {
587
0
        goto error;
588
0
    }
589
590
3.75M
    if (PyUnicodeWriter_WriteChar(writer, '[') < 0) {
591
0
        goto error;
592
0
    }
593
594
    /* Do repr() on each element.  Note that this may mutate the list,
595
       so must refetch the list size on each iteration. */
596
10.5M
    for (Py_ssize_t i = 0; i < Py_SIZE(v); ++i) {
597
        /* Hold a strong reference since repr(item) can mutate the list */
598
6.76M
        item = Py_NewRef(v->ob_item[i]);
599
600
6.76M
        if (i > 0) {
601
3.00M
            if (PyUnicodeWriter_WriteChar(writer, ',') < 0) {
602
0
                goto error;
603
0
            }
604
3.00M
            if (PyUnicodeWriter_WriteChar(writer, ' ') < 0) {
605
0
                goto error;
606
0
            }
607
3.00M
        }
608
609
6.76M
        if (PyUnicodeWriter_WriteRepr(writer, item) < 0) {
610
0
            goto error;
611
0
        }
612
6.76M
        Py_CLEAR(item);
613
6.76M
    }
614
615
3.75M
    if (PyUnicodeWriter_WriteChar(writer, ']') < 0) {
616
0
        goto error;
617
0
    }
618
619
3.75M
    Py_ReprLeave((PyObject *)v);
620
3.75M
    return PyUnicodeWriter_Finish(writer);
621
622
0
error:
623
0
    Py_XDECREF(item);
624
0
    PyUnicodeWriter_Discard(writer);
625
0
    Py_ReprLeave((PyObject *)v);
626
0
    return NULL;
627
3.75M
}
628
629
static PyObject *
630
list_repr(PyObject *self)
631
3.76M
{
632
3.76M
    if (PyList_GET_SIZE(self) == 0) {
633
6.52k
        return PyUnicode_FromString("[]");
634
6.52k
    }
635
3.75M
    PyListObject *v = (PyListObject *)self;
636
3.75M
    PyObject *ret = NULL;
637
3.75M
    Py_BEGIN_CRITICAL_SECTION(v);
638
3.75M
    ret = list_repr_impl(v);
639
3.75M
    Py_END_CRITICAL_SECTION();
640
3.75M
    return ret;
641
3.76M
}
642
643
static Py_ssize_t
644
list_length(PyObject *a)
645
59.3M
{
646
59.3M
    return PyList_GET_SIZE(a);
647
59.3M
}
648
649
static int
650
list_contains(PyObject *aa, PyObject *el)
651
2.36k
{
652
653
28.8k
    for (Py_ssize_t i = 0; ; i++) {
654
28.8k
        PyObject *item = list_get_item_ref((PyListObject *)aa, i);
655
28.8k
        if (item == NULL) {
656
            // out-of-bounds
657
1.75k
            return 0;
658
1.75k
        }
659
27.1k
        int cmp = PyObject_RichCompareBool(item, el, Py_EQ);
660
27.1k
        Py_DECREF(item);
661
27.1k
        if (cmp != 0) {
662
612
            return cmp;
663
612
        }
664
27.1k
    }
665
0
    return 0;
666
2.36k
}
667
668
static PyObject *
669
list_item(PyObject *aa, Py_ssize_t i)
670
16.4M
{
671
16.4M
    PyListObject *a = (PyListObject *)aa;
672
16.4M
    if (!valid_index(i, PyList_GET_SIZE(a))) {
673
991
        PyErr_SetObject(PyExc_IndexError, &_Py_STR(list_err));
674
991
        return NULL;
675
991
    }
676
16.4M
    PyObject *item;
677
#ifdef Py_GIL_DISABLED
678
    item = list_get_item_ref(a, i);
679
    if (item == NULL) {
680
        PyErr_SetObject(PyExc_IndexError, &_Py_STR(list_err));
681
        return NULL;
682
    }
683
#else
684
16.4M
    item = Py_NewRef(a->ob_item[i]);
685
16.4M
#endif
686
16.4M
    return item;
687
16.4M
}
688
689
static PyObject *
690
list_slice_lock_held(PyListObject *a, Py_ssize_t ilow, Py_ssize_t ihigh)
691
2.06M
{
692
2.06M
    PyListObject *np;
693
2.06M
    PyObject **src, **dest;
694
2.06M
    Py_ssize_t i, len;
695
2.06M
    len = ihigh - ilow;
696
2.06M
    if (len <= 0) {
697
0
        return PyList_New(0);
698
0
    }
699
2.06M
    np = (PyListObject *) list_new_prealloc(len);
700
2.06M
    if (np == NULL)
701
0
        return NULL;
702
703
2.06M
    src = a->ob_item + ilow;
704
2.06M
    dest = np->ob_item;
705
37.3M
    for (i = 0; i < len; i++) {
706
35.2M
        PyObject *v = src[i];
707
35.2M
        dest[i] = Py_NewRef(v);
708
35.2M
    }
709
2.06M
    Py_SET_SIZE(np, len);
710
2.06M
    return (PyObject *)np;
711
2.06M
}
712
713
PyObject *
714
PyList_GetSlice(PyObject *a, Py_ssize_t ilow, Py_ssize_t ihigh)
715
0
{
716
0
    if (!PyList_Check(a)) {
717
0
        PyErr_BadInternalCall();
718
0
        return NULL;
719
0
    }
720
0
    PyObject *ret;
721
0
    Py_BEGIN_CRITICAL_SECTION(a);
722
0
    if (ilow < 0) {
723
0
        ilow = 0;
724
0
    }
725
0
    else if (ilow > Py_SIZE(a)) {
726
0
        ilow = Py_SIZE(a);
727
0
    }
728
0
    if (ihigh < ilow) {
729
0
        ihigh = ilow;
730
0
    }
731
0
    else if (ihigh > Py_SIZE(a)) {
732
0
        ihigh = Py_SIZE(a);
733
0
    }
734
0
    ret = list_slice_lock_held((PyListObject *)a, ilow, ihigh);
735
0
    Py_END_CRITICAL_SECTION();
736
0
    return ret;
737
0
}
738
739
static PyObject *
740
list_concat_lock_held(PyListObject *a, PyListObject *b)
741
19.2M
{
742
19.2M
    Py_ssize_t size;
743
19.2M
    Py_ssize_t i;
744
19.2M
    PyObject **src, **dest;
745
19.2M
    PyListObject *np;
746
19.2M
    assert((size_t)Py_SIZE(a) + (size_t)Py_SIZE(b) < PY_SSIZE_T_MAX);
747
19.2M
    size = Py_SIZE(a) + Py_SIZE(b);
748
19.2M
    if (size == 0) {
749
7.73M
        return PyList_New(0);
750
7.73M
    }
751
11.5M
    np = (PyListObject *) list_new_prealloc(size);
752
11.5M
    if (np == NULL) {
753
0
        return NULL;
754
0
    }
755
11.5M
    src = a->ob_item;
756
11.5M
    dest = np->ob_item;
757
459M
    for (i = 0; i < Py_SIZE(a); i++) {
758
448M
        PyObject *v = src[i];
759
448M
        dest[i] = Py_NewRef(v);
760
448M
    }
761
11.5M
    src = b->ob_item;
762
11.5M
    dest = np->ob_item + Py_SIZE(a);
763
218M
    for (i = 0; i < Py_SIZE(b); i++) {
764
207M
        PyObject *v = src[i];
765
207M
        dest[i] = Py_NewRef(v);
766
207M
    }
767
11.5M
    Py_SET_SIZE(np, size);
768
11.5M
    return (PyObject *)np;
769
11.5M
}
770
771
static PyObject *
772
list_concat(PyObject *aa, PyObject *bb)
773
19.2M
{
774
19.2M
    if (!PyList_Check(bb)) {
775
0
        PyErr_Format(PyExc_TypeError,
776
0
                  "can only concatenate list (not \"%.200s\") to list",
777
0
                  Py_TYPE(bb)->tp_name);
778
0
        return NULL;
779
0
    }
780
19.2M
    PyListObject *a = (PyListObject *)aa;
781
19.2M
    PyListObject *b = (PyListObject *)bb;
782
19.2M
    PyObject *ret;
783
19.2M
    Py_BEGIN_CRITICAL_SECTION2(a, b);
784
19.2M
    ret = list_concat_lock_held(a, b);
785
19.2M
    Py_END_CRITICAL_SECTION2();
786
19.2M
    return ret;
787
19.2M
}
788
789
static PyObject *
790
list_repeat_lock_held(PyListObject *a, Py_ssize_t n)
791
14.8k
{
792
14.8k
    const Py_ssize_t input_size = Py_SIZE(a);
793
14.8k
    if (input_size == 0 || n <= 0)
794
2.33k
        return PyList_New(0);
795
12.5k
    assert(n > 0);
796
797
12.5k
    if (input_size > PY_SSIZE_T_MAX / n)
798
0
        return PyErr_NoMemory();
799
12.5k
    Py_ssize_t output_size = input_size * n;
800
801
12.5k
    PyListObject *np = (PyListObject *) list_new_prealloc(output_size);
802
12.5k
    if (np == NULL)
803
0
        return NULL;
804
805
12.5k
    PyObject **dest = np->ob_item;
806
12.5k
    if (input_size == 1) {
807
12.5k
        PyObject *elem = a->ob_item[0];
808
12.5k
        _Py_RefcntAdd(elem, n);
809
12.5k
        PyObject **dest_end = dest + output_size;
810
14.1M
        while (dest < dest_end) {
811
14.0M
            *dest++ = elem;
812
14.0M
        }
813
12.5k
    }
814
0
    else {
815
0
        PyObject **src = a->ob_item;
816
0
        PyObject **src_end = src + input_size;
817
0
        while (src < src_end) {
818
0
            _Py_RefcntAdd(*src, n);
819
0
            *dest++ = *src++;
820
0
        }
821
        // TODO: _Py_memory_repeat calls are not safe for shared lists in
822
        // GIL_DISABLED builds. (See issue #129069)
823
0
        _Py_memory_repeat((char *)np->ob_item, sizeof(PyObject *)*output_size,
824
0
                                        sizeof(PyObject *)*input_size);
825
0
    }
826
827
12.5k
    Py_SET_SIZE(np, output_size);
828
12.5k
    return (PyObject *) np;
829
12.5k
}
830
831
static PyObject *
832
list_repeat(PyObject *aa, Py_ssize_t n)
833
14.8k
{
834
14.8k
    PyObject *ret;
835
14.8k
    PyListObject *a = (PyListObject *)aa;
836
14.8k
    Py_BEGIN_CRITICAL_SECTION(a);
837
14.8k
    ret = list_repeat_lock_held(a, n);
838
14.8k
    Py_END_CRITICAL_SECTION();
839
14.8k
    return ret;
840
14.8k
}
841
842
static void
843
list_clear_impl(PyListObject *a, bool is_resize)
844
15.2M
{
845
15.2M
    PyObject **items = a->ob_item;
846
15.2M
    if (items == NULL) {
847
0
        return;
848
0
    }
849
850
    /* Because XDECREF can recursively invoke operations on
851
       this list, we make it empty first. */
852
15.2M
    Py_ssize_t i = Py_SIZE(a);
853
15.2M
    Py_SET_SIZE(a, 0);
854
15.2M
    FT_ATOMIC_STORE_PTR_RELEASE(a->ob_item, NULL);
855
15.2M
    a->allocated = 0;
856
30.6M
    while (--i >= 0) {
857
15.3M
        Py_XDECREF(items[i]);
858
15.3M
    }
859
#ifdef Py_GIL_DISABLED
860
    if (is_resize) {
861
        ensure_shared_on_resize(a);
862
    }
863
    bool use_qsbr = is_resize && _PyObject_GC_IS_SHARED(a);
864
#else
865
15.2M
    bool use_qsbr = false;
866
15.2M
#endif
867
15.2M
    free_list_items(items, use_qsbr);
868
    // Note that there is no guarantee that the list is actually empty
869
    // at this point, because XDECREF may have populated it indirectly again!
870
15.2M
}
871
872
static void
873
list_clear(PyListObject *a)
874
15.2M
{
875
15.2M
    list_clear_impl(a, true);
876
15.2M
}
877
878
static int
879
list_clear_slot(PyObject *self)
880
0
{
881
0
    list_clear_impl((PyListObject *)self, false);
882
0
    return 0;
883
0
}
884
885
/* a[ilow:ihigh] = v if v != NULL.
886
 * del a[ilow:ihigh] if v == NULL.
887
 *
888
 * Special speed gimmick:  when v is NULL and ihigh - ilow <= 8, it's
889
 * guaranteed the call cannot fail.
890
 */
891
static int
892
list_ass_slice_lock_held(PyListObject *a, Py_ssize_t ilow, Py_ssize_t ihigh, PyObject *v)
893
4.03M
{
894
    /* Because [X]DECREF can recursively invoke list operations on
895
       this list, we must postpone all [X]DECREF activity until
896
       after the list is back in its canonical shape.  Therefore
897
       we must allocate an additional array, 'recycle', into which
898
       we temporarily copy the items that are deleted from the
899
       list. :-( */
900
4.03M
    PyObject *recycle_on_stack[8];
901
4.03M
    PyObject **recycle = recycle_on_stack; /* will allocate more if needed */
902
4.03M
    PyObject **item;
903
4.03M
    PyObject **vitem = NULL;
904
4.03M
    PyObject *v_as_SF = NULL; /* PySequence_Fast(v) */
905
4.03M
    Py_ssize_t n; /* # of elements in replacement list */
906
4.03M
    Py_ssize_t norig; /* # of elements in list getting replaced */
907
4.03M
    Py_ssize_t d; /* Change in size */
908
4.03M
    Py_ssize_t k;
909
4.03M
    size_t s;
910
4.03M
    int result = -1;            /* guilty until proved innocent */
911
4.03M
#define b ((PyListObject *)v)
912
4.03M
    if (v == NULL)
913
3.77M
        n = 0;
914
252k
    else {
915
252k
        v_as_SF = PySequence_Fast(v, "can only assign an iterable");
916
252k
        if(v_as_SF == NULL)
917
0
            goto Error;
918
252k
        n = PySequence_Fast_GET_SIZE(v_as_SF);
919
252k
        vitem = PySequence_Fast_ITEMS(v_as_SF);
920
252k
    }
921
4.03M
    if (ilow < 0)
922
0
        ilow = 0;
923
4.03M
    else if (ilow > Py_SIZE(a))
924
0
        ilow = Py_SIZE(a);
925
926
4.03M
    if (ihigh < ilow)
927
0
        ihigh = ilow;
928
4.03M
    else if (ihigh > Py_SIZE(a))
929
0
        ihigh = Py_SIZE(a);
930
931
4.03M
    norig = ihigh - ilow;
932
4.03M
    assert(norig >= 0);
933
4.03M
    d = n - norig;
934
4.03M
    if (Py_SIZE(a) + d == 0) {
935
544k
        Py_XDECREF(v_as_SF);
936
544k
        list_clear(a);
937
544k
        return 0;
938
544k
    }
939
3.48M
    item = a->ob_item;
940
    /* recycle the items that we are about to remove */
941
3.48M
    s = norig * sizeof(PyObject *);
942
    /* If norig == 0, item might be NULL, in which case we may not memcpy from it. */
943
3.48M
    if (s) {
944
3.25M
        if (s > sizeof(recycle_on_stack)) {
945
121
            recycle = (PyObject **)PyMem_Malloc(s);
946
121
            if (recycle == NULL) {
947
0
                PyErr_NoMemory();
948
0
                goto Error;
949
0
            }
950
121
        }
951
3.25M
        memcpy(recycle, &item[ilow], s);
952
3.25M
    }
953
954
3.48M
    if (d < 0) { /* Delete -d items */
955
3.25M
        Py_ssize_t tail;
956
3.25M
        tail = (Py_SIZE(a) - ihigh) * sizeof(PyObject *);
957
        // TODO: these memmove/memcpy calls are not safe for shared lists in
958
        // GIL_DISABLED builds. (See issue #129069)
959
3.25M
        memmove(&item[ihigh+d], &item[ihigh], tail);
960
3.25M
        if (list_resize(a, Py_SIZE(a) + d) < 0) {
961
0
            memmove(&item[ihigh], &item[ihigh+d], tail);
962
0
            memcpy(&item[ilow], recycle, s);
963
0
            goto Error;
964
0
        }
965
3.25M
        item = a->ob_item;
966
3.25M
    }
967
235k
    else if (d > 0) { /* Insert d items */
968
235k
        k = Py_SIZE(a);
969
235k
        if (list_resize(a, k+d) < 0)
970
0
            goto Error;
971
235k
        item = a->ob_item;
972
        // TODO: these memmove/memcpy calls are not safe for shared lists in
973
        // GIL_DISABLED builds. (See issue #129069)
974
235k
        memmove(&item[ihigh+d], &item[ihigh],
975
235k
            (k - ihigh)*sizeof(PyObject *));
976
235k
    }
977
3.72M
    for (k = 0; k < n; k++, ilow++) {
978
236k
        PyObject *w = vitem[k];
979
236k
        FT_ATOMIC_STORE_PTR_RELEASE(item[ilow], Py_XNewRef(w));
980
236k
    }
981
6.74M
    for (k = norig - 1; k >= 0; --k)
982
3.25M
        Py_XDECREF(recycle[k]);
983
3.48M
    result = 0;
984
3.48M
 Error:
985
3.48M
    if (recycle != recycle_on_stack)
986
121
        PyMem_Free(recycle);
987
3.48M
    Py_XDECREF(v_as_SF);
988
3.48M
    return result;
989
3.48M
#undef b
990
3.48M
}
991
992
static int
993
list_ass_slice(PyListObject *a, Py_ssize_t ilow, Py_ssize_t ihigh, PyObject *v)
994
3.77M
{
995
3.77M
    int ret;
996
3.77M
    if (a == (PyListObject *)v) {
997
0
        Py_BEGIN_CRITICAL_SECTION(a);
998
0
        Py_ssize_t n = PyList_GET_SIZE(a);
999
0
        PyObject *copy = list_slice_lock_held(a, 0, n);
1000
0
        if (copy == NULL) {
1001
0
            ret = -1;
1002
0
        }
1003
0
        else {
1004
0
            ret = list_ass_slice_lock_held(a, ilow, ihigh, copy);
1005
0
            Py_DECREF(copy);
1006
0
        }
1007
0
        Py_END_CRITICAL_SECTION();
1008
0
    }
1009
3.77M
    else if (v != NULL && PyList_CheckExact(v)) {
1010
222
        Py_BEGIN_CRITICAL_SECTION2(a, v);
1011
222
        ret = list_ass_slice_lock_held(a, ilow, ihigh, v);
1012
222
        Py_END_CRITICAL_SECTION2();
1013
222
    }
1014
3.77M
    else {
1015
3.77M
        Py_BEGIN_CRITICAL_SECTION(a);
1016
3.77M
        ret = list_ass_slice_lock_held(a, ilow, ihigh, v);
1017
3.77M
        Py_END_CRITICAL_SECTION();
1018
3.77M
    }
1019
3.77M
    return ret;
1020
3.77M
}
1021
1022
int
1023
PyList_SetSlice(PyObject *a, Py_ssize_t ilow, Py_ssize_t ihigh, PyObject *v)
1024
3.77M
{
1025
3.77M
    if (!PyList_Check(a)) {
1026
0
        PyErr_BadInternalCall();
1027
0
        return -1;
1028
0
    }
1029
3.77M
    return list_ass_slice((PyListObject *)a, ilow, ihigh, v);
1030
3.77M
}
1031
1032
static int
1033
list_inplace_repeat_lock_held(PyListObject *self, Py_ssize_t n)
1034
0
{
1035
0
    Py_ssize_t input_size = PyList_GET_SIZE(self);
1036
0
    if (input_size == 0 || n == 1) {
1037
0
        return 0;
1038
0
    }
1039
1040
0
    if (n < 1) {
1041
0
        list_clear(self);
1042
0
        return 0;
1043
0
    }
1044
1045
0
    if (input_size > PY_SSIZE_T_MAX / n) {
1046
0
        PyErr_NoMemory();
1047
0
        return -1;
1048
0
    }
1049
0
    Py_ssize_t output_size = input_size * n;
1050
1051
0
    if (list_resize(self, output_size) < 0) {
1052
0
        return -1;
1053
0
    }
1054
1055
0
    PyObject **items = self->ob_item;
1056
0
    for (Py_ssize_t j = 0; j < input_size; j++) {
1057
0
        _Py_RefcntAdd(items[j], n-1);
1058
0
    }
1059
    // TODO: _Py_memory_repeat calls are not safe for shared lists in
1060
    // GIL_DISABLED builds. (See issue #129069)
1061
0
    _Py_memory_repeat((char *)items, sizeof(PyObject *)*output_size,
1062
0
                      sizeof(PyObject *)*input_size);
1063
0
    return 0;
1064
0
}
1065
1066
static PyObject *
1067
list_inplace_repeat(PyObject *_self, Py_ssize_t n)
1068
0
{
1069
0
    PyObject *ret;
1070
0
    PyListObject *self = (PyListObject *) _self;
1071
0
    Py_BEGIN_CRITICAL_SECTION(self);
1072
0
    if (list_inplace_repeat_lock_held(self, n) < 0) {
1073
0
        ret = NULL;
1074
0
    }
1075
0
    else {
1076
0
        ret = Py_NewRef(self);
1077
0
    }
1078
0
    Py_END_CRITICAL_SECTION();
1079
0
    return ret;
1080
0
}
1081
1082
static int
1083
list_ass_item_lock_held(PyListObject *a, Py_ssize_t i, PyObject *v)
1084
9.35k
{
1085
9.35k
    if (!valid_index(i, Py_SIZE(a))) {
1086
0
        PyErr_SetString(PyExc_IndexError,
1087
0
                        "list assignment index out of range");
1088
0
        return -1;
1089
0
    }
1090
9.35k
    PyObject *tmp = a->ob_item[i];
1091
9.35k
    if (v == NULL) {
1092
6.27k
        Py_ssize_t size = Py_SIZE(a);
1093
6.27k
        for (Py_ssize_t idx = i; idx < size - 1; idx++) {
1094
0
            FT_ATOMIC_STORE_PTR_RELAXED(a->ob_item[idx], a->ob_item[idx + 1]);
1095
0
        }
1096
6.27k
        Py_SET_SIZE(a, size - 1);
1097
6.27k
    }
1098
3.08k
    else {
1099
3.08k
        FT_ATOMIC_STORE_PTR_RELEASE(a->ob_item[i], Py_NewRef(v));
1100
3.08k
    }
1101
9.35k
    Py_DECREF(tmp);
1102
9.35k
    return 0;
1103
9.35k
}
1104
1105
static int
1106
list_ass_item(PyObject *aa, Py_ssize_t i, PyObject *v)
1107
6.17k
{
1108
6.17k
    int ret;
1109
6.17k
    PyListObject *a = (PyListObject *)aa;
1110
6.17k
    Py_BEGIN_CRITICAL_SECTION(a);
1111
6.17k
    ret = list_ass_item_lock_held(a, i, v);
1112
6.17k
    Py_END_CRITICAL_SECTION();
1113
6.17k
    return ret;
1114
6.17k
}
1115
1116
/*[clinic input]
1117
@critical_section
1118
list.insert
1119
1120
    index: Py_ssize_t
1121
    object: object
1122
    /
1123
1124
Insert object before index.
1125
[clinic start generated code]*/
1126
1127
static PyObject *
1128
list_insert_impl(PyListObject *self, Py_ssize_t index, PyObject *object)
1129
/*[clinic end generated code: output=7f35e32f60c8cb78 input=b1987ca998a4ae2d]*/
1130
60
{
1131
60
    if (ins1(self, index, object) == 0) {
1132
60
        Py_RETURN_NONE;
1133
60
    }
1134
0
    return NULL;
1135
60
}
1136
1137
/*[clinic input]
1138
@critical_section
1139
list.clear as py_list_clear
1140
1141
Remove all items from list.
1142
[clinic start generated code]*/
1143
1144
static PyObject *
1145
py_list_clear_impl(PyListObject *self)
1146
/*[clinic end generated code: output=83726743807e3518 input=e285b7f09051a9ba]*/
1147
171
{
1148
171
    list_clear(self);
1149
171
    Py_RETURN_NONE;
1150
171
}
1151
1152
/*[clinic input]
1153
@critical_section
1154
list.copy
1155
1156
Return a shallow copy of the list.
1157
[clinic start generated code]*/
1158
1159
static PyObject *
1160
list_copy_impl(PyListObject *self)
1161
/*[clinic end generated code: output=ec6b72d6209d418e input=81c54b0c7bb4f73d]*/
1162
0
{
1163
0
    return list_slice_lock_held(self, 0, Py_SIZE(self));
1164
0
}
1165
1166
/*[clinic input]
1167
@critical_section
1168
list.append
1169
1170
     object: object
1171
     /
1172
1173
Append object to the end of the list.
1174
[clinic start generated code]*/
1175
1176
static PyObject *
1177
list_append_impl(PyListObject *self, PyObject *object)
1178
/*[clinic end generated code: output=78423561d92ed405 input=122b0853de54004f]*/
1179
19.4M
{
1180
19.4M
    if (_PyList_AppendTakeRef(self, Py_NewRef(object)) < 0) {
1181
0
        return NULL;
1182
0
    }
1183
19.4M
    Py_RETURN_NONE;
1184
19.4M
}
1185
1186
static int
1187
list_extend_fast(PyListObject *self, PyObject *iterable)
1188
24.5M
{
1189
24.5M
    Py_ssize_t n = PySequence_Fast_GET_SIZE(iterable);
1190
24.5M
    if (n == 0) {
1191
        /* short circuit when iterable is empty */
1192
8.60M
        return 0;
1193
8.60M
    }
1194
1195
15.9M
    Py_ssize_t m = Py_SIZE(self);
1196
    // It should not be possible to allocate a list large enough to cause
1197
    // an overflow on any relevant platform.
1198
15.9M
    assert(m < PY_SSIZE_T_MAX - n);
1199
15.9M
    if (self->ob_item == NULL) {
1200
1.26M
        if (list_preallocate_exact(self, n) < 0) {
1201
0
            return -1;
1202
0
        }
1203
1.26M
        Py_SET_SIZE(self, n);
1204
1.26M
    }
1205
14.7M
    else if (list_resize(self, m + n) < 0) {
1206
0
        return -1;
1207
0
    }
1208
1209
    // note that we may still have self == iterable here for the
1210
    // situation a.extend(a), but the following code works
1211
    // in that case too.  Just make sure to resize self
1212
    // before calling PySequence_Fast_ITEMS.
1213
    //
1214
    // populate the end of self with iterable's items.
1215
15.9M
    PyObject **src = PySequence_Fast_ITEMS(iterable);
1216
15.9M
    PyObject **dest = self->ob_item + m;
1217
50.1M
    for (Py_ssize_t i = 0; i < n; i++) {
1218
34.2M
        PyObject *o = src[i];
1219
34.2M
        FT_ATOMIC_STORE_PTR_RELEASE(dest[i], Py_NewRef(o));
1220
34.2M
    }
1221
15.9M
    return 0;
1222
15.9M
}
1223
1224
static int
1225
list_extend_iter_lock_held(PyListObject *self, PyObject *iterable)
1226
5.61M
{
1227
5.61M
    PyObject *it = PyObject_GetIter(iterable);
1228
5.61M
    if (it == NULL) {
1229
0
        return -1;
1230
0
    }
1231
5.61M
    PyObject *(*iternext)(PyObject *) = *Py_TYPE(it)->tp_iternext;
1232
1233
    /* Guess a result list size. */
1234
5.61M
    Py_ssize_t n = PyObject_LengthHint(iterable, 8);
1235
5.61M
    if (n < 0) {
1236
0
        Py_DECREF(it);
1237
0
        return -1;
1238
0
    }
1239
1240
5.61M
    Py_ssize_t m = Py_SIZE(self);
1241
5.61M
    if (m > PY_SSIZE_T_MAX - n) {
1242
        /* m + n overflowed; on the chance that n lied, and there really
1243
         * is enough room, ignore it.  If n was telling the truth, we'll
1244
         * eventually run out of memory during the loop.
1245
         */
1246
0
    }
1247
5.61M
    else if (self->ob_item == NULL) {
1248
5.29M
        if (n && list_preallocate_exact(self, n) < 0)
1249
0
            goto error;
1250
5.29M
    }
1251
317k
    else {
1252
        /* Make room. */
1253
317k
        if (list_resize(self, m + n) < 0) {
1254
0
            goto error;
1255
0
        }
1256
1257
        /* Make the list sane again. */
1258
317k
        Py_SET_SIZE(self, m);
1259
317k
    }
1260
1261
    /* Run iterator to exhaustion. */
1262
71.8M
    for (;;) {
1263
71.8M
        PyObject *item = iternext(it);
1264
71.8M
        if (item == NULL) {
1265
5.61M
            if (PyErr_Occurred()) {
1266
639
                if (PyErr_ExceptionMatches(PyExc_StopIteration))
1267
0
                    PyErr_Clear();
1268
639
                else
1269
639
                    goto error;
1270
639
            }
1271
5.61M
            break;
1272
5.61M
        }
1273
1274
66.1M
        if (Py_SIZE(self) < self->allocated) {
1275
65.2M
            Py_ssize_t len = Py_SIZE(self);
1276
65.2M
            FT_ATOMIC_STORE_PTR_RELEASE(self->ob_item[len], item);  // steals item ref
1277
65.2M
            Py_SET_SIZE(self, len + 1);
1278
65.2M
        }
1279
996k
        else {
1280
996k
            if (_PyList_AppendTakeRef(self, item) < 0)
1281
0
                goto error;
1282
996k
        }
1283
66.1M
    }
1284
1285
    /* Cut back result list if initial guess was too large. */
1286
5.61M
    if (Py_SIZE(self) < self->allocated) {
1287
4.35M
        if (list_resize(self, Py_SIZE(self)) < 0)
1288
0
            goto error;
1289
4.35M
    }
1290
1291
5.61M
    Py_DECREF(it);
1292
5.61M
    return 0;
1293
1294
639
  error:
1295
639
    Py_DECREF(it);
1296
639
    return -1;
1297
5.61M
}
1298
1299
static int
1300
list_extend_lock_held(PyListObject *self, PyObject *iterable)
1301
24.5M
{
1302
24.5M
    PyObject *seq = PySequence_Fast(iterable, "argument must be iterable");
1303
24.5M
    if (!seq) {
1304
0
        return -1;
1305
0
    }
1306
1307
24.5M
    int res = list_extend_fast(self, seq);
1308
24.5M
    Py_DECREF(seq);
1309
24.5M
    return res;
1310
24.5M
}
1311
1312
static int
1313
list_extend_set(PyListObject *self, PySetObject *other)
1314
20.2k
{
1315
20.2k
    Py_ssize_t m = Py_SIZE(self);
1316
20.2k
    Py_ssize_t n = PySet_GET_SIZE(other);
1317
20.2k
    Py_ssize_t r = m + n;
1318
20.2k
    if (r == 0) {
1319
891
        return 0;
1320
891
    }
1321
19.4k
    if (list_resize(self, r) < 0) {
1322
0
        return -1;
1323
0
    }
1324
1325
19.4k
    assert(self->ob_item != NULL);
1326
    /* populate the end of self with iterable's items */
1327
19.4k
    Py_ssize_t setpos = 0;
1328
19.4k
    Py_hash_t hash;
1329
19.4k
    PyObject *key;
1330
19.4k
    PyObject **dest = self->ob_item + m;
1331
128k
    while (_PySet_NextEntryRef((PyObject *)other, &setpos, &key, &hash)) {
1332
109k
        FT_ATOMIC_STORE_PTR_RELEASE(*dest, key);
1333
109k
        dest++;
1334
109k
    }
1335
19.4k
    Py_SET_SIZE(self, r);
1336
19.4k
    return 0;
1337
19.4k
}
1338
1339
static int
1340
list_extend_dict(PyListObject *self, PyDictObject *dict, int which_item)
1341
311
{
1342
    // which_item: 0 for keys and 1 for values
1343
311
    Py_ssize_t m = Py_SIZE(self);
1344
311
    Py_ssize_t n = PyDict_GET_SIZE(dict);
1345
311
    Py_ssize_t r = m + n;
1346
311
    if (r == 0) {
1347
0
        return 0;
1348
0
    }
1349
311
    if (list_resize(self, r) < 0) {
1350
0
        return -1;
1351
0
    }
1352
1353
311
    assert(self->ob_item != NULL);
1354
311
    PyObject **dest = self->ob_item + m;
1355
311
    Py_ssize_t pos = 0;
1356
311
    PyObject *keyvalue[2];
1357
1.69k
    while (_PyDict_Next((PyObject *)dict, &pos, &keyvalue[0], &keyvalue[1], NULL)) {
1358
1.38k
        PyObject *obj = keyvalue[which_item];
1359
1.38k
        Py_INCREF(obj);
1360
1.38k
        FT_ATOMIC_STORE_PTR_RELEASE(*dest, obj);
1361
1.38k
        dest++;
1362
1.38k
    }
1363
1364
311
    Py_SET_SIZE(self, r);
1365
311
    return 0;
1366
311
}
1367
1368
static int
1369
list_extend_dictitems(PyListObject *self, PyDictObject *dict)
1370
0
{
1371
0
    Py_ssize_t m = Py_SIZE(self);
1372
0
    Py_ssize_t n = PyDict_GET_SIZE(dict);
1373
0
    Py_ssize_t r = m + n;
1374
0
    if (r == 0) {
1375
0
        return 0;
1376
0
    }
1377
0
    if (list_resize(self, r) < 0) {
1378
0
        return -1;
1379
0
    }
1380
1381
0
    assert(self->ob_item != NULL);
1382
0
    PyObject **dest = self->ob_item + m;
1383
0
    Py_ssize_t pos = 0;
1384
0
    Py_ssize_t i = 0;
1385
0
    PyObject *key, *value;
1386
0
    while (_PyDict_Next((PyObject *)dict, &pos, &key, &value, NULL)) {
1387
0
        PyObject *item = PyTuple_Pack(2, key, value);
1388
0
        if (item == NULL) {
1389
0
            Py_SET_SIZE(self, m + i);
1390
0
            return -1;
1391
0
        }
1392
0
        FT_ATOMIC_STORE_PTR_RELEASE(*dest, item);
1393
0
        dest++;
1394
0
        i++;
1395
0
    }
1396
1397
0
    Py_SET_SIZE(self, r);
1398
0
    return 0;
1399
0
}
1400
1401
static int
1402
_list_extend(PyListObject *self, PyObject *iterable)
1403
30.2M
{
1404
    // Special case:
1405
    // lists and tuples which can use PySequence_Fast ops
1406
30.2M
    int res = -1;
1407
30.2M
    if ((PyObject *)self == iterable) {
1408
0
        Py_BEGIN_CRITICAL_SECTION(self);
1409
0
        res = list_inplace_repeat_lock_held(self, 2);
1410
0
        Py_END_CRITICAL_SECTION();
1411
0
    }
1412
30.2M
    else if (PyList_CheckExact(iterable)) {
1413
9.84M
        Py_BEGIN_CRITICAL_SECTION2(self, iterable);
1414
9.84M
        res = list_extend_lock_held(self, iterable);
1415
9.84M
        Py_END_CRITICAL_SECTION2();
1416
9.84M
    }
1417
20.3M
    else if (PyTuple_CheckExact(iterable)) {
1418
14.7M
        Py_BEGIN_CRITICAL_SECTION(self);
1419
14.7M
        res = list_extend_lock_held(self, iterable);
1420
14.7M
        Py_END_CRITICAL_SECTION();
1421
14.7M
    }
1422
5.63M
    else if (PyAnySet_CheckExact(iterable)) {
1423
20.2k
        Py_BEGIN_CRITICAL_SECTION2(self, iterable);
1424
20.2k
        res = list_extend_set(self, (PySetObject *)iterable);
1425
20.2k
        Py_END_CRITICAL_SECTION2();
1426
20.2k
    }
1427
5.61M
    else if (PyDict_CheckExact(iterable)) {
1428
309
        Py_BEGIN_CRITICAL_SECTION2(self, iterable);
1429
309
        res = list_extend_dict(self, (PyDictObject *)iterable, 0 /*keys*/);
1430
309
        Py_END_CRITICAL_SECTION2();
1431
309
    }
1432
5.61M
    else if (Py_IS_TYPE(iterable, &PyDictKeys_Type)) {
1433
0
        PyDictObject *dict = ((_PyDictViewObject *)iterable)->dv_dict;
1434
0
        Py_BEGIN_CRITICAL_SECTION2(self, dict);
1435
0
        res = list_extend_dict(self, dict, 0 /*keys*/);
1436
0
        Py_END_CRITICAL_SECTION2();
1437
0
    }
1438
5.61M
    else if (Py_IS_TYPE(iterable, &PyDictValues_Type)) {
1439
2
        PyDictObject *dict = ((_PyDictViewObject *)iterable)->dv_dict;
1440
2
        Py_BEGIN_CRITICAL_SECTION2(self, dict);
1441
2
        res = list_extend_dict(self, dict, 1 /*values*/);
1442
2
        Py_END_CRITICAL_SECTION2();
1443
2
    }
1444
5.61M
    else if (Py_IS_TYPE(iterable, &PyDictItems_Type)) {
1445
0
        PyDictObject *dict = ((_PyDictViewObject *)iterable)->dv_dict;
1446
0
        Py_BEGIN_CRITICAL_SECTION2(self, dict);
1447
0
        res = list_extend_dictitems(self, dict);
1448
0
        Py_END_CRITICAL_SECTION2();
1449
0
    }
1450
5.61M
    else {
1451
5.61M
        Py_BEGIN_CRITICAL_SECTION(self);
1452
5.61M
        res = list_extend_iter_lock_held(self, iterable);
1453
5.61M
        Py_END_CRITICAL_SECTION();
1454
5.61M
    }
1455
30.2M
    return res;
1456
30.2M
}
1457
1458
/*[clinic input]
1459
list.extend as list_extend
1460
1461
     iterable: object
1462
     /
1463
1464
Extend list by appending elements from the iterable.
1465
[clinic start generated code]*/
1466
1467
static PyObject *
1468
list_extend_impl(PyListObject *self, PyObject *iterable)
1469
/*[clinic end generated code: output=b0eba9e0b186d5ce input=979da7597a515791]*/
1470
21.2M
{
1471
21.2M
    if (_list_extend(self, iterable) < 0) {
1472
639
        return NULL;
1473
639
    }
1474
21.2M
    Py_RETURN_NONE;
1475
21.2M
}
1476
1477
PyObject *
1478
_PyList_Extend(PyListObject *self, PyObject *iterable)
1479
19.8M
{
1480
19.8M
    return list_extend((PyObject*)self, iterable);
1481
19.8M
}
1482
1483
int
1484
PyList_Extend(PyObject *self, PyObject *iterable)
1485
0
{
1486
0
    if (!PyList_Check(self)) {
1487
0
        PyErr_BadInternalCall();
1488
0
        return -1;
1489
0
    }
1490
0
    return _list_extend((PyListObject*)self, iterable);
1491
0
}
1492
1493
1494
int
1495
PyList_Clear(PyObject *self)
1496
0
{
1497
0
    if (!PyList_Check(self)) {
1498
0
        PyErr_BadInternalCall();
1499
0
        return -1;
1500
0
    }
1501
0
    Py_BEGIN_CRITICAL_SECTION(self);
1502
0
    list_clear((PyListObject*)self);
1503
0
    Py_END_CRITICAL_SECTION();
1504
0
    return 0;
1505
0
}
1506
1507
1508
static PyObject *
1509
list_inplace_concat(PyObject *_self, PyObject *other)
1510
422
{
1511
422
    PyListObject *self = (PyListObject *)_self;
1512
422
    if (_list_extend(self, other) < 0) {
1513
0
        return NULL;
1514
0
    }
1515
422
    return Py_NewRef(self);
1516
422
}
1517
1518
/*[clinic input]
1519
@critical_section
1520
list.pop
1521
1522
    index: Py_ssize_t = -1
1523
    /
1524
1525
Remove and return item at index (default last).
1526
1527
Raises IndexError if list is empty or index is out of range.
1528
[clinic start generated code]*/
1529
1530
static PyObject *
1531
list_pop_impl(PyListObject *self, Py_ssize_t index)
1532
/*[clinic end generated code: output=6bd69dcb3f17eca8 input=c269141068ae4b8f]*/
1533
36.3M
{
1534
36.3M
    PyObject *v;
1535
36.3M
    int status;
1536
1537
36.3M
    if (Py_SIZE(self) == 0) {
1538
        /* Special-case most common failure cause */
1539
0
        PyErr_SetString(PyExc_IndexError, "pop from empty list");
1540
0
        return NULL;
1541
0
    }
1542
36.3M
    if (index < 0)
1543
13.9M
        index += Py_SIZE(self);
1544
36.3M
    if (!valid_index(index, Py_SIZE(self))) {
1545
0
        PyErr_SetString(PyExc_IndexError, "pop index out of range");
1546
0
        return NULL;
1547
0
    }
1548
1549
36.3M
    PyObject **items = self->ob_item;
1550
36.3M
    v = items[index];
1551
36.3M
    const Py_ssize_t size_after_pop = Py_SIZE(self) - 1;
1552
36.3M
    if (size_after_pop == 0) {
1553
14.7M
        Py_INCREF(v);
1554
14.7M
        list_clear(self);
1555
14.7M
        status = 0;
1556
14.7M
    }
1557
21.6M
    else {
1558
21.6M
        if ((size_after_pop - index) > 0) {
1559
14.1M
            memmove(&items[index], &items[index+1], (size_after_pop - index) * sizeof(PyObject *));
1560
14.1M
        }
1561
21.6M
        status = list_resize(self, size_after_pop);
1562
21.6M
    }
1563
36.3M
    if (status >= 0) {
1564
36.3M
        return v; // and v now owns the reference the list had
1565
36.3M
    }
1566
0
    else {
1567
        // list resize failed, need to restore
1568
0
        memmove(&items[index+1], &items[index], (size_after_pop - index)* sizeof(PyObject *));
1569
0
        items[index] = v;
1570
0
        return NULL;
1571
0
    }
1572
36.3M
}
1573
1574
/* Reverse a slice of a list in place, from lo up to (exclusive) hi. */
1575
static void
1576
reverse_slice(PyObject **lo, PyObject **hi)
1577
99.1k
{
1578
99.1k
    assert(lo && hi);
1579
1580
99.1k
    --hi;
1581
428k
    while (lo < hi) {
1582
329k
        PyObject *t = *lo;
1583
329k
        *lo = *hi;
1584
329k
        *hi = t;
1585
329k
        ++lo;
1586
329k
        --hi;
1587
329k
    }
1588
99.1k
}
1589
1590
/* Lots of code for an adaptive, stable, natural mergesort.  There are many
1591
 * pieces to this algorithm; read listsort.txt for overviews and details.
1592
 */
1593
1594
/* A sortslice contains a pointer to an array of keys and a pointer to
1595
 * an array of corresponding values.  In other words, keys[i]
1596
 * corresponds with values[i].  If values == NULL, then the keys are
1597
 * also the values.
1598
 *
1599
 * Several convenience routines are provided here, so that keys and
1600
 * values are always moved in sync.
1601
 */
1602
1603
typedef struct {
1604
    PyObject **keys;
1605
    PyObject **values;
1606
} sortslice;
1607
1608
Py_LOCAL_INLINE(void)
1609
sortslice_copy(sortslice *s1, Py_ssize_t i, sortslice *s2, Py_ssize_t j)
1610
33.8k
{
1611
33.8k
    s1->keys[i] = s2->keys[j];
1612
33.8k
    if (s1->values != NULL)
1613
32.7k
        s1->values[i] = s2->values[j];
1614
33.8k
}
1615
1616
Py_LOCAL_INLINE(void)
1617
sortslice_copy_incr(sortslice *dst, sortslice *src)
1618
540k
{
1619
540k
    *dst->keys++ = *src->keys++;
1620
540k
    if (dst->values != NULL)
1621
310k
        *dst->values++ = *src->values++;
1622
540k
}
1623
1624
Py_LOCAL_INLINE(void)
1625
sortslice_copy_decr(sortslice *dst, sortslice *src)
1626
289k
{
1627
289k
    *dst->keys-- = *src->keys--;
1628
289k
    if (dst->values != NULL)
1629
214k
        *dst->values-- = *src->values--;
1630
289k
}
1631
1632
1633
Py_LOCAL_INLINE(void)
1634
sortslice_memcpy(sortslice *s1, Py_ssize_t i, sortslice *s2, Py_ssize_t j,
1635
                 Py_ssize_t n)
1636
192k
{
1637
192k
    memcpy(&s1->keys[i], &s2->keys[j], sizeof(PyObject *) * n);
1638
192k
    if (s1->values != NULL)
1639
156k
        memcpy(&s1->values[i], &s2->values[j], sizeof(PyObject *) * n);
1640
192k
}
1641
1642
Py_LOCAL_INLINE(void)
1643
sortslice_memmove(sortslice *s1, Py_ssize_t i, sortslice *s2, Py_ssize_t j,
1644
                  Py_ssize_t n)
1645
130k
{
1646
130k
    memmove(&s1->keys[i], &s2->keys[j], sizeof(PyObject *) * n);
1647
130k
    if (s1->values != NULL)
1648
103k
        memmove(&s1->values[i], &s2->values[j], sizeof(PyObject *) * n);
1649
130k
}
1650
1651
Py_LOCAL_INLINE(void)
1652
sortslice_advance(sortslice *slice, Py_ssize_t n)
1653
776k
{
1654
776k
    slice->keys += n;
1655
776k
    if (slice->values != NULL)
1656
564k
        slice->values += n;
1657
776k
}
1658
1659
/* Comparison function: ms->key_compare, which is set at run-time in
1660
 * listsort_impl to optimize for various special cases.
1661
 * Returns -1 on error, 1 if x < y, 0 if x >= y.
1662
 */
1663
1664
14.6M
#define ISLT(X, Y) (*(ms->key_compare))(X, Y, ms)
1665
1666
/* Compare X to Y via "<".  Goto "fail" if the comparison raises an
1667
   error.  Else "k" is set to true iff X<Y, and an "if (k)" block is
1668
   started.  It makes more sense in context <wink>.  X and Y are PyObject*s.
1669
*/
1670
14.1M
#define IFLT(X, Y) if ((k = ISLT(X, Y)) < 0) goto fail;  \
1671
14.1M
           if (k)
1672
1673
/* The maximum number of entries in a MergeState's pending-runs stack.
1674
 * For a list with n elements, this needs at most floor(log2(n)) + 1 entries
1675
 * even if we didn't force runs to a minimal length.  So the number of bits
1676
 * in a Py_ssize_t is plenty large enough for all cases.
1677
 */
1678
#define MAX_MERGE_PENDING (SIZEOF_SIZE_T * 8)
1679
1680
/* When we get into galloping mode, we stay there until both runs win less
1681
 * often than MIN_GALLOP consecutive times.  See listsort.txt for more info.
1682
 */
1683
982k
#define MIN_GALLOP 7
1684
1685
/* Avoid malloc for small temp arrays. */
1686
1.85M
#define MERGESTATE_TEMP_SIZE 256
1687
1688
/* The largest value of minrun. This must be a power of 2, and >= 1 */
1689
798k
#define MAX_MINRUN 64
1690
#if ((MAX_MINRUN) < 1) || ((MAX_MINRUN) & ((MAX_MINRUN) - 1))
1691
#error "MAX_MINRUN must be a power of 2, and >= 1"
1692
#endif
1693
1694
/* One MergeState exists on the stack per invocation of mergesort.  It's just
1695
 * a convenient way to pass state around among the helper functions.
1696
 */
1697
struct s_slice {
1698
    sortslice base;
1699
    Py_ssize_t len;   /* length of run */
1700
    int power; /* node "level" for powersort merge strategy */
1701
};
1702
1703
typedef struct s_MergeState MergeState;
1704
struct s_MergeState {
1705
    /* This controls when we get *into* galloping mode.  It's initialized
1706
     * to MIN_GALLOP.  merge_lo and merge_hi tend to nudge it higher for
1707
     * random data, and lower for highly structured data.
1708
     */
1709
    Py_ssize_t min_gallop;
1710
1711
    Py_ssize_t listlen;     /* len(input_list) - read only */
1712
    PyObject **basekeys;    /* base address of keys array - read only */
1713
1714
    /* 'a' is temp storage to help with merges.  It contains room for
1715
     * alloced entries.
1716
     */
1717
    sortslice a;        /* may point to temparray below */
1718
    Py_ssize_t alloced;
1719
1720
    /* A stack of n pending runs yet to be merged.  Run #i starts at
1721
     * address base[i] and extends for len[i] elements.  It's always
1722
     * true (so long as the indices are in bounds) that
1723
     *
1724
     *     pending[i].base + pending[i].len == pending[i+1].base
1725
     *
1726
     * so we could cut the storage for this, but it's a minor amount,
1727
     * and keeping all the info explicit simplifies the code.
1728
     */
1729
    int n;
1730
    struct s_slice pending[MAX_MERGE_PENDING];
1731
1732
    /* 'a' points to this when possible, rather than muck with malloc. */
1733
    PyObject *temparray[MERGESTATE_TEMP_SIZE];
1734
1735
    /* This is the function we will use to compare two keys,
1736
     * even when none of our special cases apply and we have to use
1737
     * safe_object_compare. */
1738
    int (*key_compare)(PyObject *, PyObject *, MergeState *);
1739
1740
    /* This function is used by unsafe_object_compare to optimize comparisons
1741
     * when we know our list is type-homogeneous but we can't assume anything else.
1742
     * In the pre-sort check it is set equal to Py_TYPE(key)->tp_richcompare */
1743
    PyObject *(*key_richcompare)(PyObject *, PyObject *, int);
1744
1745
    /* This function is used by unsafe_tuple_compare to compare the first elements
1746
     * of tuples. It may be set to safe_object_compare, but the idea is that hopefully
1747
     * we can assume more, and use one of the special-case compares. */
1748
    int (*tuple_elem_compare)(PyObject *, PyObject *, MergeState *);
1749
1750
    /* Varisbles used for minrun computation. The "ideal" minrun length is
1751
     * the infinite precision listlen / 2**e. See listsort.txt.
1752
     */
1753
     Py_ssize_t mr_current, mr_e, mr_mask;
1754
};
1755
1756
/* binarysort is the best method for sorting small arrays: it does few
1757
   compares, but can do data movement quadratic in the number of elements.
1758
   ss->keys is viewed as an array of n kays, a[:n]. a[:ok] is already sorted.
1759
   Pass ok = 0 (or 1) if you don't know.
1760
   It's sorted in-place, by a stable binary insertion sort. If ss->values
1761
   isn't NULL, it's permuted in lockstap with ss->keys.
1762
   On entry, must have n >= 1, and 0 <= ok <= n <= MAX_MINRUN.
1763
   Return -1 if comparison raises an exception, else 0.
1764
   Even in case of error, the output slice will be some permutation of
1765
   the input (nothing is lost or duplicated).
1766
*/
1767
static int
1768
binarysort(MergeState *ms, const sortslice *ss, Py_ssize_t n, Py_ssize_t ok)
1769
132k
{
1770
132k
    Py_ssize_t k; /* for IFLT macro expansion */
1771
132k
    PyObject ** const a = ss->keys;
1772
132k
    PyObject ** const v = ss->values;
1773
132k
    const bool has_values = v != NULL;
1774
132k
    PyObject *pivot;
1775
132k
    Py_ssize_t M;
1776
1777
132k
    assert(0 <= ok && ok <= n && 1 <= n && n <= MAX_MINRUN);
1778
    /* assert a[:ok] is sorted */
1779
132k
    if (! ok)
1780
0
        ++ok;
1781
    /* Regular insertion sort has average- and worst-case O(n**2) cost
1782
       for both # of comparisons and number of bytes moved. But its branches
1783
       are highly predictable, and it loves sorted input (n-1 compares and no
1784
       data movement). This is significant in cases like sortperf.py's %sort,
1785
       where an out-of-order element near the start of a run is moved into
1786
       place slowly but then the remaining elements up to length minrun are
1787
       generally at worst one slot away from their correct position (so only
1788
       need 1 or 2 commpares to resolve). If comparisons are very fast (such
1789
       as for a list of Python floats), the simple inner loop leaves it
1790
       very competitive with binary insertion, despite that it does
1791
       significantly more compares overall on random data.
1792
1793
       Binary insertion sort has worst, average, and best case O(n log n)
1794
       cost for # of comparisons, but worst and average case O(n**2) cost
1795
       for data movement. The more expensive comparisons, the more important
1796
       the comparison advantage. But its branches are less predictable the
1797
       more "randomish" the data, and that's so significant its worst case
1798
       in real life is random input rather than reverse-ordered (which does
1799
       about twice the data movement than random input does).
1800
1801
       Note that the number of bytes moved doesn't seem to matter. MAX_MINRUN
1802
       of 64 is so small that the key and value pointers all fit in a corner
1803
       of L1 cache, and moving things around in that is very fast. */
1804
#if 0 // ordinary insertion sort.
1805
    PyObject * vpivot = NULL;
1806
    for (; ok < n; ++ok) {
1807
        pivot = a[ok];
1808
        if (has_values)
1809
            vpivot = v[ok];
1810
        for (M = ok - 1; M >= 0; --M) {
1811
            k = ISLT(pivot, a[M]);
1812
            if (k < 0) {
1813
                a[M + 1] = pivot;
1814
                if (has_values)
1815
                    v[M + 1] = vpivot;
1816
                goto fail;
1817
            }
1818
            else if (k) {
1819
                a[M + 1] = a[M];
1820
                if (has_values)
1821
                    v[M + 1] = v[M];
1822
            }
1823
            else
1824
                break;
1825
        }
1826
        a[M + 1] = pivot;
1827
        if (has_values)
1828
            v[M + 1] = vpivot;
1829
    }
1830
#else // binary insertion sort
1831
132k
    Py_ssize_t L, R;
1832
2.13M
    for (; ok < n; ++ok) {
1833
        /* set L to where a[ok] belongs */
1834
1.99M
        L = 0;
1835
1.99M
        R = ok;
1836
1.99M
        pivot = a[ok];
1837
        /* Slice invariants. vacuously true at the start:
1838
         * all a[0:L]  <= pivot
1839
         * all a[L:R]     unknown
1840
         * all a[R:ok]  > pivot
1841
         */
1842
1.99M
        assert(L < R);
1843
8.42M
        do {
1844
            /* don't do silly ;-) things to prevent overflow when finding
1845
               the midpoint; L and R are very far from filling a Py_ssize_t */
1846
8.42M
            M = (L + R) >> 1;
1847
8.42M
#if 1 // straightforward, but highly unpredictable branch on random data
1848
8.42M
            IFLT(pivot, a[M])
1849
3.48M
                R = M;
1850
4.93M
            else
1851
4.93M
                L = M + 1;
1852
#else
1853
            /* Try to get compiler to generate conditional move instructions
1854
               instead. Works fine, but leaving it disabled for now because
1855
               it's not yielding consistently faster sorts. Needs more
1856
               investigation. More computation in the inner loop adds its own
1857
               costs, which can be significant when compares are fast. */
1858
            k = ISLT(pivot, a[M]);
1859
            if (k < 0)
1860
                goto fail;
1861
            Py_ssize_t Mp1 = M + 1;
1862
            R = k ? M : R;
1863
            L = k ? L : Mp1;
1864
#endif
1865
8.42M
        } while (L < R);
1866
1.99M
        assert(L == R);
1867
        /* a[:L] holds all elements from a[:ok] <= pivot now, so pivot belongs
1868
           at index L. Slide a[L:ok] to the right a slot to make room for it.
1869
           Caution: using memmove is much slower under MSVC 5; we're not
1870
           usually moving many slots. Years later: under Visual Studio 2022,
1871
           memmove seems just slightly slower than doing it "by hand". */
1872
14.5M
        for (M = ok; M > L; --M)
1873
12.5M
            a[M] = a[M - 1];
1874
1.99M
        a[L] = pivot;
1875
1.99M
        if (has_values) {
1876
1.40M
            pivot = v[ok];
1877
6.94M
            for (M = ok; M > L; --M)
1878
5.54M
                v[M] = v[M - 1];
1879
1.40M
            v[L] = pivot;
1880
1.40M
        }
1881
1.99M
    }
1882
132k
#endif // pick binary or regular insertion sort
1883
132k
    return 0;
1884
1885
0
 fail:
1886
0
    return -1;
1887
132k
}
1888
1889
static void
1890
sortslice_reverse(sortslice *s, Py_ssize_t n)
1891
61.4k
{
1892
61.4k
    reverse_slice(s->keys, &s->keys[n]);
1893
61.4k
    if (s->values != NULL)
1894
37.6k
        reverse_slice(s->values, &s->values[n]);
1895
61.4k
}
1896
1897
/*
1898
Return the length of the run beginning at slo->keys, spanning no more than
1899
nremaining elements. The run beginning there may be ascending or descending,
1900
but the function permutes it in place, if needed, so that it's always ascending
1901
upon return.
1902
1903
Returns -1 in case of error.
1904
*/
1905
static Py_ssize_t
1906
count_run(MergeState *ms, sortslice *slo, Py_ssize_t nremaining)
1907
267k
{
1908
267k
    Py_ssize_t k; /* used by IFLT macro expansion */
1909
267k
    Py_ssize_t n;
1910
267k
    PyObject ** const lo = slo->keys;
1911
1912
    /* In general, as things go on we've established that the slice starts
1913
       with a monotone run of n elements, starting at lo. */
1914
1915
    /* We're n elements into the slice, and the most recent neq+1 elements are
1916
     * all equal. This reverses them in-place, and resets neq for reuse.
1917
     */
1918
267k
#define REVERSE_LAST_NEQ                        \
1919
267k
    if (neq) {                                  \
1920
5.20k
        sortslice slice = *slo;                 \
1921
5.20k
        ++neq;                                  \
1922
5.20k
        sortslice_advance(&slice, n - neq);     \
1923
5.20k
        sortslice_reverse(&slice, neq);         \
1924
5.20k
        neq = 0;                                \
1925
5.20k
    }
1926
1927
    /* Sticking to only __lt__ compares is confusing and error-prone. But in
1928
     * this routine, almost all uses of IFLT can be captured by tiny macros
1929
     * giving mnemonic names to the intent. Note that inline functions don't
1930
     * work for this (IFLT expands to code including `goto fail`).
1931
     */
1932
267k
#define IF_NEXT_LARGER  IFLT(lo[n-1], lo[n])
1933
3.38M
#define IF_NEXT_SMALLER IFLT(lo[n], lo[n-1])
1934
1935
267k
    assert(nremaining);
1936
    /* try ascending run first */
1937
2.94M
    for (n = 1; n < nremaining; ++n) {
1938
2.84M
        IF_NEXT_SMALLER
1939
173k
            break;
1940
2.84M
    }
1941
267k
    if (n == nremaining)
1942
94.4k
        return n;
1943
    /* lo[n] is strictly less */
1944
    /* If n is 1 now, then the first compare established it's a descending
1945
     * run, so fall through to the descending case. But if n > 1, there are
1946
     * n elements in an ascending run terminated by the strictly less lo[n].
1947
     * If the first key < lo[n-1], *somewhere* along the way the sequence
1948
     * increased, so we're done (there is no descending run).
1949
     * Else first key >= lo[n-1], which implies that the entire ascending run
1950
     * consists of equal elements. In that case, this is a descending run,
1951
     * and we reverse the all-equal prefix in-place.
1952
     */
1953
173k
    if (n > 1) {
1954
127k
        IFLT(lo[0], lo[n-1])
1955
122k
            return n;
1956
5.10k
        sortslice_reverse(slo, n);
1957
5.10k
    }
1958
51.1k
    ++n; /* in all cases it's been established that lo[n] has been resolved */
1959
1960
    /* Finish descending run. All-squal subruns are reversed in-place on the
1961
     * fly. Their original order will be restored at the end by the whole-slice
1962
     * reversal.
1963
     */
1964
51.1k
    Py_ssize_t neq = 0;
1965
86.1k
    for ( ; n < nremaining; ++n) {
1966
67.4k
        IF_NEXT_SMALLER {
1967
            /* This ends the most recent run of equal elements, but still in
1968
             * the "descending" direction.
1969
             */
1970
12.9k
            REVERSE_LAST_NEQ
1971
12.9k
        }
1972
54.5k
        else {
1973
54.5k
            IF_NEXT_LARGER /* descending run is over */
1974
32.4k
                break;
1975
22.0k
            else /* not x < y and not y < x implies x == y */
1976
22.0k
                ++neq;
1977
54.5k
        }
1978
67.4k
    }
1979
51.1k
    REVERSE_LAST_NEQ
1980
51.1k
    sortslice_reverse(slo, n); /* transform to ascending run */
1981
1982
    /* And after reversing, it's possible this can be extended by a
1983
     * naturally increasing suffix; e.g., [3, 2, 3, 4, 1] makes an
1984
     * ascending run from the first 4 elements.
1985
     */
1986
490k
    for ( ; n < nremaining; ++n) {
1987
470k
        IF_NEXT_SMALLER
1988
30.8k
            break;
1989
470k
    }
1990
1991
51.1k
    return n;
1992
0
fail:
1993
0
    return -1;
1994
1995
51.1k
#undef REVERSE_LAST_NEQ
1996
51.1k
#undef IF_NEXT_SMALLER
1997
51.1k
#undef IF_NEXT_LARGER
1998
51.1k
}
1999
2000
/*
2001
Locate the proper position of key in a sorted vector; if the vector contains
2002
an element equal to key, return the position immediately to the left of
2003
the leftmost equal element.  [gallop_right() does the same except returns
2004
the position to the right of the rightmost equal element (if any).]
2005
2006
"a" is a sorted vector with n elements, starting at a[0].  n must be > 0.
2007
2008
"hint" is an index at which to begin the search, 0 <= hint < n.  The closer
2009
hint is to the final result, the faster this runs.
2010
2011
The return value is the int k in 0..n such that
2012
2013
    a[k-1] < key <= a[k]
2014
2015
pretending that *(a-1) is minus infinity and a[n] is plus infinity.  IOW,
2016
key belongs at index k; or, IOW, the first k elements of a should precede
2017
key, and the last n-k should follow key.
2018
2019
Returns -1 on error.  See listsort.txt for info on the method.
2020
*/
2021
static Py_ssize_t
2022
gallop_left(MergeState *ms, PyObject *key, PyObject **a, Py_ssize_t n, Py_ssize_t hint)
2023
182k
{
2024
182k
    Py_ssize_t ofs;
2025
182k
    Py_ssize_t lastofs;
2026
182k
    Py_ssize_t k;
2027
2028
182k
    assert(key && a && n > 0 && hint >= 0 && hint < n);
2029
2030
182k
    a += hint;
2031
182k
    lastofs = 0;
2032
182k
    ofs = 1;
2033
182k
    IFLT(*a, key) {
2034
        /* a[hint] < key -- gallop right, until
2035
         * a[hint + lastofs] < key <= a[hint + ofs]
2036
         */
2037
104k
        const Py_ssize_t maxofs = n - hint;             /* &a[n-1] is highest */
2038
357k
        while (ofs < maxofs) {
2039
282k
            IFLT(a[ofs], key) {
2040
252k
                lastofs = ofs;
2041
252k
                assert(ofs <= (PY_SSIZE_T_MAX - 1) / 2);
2042
252k
                ofs = (ofs << 1) + 1;
2043
252k
            }
2044
30.0k
            else                /* key <= a[hint + ofs] */
2045
30.0k
                break;
2046
282k
        }
2047
104k
        if (ofs > maxofs)
2048
32.8k
            ofs = maxofs;
2049
        /* Translate back to offsets relative to &a[0]. */
2050
104k
        lastofs += hint;
2051
104k
        ofs += hint;
2052
104k
    }
2053
77.9k
    else {
2054
        /* key <= a[hint] -- gallop left, until
2055
         * a[hint - ofs] < key <= a[hint - lastofs]
2056
         */
2057
77.9k
        const Py_ssize_t maxofs = hint + 1;             /* &a[0] is lowest */
2058
261k
        while (ofs < maxofs) {
2059
235k
            IFLT(*(a-ofs), key)
2060
52.4k
                break;
2061
            /* key <= a[hint - ofs] */
2062
183k
            lastofs = ofs;
2063
183k
            assert(ofs <= (PY_SSIZE_T_MAX - 1) / 2);
2064
183k
            ofs = (ofs << 1) + 1;
2065
183k
        }
2066
77.9k
        if (ofs > maxofs)
2067
19.2k
            ofs = maxofs;
2068
        /* Translate back to positive offsets relative to &a[0]. */
2069
77.9k
        k = lastofs;
2070
77.9k
        lastofs = hint - ofs;
2071
77.9k
        ofs = hint - k;
2072
77.9k
    }
2073
182k
    a -= hint;
2074
2075
182k
    assert(-1 <= lastofs && lastofs < ofs && ofs <= n);
2076
    /* Now a[lastofs] < key <= a[ofs], so key belongs somewhere to the
2077
     * right of lastofs but no farther right than ofs.  Do a binary
2078
     * search, with invariant a[lastofs-1] < key <= a[ofs].
2079
     */
2080
182k
    ++lastofs;
2081
549k
    while (lastofs < ofs) {
2082
367k
        Py_ssize_t m = lastofs + ((ofs - lastofs) >> 1);
2083
2084
367k
        IFLT(a[m], key)
2085
190k
            lastofs = m+1;              /* a[m] < key */
2086
176k
        else
2087
176k
            ofs = m;                    /* key <= a[m] */
2088
367k
    }
2089
182k
    assert(lastofs == ofs);             /* so a[ofs-1] < key <= a[ofs] */
2090
182k
    return ofs;
2091
2092
0
fail:
2093
0
    return -1;
2094
182k
}
2095
2096
/*
2097
Exactly like gallop_left(), except that if key already exists in a[0:n],
2098
finds the position immediately to the right of the rightmost equal value.
2099
2100
The return value is the int k in 0..n such that
2101
2102
    a[k-1] <= key < a[k]
2103
2104
or -1 if error.
2105
2106
The code duplication is massive, but this is enough different given that
2107
we're sticking to "<" comparisons that it's much harder to follow if
2108
written as one routine with yet another "left or right?" flag.
2109
*/
2110
static Py_ssize_t
2111
gallop_right(MergeState *ms, PyObject *key, PyObject **a, Py_ssize_t n, Py_ssize_t hint)
2112
204k
{
2113
204k
    Py_ssize_t ofs;
2114
204k
    Py_ssize_t lastofs;
2115
204k
    Py_ssize_t k;
2116
2117
204k
    assert(key && a && n > 0 && hint >= 0 && hint < n);
2118
2119
204k
    a += hint;
2120
204k
    lastofs = 0;
2121
204k
    ofs = 1;
2122
204k
    IFLT(key, *a) {
2123
        /* key < a[hint] -- gallop left, until
2124
         * a[hint - ofs] <= key < a[hint - lastofs]
2125
         */
2126
81.4k
        const Py_ssize_t maxofs = hint + 1;             /* &a[0] is lowest */
2127
190k
        while (ofs < maxofs) {
2128
123k
            IFLT(key, *(a-ofs)) {
2129
108k
                lastofs = ofs;
2130
108k
                assert(ofs <= (PY_SSIZE_T_MAX - 1) / 2);
2131
108k
                ofs = (ofs << 1) + 1;
2132
108k
            }
2133
14.2k
            else                /* a[hint - ofs] <= key */
2134
14.2k
                break;
2135
123k
        }
2136
81.4k
        if (ofs > maxofs)
2137
12.9k
            ofs = maxofs;
2138
        /* Translate back to positive offsets relative to &a[0]. */
2139
81.4k
        k = lastofs;
2140
81.4k
        lastofs = hint - ofs;
2141
81.4k
        ofs = hint - k;
2142
81.4k
    }
2143
123k
    else {
2144
        /* a[hint] <= key -- gallop right, until
2145
         * a[hint + lastofs] <= key < a[hint + ofs]
2146
        */
2147
123k
        const Py_ssize_t maxofs = n - hint;             /* &a[n-1] is highest */
2148
425k
        while (ofs < maxofs) {
2149
370k
            IFLT(key, a[ofs])
2150
68.5k
                break;
2151
            /* a[hint + ofs] <= key */
2152
301k
            lastofs = ofs;
2153
301k
            assert(ofs <= (PY_SSIZE_T_MAX - 1) / 2);
2154
301k
            ofs = (ofs << 1) + 1;
2155
301k
        }
2156
123k
        if (ofs > maxofs)
2157
32.5k
            ofs = maxofs;
2158
        /* Translate back to offsets relative to &a[0]. */
2159
123k
        lastofs += hint;
2160
123k
        ofs += hint;
2161
123k
    }
2162
204k
    a -= hint;
2163
2164
204k
    assert(-1 <= lastofs && lastofs < ofs && ofs <= n);
2165
    /* Now a[lastofs] <= key < a[ofs], so key belongs somewhere to the
2166
     * right of lastofs but no farther right than ofs.  Do a binary
2167
     * search, with invariant a[lastofs-1] <= key < a[ofs].
2168
     */
2169
204k
    ++lastofs;
2170
555k
    while (lastofs < ofs) {
2171
350k
        Py_ssize_t m = lastofs + ((ofs - lastofs) >> 1);
2172
2173
350k
        IFLT(key, a[m])
2174
184k
            ofs = m;                    /* key < a[m] */
2175
166k
        else
2176
166k
            lastofs = m+1;              /* a[m] <= key */
2177
350k
    }
2178
204k
    assert(lastofs == ofs);             /* so a[ofs-1] <= key < a[ofs] */
2179
204k
    return ofs;
2180
2181
0
fail:
2182
0
    return -1;
2183
204k
}
2184
2185
/* Conceptually a MergeState's constructor. */
2186
static void
2187
merge_init(MergeState *ms, Py_ssize_t list_size, int has_keyfunc,
2188
           sortslice *lo)
2189
772k
{
2190
772k
    assert(ms != NULL);
2191
772k
    if (has_keyfunc) {
2192
        /* The temporary space for merging will need at most half the list
2193
         * size rounded up.  Use the minimum possible space so we can use the
2194
         * rest of temparray for other things.  In particular, if there is
2195
         * enough extra space, listsort() will use it to store the keys.
2196
         */
2197
540k
        ms->alloced = (list_size + 1) / 2;
2198
2199
        /* ms->alloced describes how many keys will be stored at
2200
           ms->temparray, but we also need to store the values.  Hence,
2201
           ms->alloced is capped at half of MERGESTATE_TEMP_SIZE. */
2202
540k
        if (MERGESTATE_TEMP_SIZE / 2 < ms->alloced)
2203
2.29k
            ms->alloced = MERGESTATE_TEMP_SIZE / 2;
2204
540k
        ms->a.values = &ms->temparray[ms->alloced];
2205
540k
    }
2206
231k
    else {
2207
231k
        ms->alloced = MERGESTATE_TEMP_SIZE;
2208
231k
        ms->a.values = NULL;
2209
231k
    }
2210
772k
    ms->a.keys = ms->temparray;
2211
772k
    ms->n = 0;
2212
772k
    ms->min_gallop = MIN_GALLOP;
2213
772k
    ms->listlen = list_size;
2214
772k
    ms->basekeys = lo->keys;
2215
2216
    /* State for generating minrun values. See listsort.txt. */
2217
772k
    ms->mr_e = 0;
2218
798k
    while (list_size >> ms->mr_e >= MAX_MINRUN) {
2219
25.7k
        ++ms->mr_e;
2220
25.7k
    }
2221
772k
    ms->mr_mask = (1 << ms->mr_e) - 1;
2222
772k
    ms->mr_current = 0;
2223
772k
}
2224
2225
/* Free all the temp memory owned by the MergeState.  This must be called
2226
 * when you're done with a MergeState, and may be called before then if
2227
 * you want to free the temp memory early.
2228
 */
2229
static void
2230
merge_freemem(MergeState *ms)
2231
777k
{
2232
777k
    assert(ms != NULL);
2233
777k
    if (ms->a.keys != ms->temparray) {
2234
5.12k
        PyMem_Free(ms->a.keys);
2235
5.12k
        ms->a.keys = NULL;
2236
5.12k
    }
2237
777k
}
2238
2239
/* Ensure enough temp memory for 'need' array slots is available.
2240
 * Returns 0 on success and -1 if the memory can't be gotten.
2241
 */
2242
static int
2243
merge_getmem(MergeState *ms, Py_ssize_t need)
2244
5.12k
{
2245
5.12k
    int multiplier;
2246
2247
5.12k
    assert(ms != NULL);
2248
5.12k
    if (need <= ms->alloced)
2249
0
        return 0;
2250
2251
5.12k
    multiplier = ms->a.values != NULL ? 2 : 1;
2252
2253
    /* Don't realloc!  That can cost cycles to copy the old data, but
2254
     * we don't care what's in the block.
2255
     */
2256
5.12k
    merge_freemem(ms);
2257
5.12k
    if ((size_t)need > PY_SSIZE_T_MAX / sizeof(PyObject *) / multiplier) {
2258
0
        PyErr_NoMemory();
2259
0
        return -1;
2260
0
    }
2261
5.12k
    ms->a.keys = (PyObject **)PyMem_Malloc(multiplier * need
2262
5.12k
                                          * sizeof(PyObject *));
2263
5.12k
    if (ms->a.keys != NULL) {
2264
5.12k
        ms->alloced = need;
2265
5.12k
        if (ms->a.values != NULL)
2266
4.59k
            ms->a.values = &ms->a.keys[need];
2267
5.12k
        return 0;
2268
5.12k
    }
2269
0
    PyErr_NoMemory();
2270
0
    return -1;
2271
5.12k
}
2272
71.9k
#define MERGE_GETMEM(MS, NEED) ((NEED) <= (MS)->alloced ? 0 :   \
2273
71.9k
                                merge_getmem(MS, NEED))
2274
2275
/* Merge the na elements starting at ssa with the nb elements starting at
2276
 * ssb.keys = ssa.keys + na in a stable way, in-place.  na and nb must be > 0.
2277
 * Must also have that ssa.keys[na-1] belongs at the end of the merge, and
2278
 * should have na <= nb.  See listsort.txt for more info.  Return 0 if
2279
 * successful, -1 if error.
2280
 */
2281
static Py_ssize_t
2282
merge_lo(MergeState *ms, sortslice ssa, Py_ssize_t na,
2283
         sortslice ssb, Py_ssize_t nb)
2284
47.2k
{
2285
47.2k
    Py_ssize_t k;
2286
47.2k
    sortslice dest;
2287
47.2k
    int result = -1;            /* guilty until proved innocent */
2288
47.2k
    Py_ssize_t min_gallop;
2289
2290
47.2k
    assert(ms && ssa.keys && ssb.keys && na > 0 && nb > 0);
2291
47.2k
    assert(ssa.keys + na == ssb.keys);
2292
47.2k
    if (MERGE_GETMEM(ms, na) < 0)
2293
0
        return -1;
2294
47.2k
    sortslice_memcpy(&ms->a, 0, &ssa, 0, na);
2295
47.2k
    dest = ssa;
2296
47.2k
    ssa = ms->a;
2297
2298
47.2k
    sortslice_copy_incr(&dest, &ssb);
2299
47.2k
    --nb;
2300
47.2k
    if (nb == 0)
2301
3.17k
        goto Succeed;
2302
44.0k
    if (na == 1)
2303
6.71k
        goto CopyB;
2304
2305
37.3k
    min_gallop = ms->min_gallop;
2306
55.3k
    for (;;) {
2307
55.3k
        Py_ssize_t acount = 0;          /* # of times A won in a row */
2308
55.3k
        Py_ssize_t bcount = 0;          /* # of times B won in a row */
2309
2310
        /* Do the straightforward thing until (if ever) one run
2311
         * appears to win consistently.
2312
         */
2313
360k
        for (;;) {
2314
360k
            assert(na > 1 && nb > 0);
2315
360k
            k = ISLT(ssb.keys[0], ssa.keys[0]);
2316
360k
            if (k) {
2317
197k
                if (k < 0)
2318
0
                    goto Fail;
2319
197k
                sortslice_copy_incr(&dest, &ssb);
2320
197k
                ++bcount;
2321
197k
                acount = 0;
2322
197k
                --nb;
2323
197k
                if (nb == 0)
2324
3.54k
                    goto Succeed;
2325
194k
                if (bcount >= min_gallop)
2326
26.8k
                    break;
2327
194k
            }
2328
162k
            else {
2329
162k
                sortslice_copy_incr(&dest, &ssa);
2330
162k
                ++acount;
2331
162k
                bcount = 0;
2332
162k
                --na;
2333
162k
                if (na == 1)
2334
2.43k
                    goto CopyB;
2335
160k
                if (acount >= min_gallop)
2336
22.5k
                    break;
2337
160k
            }
2338
360k
        }
2339
2340
        /* One run is winning so consistently that galloping may
2341
         * be a huge win.  So try that, and continue galloping until
2342
         * (if ever) neither run appears to be winning consistently
2343
         * anymore.
2344
         */
2345
49.3k
        ++min_gallop;
2346
84.5k
        do {
2347
84.5k
            assert(na > 1 && nb > 0);
2348
84.5k
            min_gallop -= min_gallop > 1;
2349
84.5k
            ms->min_gallop = min_gallop;
2350
84.5k
            k = gallop_right(ms, ssb.keys[0], ssa.keys, na, 0);
2351
84.5k
            acount = k;
2352
84.5k
            if (k) {
2353
49.3k
                if (k < 0)
2354
0
                    goto Fail;
2355
49.3k
                sortslice_memcpy(&dest, 0, &ssa, 0, k);
2356
49.3k
                sortslice_advance(&dest, k);
2357
49.3k
                sortslice_advance(&ssa, k);
2358
49.3k
                na -= k;
2359
49.3k
                if (na == 1)
2360
8.43k
                    goto CopyB;
2361
                /* na==0 is impossible now if the comparison
2362
                 * function is consistent, but we can't assume
2363
                 * that it is.
2364
                 */
2365
40.8k
                if (na == 0)
2366
0
                    goto Succeed;
2367
40.8k
            }
2368
76.1k
            sortslice_copy_incr(&dest, &ssb);
2369
76.1k
            --nb;
2370
76.1k
            if (nb == 0)
2371
2.20k
                goto Succeed;
2372
2373
73.9k
            k = gallop_left(ms, ssa.keys[0], ssb.keys, nb, 0);
2374
73.9k
            bcount = k;
2375
73.9k
            if (k) {
2376
68.3k
                if (k < 0)
2377
0
                    goto Fail;
2378
68.3k
                sortslice_memmove(&dest, 0, &ssb, 0, k);
2379
68.3k
                sortslice_advance(&dest, k);
2380
68.3k
                sortslice_advance(&ssb, k);
2381
68.3k
                nb -= k;
2382
68.3k
                if (nb == 0)
2383
17.0k
                    goto Succeed;
2384
68.3k
            }
2385
56.8k
            sortslice_copy_incr(&dest, &ssa);
2386
56.8k
            --na;
2387
56.8k
            if (na == 1)
2388
3.75k
                goto CopyB;
2389
56.8k
        } while (acount >= MIN_GALLOP || bcount >= MIN_GALLOP);
2390
17.9k
        ++min_gallop;           /* penalize it for leaving galloping mode */
2391
17.9k
        ms->min_gallop = min_gallop;
2392
17.9k
    }
2393
25.9k
Succeed:
2394
25.9k
    result = 0;
2395
25.9k
Fail:
2396
25.9k
    if (na)
2397
25.9k
        sortslice_memcpy(&dest, 0, &ssa, 0, na);
2398
25.9k
    return result;
2399
21.3k
CopyB:
2400
21.3k
    assert(na == 1 && nb > 0);
2401
    /* The last element of ssa belongs at the end of the merge. */
2402
21.3k
    sortslice_memmove(&dest, 0, &ssb, 0, nb);
2403
21.3k
    sortslice_copy(&dest, nb, &ssa, 0);
2404
21.3k
    return 0;
2405
25.9k
}
2406
2407
/* Merge the na elements starting at pa with the nb elements starting at
2408
 * ssb.keys = ssa.keys + na in a stable way, in-place.  na and nb must be > 0.
2409
 * Must also have that ssa.keys[na-1] belongs at the end of the merge, and
2410
 * should have na >= nb.  See listsort.txt for more info.  Return 0 if
2411
 * successful, -1 if error.
2412
 */
2413
static Py_ssize_t
2414
merge_hi(MergeState *ms, sortslice ssa, Py_ssize_t na,
2415
         sortslice ssb, Py_ssize_t nb)
2416
24.6k
{
2417
24.6k
    Py_ssize_t k;
2418
24.6k
    sortslice dest, basea, baseb;
2419
24.6k
    int result = -1;            /* guilty until proved innocent */
2420
24.6k
    Py_ssize_t min_gallop;
2421
2422
24.6k
    assert(ms && ssa.keys && ssb.keys && na > 0 && nb > 0);
2423
24.6k
    assert(ssa.keys + na == ssb.keys);
2424
24.6k
    if (MERGE_GETMEM(ms, nb) < 0)
2425
0
        return -1;
2426
24.6k
    dest = ssb;
2427
24.6k
    sortslice_advance(&dest, nb-1);
2428
24.6k
    sortslice_memcpy(&ms->a, 0, &ssb, 0, nb);
2429
24.6k
    basea = ssa;
2430
24.6k
    baseb = ms->a;
2431
24.6k
    ssb.keys = ms->a.keys + nb - 1;
2432
24.6k
    if (ssb.values != NULL)
2433
20.9k
        ssb.values = ms->a.values + nb - 1;
2434
24.6k
    sortslice_advance(&ssa, na - 1);
2435
2436
24.6k
    sortslice_copy_decr(&dest, &ssa);
2437
24.6k
    --na;
2438
24.6k
    if (na == 0)
2439
0
        goto Succeed;
2440
24.6k
    if (nb == 1)
2441
832
        goto CopyA;
2442
2443
23.8k
    min_gallop = ms->min_gallop;
2444
30.9k
    for (;;) {
2445
30.9k
        Py_ssize_t acount = 0;          /* # of times A won in a row */
2446
30.9k
        Py_ssize_t bcount = 0;          /* # of times B won in a row */
2447
2448
        /* Do the straightforward thing until (if ever) one run
2449
         * appears to win consistently.
2450
         */
2451
200k
        for (;;) {
2452
200k
            assert(na > 0 && nb > 1);
2453
200k
            k = ISLT(ssb.keys[0], ssa.keys[0]);
2454
200k
            if (k) {
2455
91.5k
                if (k < 0)
2456
0
                    goto Fail;
2457
91.5k
                sortslice_copy_decr(&dest, &ssa);
2458
91.5k
                ++acount;
2459
91.5k
                bcount = 0;
2460
91.5k
                --na;
2461
91.5k
                if (na == 0)
2462
420
                    goto Succeed;
2463
91.1k
                if (acount >= min_gallop)
2464
13.3k
                    break;
2465
91.1k
            }
2466
109k
            else {
2467
109k
                sortslice_copy_decr(&dest, &ssb);
2468
109k
                ++bcount;
2469
109k
                acount = 0;
2470
109k
                --nb;
2471
109k
                if (nb == 1)
2472
382
                    goto CopyA;
2473
109k
                if (bcount >= min_gallop)
2474
16.7k
                    break;
2475
109k
            }
2476
200k
        }
2477
2478
        /* One run is winning so consistently that galloping may
2479
         * be a huge win.  So try that, and continue galloping until
2480
         * (if ever) neither run appears to be winning consistently
2481
         * anymore.
2482
         */
2483
30.1k
        ++min_gallop;
2484
48.4k
        do {
2485
48.4k
            assert(na > 0 && nb > 1);
2486
48.4k
            min_gallop -= min_gallop > 1;
2487
48.4k
            ms->min_gallop = min_gallop;
2488
48.4k
            k = gallop_right(ms, ssb.keys[0], basea.keys, na, na-1);
2489
48.4k
            if (k < 0)
2490
0
                goto Fail;
2491
48.4k
            k = na - k;
2492
48.4k
            acount = k;
2493
48.4k
            if (k) {
2494
28.1k
                sortslice_advance(&dest, -k);
2495
28.1k
                sortslice_advance(&ssa, -k);
2496
28.1k
                sortslice_memmove(&dest, 1, &ssa, 1, k);
2497
28.1k
                na -= k;
2498
28.1k
                if (na == 0)
2499
10.6k
                    goto Succeed;
2500
28.1k
            }
2501
37.8k
            sortslice_copy_decr(&dest, &ssb);
2502
37.8k
            --nb;
2503
37.8k
            if (nb == 1)
2504
785
                goto CopyA;
2505
2506
37.0k
            k = gallop_left(ms, ssa.keys[0], baseb.keys, nb, nb-1);
2507
37.0k
            if (k < 0)
2508
0
                goto Fail;
2509
37.0k
            k = nb - k;
2510
37.0k
            bcount = k;
2511
37.0k
            if (k) {
2512
32.8k
                sortslice_advance(&dest, -k);
2513
32.8k
                sortslice_advance(&ssb, -k);
2514
32.8k
                sortslice_memcpy(&dest, 1, &ssb, 1, k);
2515
32.8k
                nb -= k;
2516
32.8k
                if (nb == 1)
2517
10.5k
                    goto CopyA;
2518
                /* nb==0 is impossible now if the comparison
2519
                 * function is consistent, but we can't assume
2520
                 * that it is.
2521
                 */
2522
22.3k
                if (nb == 0)
2523
0
                    goto Succeed;
2524
22.3k
            }
2525
26.5k
            sortslice_copy_decr(&dest, &ssa);
2526
26.5k
            --na;
2527
26.5k
            if (na == 0)
2528
1.12k
                goto Succeed;
2529
26.5k
        } while (acount >= MIN_GALLOP || bcount >= MIN_GALLOP);
2530
7.07k
        ++min_gallop;           /* penalize it for leaving galloping mode */
2531
7.07k
        ms->min_gallop = min_gallop;
2532
7.07k
    }
2533
12.1k
Succeed:
2534
12.1k
    result = 0;
2535
12.1k
Fail:
2536
12.1k
    if (nb)
2537
12.1k
        sortslice_memcpy(&dest, -(nb-1), &baseb, 0, nb);
2538
12.1k
    return result;
2539
12.5k
CopyA:
2540
12.5k
    assert(nb == 1 && na > 0);
2541
    /* The first element of ssb belongs at the front of the merge. */
2542
12.5k
    sortslice_memmove(&dest, 1-na, &ssa, 1-na, na);
2543
12.5k
    sortslice_advance(&dest, -na);
2544
12.5k
    sortslice_advance(&ssa, -na);
2545
12.5k
    sortslice_copy(&dest, 0, &ssb, 0);
2546
12.5k
    return 0;
2547
12.1k
}
2548
2549
/* Merge the two runs at stack indices i and i+1.
2550
 * Returns 0 on success, -1 on error.
2551
 */
2552
static Py_ssize_t
2553
merge_at(MergeState *ms, Py_ssize_t i)
2554
71.9k
{
2555
71.9k
    sortslice ssa, ssb;
2556
71.9k
    Py_ssize_t na, nb;
2557
71.9k
    Py_ssize_t k;
2558
2559
71.9k
    assert(ms != NULL);
2560
71.9k
    assert(ms->n >= 2);
2561
71.9k
    assert(i >= 0);
2562
71.9k
    assert(i == ms->n - 2 || i == ms->n - 3);
2563
2564
71.9k
    ssa = ms->pending[i].base;
2565
71.9k
    na = ms->pending[i].len;
2566
71.9k
    ssb = ms->pending[i+1].base;
2567
71.9k
    nb = ms->pending[i+1].len;
2568
71.9k
    assert(na > 0 && nb > 0);
2569
71.9k
    assert(ssa.keys + na == ssb.keys);
2570
2571
    /* Record the length of the combined runs; if i is the 3rd-last
2572
     * run now, also slide over the last run (which isn't involved
2573
     * in this merge).  The current run i+1 goes away in any case.
2574
     */
2575
71.9k
    ms->pending[i].len = na + nb;
2576
71.9k
    if (i == ms->n - 3)
2577
393
        ms->pending[i+1] = ms->pending[i+2];
2578
71.9k
    --ms->n;
2579
2580
    /* Where does b start in a?  Elements in a before that can be
2581
     * ignored (already in place).
2582
     */
2583
71.9k
    k = gallop_right(ms, *ssb.keys, ssa.keys, na, 0);
2584
71.9k
    if (k < 0)
2585
0
        return -1;
2586
71.9k
    sortslice_advance(&ssa, k);
2587
71.9k
    na -= k;
2588
71.9k
    if (na == 0)
2589
26
        return 0;
2590
2591
    /* Where does a end in b?  Elements in b after that can be
2592
     * ignored (already in place).
2593
     */
2594
71.9k
    nb = gallop_left(ms, ssa.keys[na-1], ssb.keys, nb, nb-1);
2595
71.9k
    if (nb <= 0)
2596
0
        return nb;
2597
2598
    /* Merge what remains of the runs, using a temp array with
2599
     * min(na, nb) elements.
2600
     */
2601
71.9k
    if (na <= nb)
2602
47.2k
        return merge_lo(ms, ssa, na, ssb, nb);
2603
24.6k
    else
2604
24.6k
        return merge_hi(ms, ssa, na, ssb, nb);
2605
71.9k
}
2606
2607
/* Two adjacent runs begin at index s1. The first run has length n1, and
2608
 * the second run (starting at index s1+n1) has length n2. The list has total
2609
 * length n.
2610
 * Compute the "power" of the first run. See listsort.txt for details.
2611
 */
2612
static int
2613
powerloop(Py_ssize_t s1, Py_ssize_t n1, Py_ssize_t n2, Py_ssize_t n)
2614
71.9k
{
2615
71.9k
    int result = 0;
2616
71.9k
    assert(s1 >= 0);
2617
71.9k
    assert(n1 > 0 && n2 > 0);
2618
71.9k
    assert(s1 + n1 + n2 <= n);
2619
    /* midpoints a and b:
2620
     * a = s1 + n1/2
2621
     * b = s1 + n1 + n2/2 = a + (n1 + n2)/2
2622
     *
2623
     * Those may not be integers, though, because of the "/2". So we work with
2624
     * 2*a and 2*b instead, which are necessarily integers. It makes no
2625
     * difference to the outcome, since the bits in the expansion of (2*i)/n
2626
     * are merely shifted one position from those of i/n.
2627
     */
2628
71.9k
    Py_ssize_t a = 2 * s1 + n1;  /* 2*a */
2629
71.9k
    Py_ssize_t b = a + n1 + n2;  /* 2*b */
2630
    /* Emulate a/n and b/n one bit a time, until bits differ. */
2631
291k
    for (;;) {
2632
291k
        ++result;
2633
291k
        if (a >= n) {  /* both quotient bits are 1 */
2634
112k
            assert(b >= a);
2635
112k
            a -= n;
2636
112k
            b -= n;
2637
112k
        }
2638
178k
        else if (b >= n) {  /* a/n bit is 0, b/n bit is 1 */
2639
71.9k
            break;
2640
71.9k
        } /* else both quotient bits are 0 */
2641
219k
        assert(a < b && b < n);
2642
219k
        a <<= 1;
2643
219k
        b <<= 1;
2644
219k
    }
2645
71.9k
    return result;
2646
71.9k
}
2647
2648
/* The next run has been identified, of length n2.
2649
 * If there's already a run on the stack, apply the "powersort" merge strategy:
2650
 * compute the topmost run's "power" (depth in a conceptual binary merge tree)
2651
 * and merge adjacent runs on the stack with greater power. See listsort.txt
2652
 * for more info.
2653
 *
2654
 * It's the caller's responsibility to push the new run on the stack when this
2655
 * returns.
2656
 *
2657
 * Returns 0 on success, -1 on error.
2658
 */
2659
static int
2660
found_new_run(MergeState *ms, Py_ssize_t n2)
2661
267k
{
2662
267k
    assert(ms);
2663
267k
    if (ms->n) {
2664
71.9k
        assert(ms->n > 0);
2665
71.9k
        struct s_slice *p = ms->pending;
2666
71.9k
        Py_ssize_t s1 = p[ms->n - 1].base.keys - ms->basekeys; /* start index */
2667
71.9k
        Py_ssize_t n1 = p[ms->n - 1].len;
2668
71.9k
        int power = powerloop(s1, n1, n2, ms->listlen);
2669
120k
        while (ms->n > 1 && p[ms->n - 2].power > power) {
2670
48.6k
            if (merge_at(ms, ms->n - 2) < 0)
2671
0
                return -1;
2672
48.6k
        }
2673
71.9k
        assert(ms->n < 2 || p[ms->n - 2].power < power);
2674
71.9k
        p[ms->n - 1].power = power;
2675
71.9k
    }
2676
267k
    return 0;
2677
267k
}
2678
2679
/* Regardless of invariants, merge all runs on the stack until only one
2680
 * remains.  This is used at the end of the mergesort.
2681
 *
2682
 * Returns 0 on success, -1 on error.
2683
 */
2684
static int
2685
merge_force_collapse(MergeState *ms)
2686
195k
{
2687
195k
    struct s_slice *p = ms->pending;
2688
2689
195k
    assert(ms);
2690
219k
    while (ms->n > 1) {
2691
23.3k
        Py_ssize_t n = ms->n - 2;
2692
23.3k
        if (n > 0 && p[n-1].len < p[n+1].len)
2693
393
            --n;
2694
23.3k
        if (merge_at(ms, n) < 0)
2695
0
            return -1;
2696
23.3k
    }
2697
195k
    return 0;
2698
195k
}
2699
2700
/* Return the next minrun value to use. See listsort.txt. */
2701
Py_LOCAL_INLINE(Py_ssize_t)
2702
minrun_next(MergeState *ms)
2703
267k
{
2704
267k
    ms->mr_current += ms->listlen;
2705
267k
    assert(ms->mr_current >= 0); /* no overflow */
2706
267k
    Py_ssize_t result = ms->mr_current >> ms->mr_e;
2707
267k
    ms->mr_current &= ms->mr_mask;
2708
267k
    return result;
2709
267k
}
2710
2711
/* Here we define custom comparison functions to optimize for the cases one commonly
2712
 * encounters in practice: homogeneous lists, often of one of the basic types. */
2713
2714
/* This struct holds the comparison function and helper functions
2715
 * selected in the pre-sort check. */
2716
2717
/* These are the special case compare functions.
2718
 * ms->key_compare will always point to one of these: */
2719
2720
/* Heterogeneous compare: default, always safe to fall back on. */
2721
static int
2722
safe_object_compare(PyObject *v, PyObject *w, MergeState *ms)
2723
0
{
2724
    /* No assumptions necessary! */
2725
0
    return PyObject_RichCompareBool(v, w, Py_LT);
2726
0
}
2727
2728
/* Homogeneous compare: safe for any two comparable objects of the same type.
2729
 * (ms->key_richcompare is set to ob_type->tp_richcompare in the
2730
 *  pre-sort check.)
2731
 */
2732
static int
2733
unsafe_object_compare(PyObject *v, PyObject *w, MergeState *ms)
2734
9.22M
{
2735
9.22M
    PyObject *res_obj; int res;
2736
2737
    /* No assumptions, because we check first: */
2738
9.22M
    if (Py_TYPE(v)->tp_richcompare != ms->key_richcompare)
2739
0
        return PyObject_RichCompareBool(v, w, Py_LT);
2740
2741
9.22M
    assert(ms->key_richcompare != NULL);
2742
9.22M
    res_obj = (*(ms->key_richcompare))(v, w, Py_LT);
2743
2744
9.22M
    if (res_obj == Py_NotImplemented) {
2745
0
        Py_DECREF(res_obj);
2746
0
        return PyObject_RichCompareBool(v, w, Py_LT);
2747
0
    }
2748
9.22M
    if (res_obj == NULL)
2749
0
        return -1;
2750
2751
9.22M
    if (PyBool_Check(res_obj)) {
2752
9.22M
        res = (res_obj == Py_True);
2753
9.22M
    }
2754
0
    else {
2755
0
        res = PyObject_IsTrue(res_obj);
2756
0
    }
2757
9.22M
    Py_DECREF(res_obj);
2758
2759
    /* Note that we can't assert
2760
     *     res == PyObject_RichCompareBool(v, w, Py_LT);
2761
     * because of evil compare functions like this:
2762
     *     lambda a, b:  int(random.random() * 3) - 1)
2763
     * (which is actually in test_sort.py) */
2764
9.22M
    return res;
2765
9.22M
}
2766
2767
/* Latin string compare: safe for any two latin (one byte per char) strings. */
2768
static int
2769
unsafe_latin_compare(PyObject *v, PyObject *w, MergeState *ms)
2770
271k
{
2771
271k
    Py_ssize_t len;
2772
271k
    int res;
2773
2774
    /* Modified from Objects/unicodeobject.c:unicode_compare, assuming: */
2775
271k
    assert(Py_IS_TYPE(v, &PyUnicode_Type));
2776
271k
    assert(Py_IS_TYPE(w, &PyUnicode_Type));
2777
271k
    assert(PyUnicode_KIND(v) == PyUnicode_KIND(w));
2778
271k
    assert(PyUnicode_KIND(v) == PyUnicode_1BYTE_KIND);
2779
2780
271k
    len = Py_MIN(PyUnicode_GET_LENGTH(v), PyUnicode_GET_LENGTH(w));
2781
271k
    res = memcmp(PyUnicode_DATA(v), PyUnicode_DATA(w), len);
2782
2783
271k
    res = (res != 0 ?
2784
266k
           res < 0 :
2785
271k
           PyUnicode_GET_LENGTH(v) < PyUnicode_GET_LENGTH(w));
2786
2787
271k
    assert(res == PyObject_RichCompareBool(v, w, Py_LT));;
2788
271k
    return res;
2789
271k
}
2790
2791
/* Bounded int compare: compare any two longs that fit in a single machine word. */
2792
static int
2793
unsafe_long_compare(PyObject *v, PyObject *w, MergeState *ms)
2794
5.16M
{
2795
5.16M
    PyLongObject *vl, *wl;
2796
5.16M
    intptr_t v0, w0;
2797
5.16M
    int res;
2798
2799
    /* Modified from Objects/longobject.c:long_compare, assuming: */
2800
5.16M
    assert(Py_IS_TYPE(v, &PyLong_Type));
2801
5.16M
    assert(Py_IS_TYPE(w, &PyLong_Type));
2802
5.16M
    assert(_PyLong_IsCompact((PyLongObject *)v));
2803
5.16M
    assert(_PyLong_IsCompact((PyLongObject *)w));
2804
2805
5.16M
    vl = (PyLongObject*)v;
2806
5.16M
    wl = (PyLongObject*)w;
2807
2808
5.16M
    v0 = _PyLong_CompactValue(vl);
2809
5.16M
    w0 = _PyLong_CompactValue(wl);
2810
2811
5.16M
    res = v0 < w0;
2812
5.16M
    assert(res == PyObject_RichCompareBool(v, w, Py_LT));
2813
5.16M
    return res;
2814
5.16M
}
2815
2816
/* Float compare: compare any two floats. */
2817
static int
2818
unsafe_float_compare(PyObject *v, PyObject *w, MergeState *ms)
2819
0
{
2820
0
    int res;
2821
2822
    /* Modified from Objects/floatobject.c:float_richcompare, assuming: */
2823
0
    assert(Py_IS_TYPE(v, &PyFloat_Type));
2824
0
    assert(Py_IS_TYPE(w, &PyFloat_Type));
2825
2826
0
    res = PyFloat_AS_DOUBLE(v) < PyFloat_AS_DOUBLE(w);
2827
0
    assert(res == PyObject_RichCompareBool(v, w, Py_LT));
2828
0
    return res;
2829
0
}
2830
2831
/* Tuple compare: compare *any* two tuples, using
2832
 * ms->tuple_elem_compare to compare the first elements, which is set
2833
 * using the same pre-sort check as we use for ms->key_compare,
2834
 * but run on the list [x[0] for x in L]. This allows us to optimize compares
2835
 * on two levels (as long as [x[0] for x in L] is type-homogeneous.) The idea is
2836
 * that most tuple compares don't involve x[1:]. */
2837
static int
2838
unsafe_tuple_compare(PyObject *v, PyObject *w, MergeState *ms)
2839
1.26k
{
2840
1.26k
    PyTupleObject *vt, *wt;
2841
1.26k
    Py_ssize_t i, vlen, wlen;
2842
1.26k
    int k;
2843
2844
    /* Modified from Objects/tupleobject.c:tuplerichcompare, assuming: */
2845
1.26k
    assert(Py_IS_TYPE(v, &PyTuple_Type));
2846
1.26k
    assert(Py_IS_TYPE(w, &PyTuple_Type));
2847
1.26k
    assert(Py_SIZE(v) > 0);
2848
1.26k
    assert(Py_SIZE(w) > 0);
2849
2850
1.26k
    vt = (PyTupleObject *)v;
2851
1.26k
    wt = (PyTupleObject *)w;
2852
2853
1.26k
    vlen = Py_SIZE(vt);
2854
1.26k
    wlen = Py_SIZE(wt);
2855
2856
1.27k
    for (i = 0; i < vlen && i < wlen; i++) {
2857
1.27k
        k = PyObject_RichCompareBool(vt->ob_item[i], wt->ob_item[i], Py_EQ);
2858
1.27k
        if (k < 0)
2859
0
            return -1;
2860
1.27k
        if (!k)
2861
1.26k
            break;
2862
1.27k
    }
2863
2864
1.26k
    if (i >= vlen || i >= wlen)
2865
0
        return vlen < wlen;
2866
2867
1.26k
    if (i == 0)
2868
1.24k
        return ms->tuple_elem_compare(vt->ob_item[i], wt->ob_item[i], ms);
2869
12
    else
2870
12
        return PyObject_RichCompareBool(vt->ob_item[i], wt->ob_item[i], Py_LT);
2871
1.26k
}
2872
2873
/* An adaptive, stable, natural mergesort.  See listsort.txt.
2874
 * Returns Py_None on success, NULL on error.  Even in case of error, the
2875
 * list will be some permutation of its input state (nothing is lost or
2876
 * duplicated).
2877
 */
2878
/*[clinic input]
2879
@permit_long_docstring_body
2880
@critical_section
2881
list.sort
2882
2883
    *
2884
    key as keyfunc: object = None
2885
    reverse: bool = False
2886
2887
Sort the list in ascending order and return None.
2888
2889
The sort is in-place (i.e. the list itself is modified) and stable (i.e. the
2890
order of two equal elements is maintained).
2891
2892
If a key function is given, apply it once to each list item and sort them,
2893
ascending or descending, according to their function values.
2894
2895
The reverse flag can be set to sort in descending order.
2896
[clinic start generated code]*/
2897
2898
static PyObject *
2899
list_sort_impl(PyListObject *self, PyObject *keyfunc, int reverse)
2900
/*[clinic end generated code: output=57b9f9c5e23fbe42 input=e4f6b6069181ad7d]*/
2901
772k
{
2902
772k
    MergeState ms;
2903
772k
    Py_ssize_t nremaining;
2904
772k
    Py_ssize_t minrun;
2905
772k
    sortslice lo;
2906
772k
    Py_ssize_t saved_ob_size, saved_allocated;
2907
772k
    PyObject **saved_ob_item;
2908
772k
    PyObject **final_ob_item;
2909
772k
    PyObject *result = NULL;            /* guilty until proved innocent */
2910
772k
    Py_ssize_t i;
2911
772k
    PyObject **keys;
2912
2913
772k
    assert(self != NULL);
2914
772k
    assert(PyList_Check(self));
2915
772k
    if (keyfunc == Py_None)
2916
216k
        keyfunc = NULL;
2917
2918
    /* The list is temporarily made empty, so that mutations performed
2919
     * by comparison functions can't affect the slice of memory we're
2920
     * sorting (allowing mutations during sorting is a core-dump
2921
     * factory, since ob_item may change).
2922
     */
2923
772k
    saved_ob_size = Py_SIZE(self);
2924
772k
    saved_ob_item = self->ob_item;
2925
772k
    saved_allocated = self->allocated;
2926
772k
    Py_SET_SIZE(self, 0);
2927
772k
    FT_ATOMIC_STORE_PTR_RELEASE(self->ob_item, NULL);
2928
772k
    self->allocated = -1; /* any operation will reset it to >= 0 */
2929
2930
772k
    if (keyfunc == NULL) {
2931
231k
        keys = NULL;
2932
231k
        lo.keys = saved_ob_item;
2933
231k
        lo.values = NULL;
2934
231k
    }
2935
540k
    else {
2936
540k
        if (saved_ob_size < MERGESTATE_TEMP_SIZE/2)
2937
            /* Leverage stack space we allocated but won't otherwise use */
2938
536k
            keys = &ms.temparray[saved_ob_size+1];
2939
4.12k
        else {
2940
4.12k
            keys = PyMem_Malloc(sizeof(PyObject *) * saved_ob_size);
2941
4.12k
            if (keys == NULL) {
2942
0
                PyErr_NoMemory();
2943
0
                goto keyfunc_fail;
2944
0
            }
2945
4.12k
        }
2946
2947
5.19M
        for (i = 0; i < saved_ob_size ; i++) {
2948
4.64M
            keys[i] = PyObject_CallOneArg(keyfunc, saved_ob_item[i]);
2949
4.64M
            if (keys[i] == NULL) {
2950
0
                for (i=i-1 ; i>=0 ; i--)
2951
0
                    Py_DECREF(keys[i]);
2952
0
                if (saved_ob_size >= MERGESTATE_TEMP_SIZE/2)
2953
0
                    PyMem_Free(keys);
2954
0
                goto keyfunc_fail;
2955
0
            }
2956
4.64M
        }
2957
2958
540k
        lo.keys = keys;
2959
540k
        lo.values = saved_ob_item;
2960
540k
    }
2961
2962
2963
    /* The pre-sort check: here's where we decide which compare function to use.
2964
     * How much optimization is safe? We test for homogeneity with respect to
2965
     * several properties that are expensive to check at compare-time, and
2966
     * set ms appropriately. */
2967
772k
    if (saved_ob_size > 1) {
2968
        /* Assume the first element is representative of the whole list. */
2969
195k
        int keys_are_in_tuples = (Py_IS_TYPE(lo.keys[0], &PyTuple_Type) &&
2970
195k
                                  Py_SIZE(lo.keys[0]) > 0);
2971
2972
195k
        PyTypeObject* key_type = (keys_are_in_tuples ?
2973
65
                                  Py_TYPE(PyTuple_GET_ITEM(lo.keys[0], 0)) :
2974
195k
                                  Py_TYPE(lo.keys[0]));
2975
2976
195k
        int keys_are_all_same_type = 1;
2977
195k
        int strings_are_latin = 1;
2978
195k
        int ints_are_bounded = 1;
2979
2980
        /* Prove that assumption by checking every key. */
2981
5.66M
        for (i=0; i < saved_ob_size; i++) {
2982
2983
5.46M
            if (keys_are_in_tuples &&
2984
5.46M
                !(Py_IS_TYPE(lo.keys[i], &PyTuple_Type) && Py_SIZE(lo.keys[i]) != 0)) {
2985
0
                keys_are_in_tuples = 0;
2986
0
                keys_are_all_same_type = 0;
2987
0
                break;
2988
0
            }
2989
2990
            /* Note: for lists of tuples, key is the first element of the tuple
2991
             * lo.keys[i], not lo.keys[i] itself! We verify type-homogeneity
2992
             * for lists of tuples in the if-statement directly above. */
2993
5.46M
            PyObject *key = (keys_are_in_tuples ?
2994
595
                             PyTuple_GET_ITEM(lo.keys[i], 0) :
2995
5.46M
                             lo.keys[i]);
2996
2997
5.46M
            if (!Py_IS_TYPE(key, key_type)) {
2998
0
                keys_are_all_same_type = 0;
2999
                /* If keys are in tuple we must loop over the whole list to make
3000
                   sure all items are tuples */
3001
0
                if (!keys_are_in_tuples) {
3002
0
                    break;
3003
0
                }
3004
0
            }
3005
3006
5.46M
            if (keys_are_all_same_type) {
3007
5.46M
                if (key_type == &PyLong_Type &&
3008
5.46M
                    ints_are_bounded &&
3009
5.46M
                    !_PyLong_IsCompact((PyLongObject *)key)) {
3010
3011
4.85k
                    ints_are_bounded = 0;
3012
4.85k
                }
3013
5.46M
                else if (key_type == &PyUnicode_Type &&
3014
5.46M
                         strings_are_latin &&
3015
5.46M
                         PyUnicode_KIND(key) != PyUnicode_1BYTE_KIND) {
3016
3017
6.76k
                        strings_are_latin = 0;
3018
6.76k
                    }
3019
5.46M
                }
3020
5.46M
            }
3021
3022
        /* Choose the best compare, given what we now know about the keys. */
3023
195k
        if (keys_are_all_same_type) {
3024
3025
195k
            if (key_type == &PyUnicode_Type && strings_are_latin) {
3026
12.3k
                ms.key_compare = unsafe_latin_compare;
3027
12.3k
            }
3028
183k
            else if (key_type == &PyLong_Type && ints_are_bounded) {
3029
74.1k
                ms.key_compare = unsafe_long_compare;
3030
74.1k
            }
3031
109k
            else if (key_type == &PyFloat_Type) {
3032
0
                ms.key_compare = unsafe_float_compare;
3033
0
            }
3034
109k
            else if ((ms.key_richcompare = key_type->tp_richcompare) != NULL) {
3035
109k
                ms.key_compare = unsafe_object_compare;
3036
109k
            }
3037
0
            else {
3038
0
                ms.key_compare = safe_object_compare;
3039
0
            }
3040
195k
        }
3041
0
        else {
3042
0
            ms.key_compare = safe_object_compare;
3043
0
        }
3044
3045
195k
        if (keys_are_in_tuples) {
3046
            /* Make sure we're not dealing with tuples of tuples
3047
             * (remember: here, key_type refers list [key[0] for key in keys]) */
3048
65
            if (key_type == &PyTuple_Type) {
3049
0
                ms.tuple_elem_compare = safe_object_compare;
3050
0
            }
3051
65
            else {
3052
65
                ms.tuple_elem_compare = ms.key_compare;
3053
65
            }
3054
3055
65
            ms.key_compare = unsafe_tuple_compare;
3056
65
        }
3057
195k
    }
3058
    /* End of pre-sort check: ms is now set properly! */
3059
3060
772k
    merge_init(&ms, saved_ob_size, keys != NULL, &lo);
3061
3062
772k
    nremaining = saved_ob_size;
3063
772k
    if (nremaining < 2)
3064
576k
        goto succeed;
3065
3066
    /* Reverse sort stability achieved by initially reversing the list,
3067
    applying a stable forward sort, then reversing the final result. */
3068
195k
    if (reverse) {
3069
2
        if (keys != NULL)
3070
0
            reverse_slice(&keys[0], &keys[saved_ob_size]);
3071
2
        reverse_slice(&saved_ob_item[0], &saved_ob_item[saved_ob_size]);
3072
2
    }
3073
3074
    /* March over the array once, left to right, finding natural runs,
3075
     * and extending short natural runs to minrun elements.
3076
     */
3077
267k
    do {
3078
267k
        Py_ssize_t n;
3079
3080
        /* Identify next run. */
3081
267k
        n = count_run(&ms, &lo, nremaining);
3082
267k
        if (n < 0)
3083
0
            goto fail;
3084
        /* If short, extend to min(minrun, nremaining). */
3085
267k
        minrun = minrun_next(&ms);
3086
267k
        if (n < minrun) {
3087
132k
            const Py_ssize_t force = nremaining <= minrun ?
3088
85.6k
                              nremaining : minrun;
3089
132k
            if (binarysort(&ms, &lo, force, n) < 0)
3090
0
                goto fail;
3091
132k
            n = force;
3092
132k
        }
3093
        /* Maybe merge pending runs. */
3094
267k
        assert(ms.n == 0 || ms.pending[ms.n -1].base.keys +
3095
267k
                            ms.pending[ms.n-1].len == lo.keys);
3096
267k
        if (found_new_run(&ms, n) < 0)
3097
0
            goto fail;
3098
        /* Push new run on stack. */
3099
267k
        assert(ms.n < MAX_MERGE_PENDING);
3100
267k
        ms.pending[ms.n].base = lo;
3101
267k
        ms.pending[ms.n].len = n;
3102
267k
        ++ms.n;
3103
        /* Advance to find next run. */
3104
267k
        sortslice_advance(&lo, n);
3105
267k
        nremaining -= n;
3106
267k
    } while (nremaining);
3107
3108
195k
    if (merge_force_collapse(&ms) < 0)
3109
0
        goto fail;
3110
195k
    assert(ms.n == 1);
3111
195k
    assert(keys == NULL
3112
195k
           ? ms.pending[0].base.keys == saved_ob_item
3113
195k
           : ms.pending[0].base.keys == &keys[0]);
3114
195k
    assert(ms.pending[0].len == saved_ob_size);
3115
195k
    lo = ms.pending[0].base;
3116
3117
772k
succeed:
3118
772k
    result = Py_None;
3119
772k
fail:
3120
772k
    if (keys != NULL) {
3121
5.19M
        for (i = 0; i < saved_ob_size; i++)
3122
4.64M
            Py_DECREF(keys[i]);
3123
540k
        if (saved_ob_size >= MERGESTATE_TEMP_SIZE/2)
3124
4.12k
            PyMem_Free(keys);
3125
540k
    }
3126
3127
772k
    if (self->allocated != -1 && result != NULL) {
3128
        /* The user mucked with the list during the sort,
3129
         * and we don't already have another error to report.
3130
         */
3131
0
        PyErr_SetString(PyExc_ValueError, "list modified during sort");
3132
0
        result = NULL;
3133
0
    }
3134
3135
772k
    if (reverse && saved_ob_size > 1)
3136
2
        reverse_slice(saved_ob_item, saved_ob_item + saved_ob_size);
3137
3138
772k
    merge_freemem(&ms);
3139
3140
772k
keyfunc_fail:
3141
772k
    final_ob_item = self->ob_item;
3142
772k
    i = Py_SIZE(self);
3143
772k
    Py_SET_SIZE(self, saved_ob_size);
3144
772k
    FT_ATOMIC_STORE_PTR_RELEASE(self->ob_item, saved_ob_item);
3145
772k
    FT_ATOMIC_STORE_SSIZE_RELAXED(self->allocated, saved_allocated);
3146
772k
    if (final_ob_item != NULL) {
3147
        /* we cannot use list_clear() for this because it does not
3148
           guarantee that the list is really empty when it returns */
3149
0
        while (--i >= 0) {
3150
0
            Py_XDECREF(final_ob_item[i]);
3151
0
        }
3152
#ifdef Py_GIL_DISABLED
3153
        ensure_shared_on_resize(self);
3154
        bool use_qsbr = _PyObject_GC_IS_SHARED(self);
3155
#else
3156
0
        bool use_qsbr = false;
3157
0
#endif
3158
0
        free_list_items(final_ob_item, use_qsbr);
3159
0
    }
3160
772k
    return Py_XNewRef(result);
3161
772k
}
3162
#undef IFLT
3163
#undef ISLT
3164
3165
int
3166
PyList_Sort(PyObject *v)
3167
15.0k
{
3168
15.0k
    if (v == NULL || !PyList_Check(v)) {
3169
0
        PyErr_BadInternalCall();
3170
0
        return -1;
3171
0
    }
3172
15.0k
    Py_BEGIN_CRITICAL_SECTION(v);
3173
15.0k
    v = list_sort_impl((PyListObject *)v, NULL, 0);
3174
15.0k
    Py_END_CRITICAL_SECTION();
3175
15.0k
    if (v == NULL)
3176
0
        return -1;
3177
15.0k
    Py_DECREF(v);
3178
15.0k
    return 0;
3179
15.0k
}
3180
3181
/*[clinic input]
3182
@critical_section
3183
list.reverse
3184
3185
Reverse *IN PLACE*.
3186
[clinic start generated code]*/
3187
3188
static PyObject *
3189
list_reverse_impl(PyListObject *self)
3190
/*[clinic end generated code: output=482544fc451abea9 input=04ac8e0c6a66e4d9]*/
3191
0
{
3192
0
    if (Py_SIZE(self) > 1)
3193
0
        reverse_slice(self->ob_item, self->ob_item + Py_SIZE(self));
3194
0
    Py_RETURN_NONE;
3195
0
}
3196
3197
int
3198
PyList_Reverse(PyObject *v)
3199
50
{
3200
50
    PyListObject *self = (PyListObject *)v;
3201
3202
50
    if (v == NULL || !PyList_Check(v)) {
3203
0
        PyErr_BadInternalCall();
3204
0
        return -1;
3205
0
    }
3206
50
    Py_BEGIN_CRITICAL_SECTION(self);
3207
50
    if (Py_SIZE(self) > 1) {
3208
50
        reverse_slice(self->ob_item, self->ob_item + Py_SIZE(self));
3209
50
    }
3210
50
    Py_END_CRITICAL_SECTION()
3211
50
    return 0;
3212
50
}
3213
3214
PyObject *
3215
PyList_AsTuple(PyObject *v)
3216
307k
{
3217
307k
    if (v == NULL || !PyList_Check(v)) {
3218
0
        PyErr_BadInternalCall();
3219
0
        return NULL;
3220
0
    }
3221
307k
    PyObject *ret;
3222
307k
    PyListObject *self = (PyListObject *)v;
3223
307k
    Py_BEGIN_CRITICAL_SECTION(self);
3224
307k
    ret = _PyTuple_FromArray(self->ob_item, Py_SIZE(v));
3225
307k
    Py_END_CRITICAL_SECTION();
3226
307k
    return ret;
3227
307k
}
3228
3229
PyObject *
3230
_PyList_AsTupleAndClear(PyListObject *self)
3231
24
{
3232
24
    assert(self != NULL);
3233
24
    PyObject *ret;
3234
24
    if (self->ob_item == NULL) {
3235
0
        return PyTuple_New(0);
3236
0
    }
3237
24
    Py_BEGIN_CRITICAL_SECTION(self);
3238
24
    PyObject **items = self->ob_item;
3239
24
    Py_ssize_t size = Py_SIZE(self);
3240
24
    self->ob_item = NULL;
3241
24
    Py_SET_SIZE(self, 0);
3242
24
    ret = _PyTuple_FromArraySteal(items, size);
3243
24
    free_list_items(items, false);
3244
24
    Py_END_CRITICAL_SECTION();
3245
24
    return ret;
3246
24
}
3247
3248
PyObject *
3249
_PyList_FromStackRefStealOnSuccess(const _PyStackRef *src, Py_ssize_t n)
3250
197M
{
3251
197M
    if (n == 0) {
3252
178M
        return PyList_New(0);
3253
178M
    }
3254
3255
18.4M
    PyListObject *list = (PyListObject *)PyList_New(n);
3256
18.4M
    if (list == NULL) {
3257
0
        return NULL;
3258
0
    }
3259
3260
18.4M
    PyObject **dst = list->ob_item;
3261
52.1M
    for (Py_ssize_t i = 0; i < n; i++) {
3262
33.7M
        dst[i] = PyStackRef_AsPyObjectSteal(src[i]);
3263
33.7M
    }
3264
3265
18.4M
    return (PyObject *)list;
3266
18.4M
}
3267
3268
/*[clinic input]
3269
list.index
3270
3271
    value: object
3272
    start: slice_index(accept={int}) = 0
3273
    stop: slice_index(accept={int}, c_default="PY_SSIZE_T_MAX") = sys.maxsize
3274
    /
3275
3276
Return first index of value.
3277
3278
Raises ValueError if the value is not present.
3279
[clinic start generated code]*/
3280
3281
static PyObject *
3282
list_index_impl(PyListObject *self, PyObject *value, Py_ssize_t start,
3283
                Py_ssize_t stop)
3284
/*[clinic end generated code: output=ec51b88787e4e481 input=40ec5826303a0eb1]*/
3285
0
{
3286
0
    if (start < 0) {
3287
0
        start += Py_SIZE(self);
3288
0
        if (start < 0)
3289
0
            start = 0;
3290
0
    }
3291
0
    if (stop < 0) {
3292
0
        stop += Py_SIZE(self);
3293
0
        if (stop < 0)
3294
0
            stop = 0;
3295
0
    }
3296
0
    for (Py_ssize_t i = start; i < stop; i++) {
3297
0
        PyObject *obj = list_get_item_ref(self, i);
3298
0
        if (obj == NULL) {
3299
            // out-of-bounds
3300
0
            break;
3301
0
        }
3302
0
        int cmp = PyObject_RichCompareBool(obj, value, Py_EQ);
3303
0
        Py_DECREF(obj);
3304
0
        if (cmp > 0)
3305
0
            return PyLong_FromSsize_t(i);
3306
0
        else if (cmp < 0)
3307
0
            return NULL;
3308
0
    }
3309
0
    PyErr_SetString(PyExc_ValueError, "list.index(x): x not in list");
3310
0
    return NULL;
3311
0
}
3312
3313
/*[clinic input]
3314
list.count
3315
3316
     value: object
3317
     /
3318
3319
Return number of occurrences of value.
3320
[clinic start generated code]*/
3321
3322
static PyObject *
3323
list_count_impl(PyListObject *self, PyObject *value)
3324
/*[clinic end generated code: output=eff66f14aef2df86 input=3bdc3a5e6f749565]*/
3325
0
{
3326
0
    Py_ssize_t count = 0;
3327
0
    for (Py_ssize_t i = 0; ; i++) {
3328
0
        PyObject *obj = list_get_item_ref(self, i);
3329
0
        if (obj == NULL) {
3330
            // out-of-bounds
3331
0
            break;
3332
0
        }
3333
0
        if (obj == value) {
3334
0
           count++;
3335
0
           Py_DECREF(obj);
3336
0
           continue;
3337
0
        }
3338
0
        int cmp = PyObject_RichCompareBool(obj, value, Py_EQ);
3339
0
        Py_DECREF(obj);
3340
0
        if (cmp > 0)
3341
0
            count++;
3342
0
        else if (cmp < 0)
3343
0
            return NULL;
3344
0
    }
3345
0
    return PyLong_FromSsize_t(count);
3346
0
}
3347
3348
/*[clinic input]
3349
@critical_section
3350
list.remove
3351
3352
     value: object
3353
     /
3354
3355
Remove first occurrence of value.
3356
3357
Raises ValueError if the value is not present.
3358
[clinic start generated code]*/
3359
3360
static PyObject *
3361
list_remove_impl(PyListObject *self, PyObject *value)
3362
/*[clinic end generated code: output=b9b76a6633b18778 input=26c813dbb95aa93b]*/
3363
2.78k
{
3364
2.78k
    Py_ssize_t i;
3365
3366
2.79k
    for (i = 0; i < Py_SIZE(self); i++) {
3367
2.79k
        PyObject *obj = self->ob_item[i];
3368
2.79k
        Py_INCREF(obj);
3369
2.79k
        int cmp = PyObject_RichCompareBool(obj, value, Py_EQ);
3370
2.79k
        Py_DECREF(obj);
3371
2.79k
        if (cmp > 0) {
3372
2.78k
            if (list_ass_slice_lock_held(self, i, i+1, NULL) == 0)
3373
2.78k
                Py_RETURN_NONE;
3374
0
            return NULL;
3375
2.78k
        }
3376
10
        else if (cmp < 0)
3377
0
            return NULL;
3378
2.79k
    }
3379
2
    PyErr_SetString(PyExc_ValueError, "list.remove(x): x not in list");
3380
2
    return NULL;
3381
2.78k
}
3382
3383
static int
3384
list_traverse(PyObject *self, visitproc visit, void *arg)
3385
59.5M
{
3386
59.5M
    PyListObject *o = (PyListObject *)self;
3387
59.5M
    Py_ssize_t i;
3388
3389
749M
    for (i = Py_SIZE(o); --i >= 0; )
3390
689M
        Py_VISIT(o->ob_item[i]);
3391
59.5M
    return 0;
3392
59.5M
}
3393
3394
static PyObject *
3395
list_richcompare_impl(PyObject *v, PyObject *w, int op)
3396
4.09k
{
3397
4.09k
    PyListObject *vl, *wl;
3398
4.09k
    Py_ssize_t i;
3399
3400
4.09k
    if (!PyList_Check(v) || !PyList_Check(w))
3401
763
        Py_RETURN_NOTIMPLEMENTED;
3402
3403
3.32k
    vl = (PyListObject *)v;
3404
3.32k
    wl = (PyListObject *)w;
3405
3406
3.32k
    if (Py_SIZE(vl) != Py_SIZE(wl) && (op == Py_EQ || op == Py_NE)) {
3407
        /* Shortcut: if the lengths differ, the lists differ */
3408
476
        if (op == Py_EQ)
3409
476
            Py_RETURN_FALSE;
3410
0
        else
3411
0
            Py_RETURN_TRUE;
3412
476
    }
3413
3414
    /* Search for the first index where items are different */
3415
3.05k
    for (i = 0; i < Py_SIZE(vl) && i < Py_SIZE(wl); i++) {
3416
412
        PyObject *vitem = vl->ob_item[i];
3417
412
        PyObject *witem = wl->ob_item[i];
3418
412
        if (vitem == witem) {
3419
158
            continue;
3420
158
        }
3421
3422
254
        Py_INCREF(vitem);
3423
254
        Py_INCREF(witem);
3424
254
        int k = PyObject_RichCompareBool(vitem, witem, Py_EQ);
3425
254
        Py_DECREF(vitem);
3426
254
        Py_DECREF(witem);
3427
254
        if (k < 0)
3428
0
            return NULL;
3429
254
        if (!k)
3430
206
            break;
3431
254
    }
3432
3433
2.85k
    if (i >= Py_SIZE(vl) || i >= Py_SIZE(wl)) {
3434
        /* No more items to compare -- compare sizes */
3435
2.64k
        Py_RETURN_RICHCOMPARE(Py_SIZE(vl), Py_SIZE(wl), op);
3436
2.64k
    }
3437
3438
    /* We have an item that differs -- shortcuts for EQ/NE */
3439
206
    if (op == Py_EQ) {
3440
194
        Py_RETURN_FALSE;
3441
194
    }
3442
12
    if (op == Py_NE) {
3443
12
        Py_RETURN_TRUE;
3444
12
    }
3445
3446
    /* Compare the final item again using the proper operator */
3447
0
    PyObject *vitem = vl->ob_item[i];
3448
0
    PyObject *witem = wl->ob_item[i];
3449
0
    Py_INCREF(vitem);
3450
0
    Py_INCREF(witem);
3451
0
    PyObject *result = PyObject_RichCompare(vl->ob_item[i], wl->ob_item[i], op);
3452
0
    Py_DECREF(vitem);
3453
0
    Py_DECREF(witem);
3454
0
    return result;
3455
12
}
3456
3457
static PyObject *
3458
list_richcompare(PyObject *v, PyObject *w, int op)
3459
4.09k
{
3460
4.09k
    PyObject *ret;
3461
4.09k
    Py_BEGIN_CRITICAL_SECTION2(v, w);
3462
4.09k
    ret = list_richcompare_impl(v, w, op);
3463
4.09k
    Py_END_CRITICAL_SECTION2()
3464
4.09k
    return ret;
3465
4.09k
}
3466
3467
/*[clinic input]
3468
list.__init__
3469
3470
    iterable: object(c_default="NULL") = ()
3471
    /
3472
3473
Built-in mutable sequence.
3474
3475
If no argument is given, the constructor creates a new empty list.
3476
The argument must be an iterable if specified.
3477
[clinic start generated code]*/
3478
3479
static int
3480
list___init___impl(PyListObject *self, PyObject *iterable)
3481
/*[clinic end generated code: output=0f3c21379d01de48 input=b3f3fe7206af8f6b]*/
3482
20.1M
{
3483
    /* Verify list invariants established by PyType_GenericAlloc() */
3484
20.1M
    assert(0 <= Py_SIZE(self));
3485
20.1M
    assert(Py_SIZE(self) <= self->allocated || self->allocated == -1);
3486
20.1M
    assert(self->ob_item != NULL ||
3487
20.1M
           self->allocated == 0 || self->allocated == -1);
3488
3489
    /* Empty previous contents */
3490
20.1M
    if (self->ob_item != NULL) {
3491
0
        Py_BEGIN_CRITICAL_SECTION(self);
3492
0
        list_clear(self);
3493
0
        Py_END_CRITICAL_SECTION();
3494
0
    }
3495
20.1M
    if (iterable != NULL) {
3496
8.99M
        if (_list_extend(self, iterable) < 0) {
3497
0
            return -1;
3498
0
        }
3499
8.99M
    }
3500
20.1M
    return 0;
3501
20.1M
}
3502
3503
static PyObject *
3504
list_vectorcall(PyObject *type, PyObject * const*args,
3505
                size_t nargsf, PyObject *kwnames)
3506
8.99M
{
3507
8.99M
    if (!_PyArg_NoKwnames("list", kwnames)) {
3508
0
        return NULL;
3509
0
    }
3510
8.99M
    Py_ssize_t nargs = PyVectorcall_NARGS(nargsf);
3511
8.99M
    if (!_PyArg_CheckPositional("list", nargs, 0, 1)) {
3512
0
        return NULL;
3513
0
    }
3514
3515
8.99M
    PyObject *list = PyType_GenericAlloc(_PyType_CAST(type), 0);
3516
8.99M
    if (list == NULL) {
3517
0
        return NULL;
3518
0
    }
3519
8.99M
    if (nargs) {
3520
8.99M
        if (list___init___impl((PyListObject *)list, args[0])) {
3521
0
            Py_DECREF(list);
3522
0
            return NULL;
3523
0
        }
3524
8.99M
    }
3525
8.99M
    return list;
3526
8.99M
}
3527
3528
3529
/*[clinic input]
3530
list.__sizeof__
3531
3532
Return the size of the list in memory, in bytes.
3533
[clinic start generated code]*/
3534
3535
static PyObject *
3536
list___sizeof___impl(PyListObject *self)
3537
/*[clinic end generated code: output=3417541f95f9a53e input=b8030a5d5ce8a187]*/
3538
0
{
3539
0
    size_t res = _PyObject_SIZE(Py_TYPE(self));
3540
0
    Py_ssize_t allocated = FT_ATOMIC_LOAD_SSIZE_RELAXED(self->allocated);
3541
0
    res += (size_t)allocated * sizeof(void*);
3542
0
    return PyLong_FromSize_t(res);
3543
0
}
3544
3545
static PyObject *list_iter(PyObject *seq);
3546
static PyObject *list_subscript(PyObject*, PyObject*);
3547
3548
static PyMethodDef list_methods[] = {
3549
    {"__getitem__", list_subscript, METH_O|METH_COEXIST,
3550
     PyDoc_STR("__getitem__($self, index, /)\n--\n\nReturn self[index].")},
3551
    LIST___REVERSED___METHODDEF
3552
    LIST___SIZEOF___METHODDEF
3553
    PY_LIST_CLEAR_METHODDEF
3554
    LIST_COPY_METHODDEF
3555
    LIST_APPEND_METHODDEF
3556
    LIST_INSERT_METHODDEF
3557
    LIST_EXTEND_METHODDEF
3558
    LIST_POP_METHODDEF
3559
    LIST_REMOVE_METHODDEF
3560
    LIST_INDEX_METHODDEF
3561
    LIST_COUNT_METHODDEF
3562
    LIST_REVERSE_METHODDEF
3563
    LIST_SORT_METHODDEF
3564
    {"__class_getitem__", Py_GenericAlias, METH_O|METH_CLASS, PyDoc_STR("See PEP 585")},
3565
    {NULL,              NULL}           /* sentinel */
3566
};
3567
3568
static PySequenceMethods list_as_sequence = {
3569
    list_length,                                /* sq_length */
3570
    list_concat,                                /* sq_concat */
3571
    list_repeat,                                /* sq_repeat */
3572
    list_item,                                  /* sq_item */
3573
    0,                                          /* sq_slice */
3574
    list_ass_item,                              /* sq_ass_item */
3575
    0,                                          /* sq_ass_slice */
3576
    list_contains,                              /* sq_contains */
3577
    list_inplace_concat,                        /* sq_inplace_concat */
3578
    list_inplace_repeat,                        /* sq_inplace_repeat */
3579
};
3580
3581
static inline PyObject *
3582
list_slice_step_lock_held(PyListObject *a, Py_ssize_t start, Py_ssize_t step, Py_ssize_t len)
3583
48
{
3584
48
    PyListObject *np = (PyListObject *)list_new_prealloc(len);
3585
48
    if (np == NULL) {
3586
0
        return NULL;
3587
0
    }
3588
48
    size_t cur;
3589
48
    Py_ssize_t i;
3590
48
    PyObject **src = a->ob_item;
3591
48
    PyObject **dest = np->ob_item;
3592
480
    for (cur = start, i = 0; i < len;
3593
432
            cur += (size_t)step, i++) {
3594
432
        PyObject *v = src[cur];
3595
432
        dest[i] = Py_NewRef(v);
3596
432
    }
3597
48
    Py_SET_SIZE(np, len);
3598
48
    return (PyObject *)np;
3599
48
}
3600
3601
static PyObject *
3602
list_slice_wrap(PyListObject *aa, Py_ssize_t start, Py_ssize_t stop, Py_ssize_t step)
3603
2.50M
{
3604
2.50M
    PyObject *res = NULL;
3605
2.50M
    Py_BEGIN_CRITICAL_SECTION(aa);
3606
2.50M
    Py_ssize_t len = PySlice_AdjustIndices(Py_SIZE(aa), &start, &stop, step);
3607
2.50M
    if (len <= 0) {
3608
440k
        res = PyList_New(0);
3609
440k
    }
3610
2.06M
    else if (step == 1) {
3611
2.06M
        res = list_slice_lock_held(aa, start, stop);
3612
2.06M
    }
3613
48
    else {
3614
48
        res = list_slice_step_lock_held(aa, start, step, len);
3615
48
    }
3616
2.50M
    Py_END_CRITICAL_SECTION();
3617
2.50M
    return res;
3618
2.50M
}
3619
3620
static inline PyObject*
3621
list_slice_subscript(PyObject* self, PyObject* item)
3622
2.50M
{
3623
2.50M
    assert(PyList_Check(self));
3624
2.50M
    assert(PySlice_Check(item));
3625
2.50M
    Py_ssize_t start, stop, step;
3626
2.50M
    if (PySlice_Unpack(item, &start, &stop, &step) < 0) {
3627
0
        return NULL;
3628
0
    }
3629
2.50M
    return list_slice_wrap((PyListObject *)self, start, stop, step);
3630
2.50M
}
3631
3632
PyObject *
3633
_PyList_SliceSubscript(PyObject* _self, PyObject* item)
3634
2.36M
{
3635
2.36M
    return list_slice_subscript(_self, item);
3636
2.36M
}
3637
3638
static PyObject *
3639
list_subscript(PyObject* _self, PyObject* item)
3640
16.6M
{
3641
16.6M
    PyListObject* self = (PyListObject*)_self;
3642
16.6M
    if (_PyIndex_Check(item)) {
3643
16.4M
        Py_ssize_t i;
3644
16.4M
        i = PyNumber_AsSsize_t(item, PyExc_IndexError);
3645
16.4M
        if (i == -1 && PyErr_Occurred())
3646
0
            return NULL;
3647
16.4M
        if (i < 0)
3648
12.9M
            i += PyList_GET_SIZE(self);
3649
16.4M
        return list_item((PyObject *)self, i);
3650
16.4M
    }
3651
144k
    else if (PySlice_Check(item)) {
3652
144k
        return list_slice_subscript(_self, item);
3653
144k
    }
3654
0
    else {
3655
0
        PyErr_Format(PyExc_TypeError,
3656
0
                     "list indices must be integers or slices, not %.200s",
3657
0
                     Py_TYPE(item)->tp_name);
3658
0
        return NULL;
3659
0
    }
3660
16.6M
}
3661
3662
static Py_ssize_t
3663
adjust_slice_indexes(PyListObject *lst,
3664
                     Py_ssize_t *start, Py_ssize_t *stop,
3665
                     Py_ssize_t step)
3666
252k
{
3667
252k
    Py_ssize_t slicelength = PySlice_AdjustIndices(Py_SIZE(lst), start, stop,
3668
252k
                                                   step);
3669
3670
    /* Make sure s[5:2] = [..] inserts at the right place:
3671
        before 5, not before 2. */
3672
252k
    if ((step < 0 && *start < *stop) ||
3673
252k
        (step > 0 && *start > *stop))
3674
0
        *stop = *start;
3675
3676
252k
    return slicelength;
3677
252k
}
3678
3679
static int
3680
list_ass_subscript_lock_held(PyObject *_self, PyObject *item, PyObject *value)
3681
255k
{
3682
255k
    _Py_CRITICAL_SECTION_ASSERT_OBJECT_LOCKED(_self);
3683
3684
255k
    PyListObject *self = (PyListObject *)_self;
3685
255k
    if (_PyIndex_Check(item)) {
3686
3.18k
        Py_ssize_t i = PyNumber_AsSsize_t(item, PyExc_IndexError);
3687
3.18k
        if (i == -1 && PyErr_Occurred())
3688
0
            return -1;
3689
3.18k
        if (i < 0)
3690
3.04k
            i += PyList_GET_SIZE(self);
3691
3.18k
        return list_ass_item_lock_held(self, i, value);
3692
3.18k
    }
3693
252k
    else if (PySlice_Check(item)) {
3694
252k
        Py_ssize_t start, stop, step;
3695
3696
252k
        if (PySlice_Unpack(item, &start, &stop, &step) < 0) {
3697
0
            return -1;
3698
0
        }
3699
3700
252k
        if (value == NULL) {
3701
            /* delete slice */
3702
12
            PyObject **garbage;
3703
12
            size_t cur;
3704
12
            Py_ssize_t i;
3705
12
            int res;
3706
3707
12
            Py_ssize_t slicelength = adjust_slice_indexes(self, &start, &stop,
3708
12
                                                          step);
3709
3710
12
            if (step == 1)
3711
12
                return list_ass_slice_lock_held(self, start, stop, value);
3712
3713
0
            if (slicelength <= 0)
3714
0
                return 0;
3715
3716
0
            if (step < 0) {
3717
0
                stop = start + 1;
3718
0
                start = stop + step*(slicelength - 1) - 1;
3719
0
                step = -step;
3720
0
            }
3721
3722
0
            garbage = (PyObject**)
3723
0
                PyMem_Malloc(slicelength*sizeof(PyObject*));
3724
0
            if (!garbage) {
3725
0
                PyErr_NoMemory();
3726
0
                return -1;
3727
0
            }
3728
3729
            /* drawing pictures might help understand these for
3730
               loops. Basically, we memmove the parts of the
3731
               list that are *not* part of the slice: step-1
3732
               items for each item that is part of the slice,
3733
               and then tail end of the list that was not
3734
               covered by the slice */
3735
0
            for (cur = start, i = 0;
3736
0
                 cur < (size_t)stop;
3737
0
                 cur += step, i++) {
3738
0
                Py_ssize_t lim = step - 1;
3739
3740
0
                garbage[i] = PyList_GET_ITEM(self, cur);
3741
3742
0
                if (cur + step >= (size_t)Py_SIZE(self)) {
3743
0
                    lim = Py_SIZE(self) - cur - 1;
3744
0
                }
3745
3746
0
                memmove(self->ob_item + cur - i,
3747
0
                    self->ob_item + cur + 1,
3748
0
                    lim * sizeof(PyObject *));
3749
0
            }
3750
0
            cur = start + (size_t)slicelength * step;
3751
0
            if (cur < (size_t)Py_SIZE(self)) {
3752
0
                memmove(self->ob_item + cur - slicelength,
3753
0
                    self->ob_item + cur,
3754
0
                    (Py_SIZE(self) - cur) *
3755
0
                     sizeof(PyObject *));
3756
0
            }
3757
3758
0
            Py_SET_SIZE(self, Py_SIZE(self) - slicelength);
3759
0
            res = list_resize(self, Py_SIZE(self));
3760
3761
0
            for (i = 0; i < slicelength; i++) {
3762
0
                Py_DECREF(garbage[i]);
3763
0
            }
3764
0
            PyMem_Free(garbage);
3765
3766
0
            return res;
3767
0
        }
3768
252k
        else {
3769
            /* assign slice */
3770
252k
            PyObject *ins, *seq;
3771
252k
            PyObject **garbage, **seqitems, **selfitems;
3772
252k
            Py_ssize_t i;
3773
252k
            size_t cur;
3774
3775
            /* protect against a[::-1] = a */
3776
252k
            if (self == (PyListObject*)value) {
3777
0
                seq = list_slice_lock_held((PyListObject *)value, 0,
3778
0
                                            Py_SIZE(value));
3779
0
            }
3780
252k
            else {
3781
252k
                seq = PySequence_Fast(value,
3782
252k
                                      "must assign iterable "
3783
252k
                                      "to extended slice");
3784
252k
            }
3785
252k
            if (!seq)
3786
0
                return -1;
3787
3788
252k
            Py_ssize_t slicelength = adjust_slice_indexes(self, &start, &stop,
3789
252k
                                                          step);
3790
3791
252k
            if (step == 1) {
3792
252k
                int res = list_ass_slice_lock_held(self, start, stop, seq);
3793
252k
                Py_DECREF(seq);
3794
252k
                return res;
3795
252k
            }
3796
3797
0
            if (PySequence_Fast_GET_SIZE(seq) != slicelength) {
3798
0
                PyErr_Format(PyExc_ValueError,
3799
0
                    "attempt to assign sequence of "
3800
0
                    "size %zd to extended slice of "
3801
0
                    "size %zd",
3802
0
                         PySequence_Fast_GET_SIZE(seq),
3803
0
                         slicelength);
3804
0
                Py_DECREF(seq);
3805
0
                return -1;
3806
0
            }
3807
3808
0
            if (!slicelength) {
3809
0
                Py_DECREF(seq);
3810
0
                return 0;
3811
0
            }
3812
3813
0
            garbage = (PyObject**)
3814
0
                PyMem_Malloc(slicelength*sizeof(PyObject*));
3815
0
            if (!garbage) {
3816
0
                Py_DECREF(seq);
3817
0
                PyErr_NoMemory();
3818
0
                return -1;
3819
0
            }
3820
3821
0
            selfitems = self->ob_item;
3822
0
            seqitems = PySequence_Fast_ITEMS(seq);
3823
0
            for (cur = start, i = 0; i < slicelength;
3824
0
                 cur += (size_t)step, i++) {
3825
0
                garbage[i] = selfitems[cur];
3826
0
                ins = Py_NewRef(seqitems[i]);
3827
0
                selfitems[cur] = ins;
3828
0
            }
3829
3830
0
            for (i = 0; i < slicelength; i++) {
3831
0
                Py_DECREF(garbage[i]);
3832
0
            }
3833
3834
0
            PyMem_Free(garbage);
3835
0
            Py_DECREF(seq);
3836
3837
0
            return 0;
3838
0
        }
3839
252k
    }
3840
0
    else {
3841
0
        PyErr_Format(PyExc_TypeError,
3842
0
                     "list indices must be integers or slices, not %.200s",
3843
0
                     Py_TYPE(item)->tp_name);
3844
0
        return -1;
3845
0
    }
3846
255k
}
3847
3848
static int
3849
list_ass_subscript(PyObject *self, PyObject *item, PyObject *value)
3850
255k
{
3851
255k
    int res;
3852
#ifdef Py_GIL_DISABLED
3853
    if (PySlice_Check(item) && value != NULL && PyList_CheckExact(value)) {
3854
        Py_BEGIN_CRITICAL_SECTION2(self, value);
3855
        res = list_ass_subscript_lock_held(self, item, value);
3856
        Py_END_CRITICAL_SECTION2();
3857
        return res;
3858
    }
3859
#endif
3860
255k
    Py_BEGIN_CRITICAL_SECTION(self);
3861
255k
    res = list_ass_subscript_lock_held(self, item, value);
3862
255k
    Py_END_CRITICAL_SECTION();
3863
255k
    return res;
3864
255k
}
3865
3866
static PyMappingMethods list_as_mapping = {
3867
    list_length,
3868
    list_subscript,
3869
    list_ass_subscript
3870
};
3871
3872
PyTypeObject PyList_Type = {
3873
    PyVarObject_HEAD_INIT(&PyType_Type, 0)
3874
    "list",
3875
    sizeof(PyListObject),
3876
    0,
3877
    list_dealloc,                               /* tp_dealloc */
3878
    0,                                          /* tp_vectorcall_offset */
3879
    0,                                          /* tp_getattr */
3880
    0,                                          /* tp_setattr */
3881
    0,                                          /* tp_as_async */
3882
    list_repr,                                  /* tp_repr */
3883
    0,                                          /* tp_as_number */
3884
    &list_as_sequence,                          /* tp_as_sequence */
3885
    &list_as_mapping,                           /* tp_as_mapping */
3886
    PyObject_HashNotImplemented,                /* tp_hash */
3887
    0,                                          /* tp_call */
3888
    0,                                          /* tp_str */
3889
    PyObject_GenericGetAttr,                    /* tp_getattro */
3890
    0,                                          /* tp_setattro */
3891
    0,                                          /* tp_as_buffer */
3892
    Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC |
3893
        Py_TPFLAGS_BASETYPE | Py_TPFLAGS_LIST_SUBCLASS |
3894
        _Py_TPFLAGS_MATCH_SELF | Py_TPFLAGS_SEQUENCE,  /* tp_flags */
3895
    list___init____doc__,                       /* tp_doc */
3896
    list_traverse,                              /* tp_traverse */
3897
    list_clear_slot,                            /* tp_clear */
3898
    list_richcompare,                           /* tp_richcompare */
3899
    0,                                          /* tp_weaklistoffset */
3900
    list_iter,                                  /* tp_iter */
3901
    0,                                          /* tp_iternext */
3902
    list_methods,                               /* tp_methods */
3903
    0,                                          /* tp_members */
3904
    0,                                          /* tp_getset */
3905
    0,                                          /* tp_base */
3906
    0,                                          /* tp_dict */
3907
    0,                                          /* tp_descr_get */
3908
    0,                                          /* tp_descr_set */
3909
    0,                                          /* tp_dictoffset */
3910
    list___init__,                              /* tp_init */
3911
    PyType_GenericAlloc,                        /* tp_alloc */
3912
    PyType_GenericNew,                          /* tp_new */
3913
    PyObject_GC_Del,                            /* tp_free */
3914
    .tp_vectorcall = list_vectorcall,
3915
    .tp_version_tag = _Py_TYPE_VERSION_LIST,
3916
};
3917
3918
/*********************** List Iterator **************************/
3919
3920
static void listiter_dealloc(PyObject *);
3921
static int listiter_traverse(PyObject *, visitproc, void *);
3922
static PyObject *listiter_next(PyObject *);
3923
static PyObject *listiter_len(PyObject *, PyObject *);
3924
static PyObject *listiter_reduce_general(void *_it, int forward);
3925
static PyObject *listiter_reduce(PyObject *, PyObject *);
3926
static PyObject *listiter_setstate(PyObject *, PyObject *state);
3927
3928
PyDoc_STRVAR(length_hint_doc, "Private method returning an estimate of len(list(it)).");
3929
PyDoc_STRVAR(reduce_doc, "Return state information for pickling.");
3930
PyDoc_STRVAR(setstate_doc, "Set state information for unpickling.");
3931
3932
static PyMethodDef listiter_methods[] = {
3933
    {"__length_hint__", listiter_len, METH_NOARGS, length_hint_doc},
3934
    {"__reduce__", listiter_reduce, METH_NOARGS, reduce_doc},
3935
    {"__setstate__", listiter_setstate, METH_O, setstate_doc},
3936
    {NULL,              NULL}           /* sentinel */
3937
};
3938
3939
PyTypeObject PyListIter_Type = {
3940
    PyVarObject_HEAD_INIT(&PyType_Type, 0)
3941
    "list_iterator",                            /* tp_name */
3942
    sizeof(_PyListIterObject),                  /* tp_basicsize */
3943
    0,                                          /* tp_itemsize */
3944
    /* methods */
3945
    listiter_dealloc,               /* tp_dealloc */
3946
    0,                                          /* tp_vectorcall_offset */
3947
    0,                                          /* tp_getattr */
3948
    0,                                          /* tp_setattr */
3949
    0,                                          /* tp_as_async */
3950
    0,                                          /* tp_repr */
3951
    0,                                          /* tp_as_number */
3952
    0,                                          /* tp_as_sequence */
3953
    0,                                          /* tp_as_mapping */
3954
    0,                                          /* tp_hash */
3955
    0,                                          /* tp_call */
3956
    0,                                          /* tp_str */
3957
    PyObject_GenericGetAttr,                    /* tp_getattro */
3958
    0,                                          /* tp_setattro */
3959
    0,                                          /* tp_as_buffer */
3960
    Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC,/* tp_flags */
3961
    0,                                          /* tp_doc */
3962
    listiter_traverse,                          /* tp_traverse */
3963
    0,                                          /* tp_clear */
3964
    0,                                          /* tp_richcompare */
3965
    0,                                          /* tp_weaklistoffset */
3966
    PyObject_SelfIter,                          /* tp_iter */
3967
    listiter_next,                              /* tp_iternext */
3968
    listiter_methods,                           /* tp_methods */
3969
    0,                                          /* tp_members */
3970
};
3971
3972
3973
static PyObject *
3974
list_iter(PyObject *seq)
3975
33.7M
{
3976
33.7M
    if (!PyList_Check(seq)) {
3977
0
        PyErr_BadInternalCall();
3978
0
        return NULL;
3979
0
    }
3980
33.7M
    _PyListIterObject *it = _Py_FREELIST_POP(_PyListIterObject, list_iters);
3981
33.7M
    if (it == NULL) {
3982
1.74M
        it = PyObject_GC_New(_PyListIterObject, &PyListIter_Type);
3983
1.74M
        if (it == NULL) {
3984
0
            return NULL;
3985
0
        }
3986
1.74M
    }
3987
33.7M
    it->it_index = 0;
3988
33.7M
    it->it_seq = (PyListObject *)Py_NewRef(seq);
3989
33.7M
    _PyObject_GC_TRACK(it);
3990
33.7M
    return (PyObject *)it;
3991
33.7M
}
3992
3993
static void
3994
listiter_dealloc(PyObject *self)
3995
33.7M
{
3996
33.7M
    _PyListIterObject *it = (_PyListIterObject *)self;
3997
33.7M
    _PyObject_GC_UNTRACK(it);
3998
33.7M
    Py_XDECREF(it->it_seq);
3999
33.7M
    assert(Py_IS_TYPE(self, &PyListIter_Type));
4000
33.7M
    _Py_FREELIST_FREE(list_iters, it, PyObject_GC_Del);
4001
33.7M
}
4002
4003
static int
4004
listiter_traverse(PyObject *it, visitproc visit, void *arg)
4005
334k
{
4006
334k
    Py_VISIT(((_PyListIterObject *)it)->it_seq);
4007
334k
    return 0;
4008
334k
}
4009
4010
static PyObject *
4011
listiter_next(PyObject *self)
4012
147M
{
4013
147M
    _PyListIterObject *it = (_PyListIterObject *)self;
4014
147M
    Py_ssize_t index = FT_ATOMIC_LOAD_SSIZE_RELAXED(it->it_index);
4015
147M
    if (index < 0) {
4016
164
        return NULL;
4017
164
    }
4018
4019
147M
    PyObject *item = list_get_item_ref(it->it_seq, index);
4020
147M
    if (item == NULL) {
4021
        // out-of-bounds
4022
33.1M
        FT_ATOMIC_STORE_SSIZE_RELAXED(it->it_index, -1);
4023
33.1M
#ifndef Py_GIL_DISABLED
4024
33.1M
        PyListObject *seq = it->it_seq;
4025
33.1M
        it->it_seq = NULL;
4026
33.1M
        Py_DECREF(seq);
4027
33.1M
#endif
4028
33.1M
        return NULL;
4029
33.1M
    }
4030
114M
    FT_ATOMIC_STORE_SSIZE_RELAXED(it->it_index, index + 1);
4031
114M
    return item;
4032
147M
}
4033
4034
static PyObject *
4035
listiter_len(PyObject *self, PyObject *Py_UNUSED(ignored))
4036
1.37M
{
4037
1.37M
    assert(self != NULL);
4038
1.37M
    _PyListIterObject *it = (_PyListIterObject *)self;
4039
1.37M
    Py_ssize_t index = FT_ATOMIC_LOAD_SSIZE_RELAXED(it->it_index);
4040
1.37M
    if (index >= 0) {
4041
1.37M
        Py_ssize_t len = PyList_GET_SIZE(it->it_seq) - index;
4042
1.37M
        if (len >= 0)
4043
1.37M
            return PyLong_FromSsize_t(len);
4044
1.37M
    }
4045
0
    return PyLong_FromLong(0);
4046
1.37M
}
4047
4048
static PyObject *
4049
listiter_reduce(PyObject *it, PyObject *Py_UNUSED(ignored))
4050
0
{
4051
0
    return listiter_reduce_general(it, 1);
4052
0
}
4053
4054
static PyObject *
4055
listiter_setstate(PyObject *self, PyObject *state)
4056
0
{
4057
0
    _PyListIterObject *it = (_PyListIterObject *)self;
4058
0
    Py_ssize_t index = PyLong_AsSsize_t(state);
4059
0
    if (index == -1 && PyErr_Occurred())
4060
0
        return NULL;
4061
0
    if (it->it_seq != NULL) {
4062
0
        if (index < -1)
4063
0
            index = -1;
4064
0
        else if (index > PyList_GET_SIZE(it->it_seq))
4065
0
            index = PyList_GET_SIZE(it->it_seq); /* iterator exhausted */
4066
0
        FT_ATOMIC_STORE_SSIZE_RELAXED(it->it_index, index);
4067
0
    }
4068
0
    Py_RETURN_NONE;
4069
0
}
4070
4071
/*********************** List Reverse Iterator **************************/
4072
4073
typedef struct {
4074
    PyObject_HEAD
4075
    Py_ssize_t it_index;
4076
    PyListObject *it_seq; /* Set to NULL when iterator is exhausted */
4077
} listreviterobject;
4078
4079
static void listreviter_dealloc(PyObject *);
4080
static int listreviter_traverse(PyObject *, visitproc, void *);
4081
static PyObject *listreviter_next(PyObject *);
4082
static PyObject *listreviter_len(PyObject *, PyObject *);
4083
static PyObject *listreviter_reduce(PyObject *, PyObject *);
4084
static PyObject *listreviter_setstate(PyObject *, PyObject *);
4085
4086
static PyMethodDef listreviter_methods[] = {
4087
    {"__length_hint__", listreviter_len, METH_NOARGS, length_hint_doc},
4088
    {"__reduce__", listreviter_reduce, METH_NOARGS, reduce_doc},
4089
    {"__setstate__", listreviter_setstate, METH_O, setstate_doc},
4090
    {NULL,              NULL}           /* sentinel */
4091
};
4092
4093
PyTypeObject PyListRevIter_Type = {
4094
    PyVarObject_HEAD_INIT(&PyType_Type, 0)
4095
    "list_reverseiterator",                     /* tp_name */
4096
    sizeof(listreviterobject),                  /* tp_basicsize */
4097
    0,                                          /* tp_itemsize */
4098
    /* methods */
4099
    listreviter_dealloc,                        /* tp_dealloc */
4100
    0,                                          /* tp_vectorcall_offset */
4101
    0,                                          /* tp_getattr */
4102
    0,                                          /* tp_setattr */
4103
    0,                                          /* tp_as_async */
4104
    0,                                          /* tp_repr */
4105
    0,                                          /* tp_as_number */
4106
    0,                                          /* tp_as_sequence */
4107
    0,                                          /* tp_as_mapping */
4108
    0,                                          /* tp_hash */
4109
    0,                                          /* tp_call */
4110
    0,                                          /* tp_str */
4111
    PyObject_GenericGetAttr,                    /* tp_getattro */
4112
    0,                                          /* tp_setattro */
4113
    0,                                          /* tp_as_buffer */
4114
    Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC,/* tp_flags */
4115
    0,                                          /* tp_doc */
4116
    listreviter_traverse,                       /* tp_traverse */
4117
    0,                                          /* tp_clear */
4118
    0,                                          /* tp_richcompare */
4119
    0,                                          /* tp_weaklistoffset */
4120
    PyObject_SelfIter,                          /* tp_iter */
4121
    listreviter_next,                           /* tp_iternext */
4122
    listreviter_methods,                /* tp_methods */
4123
    0,
4124
};
4125
4126
/*[clinic input]
4127
list.__reversed__
4128
4129
Return a reverse iterator over the list.
4130
[clinic start generated code]*/
4131
4132
static PyObject *
4133
list___reversed___impl(PyListObject *self)
4134
/*[clinic end generated code: output=b166f073208c888c input=eadb6e17f8a6a280]*/
4135
40.6M
{
4136
40.6M
    listreviterobject *it;
4137
4138
40.6M
    it = PyObject_GC_New(listreviterobject, &PyListRevIter_Type);
4139
40.6M
    if (it == NULL)
4140
0
        return NULL;
4141
40.6M
    assert(PyList_Check(self));
4142
40.6M
    it->it_index = PyList_GET_SIZE(self) - 1;
4143
40.6M
    it->it_seq = (PyListObject*)Py_NewRef(self);
4144
40.6M
    PyObject_GC_Track(it);
4145
40.6M
    return (PyObject *)it;
4146
40.6M
}
4147
4148
static void
4149
listreviter_dealloc(PyObject *self)
4150
40.6M
{
4151
40.6M
    listreviterobject *it = (listreviterobject *)self;
4152
40.6M
    PyObject_GC_UnTrack(it);
4153
40.6M
    Py_XDECREF(it->it_seq);
4154
40.6M
    PyObject_GC_Del(it);
4155
40.6M
}
4156
4157
static int
4158
listreviter_traverse(PyObject *it, visitproc visit, void *arg)
4159
661
{
4160
661
    Py_VISIT(((listreviterobject *)it)->it_seq);
4161
661
    return 0;
4162
661
}
4163
4164
static PyObject *
4165
listreviter_next(PyObject *self)
4166
51.7M
{
4167
51.7M
    listreviterobject *it = (listreviterobject *)self;
4168
51.7M
    assert(it != NULL);
4169
51.7M
    Py_ssize_t index = FT_ATOMIC_LOAD_SSIZE_RELAXED(it->it_index);
4170
51.7M
    if (index < 0) {
4171
29.0M
        return NULL;
4172
29.0M
    }
4173
4174
22.6M
    PyListObject *seq = it->it_seq;
4175
22.6M
    assert(PyList_Check(seq));
4176
22.6M
    PyObject *item = list_get_item_ref(seq, index);
4177
22.6M
    if (item != NULL) {
4178
22.6M
        FT_ATOMIC_STORE_SSIZE_RELAXED(it->it_index, index - 1);
4179
22.6M
        return item;
4180
22.6M
    }
4181
0
    FT_ATOMIC_STORE_SSIZE_RELAXED(it->it_index, -1);
4182
0
#ifndef Py_GIL_DISABLED
4183
0
    it->it_seq = NULL;
4184
0
    Py_DECREF(seq);
4185
0
#endif
4186
0
    return NULL;
4187
22.6M
}
4188
4189
static PyObject *
4190
listreviter_len(PyObject *self, PyObject *Py_UNUSED(ignored))
4191
0
{
4192
0
    listreviterobject *it = (listreviterobject *)self;
4193
0
    Py_ssize_t index = FT_ATOMIC_LOAD_SSIZE_RELAXED(it->it_index);
4194
0
    Py_ssize_t len = index + 1;
4195
0
    if (it->it_seq == NULL || PyList_GET_SIZE(it->it_seq) < len)
4196
0
        len = 0;
4197
0
    return PyLong_FromSsize_t(len);
4198
0
}
4199
4200
static PyObject *
4201
listreviter_reduce(PyObject *it, PyObject *Py_UNUSED(ignored))
4202
0
{
4203
0
    return listiter_reduce_general(it, 0);
4204
0
}
4205
4206
static PyObject *
4207
listreviter_setstate(PyObject *self, PyObject *state)
4208
0
{
4209
0
    listreviterobject *it = (listreviterobject *)self;
4210
0
    Py_ssize_t index = PyLong_AsSsize_t(state);
4211
0
    if (index == -1 && PyErr_Occurred())
4212
0
        return NULL;
4213
0
    if (it->it_seq != NULL) {
4214
0
        if (index < -1)
4215
0
            index = -1;
4216
0
        else if (index > PyList_GET_SIZE(it->it_seq) - 1)
4217
0
            index = PyList_GET_SIZE(it->it_seq) - 1;
4218
0
        FT_ATOMIC_STORE_SSIZE_RELAXED(it->it_index, index);
4219
0
    }
4220
0
    Py_RETURN_NONE;
4221
0
}
4222
4223
/* common pickling support */
4224
4225
static PyObject *
4226
listiter_reduce_general(void *_it, int forward)
4227
0
{
4228
0
    PyObject *list;
4229
0
    PyObject *iter;
4230
4231
    /* _PyEval_GetBuiltin can invoke arbitrary code,
4232
     * call must be before access of iterator pointers.
4233
     * see issue #101765 */
4234
4235
0
    if (forward) {
4236
0
        iter = _PyEval_GetBuiltin(&_Py_ID(iter));
4237
0
        _PyListIterObject *it = (_PyListIterObject *)_it;
4238
0
        Py_ssize_t idx = FT_ATOMIC_LOAD_SSIZE_RELAXED(it->it_index);
4239
0
        if (idx >= 0) {
4240
0
            return Py_BuildValue("N(O)n", iter, it->it_seq, idx);
4241
0
        }
4242
0
    } else {
4243
0
        iter = _PyEval_GetBuiltin(&_Py_ID(reversed));
4244
0
        listreviterobject *it = (listreviterobject *)_it;
4245
0
        Py_ssize_t idx = FT_ATOMIC_LOAD_SSIZE_RELAXED(it->it_index);
4246
0
        if (idx >= 0) {
4247
0
            return Py_BuildValue("N(O)n", iter, it->it_seq, idx);
4248
0
        }
4249
0
    }
4250
    /* empty iterator, create an empty list */
4251
0
    list = PyList_New(0);
4252
0
    if (list == NULL)
4253
0
        return NULL;
4254
0
    return Py_BuildValue("N(N)", iter, list);
4255
0
}