Coverage Report

Created: 2025-09-05 07:10

/src/cpython/Objects/listobject.c
Line
Count
Source (jump to first uncovered line)
1
/* List object implementation */
2
3
#include "Python.h"
4
#include "pycore_abstract.h"      // _PyIndex_Check()
5
#include "pycore_ceval.h"         // _PyEval_GetBuiltin()
6
#include "pycore_critical_section.h"  // _Py_CRITICAL_SECTION_ASSERT_OBJECT_LOCKED()
7
#include "pycore_dict.h"          // _PyDictViewObject
8
#include "pycore_freelist.h"      // _Py_FREELIST_FREE(), _Py_FREELIST_POP()
9
#include "pycore_pyatomic_ft_wrappers.h"
10
#include "pycore_interp.h"        // PyInterpreterState.list
11
#include "pycore_list.h"          // struct _Py_list_freelist, _PyListIterObject
12
#include "pycore_long.h"          // _PyLong_DigitCount
13
#include "pycore_modsupport.h"    // _PyArg_NoKwnames()
14
#include "pycore_object.h"        // _PyObject_GC_TRACK(), _PyDebugAllocatorStats()
15
#include "pycore_stackref.h"      // _Py_TryIncrefCompareStackRef()
16
#include "pycore_tuple.h"         // _PyTuple_FromArray()
17
#include "pycore_typeobject.h"    // _Py_TYPE_VERSION_LIST
18
#include "pycore_setobject.h"     // _PySet_NextEntry()
19
#include <stddef.h>
20
21
/*[clinic input]
22
class list "PyListObject *" "&PyList_Type"
23
[clinic start generated code]*/
24
/*[clinic end generated code: output=da39a3ee5e6b4b0d input=f9b222678f9f71e0]*/
25
26
#include "clinic/listobject.c.h"
27
28
_Py_DECLARE_STR(list_err, "list index out of range");
29
30
#ifdef Py_GIL_DISABLED
31
typedef struct {
32
    Py_ssize_t allocated;
33
    PyObject *ob_item[];
34
} _PyListArray;
35
36
static _PyListArray *
37
list_allocate_array(size_t capacity)
38
{
39
    if (capacity > PY_SSIZE_T_MAX/sizeof(PyObject*) - 1) {
40
        return NULL;
41
    }
42
    _PyListArray *array = PyMem_Malloc(sizeof(_PyListArray) + capacity * sizeof(PyObject *));
43
    if (array == NULL) {
44
        return NULL;
45
    }
46
    array->allocated = capacity;
47
    return array;
48
}
49
50
static Py_ssize_t
51
list_capacity(PyObject **items)
52
{
53
    _PyListArray *array = _Py_CONTAINER_OF(items, _PyListArray, ob_item);
54
    return array->allocated;
55
}
56
#endif
57
58
static void
59
free_list_items(PyObject** items, bool use_qsbr)
60
111M
{
61
#ifdef Py_GIL_DISABLED
62
    _PyListArray *array = _Py_CONTAINER_OF(items, _PyListArray, ob_item);
63
    if (use_qsbr) {
64
        size_t size = sizeof(_PyListArray) + array->allocated * sizeof(PyObject *);
65
        _PyMem_FreeDelayed(array, size);
66
    }
67
    else {
68
        PyMem_Free(array);
69
    }
70
#else
71
111M
    PyMem_Free(items);
72
111M
#endif
73
111M
}
74
75
static void
76
ensure_shared_on_resize(PyListObject *self)
77
80.3M
{
78
#ifdef Py_GIL_DISABLED
79
    // We can't use _Py_CRITICAL_SECTION_ASSERT_OBJECT_LOCKED here because
80
    // the `CALL_LIST_APPEND` bytecode handler may lock the list without
81
    // a critical section.
82
    assert(Py_REFCNT(self) == 1 || PyMutex_IsLocked(&_PyObject_CAST(self)->ob_mutex));
83
84
    // Ensure that the list array is freed using QSBR if we are not the
85
    // owning thread.
86
    if (!_Py_IsOwnedByCurrentThread((PyObject *)self) &&
87
        !_PyObject_GC_IS_SHARED(self))
88
    {
89
        _PyObject_GC_SET_SHARED(self);
90
    }
91
#endif
92
80.3M
}
93
94
/* Ensure ob_item has room for at least newsize elements, and set
95
 * ob_size to newsize.  If newsize > ob_size on entry, the content
96
 * of the new slots at exit is undefined heap trash; it's the caller's
97
 * responsibility to overwrite them with sane values.
98
 * The number of allocated elements may grow, shrink, or stay the same.
99
 * Failure is impossible if newsize <= self.allocated on entry, although
100
 * that partly relies on an assumption that the system realloc() never
101
 * fails when passed a number of bytes <= the number of bytes last
102
 * allocated (the C standard doesn't guarantee this, but it's hard to
103
 * imagine a realloc implementation where it wouldn't be true).
104
 * Note that self->ob_item may change, and even if newsize is less
105
 * than ob_size on entry.
106
 */
107
static int
108
list_resize(PyListObject *self, Py_ssize_t newsize)
109
95.9M
{
110
95.9M
    size_t new_allocated, target_bytes;
111
95.9M
    Py_ssize_t allocated = self->allocated;
112
113
    /* Bypass realloc() when a previous overallocation is large enough
114
       to accommodate the newsize.  If the newsize falls lower than half
115
       the allocated size, then proceed with the realloc() to shrink the list.
116
    */
117
95.9M
    if (allocated >= newsize && newsize >= (allocated >> 1)) {
118
15.6M
        assert(self->ob_item != NULL || newsize == 0);
119
15.6M
        Py_SET_SIZE(self, newsize);
120
15.6M
        return 0;
121
15.6M
    }
122
123
    /* This over-allocates proportional to the list size, making room
124
     * for additional growth.  The over-allocation is mild, but is
125
     * enough to give linear-time amortized behavior over a long
126
     * sequence of appends() in the presence of a poorly-performing
127
     * system realloc().
128
     * Add padding to make the allocated size multiple of 4.
129
     * The growth pattern is:  0, 4, 8, 16, 24, 32, 40, 52, 64, 76, ...
130
     * Note: new_allocated won't overflow because the largest possible value
131
     *       is PY_SSIZE_T_MAX * (9 / 8) + 6 which always fits in a size_t.
132
     */
133
80.3M
    new_allocated = ((size_t)newsize + (newsize >> 3) + 6) & ~(size_t)3;
134
    /* Do not overallocate if the new size is closer to overallocated size
135
     * than to the old size.
136
     */
137
80.3M
    if (newsize - Py_SIZE(self) > (Py_ssize_t)(new_allocated - newsize))
138
9.43k
        new_allocated = ((size_t)newsize + 3) & ~(size_t)3;
139
140
80.3M
    if (newsize == 0)
141
2.42k
        new_allocated = 0;
142
143
80.3M
    ensure_shared_on_resize(self);
144
145
#ifdef Py_GIL_DISABLED
146
    _PyListArray *array = list_allocate_array(new_allocated);
147
    if (array == NULL) {
148
        PyErr_NoMemory();
149
        return -1;
150
    }
151
    PyObject **old_items = self->ob_item;
152
    if (self->ob_item) {
153
        if (new_allocated < (size_t)allocated) {
154
            target_bytes = new_allocated * sizeof(PyObject*);
155
        }
156
        else {
157
            target_bytes = allocated * sizeof(PyObject*);
158
        }
159
        memcpy(array->ob_item, self->ob_item, target_bytes);
160
    }
161
    if (new_allocated > (size_t)allocated) {
162
        memset(array->ob_item + allocated, 0, sizeof(PyObject *) * (new_allocated - allocated));
163
    }
164
     _Py_atomic_store_ptr_release(&self->ob_item, &array->ob_item);
165
    self->allocated = new_allocated;
166
    Py_SET_SIZE(self, newsize);
167
    if (old_items != NULL) {
168
        free_list_items(old_items, _PyObject_GC_IS_SHARED(self));
169
    }
170
#else
171
80.3M
    PyObject **items;
172
80.3M
    if (new_allocated <= (size_t)PY_SSIZE_T_MAX / sizeof(PyObject *)) {
173
80.3M
        target_bytes = new_allocated * sizeof(PyObject *);
174
80.3M
        items = (PyObject **)PyMem_Realloc(self->ob_item, target_bytes);
175
80.3M
    }
176
0
    else {
177
        // integer overflow
178
0
        items = NULL;
179
0
    }
180
80.3M
    if (items == NULL) {
181
0
        PyErr_NoMemory();
182
0
        return -1;
183
0
    }
184
80.3M
    self->ob_item = items;
185
80.3M
    Py_SET_SIZE(self, newsize);
186
80.3M
    self->allocated = new_allocated;
187
80.3M
#endif
188
80.3M
    return 0;
189
80.3M
}
190
191
static int
192
list_preallocate_exact(PyListObject *self, Py_ssize_t size)
193
5.96M
{
194
5.96M
    PyObject **items;
195
5.96M
    assert(self->ob_item == NULL);
196
5.96M
    assert(size > 0);
197
198
    /* Since the Python memory allocator has granularity of 16 bytes on 64-bit
199
     * platforms (8 on 32-bit), there is no benefit of allocating space for
200
     * the odd number of items, and there is no drawback of rounding the
201
     * allocated size up to the nearest even number.
202
     */
203
5.96M
    size = (size + 1) & ~(size_t)1;
204
#ifdef Py_GIL_DISABLED
205
    _PyListArray *array = list_allocate_array(size);
206
    if (array == NULL) {
207
        PyErr_NoMemory();
208
        return -1;
209
    }
210
    items = array->ob_item;
211
    memset(items, 0, size * sizeof(PyObject *));
212
#else
213
5.96M
    items = PyMem_New(PyObject*, size);
214
5.96M
    if (items == NULL) {
215
0
        PyErr_NoMemory();
216
0
        return -1;
217
0
    }
218
5.96M
#endif
219
5.96M
    FT_ATOMIC_STORE_PTR_RELEASE(self->ob_item, items);
220
5.96M
    self->allocated = size;
221
5.96M
    return 0;
222
5.96M
}
223
224
/* Print summary info about the state of the optimized allocator */
225
void
226
_PyList_DebugMallocStats(FILE *out)
227
0
{
228
0
    _PyDebugAllocatorStats(out,
229
0
                           "free PyListObject",
230
0
                            _Py_FREELIST_SIZE(lists),
231
0
                           sizeof(PyListObject));
232
0
}
233
234
PyObject *
235
PyList_New(Py_ssize_t size)
236
243M
{
237
243M
    if (size < 0) {
238
0
        PyErr_BadInternalCall();
239
0
        return NULL;
240
0
    }
241
242
243M
    PyListObject *op = _Py_FREELIST_POP(PyListObject, lists);
243
243M
    if (op == NULL) {
244
29.6M
        op = PyObject_GC_New(PyListObject, &PyList_Type);
245
29.6M
        if (op == NULL) {
246
0
            return NULL;
247
0
        }
248
29.6M
    }
249
243M
    if (size <= 0) {
250
202M
        op->ob_item = NULL;
251
202M
    }
252
40.9M
    else {
253
#ifdef Py_GIL_DISABLED
254
        _PyListArray *array = list_allocate_array(size);
255
        if (array == NULL) {
256
            Py_DECREF(op);
257
            return PyErr_NoMemory();
258
        }
259
        memset(&array->ob_item, 0, size * sizeof(PyObject *));
260
        op->ob_item = array->ob_item;
261
#else
262
40.9M
        op->ob_item = (PyObject **) PyMem_Calloc(size, sizeof(PyObject *));
263
40.9M
#endif
264
40.9M
        if (op->ob_item == NULL) {
265
0
            Py_DECREF(op);
266
0
            return PyErr_NoMemory();
267
0
        }
268
40.9M
    }
269
243M
    Py_SET_SIZE(op, size);
270
243M
    op->allocated = size;
271
243M
    _PyObject_GC_TRACK(op);
272
243M
    return (PyObject *) op;
273
243M
}
274
275
static PyObject *
276
list_new_prealloc(Py_ssize_t size)
277
13.6M
{
278
13.6M
    assert(size > 0);
279
13.6M
    PyListObject *op = (PyListObject *) PyList_New(0);
280
13.6M
    if (op == NULL) {
281
0
        return NULL;
282
0
    }
283
13.6M
    assert(op->ob_item == NULL);
284
#ifdef Py_GIL_DISABLED
285
    _PyListArray *array = list_allocate_array(size);
286
    if (array == NULL) {
287
        Py_DECREF(op);
288
        return PyErr_NoMemory();
289
    }
290
    op->ob_item = array->ob_item;
291
#else
292
13.6M
    op->ob_item = PyMem_New(PyObject *, size);
293
13.6M
    if (op->ob_item == NULL) {
294
0
        Py_DECREF(op);
295
0
        return PyErr_NoMemory();
296
0
    }
297
13.6M
#endif
298
13.6M
    op->allocated = size;
299
13.6M
    return (PyObject *) op;
300
13.6M
}
301
302
Py_ssize_t
303
PyList_Size(PyObject *op)
304
98.7k
{
305
98.7k
    if (!PyList_Check(op)) {
306
0
        PyErr_BadInternalCall();
307
0
        return -1;
308
0
    }
309
98.7k
    else {
310
98.7k
        return PyList_GET_SIZE(op);
311
98.7k
    }
312
98.7k
}
313
314
static inline int
315
valid_index(Py_ssize_t i, Py_ssize_t limit)
316
197M
{
317
    /* The cast to size_t lets us use just a single comparison
318
       to check whether i is in the range: 0 <= i < limit.
319
320
       See:  Section 14.2 "Bounds Checking" in the Agner Fog
321
       optimization manual found at:
322
       https://www.agner.org/optimize/optimizing_cpp.pdf
323
    */
324
197M
    return (size_t) i < (size_t) limit;
325
197M
}
326
327
#ifdef Py_GIL_DISABLED
328
329
static PyObject *
330
list_item_impl(PyListObject *self, Py_ssize_t idx)
331
{
332
    PyObject *item = NULL;
333
    Py_BEGIN_CRITICAL_SECTION(self);
334
    if (!_PyObject_GC_IS_SHARED(self)) {
335
        _PyObject_GC_SET_SHARED(self);
336
    }
337
    Py_ssize_t size = Py_SIZE(self);
338
    if (!valid_index(idx, size)) {
339
        goto exit;
340
    }
341
    item = _Py_NewRefWithLock(self->ob_item[idx]);
342
exit:
343
    Py_END_CRITICAL_SECTION();
344
    return item;
345
}
346
347
static inline PyObject*
348
list_get_item_ref(PyListObject *op, Py_ssize_t i)
349
{
350
    if (!_Py_IsOwnedByCurrentThread((PyObject *)op) && !_PyObject_GC_IS_SHARED(op)) {
351
        return list_item_impl(op, i);
352
    }
353
    // Need atomic operation for the getting size.
354
    Py_ssize_t size = PyList_GET_SIZE(op);
355
    if (!valid_index(i, size)) {
356
        return NULL;
357
    }
358
    PyObject **ob_item = _Py_atomic_load_ptr(&op->ob_item);
359
    if (ob_item == NULL) {
360
        return NULL;
361
    }
362
    Py_ssize_t cap = list_capacity(ob_item);
363
    assert(cap != -1);
364
    if (!valid_index(i, cap)) {
365
        return NULL;
366
    }
367
    PyObject *item = _Py_TryXGetRef(&ob_item[i]);
368
    if (item == NULL) {
369
        return list_item_impl(op, i);
370
    }
371
    return item;
372
}
373
#else
374
static inline PyObject*
375
list_get_item_ref(PyListObject *op, Py_ssize_t i)
376
153M
{
377
153M
    if (!valid_index(i, Py_SIZE(op))) {
378
30.4M
        return NULL;
379
30.4M
    }
380
122M
    return Py_NewRef(PyList_GET_ITEM(op, i));
381
153M
}
382
#endif
383
384
PyObject *
385
PyList_GetItem(PyObject *op, Py_ssize_t i)
386
594
{
387
594
    if (!PyList_Check(op)) {
388
0
        PyErr_BadInternalCall();
389
0
        return NULL;
390
0
    }
391
594
    if (!valid_index(i, Py_SIZE(op))) {
392
0
        _Py_DECLARE_STR(list_err, "list index out of range");
393
0
        PyErr_SetObject(PyExc_IndexError, &_Py_STR(list_err));
394
0
        return NULL;
395
0
    }
396
594
    return ((PyListObject *)op) -> ob_item[i];
397
594
}
398
399
PyObject *
400
PyList_GetItemRef(PyObject *op, Py_ssize_t i)
401
91.9k
{
402
91.9k
    if (!PyList_Check(op)) {
403
0
        PyErr_SetString(PyExc_TypeError, "expected a list");
404
0
        return NULL;
405
0
    }
406
91.9k
    PyObject *item = list_get_item_ref((PyListObject *)op, i);
407
91.9k
    if (item == NULL) {
408
0
        _Py_DECLARE_STR(list_err, "list index out of range");
409
0
        PyErr_SetObject(PyExc_IndexError, &_Py_STR(list_err));
410
0
        return NULL;
411
0
    }
412
91.9k
    return item;
413
91.9k
}
414
415
PyObject *
416
_PyList_GetItemRef(PyListObject *list, Py_ssize_t i)
417
1.85k
{
418
1.85k
    return list_get_item_ref(list, i);
419
1.85k
}
420
421
#ifdef Py_GIL_DISABLED
422
int
423
_PyList_GetItemRefNoLock(PyListObject *list, Py_ssize_t i, _PyStackRef *result)
424
{
425
    assert(_Py_IsOwnedByCurrentThread((PyObject *)list) ||
426
           _PyObject_GC_IS_SHARED(list));
427
    if (!valid_index(i, PyList_GET_SIZE(list))) {
428
        return 0;
429
    }
430
    PyObject **ob_item = _Py_atomic_load_ptr(&list->ob_item);
431
    if (ob_item == NULL) {
432
        return 0;
433
    }
434
    Py_ssize_t cap = list_capacity(ob_item);
435
    assert(cap != -1);
436
    if (!valid_index(i, cap)) {
437
        return 0;
438
    }
439
    PyObject *obj = _Py_atomic_load_ptr(&ob_item[i]);
440
    if (obj == NULL || !_Py_TryIncrefCompareStackRef(&ob_item[i], obj, result)) {
441
        return -1;
442
    }
443
    return 1;
444
}
445
#endif
446
447
int
448
PyList_SetItem(PyObject *op, Py_ssize_t i,
449
               PyObject *newitem)
450
22.4k
{
451
22.4k
    if (!PyList_Check(op)) {
452
0
        Py_XDECREF(newitem);
453
0
        PyErr_BadInternalCall();
454
0
        return -1;
455
0
    }
456
22.4k
    int ret;
457
22.4k
    PyListObject *self = ((PyListObject *)op);
458
22.4k
    Py_BEGIN_CRITICAL_SECTION(self);
459
22.4k
    if (!valid_index(i, Py_SIZE(self))) {
460
0
        Py_XDECREF(newitem);
461
0
        PyErr_SetString(PyExc_IndexError,
462
0
                        "list assignment index out of range");
463
0
        ret = -1;
464
0
        goto end;
465
0
    }
466
22.4k
    PyObject *tmp = self->ob_item[i];
467
22.4k
    FT_ATOMIC_STORE_PTR_RELEASE(self->ob_item[i], newitem);
468
22.4k
    Py_XDECREF(tmp);
469
22.4k
    ret = 0;
470
22.4k
end:;
471
22.4k
    Py_END_CRITICAL_SECTION();
472
22.4k
    return ret;
473
22.4k
}
474
475
static int
476
ins1(PyListObject *self, Py_ssize_t where, PyObject *v)
477
76
{
478
76
    Py_ssize_t i, n = Py_SIZE(self);
479
76
    PyObject **items;
480
76
    if (v == NULL) {
481
0
        PyErr_BadInternalCall();
482
0
        return -1;
483
0
    }
484
485
76
    assert((size_t)n + 1 < PY_SSIZE_T_MAX);
486
76
    if (list_resize(self, n+1) < 0)
487
0
        return -1;
488
489
76
    if (where < 0) {
490
0
        where += n;
491
0
        if (where < 0)
492
0
            where = 0;
493
0
    }
494
76
    if (where > n)
495
0
        where = n;
496
76
    items = self->ob_item;
497
462
    for (i = n; --i >= where; )
498
386
        FT_ATOMIC_STORE_PTR_RELAXED(items[i+1], items[i]);
499
76
    FT_ATOMIC_STORE_PTR_RELEASE(items[where], Py_NewRef(v));
500
76
    return 0;
501
76
}
502
503
int
504
PyList_Insert(PyObject *op, Py_ssize_t where, PyObject *newitem)
505
16
{
506
16
    if (!PyList_Check(op)) {
507
0
        PyErr_BadInternalCall();
508
0
        return -1;
509
0
    }
510
16
    PyListObject *self = (PyListObject *)op;
511
16
    int err;
512
16
    Py_BEGIN_CRITICAL_SECTION(self);
513
16
    err = ins1(self, where, newitem);
514
16
    Py_END_CRITICAL_SECTION();
515
16
    return err;
516
16
}
517
518
/* internal, used by _PyList_AppendTakeRef */
519
int
520
_PyList_AppendTakeRefListResize(PyListObject *self, PyObject *newitem)
521
59.2M
{
522
59.2M
    Py_ssize_t len = Py_SIZE(self);
523
59.2M
    assert(self->allocated == -1 || self->allocated == len);
524
59.2M
    if (list_resize(self, len + 1) < 0) {
525
0
        Py_DECREF(newitem);
526
0
        return -1;
527
0
    }
528
59.2M
    FT_ATOMIC_STORE_PTR_RELEASE(self->ob_item[len], newitem);
529
59.2M
    return 0;
530
59.2M
}
531
532
int
533
PyList_Append(PyObject *op, PyObject *newitem)
534
152M
{
535
152M
    if (PyList_Check(op) && (newitem != NULL)) {
536
152M
        int ret;
537
152M
        Py_BEGIN_CRITICAL_SECTION(op);
538
152M
        ret = _PyList_AppendTakeRef((PyListObject *)op, Py_NewRef(newitem));
539
152M
        Py_END_CRITICAL_SECTION();
540
152M
        return ret;
541
152M
    }
542
0
    PyErr_BadInternalCall();
543
0
    return -1;
544
152M
}
545
546
/* Methods */
547
548
static void
549
list_dealloc(PyObject *self)
550
262M
{
551
262M
    PyListObject *op = (PyListObject *)self;
552
262M
    Py_ssize_t i;
553
262M
    PyObject_GC_UnTrack(op);
554
262M
    if (op->ob_item != NULL) {
555
        /* Do it backwards, for Christian Tismer.
556
           There's a simple test case where somehow this reduces
557
           thrashing when a *very* large list is created and
558
           immediately deleted. */
559
99.1M
        i = Py_SIZE(op);
560
1.44G
        while (--i >= 0) {
561
1.34G
            Py_XDECREF(op->ob_item[i]);
562
1.34G
        }
563
99.1M
        free_list_items(op->ob_item, false);
564
99.1M
        op->ob_item = NULL;
565
99.1M
    }
566
262M
    if (PyList_CheckExact(op)) {
567
252M
        _Py_FREELIST_FREE(lists, op, PyObject_GC_Del);
568
252M
    }
569
10.4M
    else {
570
10.4M
        PyObject_GC_Del(op);
571
10.4M
    }
572
262M
}
573
574
static PyObject *
575
list_repr_impl(PyListObject *v)
576
3.69M
{
577
3.69M
    int res = Py_ReprEnter((PyObject*)v);
578
3.69M
    if (res != 0) {
579
0
        return (res > 0 ? PyUnicode_FromString("[...]") : NULL);
580
0
    }
581
582
    /* "[" + "1" + ", 2" * (len - 1) + "]" */
583
3.69M
    Py_ssize_t prealloc = 1 + 1 + (2 + 1) * (Py_SIZE(v) - 1) + 1;
584
3.69M
    PyUnicodeWriter *writer = PyUnicodeWriter_Create(prealloc);
585
3.69M
    PyObject *item = NULL;
586
3.69M
    if (writer == NULL) {
587
0
        goto error;
588
0
    }
589
590
3.69M
    if (PyUnicodeWriter_WriteChar(writer, '[') < 0) {
591
0
        goto error;
592
0
    }
593
594
    /* Do repr() on each element.  Note that this may mutate the list,
595
       so must refetch the list size on each iteration. */
596
10.3M
    for (Py_ssize_t i = 0; i < Py_SIZE(v); ++i) {
597
        /* Hold a strong reference since repr(item) can mutate the list */
598
6.64M
        item = Py_NewRef(v->ob_item[i]);
599
600
6.64M
        if (i > 0) {
601
2.95M
            if (PyUnicodeWriter_WriteChar(writer, ',') < 0) {
602
0
                goto error;
603
0
            }
604
2.95M
            if (PyUnicodeWriter_WriteChar(writer, ' ') < 0) {
605
0
                goto error;
606
0
            }
607
2.95M
        }
608
609
6.64M
        if (PyUnicodeWriter_WriteRepr(writer, item) < 0) {
610
0
            goto error;
611
0
        }
612
6.64M
        Py_CLEAR(item);
613
6.64M
    }
614
615
3.69M
    if (PyUnicodeWriter_WriteChar(writer, ']') < 0) {
616
0
        goto error;
617
0
    }
618
619
3.69M
    Py_ReprLeave((PyObject *)v);
620
3.69M
    return PyUnicodeWriter_Finish(writer);
621
622
0
error:
623
0
    Py_XDECREF(item);
624
0
    PyUnicodeWriter_Discard(writer);
625
0
    Py_ReprLeave((PyObject *)v);
626
0
    return NULL;
627
3.69M
}
628
629
static PyObject *
630
list_repr(PyObject *self)
631
3.70M
{
632
3.70M
    if (PyList_GET_SIZE(self) == 0) {
633
4.63k
        return PyUnicode_FromString("[]");
634
4.63k
    }
635
3.69M
    PyListObject *v = (PyListObject *)self;
636
3.69M
    PyObject *ret = NULL;
637
3.69M
    Py_BEGIN_CRITICAL_SECTION(v);
638
3.69M
    ret = list_repr_impl(v);
639
3.69M
    Py_END_CRITICAL_SECTION();
640
3.69M
    return ret;
641
3.70M
}
642
643
static Py_ssize_t
644
list_length(PyObject *a)
645
47.6M
{
646
47.6M
    return PyList_GET_SIZE(a);
647
47.6M
}
648
649
static int
650
list_contains(PyObject *aa, PyObject *el)
651
2.34k
{
652
653
28.8k
    for (Py_ssize_t i = 0; ; i++) {
654
28.8k
        PyObject *item = list_get_item_ref((PyListObject *)aa, i);
655
28.8k
        if (item == NULL) {
656
            // out-of-bounds
657
1.72k
            return 0;
658
1.72k
        }
659
27.1k
        int cmp = PyObject_RichCompareBool(item, el, Py_EQ);
660
27.1k
        Py_DECREF(item);
661
27.1k
        if (cmp != 0) {
662
612
            return cmp;
663
612
        }
664
27.1k
    }
665
0
    return 0;
666
2.34k
}
667
668
static PyObject *
669
list_item(PyObject *aa, Py_ssize_t i)
670
14.8M
{
671
14.8M
    PyListObject *a = (PyListObject *)aa;
672
14.8M
    if (!valid_index(i, PyList_GET_SIZE(a))) {
673
972
        PyErr_SetObject(PyExc_IndexError, &_Py_STR(list_err));
674
972
        return NULL;
675
972
    }
676
14.8M
    PyObject *item;
677
#ifdef Py_GIL_DISABLED
678
    item = list_get_item_ref(a, i);
679
    if (item == NULL) {
680
        PyErr_SetObject(PyExc_IndexError, &_Py_STR(list_err));
681
        return NULL;
682
    }
683
#else
684
14.8M
    item = Py_NewRef(a->ob_item[i]);
685
14.8M
#endif
686
14.8M
    return item;
687
14.8M
}
688
689
static PyObject *
690
list_slice_lock_held(PyListObject *a, Py_ssize_t ilow, Py_ssize_t ihigh)
691
1.90M
{
692
1.90M
    PyListObject *np;
693
1.90M
    PyObject **src, **dest;
694
1.90M
    Py_ssize_t i, len;
695
1.90M
    len = ihigh - ilow;
696
1.90M
    if (len <= 0) {
697
0
        return PyList_New(0);
698
0
    }
699
1.90M
    np = (PyListObject *) list_new_prealloc(len);
700
1.90M
    if (np == NULL)
701
0
        return NULL;
702
703
1.90M
    src = a->ob_item + ilow;
704
1.90M
    dest = np->ob_item;
705
33.3M
    for (i = 0; i < len; i++) {
706
31.4M
        PyObject *v = src[i];
707
31.4M
        dest[i] = Py_NewRef(v);
708
31.4M
    }
709
1.90M
    Py_SET_SIZE(np, len);
710
1.90M
    return (PyObject *)np;
711
1.90M
}
712
713
PyObject *
714
PyList_GetSlice(PyObject *a, Py_ssize_t ilow, Py_ssize_t ihigh)
715
0
{
716
0
    if (!PyList_Check(a)) {
717
0
        PyErr_BadInternalCall();
718
0
        return NULL;
719
0
    }
720
0
    PyObject *ret;
721
0
    Py_BEGIN_CRITICAL_SECTION(a);
722
0
    if (ilow < 0) {
723
0
        ilow = 0;
724
0
    }
725
0
    else if (ilow > Py_SIZE(a)) {
726
0
        ilow = Py_SIZE(a);
727
0
    }
728
0
    if (ihigh < ilow) {
729
0
        ihigh = ilow;
730
0
    }
731
0
    else if (ihigh > Py_SIZE(a)) {
732
0
        ihigh = Py_SIZE(a);
733
0
    }
734
0
    ret = list_slice_lock_held((PyListObject *)a, ilow, ihigh);
735
0
    Py_END_CRITICAL_SECTION();
736
0
    return ret;
737
0
}
738
739
static PyObject *
740
list_concat_lock_held(PyListObject *a, PyListObject *b)
741
19.1M
{
742
19.1M
    Py_ssize_t size;
743
19.1M
    Py_ssize_t i;
744
19.1M
    PyObject **src, **dest;
745
19.1M
    PyListObject *np;
746
19.1M
    assert((size_t)Py_SIZE(a) + (size_t)Py_SIZE(b) < PY_SSIZE_T_MAX);
747
19.1M
    size = Py_SIZE(a) + Py_SIZE(b);
748
19.1M
    if (size == 0) {
749
7.47M
        return PyList_New(0);
750
7.47M
    }
751
11.7M
    np = (PyListObject *) list_new_prealloc(size);
752
11.7M
    if (np == NULL) {
753
0
        return NULL;
754
0
    }
755
11.7M
    src = a->ob_item;
756
11.7M
    dest = np->ob_item;
757
492M
    for (i = 0; i < Py_SIZE(a); i++) {
758
480M
        PyObject *v = src[i];
759
480M
        dest[i] = Py_NewRef(v);
760
480M
    }
761
11.7M
    src = b->ob_item;
762
11.7M
    dest = np->ob_item + Py_SIZE(a);
763
177M
    for (i = 0; i < Py_SIZE(b); i++) {
764
165M
        PyObject *v = src[i];
765
165M
        dest[i] = Py_NewRef(v);
766
165M
    }
767
11.7M
    Py_SET_SIZE(np, size);
768
11.7M
    return (PyObject *)np;
769
11.7M
}
770
771
static PyObject *
772
list_concat(PyObject *aa, PyObject *bb)
773
19.1M
{
774
19.1M
    if (!PyList_Check(bb)) {
775
0
        PyErr_Format(PyExc_TypeError,
776
0
                  "can only concatenate list (not \"%.200s\") to list",
777
0
                  Py_TYPE(bb)->tp_name);
778
0
        return NULL;
779
0
    }
780
19.1M
    PyListObject *a = (PyListObject *)aa;
781
19.1M
    PyListObject *b = (PyListObject *)bb;
782
19.1M
    PyObject *ret;
783
19.1M
    Py_BEGIN_CRITICAL_SECTION2(a, b);
784
19.1M
    ret = list_concat_lock_held(a, b);
785
19.1M
    Py_END_CRITICAL_SECTION2();
786
19.1M
    return ret;
787
19.1M
}
788
789
static PyObject *
790
list_repeat_lock_held(PyListObject *a, Py_ssize_t n)
791
14.8k
{
792
14.8k
    const Py_ssize_t input_size = Py_SIZE(a);
793
14.8k
    if (input_size == 0 || n <= 0)
794
2.44k
        return PyList_New(0);
795
12.4k
    assert(n > 0);
796
797
12.4k
    if (input_size > PY_SSIZE_T_MAX / n)
798
0
        return PyErr_NoMemory();
799
12.4k
    Py_ssize_t output_size = input_size * n;
800
801
12.4k
    PyListObject *np = (PyListObject *) list_new_prealloc(output_size);
802
12.4k
    if (np == NULL)
803
0
        return NULL;
804
805
12.4k
    PyObject **dest = np->ob_item;
806
12.4k
    if (input_size == 1) {
807
12.4k
        PyObject *elem = a->ob_item[0];
808
12.4k
        _Py_RefcntAdd(elem, n);
809
12.4k
        PyObject **dest_end = dest + output_size;
810
10.8M
        while (dest < dest_end) {
811
10.8M
            *dest++ = elem;
812
10.8M
        }
813
12.4k
    }
814
0
    else {
815
0
        PyObject **src = a->ob_item;
816
0
        PyObject **src_end = src + input_size;
817
0
        while (src < src_end) {
818
0
            _Py_RefcntAdd(*src, n);
819
0
            *dest++ = *src++;
820
0
        }
821
        // TODO: _Py_memory_repeat calls are not safe for shared lists in
822
        // GIL_DISABLED builds. (See issue #129069)
823
0
        _Py_memory_repeat((char *)np->ob_item, sizeof(PyObject *)*output_size,
824
0
                                        sizeof(PyObject *)*input_size);
825
0
    }
826
827
12.4k
    Py_SET_SIZE(np, output_size);
828
12.4k
    return (PyObject *) np;
829
12.4k
}
830
831
static PyObject *
832
list_repeat(PyObject *aa, Py_ssize_t n)
833
14.8k
{
834
14.8k
    PyObject *ret;
835
14.8k
    PyListObject *a = (PyListObject *)aa;
836
14.8k
    Py_BEGIN_CRITICAL_SECTION(a);
837
14.8k
    ret = list_repeat_lock_held(a, n);
838
14.8k
    Py_END_CRITICAL_SECTION();
839
14.8k
    return ret;
840
14.8k
}
841
842
static void
843
list_clear_impl(PyListObject *a, bool is_resize)
844
12.6M
{
845
12.6M
    PyObject **items = a->ob_item;
846
12.6M
    if (items == NULL) {
847
0
        return;
848
0
    }
849
850
    /* Because XDECREF can recursively invoke operations on
851
       this list, we make it empty first. */
852
12.6M
    Py_ssize_t i = Py_SIZE(a);
853
12.6M
    Py_SET_SIZE(a, 0);
854
12.6M
    FT_ATOMIC_STORE_PTR_RELEASE(a->ob_item, NULL);
855
12.6M
    a->allocated = 0;
856
25.4M
    while (--i >= 0) {
857
12.7M
        Py_XDECREF(items[i]);
858
12.7M
    }
859
#ifdef Py_GIL_DISABLED
860
    if (is_resize) {
861
        ensure_shared_on_resize(a);
862
    }
863
    bool use_qsbr = is_resize && _PyObject_GC_IS_SHARED(a);
864
#else
865
12.6M
    bool use_qsbr = false;
866
12.6M
#endif
867
12.6M
    free_list_items(items, use_qsbr);
868
    // Note that there is no guarantee that the list is actually empty
869
    // at this point, because XDECREF may have populated it indirectly again!
870
12.6M
}
871
872
static void
873
list_clear(PyListObject *a)
874
12.6M
{
875
12.6M
    list_clear_impl(a, true);
876
12.6M
}
877
878
static int
879
list_clear_slot(PyObject *self)
880
0
{
881
0
    list_clear_impl((PyListObject *)self, false);
882
0
    return 0;
883
0
}
884
885
/* a[ilow:ihigh] = v if v != NULL.
886
 * del a[ilow:ihigh] if v == NULL.
887
 *
888
 * Special speed gimmick:  when v is NULL and ihigh - ilow <= 8, it's
889
 * guaranteed the call cannot fail.
890
 */
891
static int
892
list_ass_slice_lock_held(PyListObject *a, Py_ssize_t ilow, Py_ssize_t ihigh, PyObject *v)
893
3.90M
{
894
    /* Because [X]DECREF can recursively invoke list operations on
895
       this list, we must postpone all [X]DECREF activity until
896
       after the list is back in its canonical shape.  Therefore
897
       we must allocate an additional array, 'recycle', into which
898
       we temporarily copy the items that are deleted from the
899
       list. :-( */
900
3.90M
    PyObject *recycle_on_stack[8];
901
3.90M
    PyObject **recycle = recycle_on_stack; /* will allocate more if needed */
902
3.90M
    PyObject **item;
903
3.90M
    PyObject **vitem = NULL;
904
3.90M
    PyObject *v_as_SF = NULL; /* PySequence_Fast(v) */
905
3.90M
    Py_ssize_t n; /* # of elements in replacement list */
906
3.90M
    Py_ssize_t norig; /* # of elements in list getting replaced */
907
3.90M
    Py_ssize_t d; /* Change in size */
908
3.90M
    Py_ssize_t k;
909
3.90M
    size_t s;
910
3.90M
    int result = -1;            /* guilty until proved innocent */
911
3.90M
#define b ((PyListObject *)v)
912
3.90M
    if (v == NULL)
913
3.71M
        n = 0;
914
191k
    else {
915
191k
        v_as_SF = PySequence_Fast(v, "can only assign an iterable");
916
191k
        if(v_as_SF == NULL)
917
0
            goto Error;
918
191k
        n = PySequence_Fast_GET_SIZE(v_as_SF);
919
191k
        vitem = PySequence_Fast_ITEMS(v_as_SF);
920
191k
    }
921
3.90M
    if (ilow < 0)
922
0
        ilow = 0;
923
3.90M
    else if (ilow > Py_SIZE(a))
924
0
        ilow = Py_SIZE(a);
925
926
3.90M
    if (ihigh < ilow)
927
0
        ihigh = ilow;
928
3.90M
    else if (ihigh > Py_SIZE(a))
929
0
        ihigh = Py_SIZE(a);
930
931
3.90M
    norig = ihigh - ilow;
932
3.90M
    assert(norig >= 0);
933
3.90M
    d = n - norig;
934
3.90M
    if (Py_SIZE(a) + d == 0) {
935
556k
        Py_XDECREF(v_as_SF);
936
556k
        list_clear(a);
937
556k
        return 0;
938
556k
    }
939
3.34M
    item = a->ob_item;
940
    /* recycle the items that we are about to remove */
941
3.34M
    s = norig * sizeof(PyObject *);
942
    /* If norig == 0, item might be NULL, in which case we may not memcpy from it. */
943
3.34M
    if (s) {
944
3.17M
        if (s > sizeof(recycle_on_stack)) {
945
122
            recycle = (PyObject **)PyMem_Malloc(s);
946
122
            if (recycle == NULL) {
947
0
                PyErr_NoMemory();
948
0
                goto Error;
949
0
            }
950
122
        }
951
3.17M
        memcpy(recycle, &item[ilow], s);
952
3.17M
    }
953
954
3.34M
    if (d < 0) { /* Delete -d items */
955
3.17M
        Py_ssize_t tail;
956
3.17M
        tail = (Py_SIZE(a) - ihigh) * sizeof(PyObject *);
957
        // TODO: these memmove/memcpy calls are not safe for shared lists in
958
        // GIL_DISABLED builds. (See issue #129069)
959
3.17M
        memmove(&item[ihigh+d], &item[ihigh], tail);
960
3.17M
        if (list_resize(a, Py_SIZE(a) + d) < 0) {
961
0
            memmove(&item[ihigh], &item[ihigh+d], tail);
962
0
            memcpy(&item[ilow], recycle, s);
963
0
            goto Error;
964
0
        }
965
3.17M
        item = a->ob_item;
966
3.17M
    }
967
176k
    else if (d > 0) { /* Insert d items */
968
176k
        k = Py_SIZE(a);
969
176k
        if (list_resize(a, k+d) < 0)
970
0
            goto Error;
971
176k
        item = a->ob_item;
972
        // TODO: these memmove/memcpy calls are not safe for shared lists in
973
        // GIL_DISABLED builds. (See issue #129069)
974
176k
        memmove(&item[ihigh+d], &item[ihigh],
975
176k
            (k - ihigh)*sizeof(PyObject *));
976
176k
    }
977
3.52M
    for (k = 0; k < n; k++, ilow++) {
978
176k
        PyObject *w = vitem[k];
979
176k
        FT_ATOMIC_STORE_PTR_RELEASE(item[ilow], Py_XNewRef(w));
980
176k
    }
981
6.53M
    for (k = norig - 1; k >= 0; --k)
982
3.18M
        Py_XDECREF(recycle[k]);
983
3.34M
    result = 0;
984
3.34M
 Error:
985
3.34M
    if (recycle != recycle_on_stack)
986
122
        PyMem_Free(recycle);
987
3.34M
    Py_XDECREF(v_as_SF);
988
3.34M
    return result;
989
3.34M
#undef b
990
3.34M
}
991
992
static int
993
list_ass_slice(PyListObject *a, Py_ssize_t ilow, Py_ssize_t ihigh, PyObject *v)
994
3.71M
{
995
3.71M
    int ret;
996
3.71M
    if (a == (PyListObject *)v) {
997
0
        Py_BEGIN_CRITICAL_SECTION(a);
998
0
        Py_ssize_t n = PyList_GET_SIZE(a);
999
0
        PyObject *copy = list_slice_lock_held(a, 0, n);
1000
0
        if (copy == NULL) {
1001
0
            ret = -1;
1002
0
        }
1003
0
        else {
1004
0
            ret = list_ass_slice_lock_held(a, ilow, ihigh, copy);
1005
0
            Py_DECREF(copy);
1006
0
        }
1007
0
        Py_END_CRITICAL_SECTION();
1008
0
    }
1009
3.71M
    else if (v != NULL && PyList_CheckExact(v)) {
1010
225
        Py_BEGIN_CRITICAL_SECTION2(a, v);
1011
225
        ret = list_ass_slice_lock_held(a, ilow, ihigh, v);
1012
225
        Py_END_CRITICAL_SECTION2();
1013
225
    }
1014
3.71M
    else {
1015
3.71M
        Py_BEGIN_CRITICAL_SECTION(a);
1016
3.71M
        ret = list_ass_slice_lock_held(a, ilow, ihigh, v);
1017
3.71M
        Py_END_CRITICAL_SECTION();
1018
3.71M
    }
1019
3.71M
    return ret;
1020
3.71M
}
1021
1022
int
1023
PyList_SetSlice(PyObject *a, Py_ssize_t ilow, Py_ssize_t ihigh, PyObject *v)
1024
3.71M
{
1025
3.71M
    if (!PyList_Check(a)) {
1026
0
        PyErr_BadInternalCall();
1027
0
        return -1;
1028
0
    }
1029
3.71M
    return list_ass_slice((PyListObject *)a, ilow, ihigh, v);
1030
3.71M
}
1031
1032
static int
1033
list_inplace_repeat_lock_held(PyListObject *self, Py_ssize_t n)
1034
0
{
1035
0
    Py_ssize_t input_size = PyList_GET_SIZE(self);
1036
0
    if (input_size == 0 || n == 1) {
1037
0
        return 0;
1038
0
    }
1039
1040
0
    if (n < 1) {
1041
0
        list_clear(self);
1042
0
        return 0;
1043
0
    }
1044
1045
0
    if (input_size > PY_SSIZE_T_MAX / n) {
1046
0
        PyErr_NoMemory();
1047
0
        return -1;
1048
0
    }
1049
0
    Py_ssize_t output_size = input_size * n;
1050
1051
0
    if (list_resize(self, output_size) < 0) {
1052
0
        return -1;
1053
0
    }
1054
1055
0
    PyObject **items = self->ob_item;
1056
0
    for (Py_ssize_t j = 0; j < input_size; j++) {
1057
0
        _Py_RefcntAdd(items[j], n-1);
1058
0
    }
1059
    // TODO: _Py_memory_repeat calls are not safe for shared lists in
1060
    // GIL_DISABLED builds. (See issue #129069)
1061
0
    _Py_memory_repeat((char *)items, sizeof(PyObject *)*output_size,
1062
0
                      sizeof(PyObject *)*input_size);
1063
0
    return 0;
1064
0
}
1065
1066
static PyObject *
1067
list_inplace_repeat(PyObject *_self, Py_ssize_t n)
1068
0
{
1069
0
    PyObject *ret;
1070
0
    PyListObject *self = (PyListObject *) _self;
1071
0
    Py_BEGIN_CRITICAL_SECTION(self);
1072
0
    if (list_inplace_repeat_lock_held(self, n) < 0) {
1073
0
        ret = NULL;
1074
0
    }
1075
0
    else {
1076
0
        ret = Py_NewRef(self);
1077
0
    }
1078
0
    Py_END_CRITICAL_SECTION();
1079
0
    return ret;
1080
0
}
1081
1082
static int
1083
list_ass_item_lock_held(PyListObject *a, Py_ssize_t i, PyObject *v)
1084
9.32k
{
1085
9.32k
    if (!valid_index(i, Py_SIZE(a))) {
1086
0
        PyErr_SetString(PyExc_IndexError,
1087
0
                        "list assignment index out of range");
1088
0
        return -1;
1089
0
    }
1090
9.32k
    PyObject *tmp = a->ob_item[i];
1091
9.32k
    if (v == NULL) {
1092
6.46k
        Py_ssize_t size = Py_SIZE(a);
1093
6.46k
        for (Py_ssize_t idx = i; idx < size - 1; idx++) {
1094
0
            FT_ATOMIC_STORE_PTR_RELAXED(a->ob_item[idx], a->ob_item[idx + 1]);
1095
0
        }
1096
6.46k
        Py_SET_SIZE(a, size - 1);
1097
6.46k
    }
1098
2.85k
    else {
1099
2.85k
        FT_ATOMIC_STORE_PTR_RELEASE(a->ob_item[i], Py_NewRef(v));
1100
2.85k
    }
1101
9.32k
    Py_DECREF(tmp);
1102
9.32k
    return 0;
1103
9.32k
}
1104
1105
static int
1106
list_ass_item(PyObject *aa, Py_ssize_t i, PyObject *v)
1107
6.38k
{
1108
6.38k
    int ret;
1109
6.38k
    PyListObject *a = (PyListObject *)aa;
1110
6.38k
    Py_BEGIN_CRITICAL_SECTION(a);
1111
6.38k
    ret = list_ass_item_lock_held(a, i, v);
1112
6.38k
    Py_END_CRITICAL_SECTION();
1113
6.38k
    return ret;
1114
6.38k
}
1115
1116
/*[clinic input]
1117
@critical_section
1118
list.insert
1119
1120
    index: Py_ssize_t
1121
    object: object
1122
    /
1123
1124
Insert object before index.
1125
[clinic start generated code]*/
1126
1127
static PyObject *
1128
list_insert_impl(PyListObject *self, Py_ssize_t index, PyObject *object)
1129
/*[clinic end generated code: output=7f35e32f60c8cb78 input=b1987ca998a4ae2d]*/
1130
60
{
1131
60
    if (ins1(self, index, object) == 0) {
1132
60
        Py_RETURN_NONE;
1133
60
    }
1134
0
    return NULL;
1135
60
}
1136
1137
/*[clinic input]
1138
@critical_section
1139
list.clear as py_list_clear
1140
1141
Remove all items from list.
1142
[clinic start generated code]*/
1143
1144
static PyObject *
1145
py_list_clear_impl(PyListObject *self)
1146
/*[clinic end generated code: output=83726743807e3518 input=e285b7f09051a9ba]*/
1147
170
{
1148
170
    list_clear(self);
1149
170
    Py_RETURN_NONE;
1150
170
}
1151
1152
/*[clinic input]
1153
@critical_section
1154
list.copy
1155
1156
Return a shallow copy of the list.
1157
[clinic start generated code]*/
1158
1159
static PyObject *
1160
list_copy_impl(PyListObject *self)
1161
/*[clinic end generated code: output=ec6b72d6209d418e input=81c54b0c7bb4f73d]*/
1162
0
{
1163
0
    return list_slice_lock_held(self, 0, Py_SIZE(self));
1164
0
}
1165
1166
/*[clinic input]
1167
@critical_section
1168
list.append
1169
1170
     object: object
1171
     /
1172
1173
Append object to the end of the list.
1174
[clinic start generated code]*/
1175
1176
static PyObject *
1177
list_append_impl(PyListObject *self, PyObject *object)
1178
/*[clinic end generated code: output=78423561d92ed405 input=122b0853de54004f]*/
1179
18.7M
{
1180
18.7M
    if (_PyList_AppendTakeRef(self, Py_NewRef(object)) < 0) {
1181
0
        return NULL;
1182
0
    }
1183
18.7M
    Py_RETURN_NONE;
1184
18.7M
}
1185
1186
static int
1187
list_extend_fast(PyListObject *self, PyObject *iterable)
1188
21.2M
{
1189
21.2M
    Py_ssize_t n = PySequence_Fast_GET_SIZE(iterable);
1190
21.2M
    if (n == 0) {
1191
        /* short circuit when iterable is empty */
1192
8.49M
        return 0;
1193
8.49M
    }
1194
1195
12.7M
    Py_ssize_t m = Py_SIZE(self);
1196
    // It should not be possible to allocate a list large enough to cause
1197
    // an overflow on any relevant platform.
1198
12.7M
    assert(m < PY_SSIZE_T_MAX - n);
1199
12.7M
    if (self->ob_item == NULL) {
1200
1.29M
        if (list_preallocate_exact(self, n) < 0) {
1201
0
            return -1;
1202
0
        }
1203
1.29M
        Py_SET_SIZE(self, n);
1204
1.29M
    }
1205
11.4M
    else if (list_resize(self, m + n) < 0) {
1206
0
        return -1;
1207
0
    }
1208
1209
    // note that we may still have self == iterable here for the
1210
    // situation a.extend(a), but the following code works
1211
    // in that case too.  Just make sure to resize self
1212
    // before calling PySequence_Fast_ITEMS.
1213
    //
1214
    // populate the end of self with iterable's items.
1215
12.7M
    PyObject **src = PySequence_Fast_ITEMS(iterable);
1216
12.7M
    PyObject **dest = self->ob_item + m;
1217
40.4M
    for (Py_ssize_t i = 0; i < n; i++) {
1218
27.7M
        PyObject *o = src[i];
1219
27.7M
        FT_ATOMIC_STORE_PTR_RELEASE(dest[i], Py_NewRef(o));
1220
27.7M
    }
1221
12.7M
    return 0;
1222
12.7M
}
1223
1224
static int
1225
list_extend_iter_lock_held(PyListObject *self, PyObject *iterable)
1226
5.33M
{
1227
5.33M
    PyObject *it = PyObject_GetIter(iterable);
1228
5.33M
    if (it == NULL) {
1229
0
        return -1;
1230
0
    }
1231
5.33M
    PyObject *(*iternext)(PyObject *) = *Py_TYPE(it)->tp_iternext;
1232
1233
    /* Guess a result list size. */
1234
5.33M
    Py_ssize_t n = PyObject_LengthHint(iterable, 8);
1235
5.33M
    if (n < 0) {
1236
0
        Py_DECREF(it);
1237
0
        return -1;
1238
0
    }
1239
1240
5.33M
    Py_ssize_t m = Py_SIZE(self);
1241
5.33M
    if (m > PY_SSIZE_T_MAX - n) {
1242
        /* m + n overflowed; on the chance that n lied, and there really
1243
         * is enough room, ignore it.  If n was telling the truth, we'll
1244
         * eventually run out of memory during the loop.
1245
         */
1246
0
    }
1247
5.33M
    else if (self->ob_item == NULL) {
1248
4.99M
        if (n && list_preallocate_exact(self, n) < 0)
1249
0
            goto error;
1250
4.99M
    }
1251
334k
    else {
1252
        /* Make room. */
1253
334k
        if (list_resize(self, m + n) < 0) {
1254
0
            goto error;
1255
0
        }
1256
1257
        /* Make the list sane again. */
1258
334k
        Py_SET_SIZE(self, m);
1259
334k
    }
1260
1261
    /* Run iterator to exhaustion. */
1262
61.1M
    for (;;) {
1263
61.1M
        PyObject *item = iternext(it);
1264
61.1M
        if (item == NULL) {
1265
5.33M
            if (PyErr_Occurred()) {
1266
613
                if (PyErr_ExceptionMatches(PyExc_StopIteration))
1267
0
                    PyErr_Clear();
1268
613
                else
1269
613
                    goto error;
1270
613
            }
1271
5.33M
            break;
1272
5.33M
        }
1273
1274
55.8M
        if (Py_SIZE(self) < self->allocated) {
1275
54.8M
            Py_ssize_t len = Py_SIZE(self);
1276
54.8M
            FT_ATOMIC_STORE_PTR_RELEASE(self->ob_item[len], item);  // steals item ref
1277
54.8M
            Py_SET_SIZE(self, len + 1);
1278
54.8M
        }
1279
962k
        else {
1280
962k
            if (_PyList_AppendTakeRef(self, item) < 0)
1281
0
                goto error;
1282
962k
        }
1283
55.8M
    }
1284
1285
    /* Cut back result list if initial guess was too large. */
1286
5.33M
    if (Py_SIZE(self) < self->allocated) {
1287
4.05M
        if (list_resize(self, Py_SIZE(self)) < 0)
1288
0
            goto error;
1289
4.05M
    }
1290
1291
5.33M
    Py_DECREF(it);
1292
5.33M
    return 0;
1293
1294
613
  error:
1295
613
    Py_DECREF(it);
1296
613
    return -1;
1297
5.33M
}
1298
1299
static int
1300
list_extend_lock_held(PyListObject *self, PyObject *iterable)
1301
21.2M
{
1302
21.2M
    PyObject *seq = PySequence_Fast(iterable, "argument must be iterable");
1303
21.2M
    if (!seq) {
1304
0
        return -1;
1305
0
    }
1306
1307
21.2M
    int res = list_extend_fast(self, seq);
1308
21.2M
    Py_DECREF(seq);
1309
21.2M
    return res;
1310
21.2M
}
1311
1312
static int
1313
list_extend_set(PyListObject *self, PySetObject *other)
1314
19.6k
{
1315
19.6k
    Py_ssize_t m = Py_SIZE(self);
1316
19.6k
    Py_ssize_t n = PySet_GET_SIZE(other);
1317
19.6k
    Py_ssize_t r = m + n;
1318
19.6k
    if (r == 0) {
1319
896
        return 0;
1320
896
    }
1321
18.7k
    if (list_resize(self, r) < 0) {
1322
0
        return -1;
1323
0
    }
1324
1325
18.7k
    assert(self->ob_item != NULL);
1326
    /* populate the end of self with iterable's items */
1327
18.7k
    Py_ssize_t setpos = 0;
1328
18.7k
    Py_hash_t hash;
1329
18.7k
    PyObject *key;
1330
18.7k
    PyObject **dest = self->ob_item + m;
1331
117k
    while (_PySet_NextEntryRef((PyObject *)other, &setpos, &key, &hash)) {
1332
98.5k
        FT_ATOMIC_STORE_PTR_RELEASE(*dest, key);
1333
98.5k
        dest++;
1334
98.5k
    }
1335
18.7k
    Py_SET_SIZE(self, r);
1336
18.7k
    return 0;
1337
18.7k
}
1338
1339
static int
1340
list_extend_dict(PyListObject *self, PyDictObject *dict, int which_item)
1341
311
{
1342
    // which_item: 0 for keys and 1 for values
1343
311
    Py_ssize_t m = Py_SIZE(self);
1344
311
    Py_ssize_t n = PyDict_GET_SIZE(dict);
1345
311
    Py_ssize_t r = m + n;
1346
311
    if (r == 0) {
1347
0
        return 0;
1348
0
    }
1349
311
    if (list_resize(self, r) < 0) {
1350
0
        return -1;
1351
0
    }
1352
1353
311
    assert(self->ob_item != NULL);
1354
311
    PyObject **dest = self->ob_item + m;
1355
311
    Py_ssize_t pos = 0;
1356
311
    PyObject *keyvalue[2];
1357
1.69k
    while (_PyDict_Next((PyObject *)dict, &pos, &keyvalue[0], &keyvalue[1], NULL)) {
1358
1.38k
        PyObject *obj = keyvalue[which_item];
1359
1.38k
        Py_INCREF(obj);
1360
1.38k
        FT_ATOMIC_STORE_PTR_RELEASE(*dest, obj);
1361
1.38k
        dest++;
1362
1.38k
    }
1363
1364
311
    Py_SET_SIZE(self, r);
1365
311
    return 0;
1366
311
}
1367
1368
static int
1369
list_extend_dictitems(PyListObject *self, PyDictObject *dict)
1370
0
{
1371
0
    Py_ssize_t m = Py_SIZE(self);
1372
0
    Py_ssize_t n = PyDict_GET_SIZE(dict);
1373
0
    Py_ssize_t r = m + n;
1374
0
    if (r == 0) {
1375
0
        return 0;
1376
0
    }
1377
0
    if (list_resize(self, r) < 0) {
1378
0
        return -1;
1379
0
    }
1380
1381
0
    assert(self->ob_item != NULL);
1382
0
    PyObject **dest = self->ob_item + m;
1383
0
    Py_ssize_t pos = 0;
1384
0
    Py_ssize_t i = 0;
1385
0
    PyObject *key, *value;
1386
0
    while (_PyDict_Next((PyObject *)dict, &pos, &key, &value, NULL)) {
1387
0
        PyObject *item = PyTuple_Pack(2, key, value);
1388
0
        if (item == NULL) {
1389
0
            Py_SET_SIZE(self, m + i);
1390
0
            return -1;
1391
0
        }
1392
0
        FT_ATOMIC_STORE_PTR_RELEASE(*dest, item);
1393
0
        dest++;
1394
0
        i++;
1395
0
    }
1396
1397
0
    Py_SET_SIZE(self, r);
1398
0
    return 0;
1399
0
}
1400
1401
static int
1402
_list_extend(PyListObject *self, PyObject *iterable)
1403
26.6M
{
1404
    // Special case:
1405
    // lists and tuples which can use PySequence_Fast ops
1406
26.6M
    int res = -1;
1407
26.6M
    if ((PyObject *)self == iterable) {
1408
0
        Py_BEGIN_CRITICAL_SECTION(self);
1409
0
        res = list_inplace_repeat_lock_held(self, 2);
1410
0
        Py_END_CRITICAL_SECTION();
1411
0
    }
1412
26.6M
    else if (PyList_CheckExact(iterable)) {
1413
9.76M
        Py_BEGIN_CRITICAL_SECTION2(self, iterable);
1414
9.76M
        res = list_extend_lock_held(self, iterable);
1415
9.76M
        Py_END_CRITICAL_SECTION2();
1416
9.76M
    }
1417
16.8M
    else if (PyTuple_CheckExact(iterable)) {
1418
11.4M
        Py_BEGIN_CRITICAL_SECTION(self);
1419
11.4M
        res = list_extend_lock_held(self, iterable);
1420
11.4M
        Py_END_CRITICAL_SECTION();
1421
11.4M
    }
1422
5.35M
    else if (PyAnySet_CheckExact(iterable)) {
1423
19.6k
        Py_BEGIN_CRITICAL_SECTION2(self, iterable);
1424
19.6k
        res = list_extend_set(self, (PySetObject *)iterable);
1425
19.6k
        Py_END_CRITICAL_SECTION2();
1426
19.6k
    }
1427
5.33M
    else if (PyDict_CheckExact(iterable)) {
1428
309
        Py_BEGIN_CRITICAL_SECTION2(self, iterable);
1429
309
        res = list_extend_dict(self, (PyDictObject *)iterable, 0 /*keys*/);
1430
309
        Py_END_CRITICAL_SECTION2();
1431
309
    }
1432
5.33M
    else if (Py_IS_TYPE(iterable, &PyDictKeys_Type)) {
1433
0
        PyDictObject *dict = ((_PyDictViewObject *)iterable)->dv_dict;
1434
0
        Py_BEGIN_CRITICAL_SECTION2(self, dict);
1435
0
        res = list_extend_dict(self, dict, 0 /*keys*/);
1436
0
        Py_END_CRITICAL_SECTION2();
1437
0
    }
1438
5.33M
    else if (Py_IS_TYPE(iterable, &PyDictValues_Type)) {
1439
2
        PyDictObject *dict = ((_PyDictViewObject *)iterable)->dv_dict;
1440
2
        Py_BEGIN_CRITICAL_SECTION2(self, dict);
1441
2
        res = list_extend_dict(self, dict, 1 /*values*/);
1442
2
        Py_END_CRITICAL_SECTION2();
1443
2
    }
1444
5.33M
    else if (Py_IS_TYPE(iterable, &PyDictItems_Type)) {
1445
0
        PyDictObject *dict = ((_PyDictViewObject *)iterable)->dv_dict;
1446
0
        Py_BEGIN_CRITICAL_SECTION2(self, dict);
1447
0
        res = list_extend_dictitems(self, dict);
1448
0
        Py_END_CRITICAL_SECTION2();
1449
0
    }
1450
5.33M
    else {
1451
5.33M
        Py_BEGIN_CRITICAL_SECTION(self);
1452
5.33M
        res = list_extend_iter_lock_held(self, iterable);
1453
5.33M
        Py_END_CRITICAL_SECTION();
1454
5.33M
    }
1455
26.6M
    return res;
1456
26.6M
}
1457
1458
/*[clinic input]
1459
list.extend as list_extend
1460
1461
     iterable: object
1462
     /
1463
1464
Extend list by appending elements from the iterable.
1465
[clinic start generated code]*/
1466
1467
static PyObject *
1468
list_extend_impl(PyListObject *self, PyObject *iterable)
1469
/*[clinic end generated code: output=b0eba9e0b186d5ce input=979da7597a515791]*/
1470
17.6M
{
1471
17.6M
    if (_list_extend(self, iterable) < 0) {
1472
613
        return NULL;
1473
613
    }
1474
17.6M
    Py_RETURN_NONE;
1475
17.6M
}
1476
1477
PyObject *
1478
_PyList_Extend(PyListObject *self, PyObject *iterable)
1479
16.3M
{
1480
16.3M
    return list_extend((PyObject*)self, iterable);
1481
16.3M
}
1482
1483
int
1484
PyList_Extend(PyObject *self, PyObject *iterable)
1485
0
{
1486
0
    if (!PyList_Check(self)) {
1487
0
        PyErr_BadInternalCall();
1488
0
        return -1;
1489
0
    }
1490
0
    return _list_extend((PyListObject*)self, iterable);
1491
0
}
1492
1493
1494
int
1495
PyList_Clear(PyObject *self)
1496
0
{
1497
0
    if (!PyList_Check(self)) {
1498
0
        PyErr_BadInternalCall();
1499
0
        return -1;
1500
0
    }
1501
0
    Py_BEGIN_CRITICAL_SECTION(self);
1502
0
    list_clear((PyListObject*)self);
1503
0
    Py_END_CRITICAL_SECTION();
1504
0
    return 0;
1505
0
}
1506
1507
1508
static PyObject *
1509
list_inplace_concat(PyObject *_self, PyObject *other)
1510
422
{
1511
422
    PyListObject *self = (PyListObject *)_self;
1512
422
    if (_list_extend(self, other) < 0) {
1513
0
        return NULL;
1514
0
    }
1515
422
    return Py_NewRef(self);
1516
422
}
1517
1518
/*[clinic input]
1519
@critical_section
1520
list.pop
1521
1522
    index: Py_ssize_t = -1
1523
    /
1524
1525
Remove and return item at index (default last).
1526
1527
Raises IndexError if list is empty or index is out of range.
1528
[clinic start generated code]*/
1529
1530
static PyObject *
1531
list_pop_impl(PyListObject *self, Py_ssize_t index)
1532
/*[clinic end generated code: output=6bd69dcb3f17eca8 input=c269141068ae4b8f]*/
1533
29.5M
{
1534
29.5M
    PyObject *v;
1535
29.5M
    int status;
1536
1537
29.5M
    if (Py_SIZE(self) == 0) {
1538
        /* Special-case most common failure cause */
1539
0
        PyErr_SetString(PyExc_IndexError, "pop from empty list");
1540
0
        return NULL;
1541
0
    }
1542
29.5M
    if (index < 0)
1543
12.1M
        index += Py_SIZE(self);
1544
29.5M
    if (!valid_index(index, Py_SIZE(self))) {
1545
0
        PyErr_SetString(PyExc_IndexError, "pop index out of range");
1546
0
        return NULL;
1547
0
    }
1548
1549
29.5M
    PyObject **items = self->ob_item;
1550
29.5M
    v = items[index];
1551
29.5M
    const Py_ssize_t size_after_pop = Py_SIZE(self) - 1;
1552
29.5M
    if (size_after_pop == 0) {
1553
12.1M
        Py_INCREF(v);
1554
12.1M
        list_clear(self);
1555
12.1M
        status = 0;
1556
12.1M
    }
1557
17.4M
    else {
1558
17.4M
        if ((size_after_pop - index) > 0) {
1559
10.9M
            memmove(&items[index], &items[index+1], (size_after_pop - index) * sizeof(PyObject *));
1560
10.9M
        }
1561
17.4M
        status = list_resize(self, size_after_pop);
1562
17.4M
    }
1563
29.5M
    if (status >= 0) {
1564
29.5M
        return v; // and v now owns the reference the list had
1565
29.5M
    }
1566
0
    else {
1567
        // list resize failed, need to restore
1568
0
        memmove(&items[index+1], &items[index], (size_after_pop - index)* sizeof(PyObject *));
1569
0
        items[index] = v;
1570
0
        return NULL;
1571
0
    }
1572
29.5M
}
1573
1574
/* Reverse a slice of a list in place, from lo up to (exclusive) hi. */
1575
static void
1576
reverse_slice(PyObject **lo, PyObject **hi)
1577
113k
{
1578
113k
    assert(lo && hi);
1579
1580
113k
    --hi;
1581
464k
    while (lo < hi) {
1582
351k
        PyObject *t = *lo;
1583
351k
        *lo = *hi;
1584
351k
        *hi = t;
1585
351k
        ++lo;
1586
351k
        --hi;
1587
351k
    }
1588
113k
}
1589
1590
/* Lots of code for an adaptive, stable, natural mergesort.  There are many
1591
 * pieces to this algorithm; read listsort.txt for overviews and details.
1592
 */
1593
1594
/* A sortslice contains a pointer to an array of keys and a pointer to
1595
 * an array of corresponding values.  In other words, keys[i]
1596
 * corresponds with values[i].  If values == NULL, then the keys are
1597
 * also the values.
1598
 *
1599
 * Several convenience routines are provided here, so that keys and
1600
 * values are always moved in sync.
1601
 */
1602
1603
typedef struct {
1604
    PyObject **keys;
1605
    PyObject **values;
1606
} sortslice;
1607
1608
Py_LOCAL_INLINE(void)
1609
sortslice_copy(sortslice *s1, Py_ssize_t i, sortslice *s2, Py_ssize_t j)
1610
35.8k
{
1611
35.8k
    s1->keys[i] = s2->keys[j];
1612
35.8k
    if (s1->values != NULL)
1613
34.8k
        s1->values[i] = s2->values[j];
1614
35.8k
}
1615
1616
Py_LOCAL_INLINE(void)
1617
sortslice_copy_incr(sortslice *dst, sortslice *src)
1618
556k
{
1619
556k
    *dst->keys++ = *src->keys++;
1620
556k
    if (dst->values != NULL)
1621
336k
        *dst->values++ = *src->values++;
1622
556k
}
1623
1624
Py_LOCAL_INLINE(void)
1625
sortslice_copy_decr(sortslice *dst, sortslice *src)
1626
330k
{
1627
330k
    *dst->keys-- = *src->keys--;
1628
330k
    if (dst->values != NULL)
1629
259k
        *dst->values-- = *src->values--;
1630
330k
}
1631
1632
1633
Py_LOCAL_INLINE(void)
1634
sortslice_memcpy(sortslice *s1, Py_ssize_t i, sortslice *s2, Py_ssize_t j,
1635
                 Py_ssize_t n)
1636
204k
{
1637
204k
    memcpy(&s1->keys[i], &s2->keys[j], sizeof(PyObject *) * n);
1638
204k
    if (s1->values != NULL)
1639
169k
        memcpy(&s1->values[i], &s2->values[j], sizeof(PyObject *) * n);
1640
204k
}
1641
1642
Py_LOCAL_INLINE(void)
1643
sortslice_memmove(sortslice *s1, Py_ssize_t i, sortslice *s2, Py_ssize_t j,
1644
                  Py_ssize_t n)
1645
140k
{
1646
140k
    memmove(&s1->keys[i], &s2->keys[j], sizeof(PyObject *) * n);
1647
140k
    if (s1->values != NULL)
1648
112k
        memmove(&s1->values[i], &s2->values[j], sizeof(PyObject *) * n);
1649
140k
}
1650
1651
Py_LOCAL_INLINE(void)
1652
sortslice_advance(sortslice *slice, Py_ssize_t n)
1653
820k
{
1654
820k
    slice->keys += n;
1655
820k
    if (slice->values != NULL)
1656
615k
        slice->values += n;
1657
820k
}
1658
1659
/* Comparison function: ms->key_compare, which is set at run-time in
1660
 * listsort_impl to optimize for various special cases.
1661
 * Returns -1 on error, 1 if x < y, 0 if x >= y.
1662
 */
1663
1664
15.3M
#define ISLT(X, Y) (*(ms->key_compare))(X, Y, ms)
1665
1666
/* Compare X to Y via "<".  Goto "fail" if the comparison raises an
1667
   error.  Else "k" is set to true iff X<Y, and an "if (k)" block is
1668
   started.  It makes more sense in context <wink>.  X and Y are PyObject*s.
1669
*/
1670
14.7M
#define IFLT(X, Y) if ((k = ISLT(X, Y)) < 0) goto fail;  \
1671
14.7M
           if (k)
1672
1673
/* The maximum number of entries in a MergeState's pending-runs stack.
1674
 * For a list with n elements, this needs at most floor(log2(n)) + 1 entries
1675
 * even if we didn't force runs to a minimal length.  So the number of bits
1676
 * in a Py_ssize_t is plenty large enough for all cases.
1677
 */
1678
#define MAX_MERGE_PENDING (SIZEOF_SIZE_T * 8)
1679
1680
/* When we get into galloping mode, we stay there until both runs win less
1681
 * often than MIN_GALLOP consecutive times.  See listsort.txt for more info.
1682
 */
1683
1.00M
#define MIN_GALLOP 7
1684
1685
/* Avoid malloc for small temp arrays. */
1686
1.87M
#define MERGESTATE_TEMP_SIZE 256
1687
1688
/* The largest value of minrun. This must be a power of 2, and >= 1 */
1689
795k
#define MAX_MINRUN 64
1690
#if ((MAX_MINRUN) < 1) || ((MAX_MINRUN) & ((MAX_MINRUN) - 1))
1691
#error "MAX_MINRUN must be a power of 2, and >= 1"
1692
#endif
1693
1694
/* One MergeState exists on the stack per invocation of mergesort.  It's just
1695
 * a convenient way to pass state around among the helper functions.
1696
 */
1697
struct s_slice {
1698
    sortslice base;
1699
    Py_ssize_t len;   /* length of run */
1700
    int power; /* node "level" for powersort merge strategy */
1701
};
1702
1703
typedef struct s_MergeState MergeState;
1704
struct s_MergeState {
1705
    /* This controls when we get *into* galloping mode.  It's initialized
1706
     * to MIN_GALLOP.  merge_lo and merge_hi tend to nudge it higher for
1707
     * random data, and lower for highly structured data.
1708
     */
1709
    Py_ssize_t min_gallop;
1710
1711
    Py_ssize_t listlen;     /* len(input_list) - read only */
1712
    PyObject **basekeys;    /* base address of keys array - read only */
1713
1714
    /* 'a' is temp storage to help with merges.  It contains room for
1715
     * alloced entries.
1716
     */
1717
    sortslice a;        /* may point to temparray below */
1718
    Py_ssize_t alloced;
1719
1720
    /* A stack of n pending runs yet to be merged.  Run #i starts at
1721
     * address base[i] and extends for len[i] elements.  It's always
1722
     * true (so long as the indices are in bounds) that
1723
     *
1724
     *     pending[i].base + pending[i].len == pending[i+1].base
1725
     *
1726
     * so we could cut the storage for this, but it's a minor amount,
1727
     * and keeping all the info explicit simplifies the code.
1728
     */
1729
    int n;
1730
    struct s_slice pending[MAX_MERGE_PENDING];
1731
1732
    /* 'a' points to this when possible, rather than muck with malloc. */
1733
    PyObject *temparray[MERGESTATE_TEMP_SIZE];
1734
1735
    /* This is the function we will use to compare two keys,
1736
     * even when none of our special cases apply and we have to use
1737
     * safe_object_compare. */
1738
    int (*key_compare)(PyObject *, PyObject *, MergeState *);
1739
1740
    /* This function is used by unsafe_object_compare to optimize comparisons
1741
     * when we know our list is type-homogeneous but we can't assume anything else.
1742
     * In the pre-sort check it is set equal to Py_TYPE(key)->tp_richcompare */
1743
    PyObject *(*key_richcompare)(PyObject *, PyObject *, int);
1744
1745
    /* This function is used by unsafe_tuple_compare to compare the first elements
1746
     * of tuples. It may be set to safe_object_compare, but the idea is that hopefully
1747
     * we can assume more, and use one of the special-case compares. */
1748
    int (*tuple_elem_compare)(PyObject *, PyObject *, MergeState *);
1749
1750
    /* Varisbles used for minrun computation. The "ideal" minrun length is
1751
     * the infinite precision listlen / 2**e. See listsort.txt.
1752
     */
1753
     Py_ssize_t mr_current, mr_e, mr_mask;
1754
};
1755
1756
/* binarysort is the best method for sorting small arrays: it does few
1757
   compares, but can do data movement quadratic in the number of elements.
1758
   ss->keys is viewed as an array of n kays, a[:n]. a[:ok] is already sorted.
1759
   Pass ok = 0 (or 1) if you don't know.
1760
   It's sorted in-place, by a stable binary insertion sort. If ss->values
1761
   isn't NULL, it's permuted in lockstap with ss->keys.
1762
   On entry, must have n >= 1, and 0 <= ok <= n <= MAX_MINRUN.
1763
   Return -1 if comparison raises an exception, else 0.
1764
   Even in case of error, the output slice will be some permutation of
1765
   the input (nothing is lost or duplicated).
1766
*/
1767
static int
1768
binarysort(MergeState *ms, const sortslice *ss, Py_ssize_t n, Py_ssize_t ok)
1769
124k
{
1770
124k
    Py_ssize_t k; /* for IFLT macro expansion */
1771
124k
    PyObject ** const a = ss->keys;
1772
124k
    PyObject ** const v = ss->values;
1773
124k
    const bool has_values = v != NULL;
1774
124k
    PyObject *pivot;
1775
124k
    Py_ssize_t M;
1776
1777
124k
    assert(0 <= ok && ok <= n && 1 <= n && n <= MAX_MINRUN);
1778
    /* assert a[:ok] is sorted */
1779
124k
    if (! ok)
1780
0
        ++ok;
1781
    /* Regular insertion sort has average- and worst-case O(n**2) cost
1782
       for both # of comparisons and number of bytes moved. But its branches
1783
       are highly predictable, and it loves sorted input (n-1 compares and no
1784
       data movement). This is significant in cases like sortperf.py's %sort,
1785
       where an out-of-order element near the start of a run is moved into
1786
       place slowly but then the remaining elements up to length minrun are
1787
       generally at worst one slot away from their correct position (so only
1788
       need 1 or 2 commpares to resolve). If comparisons are very fast (such
1789
       as for a list of Python floats), the simple inner loop leaves it
1790
       very competitive with binary insertion, despite that it does
1791
       significantly more compares overall on random data.
1792
1793
       Binary insertion sort has worst, average, and best case O(n log n)
1794
       cost for # of comparisons, but worst and average case O(n**2) cost
1795
       for data movement. The more expensive comparisons, the more important
1796
       the comparison advantage. But its branches are less predictable the
1797
       more "randomish" the data, and that's so significant its worst case
1798
       in real life is random input rather than reverse-ordered (which does
1799
       about twice the data movement than random input does).
1800
1801
       Note that the number of bytes moved doesn't seem to matter. MAX_MINRUN
1802
       of 64 is so small that the key and value pointers all fit in a corner
1803
       of L1 cache, and moving things around in that is very fast. */
1804
#if 0 // ordinary insertion sort.
1805
    PyObject * vpivot = NULL;
1806
    for (; ok < n; ++ok) {
1807
        pivot = a[ok];
1808
        if (has_values)
1809
            vpivot = v[ok];
1810
        for (M = ok - 1; M >= 0; --M) {
1811
            k = ISLT(pivot, a[M]);
1812
            if (k < 0) {
1813
                a[M + 1] = pivot;
1814
                if (has_values)
1815
                    v[M + 1] = vpivot;
1816
                goto fail;
1817
            }
1818
            else if (k) {
1819
                a[M + 1] = a[M];
1820
                if (has_values)
1821
                    v[M + 1] = v[M];
1822
            }
1823
            else
1824
                break;
1825
        }
1826
        a[M + 1] = pivot;
1827
        if (has_values)
1828
            v[M + 1] = vpivot;
1829
    }
1830
#else // binary insertion sort
1831
124k
    Py_ssize_t L, R;
1832
2.20M
    for (; ok < n; ++ok) {
1833
        /* set L to where a[ok] belongs */
1834
2.07M
        L = 0;
1835
2.07M
        R = ok;
1836
2.07M
        pivot = a[ok];
1837
        /* Slice invariants. vacuously true at the start:
1838
         * all a[0:L]  <= pivot
1839
         * all a[L:R]     unknown
1840
         * all a[R:ok]  > pivot
1841
         */
1842
2.07M
        assert(L < R);
1843
8.84M
        do {
1844
            /* don't do silly ;-) things to prevent overflow when finding
1845
               the midpoint; L and R are very far from filling a Py_ssize_t */
1846
8.84M
            M = (L + R) >> 1;
1847
8.84M
#if 1 // straightforward, but highly unpredictable branch on random data
1848
8.84M
            IFLT(pivot, a[M])
1849
3.65M
                R = M;
1850
5.19M
            else
1851
5.19M
                L = M + 1;
1852
#else
1853
            /* Try to get compiler to generate conditional move instructions
1854
               instead. Works fine, but leaving it disabled for now because
1855
               it's not yielding consistently faster sorts. Needs more
1856
               investigation. More computation in the inner loop adds its own
1857
               costs, which can be significant when compares are fast. */
1858
            k = ISLT(pivot, a[M]);
1859
            if (k < 0)
1860
                goto fail;
1861
            Py_ssize_t Mp1 = M + 1;
1862
            R = k ? M : R;
1863
            L = k ? L : Mp1;
1864
#endif
1865
8.84M
        } while (L < R);
1866
2.07M
        assert(L == R);
1867
        /* a[:L] holds all elements from a[:ok] <= pivot now, so pivot belongs
1868
           at index L. Slide a[L:ok] to the right a slot to make room for it.
1869
           Caution: using memmove is much slower under MSVC 5; we're not
1870
           usually moving many slots. Years later: under Visual Studio 2022,
1871
           memmove seems just slightly slower than doing it "by hand". */
1872
15.4M
        for (M = ok; M > L; --M)
1873
13.3M
            a[M] = a[M - 1];
1874
2.07M
        a[L] = pivot;
1875
2.07M
        if (has_values) {
1876
1.52M
            pivot = v[ok];
1877
7.86M
            for (M = ok; M > L; --M)
1878
6.34M
                v[M] = v[M - 1];
1879
1.52M
            v[L] = pivot;
1880
1.52M
        }
1881
2.07M
    }
1882
124k
#endif // pick binary or regular insertion sort
1883
124k
    return 0;
1884
1885
0
 fail:
1886
0
    return -1;
1887
124k
}
1888
1889
static void
1890
sortslice_reverse(sortslice *s, Py_ssize_t n)
1891
66.6k
{
1892
66.6k
    reverse_slice(s->keys, &s->keys[n]);
1893
66.6k
    if (s->values != NULL)
1894
46.5k
        reverse_slice(s->values, &s->values[n]);
1895
66.6k
}
1896
1897
/*
1898
Return the length of the run beginning at slo->keys, spanning no more than
1899
nremaining elements. The run beginning there may be ascending or descending,
1900
but the function permutes it in place, if needed, so that it's always ascending
1901
upon return.
1902
1903
Returns -1 in case of error.
1904
*/
1905
static Py_ssize_t
1906
count_run(MergeState *ms, sortslice *slo, Py_ssize_t nremaining)
1907
273k
{
1908
273k
    Py_ssize_t k; /* used by IFLT macro expansion */
1909
273k
    Py_ssize_t n;
1910
273k
    PyObject ** const lo = slo->keys;
1911
1912
    /* In general, as things go on we've established that the slice starts
1913
       with a monotone run of n elements, starting at lo. */
1914
1915
    /* We're n elements into the slice, and the most recent neq+1 elements are
1916
     * all equal. This reverses them in-place, and resets neq for reuse.
1917
     */
1918
273k
#define REVERSE_LAST_NEQ                        \
1919
273k
    if (neq) {                                  \
1920
5.66k
        sortslice slice = *slo;                 \
1921
5.66k
        ++neq;                                  \
1922
5.66k
        sortslice_advance(&slice, n - neq);     \
1923
5.66k
        sortslice_reverse(&slice, neq);         \
1924
5.66k
        neq = 0;                                \
1925
5.66k
    }
1926
1927
    /* Sticking to only __lt__ compares is confusing and error-prone. But in
1928
     * this routine, almost all uses of IFLT can be captured by tiny macros
1929
     * giving mnemonic names to the intent. Note that inline functions don't
1930
     * work for this (IFLT expands to code including `goto fail`).
1931
     */
1932
273k
#define IF_NEXT_LARGER  IFLT(lo[n-1], lo[n])
1933
3.47M
#define IF_NEXT_SMALLER IFLT(lo[n], lo[n-1])
1934
1935
273k
    assert(nremaining);
1936
    /* try ascending run first */
1937
3.01M
    for (n = 1; n < nremaining; ++n) {
1938
2.90M
        IF_NEXT_SMALLER
1939
167k
            break;
1940
2.90M
    }
1941
273k
    if (n == nremaining)
1942
106k
        return n;
1943
    /* lo[n] is strictly less */
1944
    /* If n is 1 now, then the first compare established it's a descending
1945
     * run, so fall through to the descending case. But if n > 1, there are
1946
     * n elements in an ascending run terminated by the strictly less lo[n].
1947
     * If the first key < lo[n-1], *somewhere* along the way the sequence
1948
     * increased, so we're done (there is no descending run).
1949
     * Else first key >= lo[n-1], which implies that the entire ascending run
1950
     * consists of equal elements. In that case, this is a descending run,
1951
     * and we reverse the all-equal prefix in-place.
1952
     */
1953
167k
    if (n > 1) {
1954
116k
        IFLT(lo[0], lo[n-1])
1955
111k
            return n;
1956
5.20k
        sortslice_reverse(slo, n);
1957
5.20k
    }
1958
55.7k
    ++n; /* in all cases it's been established that lo[n] has been resolved */
1959
1960
    /* Finish descending run. All-squal subruns are reversed in-place on the
1961
     * fly. Their original order will be restored at the end by the whole-slice
1962
     * reversal.
1963
     */
1964
55.7k
    Py_ssize_t neq = 0;
1965
97.9k
    for ( ; n < nremaining; ++n) {
1966
78.0k
        IF_NEXT_SMALLER {
1967
            /* This ends the most recent run of equal elements, but still in
1968
             * the "descending" direction.
1969
             */
1970
19.6k
            REVERSE_LAST_NEQ
1971
19.6k
        }
1972
58.4k
        else {
1973
58.4k
            IF_NEXT_LARGER /* descending run is over */
1974
35.8k
                break;
1975
22.6k
            else /* not x < y and not y < x implies x == y */
1976
22.6k
                ++neq;
1977
58.4k
        }
1978
78.0k
    }
1979
55.7k
    REVERSE_LAST_NEQ
1980
55.7k
    sortslice_reverse(slo, n); /* transform to ascending run */
1981
1982
    /* And after reversing, it's possible this can be extended by a
1983
     * naturally increasing suffix; e.g., [3, 2, 3, 4, 1] makes an
1984
     * ascending run from the first 4 elements.
1985
     */
1986
510k
    for ( ; n < nremaining; ++n) {
1987
488k
        IF_NEXT_SMALLER
1988
34.2k
            break;
1989
488k
    }
1990
1991
55.7k
    return n;
1992
0
fail:
1993
0
    return -1;
1994
1995
55.7k
#undef REVERSE_LAST_NEQ
1996
55.7k
#undef IF_NEXT_SMALLER
1997
55.7k
#undef IF_NEXT_LARGER
1998
55.7k
}
1999
2000
/*
2001
Locate the proper position of key in a sorted vector; if the vector contains
2002
an element equal to key, return the position immediately to the left of
2003
the leftmost equal element.  [gallop_right() does the same except returns
2004
the position to the right of the rightmost equal element (if any).]
2005
2006
"a" is a sorted vector with n elements, starting at a[0].  n must be > 0.
2007
2008
"hint" is an index at which to begin the search, 0 <= hint < n.  The closer
2009
hint is to the final result, the faster this runs.
2010
2011
The return value is the int k in 0..n such that
2012
2013
    a[k-1] < key <= a[k]
2014
2015
pretending that *(a-1) is minus infinity and a[n] is plus infinity.  IOW,
2016
key belongs at index k; or, IOW, the first k elements of a should precede
2017
key, and the last n-k should follow key.
2018
2019
Returns -1 on error.  See listsort.txt for info on the method.
2020
*/
2021
static Py_ssize_t
2022
gallop_left(MergeState *ms, PyObject *key, PyObject **a, Py_ssize_t n, Py_ssize_t hint)
2023
196k
{
2024
196k
    Py_ssize_t ofs;
2025
196k
    Py_ssize_t lastofs;
2026
196k
    Py_ssize_t k;
2027
2028
196k
    assert(key && a && n > 0 && hint >= 0 && hint < n);
2029
2030
196k
    a += hint;
2031
196k
    lastofs = 0;
2032
196k
    ofs = 1;
2033
196k
    IFLT(*a, key) {
2034
        /* a[hint] < key -- gallop right, until
2035
         * a[hint + lastofs] < key <= a[hint + ofs]
2036
         */
2037
110k
        const Py_ssize_t maxofs = n - hint;             /* &a[n-1] is highest */
2038
375k
        while (ofs < maxofs) {
2039
298k
            IFLT(a[ofs], key) {
2040
265k
                lastofs = ofs;
2041
265k
                assert(ofs <= (PY_SSIZE_T_MAX - 1) / 2);
2042
265k
                ofs = (ofs << 1) + 1;
2043
265k
            }
2044
33.0k
            else                /* key <= a[hint + ofs] */
2045
33.0k
                break;
2046
298k
        }
2047
110k
        if (ofs > maxofs)
2048
33.5k
            ofs = maxofs;
2049
        /* Translate back to offsets relative to &a[0]. */
2050
110k
        lastofs += hint;
2051
110k
        ofs += hint;
2052
110k
    }
2053
85.6k
    else {
2054
        /* key <= a[hint] -- gallop left, until
2055
         * a[hint - ofs] < key <= a[hint - lastofs]
2056
         */
2057
85.6k
        const Py_ssize_t maxofs = hint + 1;             /* &a[0] is lowest */
2058
284k
        while (ofs < maxofs) {
2059
257k
            IFLT(*(a-ofs), key)
2060
58.4k
                break;
2061
            /* key <= a[hint - ofs] */
2062
199k
            lastofs = ofs;
2063
199k
            assert(ofs <= (PY_SSIZE_T_MAX - 1) / 2);
2064
199k
            ofs = (ofs << 1) + 1;
2065
199k
        }
2066
85.6k
        if (ofs > maxofs)
2067
20.2k
            ofs = maxofs;
2068
        /* Translate back to positive offsets relative to &a[0]. */
2069
85.6k
        k = lastofs;
2070
85.6k
        lastofs = hint - ofs;
2071
85.6k
        ofs = hint - k;
2072
85.6k
    }
2073
196k
    a -= hint;
2074
2075
196k
    assert(-1 <= lastofs && lastofs < ofs && ofs <= n);
2076
    /* Now a[lastofs] < key <= a[ofs], so key belongs somewhere to the
2077
     * right of lastofs but no farther right than ofs.  Do a binary
2078
     * search, with invariant a[lastofs-1] < key <= a[ofs].
2079
     */
2080
196k
    ++lastofs;
2081
590k
    while (lastofs < ofs) {
2082
394k
        Py_ssize_t m = lastofs + ((ofs - lastofs) >> 1);
2083
2084
394k
        IFLT(a[m], key)
2085
204k
            lastofs = m+1;              /* a[m] < key */
2086
190k
        else
2087
190k
            ofs = m;                    /* key <= a[m] */
2088
394k
    }
2089
196k
    assert(lastofs == ofs);             /* so a[ofs-1] < key <= a[ofs] */
2090
196k
    return ofs;
2091
2092
0
fail:
2093
0
    return -1;
2094
196k
}
2095
2096
/*
2097
Exactly like gallop_left(), except that if key already exists in a[0:n],
2098
finds the position immediately to the right of the rightmost equal value.
2099
2100
The return value is the int k in 0..n such that
2101
2102
    a[k-1] <= key < a[k]
2103
2104
or -1 if error.
2105
2106
The code duplication is massive, but this is enough different given that
2107
we're sticking to "<" comparisons that it's much harder to follow if
2108
written as one routine with yet another "left or right?" flag.
2109
*/
2110
static Py_ssize_t
2111
gallop_right(MergeState *ms, PyObject *key, PyObject **a, Py_ssize_t n, Py_ssize_t hint)
2112
219k
{
2113
219k
    Py_ssize_t ofs;
2114
219k
    Py_ssize_t lastofs;
2115
219k
    Py_ssize_t k;
2116
2117
219k
    assert(key && a && n > 0 && hint >= 0 && hint < n);
2118
2119
219k
    a += hint;
2120
219k
    lastofs = 0;
2121
219k
    ofs = 1;
2122
219k
    IFLT(key, *a) {
2123
        /* key < a[hint] -- gallop left, until
2124
         * a[hint - ofs] <= key < a[hint - lastofs]
2125
         */
2126
87.3k
        const Py_ssize_t maxofs = hint + 1;             /* &a[0] is lowest */
2127
206k
        while (ofs < maxofs) {
2128
136k
            IFLT(key, *(a-ofs)) {
2129
118k
                lastofs = ofs;
2130
118k
                assert(ofs <= (PY_SSIZE_T_MAX - 1) / 2);
2131
118k
                ofs = (ofs << 1) + 1;
2132
118k
            }
2133
17.4k
            else                /* a[hint - ofs] <= key */
2134
17.4k
                break;
2135
136k
        }
2136
87.3k
        if (ofs > maxofs)
2137
13.3k
            ofs = maxofs;
2138
        /* Translate back to positive offsets relative to &a[0]. */
2139
87.3k
        k = lastofs;
2140
87.3k
        lastofs = hint - ofs;
2141
87.3k
        ofs = hint - k;
2142
87.3k
    }
2143
131k
    else {
2144
        /* a[hint] <= key -- gallop right, until
2145
         * a[hint + lastofs] <= key < a[hint + ofs]
2146
        */
2147
131k
        const Py_ssize_t maxofs = n - hint;             /* &a[n-1] is highest */
2148
453k
        while (ofs < maxofs) {
2149
394k
            IFLT(key, a[ofs])
2150
73.3k
                break;
2151
            /* a[hint + ofs] <= key */
2152
321k
            lastofs = ofs;
2153
321k
            assert(ofs <= (PY_SSIZE_T_MAX - 1) / 2);
2154
321k
            ofs = (ofs << 1) + 1;
2155
321k
        }
2156
131k
        if (ofs > maxofs)
2157
33.7k
            ofs = maxofs;
2158
        /* Translate back to offsets relative to &a[0]. */
2159
131k
        lastofs += hint;
2160
131k
        ofs += hint;
2161
131k
    }
2162
219k
    a -= hint;
2163
2164
219k
    assert(-1 <= lastofs && lastofs < ofs && ofs <= n);
2165
    /* Now a[lastofs] <= key < a[ofs], so key belongs somewhere to the
2166
     * right of lastofs but no farther right than ofs.  Do a binary
2167
     * search, with invariant a[lastofs-1] <= key < a[ofs].
2168
     */
2169
219k
    ++lastofs;
2170
596k
    while (lastofs < ofs) {
2171
376k
        Py_ssize_t m = lastofs + ((ofs - lastofs) >> 1);
2172
2173
376k
        IFLT(key, a[m])
2174
197k
            ofs = m;                    /* key < a[m] */
2175
179k
        else
2176
179k
            lastofs = m+1;              /* a[m] <= key */
2177
376k
    }
2178
219k
    assert(lastofs == ofs);             /* so a[ofs-1] <= key < a[ofs] */
2179
219k
    return ofs;
2180
2181
0
fail:
2182
0
    return -1;
2183
219k
}
2184
2185
/* Conceptually a MergeState's constructor. */
2186
static void
2187
merge_init(MergeState *ms, Py_ssize_t list_size, int has_keyfunc,
2188
           sortslice *lo)
2189
769k
{
2190
769k
    assert(ms != NULL);
2191
769k
    if (has_keyfunc) {
2192
        /* The temporary space for merging will need at most half the list
2193
         * size rounded up.  Use the minimum possible space so we can use the
2194
         * rest of temparray for other things.  In particular, if there is
2195
         * enough extra space, listsort() will use it to store the keys.
2196
         */
2197
551k
        ms->alloced = (list_size + 1) / 2;
2198
2199
        /* ms->alloced describes how many keys will be stored at
2200
           ms->temparray, but we also need to store the values.  Hence,
2201
           ms->alloced is capped at half of MERGESTATE_TEMP_SIZE. */
2202
551k
        if (MERGESTATE_TEMP_SIZE / 2 < ms->alloced)
2203
2.29k
            ms->alloced = MERGESTATE_TEMP_SIZE / 2;
2204
551k
        ms->a.values = &ms->temparray[ms->alloced];
2205
551k
    }
2206
217k
    else {
2207
217k
        ms->alloced = MERGESTATE_TEMP_SIZE;
2208
217k
        ms->a.values = NULL;
2209
217k
    }
2210
769k
    ms->a.keys = ms->temparray;
2211
769k
    ms->n = 0;
2212
769k
    ms->min_gallop = MIN_GALLOP;
2213
769k
    ms->listlen = list_size;
2214
769k
    ms->basekeys = lo->keys;
2215
2216
    /* State for generating minrun values. See listsort.txt. */
2217
769k
    ms->mr_e = 0;
2218
795k
    while (list_size >> ms->mr_e >= MAX_MINRUN) {
2219
26.7k
        ++ms->mr_e;
2220
26.7k
    }
2221
769k
    ms->mr_mask = (1 << ms->mr_e) - 1;
2222
769k
    ms->mr_current = 0;
2223
769k
}
2224
2225
/* Free all the temp memory owned by the MergeState.  This must be called
2226
 * when you're done with a MergeState, and may be called before then if
2227
 * you want to free the temp memory early.
2228
 */
2229
static void
2230
merge_freemem(MergeState *ms)
2231
774k
{
2232
774k
    assert(ms != NULL);
2233
774k
    if (ms->a.keys != ms->temparray) {
2234
5.31k
        PyMem_Free(ms->a.keys);
2235
5.31k
        ms->a.keys = NULL;
2236
5.31k
    }
2237
774k
}
2238
2239
/* Ensure enough temp memory for 'need' array slots is available.
2240
 * Returns 0 on success and -1 if the memory can't be gotten.
2241
 */
2242
static int
2243
merge_getmem(MergeState *ms, Py_ssize_t need)
2244
5.31k
{
2245
5.31k
    int multiplier;
2246
2247
5.31k
    assert(ms != NULL);
2248
5.31k
    if (need <= ms->alloced)
2249
0
        return 0;
2250
2251
5.31k
    multiplier = ms->a.values != NULL ? 2 : 1;
2252
2253
    /* Don't realloc!  That can cost cycles to copy the old data, but
2254
     * we don't care what's in the block.
2255
     */
2256
5.31k
    merge_freemem(ms);
2257
5.31k
    if ((size_t)need > PY_SSIZE_T_MAX / sizeof(PyObject *) / multiplier) {
2258
0
        PyErr_NoMemory();
2259
0
        return -1;
2260
0
    }
2261
5.31k
    ms->a.keys = (PyObject **)PyMem_Malloc(multiplier * need
2262
5.31k
                                          * sizeof(PyObject *));
2263
5.31k
    if (ms->a.keys != NULL) {
2264
5.31k
        ms->alloced = need;
2265
5.31k
        if (ms->a.values != NULL)
2266
4.80k
            ms->a.values = &ms->a.keys[need];
2267
5.31k
        return 0;
2268
5.31k
    }
2269
0
    PyErr_NoMemory();
2270
0
    return -1;
2271
5.31k
}
2272
75.5k
#define MERGE_GETMEM(MS, NEED) ((NEED) <= (MS)->alloced ? 0 :   \
2273
75.5k
                                merge_getmem(MS, NEED))
2274
2275
/* Merge the na elements starting at ssa with the nb elements starting at
2276
 * ssb.keys = ssa.keys + na in a stable way, in-place.  na and nb must be > 0.
2277
 * Must also have that ssa.keys[na-1] belongs at the end of the merge, and
2278
 * should have na <= nb.  See listsort.txt for more info.  Return 0 if
2279
 * successful, -1 if error.
2280
 */
2281
static Py_ssize_t
2282
merge_lo(MergeState *ms, sortslice ssa, Py_ssize_t na,
2283
         sortslice ssb, Py_ssize_t nb)
2284
49.5k
{
2285
49.5k
    Py_ssize_t k;
2286
49.5k
    sortslice dest;
2287
49.5k
    int result = -1;            /* guilty until proved innocent */
2288
49.5k
    Py_ssize_t min_gallop;
2289
2290
49.5k
    assert(ms && ssa.keys && ssb.keys && na > 0 && nb > 0);
2291
49.5k
    assert(ssa.keys + na == ssb.keys);
2292
49.5k
    if (MERGE_GETMEM(ms, na) < 0)
2293
0
        return -1;
2294
49.5k
    sortslice_memcpy(&ms->a, 0, &ssa, 0, na);
2295
49.5k
    dest = ssa;
2296
49.5k
    ssa = ms->a;
2297
2298
49.5k
    sortslice_copy_incr(&dest, &ssb);
2299
49.5k
    --nb;
2300
49.5k
    if (nb == 0)
2301
3.67k
        goto Succeed;
2302
45.8k
    if (na == 1)
2303
7.15k
        goto CopyB;
2304
2305
38.6k
    min_gallop = ms->min_gallop;
2306
57.9k
    for (;;) {
2307
57.9k
        Py_ssize_t acount = 0;          /* # of times A won in a row */
2308
57.9k
        Py_ssize_t bcount = 0;          /* # of times B won in a row */
2309
2310
        /* Do the straightforward thing until (if ever) one run
2311
         * appears to win consistently.
2312
         */
2313
365k
        for (;;) {
2314
365k
            assert(na > 1 && nb > 0);
2315
365k
            k = ISLT(ssb.keys[0], ssa.keys[0]);
2316
365k
            if (k) {
2317
198k
                if (k < 0)
2318
0
                    goto Fail;
2319
198k
                sortslice_copy_incr(&dest, &ssb);
2320
198k
                ++bcount;
2321
198k
                acount = 0;
2322
198k
                --nb;
2323
198k
                if (nb == 0)
2324
3.58k
                    goto Succeed;
2325
195k
                if (bcount >= min_gallop)
2326
27.9k
                    break;
2327
195k
            }
2328
166k
            else {
2329
166k
                sortslice_copy_incr(&dest, &ssa);
2330
166k
                ++acount;
2331
166k
                bcount = 0;
2332
166k
                --na;
2333
166k
                if (na == 1)
2334
2.75k
                    goto CopyB;
2335
163k
                if (acount >= min_gallop)
2336
23.6k
                    break;
2337
163k
            }
2338
365k
        }
2339
2340
        /* One run is winning so consistently that galloping may
2341
         * be a huge win.  So try that, and continue galloping until
2342
         * (if ever) neither run appears to be winning consistently
2343
         * anymore.
2344
         */
2345
51.5k
        ++min_gallop;
2346
89.4k
        do {
2347
89.4k
            assert(na > 1 && nb > 0);
2348
89.4k
            min_gallop -= min_gallop > 1;
2349
89.4k
            ms->min_gallop = min_gallop;
2350
89.4k
            k = gallop_right(ms, ssb.keys[0], ssa.keys, na, 0);
2351
89.4k
            acount = k;
2352
89.4k
            if (k) {
2353
52.1k
                if (k < 0)
2354
0
                    goto Fail;
2355
52.1k
                sortslice_memcpy(&dest, 0, &ssa, 0, k);
2356
52.1k
                sortslice_advance(&dest, k);
2357
52.1k
                sortslice_advance(&ssa, k);
2358
52.1k
                na -= k;
2359
52.1k
                if (na == 1)
2360
8.81k
                    goto CopyB;
2361
                /* na==0 is impossible now if the comparison
2362
                 * function is consistent, but we can't assume
2363
                 * that it is.
2364
                 */
2365
43.3k
                if (na == 0)
2366
0
                    goto Succeed;
2367
43.3k
            }
2368
80.6k
            sortslice_copy_incr(&dest, &ssb);
2369
80.6k
            --nb;
2370
80.6k
            if (nb == 0)
2371
2.26k
                goto Succeed;
2372
2373
78.4k
            k = gallop_left(ms, ssa.keys[0], ssb.keys, nb, 0);
2374
78.4k
            bcount = k;
2375
78.4k
            if (k) {
2376
72.2k
                if (k < 0)
2377
0
                    goto Fail;
2378
72.2k
                sortslice_memmove(&dest, 0, &ssb, 0, k);
2379
72.2k
                sortslice_advance(&dest, k);
2380
72.2k
                sortslice_advance(&ssb, k);
2381
72.2k
                nb -= k;
2382
72.2k
                if (nb == 0)
2383
17.3k
                    goto Succeed;
2384
72.2k
            }
2385
61.0k
            sortslice_copy_incr(&dest, &ssa);
2386
61.0k
            --na;
2387
61.0k
            if (na == 1)
2388
3.94k
                goto CopyB;
2389
61.0k
        } while (acount >= MIN_GALLOP || bcount >= MIN_GALLOP);
2390
19.2k
        ++min_gallop;           /* penalize it for leaving galloping mode */
2391
19.2k
        ms->min_gallop = min_gallop;
2392
19.2k
    }
2393
26.8k
Succeed:
2394
26.8k
    result = 0;
2395
26.8k
Fail:
2396
26.8k
    if (na)
2397
26.8k
        sortslice_memcpy(&dest, 0, &ssa, 0, na);
2398
26.8k
    return result;
2399
22.6k
CopyB:
2400
22.6k
    assert(na == 1 && nb > 0);
2401
    /* The last element of ssa belongs at the end of the merge. */
2402
22.6k
    sortslice_memmove(&dest, 0, &ssb, 0, nb);
2403
22.6k
    sortslice_copy(&dest, nb, &ssa, 0);
2404
22.6k
    return 0;
2405
26.8k
}
2406
2407
/* Merge the na elements starting at pa with the nb elements starting at
2408
 * ssb.keys = ssa.keys + na in a stable way, in-place.  na and nb must be > 0.
2409
 * Must also have that ssa.keys[na-1] belongs at the end of the merge, and
2410
 * should have na >= nb.  See listsort.txt for more info.  Return 0 if
2411
 * successful, -1 if error.
2412
 */
2413
static Py_ssize_t
2414
merge_hi(MergeState *ms, sortslice ssa, Py_ssize_t na,
2415
         sortslice ssb, Py_ssize_t nb)
2416
25.9k
{
2417
25.9k
    Py_ssize_t k;
2418
25.9k
    sortslice dest, basea, baseb;
2419
25.9k
    int result = -1;            /* guilty until proved innocent */
2420
25.9k
    Py_ssize_t min_gallop;
2421
2422
25.9k
    assert(ms && ssa.keys && ssb.keys && na > 0 && nb > 0);
2423
25.9k
    assert(ssa.keys + na == ssb.keys);
2424
25.9k
    if (MERGE_GETMEM(ms, nb) < 0)
2425
0
        return -1;
2426
25.9k
    dest = ssb;
2427
25.9k
    sortslice_advance(&dest, nb-1);
2428
25.9k
    sortslice_memcpy(&ms->a, 0, &ssb, 0, nb);
2429
25.9k
    basea = ssa;
2430
25.9k
    baseb = ms->a;
2431
25.9k
    ssb.keys = ms->a.keys + nb - 1;
2432
25.9k
    if (ssb.values != NULL)
2433
22.5k
        ssb.values = ms->a.values + nb - 1;
2434
25.9k
    sortslice_advance(&ssa, na - 1);
2435
2436
25.9k
    sortslice_copy_decr(&dest, &ssa);
2437
25.9k
    --na;
2438
25.9k
    if (na == 0)
2439
0
        goto Succeed;
2440
25.9k
    if (nb == 1)
2441
876
        goto CopyA;
2442
2443
25.1k
    min_gallop = ms->min_gallop;
2444
33.9k
    for (;;) {
2445
33.9k
        Py_ssize_t acount = 0;          /* # of times A won in a row */
2446
33.9k
        Py_ssize_t bcount = 0;          /* # of times B won in a row */
2447
2448
        /* Do the straightforward thing until (if ever) one run
2449
         * appears to win consistently.
2450
         */
2451
230k
        for (;;) {
2452
230k
            assert(na > 0 && nb > 1);
2453
230k
            k = ISLT(ssb.keys[0], ssa.keys[0]);
2454
230k
            if (k) {
2455
106k
                if (k < 0)
2456
0
                    goto Fail;
2457
106k
                sortslice_copy_decr(&dest, &ssa);
2458
106k
                ++acount;
2459
106k
                bcount = 0;
2460
106k
                --na;
2461
106k
                if (na == 0)
2462
592
                    goto Succeed;
2463
105k
                if (acount >= min_gallop)
2464
14.7k
                    break;
2465
105k
            }
2466
123k
            else {
2467
123k
                sortslice_copy_decr(&dest, &ssb);
2468
123k
                ++bcount;
2469
123k
                acount = 0;
2470
123k
                --nb;
2471
123k
                if (nb == 1)
2472
383
                    goto CopyA;
2473
123k
                if (bcount >= min_gallop)
2474
18.2k
                    break;
2475
123k
            }
2476
230k
        }
2477
2478
        /* One run is winning so consistently that galloping may
2479
         * be a huge win.  So try that, and continue galloping until
2480
         * (if ever) neither run appears to be winning consistently
2481
         * anymore.
2482
         */
2483
32.9k
        ++min_gallop;
2484
54.0k
        do {
2485
54.0k
            assert(na > 0 && nb > 1);
2486
54.0k
            min_gallop -= min_gallop > 1;
2487
54.0k
            ms->min_gallop = min_gallop;
2488
54.0k
            k = gallop_right(ms, ssb.keys[0], basea.keys, na, na-1);
2489
54.0k
            if (k < 0)
2490
0
                goto Fail;
2491
54.0k
            k = na - k;
2492
54.0k
            acount = k;
2493
54.0k
            if (k) {
2494
31.9k
                sortslice_advance(&dest, -k);
2495
31.9k
                sortslice_advance(&ssa, -k);
2496
31.9k
                sortslice_memmove(&dest, 1, &ssa, 1, k);
2497
31.9k
                na -= k;
2498
31.9k
                if (na == 0)
2499
11.1k
                    goto Succeed;
2500
31.9k
            }
2501
42.9k
            sortslice_copy_decr(&dest, &ssb);
2502
42.9k
            --nb;
2503
42.9k
            if (nb == 1)
2504
811
                goto CopyA;
2505
2506
42.1k
            k = gallop_left(ms, ssa.keys[0], baseb.keys, nb, nb-1);
2507
42.1k
            if (k < 0)
2508
0
                goto Fail;
2509
42.1k
            k = nb - k;
2510
42.1k
            bcount = k;
2511
42.1k
            if (k) {
2512
37.0k
                sortslice_advance(&dest, -k);
2513
37.0k
                sortslice_advance(&ssb, -k);
2514
37.0k
                sortslice_memcpy(&dest, 1, &ssb, 1, k);
2515
37.0k
                nb -= k;
2516
37.0k
                if (nb == 1)
2517
11.1k
                    goto CopyA;
2518
                /* nb==0 is impossible now if the comparison
2519
                 * function is consistent, but we can't assume
2520
                 * that it is.
2521
                 */
2522
25.8k
                if (nb == 0)
2523
0
                    goto Succeed;
2524
25.8k
            }
2525
31.0k
            sortslice_copy_decr(&dest, &ssa);
2526
31.0k
            --na;
2527
31.0k
            if (na == 0)
2528
1.10k
                goto Succeed;
2529
31.0k
        } while (acount >= MIN_GALLOP || bcount >= MIN_GALLOP);
2530
8.84k
        ++min_gallop;           /* penalize it for leaving galloping mode */
2531
8.84k
        ms->min_gallop = min_gallop;
2532
8.84k
    }
2533
12.8k
Succeed:
2534
12.8k
    result = 0;
2535
12.8k
Fail:
2536
12.8k
    if (nb)
2537
12.8k
        sortslice_memcpy(&dest, -(nb-1), &baseb, 0, nb);
2538
12.8k
    return result;
2539
13.1k
CopyA:
2540
13.1k
    assert(nb == 1 && na > 0);
2541
    /* The first element of ssb belongs at the front of the merge. */
2542
13.1k
    sortslice_memmove(&dest, 1-na, &ssa, 1-na, na);
2543
13.1k
    sortslice_advance(&dest, -na);
2544
13.1k
    sortslice_advance(&ssa, -na);
2545
13.1k
    sortslice_copy(&dest, 0, &ssb, 0);
2546
13.1k
    return 0;
2547
12.8k
}
2548
2549
/* Merge the two runs at stack indices i and i+1.
2550
 * Returns 0 on success, -1 on error.
2551
 */
2552
static Py_ssize_t
2553
merge_at(MergeState *ms, Py_ssize_t i)
2554
75.5k
{
2555
75.5k
    sortslice ssa, ssb;
2556
75.5k
    Py_ssize_t na, nb;
2557
75.5k
    Py_ssize_t k;
2558
2559
75.5k
    assert(ms != NULL);
2560
75.5k
    assert(ms->n >= 2);
2561
75.5k
    assert(i >= 0);
2562
75.5k
    assert(i == ms->n - 2 || i == ms->n - 3);
2563
2564
75.5k
    ssa = ms->pending[i].base;
2565
75.5k
    na = ms->pending[i].len;
2566
75.5k
    ssb = ms->pending[i+1].base;
2567
75.5k
    nb = ms->pending[i+1].len;
2568
75.5k
    assert(na > 0 && nb > 0);
2569
75.5k
    assert(ssa.keys + na == ssb.keys);
2570
2571
    /* Record the length of the combined runs; if i is the 3rd-last
2572
     * run now, also slide over the last run (which isn't involved
2573
     * in this merge).  The current run i+1 goes away in any case.
2574
     */
2575
75.5k
    ms->pending[i].len = na + nb;
2576
75.5k
    if (i == ms->n - 3)
2577
441
        ms->pending[i+1] = ms->pending[i+2];
2578
75.5k
    --ms->n;
2579
2580
    /* Where does b start in a?  Elements in a before that can be
2581
     * ignored (already in place).
2582
     */
2583
75.5k
    k = gallop_right(ms, *ssb.keys, ssa.keys, na, 0);
2584
75.5k
    if (k < 0)
2585
0
        return -1;
2586
75.5k
    sortslice_advance(&ssa, k);
2587
75.5k
    na -= k;
2588
75.5k
    if (na == 0)
2589
26
        return 0;
2590
2591
    /* Where does a end in b?  Elements in b after that can be
2592
     * ignored (already in place).
2593
     */
2594
75.5k
    nb = gallop_left(ms, ssa.keys[na-1], ssb.keys, nb, nb-1);
2595
75.5k
    if (nb <= 0)
2596
0
        return nb;
2597
2598
    /* Merge what remains of the runs, using a temp array with
2599
     * min(na, nb) elements.
2600
     */
2601
75.5k
    if (na <= nb)
2602
49.5k
        return merge_lo(ms, ssa, na, ssb, nb);
2603
25.9k
    else
2604
25.9k
        return merge_hi(ms, ssa, na, ssb, nb);
2605
75.5k
}
2606
2607
/* Two adjacent runs begin at index s1. The first run has length n1, and
2608
 * the second run (starting at index s1+n1) has length n2. The list has total
2609
 * length n.
2610
 * Compute the "power" of the first run. See listsort.txt for details.
2611
 */
2612
static int
2613
powerloop(Py_ssize_t s1, Py_ssize_t n1, Py_ssize_t n2, Py_ssize_t n)
2614
75.5k
{
2615
75.5k
    int result = 0;
2616
75.5k
    assert(s1 >= 0);
2617
75.5k
    assert(n1 > 0 && n2 > 0);
2618
75.5k
    assert(s1 + n1 + n2 <= n);
2619
    /* midpoints a and b:
2620
     * a = s1 + n1/2
2621
     * b = s1 + n1 + n2/2 = a + (n1 + n2)/2
2622
     *
2623
     * Those may not be integers, though, because of the "/2". So we work with
2624
     * 2*a and 2*b instead, which are necessarily integers. It makes no
2625
     * difference to the outcome, since the bits in the expansion of (2*i)/n
2626
     * are merely shifted one position from those of i/n.
2627
     */
2628
75.5k
    Py_ssize_t a = 2 * s1 + n1;  /* 2*a */
2629
75.5k
    Py_ssize_t b = a + n1 + n2;  /* 2*b */
2630
    /* Emulate a/n and b/n one bit a time, until bits differ. */
2631
307k
    for (;;) {
2632
307k
        ++result;
2633
307k
        if (a >= n) {  /* both quotient bits are 1 */
2634
119k
            assert(b >= a);
2635
119k
            a -= n;
2636
119k
            b -= n;
2637
119k
        }
2638
188k
        else if (b >= n) {  /* a/n bit is 0, b/n bit is 1 */
2639
75.5k
            break;
2640
75.5k
        } /* else both quotient bits are 0 */
2641
231k
        assert(a < b && b < n);
2642
231k
        a <<= 1;
2643
231k
        b <<= 1;
2644
231k
    }
2645
75.5k
    return result;
2646
75.5k
}
2647
2648
/* The next run has been identified, of length n2.
2649
 * If there's already a run on the stack, apply the "powersort" merge strategy:
2650
 * compute the topmost run's "power" (depth in a conceptual binary merge tree)
2651
 * and merge adjacent runs on the stack with greater power. See listsort.txt
2652
 * for more info.
2653
 *
2654
 * It's the caller's responsibility to push the new run on the stack when this
2655
 * returns.
2656
 *
2657
 * Returns 0 on success, -1 on error.
2658
 */
2659
static int
2660
found_new_run(MergeState *ms, Py_ssize_t n2)
2661
273k
{
2662
273k
    assert(ms);
2663
273k
    if (ms->n) {
2664
75.5k
        assert(ms->n > 0);
2665
75.5k
        struct s_slice *p = ms->pending;
2666
75.5k
        Py_ssize_t s1 = p[ms->n - 1].base.keys - ms->basekeys; /* start index */
2667
75.5k
        Py_ssize_t n1 = p[ms->n - 1].len;
2668
75.5k
        int power = powerloop(s1, n1, n2, ms->listlen);
2669
126k
        while (ms->n > 1 && p[ms->n - 2].power > power) {
2670
50.8k
            if (merge_at(ms, ms->n - 2) < 0)
2671
0
                return -1;
2672
50.8k
        }
2673
75.5k
        assert(ms->n < 2 || p[ms->n - 2].power < power);
2674
75.5k
        p[ms->n - 1].power = power;
2675
75.5k
    }
2676
273k
    return 0;
2677
273k
}
2678
2679
/* Regardless of invariants, merge all runs on the stack until only one
2680
 * remains.  This is used at the end of the mergesort.
2681
 *
2682
 * Returns 0 on success, -1 on error.
2683
 */
2684
static int
2685
merge_force_collapse(MergeState *ms)
2686
198k
{
2687
198k
    struct s_slice *p = ms->pending;
2688
2689
198k
    assert(ms);
2690
223k
    while (ms->n > 1) {
2691
24.6k
        Py_ssize_t n = ms->n - 2;
2692
24.6k
        if (n > 0 && p[n-1].len < p[n+1].len)
2693
441
            --n;
2694
24.6k
        if (merge_at(ms, n) < 0)
2695
0
            return -1;
2696
24.6k
    }
2697
198k
    return 0;
2698
198k
}
2699
2700
/* Return the next minrun value to use. See listsort.txt. */
2701
Py_LOCAL_INLINE(Py_ssize_t)
2702
minrun_next(MergeState *ms)
2703
273k
{
2704
273k
    ms->mr_current += ms->listlen;
2705
273k
    assert(ms->mr_current >= 0); /* no overflow */
2706
273k
    Py_ssize_t result = ms->mr_current >> ms->mr_e;
2707
273k
    ms->mr_current &= ms->mr_mask;
2708
273k
    return result;
2709
273k
}
2710
2711
/* Here we define custom comparison functions to optimize for the cases one commonly
2712
 * encounters in practice: homogeneous lists, often of one of the basic types. */
2713
2714
/* This struct holds the comparison function and helper functions
2715
 * selected in the pre-sort check. */
2716
2717
/* These are the special case compare functions.
2718
 * ms->key_compare will always point to one of these: */
2719
2720
/* Heterogeneous compare: default, always safe to fall back on. */
2721
static int
2722
safe_object_compare(PyObject *v, PyObject *w, MergeState *ms)
2723
0
{
2724
    /* No assumptions necessary! */
2725
0
    return PyObject_RichCompareBool(v, w, Py_LT);
2726
0
}
2727
2728
/* Homogeneous compare: safe for any two comparable objects of the same type.
2729
 * (ms->key_richcompare is set to ob_type->tp_richcompare in the
2730
 *  pre-sort check.)
2731
 */
2732
static int
2733
unsafe_object_compare(PyObject *v, PyObject *w, MergeState *ms)
2734
9.55M
{
2735
9.55M
    PyObject *res_obj; int res;
2736
2737
    /* No assumptions, because we check first: */
2738
9.55M
    if (Py_TYPE(v)->tp_richcompare != ms->key_richcompare)
2739
0
        return PyObject_RichCompareBool(v, w, Py_LT);
2740
2741
9.55M
    assert(ms->key_richcompare != NULL);
2742
9.55M
    res_obj = (*(ms->key_richcompare))(v, w, Py_LT);
2743
2744
9.55M
    if (res_obj == Py_NotImplemented) {
2745
0
        Py_DECREF(res_obj);
2746
0
        return PyObject_RichCompareBool(v, w, Py_LT);
2747
0
    }
2748
9.55M
    if (res_obj == NULL)
2749
0
        return -1;
2750
2751
9.55M
    if (PyBool_Check(res_obj)) {
2752
9.55M
        res = (res_obj == Py_True);
2753
9.55M
    }
2754
0
    else {
2755
0
        res = PyObject_IsTrue(res_obj);
2756
0
    }
2757
9.55M
    Py_DECREF(res_obj);
2758
2759
    /* Note that we can't assert
2760
     *     res == PyObject_RichCompareBool(v, w, Py_LT);
2761
     * because of evil compare functions like this:
2762
     *     lambda a, b:  int(random.random() * 3) - 1)
2763
     * (which is actually in test_sort.py) */
2764
9.55M
    return res;
2765
9.55M
}
2766
2767
/* Latin string compare: safe for any two latin (one byte per char) strings. */
2768
static int
2769
unsafe_latin_compare(PyObject *v, PyObject *w, MergeState *ms)
2770
274k
{
2771
274k
    Py_ssize_t len;
2772
274k
    int res;
2773
2774
    /* Modified from Objects/unicodeobject.c:unicode_compare, assuming: */
2775
274k
    assert(Py_IS_TYPE(v, &PyUnicode_Type));
2776
274k
    assert(Py_IS_TYPE(w, &PyUnicode_Type));
2777
274k
    assert(PyUnicode_KIND(v) == PyUnicode_KIND(w));
2778
274k
    assert(PyUnicode_KIND(v) == PyUnicode_1BYTE_KIND);
2779
2780
274k
    len = Py_MIN(PyUnicode_GET_LENGTH(v), PyUnicode_GET_LENGTH(w));
2781
274k
    res = memcmp(PyUnicode_DATA(v), PyUnicode_DATA(w), len);
2782
2783
274k
    res = (res != 0 ?
2784
269k
           res < 0 :
2785
274k
           PyUnicode_GET_LENGTH(v) < PyUnicode_GET_LENGTH(w));
2786
2787
274k
    assert(res == PyObject_RichCompareBool(v, w, Py_LT));;
2788
274k
    return res;
2789
274k
}
2790
2791
/* Bounded int compare: compare any two longs that fit in a single machine word. */
2792
static int
2793
unsafe_long_compare(PyObject *v, PyObject *w, MergeState *ms)
2794
5.53M
{
2795
5.53M
    PyLongObject *vl, *wl;
2796
5.53M
    intptr_t v0, w0;
2797
5.53M
    int res;
2798
2799
    /* Modified from Objects/longobject.c:long_compare, assuming: */
2800
5.53M
    assert(Py_IS_TYPE(v, &PyLong_Type));
2801
5.53M
    assert(Py_IS_TYPE(w, &PyLong_Type));
2802
5.53M
    assert(_PyLong_IsCompact((PyLongObject *)v));
2803
5.53M
    assert(_PyLong_IsCompact((PyLongObject *)w));
2804
2805
5.53M
    vl = (PyLongObject*)v;
2806
5.53M
    wl = (PyLongObject*)w;
2807
2808
5.53M
    v0 = _PyLong_CompactValue(vl);
2809
5.53M
    w0 = _PyLong_CompactValue(wl);
2810
2811
5.53M
    res = v0 < w0;
2812
5.53M
    assert(res == PyObject_RichCompareBool(v, w, Py_LT));
2813
5.53M
    return res;
2814
5.53M
}
2815
2816
/* Float compare: compare any two floats. */
2817
static int
2818
unsafe_float_compare(PyObject *v, PyObject *w, MergeState *ms)
2819
0
{
2820
0
    int res;
2821
2822
    /* Modified from Objects/floatobject.c:float_richcompare, assuming: */
2823
0
    assert(Py_IS_TYPE(v, &PyFloat_Type));
2824
0
    assert(Py_IS_TYPE(w, &PyFloat_Type));
2825
2826
0
    res = PyFloat_AS_DOUBLE(v) < PyFloat_AS_DOUBLE(w);
2827
0
    assert(res == PyObject_RichCompareBool(v, w, Py_LT));
2828
0
    return res;
2829
0
}
2830
2831
/* Tuple compare: compare *any* two tuples, using
2832
 * ms->tuple_elem_compare to compare the first elements, which is set
2833
 * using the same pre-sort check as we use for ms->key_compare,
2834
 * but run on the list [x[0] for x in L]. This allows us to optimize compares
2835
 * on two levels (as long as [x[0] for x in L] is type-homogeneous.) The idea is
2836
 * that most tuple compares don't involve x[1:]. */
2837
static int
2838
unsafe_tuple_compare(PyObject *v, PyObject *w, MergeState *ms)
2839
1.26k
{
2840
1.26k
    PyTupleObject *vt, *wt;
2841
1.26k
    Py_ssize_t i, vlen, wlen;
2842
1.26k
    int k;
2843
2844
    /* Modified from Objects/tupleobject.c:tuplerichcompare, assuming: */
2845
1.26k
    assert(Py_IS_TYPE(v, &PyTuple_Type));
2846
1.26k
    assert(Py_IS_TYPE(w, &PyTuple_Type));
2847
1.26k
    assert(Py_SIZE(v) > 0);
2848
1.26k
    assert(Py_SIZE(w) > 0);
2849
2850
1.26k
    vt = (PyTupleObject *)v;
2851
1.26k
    wt = (PyTupleObject *)w;
2852
2853
1.26k
    vlen = Py_SIZE(vt);
2854
1.26k
    wlen = Py_SIZE(wt);
2855
2856
1.27k
    for (i = 0; i < vlen && i < wlen; i++) {
2857
1.27k
        k = PyObject_RichCompareBool(vt->ob_item[i], wt->ob_item[i], Py_EQ);
2858
1.27k
        if (k < 0)
2859
0
            return -1;
2860
1.27k
        if (!k)
2861
1.26k
            break;
2862
1.27k
    }
2863
2864
1.26k
    if (i >= vlen || i >= wlen)
2865
0
        return vlen < wlen;
2866
2867
1.26k
    if (i == 0)
2868
1.25k
        return ms->tuple_elem_compare(vt->ob_item[i], wt->ob_item[i], ms);
2869
12
    else
2870
12
        return PyObject_RichCompareBool(vt->ob_item[i], wt->ob_item[i], Py_LT);
2871
1.26k
}
2872
2873
/* An adaptive, stable, natural mergesort.  See listsort.txt.
2874
 * Returns Py_None on success, NULL on error.  Even in case of error, the
2875
 * list will be some permutation of its input state (nothing is lost or
2876
 * duplicated).
2877
 */
2878
/*[clinic input]
2879
@permit_long_docstring_body
2880
@critical_section
2881
list.sort
2882
2883
    *
2884
    key as keyfunc: object = None
2885
    reverse: bool = False
2886
2887
Sort the list in ascending order and return None.
2888
2889
The sort is in-place (i.e. the list itself is modified) and stable (i.e. the
2890
order of two equal elements is maintained).
2891
2892
If a key function is given, apply it once to each list item and sort them,
2893
ascending or descending, according to their function values.
2894
2895
The reverse flag can be set to sort in descending order.
2896
[clinic start generated code]*/
2897
2898
static PyObject *
2899
list_sort_impl(PyListObject *self, PyObject *keyfunc, int reverse)
2900
/*[clinic end generated code: output=57b9f9c5e23fbe42 input=e4f6b6069181ad7d]*/
2901
769k
{
2902
769k
    MergeState ms;
2903
769k
    Py_ssize_t nremaining;
2904
769k
    Py_ssize_t minrun;
2905
769k
    sortslice lo;
2906
769k
    Py_ssize_t saved_ob_size, saved_allocated;
2907
769k
    PyObject **saved_ob_item;
2908
769k
    PyObject **final_ob_item;
2909
769k
    PyObject *result = NULL;            /* guilty until proved innocent */
2910
769k
    Py_ssize_t i;
2911
769k
    PyObject **keys;
2912
2913
769k
    assert(self != NULL);
2914
769k
    assert(PyList_Check(self));
2915
769k
    if (keyfunc == Py_None)
2916
201k
        keyfunc = NULL;
2917
2918
    /* The list is temporarily made empty, so that mutations performed
2919
     * by comparison functions can't affect the slice of memory we're
2920
     * sorting (allowing mutations during sorting is a core-dump
2921
     * factory, since ob_item may change).
2922
     */
2923
769k
    saved_ob_size = Py_SIZE(self);
2924
769k
    saved_ob_item = self->ob_item;
2925
769k
    saved_allocated = self->allocated;
2926
769k
    Py_SET_SIZE(self, 0);
2927
769k
    FT_ATOMIC_STORE_PTR_RELEASE(self->ob_item, NULL);
2928
769k
    self->allocated = -1; /* any operation will reset it to >= 0 */
2929
2930
769k
    if (keyfunc == NULL) {
2931
217k
        keys = NULL;
2932
217k
        lo.keys = saved_ob_item;
2933
217k
        lo.values = NULL;
2934
217k
    }
2935
551k
    else {
2936
551k
        if (saved_ob_size < MERGESTATE_TEMP_SIZE/2)
2937
            /* Leverage stack space we allocated but won't otherwise use */
2938
547k
            keys = &ms.temparray[saved_ob_size+1];
2939
4.08k
        else {
2940
4.08k
            keys = PyMem_Malloc(sizeof(PyObject *) * saved_ob_size);
2941
4.08k
            if (keys == NULL) {
2942
0
                PyErr_NoMemory();
2943
0
                goto keyfunc_fail;
2944
0
            }
2945
4.08k
        }
2946
2947
5.46M
        for (i = 0; i < saved_ob_size ; i++) {
2948
4.91M
            keys[i] = PyObject_CallOneArg(keyfunc, saved_ob_item[i]);
2949
4.91M
            if (keys[i] == NULL) {
2950
0
                for (i=i-1 ; i>=0 ; i--)
2951
0
                    Py_DECREF(keys[i]);
2952
0
                if (saved_ob_size >= MERGESTATE_TEMP_SIZE/2)
2953
0
                    PyMem_Free(keys);
2954
0
                goto keyfunc_fail;
2955
0
            }
2956
4.91M
        }
2957
2958
551k
        lo.keys = keys;
2959
551k
        lo.values = saved_ob_item;
2960
551k
    }
2961
2962
2963
    /* The pre-sort check: here's where we decide which compare function to use.
2964
     * How much optimization is safe? We test for homogeneity with respect to
2965
     * several properties that are expensive to check at compare-time, and
2966
     * set ms appropriately. */
2967
769k
    if (saved_ob_size > 1) {
2968
        /* Assume the first element is representative of the whole list. */
2969
198k
        int keys_are_in_tuples = (Py_IS_TYPE(lo.keys[0], &PyTuple_Type) &&
2970
198k
                                  Py_SIZE(lo.keys[0]) > 0);
2971
2972
198k
        PyTypeObject* key_type = (keys_are_in_tuples ?
2973
65
                                  Py_TYPE(PyTuple_GET_ITEM(lo.keys[0], 0)) :
2974
198k
                                  Py_TYPE(lo.keys[0]));
2975
2976
198k
        int keys_are_all_same_type = 1;
2977
198k
        int strings_are_latin = 1;
2978
198k
        int ints_are_bounded = 1;
2979
2980
        /* Prove that assumption by checking every key. */
2981
5.84M
        for (i=0; i < saved_ob_size; i++) {
2982
2983
5.64M
            if (keys_are_in_tuples &&
2984
5.64M
                !(Py_IS_TYPE(lo.keys[i], &PyTuple_Type) && Py_SIZE(lo.keys[i]) != 0)) {
2985
0
                keys_are_in_tuples = 0;
2986
0
                keys_are_all_same_type = 0;
2987
0
                break;
2988
0
            }
2989
2990
            /* Note: for lists of tuples, key is the first element of the tuple
2991
             * lo.keys[i], not lo.keys[i] itself! We verify type-homogeneity
2992
             * for lists of tuples in the if-statement directly above. */
2993
5.64M
            PyObject *key = (keys_are_in_tuples ?
2994
595
                             PyTuple_GET_ITEM(lo.keys[i], 0) :
2995
5.64M
                             lo.keys[i]);
2996
2997
5.64M
            if (!Py_IS_TYPE(key, key_type)) {
2998
0
                keys_are_all_same_type = 0;
2999
                /* If keys are in tuple we must loop over the whole list to make
3000
                   sure all items are tuples */
3001
0
                if (!keys_are_in_tuples) {
3002
0
                    break;
3003
0
                }
3004
0
            }
3005
3006
5.64M
            if (keys_are_all_same_type) {
3007
5.64M
                if (key_type == &PyLong_Type &&
3008
5.64M
                    ints_are_bounded &&
3009
5.64M
                    !_PyLong_IsCompact((PyLongObject *)key)) {
3010
3011
5.14k
                    ints_are_bounded = 0;
3012
5.14k
                }
3013
5.63M
                else if (key_type == &PyUnicode_Type &&
3014
5.63M
                         strings_are_latin &&
3015
5.63M
                         PyUnicode_KIND(key) != PyUnicode_1BYTE_KIND) {
3016
3017
6.56k
                        strings_are_latin = 0;
3018
6.56k
                    }
3019
5.64M
                }
3020
5.64M
            }
3021
3022
        /* Choose the best compare, given what we now know about the keys. */
3023
198k
        if (keys_are_all_same_type) {
3024
3025
198k
            if (key_type == &PyUnicode_Type && strings_are_latin) {
3026
12.5k
                ms.key_compare = unsafe_latin_compare;
3027
12.5k
            }
3028
185k
            else if (key_type == &PyLong_Type && ints_are_bounded) {
3029
84.2k
                ms.key_compare = unsafe_long_compare;
3030
84.2k
            }
3031
101k
            else if (key_type == &PyFloat_Type) {
3032
0
                ms.key_compare = unsafe_float_compare;
3033
0
            }
3034
101k
            else if ((ms.key_richcompare = key_type->tp_richcompare) != NULL) {
3035
101k
                ms.key_compare = unsafe_object_compare;
3036
101k
            }
3037
0
            else {
3038
0
                ms.key_compare = safe_object_compare;
3039
0
            }
3040
198k
        }
3041
0
        else {
3042
0
            ms.key_compare = safe_object_compare;
3043
0
        }
3044
3045
198k
        if (keys_are_in_tuples) {
3046
            /* Make sure we're not dealing with tuples of tuples
3047
             * (remember: here, key_type refers list [key[0] for key in keys]) */
3048
65
            if (key_type == &PyTuple_Type) {
3049
0
                ms.tuple_elem_compare = safe_object_compare;
3050
0
            }
3051
65
            else {
3052
65
                ms.tuple_elem_compare = ms.key_compare;
3053
65
            }
3054
3055
65
            ms.key_compare = unsafe_tuple_compare;
3056
65
        }
3057
198k
    }
3058
    /* End of pre-sort check: ms is now set properly! */
3059
3060
769k
    merge_init(&ms, saved_ob_size, keys != NULL, &lo);
3061
3062
769k
    nremaining = saved_ob_size;
3063
769k
    if (nremaining < 2)
3064
570k
        goto succeed;
3065
3066
    /* Reverse sort stability achieved by initially reversing the list,
3067
    applying a stable forward sort, then reversing the final result. */
3068
198k
    if (reverse) {
3069
2
        if (keys != NULL)
3070
0
            reverse_slice(&keys[0], &keys[saved_ob_size]);
3071
2
        reverse_slice(&saved_ob_item[0], &saved_ob_item[saved_ob_size]);
3072
2
    }
3073
3074
    /* March over the array once, left to right, finding natural runs,
3075
     * and extending short natural runs to minrun elements.
3076
     */
3077
273k
    do {
3078
273k
        Py_ssize_t n;
3079
3080
        /* Identify next run. */
3081
273k
        n = count_run(&ms, &lo, nremaining);
3082
273k
        if (n < 0)
3083
0
            goto fail;
3084
        /* If short, extend to min(minrun, nremaining). */
3085
273k
        minrun = minrun_next(&ms);
3086
273k
        if (n < minrun) {
3087
124k
            const Py_ssize_t force = nremaining <= minrun ?
3088
75.6k
                              nremaining : minrun;
3089
124k
            if (binarysort(&ms, &lo, force, n) < 0)
3090
0
                goto fail;
3091
124k
            n = force;
3092
124k
        }
3093
        /* Maybe merge pending runs. */
3094
273k
        assert(ms.n == 0 || ms.pending[ms.n -1].base.keys +
3095
273k
                            ms.pending[ms.n-1].len == lo.keys);
3096
273k
        if (found_new_run(&ms, n) < 0)
3097
0
            goto fail;
3098
        /* Push new run on stack. */
3099
273k
        assert(ms.n < MAX_MERGE_PENDING);
3100
273k
        ms.pending[ms.n].base = lo;
3101
273k
        ms.pending[ms.n].len = n;
3102
273k
        ++ms.n;
3103
        /* Advance to find next run. */
3104
273k
        sortslice_advance(&lo, n);
3105
273k
        nremaining -= n;
3106
273k
    } while (nremaining);
3107
3108
198k
    if (merge_force_collapse(&ms) < 0)
3109
0
        goto fail;
3110
198k
    assert(ms.n == 1);
3111
198k
    assert(keys == NULL
3112
198k
           ? ms.pending[0].base.keys == saved_ob_item
3113
198k
           : ms.pending[0].base.keys == &keys[0]);
3114
198k
    assert(ms.pending[0].len == saved_ob_size);
3115
198k
    lo = ms.pending[0].base;
3116
3117
769k
succeed:
3118
769k
    result = Py_None;
3119
769k
fail:
3120
769k
    if (keys != NULL) {
3121
5.46M
        for (i = 0; i < saved_ob_size; i++)
3122
4.91M
            Py_DECREF(keys[i]);
3123
551k
        if (saved_ob_size >= MERGESTATE_TEMP_SIZE/2)
3124
4.08k
            PyMem_Free(keys);
3125
551k
    }
3126
3127
769k
    if (self->allocated != -1 && result != NULL) {
3128
        /* The user mucked with the list during the sort,
3129
         * and we don't already have another error to report.
3130
         */
3131
0
        PyErr_SetString(PyExc_ValueError, "list modified during sort");
3132
0
        result = NULL;
3133
0
    }
3134
3135
769k
    if (reverse && saved_ob_size > 1)
3136
2
        reverse_slice(saved_ob_item, saved_ob_item + saved_ob_size);
3137
3138
769k
    merge_freemem(&ms);
3139
3140
769k
keyfunc_fail:
3141
769k
    final_ob_item = self->ob_item;
3142
769k
    i = Py_SIZE(self);
3143
769k
    Py_SET_SIZE(self, saved_ob_size);
3144
769k
    FT_ATOMIC_STORE_PTR_RELEASE(self->ob_item, saved_ob_item);
3145
769k
    FT_ATOMIC_STORE_SSIZE_RELAXED(self->allocated, saved_allocated);
3146
769k
    if (final_ob_item != NULL) {
3147
        /* we cannot use list_clear() for this because it does not
3148
           guarantee that the list is really empty when it returns */
3149
0
        while (--i >= 0) {
3150
0
            Py_XDECREF(final_ob_item[i]);
3151
0
        }
3152
#ifdef Py_GIL_DISABLED
3153
        ensure_shared_on_resize(self);
3154
        bool use_qsbr = _PyObject_GC_IS_SHARED(self);
3155
#else
3156
0
        bool use_qsbr = false;
3157
0
#endif
3158
0
        free_list_items(final_ob_item, use_qsbr);
3159
0
    }
3160
769k
    return Py_XNewRef(result);
3161
769k
}
3162
#undef IFLT
3163
#undef ISLT
3164
3165
int
3166
PyList_Sort(PyObject *v)
3167
15.4k
{
3168
15.4k
    if (v == NULL || !PyList_Check(v)) {
3169
0
        PyErr_BadInternalCall();
3170
0
        return -1;
3171
0
    }
3172
15.4k
    Py_BEGIN_CRITICAL_SECTION(v);
3173
15.4k
    v = list_sort_impl((PyListObject *)v, NULL, 0);
3174
15.4k
    Py_END_CRITICAL_SECTION();
3175
15.4k
    if (v == NULL)
3176
0
        return -1;
3177
15.4k
    Py_DECREF(v);
3178
15.4k
    return 0;
3179
15.4k
}
3180
3181
/*[clinic input]
3182
@critical_section
3183
list.reverse
3184
3185
Reverse *IN PLACE*.
3186
[clinic start generated code]*/
3187
3188
static PyObject *
3189
list_reverse_impl(PyListObject *self)
3190
/*[clinic end generated code: output=482544fc451abea9 input=04ac8e0c6a66e4d9]*/
3191
0
{
3192
0
    if (Py_SIZE(self) > 1)
3193
0
        reverse_slice(self->ob_item, self->ob_item + Py_SIZE(self));
3194
0
    Py_RETURN_NONE;
3195
0
}
3196
3197
int
3198
PyList_Reverse(PyObject *v)
3199
50
{
3200
50
    PyListObject *self = (PyListObject *)v;
3201
3202
50
    if (v == NULL || !PyList_Check(v)) {
3203
0
        PyErr_BadInternalCall();
3204
0
        return -1;
3205
0
    }
3206
50
    Py_BEGIN_CRITICAL_SECTION(self);
3207
50
    if (Py_SIZE(self) > 1) {
3208
50
        reverse_slice(self->ob_item, self->ob_item + Py_SIZE(self));
3209
50
    }
3210
50
    Py_END_CRITICAL_SECTION()
3211
50
    return 0;
3212
50
}
3213
3214
PyObject *
3215
PyList_AsTuple(PyObject *v)
3216
265k
{
3217
265k
    if (v == NULL || !PyList_Check(v)) {
3218
0
        PyErr_BadInternalCall();
3219
0
        return NULL;
3220
0
    }
3221
265k
    PyObject *ret;
3222
265k
    PyListObject *self = (PyListObject *)v;
3223
265k
    Py_BEGIN_CRITICAL_SECTION(self);
3224
265k
    ret = _PyTuple_FromArray(self->ob_item, Py_SIZE(v));
3225
265k
    Py_END_CRITICAL_SECTION();
3226
265k
    return ret;
3227
265k
}
3228
3229
PyObject *
3230
_PyList_AsTupleAndClear(PyListObject *self)
3231
24
{
3232
24
    assert(self != NULL);
3233
24
    PyObject *ret;
3234
24
    if (self->ob_item == NULL) {
3235
0
        return PyTuple_New(0);
3236
0
    }
3237
24
    Py_BEGIN_CRITICAL_SECTION(self);
3238
24
    PyObject **items = self->ob_item;
3239
24
    Py_ssize_t size = Py_SIZE(self);
3240
24
    self->ob_item = NULL;
3241
24
    Py_SET_SIZE(self, 0);
3242
24
    ret = _PyTuple_FromArraySteal(items, size);
3243
24
    free_list_items(items, false);
3244
24
    Py_END_CRITICAL_SECTION();
3245
24
    return ret;
3246
24
}
3247
3248
PyObject *
3249
_PyList_FromStackRefStealOnSuccess(const _PyStackRef *src, Py_ssize_t n)
3250
160M
{
3251
160M
    if (n == 0) {
3252
144M
        return PyList_New(0);
3253
144M
    }
3254
3255
15.3M
    PyListObject *list = (PyListObject *)PyList_New(n);
3256
15.3M
    if (list == NULL) {
3257
0
        return NULL;
3258
0
    }
3259
3260
15.3M
    PyObject **dst = list->ob_item;
3261
42.9M
    for (Py_ssize_t i = 0; i < n; i++) {
3262
27.5M
        dst[i] = PyStackRef_AsPyObjectSteal(src[i]);
3263
27.5M
    }
3264
3265
15.3M
    return (PyObject *)list;
3266
15.3M
}
3267
3268
/*[clinic input]
3269
list.index
3270
3271
    value: object
3272
    start: slice_index(accept={int}) = 0
3273
    stop: slice_index(accept={int}, c_default="PY_SSIZE_T_MAX") = sys.maxsize
3274
    /
3275
3276
Return first index of value.
3277
3278
Raises ValueError if the value is not present.
3279
[clinic start generated code]*/
3280
3281
static PyObject *
3282
list_index_impl(PyListObject *self, PyObject *value, Py_ssize_t start,
3283
                Py_ssize_t stop)
3284
/*[clinic end generated code: output=ec51b88787e4e481 input=40ec5826303a0eb1]*/
3285
0
{
3286
0
    if (start < 0) {
3287
0
        start += Py_SIZE(self);
3288
0
        if (start < 0)
3289
0
            start = 0;
3290
0
    }
3291
0
    if (stop < 0) {
3292
0
        stop += Py_SIZE(self);
3293
0
        if (stop < 0)
3294
0
            stop = 0;
3295
0
    }
3296
0
    for (Py_ssize_t i = start; i < stop; i++) {
3297
0
        PyObject *obj = list_get_item_ref(self, i);
3298
0
        if (obj == NULL) {
3299
            // out-of-bounds
3300
0
            break;
3301
0
        }
3302
0
        int cmp = PyObject_RichCompareBool(obj, value, Py_EQ);
3303
0
        Py_DECREF(obj);
3304
0
        if (cmp > 0)
3305
0
            return PyLong_FromSsize_t(i);
3306
0
        else if (cmp < 0)
3307
0
            return NULL;
3308
0
    }
3309
0
    PyErr_SetString(PyExc_ValueError, "list.index(x): x not in list");
3310
0
    return NULL;
3311
0
}
3312
3313
/*[clinic input]
3314
list.count
3315
3316
     value: object
3317
     /
3318
3319
Return number of occurrences of value.
3320
[clinic start generated code]*/
3321
3322
static PyObject *
3323
list_count_impl(PyListObject *self, PyObject *value)
3324
/*[clinic end generated code: output=eff66f14aef2df86 input=3bdc3a5e6f749565]*/
3325
0
{
3326
0
    Py_ssize_t count = 0;
3327
0
    for (Py_ssize_t i = 0; ; i++) {
3328
0
        PyObject *obj = list_get_item_ref(self, i);
3329
0
        if (obj == NULL) {
3330
            // out-of-bounds
3331
0
            break;
3332
0
        }
3333
0
        if (obj == value) {
3334
0
           count++;
3335
0
           Py_DECREF(obj);
3336
0
           continue;
3337
0
        }
3338
0
        int cmp = PyObject_RichCompareBool(obj, value, Py_EQ);
3339
0
        Py_DECREF(obj);
3340
0
        if (cmp > 0)
3341
0
            count++;
3342
0
        else if (cmp < 0)
3343
0
            return NULL;
3344
0
    }
3345
0
    return PyLong_FromSsize_t(count);
3346
0
}
3347
3348
/*[clinic input]
3349
@critical_section
3350
list.remove
3351
3352
     value: object
3353
     /
3354
3355
Remove first occurrence of value.
3356
3357
Raises ValueError if the value is not present.
3358
[clinic start generated code]*/
3359
3360
static PyObject *
3361
list_remove_impl(PyListObject *self, PyObject *value)
3362
/*[clinic end generated code: output=b9b76a6633b18778 input=26c813dbb95aa93b]*/
3363
2.73k
{
3364
2.73k
    Py_ssize_t i;
3365
3366
2.74k
    for (i = 0; i < Py_SIZE(self); i++) {
3367
2.74k
        PyObject *obj = self->ob_item[i];
3368
2.74k
        Py_INCREF(obj);
3369
2.74k
        int cmp = PyObject_RichCompareBool(obj, value, Py_EQ);
3370
2.74k
        Py_DECREF(obj);
3371
2.74k
        if (cmp > 0) {
3372
2.73k
            if (list_ass_slice_lock_held(self, i, i+1, NULL) == 0)
3373
2.73k
                Py_RETURN_NONE;
3374
0
            return NULL;
3375
2.73k
        }
3376
10
        else if (cmp < 0)
3377
0
            return NULL;
3378
2.74k
    }
3379
2
    PyErr_SetString(PyExc_ValueError, "list.remove(x): x not in list");
3380
2
    return NULL;
3381
2.73k
}
3382
3383
static int
3384
list_traverse(PyObject *self, visitproc visit, void *arg)
3385
53.4M
{
3386
53.4M
    PyListObject *o = (PyListObject *)self;
3387
53.4M
    Py_ssize_t i;
3388
3389
782M
    for (i = Py_SIZE(o); --i >= 0; )
3390
729M
        Py_VISIT(o->ob_item[i]);
3391
53.4M
    return 0;
3392
53.4M
}
3393
3394
static PyObject *
3395
list_richcompare_impl(PyObject *v, PyObject *w, int op)
3396
4.02k
{
3397
4.02k
    PyListObject *vl, *wl;
3398
4.02k
    Py_ssize_t i;
3399
3400
4.02k
    if (!PyList_Check(v) || !PyList_Check(w))
3401
758
        Py_RETURN_NOTIMPLEMENTED;
3402
3403
3.27k
    vl = (PyListObject *)v;
3404
3.27k
    wl = (PyListObject *)w;
3405
3406
3.27k
    if (Py_SIZE(vl) != Py_SIZE(wl) && (op == Py_EQ || op == Py_NE)) {
3407
        /* Shortcut: if the lengths differ, the lists differ */
3408
476
        if (op == Py_EQ)
3409
476
            Py_RETURN_FALSE;
3410
0
        else
3411
0
            Py_RETURN_TRUE;
3412
476
    }
3413
3414
    /* Search for the first index where items are different */
3415
3.00k
    for (i = 0; i < Py_SIZE(vl) && i < Py_SIZE(wl); i++) {
3416
412
        PyObject *vitem = vl->ob_item[i];
3417
412
        PyObject *witem = wl->ob_item[i];
3418
412
        if (vitem == witem) {
3419
158
            continue;
3420
158
        }
3421
3422
254
        Py_INCREF(vitem);
3423
254
        Py_INCREF(witem);
3424
254
        int k = PyObject_RichCompareBool(vitem, witem, Py_EQ);
3425
254
        Py_DECREF(vitem);
3426
254
        Py_DECREF(witem);
3427
254
        if (k < 0)
3428
0
            return NULL;
3429
254
        if (!k)
3430
206
            break;
3431
254
    }
3432
3433
2.79k
    if (i >= Py_SIZE(vl) || i >= Py_SIZE(wl)) {
3434
        /* No more items to compare -- compare sizes */
3435
2.58k
        Py_RETURN_RICHCOMPARE(Py_SIZE(vl), Py_SIZE(wl), op);
3436
2.58k
    }
3437
3438
    /* We have an item that differs -- shortcuts for EQ/NE */
3439
206
    if (op == Py_EQ) {
3440
194
        Py_RETURN_FALSE;
3441
194
    }
3442
12
    if (op == Py_NE) {
3443
12
        Py_RETURN_TRUE;
3444
12
    }
3445
3446
    /* Compare the final item again using the proper operator */
3447
0
    PyObject *vitem = vl->ob_item[i];
3448
0
    PyObject *witem = wl->ob_item[i];
3449
0
    Py_INCREF(vitem);
3450
0
    Py_INCREF(witem);
3451
0
    PyObject *result = PyObject_RichCompare(vl->ob_item[i], wl->ob_item[i], op);
3452
0
    Py_DECREF(vitem);
3453
0
    Py_DECREF(witem);
3454
0
    return result;
3455
12
}
3456
3457
static PyObject *
3458
list_richcompare(PyObject *v, PyObject *w, int op)
3459
4.02k
{
3460
4.02k
    PyObject *ret;
3461
4.02k
    Py_BEGIN_CRITICAL_SECTION2(v, w);
3462
4.02k
    ret = list_richcompare_impl(v, w, op);
3463
4.02k
    Py_END_CRITICAL_SECTION2()
3464
4.02k
    return ret;
3465
4.02k
}
3466
3467
/*[clinic input]
3468
list.__init__
3469
3470
    iterable: object(c_default="NULL") = ()
3471
    /
3472
3473
Built-in mutable sequence.
3474
3475
If no argument is given, the constructor creates a new empty list.
3476
The argument must be an iterable if specified.
3477
[clinic start generated code]*/
3478
3479
static int
3480
list___init___impl(PyListObject *self, PyObject *iterable)
3481
/*[clinic end generated code: output=0f3c21379d01de48 input=b3f3fe7206af8f6b]*/
3482
19.3M
{
3483
    /* Verify list invariants established by PyType_GenericAlloc() */
3484
19.3M
    assert(0 <= Py_SIZE(self));
3485
19.3M
    assert(Py_SIZE(self) <= self->allocated || self->allocated == -1);
3486
19.3M
    assert(self->ob_item != NULL ||
3487
19.3M
           self->allocated == 0 || self->allocated == -1);
3488
3489
    /* Empty previous contents */
3490
19.3M
    if (self->ob_item != NULL) {
3491
0
        Py_BEGIN_CRITICAL_SECTION(self);
3492
0
        list_clear(self);
3493
0
        Py_END_CRITICAL_SECTION();
3494
0
    }
3495
19.3M
    if (iterable != NULL) {
3496
8.94M
        if (_list_extend(self, iterable) < 0) {
3497
0
            return -1;
3498
0
        }
3499
8.94M
    }
3500
19.3M
    return 0;
3501
19.3M
}
3502
3503
static PyObject *
3504
list_vectorcall(PyObject *type, PyObject * const*args,
3505
                size_t nargsf, PyObject *kwnames)
3506
8.94M
{
3507
8.94M
    if (!_PyArg_NoKwnames("list", kwnames)) {
3508
0
        return NULL;
3509
0
    }
3510
8.94M
    Py_ssize_t nargs = PyVectorcall_NARGS(nargsf);
3511
8.94M
    if (!_PyArg_CheckPositional("list", nargs, 0, 1)) {
3512
0
        return NULL;
3513
0
    }
3514
3515
8.94M
    PyObject *list = PyType_GenericAlloc(_PyType_CAST(type), 0);
3516
8.94M
    if (list == NULL) {
3517
0
        return NULL;
3518
0
    }
3519
8.94M
    if (nargs) {
3520
8.94M
        if (list___init___impl((PyListObject *)list, args[0])) {
3521
0
            Py_DECREF(list);
3522
0
            return NULL;
3523
0
        }
3524
8.94M
    }
3525
8.94M
    return list;
3526
8.94M
}
3527
3528
3529
/*[clinic input]
3530
list.__sizeof__
3531
3532
Return the size of the list in memory, in bytes.
3533
[clinic start generated code]*/
3534
3535
static PyObject *
3536
list___sizeof___impl(PyListObject *self)
3537
/*[clinic end generated code: output=3417541f95f9a53e input=b8030a5d5ce8a187]*/
3538
0
{
3539
0
    size_t res = _PyObject_SIZE(Py_TYPE(self));
3540
0
    Py_ssize_t allocated = FT_ATOMIC_LOAD_SSIZE_RELAXED(self->allocated);
3541
0
    res += (size_t)allocated * sizeof(void*);
3542
0
    return PyLong_FromSize_t(res);
3543
0
}
3544
3545
static PyObject *list_iter(PyObject *seq);
3546
static PyObject *list_subscript(PyObject*, PyObject*);
3547
3548
static PyMethodDef list_methods[] = {
3549
    {"__getitem__", list_subscript, METH_O|METH_COEXIST,
3550
     PyDoc_STR("__getitem__($self, index, /)\n--\n\nReturn self[index].")},
3551
    LIST___REVERSED___METHODDEF
3552
    LIST___SIZEOF___METHODDEF
3553
    PY_LIST_CLEAR_METHODDEF
3554
    LIST_COPY_METHODDEF
3555
    LIST_APPEND_METHODDEF
3556
    LIST_INSERT_METHODDEF
3557
    LIST_EXTEND_METHODDEF
3558
    LIST_POP_METHODDEF
3559
    LIST_REMOVE_METHODDEF
3560
    LIST_INDEX_METHODDEF
3561
    LIST_COUNT_METHODDEF
3562
    LIST_REVERSE_METHODDEF
3563
    LIST_SORT_METHODDEF
3564
    {"__class_getitem__", Py_GenericAlias, METH_O|METH_CLASS, PyDoc_STR("See PEP 585")},
3565
    {NULL,              NULL}           /* sentinel */
3566
};
3567
3568
static PySequenceMethods list_as_sequence = {
3569
    list_length,                                /* sq_length */
3570
    list_concat,                                /* sq_concat */
3571
    list_repeat,                                /* sq_repeat */
3572
    list_item,                                  /* sq_item */
3573
    0,                                          /* sq_slice */
3574
    list_ass_item,                              /* sq_ass_item */
3575
    0,                                          /* sq_ass_slice */
3576
    list_contains,                              /* sq_contains */
3577
    list_inplace_concat,                        /* sq_inplace_concat */
3578
    list_inplace_repeat,                        /* sq_inplace_repeat */
3579
};
3580
3581
static inline PyObject *
3582
list_slice_step_lock_held(PyListObject *a, Py_ssize_t start, Py_ssize_t step, Py_ssize_t len)
3583
48
{
3584
48
    PyListObject *np = (PyListObject *)list_new_prealloc(len);
3585
48
    if (np == NULL) {
3586
0
        return NULL;
3587
0
    }
3588
48
    size_t cur;
3589
48
    Py_ssize_t i;
3590
48
    PyObject **src = a->ob_item;
3591
48
    PyObject **dest = np->ob_item;
3592
480
    for (cur = start, i = 0; i < len;
3593
432
            cur += (size_t)step, i++) {
3594
432
        PyObject *v = src[cur];
3595
432
        dest[i] = Py_NewRef(v);
3596
432
    }
3597
48
    Py_SET_SIZE(np, len);
3598
48
    return (PyObject *)np;
3599
48
}
3600
3601
static PyObject *
3602
list_slice_wrap(PyListObject *aa, Py_ssize_t start, Py_ssize_t stop, Py_ssize_t step)
3603
2.33M
{
3604
2.33M
    PyObject *res = NULL;
3605
2.33M
    Py_BEGIN_CRITICAL_SECTION(aa);
3606
2.33M
    Py_ssize_t len = PySlice_AdjustIndices(Py_SIZE(aa), &start, &stop, step);
3607
2.33M
    if (len <= 0) {
3608
435k
        res = PyList_New(0);
3609
435k
    }
3610
1.90M
    else if (step == 1) {
3611
1.90M
        res = list_slice_lock_held(aa, start, stop);
3612
1.90M
    }
3613
48
    else {
3614
48
        res = list_slice_step_lock_held(aa, start, step, len);
3615
48
    }
3616
2.33M
    Py_END_CRITICAL_SECTION();
3617
2.33M
    return res;
3618
2.33M
}
3619
3620
static inline PyObject*
3621
list_slice_subscript(PyObject* self, PyObject* item)
3622
2.33M
{
3623
2.33M
    assert(PyList_Check(self));
3624
2.33M
    assert(PySlice_Check(item));
3625
2.33M
    Py_ssize_t start, stop, step;
3626
2.33M
    if (PySlice_Unpack(item, &start, &stop, &step) < 0) {
3627
0
        return NULL;
3628
0
    }
3629
2.33M
    return list_slice_wrap((PyListObject *)self, start, stop, step);
3630
2.33M
}
3631
3632
PyObject *
3633
_PyList_SliceSubscript(PyObject* _self, PyObject* item)
3634
2.19M
{
3635
2.19M
    return list_slice_subscript(_self, item);
3636
2.19M
}
3637
3638
static PyObject *
3639
list_subscript(PyObject* _self, PyObject* item)
3640
15.0M
{
3641
15.0M
    PyListObject* self = (PyListObject*)_self;
3642
15.0M
    if (_PyIndex_Check(item)) {
3643
14.8M
        Py_ssize_t i;
3644
14.8M
        i = PyNumber_AsSsize_t(item, PyExc_IndexError);
3645
14.8M
        if (i == -1 && PyErr_Occurred())
3646
0
            return NULL;
3647
14.8M
        if (i < 0)
3648
11.2M
            i += PyList_GET_SIZE(self);
3649
14.8M
        return list_item((PyObject *)self, i);
3650
14.8M
    }
3651
144k
    else if (PySlice_Check(item)) {
3652
144k
        return list_slice_subscript(_self, item);
3653
144k
    }
3654
0
    else {
3655
0
        PyErr_Format(PyExc_TypeError,
3656
0
                     "list indices must be integers or slices, not %.200s",
3657
0
                     Py_TYPE(item)->tp_name);
3658
0
        return NULL;
3659
0
    }
3660
15.0M
}
3661
3662
static Py_ssize_t
3663
adjust_slice_indexes(PyListObject *lst,
3664
                     Py_ssize_t *start, Py_ssize_t *stop,
3665
                     Py_ssize_t step)
3666
191k
{
3667
191k
    Py_ssize_t slicelength = PySlice_AdjustIndices(Py_SIZE(lst), start, stop,
3668
191k
                                                   step);
3669
3670
    /* Make sure s[5:2] = [..] inserts at the right place:
3671
        before 5, not before 2. */
3672
191k
    if ((step < 0 && *start < *stop) ||
3673
191k
        (step > 0 && *start > *stop))
3674
0
        *stop = *start;
3675
3676
191k
    return slicelength;
3677
191k
}
3678
3679
static int
3680
list_ass_subscript_lock_held(PyObject *_self, PyObject *item, PyObject *value)
3681
194k
{
3682
194k
    _Py_CRITICAL_SECTION_ASSERT_OBJECT_LOCKED(_self);
3683
3684
194k
    PyListObject *self = (PyListObject *)_self;
3685
194k
    if (_PyIndex_Check(item)) {
3686
2.94k
        Py_ssize_t i = PyNumber_AsSsize_t(item, PyExc_IndexError);
3687
2.94k
        if (i == -1 && PyErr_Occurred())
3688
0
            return -1;
3689
2.94k
        if (i < 0)
3690
2.79k
            i += PyList_GET_SIZE(self);
3691
2.94k
        return list_ass_item_lock_held(self, i, value);
3692
2.94k
    }
3693
191k
    else if (PySlice_Check(item)) {
3694
191k
        Py_ssize_t start, stop, step;
3695
3696
191k
        if (PySlice_Unpack(item, &start, &stop, &step) < 0) {
3697
0
            return -1;
3698
0
        }
3699
3700
191k
        if (value == NULL) {
3701
            /* delete slice */
3702
12
            PyObject **garbage;
3703
12
            size_t cur;
3704
12
            Py_ssize_t i;
3705
12
            int res;
3706
3707
12
            Py_ssize_t slicelength = adjust_slice_indexes(self, &start, &stop,
3708
12
                                                          step);
3709
3710
12
            if (step == 1)
3711
12
                return list_ass_slice_lock_held(self, start, stop, value);
3712
3713
0
            if (slicelength <= 0)
3714
0
                return 0;
3715
3716
0
            if (step < 0) {
3717
0
                stop = start + 1;
3718
0
                start = stop + step*(slicelength - 1) - 1;
3719
0
                step = -step;
3720
0
            }
3721
3722
0
            garbage = (PyObject**)
3723
0
                PyMem_Malloc(slicelength*sizeof(PyObject*));
3724
0
            if (!garbage) {
3725
0
                PyErr_NoMemory();
3726
0
                return -1;
3727
0
            }
3728
3729
            /* drawing pictures might help understand these for
3730
               loops. Basically, we memmove the parts of the
3731
               list that are *not* part of the slice: step-1
3732
               items for each item that is part of the slice,
3733
               and then tail end of the list that was not
3734
               covered by the slice */
3735
0
            for (cur = start, i = 0;
3736
0
                 cur < (size_t)stop;
3737
0
                 cur += step, i++) {
3738
0
                Py_ssize_t lim = step - 1;
3739
3740
0
                garbage[i] = PyList_GET_ITEM(self, cur);
3741
3742
0
                if (cur + step >= (size_t)Py_SIZE(self)) {
3743
0
                    lim = Py_SIZE(self) - cur - 1;
3744
0
                }
3745
3746
0
                memmove(self->ob_item + cur - i,
3747
0
                    self->ob_item + cur + 1,
3748
0
                    lim * sizeof(PyObject *));
3749
0
            }
3750
0
            cur = start + (size_t)slicelength * step;
3751
0
            if (cur < (size_t)Py_SIZE(self)) {
3752
0
                memmove(self->ob_item + cur - slicelength,
3753
0
                    self->ob_item + cur,
3754
0
                    (Py_SIZE(self) - cur) *
3755
0
                     sizeof(PyObject *));
3756
0
            }
3757
3758
0
            Py_SET_SIZE(self, Py_SIZE(self) - slicelength);
3759
0
            res = list_resize(self, Py_SIZE(self));
3760
3761
0
            for (i = 0; i < slicelength; i++) {
3762
0
                Py_DECREF(garbage[i]);
3763
0
            }
3764
0
            PyMem_Free(garbage);
3765
3766
0
            return res;
3767
0
        }
3768
191k
        else {
3769
            /* assign slice */
3770
191k
            PyObject *ins, *seq;
3771
191k
            PyObject **garbage, **seqitems, **selfitems;
3772
191k
            Py_ssize_t i;
3773
191k
            size_t cur;
3774
3775
            /* protect against a[::-1] = a */
3776
191k
            if (self == (PyListObject*)value) {
3777
0
                seq = list_slice_lock_held((PyListObject *)value, 0,
3778
0
                                            Py_SIZE(value));
3779
0
            }
3780
191k
            else {
3781
191k
                seq = PySequence_Fast(value,
3782
191k
                                      "must assign iterable "
3783
191k
                                      "to extended slice");
3784
191k
            }
3785
191k
            if (!seq)
3786
0
                return -1;
3787
3788
191k
            Py_ssize_t slicelength = adjust_slice_indexes(self, &start, &stop,
3789
191k
                                                          step);
3790
3791
191k
            if (step == 1) {
3792
191k
                int res = list_ass_slice_lock_held(self, start, stop, seq);
3793
191k
                Py_DECREF(seq);
3794
191k
                return res;
3795
191k
            }
3796
3797
0
            if (PySequence_Fast_GET_SIZE(seq) != slicelength) {
3798
0
                PyErr_Format(PyExc_ValueError,
3799
0
                    "attempt to assign sequence of "
3800
0
                    "size %zd to extended slice of "
3801
0
                    "size %zd",
3802
0
                         PySequence_Fast_GET_SIZE(seq),
3803
0
                         slicelength);
3804
0
                Py_DECREF(seq);
3805
0
                return -1;
3806
0
            }
3807
3808
0
            if (!slicelength) {
3809
0
                Py_DECREF(seq);
3810
0
                return 0;
3811
0
            }
3812
3813
0
            garbage = (PyObject**)
3814
0
                PyMem_Malloc(slicelength*sizeof(PyObject*));
3815
0
            if (!garbage) {
3816
0
                Py_DECREF(seq);
3817
0
                PyErr_NoMemory();
3818
0
                return -1;
3819
0
            }
3820
3821
0
            selfitems = self->ob_item;
3822
0
            seqitems = PySequence_Fast_ITEMS(seq);
3823
0
            for (cur = start, i = 0; i < slicelength;
3824
0
                 cur += (size_t)step, i++) {
3825
0
                garbage[i] = selfitems[cur];
3826
0
                ins = Py_NewRef(seqitems[i]);
3827
0
                selfitems[cur] = ins;
3828
0
            }
3829
3830
0
            for (i = 0; i < slicelength; i++) {
3831
0
                Py_DECREF(garbage[i]);
3832
0
            }
3833
3834
0
            PyMem_Free(garbage);
3835
0
            Py_DECREF(seq);
3836
3837
0
            return 0;
3838
0
        }
3839
191k
    }
3840
0
    else {
3841
0
        PyErr_Format(PyExc_TypeError,
3842
0
                     "list indices must be integers or slices, not %.200s",
3843
0
                     Py_TYPE(item)->tp_name);
3844
0
        return -1;
3845
0
    }
3846
194k
}
3847
3848
static int
3849
list_ass_subscript(PyObject *self, PyObject *item, PyObject *value)
3850
194k
{
3851
194k
    int res;
3852
#ifdef Py_GIL_DISABLED
3853
    if (PySlice_Check(item) && value != NULL && PyList_CheckExact(value)) {
3854
        Py_BEGIN_CRITICAL_SECTION2(self, value);
3855
        res = list_ass_subscript_lock_held(self, item, value);
3856
        Py_END_CRITICAL_SECTION2();
3857
        return res;
3858
    }
3859
#endif
3860
194k
    Py_BEGIN_CRITICAL_SECTION(self);
3861
194k
    res = list_ass_subscript_lock_held(self, item, value);
3862
194k
    Py_END_CRITICAL_SECTION();
3863
194k
    return res;
3864
194k
}
3865
3866
static PyMappingMethods list_as_mapping = {
3867
    list_length,
3868
    list_subscript,
3869
    list_ass_subscript
3870
};
3871
3872
PyTypeObject PyList_Type = {
3873
    PyVarObject_HEAD_INIT(&PyType_Type, 0)
3874
    "list",
3875
    sizeof(PyListObject),
3876
    0,
3877
    list_dealloc,                               /* tp_dealloc */
3878
    0,                                          /* tp_vectorcall_offset */
3879
    0,                                          /* tp_getattr */
3880
    0,                                          /* tp_setattr */
3881
    0,                                          /* tp_as_async */
3882
    list_repr,                                  /* tp_repr */
3883
    0,                                          /* tp_as_number */
3884
    &list_as_sequence,                          /* tp_as_sequence */
3885
    &list_as_mapping,                           /* tp_as_mapping */
3886
    PyObject_HashNotImplemented,                /* tp_hash */
3887
    0,                                          /* tp_call */
3888
    0,                                          /* tp_str */
3889
    PyObject_GenericGetAttr,                    /* tp_getattro */
3890
    0,                                          /* tp_setattro */
3891
    0,                                          /* tp_as_buffer */
3892
    Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC |
3893
        Py_TPFLAGS_BASETYPE | Py_TPFLAGS_LIST_SUBCLASS |
3894
        _Py_TPFLAGS_MATCH_SELF | Py_TPFLAGS_SEQUENCE,  /* tp_flags */
3895
    list___init____doc__,                       /* tp_doc */
3896
    list_traverse,                              /* tp_traverse */
3897
    list_clear_slot,                            /* tp_clear */
3898
    list_richcompare,                           /* tp_richcompare */
3899
    0,                                          /* tp_weaklistoffset */
3900
    list_iter,                                  /* tp_iter */
3901
    0,                                          /* tp_iternext */
3902
    list_methods,                               /* tp_methods */
3903
    0,                                          /* tp_members */
3904
    0,                                          /* tp_getset */
3905
    0,                                          /* tp_base */
3906
    0,                                          /* tp_dict */
3907
    0,                                          /* tp_descr_get */
3908
    0,                                          /* tp_descr_set */
3909
    0,                                          /* tp_dictoffset */
3910
    list___init__,                              /* tp_init */
3911
    PyType_GenericAlloc,                        /* tp_alloc */
3912
    PyType_GenericNew,                          /* tp_new */
3913
    PyObject_GC_Del,                            /* tp_free */
3914
    .tp_vectorcall = list_vectorcall,
3915
    .tp_version_tag = _Py_TYPE_VERSION_LIST,
3916
};
3917
3918
/*********************** List Iterator **************************/
3919
3920
static void listiter_dealloc(PyObject *);
3921
static int listiter_traverse(PyObject *, visitproc, void *);
3922
static PyObject *listiter_next(PyObject *);
3923
static PyObject *listiter_len(PyObject *, PyObject *);
3924
static PyObject *listiter_reduce_general(void *_it, int forward);
3925
static PyObject *listiter_reduce(PyObject *, PyObject *);
3926
static PyObject *listiter_setstate(PyObject *, PyObject *state);
3927
3928
PyDoc_STRVAR(length_hint_doc, "Private method returning an estimate of len(list(it)).");
3929
PyDoc_STRVAR(reduce_doc, "Return state information for pickling.");
3930
PyDoc_STRVAR(setstate_doc, "Set state information for unpickling.");
3931
3932
static PyMethodDef listiter_methods[] = {
3933
    {"__length_hint__", listiter_len, METH_NOARGS, length_hint_doc},
3934
    {"__reduce__", listiter_reduce, METH_NOARGS, reduce_doc},
3935
    {"__setstate__", listiter_setstate, METH_O, setstate_doc},
3936
    {NULL,              NULL}           /* sentinel */
3937
};
3938
3939
PyTypeObject PyListIter_Type = {
3940
    PyVarObject_HEAD_INIT(&PyType_Type, 0)
3941
    "list_iterator",                            /* tp_name */
3942
    sizeof(_PyListIterObject),                  /* tp_basicsize */
3943
    0,                                          /* tp_itemsize */
3944
    /* methods */
3945
    listiter_dealloc,               /* tp_dealloc */
3946
    0,                                          /* tp_vectorcall_offset */
3947
    0,                                          /* tp_getattr */
3948
    0,                                          /* tp_setattr */
3949
    0,                                          /* tp_as_async */
3950
    0,                                          /* tp_repr */
3951
    0,                                          /* tp_as_number */
3952
    0,                                          /* tp_as_sequence */
3953
    0,                                          /* tp_as_mapping */
3954
    0,                                          /* tp_hash */
3955
    0,                                          /* tp_call */
3956
    0,                                          /* tp_str */
3957
    PyObject_GenericGetAttr,                    /* tp_getattro */
3958
    0,                                          /* tp_setattro */
3959
    0,                                          /* tp_as_buffer */
3960
    Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC,/* tp_flags */
3961
    0,                                          /* tp_doc */
3962
    listiter_traverse,                          /* tp_traverse */
3963
    0,                                          /* tp_clear */
3964
    0,                                          /* tp_richcompare */
3965
    0,                                          /* tp_weaklistoffset */
3966
    PyObject_SelfIter,                          /* tp_iter */
3967
    listiter_next,                              /* tp_iternext */
3968
    listiter_methods,                           /* tp_methods */
3969
    0,                                          /* tp_members */
3970
};
3971
3972
3973
static PyObject *
3974
list_iter(PyObject *seq)
3975
30.9M
{
3976
30.9M
    if (!PyList_Check(seq)) {
3977
0
        PyErr_BadInternalCall();
3978
0
        return NULL;
3979
0
    }
3980
30.9M
    _PyListIterObject *it = _Py_FREELIST_POP(_PyListIterObject, list_iters);
3981
30.9M
    if (it == NULL) {
3982
1.64M
        it = PyObject_GC_New(_PyListIterObject, &PyListIter_Type);
3983
1.64M
        if (it == NULL) {
3984
0
            return NULL;
3985
0
        }
3986
1.64M
    }
3987
30.9M
    it->it_index = 0;
3988
30.9M
    it->it_seq = (PyListObject *)Py_NewRef(seq);
3989
30.9M
    _PyObject_GC_TRACK(it);
3990
30.9M
    return (PyObject *)it;
3991
30.9M
}
3992
3993
static void
3994
listiter_dealloc(PyObject *self)
3995
30.9M
{
3996
30.9M
    _PyListIterObject *it = (_PyListIterObject *)self;
3997
30.9M
    _PyObject_GC_UNTRACK(it);
3998
30.9M
    Py_XDECREF(it->it_seq);
3999
30.9M
    assert(Py_IS_TYPE(self, &PyListIter_Type));
4000
30.9M
    _Py_FREELIST_FREE(list_iters, it, PyObject_GC_Del);
4001
30.9M
}
4002
4003
static int
4004
listiter_traverse(PyObject *it, visitproc visit, void *arg)
4005
523k
{
4006
523k
    Py_VISIT(((_PyListIterObject *)it)->it_seq);
4007
523k
    return 0;
4008
523k
}
4009
4010
static PyObject *
4011
listiter_next(PyObject *self)
4012
133M
{
4013
133M
    _PyListIterObject *it = (_PyListIterObject *)self;
4014
133M
    Py_ssize_t index = FT_ATOMIC_LOAD_SSIZE_RELAXED(it->it_index);
4015
133M
    if (index < 0) {
4016
168
        return NULL;
4017
168
    }
4018
4019
133M
    PyObject *item = list_get_item_ref(it->it_seq, index);
4020
133M
    if (item == NULL) {
4021
        // out-of-bounds
4022
30.4M
        FT_ATOMIC_STORE_SSIZE_RELAXED(it->it_index, -1);
4023
30.4M
#ifndef Py_GIL_DISABLED
4024
30.4M
        PyListObject *seq = it->it_seq;
4025
30.4M
        it->it_seq = NULL;
4026
30.4M
        Py_DECREF(seq);
4027
30.4M
#endif
4028
30.4M
        return NULL;
4029
30.4M
    }
4030
103M
    FT_ATOMIC_STORE_SSIZE_RELAXED(it->it_index, index + 1);
4031
103M
    return item;
4032
133M
}
4033
4034
static PyObject *
4035
listiter_len(PyObject *self, PyObject *Py_UNUSED(ignored))
4036
1.38M
{
4037
1.38M
    assert(self != NULL);
4038
1.38M
    _PyListIterObject *it = (_PyListIterObject *)self;
4039
1.38M
    Py_ssize_t index = FT_ATOMIC_LOAD_SSIZE_RELAXED(it->it_index);
4040
1.38M
    if (index >= 0) {
4041
1.38M
        Py_ssize_t len = PyList_GET_SIZE(it->it_seq) - index;
4042
1.38M
        if (len >= 0)
4043
1.38M
            return PyLong_FromSsize_t(len);
4044
1.38M
    }
4045
0
    return PyLong_FromLong(0);
4046
1.38M
}
4047
4048
static PyObject *
4049
listiter_reduce(PyObject *it, PyObject *Py_UNUSED(ignored))
4050
0
{
4051
0
    return listiter_reduce_general(it, 1);
4052
0
}
4053
4054
static PyObject *
4055
listiter_setstate(PyObject *self, PyObject *state)
4056
0
{
4057
0
    _PyListIterObject *it = (_PyListIterObject *)self;
4058
0
    Py_ssize_t index = PyLong_AsSsize_t(state);
4059
0
    if (index == -1 && PyErr_Occurred())
4060
0
        return NULL;
4061
0
    if (it->it_seq != NULL) {
4062
0
        if (index < -1)
4063
0
            index = -1;
4064
0
        else if (index > PyList_GET_SIZE(it->it_seq))
4065
0
            index = PyList_GET_SIZE(it->it_seq); /* iterator exhausted */
4066
0
        FT_ATOMIC_STORE_SSIZE_RELAXED(it->it_index, index);
4067
0
    }
4068
0
    Py_RETURN_NONE;
4069
0
}
4070
4071
/*********************** List Reverse Iterator **************************/
4072
4073
typedef struct {
4074
    PyObject_HEAD
4075
    Py_ssize_t it_index;
4076
    PyListObject *it_seq; /* Set to NULL when iterator is exhausted */
4077
} listreviterobject;
4078
4079
static void listreviter_dealloc(PyObject *);
4080
static int listreviter_traverse(PyObject *, visitproc, void *);
4081
static PyObject *listreviter_next(PyObject *);
4082
static PyObject *listreviter_len(PyObject *, PyObject *);
4083
static PyObject *listreviter_reduce(PyObject *, PyObject *);
4084
static PyObject *listreviter_setstate(PyObject *, PyObject *);
4085
4086
static PyMethodDef listreviter_methods[] = {
4087
    {"__length_hint__", listreviter_len, METH_NOARGS, length_hint_doc},
4088
    {"__reduce__", listreviter_reduce, METH_NOARGS, reduce_doc},
4089
    {"__setstate__", listreviter_setstate, METH_O, setstate_doc},
4090
    {NULL,              NULL}           /* sentinel */
4091
};
4092
4093
PyTypeObject PyListRevIter_Type = {
4094
    PyVarObject_HEAD_INIT(&PyType_Type, 0)
4095
    "list_reverseiterator",                     /* tp_name */
4096
    sizeof(listreviterobject),                  /* tp_basicsize */
4097
    0,                                          /* tp_itemsize */
4098
    /* methods */
4099
    listreviter_dealloc,                        /* tp_dealloc */
4100
    0,                                          /* tp_vectorcall_offset */
4101
    0,                                          /* tp_getattr */
4102
    0,                                          /* tp_setattr */
4103
    0,                                          /* tp_as_async */
4104
    0,                                          /* tp_repr */
4105
    0,                                          /* tp_as_number */
4106
    0,                                          /* tp_as_sequence */
4107
    0,                                          /* tp_as_mapping */
4108
    0,                                          /* tp_hash */
4109
    0,                                          /* tp_call */
4110
    0,                                          /* tp_str */
4111
    PyObject_GenericGetAttr,                    /* tp_getattro */
4112
    0,                                          /* tp_setattro */
4113
    0,                                          /* tp_as_buffer */
4114
    Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC,/* tp_flags */
4115
    0,                                          /* tp_doc */
4116
    listreviter_traverse,                       /* tp_traverse */
4117
    0,                                          /* tp_clear */
4118
    0,                                          /* tp_richcompare */
4119
    0,                                          /* tp_weaklistoffset */
4120
    PyObject_SelfIter,                          /* tp_iter */
4121
    listreviter_next,                           /* tp_iternext */
4122
    listreviter_methods,                /* tp_methods */
4123
    0,
4124
};
4125
4126
/*[clinic input]
4127
list.__reversed__
4128
4129
Return a reverse iterator over the list.
4130
[clinic start generated code]*/
4131
4132
static PyObject *
4133
list___reversed___impl(PyListObject *self)
4134
/*[clinic end generated code: output=b166f073208c888c input=eadb6e17f8a6a280]*/
4135
36.3M
{
4136
36.3M
    listreviterobject *it;
4137
4138
36.3M
    it = PyObject_GC_New(listreviterobject, &PyListRevIter_Type);
4139
36.3M
    if (it == NULL)
4140
0
        return NULL;
4141
36.3M
    assert(PyList_Check(self));
4142
36.3M
    it->it_index = PyList_GET_SIZE(self) - 1;
4143
36.3M
    it->it_seq = (PyListObject*)Py_NewRef(self);
4144
36.3M
    PyObject_GC_Track(it);
4145
36.3M
    return (PyObject *)it;
4146
36.3M
}
4147
4148
static void
4149
listreviter_dealloc(PyObject *self)
4150
36.3M
{
4151
36.3M
    listreviterobject *it = (listreviterobject *)self;
4152
36.3M
    PyObject_GC_UnTrack(it);
4153
36.3M
    Py_XDECREF(it->it_seq);
4154
36.3M
    PyObject_GC_Del(it);
4155
36.3M
}
4156
4157
static int
4158
listreviter_traverse(PyObject *it, visitproc visit, void *arg)
4159
530
{
4160
530
    Py_VISIT(((listreviterobject *)it)->it_seq);
4161
530
    return 0;
4162
530
}
4163
4164
static PyObject *
4165
listreviter_next(PyObject *self)
4166
45.6M
{
4167
45.6M
    listreviterobject *it = (listreviterobject *)self;
4168
45.6M
    assert(it != NULL);
4169
45.6M
    Py_ssize_t index = FT_ATOMIC_LOAD_SSIZE_RELAXED(it->it_index);
4170
45.6M
    if (index < 0) {
4171
26.1M
        return NULL;
4172
26.1M
    }
4173
4174
19.4M
    PyListObject *seq = it->it_seq;
4175
19.4M
    assert(PyList_Check(seq));
4176
19.4M
    PyObject *item = list_get_item_ref(seq, index);
4177
19.4M
    if (item != NULL) {
4178
19.4M
        FT_ATOMIC_STORE_SSIZE_RELAXED(it->it_index, index - 1);
4179
19.4M
        return item;
4180
19.4M
    }
4181
0
    FT_ATOMIC_STORE_SSIZE_RELAXED(it->it_index, -1);
4182
0
#ifndef Py_GIL_DISABLED
4183
0
    it->it_seq = NULL;
4184
0
    Py_DECREF(seq);
4185
0
#endif
4186
0
    return NULL;
4187
19.4M
}
4188
4189
static PyObject *
4190
listreviter_len(PyObject *self, PyObject *Py_UNUSED(ignored))
4191
0
{
4192
0
    listreviterobject *it = (listreviterobject *)self;
4193
0
    Py_ssize_t index = FT_ATOMIC_LOAD_SSIZE_RELAXED(it->it_index);
4194
0
    Py_ssize_t len = index + 1;
4195
0
    if (it->it_seq == NULL || PyList_GET_SIZE(it->it_seq) < len)
4196
0
        len = 0;
4197
0
    return PyLong_FromSsize_t(len);
4198
0
}
4199
4200
static PyObject *
4201
listreviter_reduce(PyObject *it, PyObject *Py_UNUSED(ignored))
4202
0
{
4203
0
    return listiter_reduce_general(it, 0);
4204
0
}
4205
4206
static PyObject *
4207
listreviter_setstate(PyObject *self, PyObject *state)
4208
0
{
4209
0
    listreviterobject *it = (listreviterobject *)self;
4210
0
    Py_ssize_t index = PyLong_AsSsize_t(state);
4211
0
    if (index == -1 && PyErr_Occurred())
4212
0
        return NULL;
4213
0
    if (it->it_seq != NULL) {
4214
0
        if (index < -1)
4215
0
            index = -1;
4216
0
        else if (index > PyList_GET_SIZE(it->it_seq) - 1)
4217
0
            index = PyList_GET_SIZE(it->it_seq) - 1;
4218
0
        FT_ATOMIC_STORE_SSIZE_RELAXED(it->it_index, index);
4219
0
    }
4220
0
    Py_RETURN_NONE;
4221
0
}
4222
4223
/* common pickling support */
4224
4225
static PyObject *
4226
listiter_reduce_general(void *_it, int forward)
4227
0
{
4228
0
    PyObject *list;
4229
0
    PyObject *iter;
4230
4231
    /* _PyEval_GetBuiltin can invoke arbitrary code,
4232
     * call must be before access of iterator pointers.
4233
     * see issue #101765 */
4234
4235
0
    if (forward) {
4236
0
        iter = _PyEval_GetBuiltin(&_Py_ID(iter));
4237
0
        _PyListIterObject *it = (_PyListIterObject *)_it;
4238
0
        Py_ssize_t idx = FT_ATOMIC_LOAD_SSIZE_RELAXED(it->it_index);
4239
0
        if (idx >= 0) {
4240
0
            return Py_BuildValue("N(O)n", iter, it->it_seq, idx);
4241
0
        }
4242
0
    } else {
4243
0
        iter = _PyEval_GetBuiltin(&_Py_ID(reversed));
4244
0
        listreviterobject *it = (listreviterobject *)_it;
4245
0
        Py_ssize_t idx = FT_ATOMIC_LOAD_SSIZE_RELAXED(it->it_index);
4246
0
        if (idx >= 0) {
4247
0
            return Py_BuildValue("N(O)n", iter, it->it_seq, idx);
4248
0
        }
4249
0
    }
4250
    /* empty iterator, create an empty list */
4251
0
    list = PyList_New(0);
4252
0
    if (list == NULL)
4253
0
        return NULL;
4254
0
    return Py_BuildValue("N(N)", iter, list);
4255
0
}