Coverage Report

Created: 2025-11-11 06:44

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/cpython/Objects/listobject.c
Line
Count
Source
1
/* List object implementation */
2
3
#include "Python.h"
4
#include "pycore_abstract.h"      // _PyIndex_Check()
5
#include "pycore_ceval.h"         // _PyEval_GetBuiltin()
6
#include "pycore_critical_section.h"  // _Py_CRITICAL_SECTION_ASSERT_OBJECT_LOCKED()
7
#include "pycore_dict.h"          // _PyDictViewObject
8
#include "pycore_freelist.h"      // _Py_FREELIST_FREE(), _Py_FREELIST_POP()
9
#include "pycore_interp.h"        // PyInterpreterState.list
10
#include "pycore_list.h"          // struct _Py_list_freelist, _PyListIterObject
11
#include "pycore_long.h"          // _PyLong_DigitCount
12
#include "pycore_modsupport.h"    // _PyArg_NoKwnames()
13
#include "pycore_object.h"        // _PyObject_GC_TRACK(), _PyDebugAllocatorStats()
14
#include "pycore_pyatomic_ft_wrappers.h"
15
#include "pycore_setobject.h"     // _PySet_NextEntry()
16
#include "pycore_stackref.h"      // _Py_TryIncrefCompareStackRef()
17
#include "pycore_tuple.h"         // _PyTuple_FromArraySteal()
18
#include "pycore_typeobject.h"    // _Py_TYPE_VERSION_LIST
19
#include <stddef.h>
20
21
/*[clinic input]
22
class list "PyListObject *" "&PyList_Type"
23
[clinic start generated code]*/
24
/*[clinic end generated code: output=da39a3ee5e6b4b0d input=f9b222678f9f71e0]*/
25
26
#include "clinic/listobject.c.h"
27
28
_Py_DECLARE_STR(list_err, "list index out of range");
29
30
#ifdef Py_GIL_DISABLED
31
typedef struct {
32
    Py_ssize_t allocated;
33
    PyObject *ob_item[];
34
} _PyListArray;
35
36
static _PyListArray *
37
list_allocate_array(size_t capacity)
38
{
39
    if (capacity > PY_SSIZE_T_MAX/sizeof(PyObject*) - 1) {
40
        return NULL;
41
    }
42
    _PyListArray *array = PyMem_Malloc(sizeof(_PyListArray) + capacity * sizeof(PyObject *));
43
    if (array == NULL) {
44
        return NULL;
45
    }
46
    array->allocated = capacity;
47
    return array;
48
}
49
50
static Py_ssize_t
51
list_capacity(PyObject **items)
52
{
53
    _PyListArray *array = _Py_CONTAINER_OF(items, _PyListArray, ob_item);
54
    return array->allocated;
55
}
56
#endif
57
58
static void
59
free_list_items(PyObject** items, bool use_qsbr)
60
127M
{
61
#ifdef Py_GIL_DISABLED
62
    _PyListArray *array = _Py_CONTAINER_OF(items, _PyListArray, ob_item);
63
    if (use_qsbr) {
64
        size_t size = sizeof(_PyListArray) + array->allocated * sizeof(PyObject *);
65
        _PyMem_FreeDelayed(array, size);
66
    }
67
    else {
68
        PyMem_Free(array);
69
    }
70
#else
71
127M
    PyMem_Free(items);
72
127M
#endif
73
127M
}
74
75
static void
76
ensure_shared_on_resize(PyListObject *self)
77
92.8M
{
78
#ifdef Py_GIL_DISABLED
79
    // We can't use _Py_CRITICAL_SECTION_ASSERT_OBJECT_LOCKED here because
80
    // the `CALL_LIST_APPEND` bytecode handler may lock the list without
81
    // a critical section.
82
    assert(Py_REFCNT(self) == 1 || PyMutex_IsLocked(&_PyObject_CAST(self)->ob_mutex));
83
84
    // Ensure that the list array is freed using QSBR if we are not the
85
    // owning thread.
86
    if (!_Py_IsOwnedByCurrentThread((PyObject *)self) &&
87
        !_PyObject_GC_IS_SHARED(self))
88
    {
89
        _PyObject_GC_SET_SHARED(self);
90
    }
91
#endif
92
92.8M
}
93
94
/* Ensure ob_item has room for at least newsize elements, and set
95
 * ob_size to newsize.  If newsize > ob_size on entry, the content
96
 * of the new slots at exit is undefined heap trash; it's the caller's
97
 * responsibility to overwrite them with sane values.
98
 * The number of allocated elements may grow, shrink, or stay the same.
99
 * Failure is impossible if newsize <= self.allocated on entry, although
100
 * that partly relies on an assumption that the system realloc() never
101
 * fails when passed a number of bytes <= the number of bytes last
102
 * allocated (the C standard doesn't guarantee this, but it's hard to
103
 * imagine a realloc implementation where it wouldn't be true).
104
 * Note that self->ob_item may change, and even if newsize is less
105
 * than ob_size on entry.
106
 */
107
static int
108
list_resize(PyListObject *self, Py_ssize_t newsize)
109
109M
{
110
109M
    size_t new_allocated, target_bytes;
111
109M
    Py_ssize_t allocated = self->allocated;
112
113
    /* Bypass realloc() when a previous overallocation is large enough
114
       to accommodate the newsize.  If the newsize falls lower than half
115
       the allocated size, then proceed with the realloc() to shrink the list.
116
    */
117
109M
    if (allocated >= newsize && newsize >= (allocated >> 1)) {
118
16.6M
        assert(self->ob_item != NULL || newsize == 0);
119
16.6M
        Py_SET_SIZE(self, newsize);
120
16.6M
        return 0;
121
16.6M
    }
122
123
    /* This over-allocates proportional to the list size, making room
124
     * for additional growth.  The over-allocation is mild, but is
125
     * enough to give linear-time amortized behavior over a long
126
     * sequence of appends() in the presence of a poorly-performing
127
     * system realloc().
128
     * Add padding to make the allocated size multiple of 4.
129
     * The growth pattern is:  0, 4, 8, 16, 24, 32, 40, 52, 64, 76, ...
130
     * Note: new_allocated won't overflow because the largest possible value
131
     *       is PY_SSIZE_T_MAX * (9 / 8) + 6 which always fits in a size_t.
132
     */
133
92.8M
    new_allocated = ((size_t)newsize + (newsize >> 3) + 6) & ~(size_t)3;
134
    /* Do not overallocate if the new size is closer to overallocated size
135
     * than to the old size.
136
     */
137
92.8M
    if (newsize - Py_SIZE(self) > (Py_ssize_t)(new_allocated - newsize))
138
10.8k
        new_allocated = ((size_t)newsize + 3) & ~(size_t)3;
139
140
92.8M
    if (newsize == 0)
141
3.24k
        new_allocated = 0;
142
143
92.8M
    ensure_shared_on_resize(self);
144
145
#ifdef Py_GIL_DISABLED
146
    _PyListArray *array = list_allocate_array(new_allocated);
147
    if (array == NULL) {
148
        PyErr_NoMemory();
149
        return -1;
150
    }
151
    PyObject **old_items = self->ob_item;
152
    if (self->ob_item) {
153
        if (new_allocated < (size_t)allocated) {
154
            target_bytes = new_allocated * sizeof(PyObject*);
155
        }
156
        else {
157
            target_bytes = allocated * sizeof(PyObject*);
158
        }
159
        memcpy(array->ob_item, self->ob_item, target_bytes);
160
    }
161
    if (new_allocated > (size_t)allocated) {
162
        memset(array->ob_item + allocated, 0, sizeof(PyObject *) * (new_allocated - allocated));
163
    }
164
     _Py_atomic_store_ptr_release(&self->ob_item, &array->ob_item);
165
    self->allocated = new_allocated;
166
    Py_SET_SIZE(self, newsize);
167
    if (old_items != NULL) {
168
        free_list_items(old_items, _PyObject_GC_IS_SHARED(self));
169
    }
170
#else
171
92.8M
    PyObject **items;
172
92.8M
    if (new_allocated <= (size_t)PY_SSIZE_T_MAX / sizeof(PyObject *)) {
173
92.8M
        target_bytes = new_allocated * sizeof(PyObject *);
174
92.8M
        items = (PyObject **)PyMem_Realloc(self->ob_item, target_bytes);
175
92.8M
    }
176
0
    else {
177
        // integer overflow
178
0
        items = NULL;
179
0
    }
180
92.8M
    if (items == NULL) {
181
0
        PyErr_NoMemory();
182
0
        return -1;
183
0
    }
184
92.8M
    self->ob_item = items;
185
92.8M
    Py_SET_SIZE(self, newsize);
186
92.8M
    self->allocated = new_allocated;
187
92.8M
#endif
188
92.8M
    return 0;
189
92.8M
}
190
191
static int
192
list_preallocate_exact(PyListObject *self, Py_ssize_t size)
193
6.86M
{
194
6.86M
    PyObject **items;
195
6.86M
    assert(self->ob_item == NULL);
196
6.86M
    assert(size > 0);
197
198
    /* Since the Python memory allocator has granularity of 16 bytes on 64-bit
199
     * platforms (8 on 32-bit), there is no benefit of allocating space for
200
     * the odd number of items, and there is no drawback of rounding the
201
     * allocated size up to the nearest even number.
202
     */
203
6.86M
    size = (size + 1) & ~(size_t)1;
204
#ifdef Py_GIL_DISABLED
205
    _PyListArray *array = list_allocate_array(size);
206
    if (array == NULL) {
207
        PyErr_NoMemory();
208
        return -1;
209
    }
210
    items = array->ob_item;
211
    memset(items, 0, size * sizeof(PyObject *));
212
#else
213
6.86M
    items = PyMem_New(PyObject*, size);
214
6.86M
    if (items == NULL) {
215
0
        PyErr_NoMemory();
216
0
        return -1;
217
0
    }
218
6.86M
#endif
219
6.86M
    FT_ATOMIC_STORE_PTR_RELEASE(self->ob_item, items);
220
6.86M
    self->allocated = size;
221
6.86M
    return 0;
222
6.86M
}
223
224
/* Print summary info about the state of the optimized allocator */
225
void
226
_PyList_DebugMallocStats(FILE *out)
227
0
{
228
0
    _PyDebugAllocatorStats(out,
229
0
                           "free PyListObject",
230
0
                            _Py_FREELIST_SIZE(lists),
231
0
                           sizeof(PyListObject));
232
0
}
233
234
PyObject *
235
PyList_New(Py_ssize_t size)
236
294M
{
237
294M
    if (size < 0) {
238
0
        PyErr_BadInternalCall();
239
0
        return NULL;
240
0
    }
241
242
294M
    PyListObject *op = _Py_FREELIST_POP(PyListObject, lists);
243
294M
    if (op == NULL) {
244
38.2M
        op = PyObject_GC_New(PyListObject, &PyList_Type);
245
38.2M
        if (op == NULL) {
246
0
            return NULL;
247
0
        }
248
38.2M
    }
249
294M
    if (size <= 0) {
250
249M
        op->ob_item = NULL;
251
249M
    }
252
44.7M
    else {
253
#ifdef Py_GIL_DISABLED
254
        _PyListArray *array = list_allocate_array(size);
255
        if (array == NULL) {
256
            Py_DECREF(op);
257
            return PyErr_NoMemory();
258
        }
259
        memset(&array->ob_item, 0, size * sizeof(PyObject *));
260
        op->ob_item = array->ob_item;
261
#else
262
44.7M
        op->ob_item = (PyObject **) PyMem_Calloc(size, sizeof(PyObject *));
263
44.7M
#endif
264
44.7M
        if (op->ob_item == NULL) {
265
0
            Py_DECREF(op);
266
0
            return PyErr_NoMemory();
267
0
        }
268
44.7M
    }
269
294M
    Py_SET_SIZE(op, size);
270
294M
    op->allocated = size;
271
294M
    _PyObject_GC_TRACK(op);
272
294M
    return (PyObject *) op;
273
294M
}
274
275
static PyObject *
276
list_new_prealloc(Py_ssize_t size)
277
15.9M
{
278
15.9M
    assert(size > 0);
279
15.9M
    PyListObject *op = (PyListObject *) PyList_New(0);
280
15.9M
    if (op == NULL) {
281
0
        return NULL;
282
0
    }
283
15.9M
    assert(op->ob_item == NULL);
284
#ifdef Py_GIL_DISABLED
285
    _PyListArray *array = list_allocate_array(size);
286
    if (array == NULL) {
287
        Py_DECREF(op);
288
        return PyErr_NoMemory();
289
    }
290
    op->ob_item = array->ob_item;
291
#else
292
15.9M
    op->ob_item = PyMem_New(PyObject *, size);
293
15.9M
    if (op->ob_item == NULL) {
294
0
        Py_DECREF(op);
295
0
        return PyErr_NoMemory();
296
0
    }
297
15.9M
#endif
298
15.9M
    op->allocated = size;
299
15.9M
    return (PyObject *) op;
300
15.9M
}
301
302
Py_ssize_t
303
PyList_Size(PyObject *op)
304
99.0k
{
305
99.0k
    if (!PyList_Check(op)) {
306
0
        PyErr_BadInternalCall();
307
0
        return -1;
308
0
    }
309
99.0k
    else {
310
99.0k
        return PyList_GET_SIZE(op);
311
99.0k
    }
312
99.0k
}
313
314
static inline int
315
valid_index(Py_ssize_t i, Py_ssize_t limit)
316
220M
{
317
    /* The cast to size_t lets us use just a single comparison
318
       to check whether i is in the range: 0 <= i < limit.
319
320
       See:  Section 14.2 "Bounds Checking" in the Agner Fog
321
       optimization manual found at:
322
       https://www.agner.org/optimize/optimizing_cpp.pdf
323
    */
324
220M
    return (size_t) i < (size_t) limit;
325
220M
}
326
327
#ifdef Py_GIL_DISABLED
328
329
static PyObject *
330
list_item_impl(PyListObject *self, Py_ssize_t idx)
331
{
332
    PyObject *item = NULL;
333
    Py_BEGIN_CRITICAL_SECTION(self);
334
    if (!_PyObject_GC_IS_SHARED(self)) {
335
        _PyObject_GC_SET_SHARED(self);
336
    }
337
    Py_ssize_t size = Py_SIZE(self);
338
    if (!valid_index(idx, size)) {
339
        goto exit;
340
    }
341
    item = _Py_NewRefWithLock(self->ob_item[idx]);
342
exit:
343
    Py_END_CRITICAL_SECTION();
344
    return item;
345
}
346
347
static inline PyObject*
348
list_get_item_ref(PyListObject *op, Py_ssize_t i)
349
{
350
    if (!_Py_IsOwnedByCurrentThread((PyObject *)op) && !_PyObject_GC_IS_SHARED(op)) {
351
        return list_item_impl(op, i);
352
    }
353
    // Need atomic operation for the getting size.
354
    Py_ssize_t size = PyList_GET_SIZE(op);
355
    if (!valid_index(i, size)) {
356
        return NULL;
357
    }
358
    PyObject **ob_item = _Py_atomic_load_ptr(&op->ob_item);
359
    if (ob_item == NULL) {
360
        return NULL;
361
    }
362
    Py_ssize_t cap = list_capacity(ob_item);
363
    assert(cap != -1);
364
    if (!valid_index(i, cap)) {
365
        return NULL;
366
    }
367
    PyObject *item = _Py_TryXGetRef(&ob_item[i]);
368
    if (item == NULL) {
369
        return list_item_impl(op, i);
370
    }
371
    return item;
372
}
373
#else
374
static inline PyObject*
375
list_get_item_ref(PyListObject *op, Py_ssize_t i)
376
165M
{
377
165M
    if (!valid_index(i, Py_SIZE(op))) {
378
31.6M
        return NULL;
379
31.6M
    }
380
133M
    return Py_NewRef(PyList_GET_ITEM(op, i));
381
165M
}
382
#endif
383
384
PyObject *
385
PyList_GetItem(PyObject *op, Py_ssize_t i)
386
644
{
387
644
    if (!PyList_Check(op)) {
388
0
        PyErr_BadInternalCall();
389
0
        return NULL;
390
0
    }
391
644
    if (!valid_index(i, Py_SIZE(op))) {
392
0
        _Py_DECLARE_STR(list_err, "list index out of range");
393
0
        PyErr_SetObject(PyExc_IndexError, &_Py_STR(list_err));
394
0
        return NULL;
395
0
    }
396
644
    return ((PyListObject *)op) -> ob_item[i];
397
644
}
398
399
PyObject *
400
PyList_GetItemRef(PyObject *op, Py_ssize_t i)
401
91.1k
{
402
91.1k
    if (!PyList_Check(op)) {
403
0
        PyErr_SetString(PyExc_TypeError, "expected a list");
404
0
        return NULL;
405
0
    }
406
91.1k
    PyObject *item = list_get_item_ref((PyListObject *)op, i);
407
91.1k
    if (item == NULL) {
408
0
        _Py_DECLARE_STR(list_err, "list index out of range");
409
0
        PyErr_SetObject(PyExc_IndexError, &_Py_STR(list_err));
410
0
        return NULL;
411
0
    }
412
91.1k
    return item;
413
91.1k
}
414
415
PyObject *
416
_PyList_GetItemRef(PyListObject *list, Py_ssize_t i)
417
1.72k
{
418
1.72k
    return list_get_item_ref(list, i);
419
1.72k
}
420
421
#ifdef Py_GIL_DISABLED
422
int
423
_PyList_GetItemRefNoLock(PyListObject *list, Py_ssize_t i, _PyStackRef *result)
424
{
425
    assert(_Py_IsOwnedByCurrentThread((PyObject *)list) ||
426
           _PyObject_GC_IS_SHARED(list));
427
    if (!valid_index(i, PyList_GET_SIZE(list))) {
428
        return 0;
429
    }
430
    PyObject **ob_item = _Py_atomic_load_ptr(&list->ob_item);
431
    if (ob_item == NULL) {
432
        return 0;
433
    }
434
    Py_ssize_t cap = list_capacity(ob_item);
435
    assert(cap != -1);
436
    if (!valid_index(i, cap)) {
437
        return 0;
438
    }
439
    PyObject *obj = _Py_atomic_load_ptr(&ob_item[i]);
440
    if (obj == NULL || !_Py_TryIncrefCompareStackRef(&ob_item[i], obj, result)) {
441
        return -1;
442
    }
443
    return 1;
444
}
445
#endif
446
447
int
448
PyList_SetItem(PyObject *op, Py_ssize_t i,
449
               PyObject *newitem)
450
25.3k
{
451
25.3k
    if (!PyList_Check(op)) {
452
0
        Py_XDECREF(newitem);
453
0
        PyErr_BadInternalCall();
454
0
        return -1;
455
0
    }
456
25.3k
    int ret;
457
25.3k
    PyListObject *self = ((PyListObject *)op);
458
25.3k
    Py_BEGIN_CRITICAL_SECTION(self);
459
25.3k
    if (!valid_index(i, Py_SIZE(self))) {
460
0
        Py_XDECREF(newitem);
461
0
        PyErr_SetString(PyExc_IndexError,
462
0
                        "list assignment index out of range");
463
0
        ret = -1;
464
0
        goto end;
465
0
    }
466
25.3k
    PyObject *tmp = self->ob_item[i];
467
25.3k
    FT_ATOMIC_STORE_PTR_RELEASE(self->ob_item[i], newitem);
468
25.3k
    Py_XDECREF(tmp);
469
25.3k
    ret = 0;
470
25.3k
end:;
471
25.3k
    Py_END_CRITICAL_SECTION();
472
25.3k
    return ret;
473
25.3k
}
474
475
static int
476
ins1(PyListObject *self, Py_ssize_t where, PyObject *v)
477
82
{
478
82
    Py_ssize_t i, n = Py_SIZE(self);
479
82
    PyObject **items;
480
82
    if (v == NULL) {
481
0
        PyErr_BadInternalCall();
482
0
        return -1;
483
0
    }
484
485
82
    assert((size_t)n + 1 < PY_SSIZE_T_MAX);
486
82
    if (list_resize(self, n+1) < 0)
487
0
        return -1;
488
489
82
    if (where < 0) {
490
0
        where += n;
491
0
        if (where < 0)
492
0
            where = 0;
493
0
    }
494
82
    if (where > n)
495
0
        where = n;
496
82
    items = self->ob_item;
497
474
    for (i = n; --i >= where; )
498
392
        FT_ATOMIC_STORE_PTR_RELAXED(items[i+1], items[i]);
499
82
    FT_ATOMIC_STORE_PTR_RELEASE(items[where], Py_NewRef(v));
500
82
    return 0;
501
82
}
502
503
int
504
PyList_Insert(PyObject *op, Py_ssize_t where, PyObject *newitem)
505
22
{
506
22
    if (!PyList_Check(op)) {
507
0
        PyErr_BadInternalCall();
508
0
        return -1;
509
0
    }
510
22
    PyListObject *self = (PyListObject *)op;
511
22
    int err;
512
22
    Py_BEGIN_CRITICAL_SECTION(self);
513
22
    err = ins1(self, where, newitem);
514
22
    Py_END_CRITICAL_SECTION();
515
22
    return err;
516
22
}
517
518
/* internal, used by _PyList_AppendTakeRef */
519
int
520
_PyList_AppendTakeRefListResize(PyListObject *self, PyObject *newitem)
521
68.7M
{
522
68.7M
    Py_ssize_t len = Py_SIZE(self);
523
68.7M
    assert(self->allocated == -1 || self->allocated == len);
524
68.7M
    if (list_resize(self, len + 1) < 0) {
525
0
        Py_DECREF(newitem);
526
0
        return -1;
527
0
    }
528
68.7M
    FT_ATOMIC_STORE_PTR_RELEASE(self->ob_item[len], newitem);
529
68.7M
    return 0;
530
68.7M
}
531
532
int
533
PyList_Append(PyObject *op, PyObject *newitem)
534
170M
{
535
170M
    if (PyList_Check(op) && (newitem != NULL)) {
536
170M
        int ret;
537
170M
        Py_BEGIN_CRITICAL_SECTION(op);
538
170M
        ret = _PyList_AppendTakeRef((PyListObject *)op, Py_NewRef(newitem));
539
170M
        Py_END_CRITICAL_SECTION();
540
170M
        return ret;
541
170M
    }
542
0
    PyErr_BadInternalCall();
543
0
    return -1;
544
170M
}
545
546
/* Methods */
547
548
static void
549
list_dealloc(PyObject *self)
550
315M
{
551
315M
    PyListObject *op = (PyListObject *)self;
552
315M
    Py_ssize_t i;
553
315M
    PyObject_GC_UnTrack(op);
554
315M
    if (op->ob_item != NULL) {
555
        /* Do it backwards, for Christian Tismer.
556
           There's a simple test case where somehow this reduces
557
           thrashing when a *very* large list is created and
558
           immediately deleted. */
559
112M
        i = Py_SIZE(op);
560
1.43G
        while (--i >= 0) {
561
1.32G
            Py_XDECREF(op->ob_item[i]);
562
1.32G
        }
563
112M
        free_list_items(op->ob_item, false);
564
112M
        op->ob_item = NULL;
565
112M
    }
566
315M
    if (PyList_CheckExact(op)) {
567
303M
        _Py_FREELIST_FREE(lists, op, PyObject_GC_Del);
568
303M
    }
569
11.6M
    else {
570
11.6M
        PyObject_GC_Del(op);
571
11.6M
    }
572
315M
}
573
574
static PyObject *
575
list_repr_impl(PyListObject *v)
576
4.16M
{
577
4.16M
    int res = Py_ReprEnter((PyObject*)v);
578
4.16M
    if (res != 0) {
579
0
        return (res > 0 ? PyUnicode_FromString("[...]") : NULL);
580
0
    }
581
582
    /* "[" + "1" + ", 2" * (len - 1) + "]" */
583
4.16M
    Py_ssize_t prealloc = 1 + 1 + (2 + 1) * (Py_SIZE(v) - 1) + 1;
584
4.16M
    PyUnicodeWriter *writer = PyUnicodeWriter_Create(prealloc);
585
4.16M
    PyObject *item = NULL;
586
4.16M
    if (writer == NULL) {
587
0
        goto error;
588
0
    }
589
590
4.16M
    if (PyUnicodeWriter_WriteChar(writer, '[') < 0) {
591
0
        goto error;
592
0
    }
593
594
    /* Do repr() on each element.  Note that this may mutate the list,
595
       so must refetch the list size on each iteration. */
596
11.4M
    for (Py_ssize_t i = 0; i < Py_SIZE(v); ++i) {
597
        /* Hold a strong reference since repr(item) can mutate the list */
598
7.31M
        item = Py_NewRef(v->ob_item[i]);
599
600
7.31M
        if (i > 0) {
601
3.14M
            if (PyUnicodeWriter_WriteChar(writer, ',') < 0) {
602
0
                goto error;
603
0
            }
604
3.14M
            if (PyUnicodeWriter_WriteChar(writer, ' ') < 0) {
605
0
                goto error;
606
0
            }
607
3.14M
        }
608
609
7.31M
        if (PyUnicodeWriter_WriteRepr(writer, item) < 0) {
610
0
            goto error;
611
0
        }
612
7.31M
        Py_CLEAR(item);
613
7.31M
    }
614
615
4.16M
    if (PyUnicodeWriter_WriteChar(writer, ']') < 0) {
616
0
        goto error;
617
0
    }
618
619
4.16M
    Py_ReprLeave((PyObject *)v);
620
4.16M
    return PyUnicodeWriter_Finish(writer);
621
622
0
error:
623
0
    Py_XDECREF(item);
624
0
    PyUnicodeWriter_Discard(writer);
625
0
    Py_ReprLeave((PyObject *)v);
626
0
    return NULL;
627
4.16M
}
628
629
/* Return repr(self): "[]" for an empty list, otherwise the result of
 * list_repr_impl() run inside a critical section on the list. */
static PyObject *
list_repr(PyObject *self)
{
    if (PyList_GET_SIZE(self) == 0) {
        return PyUnicode_FromString("[]");
    }

    PyObject *text = NULL;
    PyListObject *list = (PyListObject *)self;
    Py_BEGIN_CRITICAL_SECTION(list);
    text = list_repr_impl(list);
    Py_END_CRITICAL_SECTION();
    return text;
}
642
643
static Py_ssize_t
644
list_length(PyObject *a)
645
51.6M
{
646
51.6M
    return PyList_GET_SIZE(a);
647
51.6M
}
648
649
static int
650
list_contains(PyObject *aa, PyObject *el)
651
8.14k
{
652
653
38.9k
    for (Py_ssize_t i = 0; ; i++) {
654
38.9k
        PyObject *item = list_get_item_ref((PyListObject *)aa, i);
655
38.9k
        if (item == NULL) {
656
            // out-of-bounds
657
7.30k
            return 0;
658
7.30k
        }
659
31.6k
        int cmp = PyObject_RichCompareBool(item, el, Py_EQ);
660
31.6k
        Py_DECREF(item);
661
31.6k
        if (cmp != 0) {
662
840
            return cmp;
663
840
        }
664
31.6k
    }
665
0
    return 0;
666
8.14k
}
667
668
static PyObject *
669
list_item(PyObject *aa, Py_ssize_t i)
670
19.8M
{
671
19.8M
    PyListObject *a = (PyListObject *)aa;
672
19.8M
    if (!valid_index(i, PyList_GET_SIZE(a))) {
673
1.18k
        PyErr_SetObject(PyExc_IndexError, &_Py_STR(list_err));
674
1.18k
        return NULL;
675
1.18k
    }
676
19.8M
    PyObject *item;
677
#ifdef Py_GIL_DISABLED
678
    item = list_get_item_ref(a, i);
679
    if (item == NULL) {
680
        PyErr_SetObject(PyExc_IndexError, &_Py_STR(list_err));
681
        return NULL;
682
    }
683
#else
684
19.8M
    item = Py_NewRef(a->ob_item[i]);
685
19.8M
#endif
686
19.8M
    return item;
687
19.8M
}
688
689
static PyObject *
690
list_slice_lock_held(PyListObject *a, Py_ssize_t ilow, Py_ssize_t ihigh)
691
2.45M
{
692
2.45M
    PyListObject *np;
693
2.45M
    PyObject **src, **dest;
694
2.45M
    Py_ssize_t i, len;
695
2.45M
    len = ihigh - ilow;
696
2.45M
    if (len <= 0) {
697
0
        return PyList_New(0);
698
0
    }
699
2.45M
    np = (PyListObject *) list_new_prealloc(len);
700
2.45M
    if (np == NULL)
701
0
        return NULL;
702
703
2.45M
    src = a->ob_item + ilow;
704
2.45M
    dest = np->ob_item;
705
30.5M
    for (i = 0; i < len; i++) {
706
28.1M
        PyObject *v = src[i];
707
28.1M
        dest[i] = Py_NewRef(v);
708
28.1M
    }
709
2.45M
    Py_SET_SIZE(np, len);
710
2.45M
    return (PyObject *)np;
711
2.45M
}
712
713
PyObject *
714
PyList_GetSlice(PyObject *a, Py_ssize_t ilow, Py_ssize_t ihigh)
715
0
{
716
0
    if (!PyList_Check(a)) {
717
0
        PyErr_BadInternalCall();
718
0
        return NULL;
719
0
    }
720
0
    PyObject *ret;
721
0
    Py_BEGIN_CRITICAL_SECTION(a);
722
0
    if (ilow < 0) {
723
0
        ilow = 0;
724
0
    }
725
0
    else if (ilow > Py_SIZE(a)) {
726
0
        ilow = Py_SIZE(a);
727
0
    }
728
0
    if (ihigh < ilow) {
729
0
        ihigh = ilow;
730
0
    }
731
0
    else if (ihigh > Py_SIZE(a)) {
732
0
        ihigh = Py_SIZE(a);
733
0
    }
734
0
    ret = list_slice_lock_held((PyListObject *)a, ilow, ihigh);
735
0
    Py_END_CRITICAL_SECTION();
736
0
    return ret;
737
0
}
738
739
static PyObject *
740
list_concat_lock_held(PyListObject *a, PyListObject *b)
741
21.7M
{
742
21.7M
    Py_ssize_t size;
743
21.7M
    Py_ssize_t i;
744
21.7M
    PyObject **src, **dest;
745
21.7M
    PyListObject *np;
746
21.7M
    assert((size_t)Py_SIZE(a) + (size_t)Py_SIZE(b) < PY_SSIZE_T_MAX);
747
21.7M
    size = Py_SIZE(a) + Py_SIZE(b);
748
21.7M
    if (size == 0) {
749
8.22M
        return PyList_New(0);
750
8.22M
    }
751
13.4M
    np = (PyListObject *) list_new_prealloc(size);
752
13.4M
    if (np == NULL) {
753
0
        return NULL;
754
0
    }
755
13.4M
    src = a->ob_item;
756
13.4M
    dest = np->ob_item;
757
405M
    for (i = 0; i < Py_SIZE(a); i++) {
758
391M
        PyObject *v = src[i];
759
391M
        dest[i] = Py_NewRef(v);
760
391M
    }
761
13.4M
    src = b->ob_item;
762
13.4M
    dest = np->ob_item + Py_SIZE(a);
763
236M
    for (i = 0; i < Py_SIZE(b); i++) {
764
222M
        PyObject *v = src[i];
765
222M
        dest[i] = Py_NewRef(v);
766
222M
    }
767
13.4M
    Py_SET_SIZE(np, size);
768
13.4M
    return (PyObject *)np;
769
13.4M
}
770
771
/* Return aa + bb as a new list.
 *
 * Returns NULL with TypeError set when `bb` is not a list.  Otherwise
 * the result of list_concat_lock_held(), called inside a critical
 * section covering both operands.
 */
static PyObject *
list_concat(PyObject *aa, PyObject *bb)
{
    if (!PyList_Check(bb)) {
        PyErr_Format(PyExc_TypeError,
                  "can only concatenate list (not \"%.200s\") to list",
                  Py_TYPE(bb)->tp_name);
        return NULL;
    }

    PyObject *joined;
    PyListObject *left = (PyListObject *)aa;
    PyListObject *right = (PyListObject *)bb;
    Py_BEGIN_CRITICAL_SECTION2(left, right);
    joined = list_concat_lock_held(left, right);
    Py_END_CRITICAL_SECTION2();
    return joined;
}
788
789
static PyObject *
790
list_repeat_lock_held(PyListObject *a, Py_ssize_t n)
791
13.7k
{
792
13.7k
    const Py_ssize_t input_size = Py_SIZE(a);
793
13.7k
    if (input_size == 0 || n <= 0)
794
2.01k
        return PyList_New(0);
795
13.7k
    assert(n > 0);
796
797
11.6k
    if (input_size > PY_SSIZE_T_MAX / n)
798
0
        return PyErr_NoMemory();
799
11.6k
    Py_ssize_t output_size = input_size * n;
800
801
11.6k
    PyListObject *np = (PyListObject *) list_new_prealloc(output_size);
802
11.6k
    if (np == NULL)
803
0
        return NULL;
804
805
11.6k
    PyObject **dest = np->ob_item;
806
11.6k
    if (input_size == 1) {
807
11.6k
        PyObject *elem = a->ob_item[0];
808
11.6k
        _Py_RefcntAdd(elem, n);
809
11.6k
        PyObject **dest_end = dest + output_size;
810
11.1M
        while (dest < dest_end) {
811
11.1M
            *dest++ = elem;
812
11.1M
        }
813
11.6k
    }
814
0
    else {
815
0
        PyObject **src = a->ob_item;
816
0
        PyObject **src_end = src + input_size;
817
0
        while (src < src_end) {
818
0
            _Py_RefcntAdd(*src, n);
819
0
            *dest++ = *src++;
820
0
        }
821
        // TODO: _Py_memory_repeat calls are not safe for shared lists in
822
        // GIL_DISABLED builds. (See issue #129069)
823
0
        _Py_memory_repeat((char *)np->ob_item, sizeof(PyObject *)*output_size,
824
0
                                        sizeof(PyObject *)*input_size);
825
0
    }
826
827
11.6k
    Py_SET_SIZE(np, output_size);
828
11.6k
    return (PyObject *) np;
829
11.6k
}
830
831
static PyObject *
832
list_repeat(PyObject *aa, Py_ssize_t n)
833
13.7k
{
834
13.7k
    PyObject *ret;
835
13.7k
    PyListObject *a = (PyListObject *)aa;
836
13.7k
    Py_BEGIN_CRITICAL_SECTION(a);
837
13.7k
    ret = list_repeat_lock_held(a, n);
838
13.7k
    Py_END_CRITICAL_SECTION();
839
13.7k
    return ret;
840
13.7k
}
841
842
static void
843
list_clear_impl(PyListObject *a, bool is_resize)
844
15.1M
{
845
15.1M
    PyObject **items = a->ob_item;
846
15.1M
    if (items == NULL) {
847
0
        return;
848
0
    }
849
850
    /* Because XDECREF can recursively invoke operations on
851
       this list, we make it empty first. */
852
15.1M
    Py_ssize_t i = Py_SIZE(a);
853
15.1M
    Py_SET_SIZE(a, 0);
854
15.1M
    FT_ATOMIC_STORE_PTR_RELEASE(a->ob_item, NULL);
855
15.1M
    a->allocated = 0;
856
30.4M
    while (--i >= 0) {
857
15.3M
        Py_XDECREF(items[i]);
858
15.3M
    }
859
#ifdef Py_GIL_DISABLED
860
    if (is_resize) {
861
        ensure_shared_on_resize(a);
862
    }
863
    bool use_qsbr = is_resize && _PyObject_GC_IS_SHARED(a);
864
#else
865
15.1M
    bool use_qsbr = false;
866
15.1M
#endif
867
15.1M
    free_list_items(items, use_qsbr);
868
    // Note that there is no guarantee that the list is actually empty
869
    // at this point, because XDECREF may have populated it indirectly again!
870
15.1M
}
871
872
static void
873
list_clear(PyListObject *a)
874
15.1M
{
875
15.1M
    list_clear_impl(a, true);
876
15.1M
}
877
878
static int
879
list_clear_slot(PyObject *self)
880
0
{
881
0
    list_clear_impl((PyListObject *)self, false);
882
0
    return 0;
883
0
}
884
885
/* a[ilow:ihigh] = v if v != NULL.
886
 * del a[ilow:ihigh] if v == NULL.
887
 *
888
 * Special speed gimmick:  when v is NULL and ihigh - ilow <= 8, it's
889
 * guaranteed the call cannot fail.
890
 */
891
static int
892
list_ass_slice_lock_held(PyListObject *a, Py_ssize_t ilow, Py_ssize_t ihigh, PyObject *v)
893
4.41M
{
894
    /* Because [X]DECREF can recursively invoke list operations on
895
       this list, we must postpone all [X]DECREF activity until
896
       after the list is back in its canonical shape.  Therefore
897
       we must allocate an additional array, 'recycle', into which
898
       we temporarily copy the items that are deleted from the
899
       list. :-( */
900
4.41M
    PyObject *recycle_on_stack[8];
901
4.41M
    PyObject **recycle = recycle_on_stack; /* will allocate more if needed */
902
4.41M
    PyObject **item;
903
4.41M
    PyObject **vitem = NULL;
904
4.41M
    PyObject *v_as_SF = NULL; /* PySequence_Fast(v) */
905
4.41M
    Py_ssize_t n; /* # of elements in replacement list */
906
4.41M
    Py_ssize_t norig; /* # of elements in list getting replaced */
907
4.41M
    Py_ssize_t d; /* Change in size */
908
4.41M
    Py_ssize_t k;
909
4.41M
    size_t s;
910
4.41M
    int result = -1;            /* guilty until proved innocent */
911
4.41M
#define b ((PyListObject *)v)
912
4.41M
    if (v == NULL)
913
4.19M
        n = 0;
914
226k
    else {
915
226k
        v_as_SF = PySequence_Fast(v, "can only assign an iterable");
916
226k
        if(v_as_SF == NULL)
917
0
            goto Error;
918
226k
        n = PySequence_Fast_GET_SIZE(v_as_SF);
919
226k
        vitem = PySequence_Fast_ITEMS(v_as_SF);
920
226k
    }
921
4.41M
    if (ilow < 0)
922
0
        ilow = 0;
923
4.41M
    else if (ilow > Py_SIZE(a))
924
0
        ilow = Py_SIZE(a);
925
926
4.41M
    if (ihigh < ilow)
927
0
        ihigh = ilow;
928
4.41M
    else if (ihigh > Py_SIZE(a))
929
0
        ihigh = Py_SIZE(a);
930
931
4.41M
    norig = ihigh - ilow;
932
4.41M
    assert(norig >= 0);
933
4.41M
    d = n - norig;
934
4.41M
    if (Py_SIZE(a) + d == 0) {
935
614k
        Py_XDECREF(v_as_SF);
936
614k
        list_clear(a);
937
614k
        return 0;
938
614k
    }
939
3.80M
    item = a->ob_item;
940
    /* recycle the items that we are about to remove */
941
3.80M
    s = norig * sizeof(PyObject *);
942
    /* If norig == 0, item might be NULL, in which case we may not memcpy from it. */
943
3.80M
    if (s) {
944
3.60M
        if (s > sizeof(recycle_on_stack)) {
945
146
            recycle = (PyObject **)PyMem_Malloc(s);
946
146
            if (recycle == NULL) {
947
0
                PyErr_NoMemory();
948
0
                goto Error;
949
0
            }
950
146
        }
951
3.60M
        memcpy(recycle, &item[ilow], s);
952
3.60M
    }
953
954
3.80M
    if (d < 0) { /* Delete -d items */
955
3.60M
        Py_ssize_t tail;
956
3.60M
        tail = (Py_SIZE(a) - ihigh) * sizeof(PyObject *);
957
        // TODO: these memmove/memcpy calls are not safe for shared lists in
958
        // GIL_DISABLED builds. (See issue #129069)
959
3.60M
        memmove(&item[ihigh+d], &item[ihigh], tail);
960
3.60M
        if (list_resize(a, Py_SIZE(a) + d) < 0) {
961
0
            memmove(&item[ihigh], &item[ihigh+d], tail);
962
0
            memcpy(&item[ilow], recycle, s);
963
0
            goto Error;
964
0
        }
965
3.60M
        item = a->ob_item;
966
3.60M
    }
967
200k
    else if (d > 0) { /* Insert d items */
968
200k
        k = Py_SIZE(a);
969
200k
        if (list_resize(a, k+d) < 0)
970
0
            goto Error;
971
200k
        item = a->ob_item;
972
        // TODO: these memmove/memcpy calls are not safe for shared lists in
973
        // GIL_DISABLED builds. (See issue #129069)
974
200k
        memmove(&item[ihigh+d], &item[ihigh],
975
200k
            (k - ihigh)*sizeof(PyObject *));
976
200k
    }
977
4.00M
    for (k = 0; k < n; k++, ilow++) {
978
200k
        PyObject *w = vitem[k];
979
200k
        FT_ATOMIC_STORE_PTR_RELEASE(item[ilow], Py_XNewRef(w));
980
200k
    }
981
7.41M
    for (k = norig - 1; k >= 0; --k)
982
3.61M
        Py_XDECREF(recycle[k]);
983
3.80M
    result = 0;
984
3.80M
 Error:
985
3.80M
    if (recycle != recycle_on_stack)
986
146
        PyMem_Free(recycle);
987
3.80M
    Py_XDECREF(v_as_SF);
988
3.80M
    return result;
989
3.80M
#undef b
990
3.80M
}
991
992
static int
993
list_ass_slice(PyListObject *a, Py_ssize_t ilow, Py_ssize_t ihigh, PyObject *v)
994
4.18M
{
995
4.18M
    int ret;
996
4.18M
    if (a == (PyListObject *)v) {
997
0
        Py_BEGIN_CRITICAL_SECTION(a);
998
0
        Py_ssize_t n = PyList_GET_SIZE(a);
999
0
        PyObject *copy = list_slice_lock_held(a, 0, n);
1000
0
        if (copy == NULL) {
1001
0
            ret = -1;
1002
0
        }
1003
0
        else {
1004
0
            ret = list_ass_slice_lock_held(a, ilow, ihigh, copy);
1005
0
            Py_DECREF(copy);
1006
0
        }
1007
0
        Py_END_CRITICAL_SECTION();
1008
0
    }
1009
4.18M
    else if (v != NULL && PyList_CheckExact(v)) {
1010
247
        Py_BEGIN_CRITICAL_SECTION2(a, v);
1011
247
        ret = list_ass_slice_lock_held(a, ilow, ihigh, v);
1012
247
        Py_END_CRITICAL_SECTION2();
1013
247
    }
1014
4.18M
    else {
1015
4.18M
        Py_BEGIN_CRITICAL_SECTION(a);
1016
4.18M
        ret = list_ass_slice_lock_held(a, ilow, ihigh, v);
1017
4.18M
        Py_END_CRITICAL_SECTION();
1018
4.18M
    }
1019
4.18M
    return ret;
1020
4.18M
}
1021
1022
int
1023
PyList_SetSlice(PyObject *a, Py_ssize_t ilow, Py_ssize_t ihigh, PyObject *v)
1024
4.18M
{
1025
4.18M
    if (!PyList_Check(a)) {
1026
0
        PyErr_BadInternalCall();
1027
0
        return -1;
1028
0
    }
1029
4.18M
    return list_ass_slice((PyListObject *)a, ilow, ihigh, v);
1030
4.18M
}
1031
1032
static int
1033
list_inplace_repeat_lock_held(PyListObject *self, Py_ssize_t n)
1034
0
{
1035
0
    Py_ssize_t input_size = PyList_GET_SIZE(self);
1036
0
    if (input_size == 0 || n == 1) {
1037
0
        return 0;
1038
0
    }
1039
1040
0
    if (n < 1) {
1041
0
        list_clear(self);
1042
0
        return 0;
1043
0
    }
1044
1045
0
    if (input_size > PY_SSIZE_T_MAX / n) {
1046
0
        PyErr_NoMemory();
1047
0
        return -1;
1048
0
    }
1049
0
    Py_ssize_t output_size = input_size * n;
1050
1051
0
    if (list_resize(self, output_size) < 0) {
1052
0
        return -1;
1053
0
    }
1054
1055
0
    PyObject **items = self->ob_item;
1056
0
    for (Py_ssize_t j = 0; j < input_size; j++) {
1057
0
        _Py_RefcntAdd(items[j], n-1);
1058
0
    }
1059
    // TODO: _Py_memory_repeat calls are not safe for shared lists in
1060
    // GIL_DISABLED builds. (See issue #129069)
1061
0
    _Py_memory_repeat((char *)items, sizeof(PyObject *)*output_size,
1062
0
                      sizeof(PyObject *)*input_size);
1063
0
    return 0;
1064
0
}
1065
1066
static PyObject *
1067
list_inplace_repeat(PyObject *_self, Py_ssize_t n)
1068
0
{
1069
0
    PyObject *ret;
1070
0
    PyListObject *self = (PyListObject *) _self;
1071
0
    Py_BEGIN_CRITICAL_SECTION(self);
1072
0
    if (list_inplace_repeat_lock_held(self, n) < 0) {
1073
0
        ret = NULL;
1074
0
    }
1075
0
    else {
1076
0
        ret = Py_NewRef(self);
1077
0
    }
1078
0
    Py_END_CRITICAL_SECTION();
1079
0
    return ret;
1080
0
}
1081
1082
static int
1083
list_ass_item_lock_held(PyListObject *a, Py_ssize_t i, PyObject *v)
1084
11.0k
{
1085
11.0k
    if (!valid_index(i, Py_SIZE(a))) {
1086
0
        PyErr_SetString(PyExc_IndexError,
1087
0
                        "list assignment index out of range");
1088
0
        return -1;
1089
0
    }
1090
11.0k
    PyObject *tmp = a->ob_item[i];
1091
11.0k
    if (v == NULL) {
1092
7.57k
        Py_ssize_t size = Py_SIZE(a);
1093
7.57k
        for (Py_ssize_t idx = i; idx < size - 1; idx++) {
1094
0
            FT_ATOMIC_STORE_PTR_RELAXED(a->ob_item[idx], a->ob_item[idx + 1]);
1095
0
        }
1096
7.57k
        Py_SET_SIZE(a, size - 1);
1097
7.57k
    }
1098
3.52k
    else {
1099
3.52k
        FT_ATOMIC_STORE_PTR_RELEASE(a->ob_item[i], Py_NewRef(v));
1100
3.52k
    }
1101
11.0k
    Py_DECREF(tmp);
1102
11.0k
    return 0;
1103
11.0k
}
1104
1105
static int
1106
list_ass_item(PyObject *aa, Py_ssize_t i, PyObject *v)
1107
7.49k
{
1108
7.49k
    int ret;
1109
7.49k
    PyListObject *a = (PyListObject *)aa;
1110
7.49k
    Py_BEGIN_CRITICAL_SECTION(a);
1111
7.49k
    ret = list_ass_item_lock_held(a, i, v);
1112
7.49k
    Py_END_CRITICAL_SECTION();
1113
7.49k
    return ret;
1114
7.49k
}
1115
1116
/*[clinic input]
1117
@critical_section
1118
list.insert
1119
1120
    index: Py_ssize_t
1121
    object: object
1122
    /
1123
1124
Insert object before index.
1125
[clinic start generated code]*/
1126
1127
static PyObject *
1128
list_insert_impl(PyListObject *self, Py_ssize_t index, PyObject *object)
1129
/*[clinic end generated code: output=7f35e32f60c8cb78 input=b1987ca998a4ae2d]*/
1130
60
{
1131
60
    if (ins1(self, index, object) == 0) {
1132
60
        Py_RETURN_NONE;
1133
60
    }
1134
0
    return NULL;
1135
60
}
1136
1137
/*[clinic input]
1138
@critical_section
1139
list.clear as py_list_clear
1140
1141
Remove all items from list.
1142
[clinic start generated code]*/
1143
1144
static PyObject *
1145
py_list_clear_impl(PyListObject *self)
1146
/*[clinic end generated code: output=83726743807e3518 input=e285b7f09051a9ba]*/
1147
170
{
1148
170
    list_clear(self);
1149
170
    Py_RETURN_NONE;
1150
170
}
1151
1152
/*[clinic input]
1153
@critical_section
1154
list.copy
1155
1156
Return a shallow copy of the list.
1157
[clinic start generated code]*/
1158
1159
static PyObject *
1160
list_copy_impl(PyListObject *self)
1161
/*[clinic end generated code: output=ec6b72d6209d418e input=81c54b0c7bb4f73d]*/
1162
0
{
1163
0
    return list_slice_lock_held(self, 0, Py_SIZE(self));
1164
0
}
1165
1166
/*[clinic input]
1167
@critical_section
1168
list.append
1169
1170
     object: object
1171
     /
1172
1173
Append object to the end of the list.
1174
[clinic start generated code]*/
1175
1176
static PyObject *
1177
list_append_impl(PyListObject *self, PyObject *object)
1178
/*[clinic end generated code: output=78423561d92ed405 input=122b0853de54004f]*/
1179
20.5M
{
1180
20.5M
    if (_PyList_AppendTakeRef(self, Py_NewRef(object)) < 0) {
1181
0
        return NULL;
1182
0
    }
1183
20.5M
    Py_RETURN_NONE;
1184
20.5M
}
1185
1186
static int
1187
list_extend_fast(PyListObject *self, PyObject *iterable)
1188
22.1M
{
1189
22.1M
    Py_ssize_t n = PySequence_Fast_GET_SIZE(iterable);
1190
22.1M
    if (n == 0) {
1191
        /* short circuit when iterable is empty */
1192
9.08M
        return 0;
1193
9.08M
    }
1194
1195
13.1M
    Py_ssize_t m = Py_SIZE(self);
1196
    // It should not be possible to allocate a list large enough to cause
1197
    // an overflow on any relevant platform.
1198
13.1M
    assert(m < PY_SSIZE_T_MAX - n);
1199
13.1M
    if (self->ob_item == NULL) {
1200
1.44M
        if (list_preallocate_exact(self, n) < 0) {
1201
0
            return -1;
1202
0
        }
1203
1.44M
        Py_SET_SIZE(self, n);
1204
1.44M
    }
1205
11.6M
    else if (list_resize(self, m + n) < 0) {
1206
0
        return -1;
1207
0
    }
1208
1209
    // note that we may still have self == iterable here for the
1210
    // situation a.extend(a), but the following code works
1211
    // in that case too.  Just make sure to resize self
1212
    // before calling PySequence_Fast_ITEMS.
1213
    //
1214
    // populate the end of self with iterable's items.
1215
13.1M
    PyObject **src = PySequence_Fast_ITEMS(iterable);
1216
13.1M
    PyObject **dest = self->ob_item + m;
1217
42.0M
    for (Py_ssize_t i = 0; i < n; i++) {
1218
28.9M
        PyObject *o = src[i];
1219
28.9M
        FT_ATOMIC_STORE_PTR_RELEASE(dest[i], Py_NewRef(o));
1220
28.9M
    }
1221
13.1M
    return 0;
1222
13.1M
}
1223
1224
static int
1225
list_extend_iter_lock_held(PyListObject *self, PyObject *iterable)
1226
6.14M
{
1227
6.14M
    PyObject *it = PyObject_GetIter(iterable);
1228
6.14M
    if (it == NULL) {
1229
0
        return -1;
1230
0
    }
1231
6.14M
    PyObject *(*iternext)(PyObject *) = *Py_TYPE(it)->tp_iternext;
1232
1233
    /* Guess a result list size. */
1234
6.14M
    Py_ssize_t n = PyObject_LengthHint(iterable, 8);
1235
6.14M
    if (n < 0) {
1236
0
        Py_DECREF(it);
1237
0
        return -1;
1238
0
    }
1239
1240
6.14M
    Py_ssize_t m = Py_SIZE(self);
1241
6.14M
    if (m > PY_SSIZE_T_MAX - n) {
1242
        /* m + n overflowed; on the chance that n lied, and there really
1243
         * is enough room, ignore it.  If n was telling the truth, we'll
1244
         * eventually run out of memory during the loop.
1245
         */
1246
0
    }
1247
6.14M
    else if (self->ob_item == NULL) {
1248
5.79M
        if (n && list_preallocate_exact(self, n) < 0)
1249
0
            goto error;
1250
5.79M
    }
1251
350k
    else {
1252
        /* Make room. */
1253
350k
        if (list_resize(self, m + n) < 0) {
1254
0
            goto error;
1255
0
        }
1256
1257
        /* Make the list sane again. */
1258
350k
        Py_SET_SIZE(self, m);
1259
350k
    }
1260
1261
    /* Run iterator to exhaustion. */
1262
72.8M
    for (;;) {
1263
72.8M
        PyObject *item = iternext(it);
1264
72.8M
        if (item == NULL) {
1265
6.14M
            if (PyErr_Occurred()) {
1266
647
                if (PyErr_ExceptionMatches(PyExc_StopIteration))
1267
0
                    PyErr_Clear();
1268
647
                else
1269
647
                    goto error;
1270
647
            }
1271
6.13M
            break;
1272
6.14M
        }
1273
1274
66.6M
        if (Py_SIZE(self) < self->allocated) {
1275
65.5M
            Py_ssize_t len = Py_SIZE(self);
1276
65.5M
            FT_ATOMIC_STORE_PTR_RELEASE(self->ob_item[len], item);  // steals item ref
1277
65.5M
            Py_SET_SIZE(self, len + 1);
1278
65.5M
        }
1279
1.12M
        else {
1280
1.12M
            if (_PyList_AppendTakeRef(self, item) < 0)
1281
0
                goto error;
1282
1.12M
        }
1283
66.6M
    }
1284
1285
    /* Cut back result list if initial guess was too large. */
1286
6.13M
    if (Py_SIZE(self) < self->allocated) {
1287
4.66M
        if (list_resize(self, Py_SIZE(self)) < 0)
1288
0
            goto error;
1289
4.66M
    }
1290
1291
6.13M
    Py_DECREF(it);
1292
6.13M
    return 0;
1293
1294
647
  error:
1295
647
    Py_DECREF(it);
1296
647
    return -1;
1297
6.13M
}
1298
1299
static int
1300
list_extend_lock_held(PyListObject *self, PyObject *iterable)
1301
22.1M
{
1302
22.1M
    PyObject *seq = PySequence_Fast(iterable, "argument must be iterable");
1303
22.1M
    if (!seq) {
1304
0
        return -1;
1305
0
    }
1306
1307
22.1M
    int res = list_extend_fast(self, seq);
1308
22.1M
    Py_DECREF(seq);
1309
22.1M
    return res;
1310
22.1M
}
1311
1312
static int
1313
list_extend_set(PyListObject *self, PySetObject *other)
1314
20.8k
{
1315
20.8k
    Py_ssize_t m = Py_SIZE(self);
1316
20.8k
    Py_ssize_t n = PySet_GET_SIZE(other);
1317
20.8k
    Py_ssize_t r = m + n;
1318
20.8k
    if (r == 0) {
1319
935
        return 0;
1320
935
    }
1321
19.8k
    if (list_resize(self, r) < 0) {
1322
0
        return -1;
1323
0
    }
1324
1325
19.8k
    assert(self->ob_item != NULL);
1326
    /* populate the end of self with iterable's items */
1327
19.8k
    Py_ssize_t setpos = 0;
1328
19.8k
    Py_hash_t hash;
1329
19.8k
    PyObject *key;
1330
19.8k
    PyObject **dest = self->ob_item + m;
1331
117k
    while (_PySet_NextEntryRef((PyObject *)other, &setpos, &key, &hash)) {
1332
98.0k
        FT_ATOMIC_STORE_PTR_RELEASE(*dest, key);
1333
98.0k
        dest++;
1334
98.0k
    }
1335
19.8k
    Py_SET_SIZE(self, r);
1336
19.8k
    return 0;
1337
19.8k
}
1338
1339
static int
1340
list_extend_dict(PyListObject *self, PyDictObject *dict, int which_item)
1341
373
{
1342
    // which_item: 0 for keys and 1 for values
1343
373
    Py_ssize_t m = Py_SIZE(self);
1344
373
    Py_ssize_t n = PyDict_GET_SIZE(dict);
1345
373
    Py_ssize_t r = m + n;
1346
373
    if (r == 0) {
1347
0
        return 0;
1348
0
    }
1349
373
    if (list_resize(self, r) < 0) {
1350
0
        return -1;
1351
0
    }
1352
1353
373
    assert(self->ob_item != NULL);
1354
373
    PyObject **dest = self->ob_item + m;
1355
373
    Py_ssize_t pos = 0;
1356
373
    PyObject *keyvalue[2];
1357
1.89k
    while (_PyDict_Next((PyObject *)dict, &pos, &keyvalue[0], &keyvalue[1], NULL)) {
1358
1.52k
        PyObject *obj = keyvalue[which_item];
1359
1.52k
        Py_INCREF(obj);
1360
1.52k
        FT_ATOMIC_STORE_PTR_RELEASE(*dest, obj);
1361
1.52k
        dest++;
1362
1.52k
    }
1363
1364
373
    Py_SET_SIZE(self, r);
1365
373
    return 0;
1366
373
}
1367
1368
static int
1369
list_extend_dictitems(PyListObject *self, PyDictObject *dict)
1370
0
{
1371
0
    Py_ssize_t m = Py_SIZE(self);
1372
0
    Py_ssize_t n = PyDict_GET_SIZE(dict);
1373
0
    Py_ssize_t r = m + n;
1374
0
    if (r == 0) {
1375
0
        return 0;
1376
0
    }
1377
0
    if (list_resize(self, r) < 0) {
1378
0
        return -1;
1379
0
    }
1380
1381
0
    assert(self->ob_item != NULL);
1382
0
    PyObject **dest = self->ob_item + m;
1383
0
    Py_ssize_t pos = 0;
1384
0
    Py_ssize_t i = 0;
1385
0
    PyObject *key_value[2];
1386
0
    while (_PyDict_Next((PyObject *)dict, &pos, &key_value[0], &key_value[1], NULL)) {
1387
0
        PyObject *item = PyTuple_FromArray(key_value, 2);
1388
0
        if (item == NULL) {
1389
0
            Py_SET_SIZE(self, m + i);
1390
0
            return -1;
1391
0
        }
1392
0
        FT_ATOMIC_STORE_PTR_RELEASE(*dest, item);
1393
0
        dest++;
1394
0
        i++;
1395
0
    }
1396
1397
0
    Py_SET_SIZE(self, r);
1398
0
    return 0;
1399
0
}
1400
1401
static int
1402
_list_extend(PyListObject *self, PyObject *iterable)
1403
28.3M
{
1404
    // Special case:
1405
    // lists and tuples which can use PySequence_Fast ops
1406
28.3M
    int res = -1;
1407
28.3M
    if ((PyObject *)self == iterable) {
1408
0
        Py_BEGIN_CRITICAL_SECTION(self);
1409
0
        res = list_inplace_repeat_lock_held(self, 2);
1410
0
        Py_END_CRITICAL_SECTION();
1411
0
    }
1412
28.3M
    else if (PyList_CheckExact(iterable)) {
1413
10.5M
        Py_BEGIN_CRITICAL_SECTION2(self, iterable);
1414
10.5M
        res = list_extend_lock_held(self, iterable);
1415
10.5M
        Py_END_CRITICAL_SECTION2();
1416
10.5M
    }
1417
17.8M
    else if (PyTuple_CheckExact(iterable)) {
1418
11.6M
        Py_BEGIN_CRITICAL_SECTION(self);
1419
11.6M
        res = list_extend_lock_held(self, iterable);
1420
11.6M
        Py_END_CRITICAL_SECTION();
1421
11.6M
    }
1422
6.16M
    else if (PyAnySet_CheckExact(iterable)) {
1423
20.8k
        Py_BEGIN_CRITICAL_SECTION2(self, iterable);
1424
20.8k
        res = list_extend_set(self, (PySetObject *)iterable);
1425
20.8k
        Py_END_CRITICAL_SECTION2();
1426
20.8k
    }
1427
6.14M
    else if (PyDict_CheckExact(iterable)) {
1428
371
        Py_BEGIN_CRITICAL_SECTION2(self, iterable);
1429
371
        res = list_extend_dict(self, (PyDictObject *)iterable, 0 /*keys*/);
1430
371
        Py_END_CRITICAL_SECTION2();
1431
371
    }
1432
6.14M
    else if (Py_IS_TYPE(iterable, &PyDictKeys_Type)) {
1433
0
        PyDictObject *dict = ((_PyDictViewObject *)iterable)->dv_dict;
1434
0
        Py_BEGIN_CRITICAL_SECTION2(self, dict);
1435
0
        res = list_extend_dict(self, dict, 0 /*keys*/);
1436
0
        Py_END_CRITICAL_SECTION2();
1437
0
    }
1438
6.14M
    else if (Py_IS_TYPE(iterable, &PyDictValues_Type)) {
1439
2
        PyDictObject *dict = ((_PyDictViewObject *)iterable)->dv_dict;
1440
2
        Py_BEGIN_CRITICAL_SECTION2(self, dict);
1441
2
        res = list_extend_dict(self, dict, 1 /*values*/);
1442
2
        Py_END_CRITICAL_SECTION2();
1443
2
    }
1444
6.14M
    else if (Py_IS_TYPE(iterable, &PyDictItems_Type)) {
1445
0
        PyDictObject *dict = ((_PyDictViewObject *)iterable)->dv_dict;
1446
0
        Py_BEGIN_CRITICAL_SECTION2(self, dict);
1447
0
        res = list_extend_dictitems(self, dict);
1448
0
        Py_END_CRITICAL_SECTION2();
1449
0
    }
1450
6.14M
    else {
1451
6.14M
        Py_BEGIN_CRITICAL_SECTION(self);
1452
6.14M
        res = list_extend_iter_lock_held(self, iterable);
1453
6.14M
        Py_END_CRITICAL_SECTION();
1454
6.14M
    }
1455
28.3M
    return res;
1456
28.3M
}
1457
1458
/*[clinic input]
1459
list.extend as list_extend
1460
1461
     iterable: object
1462
     /
1463
1464
Extend list by appending elements from the iterable.
1465
[clinic start generated code]*/
1466
1467
static PyObject *
1468
list_extend_impl(PyListObject *self, PyObject *iterable)
1469
/*[clinic end generated code: output=b0eba9e0b186d5ce input=979da7597a515791]*/
1470
18.8M
{
1471
18.8M
    if (_list_extend(self, iterable) < 0) {
1472
647
        return NULL;
1473
647
    }
1474
18.8M
    Py_RETURN_NONE;
1475
18.8M
}
1476
1477
PyObject *
1478
_PyList_Extend(PyListObject *self, PyObject *iterable)
1479
17.5M
{
1480
17.5M
    return list_extend((PyObject*)self, iterable);
1481
17.5M
}
1482
1483
int
1484
PyList_Extend(PyObject *self, PyObject *iterable)
1485
0
{
1486
0
    if (!PyList_Check(self)) {
1487
0
        PyErr_BadInternalCall();
1488
0
        return -1;
1489
0
    }
1490
0
    return _list_extend((PyListObject*)self, iterable);
1491
0
}
1492
1493
1494
int
1495
PyList_Clear(PyObject *self)
1496
0
{
1497
0
    if (!PyList_Check(self)) {
1498
0
        PyErr_BadInternalCall();
1499
0
        return -1;
1500
0
    }
1501
0
    Py_BEGIN_CRITICAL_SECTION(self);
1502
0
    list_clear((PyListObject*)self);
1503
0
    Py_END_CRITICAL_SECTION();
1504
0
    return 0;
1505
0
}
1506
1507
1508
static PyObject *
1509
list_inplace_concat(PyObject *_self, PyObject *other)
1510
512
{
1511
512
    PyListObject *self = (PyListObject *)_self;
1512
512
    if (_list_extend(self, other) < 0) {
1513
0
        return NULL;
1514
0
    }
1515
512
    return Py_NewRef(self);
1516
512
}
1517
1518
/*[clinic input]
1519
@critical_section
1520
list.pop
1521
1522
    index: Py_ssize_t = -1
1523
    /
1524
1525
Remove and return item at index (default last).
1526
1527
Raises IndexError if list is empty or index is out of range.
1528
[clinic start generated code]*/
1529
1530
static PyObject *
1531
list_pop_impl(PyListObject *self, Py_ssize_t index)
1532
/*[clinic end generated code: output=6bd69dcb3f17eca8 input=c269141068ae4b8f]*/
1533
34.7M
{
1534
34.7M
    PyObject *v;
1535
34.7M
    int status;
1536
1537
34.7M
    if (Py_SIZE(self) == 0) {
1538
        /* Special-case most common failure cause */
1539
0
        PyErr_SetString(PyExc_IndexError, "pop from empty list");
1540
0
        return NULL;
1541
0
    }
1542
34.7M
    if (index < 0)
1543
16.6M
        index += Py_SIZE(self);
1544
34.7M
    if (!valid_index(index, Py_SIZE(self))) {
1545
0
        PyErr_SetString(PyExc_IndexError, "pop index out of range");
1546
0
        return NULL;
1547
0
    }
1548
1549
34.7M
    PyObject **items = self->ob_item;
1550
34.7M
    v = items[index];
1551
34.7M
    const Py_ssize_t size_after_pop = Py_SIZE(self) - 1;
1552
34.7M
    if (size_after_pop == 0) {
1553
14.5M
        Py_INCREF(v);
1554
14.5M
        list_clear(self);
1555
14.5M
        status = 0;
1556
14.5M
    }
1557
20.2M
    else {
1558
20.2M
        if ((size_after_pop - index) > 0) {
1559
11.2M
            memmove(&items[index], &items[index+1], (size_after_pop - index) * sizeof(PyObject *));
1560
11.2M
        }
1561
20.2M
        status = list_resize(self, size_after_pop);
1562
20.2M
    }
1563
34.7M
    if (status >= 0) {
1564
34.7M
        return v; // and v now owns the reference the list had
1565
34.7M
    }
1566
0
    else {
1567
        // list resize failed, need to restore
1568
0
        memmove(&items[index+1], &items[index], (size_after_pop - index)* sizeof(PyObject *));
1569
0
        items[index] = v;
1570
0
        return NULL;
1571
0
    }
1572
34.7M
}
1573
1574
/* Reverse a slice of a list in place, from lo up to (exclusive) hi. */
1575
static void
1576
reverse_slice(PyObject **lo, PyObject **hi)
1577
103k
{
1578
103k
    assert(lo && hi);
1579
1580
103k
    --hi;
1581
401k
    while (lo < hi) {
1582
298k
        PyObject *t = *lo;
1583
298k
        *lo = *hi;
1584
298k
        *hi = t;
1585
298k
        ++lo;
1586
298k
        --hi;
1587
298k
    }
1588
103k
}
1589
1590
/* Lots of code for an adaptive, stable, natural mergesort.  There are many
1591
 * pieces to this algorithm; read listsort.txt for overviews and details.
1592
 */
1593
1594
/* A sortslice contains a pointer to an array of keys and a pointer to
1595
 * an array of corresponding values.  In other words, keys[i]
1596
 * corresponds with values[i].  If values == NULL, then the keys are
1597
 * also the values.
1598
 *
1599
 * Several convenience routines are provided here, so that keys and
1600
 * values are always moved in sync.
1601
 */
1602
1603
typedef struct {
1604
    PyObject **keys;
1605
    PyObject **values;
1606
} sortslice;
1607
1608
Py_LOCAL_INLINE(void)
1609
sortslice_copy(sortslice *s1, Py_ssize_t i, sortslice *s2, Py_ssize_t j)
1610
32.5k
{
1611
32.5k
    s1->keys[i] = s2->keys[j];
1612
32.5k
    if (s1->values != NULL)
1613
31.4k
        s1->values[i] = s2->values[j];
1614
32.5k
}
1615
1616
Py_LOCAL_INLINE(void)
1617
sortslice_copy_incr(sortslice *dst, sortslice *src)
1618
532k
{
1619
532k
    *dst->keys++ = *src->keys++;
1620
532k
    if (dst->values != NULL)
1621
318k
        *dst->values++ = *src->values++;
1622
532k
}
1623
1624
Py_LOCAL_INLINE(void)
1625
sortslice_copy_decr(sortslice *dst, sortslice *src)
1626
380k
{
1627
380k
    *dst->keys-- = *src->keys--;
1628
380k
    if (dst->values != NULL)
1629
312k
        *dst->values-- = *src->values--;
1630
380k
}
1631
1632
1633
Py_LOCAL_INLINE(void)
1634
sortslice_memcpy(sortslice *s1, Py_ssize_t i, sortslice *s2, Py_ssize_t j,
1635
                 Py_ssize_t n)
1636
200k
{
1637
200k
    memcpy(&s1->keys[i], &s2->keys[j], sizeof(PyObject *) * n);
1638
200k
    if (s1->values != NULL)
1639
165k
        memcpy(&s1->values[i], &s2->values[j], sizeof(PyObject *) * n);
1640
200k
}
1641
1642
Py_LOCAL_INLINE(void)
1643
sortslice_memmove(sortslice *s1, Py_ssize_t i, sortslice *s2, Py_ssize_t j,
1644
                  Py_ssize_t n)
1645
138k
{
1646
138k
    memmove(&s1->keys[i], &s2->keys[j], sizeof(PyObject *) * n);
1647
138k
    if (s1->values != NULL)
1648
112k
        memmove(&s1->values[i], &s2->values[j], sizeof(PyObject *) * n);
1649
138k
}
1650
1651
Py_LOCAL_INLINE(void)
1652
sortslice_advance(sortslice *slice, Py_ssize_t n)
1653
817k
{
1654
817k
    slice->keys += n;
1655
817k
    if (slice->values != NULL)
1656
622k
        slice->values += n;
1657
817k
}
1658
1659
/* Comparison function: ms->key_compare, which is set at run-time in
1660
 * listsort_impl to optimize for various special cases.
1661
 * Returns -1 on error, 1 if x < y, 0 if x >= y.
1662
 */
1663
1664
15.4M
#define ISLT(X, Y) (*(ms->key_compare))(X, Y, ms)
1665
1666
/* Compare X to Y via "<".  Goto "fail" if the comparison raises an
1667
   error.  Else "k" is set to true iff X<Y, and an "if (k)" block is
1668
   started.  It makes more sense in context <wink>.  X and Y are PyObject*s.
1669
*/
1670
14.8M
#define IFLT(X, Y) if ((k = ISLT(X, Y)) < 0) goto fail;  \
1671
14.8M
           if (k)
1672
1673
/* The maximum number of entries in a MergeState's pending-runs stack.
1674
 * For a list with n elements, this needs at most floor(log2(n)) + 1 entries
1675
 * even if we didn't force runs to a minimal length.  So the number of bits
1676
 * in a Py_ssize_t is plenty large enough for all cases.
1677
 */
1678
#define MAX_MERGE_PENDING (SIZEOF_SIZE_T * 8)
1679
1680
/* When we get into galloping mode, we stay there until both runs win less
1681
 * often than MIN_GALLOP consecutive times.  See listsort.txt for more info.
1682
 */
1683
1.09M
#define MIN_GALLOP 7
1684
1685
/* Avoid malloc for small temp arrays. */
1686
2.18M
#define MERGESTATE_TEMP_SIZE 256
1687
1688
/* The largest value of minrun. This must be a power of 2, and >= 1 */
1689
879k
#define MAX_MINRUN 64
1690
#if ((MAX_MINRUN) < 1) || ((MAX_MINRUN) & ((MAX_MINRUN) - 1))
1691
#error "MAX_MINRUN must be a power of 2, and >= 1"
1692
#endif
1693
1694
/* One MergeState exists on the stack per invocation of mergesort.  It's just
1695
 * a convenient way to pass state around among the helper functions.
1696
 */
1697
struct s_slice {
1698
    sortslice base;
1699
    Py_ssize_t len;   /* length of run */
1700
    int power; /* node "level" for powersort merge strategy */
1701
};
1702
1703
typedef struct s_MergeState MergeState;
1704
struct s_MergeState {
1705
    /* This controls when we get *into* galloping mode.  It's initialized
1706
     * to MIN_GALLOP.  merge_lo and merge_hi tend to nudge it higher for
1707
     * random data, and lower for highly structured data.
1708
     */
1709
    Py_ssize_t min_gallop;
1710
1711
    Py_ssize_t listlen;     /* len(input_list) - read only */
1712
    PyObject **basekeys;    /* base address of keys array - read only */
1713
1714
    /* 'a' is temp storage to help with merges.  It contains room for
1715
     * alloced entries.
1716
     */
1717
    sortslice a;        /* may point to temparray below */
1718
    Py_ssize_t alloced;
1719
1720
    /* A stack of n pending runs yet to be merged.  Run #i starts at
1721
     * address base[i] and extends for len[i] elements.  It's always
1722
     * true (so long as the indices are in bounds) that
1723
     *
1724
     *     pending[i].base + pending[i].len == pending[i+1].base
1725
     *
1726
     * so we could cut the storage for this, but it's a minor amount,
1727
     * and keeping all the info explicit simplifies the code.
1728
     */
1729
    int n;
1730
    struct s_slice pending[MAX_MERGE_PENDING];
1731
1732
    /* 'a' points to this when possible, rather than muck with malloc. */
1733
    PyObject *temparray[MERGESTATE_TEMP_SIZE];
1734
1735
    /* This is the function we will use to compare two keys,
1736
     * even when none of our special cases apply and we have to use
1737
     * safe_object_compare. */
1738
    int (*key_compare)(PyObject *, PyObject *, MergeState *);
1739
1740
    /* This function is used by unsafe_object_compare to optimize comparisons
1741
     * when we know our list is type-homogeneous but we can't assume anything else.
1742
     * In the pre-sort check it is set equal to Py_TYPE(key)->tp_richcompare */
1743
    PyObject *(*key_richcompare)(PyObject *, PyObject *, int);
1744
1745
    /* This function is used by unsafe_tuple_compare to compare the first elements
1746
     * of tuples. It may be set to safe_object_compare, but the idea is that hopefully
1747
     * we can assume more, and use one of the special-case compares. */
1748
    int (*tuple_elem_compare)(PyObject *, PyObject *, MergeState *);
1749
1750
    /* Variables used for minrun computation. The "ideal" minrun length is
1751
     * the infinite precision listlen / 2**e. See listsort.txt.
1752
     */
1753
     Py_ssize_t mr_current, mr_e, mr_mask;
1754
};
1755
1756
/* binarysort is the best method for sorting small arrays: it does few
1757
   compares, but can do data movement quadratic in the number of elements.
1758
   ss->keys is viewed as an array of n keys, a[:n]. a[:ok] is already sorted.
1759
   Pass ok = 0 (or 1) if you don't know.
1760
   It's sorted in-place, by a stable binary insertion sort. If ss->values
1761
   isn't NULL, it's permuted in lockstep with ss->keys.
1762
   On entry, must have n >= 1, and 0 <= ok <= n <= MAX_MINRUN.
1763
   Return -1 if comparison raises an exception, else 0.
1764
   Even in case of error, the output slice will be some permutation of
1765
   the input (nothing is lost or duplicated).
1766
*/
1767
static int
1768
binarysort(MergeState *ms, const sortslice *ss, Py_ssize_t n, Py_ssize_t ok)
1769
125k
{
1770
125k
    Py_ssize_t k; /* for IFLT macro expansion */
1771
125k
    PyObject ** const a = ss->keys;
1772
125k
    PyObject ** const v = ss->values;
1773
125k
    const bool has_values = v != NULL;
1774
125k
    PyObject *pivot;
1775
125k
    Py_ssize_t M;
1776
1777
125k
    assert(0 <= ok && ok <= n && 1 <= n && n <= MAX_MINRUN);
1778
    /* assert a[:ok] is sorted */
1779
125k
    if (! ok)
1780
0
        ++ok;
1781
    /* Regular insertion sort has average- and worst-case O(n**2) cost
1782
       for both # of comparisons and number of bytes moved. But its branches
1783
       are highly predictable, and it loves sorted input (n-1 compares and no
1784
       data movement). This is significant in cases like sortperf.py's %sort,
1785
       where an out-of-order element near the start of a run is moved into
1786
       place slowly but then the remaining elements up to length minrun are
1787
       generally at worst one slot away from their correct position (so only
1788
       need 1 or 2 compares to resolve). If comparisons are very fast (such
1789
       as for a list of Python floats), the simple inner loop leaves it
1790
       very competitive with binary insertion, despite that it does
1791
       significantly more compares overall on random data.
1792
1793
       Binary insertion sort has worst, average, and best case O(n log n)
1794
       cost for # of comparisons, but worst and average case O(n**2) cost
1795
       for data movement. The more expensive comparisons, the more important
1796
       the comparison advantage. But its branches are less predictable the
1797
       more "randomish" the data, and that's so significant its worst case
1798
       in real life is random input rather than reverse-ordered (which does
1799
       about twice the data movement that random input does).
1800
1801
       Note that the number of bytes moved doesn't seem to matter. MAX_MINRUN
1802
       of 64 is so small that the key and value pointers all fit in a corner
1803
       of L1 cache, and moving things around in that is very fast. */
1804
#if 0 // ordinary insertion sort.
1805
    PyObject * vpivot = NULL;
1806
    for (; ok < n; ++ok) {
1807
        pivot = a[ok];
1808
        if (has_values)
1809
            vpivot = v[ok];
1810
        for (M = ok - 1; M >= 0; --M) {
1811
            k = ISLT(pivot, a[M]);
1812
            if (k < 0) {
1813
                a[M + 1] = pivot;
1814
                if (has_values)
1815
                    v[M + 1] = vpivot;
1816
                goto fail;
1817
            }
1818
            else if (k) {
1819
                a[M + 1] = a[M];
1820
                if (has_values)
1821
                    v[M + 1] = v[M];
1822
            }
1823
            else
1824
                break;
1825
        }
1826
        a[M + 1] = pivot;
1827
        if (has_values)
1828
            v[M + 1] = vpivot;
1829
    }
1830
#else // binary insertion sort
1831
125k
    Py_ssize_t L, R;
1832
2.26M
    for (; ok < n; ++ok) {
1833
        /* set L to where a[ok] belongs */
1834
2.13M
        L = 0;
1835
2.13M
        R = ok;
1836
2.13M
        pivot = a[ok];
1837
        /* Slice invariants. vacuously true at the start:
1838
         * all a[0:L]  <= pivot
1839
         * all a[L:R]     unknown
1840
         * all a[R:ok]  > pivot
1841
         */
1842
2.13M
        assert(L < R);
1843
9.08M
        do {
1844
            /* don't do silly ;-) things to prevent overflow when finding
1845
               the midpoint; L and R are very far from filling a Py_ssize_t */
1846
9.08M
            M = (L + R) >> 1;
1847
9.08M
#if 1 // straightforward, but highly unpredictable branch on random data
1848
9.08M
            IFLT(pivot, a[M])
1849
3.78M
                R = M;
1850
5.30M
            else
1851
5.30M
                L = M + 1;
1852
#else
1853
            /* Try to get compiler to generate conditional move instructions
1854
               instead. Works fine, but leaving it disabled for now because
1855
               it's not yielding consistently faster sorts. Needs more
1856
               investigation. More computation in the inner loop adds its own
1857
               costs, which can be significant when compares are fast. */
1858
            k = ISLT(pivot, a[M]);
1859
            if (k < 0)
1860
                goto fail;
1861
            Py_ssize_t Mp1 = M + 1;
1862
            R = k ? M : R;
1863
            L = k ? L : Mp1;
1864
#endif
1865
9.08M
        } while (L < R);
1866
2.13M
        assert(L == R);
1867
        /* a[:L] holds all elements from a[:ok] <= pivot now, so pivot belongs
1868
           at index L. Slide a[L:ok] to the right a slot to make room for it.
1869
           Caution: using memmove is much slower under MSVC 5; we're not
1870
           usually moving many slots. Years later: under Visual Studio 2022,
1871
           memmove seems just slightly slower than doing it "by hand". */
1872
15.9M
        for (M = ok; M > L; --M)
1873
13.7M
            a[M] = a[M - 1];
1874
2.13M
        a[L] = pivot;
1875
2.13M
        if (has_values) {
1876
1.58M
            pivot = v[ok];
1877
8.54M
            for (M = ok; M > L; --M)
1878
6.95M
                v[M] = v[M - 1];
1879
1.58M
            v[L] = pivot;
1880
1.58M
        }
1881
2.13M
    }
1882
125k
#endif // pick binary or regular insertion sort
1883
125k
    return 0;
1884
1885
0
 fail:
1886
0
    return -1;
1887
125k
}
1888
1889
static void
1890
sortslice_reverse(sortslice *s, Py_ssize_t n)
1891
62.0k
{
1892
62.0k
    reverse_slice(s->keys, &s->keys[n]);
1893
62.0k
    if (s->values != NULL)
1894
41.1k
        reverse_slice(s->values, &s->values[n]);
1895
62.0k
}
1896
1897
/*
1898
Return the length of the run beginning at slo->keys, spanning no more than
1899
nremaining elements. The run beginning there may be ascending or descending,
1900
but the function permutes it in place, if needed, so that it's always ascending
1901
upon return.
1902
1903
Returns -1 in case of error.
1904
*/
1905
static Py_ssize_t
1906
count_run(MergeState *ms, sortslice *slo, Py_ssize_t nremaining)
1907
270k
{
    /* slo is the slice whose leading run is measured (and, for a descending
     * run, reversed in place); nremaining bounds how many elements may be
     * examined and must be non-zero (asserted below).
     * ms is never named in this body; presumably the IFLT macro expansion
     * refers to it -- confirm at the macro definition.
     */
1908
270k
    Py_ssize_t k; /* used by IFLT macro expansion */
1909
270k
    Py_ssize_t n;
1910
270k
    PyObject ** const lo = slo->keys;
1911
1912
    /* In general, as things go on we've established that the slice starts
1913
       with a monotone run of n elements, starting at lo. */
1914
1915
    /* We're n elements into the slice, and the most recent neq+1 elements are
1916
     * all equal. This reverses them in-place, and resets neq for reuse.
1917
     */
1918
270k
#define REVERSE_LAST_NEQ                        \
1919
270k
    if (neq) {                                  \
1920
6.19k
        sortslice slice = *slo;                 \
1921
6.19k
        ++neq;                                  \
1922
6.19k
        sortslice_advance(&slice, n - neq);     \
1923
6.19k
        sortslice_reverse(&slice, neq);         \
1924
6.19k
        neq = 0;                                \
1925
6.19k
    }
1926
1927
    /* Sticking to only __lt__ compares is confusing and error-prone. But in
1928
     * this routine, almost all uses of IFLT can be captured by tiny macros
1929
     * giving mnemonic names to the intent. Note that inline functions don't
1930
     * work for this (IFLT expands to code including `goto fail`).
1931
     */
1932
270k
#define IF_NEXT_LARGER  IFLT(lo[n-1], lo[n])
1933
3.35M
#define IF_NEXT_SMALLER IFLT(lo[n], lo[n-1])
1934
1935
270k
    assert(nremaining);
1936
    /* try ascending run first */
1937
3.01M
    for (n = 1; n < nremaining; ++n) {
1938
2.90M
        IF_NEXT_SMALLER
1939
161k
            break;
1940
2.90M
    }
    /* The loop ran off the end: the whole slice is one non-descending run. */
1941
270k
    if (n == nremaining)
1942
109k
        return n;
1943
    /* lo[n] is strictly less */
1944
    /* If n is 1 now, then the first compare established it's a descending
1945
     * run, so fall through to the descending case. But if n > 1, there are
1946
     * n elements in an ascending run terminated by the strictly less lo[n].
1947
     * If the first key < lo[n-1], *somewhere* along the way the sequence
1948
     * increased, so we're done (there is no descending run).
1949
     * Else first key >= lo[n-1], which implies that the entire ascending run
1950
     * consists of equal elements. In that case, this is a descending run,
1951
     * and we reverse the all-equal prefix in-place.
1952
     */
1953
161k
    if (n > 1) {
1954
115k
        IFLT(lo[0], lo[n-1])
1955
110k
            return n;
1956
4.93k
        sortslice_reverse(slo, n);
1957
4.93k
    }
1958
50.8k
    ++n; /* in all cases it's been established that lo[n] has been resolved */
1959
1960
    /* Finish descending run. All-equal subruns are reversed in-place on the
1961
     * fly. Their original order will be restored at the end by the whole-slice
1962
     * reversal.
1963
     */
1964
50.8k
    Py_ssize_t neq = 0;
1965
88.1k
    for ( ; n < nremaining; ++n) {
1966
70.6k
        IF_NEXT_SMALLER {
1967
            /* This ends the most recent run of equal elements, but still in
1968
             * the "descending" direction.
1969
             */
1970
14.3k
            REVERSE_LAST_NEQ
1971
14.3k
        }
1972
56.3k
        else {
1973
56.3k
            IF_NEXT_LARGER /* descending run is over */
1974
33.4k
                break;
1975
22.9k
            else /* not x < y and not y < x implies x == y */
1976
22.9k
                ++neq;
1977
56.3k
        }
1978
70.6k
    }
    /* Flush a trailing all-equal subrun that the loop exit left pending. */
1979
50.8k
    REVERSE_LAST_NEQ
1980
50.8k
    sortslice_reverse(slo, n); /* transform to ascending run */
1981
1982
    /* And after reversing, it's possible this can be extended by a
1983
     * naturally increasing suffix; e.g., [3, 2, 3, 4, 1] makes an
1984
     * ascending run from the first 4 elements.
1985
     */
1986
392k
    for ( ; n < nremaining; ++n) {
1987
373k
        IF_NEXT_SMALLER
1988
31.7k
            break;
1989
373k
    }
1990
1991
50.8k
    return n;
    /* Reached only via the `goto fail` hidden inside IFLT expansions. */
1992
0
fail:
1993
0
    return -1;
1994
1995
50.8k
#undef REVERSE_LAST_NEQ
1996
50.8k
#undef IF_NEXT_SMALLER
1997
50.8k
#undef IF_NEXT_LARGER
1998
50.8k
}
1999
2000
/*
2001
Locate the proper position of key in a sorted vector; if the vector contains
2002
an element equal to key, return the position immediately to the left of
2003
the leftmost equal element.  [gallop_right() does the same except returns
2004
the position to the right of the rightmost equal element (if any).]
2005
2006
"a" is a sorted vector with n elements, starting at a[0].  n must be > 0.
2007
2008
"hint" is an index at which to begin the search, 0 <= hint < n.  The closer
2009
hint is to the final result, the faster this runs.
2010
2011
The return value is the int k in 0..n such that
2012
2013
    a[k-1] < key <= a[k]
2014
2015
pretending that *(a-1) is minus infinity and a[n] is plus infinity.  IOW,
2016
key belongs at index k; or, IOW, the first k elements of a should precede
2017
key, and the last n-k should follow key.
2018
2019
Returns -1 on error.  See listsort.txt for info on the method.
2020
*/
2021
static Py_ssize_t
2022
gallop_left(MergeState *ms, PyObject *key, PyObject **a, Py_ssize_t n, Py_ssize_t hint)
2023
193k
{
2024
193k
    Py_ssize_t ofs;
2025
193k
    Py_ssize_t lastofs;
2026
193k
    Py_ssize_t k;
2027
2028
193k
    assert(key && a && n > 0 && hint >= 0 && hint < n);
2029
2030
193k
    a += hint;
2031
193k
    lastofs = 0;
2032
193k
    ofs = 1;
2033
193k
    IFLT(*a, key) {
2034
        /* a[hint] < key -- gallop right, until
2035
         * a[hint + lastofs] < key <= a[hint + ofs]
2036
         */
2037
103k
        const Py_ssize_t maxofs = n - hint;             /* &a[n-1] is highest */
2038
348k
        while (ofs < maxofs) {
2039
275k
            IFLT(a[ofs], key) {
2040
244k
                lastofs = ofs;
2041
244k
                assert(ofs <= (PY_SSIZE_T_MAX - 1) / 2);
2042
244k
                ofs = (ofs << 1) + 1;
2043
244k
            }
2044
30.5k
            else                /* key <= a[hint + ofs] */
2045
30.5k
                break;
2046
275k
        }
2047
103k
        if (ofs > maxofs)
2048
31.6k
            ofs = maxofs;
2049
        /* Translate back to offsets relative to &a[0]. */
2050
103k
        lastofs += hint;
2051
103k
        ofs += hint;
2052
103k
    }
2053
90.0k
    else {
2054
        /* key <= a[hint] -- gallop left, until
2055
         * a[hint - ofs] < key <= a[hint - lastofs]
2056
         */
2057
90.0k
        const Py_ssize_t maxofs = hint + 1;             /* &a[0] is lowest */
2058
303k
        while (ofs < maxofs) {
2059
278k
            IFLT(*(a-ofs), key)
2060
64.2k
                break;
2061
            /* key <= a[hint - ofs] */
2062
213k
            lastofs = ofs;
2063
213k
            assert(ofs <= (PY_SSIZE_T_MAX - 1) / 2);
2064
213k
            ofs = (ofs << 1) + 1;
2065
213k
        }
2066
90.0k
        if (ofs > maxofs)
2067
19.4k
            ofs = maxofs;
2068
        /* Translate back to positive offsets relative to &a[0]. */
2069
90.0k
        k = lastofs;
2070
90.0k
        lastofs = hint - ofs;
2071
90.0k
        ofs = hint - k;
2072
90.0k
    }
2073
193k
    a -= hint;
2074
2075
193k
    assert(-1 <= lastofs && lastofs < ofs && ofs <= n);
2076
    /* Now a[lastofs] < key <= a[ofs], so key belongs somewhere to the
2077
     * right of lastofs but no farther right than ofs.  Do a binary
2078
     * search, with invariant a[lastofs-1] < key <= a[ofs].
2079
     */
2080
193k
    ++lastofs;
2081
587k
    while (lastofs < ofs) {
2082
394k
        Py_ssize_t m = lastofs + ((ofs - lastofs) >> 1);
2083
2084
394k
        IFLT(a[m], key)
2085
204k
            lastofs = m+1;              /* a[m] < key */
2086
189k
        else
2087
189k
            ofs = m;                    /* key <= a[m] */
2088
394k
    }
2089
193k
    assert(lastofs == ofs);             /* so a[ofs-1] < key <= a[ofs] */
2090
193k
    return ofs;
2091
2092
0
fail:
2093
0
    return -1;
2094
193k
}
2095
2096
/*
2097
Exactly like gallop_left(), except that if key already exists in a[0:n],
2098
finds the position immediately to the right of the rightmost equal value.
2099
2100
The return value is the int k in 0..n such that
2101
2102
    a[k-1] <= key < a[k]
2103
2104
or -1 if error.
2105
2106
The code duplication is massive, but this is enough different given that
2107
we're sticking to "<" comparisons that it's much harder to follow if
2108
written as one routine with yet another "left or right?" flag.
2109
*/
2110
static Py_ssize_t
2111
gallop_right(MergeState *ms, PyObject *key, PyObject **a, Py_ssize_t n, Py_ssize_t hint)
2112
215k
{
2113
215k
    Py_ssize_t ofs;
2114
215k
    Py_ssize_t lastofs;
2115
215k
    Py_ssize_t k;
2116
2117
215k
    assert(key && a && n > 0 && hint >= 0 && hint < n);
2118
2119
215k
    a += hint;
2120
215k
    lastofs = 0;
2121
215k
    ofs = 1;
2122
215k
    IFLT(key, *a) {
2123
        /* key < a[hint] -- gallop left, until
2124
         * a[hint - ofs] <= key < a[hint - lastofs]
2125
         */
2126
90.5k
        const Py_ssize_t maxofs = hint + 1;             /* &a[0] is lowest */
2127
224k
        while (ofs < maxofs) {
2128
157k
            IFLT(key, *(a-ofs)) {
2129
134k
                lastofs = ofs;
2130
134k
                assert(ofs <= (PY_SSIZE_T_MAX - 1) / 2);
2131
134k
                ofs = (ofs << 1) + 1;
2132
134k
            }
2133
23.5k
            else                /* a[hint - ofs] <= key */
2134
23.5k
                break;
2135
157k
        }
2136
90.5k
        if (ofs > maxofs)
2137
13.4k
            ofs = maxofs;
2138
        /* Translate back to positive offsets relative to &a[0]. */
2139
90.5k
        k = lastofs;
2140
90.5k
        lastofs = hint - ofs;
2141
90.5k
        ofs = hint - k;
2142
90.5k
    }
2143
124k
    else {
2144
        /* a[hint] <= key -- gallop right, until
2145
         * a[hint + lastofs] <= key < a[hint + ofs]
2146
        */
2147
124k
        const Py_ssize_t maxofs = n - hint;             /* &a[n-1] is highest */
2148
414k
        while (ofs < maxofs) {
2149
358k
            IFLT(key, a[ofs])
2150
69.4k
                break;
2151
            /* a[hint + ofs] <= key */
2152
289k
            lastofs = ofs;
2153
289k
            assert(ofs <= (PY_SSIZE_T_MAX - 1) / 2);
2154
289k
            ofs = (ofs << 1) + 1;
2155
289k
        }
2156
124k
        if (ofs > maxofs)
2157
29.6k
            ofs = maxofs;
2158
        /* Translate back to offsets relative to &a[0]. */
2159
124k
        lastofs += hint;
2160
124k
        ofs += hint;
2161
124k
    }
2162
215k
    a -= hint;
2163
2164
215k
    assert(-1 <= lastofs && lastofs < ofs && ofs <= n);
2165
    /* Now a[lastofs] <= key < a[ofs], so key belongs somewhere to the
2166
     * right of lastofs but no farther right than ofs.  Do a binary
2167
     * search, with invariant a[lastofs-1] <= key < a[ofs].
2168
     */
2169
215k
    ++lastofs;
2170
581k
    while (lastofs < ofs) {
2171
366k
        Py_ssize_t m = lastofs + ((ofs - lastofs) >> 1);
2172
2173
366k
        IFLT(key, a[m])
2174
192k
            ofs = m;                    /* key < a[m] */
2175
174k
        else
2176
174k
            lastofs = m+1;              /* a[m] <= key */
2177
366k
    }
2178
215k
    assert(lastofs == ofs);             /* so a[ofs-1] <= key < a[ofs] */
2179
215k
    return ofs;
2180
2181
0
fail:
2182
0
    return -1;
2183
215k
}
2184
2185
/* Conceptually a MergeState's constructor. */
2186
static void
2187
merge_init(MergeState *ms, Py_ssize_t list_size, int has_keyfunc,
2188
           sortslice *lo)
2189
850k
{
2190
850k
    assert(ms != NULL);
2191
850k
    if (has_keyfunc) {
2192
        /* The temporary space for merging will need at most half the list
2193
         * size rounded up.  Use the minimum possible space so we can use the
2194
         * rest of temparray for other things.  In particular, if there is
2195
         * enough extra space, listsort() will use it to store the keys.
2196
         */
2197
668k
        ms->alloced = (list_size + 1) / 2;
2198
2199
        /* ms->alloced describes how many keys will be stored at
2200
           ms->temparray, but we also need to store the values.  Hence,
2201
           ms->alloced is capped at half of MERGESTATE_TEMP_SIZE. */
2202
668k
        if (MERGESTATE_TEMP_SIZE / 2 < ms->alloced)
2203
2.26k
            ms->alloced = MERGESTATE_TEMP_SIZE / 2;
2204
668k
        ms->a.values = &ms->temparray[ms->alloced];
2205
668k
    }
2206
182k
    else {
2207
182k
        ms->alloced = MERGESTATE_TEMP_SIZE;
2208
182k
        ms->a.values = NULL;
2209
182k
    }
2210
850k
    ms->a.keys = ms->temparray;
2211
850k
    ms->n = 0;
2212
850k
    ms->min_gallop = MIN_GALLOP;
2213
850k
    ms->listlen = list_size;
2214
850k
    ms->basekeys = lo->keys;
2215
2216
    /* State for generating minrun values. See listsort.txt. */
2217
850k
    ms->mr_e = 0;
2218
879k
    while (list_size >> ms->mr_e >= MAX_MINRUN) {
2219
28.4k
        ++ms->mr_e;
2220
28.4k
    }
2221
850k
    ms->mr_mask = (1 << ms->mr_e) - 1;
2222
850k
    ms->mr_current = 0;
2223
850k
}
2224
2225
/* Free all the temp memory owned by the MergeState.  This must be called
2226
 * when you're done with a MergeState, and may be called before then if
2227
 * you want to free the temp memory early.
2228
 */
2229
static void
2230
merge_freemem(MergeState *ms)
2231
855k
{
2232
855k
    assert(ms != NULL);
2233
855k
    if (ms->a.keys != ms->temparray) {
2234
4.75k
        PyMem_Free(ms->a.keys);
2235
4.75k
        ms->a.keys = NULL;
2236
4.75k
    }
2237
855k
}
2238
2239
/* Ensure enough temp memory for 'need' array slots is available.
2240
 * Returns 0 on success and -1 if the memory can't be gotten.
2241
 */
2242
static int
2243
merge_getmem(MergeState *ms, Py_ssize_t need)
2244
4.75k
{
2245
4.75k
    int multiplier;
2246
2247
4.75k
    assert(ms != NULL);
2248
4.75k
    if (need <= ms->alloced)
2249
0
        return 0;
2250
2251
4.75k
    multiplier = ms->a.values != NULL ? 2 : 1;
2252
2253
    /* Don't realloc!  That can cost cycles to copy the old data, but
2254
     * we don't care what's in the block.
2255
     */
2256
4.75k
    merge_freemem(ms);
2257
4.75k
    if ((size_t)need > PY_SSIZE_T_MAX / sizeof(PyObject *) / multiplier) {
2258
0
        PyErr_NoMemory();
2259
0
        return -1;
2260
0
    }
2261
4.75k
    ms->a.keys = (PyObject **)PyMem_Malloc(multiplier * need
2262
4.75k
                                          * sizeof(PyObject *));
2263
4.75k
    if (ms->a.keys != NULL) {
2264
4.75k
        ms->alloced = need;
2265
4.75k
        if (ms->a.values != NULL)
2266
4.22k
            ms->a.values = &ms->a.keys[need];
2267
4.75k
        return 0;
2268
4.75k
    }
2269
0
    PyErr_NoMemory();
2270
0
    return -1;
2271
4.75k
}
2272
71.2k
#define MERGE_GETMEM(MS, NEED) ((NEED) <= (MS)->alloced ? 0 :   \
2273
71.2k
                                merge_getmem(MS, NEED))
2274
2275
/* Merge the na elements starting at ssa with the nb elements starting at
2276
 * ssb.keys = ssa.keys + na in a stable way, in-place.  na and nb must be > 0.
2277
 * Must also have that ssa.keys[na-1] belongs at the end of the merge, and
2278
 * should have na <= nb.  See listsort.txt for more info.  Return 0 if
2279
 * successful, -1 if error.
2280
 */
2281
static Py_ssize_t
2282
merge_lo(MergeState *ms, sortslice ssa, Py_ssize_t na,
2283
         sortslice ssb, Py_ssize_t nb)
2284
45.6k
{
    /* Left-to-right merge.  Run A is first copied into ms->a (temp space),
     * after which `dest` walks forward over A's original slots while `ssa`
     * reads from the temp copy and `ssb` reads B where it lies.
     * na/nb count the elements still unmerged in each run.
     */
2285
45.6k
    Py_ssize_t k;
2286
45.6k
    sortslice dest;
2287
45.6k
    int result = -1;            /* guilty until proved innocent */
2288
45.6k
    Py_ssize_t min_gallop;
2289
2290
45.6k
    assert(ms && ssa.keys && ssb.keys && na > 0 && nb > 0);
2291
45.6k
    assert(ssa.keys + na == ssb.keys);
2292
45.6k
    if (MERGE_GETMEM(ms, na) < 0)
2293
0
        return -1;
2294
45.6k
    sortslice_memcpy(&ms->a, 0, &ssa, 0, na);
2295
45.6k
    dest = ssa;
2296
45.6k
    ssa = ms->a;
2297
    /* The first output element is taken from B unconditionally, before any
     * comparison is made.
     */
2298
45.6k
    sortslice_copy_incr(&dest, &ssb);
2299
45.6k
    --nb;
2300
45.6k
    if (nb == 0)
2301
2.95k
        goto Succeed;
2302
42.6k
    if (na == 1)
2303
6.62k
        goto CopyB;
2304
2305
36.0k
    min_gallop = ms->min_gallop;
2306
53.3k
    for (;;) {
2307
53.3k
        Py_ssize_t acount = 0;          /* # of times A won in a row */
2308
53.3k
        Py_ssize_t bcount = 0;          /* # of times B won in a row */
2309
2310
        /* Do the straightforward thing until (if ever) one run
2311
         * appears to win consistently.
2312
         */
2313
354k
        for (;;) {
2314
354k
            assert(na > 1 && nb > 0);
2315
354k
            k = ISLT(ssb.keys[0], ssa.keys[0]);
2316
354k
            if (k) {
2317
194k
                if (k < 0)
2318
0
                    goto Fail;
2319
194k
                sortslice_copy_incr(&dest, &ssb);
2320
194k
                ++bcount;
2321
194k
                acount = 0;
2322
194k
                --nb;
2323
194k
                if (nb == 0)
2324
3.93k
                    goto Succeed;
2325
191k
                if (bcount >= min_gallop)
2326
26.0k
                    break;
2327
191k
            }
2328
159k
            else {
2329
159k
                sortslice_copy_incr(&dest, &ssa);
2330
159k
                ++acount;
2331
159k
                bcount = 0;
2332
159k
                --na;
2333
159k
                if (na == 1)
2334
2.51k
                    goto CopyB;
2335
157k
                if (acount >= min_gallop)
2336
20.8k
                    break;
2337
157k
            }
2338
354k
        }
2339
2340
        /* One run is winning so consistently that galloping may
2341
         * be a huge win.  So try that, and continue galloping until
2342
         * (if ever) neither run appears to be winning consistently
2343
         * anymore.
2344
         */
        /* The pre-increment here cancels the first decrement inside the
         * do-loop below.
         */
2345
46.8k
        ++min_gallop;
2346
82.7k
        do {
2347
82.7k
            assert(na > 1 && nb > 0);
            /* Decrement min_gallop, but never below 1. */
2348
82.7k
            min_gallop -= min_gallop > 1;
2349
82.7k
            ms->min_gallop = min_gallop;
            /* k = how many leading elements of A precede B's head. */
2350
82.7k
            k = gallop_right(ms, ssb.keys[0], ssa.keys, na, 0);
2351
82.7k
            acount = k;
2352
82.7k
            if (k) {
2353
47.4k
                if (k < 0)
2354
0
                    goto Fail;
2355
47.4k
                sortslice_memcpy(&dest, 0, &ssa, 0, k);
2356
47.4k
                sortslice_advance(&dest, k);
2357
47.4k
                sortslice_advance(&ssa, k);
2358
47.4k
                na -= k;
2359
47.4k
                if (na == 1)
2360
7.44k
                    goto CopyB;
2361
                /* na==0 is impossible now if the comparison
2362
                 * function is consistent, but we can't assume
2363
                 * that it is.
2364
                 */
2365
40.0k
                if (na == 0)
2366
0
                    goto Succeed;
2367
40.0k
            }
2368
75.2k
            sortslice_copy_incr(&dest, &ssb);
2369
75.2k
            --nb;
2370
75.2k
            if (nb == 0)
2371
1.96k
                goto Succeed;
2372
            /* k = how many leading elements of B precede A's head. */
2373
73.3k
            k = gallop_left(ms, ssa.keys[0], ssb.keys, nb, 0);
2374
73.3k
            bcount = k;
2375
73.3k
            if (k) {
2376
67.7k
                if (k < 0)
2377
0
                    goto Fail;
                /* memmove, not memcpy: dest and ssb both lie in the list,
                 * so the ranges may overlap.
                 */
2378
67.7k
                sortslice_memmove(&dest, 0, &ssb, 0, k);
2379
67.7k
                sortslice_advance(&dest, k);
2380
67.7k
                sortslice_advance(&ssb, k);
2381
67.7k
                nb -= k;
2382
67.7k
                if (nb == 0)
2383
16.6k
                    goto Succeed;
2384
67.7k
            }
2385
56.6k
            sortslice_copy_incr(&dest, &ssa);
2386
56.6k
            --na;
2387
56.6k
            if (na == 1)
2388
3.53k
                goto CopyB;
2389
56.6k
        } while (acount >= MIN_GALLOP || bcount >= MIN_GALLOP);
2390
17.2k
        ++min_gallop;           /* penalize it for leaving galloping mode */
2391
17.2k
        ms->min_gallop = min_gallop;
2392
17.2k
    }
2393
25.5k
Succeed:
2394
25.5k
    result = 0;
    /* Success falls through into Fail: on either path whatever is left of
     * the temp copy of A is written back at dest.
     */
2395
25.5k
Fail:
2396
25.5k
    if (na)
2397
25.5k
        sortslice_memcpy(&dest, 0, &ssa, 0, na);
2398
25.5k
    return result;
2399
20.1k
CopyB:
2400
20.1k
    assert(na == 1 && nb > 0);
2401
    /* The last element of ssa belongs at the end of the merge. */
2402
20.1k
    sortslice_memmove(&dest, 0, &ssb, 0, nb);
2403
20.1k
    sortslice_copy(&dest, nb, &ssa, 0);
2404
20.1k
    return 0;
2405
25.5k
}
2406
2407
/* Merge the na elements starting at ssa with the nb elements starting at
2408
 * ssb.keys = ssa.keys + na in a stable way, in-place.  na and nb must be > 0.
2409
 * Must also have that ssa.keys[na-1] belongs at the end of the merge, and
2410
 * should have na >= nb.  See listsort.txt for more info.  Return 0 if
2411
 * successful, -1 if error.
2412
 */
2413
static Py_ssize_t
2414
merge_hi(MergeState *ms, sortslice ssa, Py_ssize_t na,
2415
         sortslice ssb, Py_ssize_t nb)
2416
25.6k
{
    /* Right-to-left merge.  Run B is first copied into ms->a (temp space),
     * after which `dest` walks backward from B's last original slot while
     * `ssa` reads A where it lies and `ssb` reads the temp copy of B.
     * basea/baseb keep the starts of A and of the temp copy of B; the
     * gallop calls below search from those bases.
     * na/nb count the elements still unmerged in each run.
     */
2417
25.6k
    Py_ssize_t k;
2418
25.6k
    sortslice dest, basea, baseb;
2419
25.6k
    int result = -1;            /* guilty until proved innocent */
2420
25.6k
    Py_ssize_t min_gallop;
2421
2422
25.6k
    assert(ms && ssa.keys && ssb.keys && na > 0 && nb > 0);
2423
25.6k
    assert(ssa.keys + na == ssb.keys);
2424
25.6k
    if (MERGE_GETMEM(ms, nb) < 0)
2425
0
        return -1;
2426
25.6k
    dest = ssb;
2427
25.6k
    sortslice_advance(&dest, nb-1);
2428
25.6k
    sortslice_memcpy(&ms->a, 0, &ssb, 0, nb);
2429
25.6k
    basea = ssa;
2430
25.6k
    baseb = ms->a;
    /* Re-aim ssb at the last element of the temp copy of B. */
2431
25.6k
    ssb.keys = ms->a.keys + nb - 1;
2432
25.6k
    if (ssb.values != NULL)
2433
22.1k
        ssb.values = ms->a.values + nb - 1;
    /* ...and ssa at the last element of A. */
2434
25.6k
    sortslice_advance(&ssa, na - 1);
2435
    /* The last output element is taken from A unconditionally, before any
     * comparison is made.
     */
2436
25.6k
    sortslice_copy_decr(&dest, &ssa);
2437
25.6k
    --na;
2438
25.6k
    if (na == 0)
2439
0
        goto Succeed;
2440
25.6k
    if (nb == 1)
2441
749
        goto CopyA;
2442
2443
24.8k
    min_gallop = ms->min_gallop;
2444
36.6k
    for (;;) {
2445
36.6k
        Py_ssize_t acount = 0;          /* # of times A won in a row */
2446
36.6k
        Py_ssize_t bcount = 0;          /* # of times B won in a row */
2447
2448
        /* Do the straightforward thing until (if ever) one run
2449
         * appears to win consistently.
2450
         */
2451
266k
        for (;;) {
2452
266k
            assert(na > 0 && nb > 1);
2453
266k
            k = ISLT(ssb.keys[0], ssa.keys[0]);
2454
266k
            if (k) {
2455
131k
                if (k < 0)
2456
0
                    goto Fail;
2457
131k
                sortslice_copy_decr(&dest, &ssa);
2458
131k
                ++acount;
2459
131k
                bcount = 0;
2460
131k
                --na;
2461
131k
                if (na == 0)
2462
756
                    goto Succeed;
2463
130k
                if (acount >= min_gallop)
2464
17.3k
                    break;
2465
130k
            }
2466
135k
            else {
2467
135k
                sortslice_copy_decr(&dest, &ssb);
2468
135k
                ++bcount;
2469
135k
                acount = 0;
2470
135k
                --nb;
2471
135k
                if (nb == 1)
2472
451
                    goto CopyA;
2473
134k
                if (bcount >= min_gallop)
2474
18.1k
                    break;
2475
134k
            }
2476
266k
        }
2477
2478
        /* One run is winning so consistently that galloping may
2479
         * be a huge win.  So try that, and continue galloping until
2480
         * (if ever) neither run appears to be winning consistently
2481
         * anymore.
2482
         */
        /* The pre-increment here cancels the first decrement inside the
         * do-loop below.
         */
2483
35.4k
        ++min_gallop;
2484
61.2k
        do {
2485
61.2k
            assert(na > 0 && nb > 1);
            /* Decrement min_gallop, but never below 1. */
2486
61.2k
            min_gallop -= min_gallop > 1;
2487
61.2k
            ms->min_gallop = min_gallop;
2488
61.2k
            k = gallop_right(ms, ssb.keys[0], basea.keys, na, na-1);
2489
61.2k
            if (k < 0)
2490
0
                goto Fail;
            /* Convert the insertion index into the number of trailing A
             * elements that follow B's current tail.
             */
2491
61.2k
            k = na - k;
2492
61.2k
            acount = k;
2493
61.2k
            if (k) {
2494
38.2k
                sortslice_advance(&dest, -k);
2495
38.2k
                sortslice_advance(&ssa, -k);
                /* memmove, not memcpy: dest and ssa both lie in the list,
                 * so the ranges may overlap.
                 */
2496
38.2k
                sortslice_memmove(&dest, 1, &ssa, 1, k);
2497
38.2k
                na -= k;
2498
38.2k
                if (na == 0)
2499
11.3k
                    goto Succeed;
2500
38.2k
            }
2501
49.9k
            sortslice_copy_decr(&dest, &ssb);
2502
49.9k
            --nb;
2503
49.9k
            if (nb == 1)
2504
698
                goto CopyA;
2505
2506
49.2k
            k = gallop_left(ms, ssa.keys[0], baseb.keys, nb, nb-1);
2507
49.2k
            if (k < 0)
2508
0
                goto Fail;
            /* Likewise: number of trailing B elements that belong after
             * A's current tail.
             */
2509
49.2k
            k = nb - k;
2510
49.2k
            bcount = k;
2511
49.2k
            if (k) {
2512
43.1k
                sortslice_advance(&dest, -k);
2513
43.1k
                sortslice_advance(&ssb, -k);
2514
43.1k
                sortslice_memcpy(&dest, 1, &ssb, 1, k);
2515
43.1k
                nb -= k;
2516
43.1k
                if (nb == 1)
2517
10.5k
                    goto CopyA;
2518
                /* nb==0 is impossible now if the comparison
2519
                 * function is consistent, but we can't assume
2520
                 * that it is.
2521
                 */
2522
32.5k
                if (nb == 0)
2523
0
                    goto Succeed;
2524
32.5k
            }
2525
38.6k
            sortslice_copy_decr(&dest, &ssa);
2526
38.6k
            --na;
2527
38.6k
            if (na == 0)
2528
1.09k
                goto Succeed;
2529
38.6k
        } while (acount >= MIN_GALLOP || bcount >= MIN_GALLOP);
2530
11.8k
        ++min_gallop;           /* penalize it for leaving galloping mode */
2531
11.8k
        ms->min_gallop = min_gallop;
2532
11.8k
    }
2533
13.1k
Succeed:
2534
13.1k
    result = 0;
    /* Success falls through into Fail: on either path the nb elements
     * still held in the temp copy of B are written back, placed so that
     * they end at dest.
     */
2535
13.1k
Fail:
2536
13.1k
    if (nb)
2537
13.1k
        sortslice_memcpy(&dest, -(nb-1), &baseb, 0, nb);
2538
13.1k
    return result;
2539
12.4k
CopyA:
2540
12.4k
    assert(nb == 1 && na > 0);
2541
    /* The first element of ssb belongs at the front of the merge. */
2542
12.4k
    sortslice_memmove(&dest, 1-na, &ssa, 1-na, na);
2543
12.4k
    sortslice_advance(&dest, -na);
2544
12.4k
    sortslice_advance(&ssa, -na);
2545
12.4k
    sortslice_copy(&dest, 0, &ssb, 0);
2546
12.4k
    return 0;
2547
13.1k
}
2548
2549
/* Merge the two runs at stack indices i and i+1.
2550
 * Returns 0 on success, -1 on error.
2551
 */
2552
static Py_ssize_t
2553
merge_at(MergeState *ms, Py_ssize_t i)
2554
71.2k
{
2555
71.2k
    sortslice ssa, ssb;
2556
71.2k
    Py_ssize_t na, nb;
2557
71.2k
    Py_ssize_t k;
2558
2559
71.2k
    assert(ms != NULL);
2560
71.2k
    assert(ms->n >= 2);
2561
71.2k
    assert(i >= 0);
2562
71.2k
    assert(i == ms->n - 2 || i == ms->n - 3);
2563
2564
71.2k
    ssa = ms->pending[i].base;
2565
71.2k
    na = ms->pending[i].len;
2566
71.2k
    ssb = ms->pending[i+1].base;
2567
71.2k
    nb = ms->pending[i+1].len;
2568
71.2k
    assert(na > 0 && nb > 0);
2569
71.2k
    assert(ssa.keys + na == ssb.keys);
2570
2571
    /* Record the length of the combined runs; if i is the 3rd-last
2572
     * run now, also slide over the last run (which isn't involved
2573
     * in this merge).  The current run i+1 goes away in any case.
2574
     */
2575
71.2k
    ms->pending[i].len = na + nb;
2576
71.2k
    if (i == ms->n - 3)
2577
418
        ms->pending[i+1] = ms->pending[i+2];
2578
71.2k
    --ms->n;
2579
2580
    /* Where does b start in a?  Elements in a before that can be
2581
     * ignored (already in place).
2582
     */
2583
71.2k
    k = gallop_right(ms, *ssb.keys, ssa.keys, na, 0);
2584
71.2k
    if (k < 0)
2585
0
        return -1;
2586
71.2k
    sortslice_advance(&ssa, k);
2587
71.2k
    na -= k;
2588
71.2k
    if (na == 0)
2589
28
        return 0;
2590
2591
    /* Where does a end in b?  Elements in b after that can be
2592
     * ignored (already in place).
2593
     */
2594
71.2k
    nb = gallop_left(ms, ssa.keys[na-1], ssb.keys, nb, nb-1);
2595
71.2k
    if (nb <= 0)
2596
0
        return nb;
2597
2598
    /* Merge what remains of the runs, using a temp array with
2599
     * min(na, nb) elements.
2600
     */
2601
71.2k
    if (na <= nb)
2602
45.6k
        return merge_lo(ms, ssa, na, ssb, nb);
2603
25.6k
    else
2604
25.6k
        return merge_hi(ms, ssa, na, ssb, nb);
2605
71.2k
}
2606
2607
/* Two adjacent runs begin at index s1. The first run has length n1, and
2608
 * the second run (starting at index s1+n1) has length n2. The list has total
2609
 * length n.
2610
 * Compute the "power" of the first run. See listsort.txt for details.
2611
 */
2612
static int
2613
powerloop(Py_ssize_t s1, Py_ssize_t n1, Py_ssize_t n2, Py_ssize_t n)
2614
71.2k
{
2615
71.2k
    int result = 0;
2616
71.2k
    assert(s1 >= 0);
2617
71.2k
    assert(n1 > 0 && n2 > 0);
2618
71.2k
    assert(s1 + n1 + n2 <= n);
2619
    /* midpoints a and b:
2620
     * a = s1 + n1/2
2621
     * b = s1 + n1 + n2/2 = a + (n1 + n2)/2
2622
     *
2623
     * Those may not be integers, though, because of the "/2". So we work with
2624
     * 2*a and 2*b instead, which are necessarily integers. It makes no
2625
     * difference to the outcome, since the bits in the expansion of (2*i)/n
2626
     * are merely shifted one position from those of i/n.
2627
     */
2628
71.2k
    Py_ssize_t a = 2 * s1 + n1;  /* 2*a */
2629
71.2k
    Py_ssize_t b = a + n1 + n2;  /* 2*b */
2630
    /* Emulate a/n and b/n one bit a time, until bits differ. */
2631
285k
    for (;;) {
2632
285k
        ++result;
2633
285k
        if (a >= n) {  /* both quotient bits are 1 */
2634
110k
            assert(b >= a);
2635
110k
            a -= n;
2636
110k
            b -= n;
2637
110k
        }
2638
175k
        else if (b >= n) {  /* a/n bit is 0, b/n bit is 1 */
2639
71.2k
            break;
2640
71.2k
        } /* else both quotient bits are 0 */
2641
285k
        assert(a < b && b < n);
2642
213k
        a <<= 1;
2643
213k
        b <<= 1;
2644
213k
    }
2645
71.2k
    return result;
2646
71.2k
}
2647
2648
/* The next run has been identified, of length n2.
2649
 * If there's already a run on the stack, apply the "powersort" merge strategy:
2650
 * compute the topmost run's "power" (depth in a conceptual binary merge tree)
2651
 * and merge adjacent runs on the stack with greater power. See listsort.txt
2652
 * for more info.
2653
 *
2654
 * It's the caller's responsibility to push the new run on the stack when this
2655
 * returns.
2656
 *
2657
 * Returns 0 on success, -1 on error.
2658
 */
2659
static int
2660
found_new_run(MergeState *ms, Py_ssize_t n2)
2661
270k
{
2662
270k
    assert(ms);
2663
270k
    if (ms->n) {
2664
71.2k
        assert(ms->n > 0);
2665
71.2k
        struct s_slice *p = ms->pending;
2666
71.2k
        Py_ssize_t s1 = p[ms->n - 1].base.keys - ms->basekeys; /* start index */
2667
71.2k
        Py_ssize_t n1 = p[ms->n - 1].len;
2668
71.2k
        int power = powerloop(s1, n1, n2, ms->listlen);
2669
117k
        while (ms->n > 1 && p[ms->n - 2].power > power) {
2670
46.7k
            if (merge_at(ms, ms->n - 2) < 0)
2671
0
                return -1;
2672
46.7k
        }
2673
71.2k
        assert(ms->n < 2 || p[ms->n - 2].power < power);
2674
71.2k
        p[ms->n - 1].power = power;
2675
71.2k
    }
2676
270k
    return 0;
2677
270k
}
2678
2679
/* Regardless of invariants, merge all runs on the stack until only one
2680
 * remains.  This is used at the end of the mergesort.
2681
 *
2682
 * Returns 0 on success, -1 on error.
2683
 */
2684
static int
2685
merge_force_collapse(MergeState *ms)
2686
199k
{
2687
199k
    struct s_slice *p = ms->pending;
2688
2689
199k
    assert(ms);
2690
224k
    while (ms->n > 1) {
2691
24.5k
        Py_ssize_t n = ms->n - 2;
2692
24.5k
        if (n > 0 && p[n-1].len < p[n+1].len)
2693
418
            --n;
2694
24.5k
        if (merge_at(ms, n) < 0)
2695
0
            return -1;
2696
24.5k
    }
2697
199k
    return 0;
2698
199k
}
2699
2700
/* Return the next minrun value to use. See listsort.txt. */
2701
Py_LOCAL_INLINE(Py_ssize_t)
2702
minrun_next(MergeState *ms)
2703
270k
{
2704
270k
    ms->mr_current += ms->listlen;
2705
270k
    assert(ms->mr_current >= 0); /* no overflow */
2706
270k
    Py_ssize_t result = ms->mr_current >> ms->mr_e;
2707
270k
    ms->mr_current &= ms->mr_mask;
2708
270k
    return result;
2709
270k
}
2710
2711
/* Here we define custom comparison functions to optimize for the cases one commonly
2712
 * encounters in practice: homogeneous lists, often of one of the basic types. */
2713
2714
/* This struct holds the comparison function and helper functions
2715
 * selected in the pre-sort check. */
2716
2717
/* These are the special case compare functions.
2718
 * ms->key_compare will always point to one of these: */
2719
2720
/* Heterogeneous compare: default, always safe to fall back on. */
2721
static int
2722
safe_object_compare(PyObject *v, PyObject *w, MergeState *ms)
2723
0
{
2724
    /* No assumptions necessary! */
2725
0
    return PyObject_RichCompareBool(v, w, Py_LT);
2726
0
}
2727
2728
/* Homogeneous compare: safe for any two comparable objects of the same type.
2729
 * (ms->key_richcompare is set to ob_type->tp_richcompare in the
2730
 *  pre-sort check.)
2731
 */
2732
static int
2733
unsafe_object_compare(PyObject *v, PyObject *w, MergeState *ms)
2734
8.33M
{
2735
8.33M
    PyObject *res_obj; int res;
2736
2737
    /* No assumptions, because we check first: */
2738
8.33M
    if (Py_TYPE(v)->tp_richcompare != ms->key_richcompare)
2739
0
        return PyObject_RichCompareBool(v, w, Py_LT);
2740
2741
8.33M
    assert(ms->key_richcompare != NULL);
2742
8.33M
    res_obj = (*(ms->key_richcompare))(v, w, Py_LT);
2743
2744
8.33M
    if (res_obj == Py_NotImplemented) {
2745
0
        Py_DECREF(res_obj);
2746
0
        return PyObject_RichCompareBool(v, w, Py_LT);
2747
0
    }
2748
8.33M
    if (res_obj == NULL)
2749
0
        return -1;
2750
2751
8.33M
    if (PyBool_Check(res_obj)) {
2752
8.33M
        res = (res_obj == Py_True);
2753
8.33M
    }
2754
0
    else {
2755
0
        res = PyObject_IsTrue(res_obj);
2756
0
    }
2757
8.33M
    Py_DECREF(res_obj);
2758
2759
    /* Note that we can't assert
2760
     *     res == PyObject_RichCompareBool(v, w, Py_LT);
2761
     * because of evil compare functions like this:
2762
     *     lambda a, b:  int(random.random() * 3) - 1)
2763
     * (which is actually in test_sort.py) */
2764
8.33M
    return res;
2765
8.33M
}
2766
2767
/* Latin string compare: safe for any two latin (one byte per char) strings. */
2768
static int
2769
unsafe_latin_compare(PyObject *v, PyObject *w, MergeState *ms)
2770
345k
{
2771
345k
    Py_ssize_t len;
2772
345k
    int res;
2773
2774
    /* Modified from Objects/unicodeobject.c:unicode_compare, assuming: */
2775
345k
    assert(Py_IS_TYPE(v, &PyUnicode_Type));
2776
345k
    assert(Py_IS_TYPE(w, &PyUnicode_Type));
2777
345k
    assert(PyUnicode_KIND(v) == PyUnicode_KIND(w));
2778
345k
    assert(PyUnicode_KIND(v) == PyUnicode_1BYTE_KIND);
2779
2780
345k
    len = Py_MIN(PyUnicode_GET_LENGTH(v), PyUnicode_GET_LENGTH(w));
2781
345k
    res = memcmp(PyUnicode_DATA(v), PyUnicode_DATA(w), len);
2782
2783
345k
    res = (res != 0 ?
2784
338k
           res < 0 :
2785
345k
           PyUnicode_GET_LENGTH(v) < PyUnicode_GET_LENGTH(w));
2786
2787
345k
    assert(res == PyObject_RichCompareBool(v, w, Py_LT));;
2788
345k
    return res;
2789
345k
}
2790
2791
/* Bounded int compare: compare any two longs that fit in a single machine word. */
2792
static int
2793
unsafe_long_compare(PyObject *v, PyObject *w, MergeState *ms)
2794
6.79M
{
2795
6.79M
    PyLongObject *vl, *wl;
2796
6.79M
    intptr_t v0, w0;
2797
6.79M
    int res;
2798
2799
    /* Modified from Objects/longobject.c:long_compare, assuming: */
2800
6.79M
    assert(Py_IS_TYPE(v, &PyLong_Type));
2801
6.79M
    assert(Py_IS_TYPE(w, &PyLong_Type));
2802
6.79M
    assert(_PyLong_IsCompact((PyLongObject *)v));
2803
6.79M
    assert(_PyLong_IsCompact((PyLongObject *)w));
2804
2805
6.79M
    vl = (PyLongObject*)v;
2806
6.79M
    wl = (PyLongObject*)w;
2807
2808
6.79M
    v0 = _PyLong_CompactValue(vl);
2809
6.79M
    w0 = _PyLong_CompactValue(wl);
2810
2811
6.79M
    res = v0 < w0;
2812
6.79M
    assert(res == PyObject_RichCompareBool(v, w, Py_LT));
2813
6.79M
    return res;
2814
6.79M
}
2815
2816
/* Float compare: compare any two floats. */
2817
static int
2818
unsafe_float_compare(PyObject *v, PyObject *w, MergeState *ms)
2819
0
{
2820
0
    int res;
2821
2822
    /* Modified from Objects/floatobject.c:float_richcompare, assuming: */
2823
0
    assert(Py_IS_TYPE(v, &PyFloat_Type));
2824
0
    assert(Py_IS_TYPE(w, &PyFloat_Type));
2825
2826
0
    res = PyFloat_AS_DOUBLE(v) < PyFloat_AS_DOUBLE(w);
2827
0
    assert(res == PyObject_RichCompareBool(v, w, Py_LT));
2828
0
    return res;
2829
0
}
2830
2831
/* Tuple compare: compare *any* two tuples, using
2832
 * ms->tuple_elem_compare to compare the first elements, which is set
2833
 * using the same pre-sort check as we use for ms->key_compare,
2834
 * but run on the list [x[0] for x in L]. This allows us to optimize compares
2835
 * on two levels (as long as [x[0] for x in L] is type-homogeneous.) The idea is
2836
 * that most tuple compares don't involve x[1:]. */
2837
static int
2838
unsafe_tuple_compare(PyObject *v, PyObject *w, MergeState *ms)
2839
1.27k
{
2840
1.27k
    PyTupleObject *vt, *wt;
2841
1.27k
    Py_ssize_t i, vlen, wlen;
2842
1.27k
    int k;
2843
2844
    /* Modified from Objects/tupleobject.c:tuplerichcompare, assuming: */
2845
1.27k
    assert(Py_IS_TYPE(v, &PyTuple_Type));
2846
1.27k
    assert(Py_IS_TYPE(w, &PyTuple_Type));
2847
1.27k
    assert(Py_SIZE(v) > 0);
2848
1.27k
    assert(Py_SIZE(w) > 0);
2849
2850
1.27k
    vt = (PyTupleObject *)v;
2851
1.27k
    wt = (PyTupleObject *)w;
2852
2853
1.27k
    vlen = Py_SIZE(vt);
2854
1.27k
    wlen = Py_SIZE(wt);
2855
2856
1.28k
    for (i = 0; i < vlen && i < wlen; i++) {
2857
1.28k
        k = PyObject_RichCompareBool(vt->ob_item[i], wt->ob_item[i], Py_EQ);
2858
1.28k
        if (k < 0)
2859
0
            return -1;
2860
1.28k
        if (!k)
2861
1.27k
            break;
2862
1.28k
    }
2863
2864
1.27k
    if (i >= vlen || i >= wlen)
2865
0
        return vlen < wlen;
2866
2867
1.27k
    if (i == 0)
2868
1.26k
        return ms->tuple_elem_compare(vt->ob_item[i], wt->ob_item[i], ms);
2869
12
    else
2870
12
        return PyObject_RichCompareBool(vt->ob_item[i], wt->ob_item[i], Py_LT);
2871
1.27k
}
2872
2873
/* An adaptive, stable, natural mergesort.  See listsort.txt.
2874
 * Returns Py_None on success, NULL on error.  Even in case of error, the
2875
 * list will be some permutation of its input state (nothing is lost or
2876
 * duplicated).
2877
 */
2878
/*[clinic input]
2879
@permit_long_docstring_body
2880
@critical_section
2881
list.sort
2882
2883
    *
2884
    key as keyfunc: object = None
2885
    reverse: bool = False
2886
2887
Sort the list in ascending order and return None.
2888
2889
The sort is in-place (i.e. the list itself is modified) and stable (i.e. the
2890
order of two equal elements is maintained).
2891
2892
If a key function is given, apply it once to each list item and sort them,
2893
ascending or descending, according to their function values.
2894
2895
The reverse flag can be set to sort in descending order.
2896
[clinic start generated code]*/
2897
2898
static PyObject *
2899
list_sort_impl(PyListObject *self, PyObject *keyfunc, int reverse)
2900
/*[clinic end generated code: output=57b9f9c5e23fbe42 input=e4f6b6069181ad7d]*/
2901
850k
{
2902
850k
    MergeState ms;
2903
850k
    Py_ssize_t nremaining;
2904
850k
    Py_ssize_t minrun;
2905
850k
    sortslice lo;
2906
850k
    Py_ssize_t saved_ob_size, saved_allocated;
2907
850k
    PyObject **saved_ob_item;
2908
850k
    PyObject **final_ob_item;
2909
850k
    PyObject *result = NULL;            /* guilty until proved innocent */
2910
850k
    Py_ssize_t i;
2911
850k
    PyObject **keys;
2912
2913
850k
    assert(self != NULL);
2914
850k
    assert(PyList_Check(self));
2915
850k
    if (keyfunc == Py_None)
2916
164k
        keyfunc = NULL;
2917
2918
    /* The list is temporarily made empty, so that mutations performed
2919
     * by comparison functions can't affect the slice of memory we're
2920
     * sorting (allowing mutations during sorting is a core-dump
2921
     * factory, since ob_item may change).
2922
     */
2923
850k
    saved_ob_size = Py_SIZE(self);
2924
850k
    saved_ob_item = self->ob_item;
2925
850k
    saved_allocated = self->allocated;
2926
850k
    Py_SET_SIZE(self, 0);
2927
850k
    FT_ATOMIC_STORE_PTR_RELEASE(self->ob_item, NULL);
2928
850k
    self->allocated = -1; /* any operation will reset it to >= 0 */
2929
2930
850k
    if (keyfunc == NULL) {
2931
182k
        keys = NULL;
2932
182k
        lo.keys = saved_ob_item;
2933
182k
        lo.values = NULL;
2934
182k
    }
2935
668k
    else {
2936
668k
        if (saved_ob_size < MERGESTATE_TEMP_SIZE/2)
2937
            /* Leverage stack space we allocated but won't otherwise use */
2938
663k
            keys = &ms.temparray[saved_ob_size+1];
2939
4.30k
        else {
2940
4.30k
            keys = PyMem_Malloc(sizeof(PyObject *) * saved_ob_size);
2941
4.30k
            if (keys == NULL) {
2942
0
                PyErr_NoMemory();
2943
0
                goto keyfunc_fail;
2944
0
            }
2945
4.30k
        }
2946
2947
5.66M
        for (i = 0; i < saved_ob_size ; i++) {
2948
4.99M
            keys[i] = PyObject_CallOneArg(keyfunc, saved_ob_item[i]);
2949
4.99M
            if (keys[i] == NULL) {
2950
0
                for (i=i-1 ; i>=0 ; i--)
2951
0
                    Py_DECREF(keys[i]);
2952
0
                if (saved_ob_size >= MERGESTATE_TEMP_SIZE/2)
2953
0
                    PyMem_Free(keys);
2954
0
                goto keyfunc_fail;
2955
0
            }
2956
4.99M
        }
2957
2958
668k
        lo.keys = keys;
2959
668k
        lo.values = saved_ob_item;
2960
668k
    }
2961
2962
2963
    /* The pre-sort check: here's where we decide which compare function to use.
2964
     * How much optimization is safe? We test for homogeneity with respect to
2965
     * several properties that are expensive to check at compare-time, and
2966
     * set ms appropriately. */
2967
850k
    if (saved_ob_size > 1) {
2968
        /* Assume the first element is representative of the whole list. */
2969
199k
        int keys_are_in_tuples = (Py_IS_TYPE(lo.keys[0], &PyTuple_Type) &&
2970
70
                                  Py_SIZE(lo.keys[0]) > 0);
2971
2972
199k
        PyTypeObject* key_type = (keys_are_in_tuples ?
2973
70
                                  Py_TYPE(PyTuple_GET_ITEM(lo.keys[0], 0)) :
2974
199k
                                  Py_TYPE(lo.keys[0]));
2975
2976
199k
        int keys_are_all_same_type = 1;
2977
199k
        int strings_are_latin = 1;
2978
199k
        int ints_are_bounded = 1;
2979
2980
        /* Prove that assumption by checking every key. */
2981
5.78M
        for (i=0; i < saved_ob_size; i++) {
2982
2983
5.58M
            if (keys_are_in_tuples &&
2984
610
                !(Py_IS_TYPE(lo.keys[i], &PyTuple_Type) && Py_SIZE(lo.keys[i]) != 0)) {
2985
0
                keys_are_in_tuples = 0;
2986
0
                keys_are_all_same_type = 0;
2987
0
                break;
2988
0
            }
2989
2990
            /* Note: for lists of tuples, key is the first element of the tuple
2991
             * lo.keys[i], not lo.keys[i] itself! We verify type-homogeneity
2992
             * for lists of tuples in the if-statement directly above. */
2993
5.58M
            PyObject *key = (keys_are_in_tuples ?
2994
610
                             PyTuple_GET_ITEM(lo.keys[i], 0) :
2995
5.58M
                             lo.keys[i]);
2996
2997
5.58M
            if (!Py_IS_TYPE(key, key_type)) {
2998
0
                keys_are_all_same_type = 0;
2999
                /* If keys are in tuple we must loop over the whole list to make
3000
                   sure all items are tuples */
3001
0
                if (!keys_are_in_tuples) {
3002
0
                    break;
3003
0
                }
3004
0
            }
3005
3006
5.58M
            if (keys_are_all_same_type) {
3007
5.58M
                if (key_type == &PyLong_Type &&
3008
4.40M
                    ints_are_bounded &&
3009
2.68M
                    !_PyLong_IsCompact((PyLongObject *)key)) {
3010
3011
6.99k
                    ints_are_bounded = 0;
3012
6.99k
                }
3013
5.57M
                else if (key_type == &PyUnicode_Type &&
3014
195k
                         strings_are_latin &&
3015
122k
                         PyUnicode_KIND(key) != PyUnicode_1BYTE_KIND) {
3016
3017
6.13k
                        strings_are_latin = 0;
3018
6.13k
                    }
3019
5.58M
                }
3020
5.58M
            }
3021
3022
        /* Choose the best compare, given what we now know about the keys. */
3023
199k
        if (keys_are_all_same_type) {
3024
3025
199k
            if (key_type == &PyUnicode_Type && strings_are_latin) {
3026
15.0k
                ms.key_compare = unsafe_latin_compare;
3027
15.0k
            }
3028
184k
            else if (key_type == &PyLong_Type && ints_are_bounded) {
3029
92.4k
                ms.key_compare = unsafe_long_compare;
3030
92.4k
            }
3031
91.9k
            else if (key_type == &PyFloat_Type) {
3032
0
                ms.key_compare = unsafe_float_compare;
3033
0
            }
3034
91.9k
            else if ((ms.key_richcompare = key_type->tp_richcompare) != NULL) {
3035
91.9k
                ms.key_compare = unsafe_object_compare;
3036
91.9k
            }
3037
0
            else {
3038
0
                ms.key_compare = safe_object_compare;
3039
0
            }
3040
199k
        }
3041
0
        else {
3042
0
            ms.key_compare = safe_object_compare;
3043
0
        }
3044
3045
199k
        if (keys_are_in_tuples) {
3046
            /* Make sure we're not dealing with tuples of tuples
3047
             * (remember: here, key_type refers list [key[0] for key in keys]) */
3048
70
            if (key_type == &PyTuple_Type) {
3049
0
                ms.tuple_elem_compare = safe_object_compare;
3050
0
            }
3051
70
            else {
3052
70
                ms.tuple_elem_compare = ms.key_compare;
3053
70
            }
3054
3055
70
            ms.key_compare = unsafe_tuple_compare;
3056
70
        }
3057
199k
    }
3058
    /* End of pre-sort check: ms is now set properly! */
3059
3060
850k
    merge_init(&ms, saved_ob_size, keys != NULL, &lo);
3061
3062
850k
    nremaining = saved_ob_size;
3063
850k
    if (nremaining < 2)
3064
651k
        goto succeed;
3065
3066
    /* Reverse sort stability achieved by initially reversing the list,
3067
    applying a stable forward sort, then reversing the final result. */
3068
199k
    if (reverse) {
3069
2
        if (keys != NULL)
3070
0
            reverse_slice(&keys[0], &keys[saved_ob_size]);
3071
2
        reverse_slice(&saved_ob_item[0], &saved_ob_item[saved_ob_size]);
3072
2
    }
3073
3074
    /* March over the array once, left to right, finding natural runs,
3075
     * and extending short natural runs to minrun elements.
3076
     */
3077
270k
    do {
3078
270k
        Py_ssize_t n;
3079
3080
        /* Identify next run. */
3081
270k
        n = count_run(&ms, &lo, nremaining);
3082
270k
        if (n < 0)
3083
0
            goto fail;
3084
        /* If short, extend to min(minrun, nremaining). */
3085
270k
        minrun = minrun_next(&ms);
3086
270k
        if (n < minrun) {
3087
125k
            const Py_ssize_t force = nremaining <= minrun ?
3088
75.6k
                              nremaining : minrun;
3089
125k
            if (binarysort(&ms, &lo, force, n) < 0)
3090
0
                goto fail;
3091
125k
            n = force;
3092
125k
        }
3093
        /* Maybe merge pending runs. */
3094
270k
        assert(ms.n == 0 || ms.pending[ms.n -1].base.keys +
3095
270k
                            ms.pending[ms.n-1].len == lo.keys);
3096
270k
        if (found_new_run(&ms, n) < 0)
3097
0
            goto fail;
3098
        /* Push new run on stack. */
3099
270k
        assert(ms.n < MAX_MERGE_PENDING);
3100
270k
        ms.pending[ms.n].base = lo;
3101
270k
        ms.pending[ms.n].len = n;
3102
270k
        ++ms.n;
3103
        /* Advance to find next run. */
3104
270k
        sortslice_advance(&lo, n);
3105
270k
        nremaining -= n;
3106
270k
    } while (nremaining);
3107
3108
199k
    if (merge_force_collapse(&ms) < 0)
3109
0
        goto fail;
3110
199k
    assert(ms.n == 1);
3111
199k
    assert(keys == NULL
3112
199k
           ? ms.pending[0].base.keys == saved_ob_item
3113
199k
           : ms.pending[0].base.keys == &keys[0]);
3114
199k
    assert(ms.pending[0].len == saved_ob_size);
3115
199k
    lo = ms.pending[0].base;
3116
3117
850k
succeed:
3118
850k
    result = Py_None;
3119
850k
fail:
3120
850k
    if (keys != NULL) {
3121
5.66M
        for (i = 0; i < saved_ob_size; i++)
3122
4.99M
            Py_DECREF(keys[i]);
3123
668k
        if (saved_ob_size >= MERGESTATE_TEMP_SIZE/2)
3124
4.30k
            PyMem_Free(keys);
3125
668k
    }
3126
3127
850k
    if (self->allocated != -1 && result != NULL) {
3128
        /* The user mucked with the list during the sort,
3129
         * and we don't already have another error to report.
3130
         */
3131
0
        PyErr_SetString(PyExc_ValueError, "list modified during sort");
3132
0
        result = NULL;
3133
0
    }
3134
3135
850k
    if (reverse && saved_ob_size > 1)
3136
2
        reverse_slice(saved_ob_item, saved_ob_item + saved_ob_size);
3137
3138
850k
    merge_freemem(&ms);
3139
3140
850k
keyfunc_fail:
3141
850k
    final_ob_item = self->ob_item;
3142
850k
    i = Py_SIZE(self);
3143
850k
    Py_SET_SIZE(self, saved_ob_size);
3144
850k
    FT_ATOMIC_STORE_PTR_RELEASE(self->ob_item, saved_ob_item);
3145
850k
    FT_ATOMIC_STORE_SSIZE_RELAXED(self->allocated, saved_allocated);
3146
850k
    if (final_ob_item != NULL) {
3147
        /* we cannot use list_clear() for this because it does not
3148
           guarantee that the list is really empty when it returns */
3149
0
        while (--i >= 0) {
3150
0
            Py_XDECREF(final_ob_item[i]);
3151
0
        }
3152
#ifdef Py_GIL_DISABLED
3153
        ensure_shared_on_resize(self);
3154
        bool use_qsbr = _PyObject_GC_IS_SHARED(self);
3155
#else
3156
0
        bool use_qsbr = false;
3157
0
#endif
3158
0
        free_list_items(final_ob_item, use_qsbr);
3159
0
    }
3160
850k
    return Py_XNewRef(result);
3161
850k
}
3162
#undef IFLT
3163
#undef ISLT
3164
3165
int
3166
PyList_Sort(PyObject *v)
3167
18.2k
{
3168
18.2k
    if (v == NULL || !PyList_Check(v)) {
3169
0
        PyErr_BadInternalCall();
3170
0
        return -1;
3171
0
    }
3172
18.2k
    Py_BEGIN_CRITICAL_SECTION(v);
3173
18.2k
    v = list_sort_impl((PyListObject *)v, NULL, 0);
3174
18.2k
    Py_END_CRITICAL_SECTION();
3175
18.2k
    if (v == NULL)
3176
0
        return -1;
3177
18.2k
    Py_DECREF(v);
3178
18.2k
    return 0;
3179
18.2k
}
3180
3181
/*[clinic input]
3182
@critical_section
3183
list.reverse
3184
3185
Reverse *IN PLACE*.
3186
[clinic start generated code]*/
3187
3188
static PyObject *
3189
list_reverse_impl(PyListObject *self)
3190
/*[clinic end generated code: output=482544fc451abea9 input=04ac8e0c6a66e4d9]*/
3191
0
{
3192
0
    if (Py_SIZE(self) > 1)
3193
0
        reverse_slice(self->ob_item, self->ob_item + Py_SIZE(self));
3194
0
    Py_RETURN_NONE;
3195
0
}
3196
3197
int
3198
PyList_Reverse(PyObject *v)
3199
50
{
3200
50
    PyListObject *self = (PyListObject *)v;
3201
3202
50
    if (v == NULL || !PyList_Check(v)) {
3203
0
        PyErr_BadInternalCall();
3204
0
        return -1;
3205
0
    }
3206
50
    Py_BEGIN_CRITICAL_SECTION(self);
3207
50
    if (Py_SIZE(self) > 1) {
3208
50
        reverse_slice(self->ob_item, self->ob_item + Py_SIZE(self));
3209
50
    }
3210
50
    Py_END_CRITICAL_SECTION()
3211
50
    return 0;
3212
50
}
3213
3214
/* Build a tuple from the current items of the list v.
 *
 * Returns the result of PyTuple_FromArray(), or NULL with an exception set
 * (PyErr_BadInternalCall) if v is NULL or not a list.
 */
PyObject *
PyList_AsTuple(PyObject *v)
{
    if (v == NULL || !PyList_Check(v)) {
        PyErr_BadInternalCall();
        return NULL;
    }

    PyListObject *list = (PyListObject *)v;
    PyObject *tuple;
    /* Item array and size are read together inside the critical section. */
    Py_BEGIN_CRITICAL_SECTION(list);
    tuple = PyTuple_FromArray(list->ob_item, Py_SIZE(list));
    Py_END_CRITICAL_SECTION();
    return tuple;
}
3228
3229
PyObject *
3230
_PyList_AsTupleAndClear(PyListObject *self)
3231
26
{
3232
26
    assert(self != NULL);
3233
26
    PyObject *ret;
3234
26
    if (self->ob_item == NULL) {
3235
0
        return PyTuple_New(0);
3236
0
    }
3237
26
    Py_BEGIN_CRITICAL_SECTION(self);
3238
26
    PyObject **items = self->ob_item;
3239
26
    Py_ssize_t size = Py_SIZE(self);
3240
26
    self->ob_item = NULL;
3241
26
    Py_SET_SIZE(self, 0);
3242
26
    ret = _PyTuple_FromArraySteal(items, size);
3243
26
    free_list_items(items, false);
3244
26
    Py_END_CRITICAL_SECTION();
3245
26
    return ret;
3246
26
}
3247
3248
PyObject *
3249
_PyList_FromStackRefStealOnSuccess(const _PyStackRef *src, Py_ssize_t n)
3250
196M
{
3251
196M
    if (n == 0) {
3252
179M
        return PyList_New(0);
3253
179M
    }
3254
3255
16.6M
    PyListObject *list = (PyListObject *)PyList_New(n);
3256
16.6M
    if (list == NULL) {
3257
0
        return NULL;
3258
0
    }
3259
3260
16.6M
    PyObject **dst = list->ob_item;
3261
46.2M
    for (Py_ssize_t i = 0; i < n; i++) {
3262
29.5M
        dst[i] = PyStackRef_AsPyObjectSteal(src[i]);
3263
29.5M
    }
3264
3265
16.6M
    return (PyObject *)list;
3266
16.6M
}
3267
3268
/*[clinic input]
3269
list.index
3270
3271
    value: object
3272
    start: slice_index(accept={int}) = 0
3273
    stop: slice_index(accept={int}, c_default="PY_SSIZE_T_MAX") = sys.maxsize
3274
    /
3275
3276
Return first index of value.
3277
3278
Raises ValueError if the value is not present.
3279
[clinic start generated code]*/
3280
3281
static PyObject *
3282
list_index_impl(PyListObject *self, PyObject *value, Py_ssize_t start,
3283
                Py_ssize_t stop)
3284
/*[clinic end generated code: output=ec51b88787e4e481 input=40ec5826303a0eb1]*/
3285
0
{
3286
0
    if (start < 0) {
3287
0
        start += Py_SIZE(self);
3288
0
        if (start < 0)
3289
0
            start = 0;
3290
0
    }
3291
0
    if (stop < 0) {
3292
0
        stop += Py_SIZE(self);
3293
0
        if (stop < 0)
3294
0
            stop = 0;
3295
0
    }
3296
0
    for (Py_ssize_t i = start; i < stop; i++) {
3297
0
        PyObject *obj = list_get_item_ref(self, i);
3298
0
        if (obj == NULL) {
3299
            // out-of-bounds
3300
0
            break;
3301
0
        }
3302
0
        int cmp = PyObject_RichCompareBool(obj, value, Py_EQ);
3303
0
        Py_DECREF(obj);
3304
0
        if (cmp > 0)
3305
0
            return PyLong_FromSsize_t(i);
3306
0
        else if (cmp < 0)
3307
0
            return NULL;
3308
0
    }
3309
0
    PyErr_SetString(PyExc_ValueError, "list.index(x): x not in list");
3310
0
    return NULL;
3311
0
}
3312
3313
/*[clinic input]
3314
list.count
3315
3316
     value: object
3317
     /
3318
3319
Return number of occurrences of value.
3320
[clinic start generated code]*/
3321
3322
static PyObject *
3323
list_count_impl(PyListObject *self, PyObject *value)
3324
/*[clinic end generated code: output=eff66f14aef2df86 input=3bdc3a5e6f749565]*/
3325
0
{
3326
0
    Py_ssize_t count = 0;
3327
0
    for (Py_ssize_t i = 0; ; i++) {
3328
0
        PyObject *obj = list_get_item_ref(self, i);
3329
0
        if (obj == NULL) {
3330
            // out-of-bounds
3331
0
            break;
3332
0
        }
3333
0
        if (obj == value) {
3334
0
           count++;
3335
0
           Py_DECREF(obj);
3336
0
           continue;
3337
0
        }
3338
0
        int cmp = PyObject_RichCompareBool(obj, value, Py_EQ);
3339
0
        Py_DECREF(obj);
3340
0
        if (cmp > 0)
3341
0
            count++;
3342
0
        else if (cmp < 0)
3343
0
            return NULL;
3344
0
    }
3345
0
    return PyLong_FromSsize_t(count);
3346
0
}
3347
3348
/*[clinic input]
3349
@critical_section
3350
list.remove
3351
3352
     value: object
3353
     /
3354
3355
Remove first occurrence of value.
3356
3357
Raises ValueError if the value is not present.
3358
[clinic start generated code]*/
3359
3360
static PyObject *
3361
list_remove_impl(PyListObject *self, PyObject *value)
3362
/*[clinic end generated code: output=b9b76a6633b18778 input=26c813dbb95aa93b]*/
3363
3.72k
{
3364
3.72k
    Py_ssize_t i;
3365
3366
3.73k
    for (i = 0; i < Py_SIZE(self); i++) {
3367
3.72k
        PyObject *obj = self->ob_item[i];
3368
3.72k
        Py_INCREF(obj);
3369
3.72k
        int cmp = PyObject_RichCompareBool(obj, value, Py_EQ);
3370
3.72k
        Py_DECREF(obj);
3371
3.72k
        if (cmp > 0) {
3372
3.71k
            if (list_ass_slice_lock_held(self, i, i+1, NULL) == 0)
3373
3.71k
                Py_RETURN_NONE;
3374
0
            return NULL;
3375
3.71k
        }
3376
10
        else if (cmp < 0)
3377
0
            return NULL;
3378
3.72k
    }
3379
2
    PyErr_SetString(PyExc_ValueError, "list.remove(x): x not in list");
3380
2
    return NULL;
3381
3.72k
}
3382
3383
static int
3384
list_traverse(PyObject *self, visitproc visit, void *arg)
3385
39.8M
{
3386
39.8M
    PyListObject *o = (PyListObject *)self;
3387
39.8M
    Py_ssize_t i;
3388
3389
97.3M
    for (i = Py_SIZE(o); --i >= 0; )
3390
57.4M
        Py_VISIT(o->ob_item[i]);
3391
39.8M
    return 0;
3392
39.8M
}
3393
3394
/* Rich comparison of two lists.
 *
 * Returns NotImplemented unless both operands are lists.  Otherwise the
 * lists are compared item by item: the first pair of items that is not equal
 * decides the outcome, and if no such pair exists the sizes are compared.
 * Returns NULL with an exception set if an item comparison fails.
 */
static PyObject *
list_richcompare_impl(PyObject *v, PyObject *w, int op)
{
    if (!PyList_Check(v) || !PyList_Check(w)) {
        Py_RETURN_NOTIMPLEMENTED;
    }

    PyListObject *vl = (PyListObject *)v;
    PyListObject *wl = (PyListObject *)w;

    /* Shortcut: if the lengths differ, the lists differ */
    if (Py_SIZE(vl) != Py_SIZE(wl)) {
        if (op == Py_EQ) {
            Py_RETURN_FALSE;
        }
        if (op == Py_NE) {
            Py_RETURN_TRUE;
        }
    }

    /* Search for the first index where items are different.  The sizes are
     * re-read on every pass rather than cached. */
    Py_ssize_t pos = 0;
    while (pos < Py_SIZE(vl) && pos < Py_SIZE(wl)) {
        PyObject *vitem = vl->ob_item[pos];
        PyObject *witem = wl->ob_item[pos];
        if (vitem != witem) {
            /* Keep both items alive across the comparison. */
            Py_INCREF(vitem);
            Py_INCREF(witem);
            int same = PyObject_RichCompareBool(vitem, witem, Py_EQ);
            Py_DECREF(vitem);
            Py_DECREF(witem);
            if (same < 0) {
                return NULL;
            }
            if (same == 0) {
                break;
            }
        }
        pos++;
    }

    if (pos >= Py_SIZE(vl) || pos >= Py_SIZE(wl)) {
        /* No more items to compare -- compare sizes */
        Py_RETURN_RICHCOMPARE(Py_SIZE(vl), Py_SIZE(wl), op);
    }

    /* We have an item that differs -- shortcuts for EQ/NE */
    switch (op) {
    case Py_EQ:
        Py_RETURN_FALSE;
    case Py_NE:
        Py_RETURN_TRUE;
    default:
        break;
    }

    /* Compare the final item again using the proper operator */
    PyObject *vitem = vl->ob_item[pos];
    PyObject *witem = wl->ob_item[pos];
    Py_INCREF(vitem);
    Py_INCREF(witem);
    PyObject *answer = PyObject_RichCompare(vitem, witem, op);
    Py_DECREF(vitem);
    Py_DECREF(witem);
    return answer;
}
3456
3457
/* Rich-comparison entry point for lists: runs list_richcompare_impl() inside
 * a two-object critical section covering both operands and returns its
 * result unchanged. */
static PyObject *
list_richcompare(PyObject *v, PyObject *w, int op)
{
    PyObject *outcome;

    Py_BEGIN_CRITICAL_SECTION2(v, w);
    outcome = list_richcompare_impl(v, w, op);
    Py_END_CRITICAL_SECTION2();
    return outcome;
}
3466
3467
/*[clinic input]
3468
list.__init__
3469
3470
    iterable: object(c_default="NULL") = ()
3471
    /
3472
3473
Built-in mutable sequence.
3474
3475
If no argument is given, the constructor creates a new empty list.
3476
The argument must be an iterable if specified.
3477
[clinic start generated code]*/
3478
3479
static int
3480
list___init___impl(PyListObject *self, PyObject *iterable)
3481
/*[clinic end generated code: output=0f3c21379d01de48 input=b3f3fe7206af8f6b]*/
3482
21.1M
{
    /* (Re)initialise self: clear any existing items, then extend self with
     * the contents of iterable when one was passed (iterable may be NULL).
     * Returns 0 on success and -1 when _list_extend() reports failure. */
3483
    /* Verify list invariants established by PyType_GenericAlloc() */
3484
21.1M
    assert(0 <= Py_SIZE(self));
3485
21.1M
    assert(Py_SIZE(self) <= self->allocated || self->allocated == -1);
3486
21.1M
    assert(self->ob_item != NULL ||
3487
21.1M
           self->allocated == 0 || self->allocated == -1);
3488
3489
    /* Empty previous contents */
3490
21.1M
    if (self->ob_item != NULL) {
3491
0
        /* Only the clear is wrapped in the critical section here. */
        Py_BEGIN_CRITICAL_SECTION(self);
3492
0
        list_clear(self);
3493
0
        Py_END_CRITICAL_SECTION();
3494
0
    }
3495
21.1M
    if (iterable != NULL) {
3496
9.52M
        if (_list_extend(self, iterable) < 0) {
3497
0
            return -1;
3498
0
        }
3499
9.52M
    }
3500
21.1M
    return 0;
3501
21.1M
}
3502
3503
/* Vectorcall entry point for the list type (installed as .tp_vectorcall in
 * PyList_Type).
 *
 * Rejects keyword arguments, accepts zero or one positional argument,
 * allocates the object with PyType_GenericAlloc() and, when an argument was
 * given, fills it through list___init___impl().
 *
 * Returns the new object, or NULL if argument checking, allocation or
 * initialisation fails (the partially built object is released in the last
 * case). */
static PyObject *
3504
list_vectorcall(PyObject *type, PyObject * const*args,
3505
                size_t nargsf, PyObject *kwnames)
3506
9.52M
{
3507
9.52M
    if (!_PyArg_NoKwnames("list", kwnames)) {
3508
0
        return NULL;
3509
0
    }
3510
9.52M
    Py_ssize_t nargs = PyVectorcall_NARGS(nargsf);
3511
9.52M
    if (!_PyArg_CheckPositional("list", nargs, 0, 1)) {
3512
0
        return NULL;
3513
0
    }
3514
3515
9.52M
    PyObject *list = PyType_GenericAlloc(_PyType_CAST(type), 0);
3516
9.52M
    if (list == NULL) {
3517
0
        return NULL;
3518
0
    }
3519
9.52M
    if (nargs) {
3520
9.52M
        /* With no argument the freshly allocated object is returned as is. */
        if (list___init___impl((PyListObject *)list, args[0])) {
3521
0
            Py_DECREF(list);
3522
0
            return NULL;
3523
0
        }
3524
9.52M
    }
3525
9.52M
    return list;
3526
9.52M
}
3527
3528
3529
/*[clinic input]
3530
list.__sizeof__
3531
3532
Return the size of the list in memory, in bytes.
3533
[clinic start generated code]*/
3534
3535
static PyObject *
3536
list___sizeof___impl(PyListObject *self)
3537
/*[clinic end generated code: output=3417541f95f9a53e input=b8030a5d5ce8a187]*/
3538
0
{
    /* Result = _PyObject_SIZE() of the object's type plus one pointer-sized
     * slot per *allocated* entry (self->allocated, not Py_SIZE(self)),
     * returned as a Python int. */
3539
0
    size_t res = _PyObject_SIZE(Py_TYPE(self));
3540
0
    Py_ssize_t allocated = FT_ATOMIC_LOAD_SSIZE_RELAXED(self->allocated);
3541
0
    res += (size_t)allocated * sizeof(void*);
3542
0
    return PyLong_FromSize_t(res);
3543
0
}
3544
3545
static PyObject *list_iter(PyObject *seq);
3546
static PyObject *list_subscript(PyObject*, PyObject*);
3547
3548
/* Method table for list (installed as tp_methods in PyList_Type).
 * "__getitem__" is wired directly to list_subscript with METH_O|METH_COEXIST
 * and "__class_getitem__" to Py_GenericAlias as a class method.  The
 * *_METHODDEF entries are macros defined outside this part of the file
 * (presumably in the included clinic/listobject.c.h -- confirm).  The table
 * ends with a {NULL, NULL} sentinel. */
static PyMethodDef list_methods[] = {
3549
    {"__getitem__", list_subscript, METH_O|METH_COEXIST,
3550
     PyDoc_STR("__getitem__($self, index, /)\n--\n\nReturn self[index].")},
3551
    LIST___REVERSED___METHODDEF
3552
    LIST___SIZEOF___METHODDEF
3553
    PY_LIST_CLEAR_METHODDEF
3554
    LIST_COPY_METHODDEF
3555
    LIST_APPEND_METHODDEF
3556
    LIST_INSERT_METHODDEF
3557
    LIST_EXTEND_METHODDEF
3558
    LIST_POP_METHODDEF
3559
    LIST_REMOVE_METHODDEF
3560
    LIST_INDEX_METHODDEF
3561
    LIST_COUNT_METHODDEF
3562
    LIST_REVERSE_METHODDEF
3563
    LIST_SORT_METHODDEF
3564
    {"__class_getitem__", Py_GenericAlias, METH_O|METH_CLASS, PyDoc_STR("See PEP 585")},
3565
    {NULL,              NULL}           /* sentinel */
3566
};
3567
3568
/* Sequence-protocol slots for list (installed as tp_as_sequence in
 * PyList_Type).  The sq_slice and sq_ass_slice positions are left 0. */
static PySequenceMethods list_as_sequence = {
3569
    list_length,                                /* sq_length */
3570
    list_concat,                                /* sq_concat */
3571
    list_repeat,                                /* sq_repeat */
3572
    list_item,                                  /* sq_item */
3573
    0,                                          /* sq_slice */
3574
    list_ass_item,                              /* sq_ass_item */
3575
    0,                                          /* sq_ass_slice */
3576
    list_contains,                              /* sq_contains */
3577
    list_inplace_concat,                        /* sq_inplace_concat */
3578
    list_inplace_repeat,                        /* sq_inplace_repeat */
3579
};
3580
3581
/* Build a new list holding len items of a, taken at indices start,
 * start + step, start + 2*step, ...  Each copied item gets a new reference.
 *
 * No bounds checking or locking is done here; the only caller in this part
 * of the file (list_slice_wrap) passes indices adjusted by
 * PySlice_AdjustIndices() and calls from inside a critical section on a.
 *
 * Returns the new list, or NULL if list_new_prealloc() fails. */
static inline PyObject *
3582
list_slice_step_lock_held(PyListObject *a, Py_ssize_t start, Py_ssize_t step, Py_ssize_t len)
3583
72
{
3584
72
    PyListObject *np = (PyListObject *)list_new_prealloc(len);
3585
72
    if (np == NULL) {
3586
0
        return NULL;
3587
0
    }
3588
72
    size_t cur;
3589
72
    Py_ssize_t i;
3590
72
    PyObject **src = a->ob_item;
3591
72
    PyObject **dest = np->ob_item;
3592
720
    /* cur is unsigned and step is cast to size_t, so a negative step moves
     * cur backwards through unsigned wraparound. */
    for (cur = start, i = 0; i < len;
3593
648
            cur += (size_t)step, i++) {
3594
648
        PyObject *v = src[cur];
3595
648
        dest[i] = Py_NewRef(v);
3596
648
    }
3597
72
    /* The size is published only after all len slots have been filled. */
    Py_SET_SIZE(np, len);
3598
72
    return (PyObject *)np;
3599
72
}
3600
3601
/* Return a new list for aa[start:stop:step], where start/stop/step are the
 * raw (unadjusted) slice values.
 *
 * Inside a critical section on aa, the indices are adjusted against the
 * current size and one of three paths is taken: an empty result
 * (PyList_New(0)) when the slice length is <= 0, list_slice_lock_held() for
 * step == 1, and list_slice_step_lock_held() otherwise.
 *
 * Returns the helper's result, which is NULL when the helper fails. */
static PyObject *
3602
list_slice_wrap(PyListObject *aa, Py_ssize_t start, Py_ssize_t stop, Py_ssize_t step)
3603
2.95M
{
3604
2.95M
    PyObject *res = NULL;
3605
2.95M
    Py_BEGIN_CRITICAL_SECTION(aa);
3606
2.95M
    Py_ssize_t len = PySlice_AdjustIndices(Py_SIZE(aa), &start, &stop, step);
3607
2.95M
    if (len <= 0) {
3608
495k
        res = PyList_New(0);
3609
495k
    }
3610
2.45M
    else if (step == 1) {
3611
2.45M
        res = list_slice_lock_held(aa, start, stop);
3612
2.45M
    }
3613
72
    else {
3614
72
        res = list_slice_step_lock_held(aa, start, step, len);
3615
72
    }
3616
2.95M
    Py_END_CRITICAL_SECTION();
3617
2.95M
    return res;
3618
2.95M
}
3619
3620
/* Evaluate self[item] where item is a slice object.
 *
 * Both arguments are only checked with assert(); the slice is unpacked with
 * PySlice_Unpack() and the work is delegated to list_slice_wrap().
 * Returns NULL if unpacking fails, otherwise list_slice_wrap()'s result. */
static inline PyObject*
3621
list_slice_subscript(PyObject* self, PyObject* item)
3622
2.95M
{
3623
2.95M
    assert(PyList_Check(self));
3624
2.95M
    assert(PySlice_Check(item));
3625
2.95M
    Py_ssize_t start, stop, step;
3626
2.95M
    if (PySlice_Unpack(item, &start, &stop, &step) < 0) {
3627
0
        return NULL;
3628
0
    }
3629
2.95M
    return list_slice_wrap((PyListObject *)self, start, stop, step);
3630
2.95M
}
3631
3632
/* Non-static wrapper that forwards to list_slice_subscript(); the same
 * preconditions apply (_self is a list, item is a slice -- only asserted
 * there). */
PyObject *
3633
_PyList_SliceSubscript(PyObject* _self, PyObject* item)
3634
2.80M
{
3635
2.80M
    return list_slice_subscript(_self, item);
3636
2.80M
}
3637
3638
/* Implements self[item] (mp_subscript in list_as_mapping and the
 * "__getitem__" entry of list_methods).
 *
 *  - index-like item: converted with PyNumber_AsSsize_t(); a negative index
 *    is offset by the current size, then list_item() does the lookup.
 *  - slice item: delegated to list_slice_subscript().
 *  - anything else: TypeError.
 *
 * Returns the result of the delegate, or NULL with an exception set. */
static PyObject *
3639
list_subscript(PyObject* _self, PyObject* item)
3640
20.0M
{
3641
20.0M
    PyListObject* self = (PyListObject*)_self;
3642
20.0M
    if (_PyIndex_Check(item)) {
3643
19.8M
        Py_ssize_t i;
3644
19.8M
        i = PyNumber_AsSsize_t(item, PyExc_IndexError);
3645
19.8M
        /* -1 is also a valid index, so an error is only recognised when an
         * exception is pending. */
        if (i == -1 && PyErr_Occurred())
3646
0
            return NULL;
3647
19.8M
        if (i < 0)
3648
15.8M
            i += PyList_GET_SIZE(self);
3649
19.8M
        return list_item((PyObject *)self, i);
3650
19.8M
    }
3651
150k
    else if (PySlice_Check(item)) {
3652
150k
        return list_slice_subscript(_self, item);
3653
150k
    }
3654
0
    else {
3655
0
        PyErr_Format(PyExc_TypeError,
3656
0
                     "list indices must be integers or slices, not %.200s",
3657
0
                     Py_TYPE(item)->tp_name);
3658
0
        return NULL;
3659
0
    }
3660
20.0M
}
3661
3662
/* Adjust *start and *stop in place against the current size of lst using
 * PySlice_AdjustIndices(), then collapse an empty range so that
 * *stop == *start.  Returns the slice length computed by
 * PySlice_AdjustIndices(). */
static Py_ssize_t
3663
adjust_slice_indexes(PyListObject *lst,
3664
                     Py_ssize_t *start, Py_ssize_t *stop,
3665
                     Py_ssize_t step)
3666
226k
{
3667
226k
    Py_ssize_t slicelength = PySlice_AdjustIndices(Py_SIZE(lst), start, stop,
3668
226k
                                                   step);
3669
3670
    /* Make sure s[5:2] = [..] inserts at the right place:
3671
        before 5, not before 2. */
3672
226k
    if ((step < 0 && *start < *stop) ||
3673
226k
        (step > 0 && *start > *stop))
3674
0
        *stop = *start;
3675
3676
226k
    return slicelength;
3677
226k
}
3678
3679
/* Implements self[item] = value, and del self[item] when value is NULL.
 * Asserts that _self is locked by the caller.
 *
 *  - index-like item: a negative index is offset by the current size and the
 *    work is done by list_ass_item_lock_held().
 *  - slice with step == 1 (delete or assign): delegated to
 *    list_ass_slice_lock_held().
 *  - extended-slice delete: the removed items are stashed in a temporary
 *    `garbage` array, the surviving items are compacted with memmove(), the
 *    list is shrunk, and only then are the removed items DECREF'ed.
 *  - extended-slice assign: value is turned into a sequence (a copy when
 *    value is self), its length must equal the slice length (ValueError
 *    otherwise), items are swapped in place and the replaced items are
 *    DECREF'ed after all stores are done.
 *  - any other item type: TypeError.
 *
 * Returns 0 on success and -1 on failure; the index, step == 1 and
 * extended-delete paths return the result of list_ass_item_lock_held(),
 * list_ass_slice_lock_held() and list_resize() respectively. */
static int
3680
list_ass_subscript_lock_held(PyObject *_self, PyObject *item, PyObject *value)
3681
230k
{
3682
230k
    _Py_CRITICAL_SECTION_ASSERT_OBJECT_LOCKED(_self);
3683
3684
230k
    PyListObject *self = (PyListObject *)_self;
3685
230k
    if (_PyIndex_Check(item)) {
3686
3.60k
        Py_ssize_t i = PyNumber_AsSsize_t(item, PyExc_IndexError);
3687
3.60k
        if (i == -1 && PyErr_Occurred())
3688
0
            return -1;
3689
3.60k
        if (i < 0)
3690
3.42k
            i += PyList_GET_SIZE(self);
3691
3.60k
        return list_ass_item_lock_held(self, i, value);
3692
3.60k
    }
3693
226k
    else if (PySlice_Check(item)) {
3694
226k
        Py_ssize_t start, stop, step;
3695
3696
226k
        if (PySlice_Unpack(item, &start, &stop, &step) < 0) {
3697
0
            return -1;
3698
0
        }
3699
3700
226k
        if (value == NULL) {
3701
            /* delete slice */
3702
18
            PyObject **garbage;
3703
18
            size_t cur;
3704
18
            Py_ssize_t i;
3705
18
            int res;
3706
3707
18
            Py_ssize_t slicelength = adjust_slice_indexes(self, &start, &stop,
3708
18
                                                          step);
3709
3710
18
            if (step == 1)
3711
18
                return list_ass_slice_lock_held(self, start, stop, value);
3712
3713
0
            if (slicelength <= 0)
3714
0
                return 0;
3715
3716
0
            /* Rewrite a negative-step slice as the equivalent positive-step
             * slice so the loops below only walk forward. */
            if (step < 0) {
3717
0
                stop = start + 1;
3718
0
                start = stop + step*(slicelength - 1) - 1;
3719
0
                step = -step;
3720
0
            }
3721
3722
0
            garbage = (PyObject**)
3723
0
                PyMem_Malloc(slicelength*sizeof(PyObject*));
3724
0
            if (!garbage) {
3725
0
                PyErr_NoMemory();
3726
0
                return -1;
3727
0
            }
3728
3729
            /* drawing pictures might help understand these for
3730
               loops. Basically, we memmove the parts of the
3731
               list that are *not* part of the slice: step-1
3732
               items for each item that is part of the slice,
3733
               and then tail end of the list that was not
3734
               covered by the slice */
3735
0
            for (cur = start, i = 0;
3736
0
                 cur < (size_t)stop;
3737
0
                 cur += step, i++) {
3738
0
                Py_ssize_t lim = step - 1;
3739
3740
0
                garbage[i] = PyList_GET_ITEM(self, cur);
3741
3742
0
                /* Last chunk: only move the items that actually exist. */
                if (cur + step >= (size_t)Py_SIZE(self)) {
3743
0
                    lim = Py_SIZE(self) - cur - 1;
3744
0
                }
3745
3746
0
                memmove(self->ob_item + cur - i,
3747
0
                    self->ob_item + cur + 1,
3748
0
                    lim * sizeof(PyObject *));
3749
0
            }
3750
0
            cur = start + (size_t)slicelength * step;
3751
0
            if (cur < (size_t)Py_SIZE(self)) {
3752
0
                memmove(self->ob_item + cur - slicelength,
3753
0
                    self->ob_item + cur,
3754
0
                    (Py_SIZE(self) - cur) *
3755
0
                     sizeof(PyObject *));
3756
0
            }
3757
3758
0
            Py_SET_SIZE(self, Py_SIZE(self) - slicelength);
3759
0
            res = list_resize(self, Py_SIZE(self));
3760
3761
0
            /* The removed items are released only after the list itself has
             * been compacted and resized. */
            for (i = 0; i < slicelength; i++) {
3762
0
                Py_DECREF(garbage[i]);
3763
0
            }
3764
0
            PyMem_Free(garbage);
3765
3766
0
            return res;
3767
0
        }
3768
226k
        else {
3769
            /* assign slice */
3770
226k
            PyObject *ins, *seq;
3771
226k
            PyObject **garbage, **seqitems, **selfitems;
3772
226k
            Py_ssize_t i;
3773
226k
            size_t cur;
3774
3775
            /* protect against a[::-1] = a */
3776
226k
            if (self == (PyListObject*)value) {
3777
0
                seq = list_slice_lock_held((PyListObject *)value, 0,
3778
0
                                            Py_SIZE(value));
3779
0
            }
3780
226k
            else {
3781
226k
                seq = PySequence_Fast(value,
3782
226k
                                      "must assign iterable "
3783
226k
                                      "to extended slice");
3784
226k
            }
3785
226k
            if (!seq)
3786
0
                return -1;
3787
3788
226k
            /* The indices are adjusted only after seq has been built. */
            Py_ssize_t slicelength = adjust_slice_indexes(self, &start, &stop,
3789
226k
                                                          step);
3790
3791
226k
            if (step == 1) {
3792
226k
                int res = list_ass_slice_lock_held(self, start, stop, seq);
3793
226k
                Py_DECREF(seq);
3794
226k
                return res;
3795
226k
            }
3796
3797
0
            if (PySequence_Fast_GET_SIZE(seq) != slicelength) {
3798
0
                PyErr_Format(PyExc_ValueError,
3799
0
                    "attempt to assign sequence of "
3800
0
                    "size %zd to extended slice of "
3801
0
                    "size %zd",
3802
0
                         PySequence_Fast_GET_SIZE(seq),
3803
0
                         slicelength);
3804
0
                Py_DECREF(seq);
3805
0
                return -1;
3806
0
            }
3807
3808
0
            if (!slicelength) {
3809
0
                Py_DECREF(seq);
3810
0
                return 0;
3811
0
            }
3812
3813
0
            garbage = (PyObject**)
3814
0
                PyMem_Malloc(slicelength*sizeof(PyObject*));
3815
0
            if (!garbage) {
3816
0
                Py_DECREF(seq);
3817
0
                PyErr_NoMemory();
3818
0
                return -1;
3819
0
            }
3820
3821
0
            selfitems = self->ob_item;
3822
0
            seqitems = PySequence_Fast_ITEMS(seq);
3823
0
            for (cur = start, i = 0; i < slicelength;
3824
0
                 cur += (size_t)step, i++) {
3825
0
                garbage[i] = selfitems[cur];
3826
0
                ins = Py_NewRef(seqitems[i]);
3827
0
                selfitems[cur] = ins;
3828
0
            }
3829
3830
0
            /* Old items are released only after every slot has been
             * replaced. */
            for (i = 0; i < slicelength; i++) {
3831
0
                Py_DECREF(garbage[i]);
3832
0
            }
3833
3834
0
            PyMem_Free(garbage);
3835
0
            Py_DECREF(seq);
3836
3837
0
            return 0;
3838
0
        }
3839
226k
    }
3840
0
    else {
3841
0
        PyErr_Format(PyExc_TypeError,
3842
0
                     "list indices must be integers or slices, not %.200s",
3843
0
                     Py_TYPE(item)->tp_name);
3844
0
        return -1;
3845
0
    }
3846
230k
}
3847
3848
/* Locking wrapper around list_ass_subscript_lock_held() (installed as the
 * third slot of list_as_mapping).
 *
 * When Py_GIL_DISABLED is defined and an exact list is being assigned to a
 * slice, both self and value are locked with a two-object critical section;
 * in every other case only self is locked.  Returns the implementation's
 * result unchanged. */
static int
3849
list_ass_subscript(PyObject *self, PyObject *item, PyObject *value)
3850
230k
{
3851
230k
    int res;
3852
#ifdef Py_GIL_DISABLED
3853
    if (PySlice_Check(item) && value != NULL && PyList_CheckExact(value)) {
3854
        Py_BEGIN_CRITICAL_SECTION2(self, value);
3855
        res = list_ass_subscript_lock_held(self, item, value);
3856
        Py_END_CRITICAL_SECTION2();
3857
        return res;
3858
    }
3859
#endif
3860
230k
    Py_BEGIN_CRITICAL_SECTION(self);
3861
230k
    res = list_ass_subscript_lock_held(self, item, value);
3862
230k
    Py_END_CRITICAL_SECTION();
3863
230k
    return res;
3864
230k
}
3865
3866
/* Mapping-protocol slots for list (installed as tp_as_mapping in
 * PyList_Type): length, subscript and subscript assignment/deletion, in
 * that order. */
static PyMappingMethods list_as_mapping = {
3867
    list_length,
3868
    list_subscript,
3869
    list_ass_subscript
3870
};
3871
3872
/* Type object for list.  The slots are filled positionally (each labelled by
 * its trailing comment); tp_vectorcall and tp_version_tag are set with
 * designated initialisers at the end.  The three unlabelled entries after
 * the head are the type name, the basic size and a 0 item size. */
PyTypeObject PyList_Type = {
3873
    PyVarObject_HEAD_INIT(&PyType_Type, 0)
3874
    "list",
3875
    sizeof(PyListObject),
3876
    0,
3877
    list_dealloc,                               /* tp_dealloc */
3878
    0,                                          /* tp_vectorcall_offset */
3879
    0,                                          /* tp_getattr */
3880
    0,                                          /* tp_setattr */
3881
    0,                                          /* tp_as_async */
3882
    list_repr,                                  /* tp_repr */
3883
    0,                                          /* tp_as_number */
3884
    &list_as_sequence,                          /* tp_as_sequence */
3885
    &list_as_mapping,                           /* tp_as_mapping */
3886
    PyObject_HashNotImplemented,                /* tp_hash */
3887
    0,                                          /* tp_call */
3888
    0,                                          /* tp_str */
3889
    PyObject_GenericGetAttr,                    /* tp_getattro */
3890
    0,                                          /* tp_setattro */
3891
    0,                                          /* tp_as_buffer */
3892
    Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC |
3893
        Py_TPFLAGS_BASETYPE | Py_TPFLAGS_LIST_SUBCLASS |
3894
        _Py_TPFLAGS_MATCH_SELF | Py_TPFLAGS_SEQUENCE,  /* tp_flags */
3895
    list___init____doc__,                       /* tp_doc */
3896
    list_traverse,                              /* tp_traverse */
3897
    list_clear_slot,                            /* tp_clear */
3898
    list_richcompare,                           /* tp_richcompare */
3899
    0,                                          /* tp_weaklistoffset */
3900
    list_iter,                                  /* tp_iter */
3901
    0,                                          /* tp_iternext */
3902
    list_methods,                               /* tp_methods */
3903
    0,                                          /* tp_members */
3904
    0,                                          /* tp_getset */
3905
    0,                                          /* tp_base */
3906
    0,                                          /* tp_dict */
3907
    0,                                          /* tp_descr_get */
3908
    0,                                          /* tp_descr_set */
3909
    0,                                          /* tp_dictoffset */
3910
    list___init__,                              /* tp_init */
3911
    PyType_GenericAlloc,                        /* tp_alloc */
3912
    PyType_GenericNew,                          /* tp_new */
3913
    PyObject_GC_Del,                            /* tp_free */
3914
    .tp_vectorcall = list_vectorcall,
3915
    .tp_version_tag = _Py_TYPE_VERSION_LIST,
3916
};
3917
3918
/*********************** List Iterator **************************/
3919
3920
static void listiter_dealloc(PyObject *);
3921
static int listiter_traverse(PyObject *, visitproc, void *);
3922
static PyObject *listiter_next(PyObject *);
3923
static PyObject *listiter_len(PyObject *, PyObject *);
3924
static PyObject *listiter_reduce_general(void *_it, int forward);
3925
static PyObject *listiter_reduce(PyObject *, PyObject *);
3926
static PyObject *listiter_setstate(PyObject *, PyObject *state);
3927
3928
/* Docstrings shared by the method tables of the forward and the reverse
 * list iterators (listiter_methods and listreviter_methods). */
PyDoc_STRVAR(length_hint_doc, "Private method returning an estimate of len(list(it)).");
3929
PyDoc_STRVAR(reduce_doc, "Return state information for pickling.");
3930
PyDoc_STRVAR(setstate_doc, "Set state information for unpickling.");
3931
3932
/* Method table of the forward list iterator (tp_methods of
 * PyListIter_Type): length hint plus the pickling pair
 * __reduce__/__setstate__. */
static PyMethodDef listiter_methods[] = {
3933
    {"__length_hint__", listiter_len, METH_NOARGS, length_hint_doc},
3934
    {"__reduce__", listiter_reduce, METH_NOARGS, reduce_doc},
3935
    {"__setstate__", listiter_setstate, METH_O, setstate_doc},
3936
    {NULL,              NULL}           /* sentinel */
3937
};
3938
3939
/* Type object of the forward list iterator ("list_iterator").  It is
 * GC-enabled, iterates as itself (PyObject_SelfIter) and produces items via
 * listiter_next.  Slots after tp_members are left to default
 * zero-initialisation. */
PyTypeObject PyListIter_Type = {
3940
    PyVarObject_HEAD_INIT(&PyType_Type, 0)
3941
    "list_iterator",                            /* tp_name */
3942
    sizeof(_PyListIterObject),                  /* tp_basicsize */
3943
    0,                                          /* tp_itemsize */
3944
    /* methods */
3945
    listiter_dealloc,               /* tp_dealloc */
3946
    0,                                          /* tp_vectorcall_offset */
3947
    0,                                          /* tp_getattr */
3948
    0,                                          /* tp_setattr */
3949
    0,                                          /* tp_as_async */
3950
    0,                                          /* tp_repr */
3951
    0,                                          /* tp_as_number */
3952
    0,                                          /* tp_as_sequence */
3953
    0,                                          /* tp_as_mapping */
3954
    0,                                          /* tp_hash */
3955
    0,                                          /* tp_call */
3956
    0,                                          /* tp_str */
3957
    PyObject_GenericGetAttr,                    /* tp_getattro */
3958
    0,                                          /* tp_setattro */
3959
    0,                                          /* tp_as_buffer */
3960
    Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC,/* tp_flags */
3961
    0,                                          /* tp_doc */
3962
    listiter_traverse,                          /* tp_traverse */
3963
    0,                                          /* tp_clear */
3964
    0,                                          /* tp_richcompare */
3965
    0,                                          /* tp_weaklistoffset */
3966
    PyObject_SelfIter,                          /* tp_iter */
3967
    listiter_next,                              /* tp_iternext */
3968
    listiter_methods,                           /* tp_methods */
3969
    0,                                          /* tp_members */
3970
};
3971
3972
3973
/* tp_iter for list: create a forward iterator over seq.
 *
 * Fails with PyErr_BadInternalCall() when seq is not a list.  The iterator
 * object is taken from the list_iters freelist when one is available and
 * freshly allocated with PyObject_GC_New() otherwise.  It starts at index 0,
 * holds a new reference to seq and is GC-tracked before being returned.
 * Returns NULL on failure. */
static PyObject *
3974
list_iter(PyObject *seq)
3975
32.2M
{
3976
32.2M
    if (!PyList_Check(seq)) {
3977
0
        PyErr_BadInternalCall();
3978
0
        return NULL;
3979
0
    }
3980
32.2M
    _PyListIterObject *it = _Py_FREELIST_POP(_PyListIterObject, list_iters);
3981
32.2M
    if (it == NULL) {
3982
2.23M
        it = PyObject_GC_New(_PyListIterObject, &PyListIter_Type);
3983
2.23M
        if (it == NULL) {
3984
0
            return NULL;
3985
0
        }
3986
2.23M
    }
3987
32.2M
    it->it_index = 0;
3988
32.2M
    it->it_seq = (PyListObject *)Py_NewRef(seq);
3989
32.2M
    _PyObject_GC_TRACK(it);
3990
32.2M
    return (PyObject *)it;
3991
32.2M
}
3992
3993
/* tp_dealloc for list_iterator: untrack from the GC, release the reference
 * to the underlying list (it_seq may already be NULL, hence Py_XDECREF) and
 * hand the object to the list_iters freelist, with PyObject_GC_Del passed as
 * the function for actually freeing it. */
static void
3994
listiter_dealloc(PyObject *self)
3995
32.2M
{
3996
32.2M
    _PyListIterObject *it = (_PyListIterObject *)self;
3997
32.2M
    _PyObject_GC_UNTRACK(it);
3998
32.2M
    Py_XDECREF(it->it_seq);
3999
32.2M
    assert(Py_IS_TYPE(self, &PyListIter_Type));
4000
32.2M
    _Py_FREELIST_FREE(list_iters, it, PyObject_GC_Del);
4001
32.2M
}
4002
4003
/* tp_traverse for list_iterator: the only object reference the iterator
 * holds is it_seq, so that is the only thing visited. */
static int
4004
listiter_traverse(PyObject *it, visitproc visit, void *arg)
4005
576k
{
4006
576k
    Py_VISIT(((_PyListIterObject *)it)->it_seq);
4007
576k
    return 0;
4008
576k
}
4009
4010
/* tp_iternext for list_iterator.
 *
 * A negative it_index marks an exhausted iterator and yields NULL right
 * away.  Otherwise the item at it_index is fetched with
 * list_get_item_ref(); on success the index is advanced by one and the item
 * is returned.  A NULL item is treated as out-of-bounds: it_index is set to
 * -1 and, in builds without Py_GIL_DISABLED, the reference to the list is
 * dropped and it_seq cleared.  This function sets no exception itself. */
static PyObject *
4011
listiter_next(PyObject *self)
4012
140M
{
4013
140M
    _PyListIterObject *it = (_PyListIterObject *)self;
4014
140M
    Py_ssize_t index = FT_ATOMIC_LOAD_SSIZE_RELAXED(it->it_index);
4015
140M
    if (index < 0) {
4016
166
        return NULL;
4017
166
    }
4018
4019
140M
    PyObject *item = list_get_item_ref(it->it_seq, index);
4020
140M
    if (item == NULL) {
4021
        // out-of-bounds
4022
31.6M
        FT_ATOMIC_STORE_SSIZE_RELAXED(it->it_index, -1);
4023
31.6M
#ifndef Py_GIL_DISABLED
4024
31.6M
        PyListObject *seq = it->it_seq;
4025
31.6M
        it->it_seq = NULL;
4026
31.6M
        Py_DECREF(seq);
4027
31.6M
#endif
4028
31.6M
        return NULL;
4029
31.6M
    }
4030
108M
    FT_ATOMIC_STORE_SSIZE_RELAXED(it->it_index, index + 1);
4031
108M
    return item;
4032
140M
}
4033
4034
/* __length_hint__ for list_iterator: the number of items left, computed as
 * the list's current size minus it_index.  Returns 0 when the iterator is
 * exhausted (negative index) or when the list has shrunk below the current
 * index. */
static PyObject *
4035
listiter_len(PyObject *self, PyObject *Py_UNUSED(ignored))
4036
1.60M
{
4037
1.60M
    assert(self != NULL);
4038
1.60M
    _PyListIterObject *it = (_PyListIterObject *)self;
4039
1.60M
    Py_ssize_t index = FT_ATOMIC_LOAD_SSIZE_RELAXED(it->it_index);
4040
1.60M
    if (index >= 0) {
4041
1.60M
        Py_ssize_t len = PyList_GET_SIZE(it->it_seq) - index;
4042
1.60M
        if (len >= 0)
4043
1.60M
            return PyLong_FromSsize_t(len);
4044
1.60M
    }
4045
0
    return PyLong_FromLong(0);
4046
1.60M
}
4047
4048
/* __reduce__ for list_iterator: forwards to listiter_reduce_general() with
 * forward = 1. */
static PyObject *
4049
listiter_reduce(PyObject *it, PyObject *Py_UNUSED(ignored))
4050
0
{
4051
0
    return listiter_reduce_general(it, 1);
4052
0
}
4053
4054
/* __setstate__ for list_iterator: restore the iteration position.
 *
 * state is converted with PyLong_AsSsize_t(); NULL is returned if that
 * fails.  When the iterator still references its list, the index is clamped
 * to the range [-1, len(list)] and stored; when it_seq is NULL the call
 * changes nothing.  Returns None on success. */
static PyObject *
4055
listiter_setstate(PyObject *self, PyObject *state)
4056
0
{
4057
0
    _PyListIterObject *it = (_PyListIterObject *)self;
4058
0
    Py_ssize_t index = PyLong_AsSsize_t(state);
4059
0
    if (index == -1 && PyErr_Occurred())
4060
0
        return NULL;
4061
0
    if (it->it_seq != NULL) {
4062
0
        if (index < -1)
4063
0
            index = -1;
4064
0
        else if (index > PyList_GET_SIZE(it->it_seq))
4065
0
            index = PyList_GET_SIZE(it->it_seq); /* iterator exhausted */
4066
0
        FT_ATOMIC_STORE_SSIZE_RELAXED(it->it_index, index);
4067
0
    }
4068
0
    Py_RETURN_NONE;
4069
0
}
4070
4071
/*********************** List Reverse Iterator **************************/
4072
4073
/* State of a list_reverseiterator.
 * it_index is the index of the next item to return; it starts at
 * len(list) - 1 (see list___reversed___impl) and listreviter_next treats a
 * negative value as exhausted.
 * it_seq is the list being iterated; listreviter_next clears it on
 * exhaustion only in builds without Py_GIL_DISABLED. */
typedef struct {
4074
    PyObject_HEAD
4075
    Py_ssize_t it_index;
4076
    PyListObject *it_seq; /* Set to NULL when iterator is exhausted */
4077
} listreviterobject;
4078
4079
static void listreviter_dealloc(PyObject *);
4080
static int listreviter_traverse(PyObject *, visitproc, void *);
4081
static PyObject *listreviter_next(PyObject *);
4082
static PyObject *listreviter_len(PyObject *, PyObject *);
4083
static PyObject *listreviter_reduce(PyObject *, PyObject *);
4084
static PyObject *listreviter_setstate(PyObject *, PyObject *);
4085
4086
/* Method table of the reverse list iterator (tp_methods of
 * PyListRevIter_Type); it reuses the docstrings of the forward iterator's
 * table. */
static PyMethodDef listreviter_methods[] = {
4087
    {"__length_hint__", listreviter_len, METH_NOARGS, length_hint_doc},
4088
    {"__reduce__", listreviter_reduce, METH_NOARGS, reduce_doc},
4089
    {"__setstate__", listreviter_setstate, METH_O, setstate_doc},
4090
    {NULL,              NULL}           /* sentinel */
4091
};
4092
4093
/* Type object of the reverse list iterator ("list_reverseiterator").  It is
 * GC-enabled, iterates as itself (PyObject_SelfIter) and produces items via
 * listreviter_next.  The final unlabelled 0 fills the slot that follows
 * tp_methods. */
PyTypeObject PyListRevIter_Type = {
4094
    PyVarObject_HEAD_INIT(&PyType_Type, 0)
4095
    "list_reverseiterator",                     /* tp_name */
4096
    sizeof(listreviterobject),                  /* tp_basicsize */
4097
    0,                                          /* tp_itemsize */
4098
    /* methods */
4099
    listreviter_dealloc,                        /* tp_dealloc */
4100
    0,                                          /* tp_vectorcall_offset */
4101
    0,                                          /* tp_getattr */
4102
    0,                                          /* tp_setattr */
4103
    0,                                          /* tp_as_async */
4104
    0,                                          /* tp_repr */
4105
    0,                                          /* tp_as_number */
4106
    0,                                          /* tp_as_sequence */
4107
    0,                                          /* tp_as_mapping */
4108
    0,                                          /* tp_hash */
4109
    0,                                          /* tp_call */
4110
    0,                                          /* tp_str */
4111
    PyObject_GenericGetAttr,                    /* tp_getattro */
4112
    0,                                          /* tp_setattro */
4113
    0,                                          /* tp_as_buffer */
4114
    Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC,/* tp_flags */
4115
    0,                                          /* tp_doc */
4116
    listreviter_traverse,                       /* tp_traverse */
4117
    0,                                          /* tp_clear */
4118
    0,                                          /* tp_richcompare */
4119
    0,                                          /* tp_weaklistoffset */
4120
    PyObject_SelfIter,                          /* tp_iter */
4121
    listreviter_next,                           /* tp_iternext */
4122
    listreviter_methods,                /* tp_methods */
4123
    0,
4124
};
4125
4126
/*[clinic input]
4127
list.__reversed__
4128
4129
Return a reverse iterator over the list.
4130
[clinic start generated code]*/
4131
4132
static PyObject *
4133
list___reversed___impl(PyListObject *self)
4134
/*[clinic end generated code: output=b166f073208c888c input=eadb6e17f8a6a280]*/
4135
43.8M
{
    /* Allocate a list_reverseiterator positioned on the last item
     * (index len - 1, i.e. -1 for an empty list), holding a new reference
     * to self and tracked by the GC.  Returns NULL if allocation fails. */
4136
43.8M
    listreviterobject *it;
4137
4138
43.8M
    it = PyObject_GC_New(listreviterobject, &PyListRevIter_Type);
4139
43.8M
    if (it == NULL)
4140
0
        return NULL;
4141
43.8M
    assert(PyList_Check(self));
4142
43.8M
    it->it_index = PyList_GET_SIZE(self) - 1;
4143
43.8M
    it->it_seq = (PyListObject*)Py_NewRef(self);
4144
43.8M
    PyObject_GC_Track(it);
4145
43.8M
    return (PyObject *)it;
4146
43.8M
}
4147
4148
/* tp_dealloc for list_reverseiterator: untrack from the GC, release the
 * reference to the list (it_seq may be NULL, hence Py_XDECREF) and free the
 * object with PyObject_GC_Del().  Unlike the forward iterator, no freelist
 * is used here. */
static void
4149
listreviter_dealloc(PyObject *self)
4150
43.8M
{
4151
43.8M
    listreviterobject *it = (listreviterobject *)self;
4152
43.8M
    PyObject_GC_UnTrack(it);
4153
43.8M
    Py_XDECREF(it->it_seq);
4154
43.8M
    PyObject_GC_Del(it);
4155
43.8M
}
4156
4157
/* tp_traverse for list_reverseiterator: visits it_seq, the only object
 * reference the iterator holds. */
static int
4158
listreviter_traverse(PyObject *it, visitproc visit, void *arg)
4159
683
{
4160
683
    Py_VISIT(((listreviterobject *)it)->it_seq);
4161
683
    return 0;
4162
683
}
4163
4164
/* tp_iternext for list_reverseiterator.
 *
 * A negative it_index means the iterator is exhausted and NULL is returned
 * right away.  Otherwise the item at it_index is fetched with
 * list_get_item_ref(); on success the index is decremented and the item
 * returned.  If the fetch yields NULL, it_index is set to -1 and, in builds
 * without Py_GIL_DISABLED, the reference to the list is dropped and it_seq
 * cleared.  This function sets no exception itself. */
static PyObject *
4165
listreviter_next(PyObject *self)
4166
53.8M
{
4167
53.8M
    listreviterobject *it = (listreviterobject *)self;
4168
53.8M
    assert(it != NULL);
4169
53.8M
    Py_ssize_t index = FT_ATOMIC_LOAD_SSIZE_RELAXED(it->it_index);
4170
53.8M
    if (index < 0) {
4171
29.0M
        return NULL;
4172
29.0M
    }
4173
4174
24.7M
    PyListObject *seq = it->it_seq;
4175
24.7M
    assert(PyList_Check(seq));
4176
24.7M
    PyObject *item = list_get_item_ref(seq, index);
4177
24.7M
    if (item != NULL) {
4178
24.7M
        FT_ATOMIC_STORE_SSIZE_RELAXED(it->it_index, index - 1);
4179
24.7M
        return item;
4180
24.7M
    }
4181
0
    FT_ATOMIC_STORE_SSIZE_RELAXED(it->it_index, -1);
4182
0
#ifndef Py_GIL_DISABLED
4183
0
    it->it_seq = NULL;
4184
0
    Py_DECREF(seq);
4185
0
#endif
4186
0
    return NULL;
4187
24.7M
}
4188
4189
/* __length_hint__ for list_reverseiterator: it_index + 1 items remain,
 * reported as 0 when the iterator no longer references a list or when the
 * list has become shorter than that count. */
static PyObject *
4190
listreviter_len(PyObject *self, PyObject *Py_UNUSED(ignored))
4191
0
{
4192
0
    listreviterobject *it = (listreviterobject *)self;
4193
0
    Py_ssize_t index = FT_ATOMIC_LOAD_SSIZE_RELAXED(it->it_index);
4194
0
    Py_ssize_t len = index + 1;
4195
0
    if (it->it_seq == NULL || PyList_GET_SIZE(it->it_seq) < len)
4196
0
        len = 0;
4197
0
    return PyLong_FromSsize_t(len);
4198
0
}
4199
4200
/* __reduce__ for list_reverseiterator: forwards to
 * listiter_reduce_general() with forward = 0. */
static PyObject *
4201
listreviter_reduce(PyObject *it, PyObject *Py_UNUSED(ignored))
4202
0
{
4203
0
    return listiter_reduce_general(it, 0);
4204
0
}
4205
4206
/* __setstate__ for list_reverseiterator: restore the iteration position.
 *
 * state is converted with PyLong_AsSsize_t(); NULL is returned if that
 * fails.  When the iterator still references its list, the index is clamped
 * to the range [-1, len(list) - 1] and stored; when it_seq is NULL the call
 * changes nothing.  Returns None on success. */
static PyObject *
4207
listreviter_setstate(PyObject *self, PyObject *state)
4208
0
{
4209
0
    listreviterobject *it = (listreviterobject *)self;
4210
0
    Py_ssize_t index = PyLong_AsSsize_t(state);
4211
0
    if (index == -1 && PyErr_Occurred())
4212
0
        return NULL;
4213
0
    if (it->it_seq != NULL) {
4214
0
        if (index < -1)
4215
0
            index = -1;
4216
0
        else if (index > PyList_GET_SIZE(it->it_seq) - 1)
4217
0
            index = PyList_GET_SIZE(it->it_seq) - 1;
4218
0
        FT_ATOMIC_STORE_SSIZE_RELAXED(it->it_index, index);
4219
0
    }
4220
0
    Py_RETURN_NONE;
4221
0
}
4222
4223
/* common pickling support */
4224
4225
static PyObject *
4226
listiter_reduce_general(void *_it, int forward)
4227
0
{
4228
0
    PyObject *list;
4229
0
    PyObject *iter;
4230
4231
    /* _PyEval_GetBuiltin can invoke arbitrary code,
4232
     * call must be before access of iterator pointers.
4233
     * see issue #101765 */
4234
4235
0
    if (forward) {
4236
0
        iter = _PyEval_GetBuiltin(&_Py_ID(iter));
4237
0
        _PyListIterObject *it = (_PyListIterObject *)_it;
4238
0
        Py_ssize_t idx = FT_ATOMIC_LOAD_SSIZE_RELAXED(it->it_index);
4239
0
        if (idx >= 0) {
4240
0
            return Py_BuildValue("N(O)n", iter, it->it_seq, idx);
4241
0
        }
4242
0
    } else {
4243
0
        iter = _PyEval_GetBuiltin(&_Py_ID(reversed));
4244
0
        listreviterobject *it = (listreviterobject *)_it;
4245
0
        Py_ssize_t idx = FT_ATOMIC_LOAD_SSIZE_RELAXED(it->it_index);
4246
0
        if (idx >= 0) {
4247
0
            return Py_BuildValue("N(O)n", iter, it->it_seq, idx);
4248
0
        }
4249
0
    }
4250
    /* empty iterator, create an empty list */
4251
0
    list = PyList_New(0);
4252
0
    if (list == NULL)
4253
0
        return NULL;
4254
0
    return Py_BuildValue("N(N)", iter, list);
4255
0
}