blob: de73b8bf80fdfd01848425e9e466229ef6a53f96 [file] [log] [blame]
/* List object implementation */
2
Guido van Rossumc0b618a1997-05-02 03:12:38 +00003#include "Python.h"
Eric Snow2ebc5ce2017-09-07 23:51:28 -06004#include "internal/pystate.h"
Antoine Pitrou0197ff92012-03-22 14:38:16 +01005#include "accu.h"
Guido van Rossumc0b618a1997-05-02 03:12:38 +00006
Guido van Rossum6cd2fe01994-08-29 12:45:32 +00007#ifdef STDC_HEADERS
8#include <stddef.h>
9#else
Antoine Pitrouf95a1b32010-05-09 15:52:27 +000010#include <sys/types.h> /* For size_t */
Guido van Rossum6cd2fe01994-08-29 12:45:32 +000011#endif
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000012
Serhiy Storchakafdd42c42017-03-11 09:19:20 +020013/*[clinic input]
14class list "PyListObject *" "&PyList_Type"
15[clinic start generated code]*/
16/*[clinic end generated code: output=da39a3ee5e6b4b0d input=f9b222678f9f71e0]*/
17
18#include "clinic/listobject.c.h"
19
Tim Peters8d9eb102004-07-31 02:24:20 +000020/* Ensure ob_item has room for at least newsize elements, and set
21 * ob_size to newsize. If newsize > ob_size on entry, the content
22 * of the new slots at exit is undefined heap trash; it's the caller's
Ezio Melotti13925002011-03-16 11:05:33 +020023 * responsibility to overwrite them with sane values.
Tim Peters8d9eb102004-07-31 02:24:20 +000024 * The number of allocated elements may grow, shrink, or stay the same.
25 * Failure is impossible if newsize <= self.allocated on entry, although
26 * that partly relies on an assumption that the system realloc() never
27 * fails when passed a number of bytes <= the number of bytes last
28 * allocated (the C standard doesn't guarantee this, but it's hard to
29 * imagine a realloc implementation where it wouldn't be true).
30 * Note that self->ob_item may change, and even if newsize is less
31 * than ob_size on entry.
32 */
Guido van Rossuma46d51d1995-01-26 22:59:43 +000033static int
Martin v. Löwis18e16552006-02-15 17:27:45 +000034list_resize(PyListObject *self, Py_ssize_t newsize)
Guido van Rossuma46d51d1995-01-26 22:59:43 +000035{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +000036 PyObject **items;
Xiang Zhang4cee0492017-02-22 12:32:30 +080037 size_t new_allocated, num_allocated_bytes;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +000038 Py_ssize_t allocated = self->allocated;
Tim Peters65b8b842001-05-26 05:28:40 +000039
Antoine Pitrouf95a1b32010-05-09 15:52:27 +000040 /* Bypass realloc() when a previous overallocation is large enough
41 to accommodate the newsize. If the newsize falls lower than half
42 the allocated size, then proceed with the realloc() to shrink the list.
43 */
44 if (allocated >= newsize && newsize >= (allocated >> 1)) {
45 assert(self->ob_item != NULL || newsize == 0);
46 Py_SIZE(self) = newsize;
47 return 0;
48 }
Raymond Hettinger4bb95402004-02-13 11:36:39 +000049
Antoine Pitrouf95a1b32010-05-09 15:52:27 +000050 /* This over-allocates proportional to the list size, making room
51 * for additional growth. The over-allocation is mild, but is
52 * enough to give linear-time amortized behavior over a long
53 * sequence of appends() in the presence of a poorly-performing
54 * system realloc().
55 * The growth pattern is: 0, 4, 8, 16, 25, 35, 46, 58, 72, 88, ...
Xiang Zhang4cee0492017-02-22 12:32:30 +080056 * Note: new_allocated won't overflow because the largest possible value
57 * is PY_SSIZE_T_MAX * (9 / 8) + 6 which always fits in a size_t.
Antoine Pitrouf95a1b32010-05-09 15:52:27 +000058 */
Xiang Zhang4cee0492017-02-22 12:32:30 +080059 new_allocated = (size_t)newsize + (newsize >> 3) + (newsize < 9 ? 3 : 6);
60 if (new_allocated > (size_t)PY_SSIZE_T_MAX / sizeof(PyObject *)) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +000061 PyErr_NoMemory();
62 return -1;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +000063 }
Amaury Forgeot d'Arc9c74b142008-06-18 00:47:36 +000064
Antoine Pitrouf95a1b32010-05-09 15:52:27 +000065 if (newsize == 0)
66 new_allocated = 0;
Xiang Zhang4cee0492017-02-22 12:32:30 +080067 num_allocated_bytes = new_allocated * sizeof(PyObject *);
68 items = (PyObject **)PyMem_Realloc(self->ob_item, num_allocated_bytes);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +000069 if (items == NULL) {
70 PyErr_NoMemory();
71 return -1;
72 }
73 self->ob_item = items;
74 Py_SIZE(self) = newsize;
75 self->allocated = new_allocated;
76 return 0;
Raymond Hettinger4bb95402004-02-13 11:36:39 +000077}
Guido van Rossuma46d51d1995-01-26 22:59:43 +000078
/* Debug statistics comparing fresh list allocations with objects reused
   from the free list.  The #undef below keeps the feature compiled out. */
#undef SHOW_ALLOC_COUNT
#ifdef SHOW_ALLOC_COUNT
static size_t count_alloc = 0;   /* lists obtained from the allocator */
static size_t count_reuse = 0;   /* lists taken from the free list */

/* Write the allocation/reuse counters and the reuse percentage to stderr.
   Prints nothing unless the current interpreter's
   core_config.show_alloc_count flag is set. */
static void
show_alloc(void)
{
    PyInterpreterState *interp = PyThreadState_GET()->interp;

    if (interp->core_config.show_alloc_count) {
        const size_t total = count_alloc + count_reuse;

        fprintf(stderr, "List allocations: %" PY_FORMAT_SIZE_T "d\n",
                count_alloc);
        fprintf(stderr, "List reuse through freelist: %" PY_FORMAT_SIZE_T
                "d\n", count_reuse);
        fprintf(stderr, "%.2f%% reuse rate\n\n",
                (100.0*count_reuse/total));
    }
}
#endif
101
Raymond Hettinger0468e412004-05-05 05:37:53 +0000102/* Empty list reuse scheme to save calls to malloc and free */
Christian Heimes2202f872008-02-06 14:31:34 +0000103#ifndef PyList_MAXFREELIST
104#define PyList_MAXFREELIST 80
105#endif
106static PyListObject *free_list[PyList_MAXFREELIST];
107static int numfree = 0;
Raymond Hettinger0468e412004-05-05 05:37:53 +0000108
Antoine Pitrou9a812cb2011-11-15 00:00:12 +0100109int
110PyList_ClearFreeList(void)
Raymond Hettingerfb09f0e2004-10-07 03:58:07 +0000111{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000112 PyListObject *op;
Antoine Pitrou9a812cb2011-11-15 00:00:12 +0100113 int ret = numfree;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000114 while (numfree) {
115 op = free_list[--numfree];
116 assert(PyList_CheckExact(op));
117 PyObject_GC_Del(op);
118 }
Antoine Pitrou9a812cb2011-11-15 00:00:12 +0100119 return ret;
120}
121
/* Finalization hook for the list type: empties the free list.  The count
   returned by PyList_ClearFreeList() is not needed here. */
void
PyList_Fini(void)
{
    (void)PyList_ClearFreeList();
}
127
David Malcolm49526f42012-06-22 14:55:41 -0400128/* Print summary info about the state of the optimized allocator */
129void
130_PyList_DebugMallocStats(FILE *out)
131{
132 _PyDebugAllocatorStats(out,
133 "free PyListObject",
134 numfree, sizeof(PyListObject));
135}
136
Guido van Rossumc0b618a1997-05-02 03:12:38 +0000137PyObject *
Martin v. Löwis18e16552006-02-15 17:27:45 +0000138PyList_New(Py_ssize_t size)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000139{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000140 PyListObject *op;
Christian Heimes77c02eb2008-02-09 02:18:51 +0000141#ifdef SHOW_ALLOC_COUNT
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000142 static int initialized = 0;
143 if (!initialized) {
144 Py_AtExit(show_alloc);
145 initialized = 1;
146 }
Christian Heimes77c02eb2008-02-09 02:18:51 +0000147#endif
Tim Peters3986d4e2004-07-29 02:28:42 +0000148
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000149 if (size < 0) {
150 PyErr_BadInternalCall();
151 return NULL;
152 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000153 if (numfree) {
154 numfree--;
155 op = free_list[numfree];
156 _Py_NewReference((PyObject *)op);
Christian Heimes77c02eb2008-02-09 02:18:51 +0000157#ifdef SHOW_ALLOC_COUNT
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000158 count_reuse++;
Christian Heimes77c02eb2008-02-09 02:18:51 +0000159#endif
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000160 } else {
161 op = PyObject_GC_New(PyListObject, &PyList_Type);
162 if (op == NULL)
163 return NULL;
Christian Heimes77c02eb2008-02-09 02:18:51 +0000164#ifdef SHOW_ALLOC_COUNT
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000165 count_alloc++;
Christian Heimes77c02eb2008-02-09 02:18:51 +0000166#endif
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000167 }
168 if (size <= 0)
169 op->ob_item = NULL;
170 else {
Mark Dickinson5d132382016-08-21 08:55:15 +0100171 op->ob_item = (PyObject **) PyMem_Calloc(size, sizeof(PyObject *));
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000172 if (op->ob_item == NULL) {
173 Py_DECREF(op);
174 return PyErr_NoMemory();
175 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000176 }
177 Py_SIZE(op) = size;
178 op->allocated = size;
179 _PyObject_GC_TRACK(op);
180 return (PyObject *) op;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000181}
182
Martin v. Löwis18e16552006-02-15 17:27:45 +0000183Py_ssize_t
Fred Drakea2f55112000-07-09 15:16:51 +0000184PyList_Size(PyObject *op)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000185{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000186 if (!PyList_Check(op)) {
187 PyErr_BadInternalCall();
188 return -1;
189 }
190 else
191 return Py_SIZE(op);
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000192}
193
Raymond Hettingerfdfe6182004-05-05 06:28:16 +0000194static PyObject *indexerr = NULL;
Guido van Rossum929f1b81996-08-09 20:51:27 +0000195
Guido van Rossumc0b618a1997-05-02 03:12:38 +0000196PyObject *
Martin v. Löwis18e16552006-02-15 17:27:45 +0000197PyList_GetItem(PyObject *op, Py_ssize_t i)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000198{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000199 if (!PyList_Check(op)) {
200 PyErr_BadInternalCall();
201 return NULL;
202 }
203 if (i < 0 || i >= Py_SIZE(op)) {
204 if (indexerr == NULL) {
205 indexerr = PyUnicode_FromString(
206 "list index out of range");
207 if (indexerr == NULL)
208 return NULL;
209 }
210 PyErr_SetObject(PyExc_IndexError, indexerr);
211 return NULL;
212 }
213 return ((PyListObject *)op) -> ob_item[i];
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000214}
215
216int
Antoine Pitrou9ed5f272013-08-13 20:18:52 +0200217PyList_SetItem(PyObject *op, Py_ssize_t i,
218 PyObject *newitem)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000219{
Antoine Pitrou9ed5f272013-08-13 20:18:52 +0200220 PyObject **p;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000221 if (!PyList_Check(op)) {
222 Py_XDECREF(newitem);
223 PyErr_BadInternalCall();
224 return -1;
225 }
226 if (i < 0 || i >= Py_SIZE(op)) {
227 Py_XDECREF(newitem);
228 PyErr_SetString(PyExc_IndexError,
229 "list assignment index out of range");
230 return -1;
231 }
232 p = ((PyListObject *)op) -> ob_item + i;
Serhiy Storchakaec397562016-04-06 09:50:03 +0300233 Py_XSETREF(*p, newitem);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000234 return 0;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000235}
236
237static int
Martin v. Löwis18e16552006-02-15 17:27:45 +0000238ins1(PyListObject *self, Py_ssize_t where, PyObject *v)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000239{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000240 Py_ssize_t i, n = Py_SIZE(self);
241 PyObject **items;
242 if (v == NULL) {
243 PyErr_BadInternalCall();
244 return -1;
245 }
246 if (n == PY_SSIZE_T_MAX) {
247 PyErr_SetString(PyExc_OverflowError,
248 "cannot add more objects to list");
249 return -1;
250 }
Tim Petersb38e2b62004-07-29 02:29:26 +0000251
Raymond Hettinger0dceb912016-01-25 10:33:30 -0800252 if (list_resize(self, n+1) < 0)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000253 return -1;
Raymond Hettinger4bb95402004-02-13 11:36:39 +0000254
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000255 if (where < 0) {
256 where += n;
257 if (where < 0)
258 where = 0;
259 }
260 if (where > n)
261 where = n;
262 items = self->ob_item;
263 for (i = n; --i >= where; )
264 items[i+1] = items[i];
265 Py_INCREF(v);
266 items[where] = v;
267 return 0;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000268}
269
270int
Martin v. Löwis18e16552006-02-15 17:27:45 +0000271PyList_Insert(PyObject *op, Py_ssize_t where, PyObject *newitem)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000272{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000273 if (!PyList_Check(op)) {
274 PyErr_BadInternalCall();
275 return -1;
276 }
277 return ins1((PyListObject *)op, where, newitem);
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000278}
279
Raymond Hettinger40a03822004-04-12 13:05:09 +0000280static int
281app1(PyListObject *self, PyObject *v)
282{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000283 Py_ssize_t n = PyList_GET_SIZE(self);
Raymond Hettinger40a03822004-04-12 13:05:09 +0000284
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000285 assert (v != NULL);
286 if (n == PY_SSIZE_T_MAX) {
287 PyErr_SetString(PyExc_OverflowError,
288 "cannot add more objects to list");
289 return -1;
290 }
Raymond Hettinger40a03822004-04-12 13:05:09 +0000291
Raymond Hettinger0dceb912016-01-25 10:33:30 -0800292 if (list_resize(self, n+1) < 0)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000293 return -1;
Raymond Hettinger40a03822004-04-12 13:05:09 +0000294
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000295 Py_INCREF(v);
296 PyList_SET_ITEM(self, n, v);
297 return 0;
Raymond Hettinger40a03822004-04-12 13:05:09 +0000298}
299
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000300int
Fred Drakea2f55112000-07-09 15:16:51 +0000301PyList_Append(PyObject *op, PyObject *newitem)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000302{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000303 if (PyList_Check(op) && (newitem != NULL))
304 return app1((PyListObject *)op, newitem);
305 PyErr_BadInternalCall();
306 return -1;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000307}
308
/* Methods */
310
311static void
Fred Drakea2f55112000-07-09 15:16:51 +0000312list_dealloc(PyListObject *op)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000313{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000314 Py_ssize_t i;
315 PyObject_GC_UnTrack(op);
316 Py_TRASHCAN_SAFE_BEGIN(op)
317 if (op->ob_item != NULL) {
318 /* Do it backwards, for Christian Tismer.
319 There's a simple test case where somehow this reduces
320 thrashing when a *very* large list is created and
321 immediately deleted. */
322 i = Py_SIZE(op);
323 while (--i >= 0) {
324 Py_XDECREF(op->ob_item[i]);
325 }
326 PyMem_FREE(op->ob_item);
327 }
328 if (numfree < PyList_MAXFREELIST && PyList_CheckExact(op))
329 free_list[numfree++] = op;
330 else
331 Py_TYPE(op)->tp_free((PyObject *)op);
332 Py_TRASHCAN_SAFE_END(op)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000333}
334
Guido van Rossumc0b618a1997-05-02 03:12:38 +0000335static PyObject *
Fred Drakea2f55112000-07-09 15:16:51 +0000336list_repr(PyListObject *v)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000337{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000338 Py_ssize_t i;
Victor Stinner5c733472013-11-18 21:11:57 +0100339 PyObject *s;
Victor Stinner5c733472013-11-18 21:11:57 +0100340 _PyUnicodeWriter writer;
Antoine Pitroueeb7eea2011-10-06 18:57:27 +0200341
342 if (Py_SIZE(v) == 0) {
343 return PyUnicode_FromString("[]");
344 }
345
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000346 i = Py_ReprEnter((PyObject*)v);
347 if (i != 0) {
348 return i > 0 ? PyUnicode_FromString("[...]") : NULL;
349 }
Tim Petersa7259592001-06-16 05:11:17 +0000350
Victor Stinner5c733472013-11-18 21:11:57 +0100351 _PyUnicodeWriter_Init(&writer);
352 writer.overallocate = 1;
Victor Stinnerb8fb1972013-11-18 22:15:44 +0100353 /* "[" + "1" + ", 2" * (len - 1) + "]" */
354 writer.min_length = 1 + 1 + (2 + 1) * (Py_SIZE(v) - 1) + 1;
Tim Petersa7259592001-06-16 05:11:17 +0000355
Victor Stinner5c733472013-11-18 21:11:57 +0100356 if (_PyUnicodeWriter_WriteChar(&writer, '[') < 0)
Antoine Pitroueeb7eea2011-10-06 18:57:27 +0200357 goto error;
Tim Petersa7259592001-06-16 05:11:17 +0000358
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000359 /* Do repr() on each element. Note that this may mutate the list,
360 so must refetch the list size on each iteration. */
361 for (i = 0; i < Py_SIZE(v); ++i) {
Victor Stinner5c733472013-11-18 21:11:57 +0100362 if (i > 0) {
Victor Stinner4a587072013-11-19 12:54:53 +0100363 if (_PyUnicodeWriter_WriteASCIIString(&writer, ", ", 2) < 0)
Victor Stinner5c733472013-11-18 21:11:57 +0100364 goto error;
365 }
366
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000367 s = PyObject_Repr(v->ob_item[i]);
Victor Stinner5c733472013-11-18 21:11:57 +0100368 if (s == NULL)
Antoine Pitroueeb7eea2011-10-06 18:57:27 +0200369 goto error;
Victor Stinner5c733472013-11-18 21:11:57 +0100370
371 if (_PyUnicodeWriter_WriteStr(&writer, s) < 0) {
372 Py_DECREF(s);
Antoine Pitroueeb7eea2011-10-06 18:57:27 +0200373 goto error;
Victor Stinner5c733472013-11-18 21:11:57 +0100374 }
375 Py_DECREF(s);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000376 }
Victor Stinner5c733472013-11-18 21:11:57 +0100377
Victor Stinner4d3f1092013-11-19 12:09:00 +0100378 writer.overallocate = 0;
Victor Stinner5c733472013-11-18 21:11:57 +0100379 if (_PyUnicodeWriter_WriteChar(&writer, ']') < 0)
Antoine Pitroueeb7eea2011-10-06 18:57:27 +0200380 goto error;
Tim Petersa7259592001-06-16 05:11:17 +0000381
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000382 Py_ReprLeave((PyObject *)v);
Victor Stinner5c733472013-11-18 21:11:57 +0100383 return _PyUnicodeWriter_Finish(&writer);
Antoine Pitroueeb7eea2011-10-06 18:57:27 +0200384
385error:
Victor Stinner5c733472013-11-18 21:11:57 +0100386 _PyUnicodeWriter_Dealloc(&writer);
Antoine Pitroueeb7eea2011-10-06 18:57:27 +0200387 Py_ReprLeave((PyObject *)v);
388 return NULL;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000389}
390
Martin v. Löwis18e16552006-02-15 17:27:45 +0000391static Py_ssize_t
Fred Drakea2f55112000-07-09 15:16:51 +0000392list_length(PyListObject *a)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000393{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000394 return Py_SIZE(a);
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000395}
396
Jeremy Hylton37b1a262000-04-27 21:41:03 +0000397static int
Fred Drakea2f55112000-07-09 15:16:51 +0000398list_contains(PyListObject *a, PyObject *el)
Jeremy Hylton37b1a262000-04-27 21:41:03 +0000399{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000400 Py_ssize_t i;
401 int cmp;
Jeremy Hylton37b1a262000-04-27 21:41:03 +0000402
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000403 for (i = 0, cmp = 0 ; cmp == 0 && i < Py_SIZE(a); ++i)
404 cmp = PyObject_RichCompareBool(el, PyList_GET_ITEM(a, i),
405 Py_EQ);
406 return cmp;
Jeremy Hylton37b1a262000-04-27 21:41:03 +0000407}
408
Guido van Rossumc0b618a1997-05-02 03:12:38 +0000409static PyObject *
Martin v. Löwis18e16552006-02-15 17:27:45 +0000410list_item(PyListObject *a, Py_ssize_t i)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000411{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000412 if (i < 0 || i >= Py_SIZE(a)) {
413 if (indexerr == NULL) {
414 indexerr = PyUnicode_FromString(
415 "list index out of range");
416 if (indexerr == NULL)
417 return NULL;
418 }
419 PyErr_SetObject(PyExc_IndexError, indexerr);
420 return NULL;
421 }
422 Py_INCREF(a->ob_item[i]);
423 return a->ob_item[i];
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000424}
425
Guido van Rossumc0b618a1997-05-02 03:12:38 +0000426static PyObject *
Martin v. Löwis18e16552006-02-15 17:27:45 +0000427list_slice(PyListObject *a, Py_ssize_t ilow, Py_ssize_t ihigh)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000428{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000429 PyListObject *np;
430 PyObject **src, **dest;
431 Py_ssize_t i, len;
432 if (ilow < 0)
433 ilow = 0;
434 else if (ilow > Py_SIZE(a))
435 ilow = Py_SIZE(a);
436 if (ihigh < ilow)
437 ihigh = ilow;
438 else if (ihigh > Py_SIZE(a))
439 ihigh = Py_SIZE(a);
440 len = ihigh - ilow;
441 np = (PyListObject *) PyList_New(len);
442 if (np == NULL)
443 return NULL;
Raymond Hettinger99842b62004-03-08 05:56:15 +0000444
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000445 src = a->ob_item + ilow;
446 dest = np->ob_item;
447 for (i = 0; i < len; i++) {
448 PyObject *v = src[i];
449 Py_INCREF(v);
450 dest[i] = v;
451 }
452 return (PyObject *)np;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000453}
454
Guido van Rossumc0b618a1997-05-02 03:12:38 +0000455PyObject *
Martin v. Löwis18e16552006-02-15 17:27:45 +0000456PyList_GetSlice(PyObject *a, Py_ssize_t ilow, Py_ssize_t ihigh)
Guido van Rossum234f9421993-06-17 12:35:49 +0000457{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000458 if (!PyList_Check(a)) {
459 PyErr_BadInternalCall();
460 return NULL;
461 }
462 return list_slice((PyListObject *)a, ilow, ihigh);
Guido van Rossum234f9421993-06-17 12:35:49 +0000463}
464
Guido van Rossumc0b618a1997-05-02 03:12:38 +0000465static PyObject *
Fred Drakea2f55112000-07-09 15:16:51 +0000466list_concat(PyListObject *a, PyObject *bb)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000467{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000468 Py_ssize_t size;
469 Py_ssize_t i;
470 PyObject **src, **dest;
471 PyListObject *np;
472 if (!PyList_Check(bb)) {
473 PyErr_Format(PyExc_TypeError,
474 "can only concatenate list (not \"%.200s\") to list",
475 bb->ob_type->tp_name);
476 return NULL;
477 }
Guido van Rossumc0b618a1997-05-02 03:12:38 +0000478#define b ((PyListObject *)bb)
Martin Panterb93d8632016-07-25 02:39:20 +0000479 if (Py_SIZE(a) > PY_SSIZE_T_MAX - Py_SIZE(b))
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000480 return PyErr_NoMemory();
Martin Panterb93d8632016-07-25 02:39:20 +0000481 size = Py_SIZE(a) + Py_SIZE(b);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000482 np = (PyListObject *) PyList_New(size);
483 if (np == NULL) {
484 return NULL;
485 }
486 src = a->ob_item;
487 dest = np->ob_item;
488 for (i = 0; i < Py_SIZE(a); i++) {
489 PyObject *v = src[i];
490 Py_INCREF(v);
491 dest[i] = v;
492 }
493 src = b->ob_item;
494 dest = np->ob_item + Py_SIZE(a);
495 for (i = 0; i < Py_SIZE(b); i++) {
496 PyObject *v = src[i];
497 Py_INCREF(v);
498 dest[i] = v;
499 }
500 return (PyObject *)np;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000501#undef b
502}
503
Guido van Rossumc0b618a1997-05-02 03:12:38 +0000504static PyObject *
Martin v. Löwis18e16552006-02-15 17:27:45 +0000505list_repeat(PyListObject *a, Py_ssize_t n)
Guido van Rossumed98d481991-03-06 13:07:53 +0000506{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000507 Py_ssize_t i, j;
508 Py_ssize_t size;
509 PyListObject *np;
510 PyObject **p, **items;
511 PyObject *elem;
512 if (n < 0)
513 n = 0;
Mark Dickinsonc0420fd2011-09-19 19:18:37 +0100514 if (n > 0 && Py_SIZE(a) > PY_SSIZE_T_MAX / n)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000515 return PyErr_NoMemory();
Mark Dickinsonc0420fd2011-09-19 19:18:37 +0100516 size = Py_SIZE(a) * n;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000517 if (size == 0)
518 return PyList_New(0);
519 np = (PyListObject *) PyList_New(size);
520 if (np == NULL)
521 return NULL;
Raymond Hettinger6624e682003-05-21 05:58:46 +0000522
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000523 items = np->ob_item;
524 if (Py_SIZE(a) == 1) {
525 elem = a->ob_item[0];
526 for (i = 0; i < n; i++) {
527 items[i] = elem;
528 Py_INCREF(elem);
529 }
530 return (PyObject *) np;
531 }
532 p = np->ob_item;
533 items = a->ob_item;
534 for (i = 0; i < n; i++) {
535 for (j = 0; j < Py_SIZE(a); j++) {
536 *p = items[j];
537 Py_INCREF(*p);
538 p++;
539 }
540 }
541 return (PyObject *) np;
Guido van Rossumed98d481991-03-06 13:07:53 +0000542}
543
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000544static int
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200545_list_clear(PyListObject *a)
Armin Rigo93677f02004-07-29 12:40:23 +0000546{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000547 Py_ssize_t i;
548 PyObject **item = a->ob_item;
549 if (item != NULL) {
550 /* Because XDECREF can recursively invoke operations on
551 this list, we make it empty first. */
552 i = Py_SIZE(a);
553 Py_SIZE(a) = 0;
554 a->ob_item = NULL;
555 a->allocated = 0;
556 while (--i >= 0) {
557 Py_XDECREF(item[i]);
558 }
559 PyMem_FREE(item);
560 }
561 /* Never fails; the return value can be ignored.
562 Note that there is no guarantee that the list is actually empty
563 at this point, because XDECREF may have populated it again! */
564 return 0;
Armin Rigo93677f02004-07-29 12:40:23 +0000565}
566
Tim Peters8fc4a912004-07-31 21:53:19 +0000567/* a[ilow:ihigh] = v if v != NULL.
568 * del a[ilow:ihigh] if v == NULL.
569 *
570 * Special speed gimmick: when v is NULL and ihigh - ilow <= 8, it's
571 * guaranteed the call cannot fail.
572 */
Armin Rigo93677f02004-07-29 12:40:23 +0000573static int
Martin v. Löwis18e16552006-02-15 17:27:45 +0000574list_ass_slice(PyListObject *a, Py_ssize_t ilow, Py_ssize_t ihigh, PyObject *v)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000575{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000576 /* Because [X]DECREF can recursively invoke list operations on
577 this list, we must postpone all [X]DECREF activity until
578 after the list is back in its canonical shape. Therefore
579 we must allocate an additional array, 'recycle', into which
580 we temporarily copy the items that are deleted from the
581 list. :-( */
582 PyObject *recycle_on_stack[8];
583 PyObject **recycle = recycle_on_stack; /* will allocate more if needed */
584 PyObject **item;
585 PyObject **vitem = NULL;
586 PyObject *v_as_SF = NULL; /* PySequence_Fast(v) */
587 Py_ssize_t n; /* # of elements in replacement list */
588 Py_ssize_t norig; /* # of elements in list getting replaced */
589 Py_ssize_t d; /* Change in size */
590 Py_ssize_t k;
591 size_t s;
592 int result = -1; /* guilty until proved innocent */
Guido van Rossumc0b618a1997-05-02 03:12:38 +0000593#define b ((PyListObject *)v)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000594 if (v == NULL)
595 n = 0;
596 else {
597 if (a == b) {
598 /* Special case "a[i:j] = a" -- copy b first */
599 v = list_slice(b, 0, Py_SIZE(b));
600 if (v == NULL)
601 return result;
602 result = list_ass_slice(a, ilow, ihigh, v);
603 Py_DECREF(v);
604 return result;
605 }
606 v_as_SF = PySequence_Fast(v, "can only assign an iterable");
607 if(v_as_SF == NULL)
608 goto Error;
609 n = PySequence_Fast_GET_SIZE(v_as_SF);
610 vitem = PySequence_Fast_ITEMS(v_as_SF);
611 }
612 if (ilow < 0)
613 ilow = 0;
614 else if (ilow > Py_SIZE(a))
615 ilow = Py_SIZE(a);
Tim Peters8d9eb102004-07-31 02:24:20 +0000616
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000617 if (ihigh < ilow)
618 ihigh = ilow;
619 else if (ihigh > Py_SIZE(a))
620 ihigh = Py_SIZE(a);
Armin Rigo93677f02004-07-29 12:40:23 +0000621
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000622 norig = ihigh - ilow;
623 assert(norig >= 0);
624 d = n - norig;
625 if (Py_SIZE(a) + d == 0) {
626 Py_XDECREF(v_as_SF);
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200627 return _list_clear(a);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000628 }
629 item = a->ob_item;
630 /* recycle the items that we are about to remove */
631 s = norig * sizeof(PyObject *);
Benjamin Peterson5a7d9232016-09-06 17:58:25 -0700632 /* If norig == 0, item might be NULL, in which case we may not memcpy from it. */
633 if (s) {
634 if (s > sizeof(recycle_on_stack)) {
635 recycle = (PyObject **)PyMem_MALLOC(s);
636 if (recycle == NULL) {
637 PyErr_NoMemory();
638 goto Error;
639 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000640 }
Benjamin Peterson5a7d9232016-09-06 17:58:25 -0700641 memcpy(recycle, &item[ilow], s);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000642 }
Tim Peters8d9eb102004-07-31 02:24:20 +0000643
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000644 if (d < 0) { /* Delete -d items */
Victor Stinner2c40f642013-07-19 23:06:21 +0200645 Py_ssize_t tail;
646 tail = (Py_SIZE(a) - ihigh) * sizeof(PyObject *);
647 memmove(&item[ihigh+d], &item[ihigh], tail);
648 if (list_resize(a, Py_SIZE(a) + d) < 0) {
649 memmove(&item[ihigh], &item[ihigh+d], tail);
650 memcpy(&item[ilow], recycle, s);
651 goto Error;
652 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000653 item = a->ob_item;
654 }
655 else if (d > 0) { /* Insert d items */
656 k = Py_SIZE(a);
657 if (list_resize(a, k+d) < 0)
658 goto Error;
659 item = a->ob_item;
660 memmove(&item[ihigh+d], &item[ihigh],
661 (k - ihigh)*sizeof(PyObject *));
662 }
663 for (k = 0; k < n; k++, ilow++) {
664 PyObject *w = vitem[k];
665 Py_XINCREF(w);
666 item[ilow] = w;
667 }
668 for (k = norig - 1; k >= 0; --k)
669 Py_XDECREF(recycle[k]);
670 result = 0;
Tim Peters8d9eb102004-07-31 02:24:20 +0000671 Error:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000672 if (recycle != recycle_on_stack)
673 PyMem_FREE(recycle);
674 Py_XDECREF(v_as_SF);
675 return result;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000676#undef b
677}
678
Guido van Rossum234f9421993-06-17 12:35:49 +0000679int
Martin v. Löwis18e16552006-02-15 17:27:45 +0000680PyList_SetSlice(PyObject *a, Py_ssize_t ilow, Py_ssize_t ihigh, PyObject *v)
Guido van Rossum234f9421993-06-17 12:35:49 +0000681{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000682 if (!PyList_Check(a)) {
683 PyErr_BadInternalCall();
684 return -1;
685 }
686 return list_ass_slice((PyListObject *)a, ilow, ihigh, v);
Guido van Rossum234f9421993-06-17 12:35:49 +0000687}
688
Thomas Wouterse289e0b2000-08-24 20:08:19 +0000689static PyObject *
Martin v. Löwis18e16552006-02-15 17:27:45 +0000690list_inplace_repeat(PyListObject *self, Py_ssize_t n)
Thomas Wouterse289e0b2000-08-24 20:08:19 +0000691{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000692 PyObject **items;
693 Py_ssize_t size, i, j, p;
Thomas Wouterse289e0b2000-08-24 20:08:19 +0000694
695
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000696 size = PyList_GET_SIZE(self);
697 if (size == 0 || n == 1) {
698 Py_INCREF(self);
699 return (PyObject *)self;
700 }
Thomas Wouterse289e0b2000-08-24 20:08:19 +0000701
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000702 if (n < 1) {
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200703 (void)_list_clear(self);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000704 Py_INCREF(self);
705 return (PyObject *)self;
706 }
Thomas Wouterse289e0b2000-08-24 20:08:19 +0000707
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000708 if (size > PY_SSIZE_T_MAX / n) {
709 return PyErr_NoMemory();
710 }
Christian Heimesaf98da12008-01-27 15:18:18 +0000711
Raymond Hettinger0dceb912016-01-25 10:33:30 -0800712 if (list_resize(self, size*n) < 0)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000713 return NULL;
Raymond Hettinger4bb95402004-02-13 11:36:39 +0000714
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000715 p = size;
716 items = self->ob_item;
717 for (i = 1; i < n; i++) { /* Start counting at 1, not 0 */
718 for (j = 0; j < size; j++) {
719 PyObject *o = items[j];
720 Py_INCREF(o);
721 items[p++] = o;
722 }
723 }
724 Py_INCREF(self);
725 return (PyObject *)self;
Thomas Wouterse289e0b2000-08-24 20:08:19 +0000726}
727
Guido van Rossum4a450d01991-04-03 19:05:18 +0000728static int
Martin v. Löwis18e16552006-02-15 17:27:45 +0000729list_ass_item(PyListObject *a, Py_ssize_t i, PyObject *v)
Guido van Rossum4a450d01991-04-03 19:05:18 +0000730{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000731 if (i < 0 || i >= Py_SIZE(a)) {
732 PyErr_SetString(PyExc_IndexError,
733 "list assignment index out of range");
734 return -1;
735 }
736 if (v == NULL)
737 return list_ass_slice(a, i, i+1, v);
738 Py_INCREF(v);
Serhiy Storchakaf01e4082016-04-10 18:12:01 +0300739 Py_SETREF(a->ob_item[i], v);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000740 return 0;
Guido van Rossum4a450d01991-04-03 19:05:18 +0000741}
742
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200743/*[clinic input]
744list.insert
745
746 index: Py_ssize_t
747 object: object
748 /
749
750Insert object before index.
751[clinic start generated code]*/
752
Guido van Rossumc0b618a1997-05-02 03:12:38 +0000753static PyObject *
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200754list_insert_impl(PyListObject *self, Py_ssize_t index, PyObject *object)
755/*[clinic end generated code: output=7f35e32f60c8cb78 input=858514cf894c7eab]*/
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000756{
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200757 if (ins1(self, index, object) == 0)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000758 Py_RETURN_NONE;
759 return NULL;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000760}
761
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200762/*[clinic input]
763list.clear
764
765Remove all items from list.
766[clinic start generated code]*/
767
Guido van Rossumc0b618a1997-05-02 03:12:38 +0000768static PyObject *
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200769list_clear_impl(PyListObject *self)
770/*[clinic end generated code: output=67a1896c01f74362 input=ca3c1646856742f6]*/
Eli Benderskycbbaa962011-02-25 05:47:53 +0000771{
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200772 _list_clear(self);
Eli Benderskycbbaa962011-02-25 05:47:53 +0000773 Py_RETURN_NONE;
774}
775
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200776/*[clinic input]
777list.copy
778
779Return a shallow copy of the list.
780[clinic start generated code]*/
781
Eli Benderskycbbaa962011-02-25 05:47:53 +0000782static PyObject *
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200783list_copy_impl(PyListObject *self)
784/*[clinic end generated code: output=ec6b72d6209d418e input=6453ab159e84771f]*/
Eli Benderskycbbaa962011-02-25 05:47:53 +0000785{
786 return list_slice(self, 0, Py_SIZE(self));
787}
788
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200789/*[clinic input]
790list.append
791
792 object: object
793 /
794
795Append object to the end of the list.
796[clinic start generated code]*/
797
Eli Benderskycbbaa962011-02-25 05:47:53 +0000798static PyObject *
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200799list_append(PyListObject *self, PyObject *object)
800/*[clinic end generated code: output=7c096003a29c0eae input=43a3fe48a7066e91]*/
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000801{
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200802 if (app1(self, object) == 0)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000803 Py_RETURN_NONE;
804 return NULL;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000805}
806
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200807/*[clinic input]
808list.extend
809
810 iterable: object
811 /
812
813Extend list by appending elements from the iterable.
814[clinic start generated code]*/
815
Barry Warsawdedf6d61998-10-09 16:37:25 +0000816static PyObject *
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200817list_extend(PyListObject *self, PyObject *iterable)
818/*[clinic end generated code: output=630fb3bca0c8e789 input=9ec5ba3a81be3a4d]*/
Thomas Wouterse289e0b2000-08-24 20:08:19 +0000819{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000820 PyObject *it; /* iter(v) */
821 Py_ssize_t m; /* size of self */
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200822 Py_ssize_t n; /* guess for size of iterable */
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000823 Py_ssize_t mn; /* m + n */
824 Py_ssize_t i;
825 PyObject *(*iternext)(PyObject *);
Thomas Wouterse289e0b2000-08-24 20:08:19 +0000826
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000827 /* Special cases:
828 1) lists and tuples which can use PySequence_Fast ops
829 2) extending self to self requires making a copy first
830 */
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200831 if (PyList_CheckExact(iterable) || PyTuple_CheckExact(iterable) ||
832 (PyObject *)self == iterable) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000833 PyObject **src, **dest;
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200834 iterable = PySequence_Fast(iterable, "argument must be iterable");
835 if (!iterable)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000836 return NULL;
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200837 n = PySequence_Fast_GET_SIZE(iterable);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000838 if (n == 0) {
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200839 /* short circuit when iterable is empty */
840 Py_DECREF(iterable);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000841 Py_RETURN_NONE;
842 }
843 m = Py_SIZE(self);
Martin Panter94b39ce2017-01-14 06:30:37 +0000844 /* It should not be possible to allocate a list large enough to cause
845 an overflow on any relevant platform */
846 assert(m < PY_SSIZE_T_MAX - n);
Raymond Hettinger0dceb912016-01-25 10:33:30 -0800847 if (list_resize(self, m + n) < 0) {
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200848 Py_DECREF(iterable);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000849 return NULL;
850 }
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200851 /* note that we may still have self == iterable here for the
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000852 * situation a.extend(a), but the following code works
853 * in that case too. Just make sure to resize self
854 * before calling PySequence_Fast_ITEMS.
855 */
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200856 /* populate the end of self with iterable's items */
857 src = PySequence_Fast_ITEMS(iterable);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000858 dest = self->ob_item + m;
859 for (i = 0; i < n; i++) {
860 PyObject *o = src[i];
861 Py_INCREF(o);
862 dest[i] = o;
863 }
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200864 Py_DECREF(iterable);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000865 Py_RETURN_NONE;
866 }
Raymond Hettinger90a39bf2004-02-15 03:57:00 +0000867
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200868 it = PyObject_GetIter(iterable);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000869 if (it == NULL)
870 return NULL;
871 iternext = *it->ob_type->tp_iternext;
Thomas Wouterse289e0b2000-08-24 20:08:19 +0000872
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000873 /* Guess a result list size. */
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200874 n = PyObject_LengthHint(iterable, 8);
Raymond Hettinger0dceb912016-01-25 10:33:30 -0800875 if (n < 0) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000876 Py_DECREF(it);
877 return NULL;
878 }
879 m = Py_SIZE(self);
Martin Panterb93d8632016-07-25 02:39:20 +0000880 if (m > PY_SSIZE_T_MAX - n) {
881 /* m + n overflowed; on the chance that n lied, and there really
882 * is enough room, ignore it. If n was telling the truth, we'll
883 * eventually run out of memory during the loop.
884 */
885 }
886 else {
887 mn = m + n;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000888 /* Make room. */
Raymond Hettinger0dceb912016-01-25 10:33:30 -0800889 if (list_resize(self, mn) < 0)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000890 goto error;
891 /* Make the list sane again. */
892 Py_SIZE(self) = m;
893 }
Thomas Wouterse289e0b2000-08-24 20:08:19 +0000894
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000895 /* Run iterator to exhaustion. */
896 for (;;) {
897 PyObject *item = iternext(it);
898 if (item == NULL) {
899 if (PyErr_Occurred()) {
900 if (PyErr_ExceptionMatches(PyExc_StopIteration))
901 PyErr_Clear();
902 else
903 goto error;
904 }
905 break;
906 }
907 if (Py_SIZE(self) < self->allocated) {
908 /* steals ref */
909 PyList_SET_ITEM(self, Py_SIZE(self), item);
910 ++Py_SIZE(self);
911 }
912 else {
913 int status = app1(self, item);
914 Py_DECREF(item); /* append creates a new ref */
915 if (status < 0)
916 goto error;
917 }
918 }
Raymond Hettinger90a39bf2004-02-15 03:57:00 +0000919
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000920 /* Cut back result list if initial guess was too large. */
Victor Stinner32fd6ea2013-07-16 21:45:58 +0200921 if (Py_SIZE(self) < self->allocated) {
922 if (list_resize(self, Py_SIZE(self)) < 0)
923 goto error;
924 }
Raymond Hettingeraa241e02004-09-26 19:24:20 +0000925
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000926 Py_DECREF(it);
927 Py_RETURN_NONE;
Raymond Hettinger90a39bf2004-02-15 03:57:00 +0000928
929 error:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000930 Py_DECREF(it);
931 return NULL;
Thomas Wouterse289e0b2000-08-24 20:08:19 +0000932}
933
Raymond Hettinger8ca92ae2004-03-11 09:13:12 +0000934PyObject *
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200935_PyList_Extend(PyListObject *self, PyObject *iterable)
Raymond Hettinger8ca92ae2004-03-11 09:13:12 +0000936{
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200937 return list_extend(self, iterable);
Raymond Hettinger8ca92ae2004-03-11 09:13:12 +0000938}
939
Thomas Wouterse289e0b2000-08-24 20:08:19 +0000940static PyObject *
Raymond Hettinger97bc6182004-03-11 07:34:19 +0000941list_inplace_concat(PyListObject *self, PyObject *other)
942{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000943 PyObject *result;
Raymond Hettinger97bc6182004-03-11 07:34:19 +0000944
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200945 result = list_extend(self, other);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000946 if (result == NULL)
947 return result;
948 Py_DECREF(result);
949 Py_INCREF(self);
950 return (PyObject *)self;
Raymond Hettinger97bc6182004-03-11 07:34:19 +0000951}
952
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200953/*[clinic input]
954list.pop
955
956 index: Py_ssize_t = -1
957 /
958
959Remove and return item at index (default last).
960
961Raises IndexError if list is empty or index is out of range.
962[clinic start generated code]*/
963
Raymond Hettinger97bc6182004-03-11 07:34:19 +0000964static PyObject *
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200965list_pop_impl(PyListObject *self, Py_ssize_t index)
966/*[clinic end generated code: output=6bd69dcb3f17eca8 input=b83675976f329e6f]*/
Guido van Rossum3dd7f3f1998-06-30 15:36:32 +0000967{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000968 PyObject *v;
969 int status;
Raymond Hettinger9eb86b32004-02-17 11:36:16 +0000970
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000971 if (Py_SIZE(self) == 0) {
972 /* Special-case most common failure cause */
973 PyErr_SetString(PyExc_IndexError, "pop from empty list");
974 return NULL;
975 }
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200976 if (index < 0)
977 index += Py_SIZE(self);
978 if (index < 0 || index >= Py_SIZE(self)) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000979 PyErr_SetString(PyExc_IndexError, "pop index out of range");
980 return NULL;
981 }
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200982 v = self->ob_item[index];
983 if (index == Py_SIZE(self) - 1) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000984 status = list_resize(self, Py_SIZE(self) - 1);
Victor Stinnerb27cd3e2013-07-08 22:20:44 +0200985 if (status >= 0)
986 return v; /* and v now owns the reference the list had */
987 else
988 return NULL;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000989 }
990 Py_INCREF(v);
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200991 status = list_ass_slice(self, index, index+1, (PyObject *)NULL);
Victor Stinner095d99f2013-07-17 21:58:01 +0200992 if (status < 0) {
993 Py_DECREF(v);
994 return NULL;
995 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000996 return v;
Guido van Rossum3dd7f3f1998-06-30 15:36:32 +0000997}
998
Tim Peters8e2e7ca2002-07-19 02:33:08 +0000999/* Reverse a slice of a list in place, from lo up to (exclusive) hi. */
1000static void
1001reverse_slice(PyObject **lo, PyObject **hi)
1002{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001003 assert(lo && hi);
Tim Peters8e2e7ca2002-07-19 02:33:08 +00001004
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001005 --hi;
1006 while (lo < hi) {
1007 PyObject *t = *lo;
1008 *lo = *hi;
1009 *hi = t;
1010 ++lo;
1011 --hi;
1012 }
Tim Peters8e2e7ca2002-07-19 02:33:08 +00001013}
1014
Tim Petersa64dc242002-08-01 02:13:36 +00001015/* Lots of code for an adaptive, stable, natural mergesort. There are many
1016 * pieces to this algorithm; read listsort.txt for overviews and details.
1017 */
Guido van Rossum3f236de1996-12-10 23:55:39 +00001018
Daniel Stutzbach98338222010-12-02 21:55:33 +00001019/* A sortslice contains a pointer to an array of keys and a pointer to
1020 * an array of corresponding values. In other words, keys[i]
1021 * corresponds with values[i]. If values == NULL, then the keys are
1022 * also the values.
1023 *
1024 * Several convenience routines are provided here, so that keys and
1025 * values are always moved in sync.
1026 */
1027
/* Two parallel arrays that the sortslice_* helpers move in step. */
1028typedef struct {
1029 PyObject **keys; /* array of keys */
1030 PyObject **values; /* values[i] goes with keys[i]; NULL when the keys are also the values */
1031} sortslice;
1032
1033Py_LOCAL_INLINE(void)
1034sortslice_copy(sortslice *s1, Py_ssize_t i, sortslice *s2, Py_ssize_t j)
1035{
1036 s1->keys[i] = s2->keys[j];
1037 if (s1->values != NULL)
1038 s1->values[i] = s2->values[j];
1039}
1040
1041Py_LOCAL_INLINE(void)
Benjamin Peterson9efdcca2010-12-03 01:44:10 +00001042sortslice_copy_incr(sortslice *dst, sortslice *src)
1043{
Daniel Stutzbach98338222010-12-02 21:55:33 +00001044 *dst->keys++ = *src->keys++;
1045 if (dst->values != NULL)
1046 *dst->values++ = *src->values++;
1047}
1048
1049Py_LOCAL_INLINE(void)
Benjamin Peterson9efdcca2010-12-03 01:44:10 +00001050sortslice_copy_decr(sortslice *dst, sortslice *src)
1051{
Daniel Stutzbach98338222010-12-02 21:55:33 +00001052 *dst->keys-- = *src->keys--;
1053 if (dst->values != NULL)
1054 *dst->values-- = *src->values--;
1055}
1056
1057
1058Py_LOCAL_INLINE(void)
1059sortslice_memcpy(sortslice *s1, Py_ssize_t i, sortslice *s2, Py_ssize_t j,
Benjamin Peterson9efdcca2010-12-03 01:44:10 +00001060 Py_ssize_t n)
1061{
Daniel Stutzbach98338222010-12-02 21:55:33 +00001062 memcpy(&s1->keys[i], &s2->keys[j], sizeof(PyObject *) * n);
1063 if (s1->values != NULL)
1064 memcpy(&s1->values[i], &s2->values[j], sizeof(PyObject *) * n);
1065}
1066
1067Py_LOCAL_INLINE(void)
1068sortslice_memmove(sortslice *s1, Py_ssize_t i, sortslice *s2, Py_ssize_t j,
Benjamin Peterson9efdcca2010-12-03 01:44:10 +00001069 Py_ssize_t n)
1070{
Daniel Stutzbach98338222010-12-02 21:55:33 +00001071 memmove(&s1->keys[i], &s2->keys[j], sizeof(PyObject *) * n);
1072 if (s1->values != NULL)
1073 memmove(&s1->values[i], &s2->values[j], sizeof(PyObject *) * n);
1074}
1075
1076Py_LOCAL_INLINE(void)
Benjamin Peterson9efdcca2010-12-03 01:44:10 +00001077sortslice_advance(sortslice *slice, Py_ssize_t n)
1078{
Daniel Stutzbach98338222010-12-02 21:55:33 +00001079 slice->keys += n;
1080 if (slice->values != NULL)
1081 slice->values += n;
1082}
1083
embg1e34da42018-01-28 20:03:23 -07001084/* Comparison function: ms->key_compare, which is set at run-time in
1085 * listsort_impl to optimize for various special cases.
Tim Petersa64dc242002-08-01 02:13:36 +00001086 * Returns -1 on error, 1 if x < y, 0 if x >= y.
1087 */
Guido van Rossum3f236de1996-12-10 23:55:39 +00001088
/* Expands to a call through ms->key_compare, so a MergeState pointer named
 * `ms` must be in scope wherever ISLT is used. */
embg1e34da42018-01-28 20:03:23 -07001089#define ISLT(X, Y) (*(ms->key_compare))(X, Y, ms)
Tim Peters66860f62002-08-04 17:47:26 +00001090
1091/* Compare X to Y via "<". Goto "fail" if the comparison raises an
Tim Petersa8c974c2002-07-19 03:30:57 +00001092 error. Else "k" is set to true iff X<Y, and an "if (k)" block is
1093 started. It makes more sense in context <wink>. X and Y are PyObject*s.
1094*/
/* Requirements at each expansion site: an integer variable `k`, a label
 * `fail`, and (through ISLT) a MergeState pointer `ms`.  The expansion is
 * two statements and ends in a bare `if (k)`, so the statement written after
 * IFLT(...) becomes that if's body and may be followed by `else`.  For the
 * same reason IFLT must not be used as the unbraced body of another
 * if/for/while. */
Raymond Hettinger70b64fc2008-01-30 20:15:17 +00001095#define IFLT(X, Y) if ((k = ISLT(X, Y)) < 0) goto fail; \
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001096 if (k)
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001097
embg1e34da42018-01-28 20:03:23 -07001098/* The maximum number of entries in a MergeState's pending-runs stack.
1099 * This is enough to sort arrays of size up to about
1100 * 32 * phi ** MAX_MERGE_PENDING
1101 * where phi ~= 1.618. 85 is ridiculously large enough, good for an array
1102 * with 2**64 elements.
1103 */
1104#define MAX_MERGE_PENDING 85
1105
1106/* When we get into galloping mode, we stay there until both runs win less
1107 * often than MIN_GALLOP consecutive times. See listsort.txt for more info.
1108 */
1109#define MIN_GALLOP 7
1110
1111/* Avoid malloc for small temp arrays. */
1112#define MERGESTATE_TEMP_SIZE 256
1113
1114/* One MergeState exists on the stack per invocation of mergesort. It's just
1115 * a convenient way to pass state around among the helper functions.
1116 */
/* One entry of MergeState.pending: a run of `len` elements starting at
 * `base`. */
1117struct s_slice {
1118 sortslice base; /* where the run starts */
1119 Py_ssize_t len; /* number of elements in the run */
1120};
1121
/* Bookkeeping shared by the merge helpers: gallop threshold, temp storage,
 * the stack of pending runs, and the comparison functions in use. */
1122typedef struct s_MergeState MergeState;
1123struct s_MergeState {
1124 /* This controls when we get *into* galloping mode. It's initialized
1125 * to MIN_GALLOP. merge_lo and merge_hi tend to nudge it higher for
1126 * random data, and lower for highly structured data.
1127 */
1128 Py_ssize_t min_gallop;
1129
1130 /* 'a' is temp storage to help with merges. It contains room for
1131 * alloced entries.
1132 */
1133 sortslice a; /* may point to temparray below */
1134 Py_ssize_t alloced;
1135
1136 /* A stack of n pending runs yet to be merged. Run #i starts at
1137 * address base[i] and extends for len[i] elements. It's always
1138 * true (so long as the indices are in bounds) that
1139 *
1140 * pending[i].base + pending[i].len == pending[i+1].base
1141 *
1142 * so we could cut the storage for this, but it's a minor amount,
1143 * and keeping all the info explicit simplifies the code.
1144 */
1145 int n; /* number of runs currently on the pending stack */
1146 struct s_slice pending[MAX_MERGE_PENDING];
1147
1148 /* 'a' points to this when possible, rather than muck with malloc. */
1149 PyObject *temparray[MERGESTATE_TEMP_SIZE];
1150
/* NOTE: merge_init() does not assign any of the three function pointers
 * below; they have to be set separately before ISLT is used. */
1151 /* This is the function we will use to compare two keys,
1152 * even when none of our special cases apply and we have to use
1153 * safe_object_compare. */
1154 int (*key_compare)(PyObject *, PyObject *, MergeState *);
1155
1156 /* This function is used by unsafe_object_compare to optimize comparisons
1157 * when we know our list is type-homogeneous but we can't assume anything else.
1158 * In the pre-sort check it is set equal to key->ob_type->tp_richcompare */
1159 PyObject *(*key_richcompare)(PyObject *, PyObject *, int);
1160
1161 /* This function is used by unsafe_tuple_compare to compare the first elements
1162 * of tuples. It may be set to safe_object_compare, but the idea is that hopefully
1163 * we can assume more, and use one of the special-case compares. */
1164 int (*tuple_elem_compare)(PyObject *, PyObject *, MergeState *);
1165};
1166
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001167/* binarysort is the best method for sorting small arrays: it does
1168 few compares, but can do data movement quadratic in the number of
1169 elements.
Guido van Rossum42812581998-06-17 14:15:44 +00001170 [lo, hi) is a contiguous slice of a list, and is sorted via
Tim Petersa8c974c2002-07-19 03:30:57 +00001171 binary insertion. This sort is stable.
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001172 On entry, must have lo <= start <= hi, and that [lo, start) is already
1173 sorted (pass start == lo if you don't know!).
Tim Petersa8c974c2002-07-19 03:30:57 +00001174 If islt() complains return -1, else 0.
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001175 Even in case of error, the output slice will be some permutation of
1176 the input (nothing is lost or duplicated).
1177*/
Guido van Rossum3f236de1996-12-10 23:55:39 +00001178static int
embg1e34da42018-01-28 20:03:23 -07001179binarysort(MergeState *ms, sortslice lo, PyObject **hi, PyObject **start)
Guido van Rossum3f236de1996-12-10 23:55:39 +00001180{
Antoine Pitrou9ed5f272013-08-13 20:18:52 +02001181 Py_ssize_t k;
1182 PyObject **l, **p, **r;
1183 PyObject *pivot;
Guido van Rossum3f236de1996-12-10 23:55:39 +00001184
Daniel Stutzbach98338222010-12-02 21:55:33 +00001185 assert(lo.keys <= start && start <= hi);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001186 /* assert [lo, start) is sorted */
Daniel Stutzbach98338222010-12-02 21:55:33 +00001187 if (lo.keys == start)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001188 ++start;
1189 for (; start < hi; ++start) {
1190 /* set l to where *start belongs */
Daniel Stutzbach98338222010-12-02 21:55:33 +00001191 l = lo.keys;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001192 r = start;
1193 pivot = *r;
1194 /* Invariants:
1195 * pivot >= all in [lo, l).
1196 * pivot < all in [r, start).
1197 * The second is vacuously true at the start.
1198 */
1199 assert(l < r);
1200 do {
1201 p = l + ((r - l) >> 1);
1202 IFLT(pivot, *p)
1203 r = p;
1204 else
1205 l = p+1;
1206 } while (l < r);
1207 assert(l == r);
1208 /* The invariants still hold, so pivot >= all in [lo, l) and
1209 pivot < all in [l, start), so pivot belongs at l. Note
1210 that if there are elements equal to pivot, l points to the
1211 first slot after them -- that's why this sort is stable.
1212 Slide over to make room.
1213 Caution: using memmove is much slower under MSVC 5;
1214 we're not usually moving many slots. */
1215 for (p = start; p > l; --p)
1216 *p = *(p-1);
1217 *l = pivot;
Daniel Stutzbach98338222010-12-02 21:55:33 +00001218 if (lo.values != NULL) {
1219 Py_ssize_t offset = lo.values - lo.keys;
1220 p = start + offset;
1221 pivot = *p;
1222 l += offset;
1223 for (p = start + offset; p > l; --p)
1224 *p = *(p-1);
1225 *l = pivot;
1226 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001227 }
1228 return 0;
Guido van Rossuma119c0d1998-05-29 17:56:32 +00001229
1230 fail:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001231 return -1;
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001232}
1233
Tim Petersa64dc242002-08-01 02:13:36 +00001234/*
1235Return the length of the run beginning at lo, in the slice [lo, hi). lo < hi
1236is required on entry. "A run" is the longest ascending sequence, with
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001237
Tim Petersa64dc242002-08-01 02:13:36 +00001238 lo[0] <= lo[1] <= lo[2] <= ...
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001239
Tim Petersa64dc242002-08-01 02:13:36 +00001240or the longest descending sequence, with
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001241
Tim Petersa64dc242002-08-01 02:13:36 +00001242 lo[0] > lo[1] > lo[2] > ...
Tim Peters3b01a122002-07-19 02:35:45 +00001243
Tim Petersa64dc242002-08-01 02:13:36 +00001244Boolean *descending is set to 0 in the former case, or to 1 in the latter.
1245For its intended use in a stable mergesort, the strictness of the defn of
1246"descending" is needed so that the caller can safely reverse a descending
1247sequence without violating stability (strict > ensures there are no equal
1248elements to get out of order).
1249
1250Returns -1 in case of error.
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001251*/
Martin v. Löwis18e16552006-02-15 17:27:45 +00001252static Py_ssize_t
embg1e34da42018-01-28 20:03:23 -07001253count_run(MergeState *ms, PyObject **lo, PyObject **hi, int *descending)
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001254{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001255 Py_ssize_t k;
1256 Py_ssize_t n;
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001257
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001258 assert(lo < hi);
1259 *descending = 0;
1260 ++lo;
1261 if (lo == hi)
1262 return 1;
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001263
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001264 n = 2;
1265 IFLT(*lo, *(lo-1)) {
1266 *descending = 1;
1267 for (lo = lo+1; lo < hi; ++lo, ++n) {
1268 IFLT(*lo, *(lo-1))
1269 ;
1270 else
1271 break;
1272 }
1273 }
1274 else {
1275 for (lo = lo+1; lo < hi; ++lo, ++n) {
1276 IFLT(*lo, *(lo-1))
1277 break;
1278 }
1279 }
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001280
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001281 return n;
Tim Petersa64dc242002-08-01 02:13:36 +00001282fail:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001283 return -1;
Tim Petersa64dc242002-08-01 02:13:36 +00001284}
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001285
Tim Petersa64dc242002-08-01 02:13:36 +00001286/*
1287Locate the proper position of key in a sorted vector; if the vector contains
1288an element equal to key, return the position immediately to the left of
1289the leftmost equal element. [gallop_right() does the same except returns
1290the position to the right of the rightmost equal element (if any).]
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001291
Tim Petersa64dc242002-08-01 02:13:36 +00001292"a" is a sorted vector with n elements, starting at a[0]. n must be > 0.
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001293
Tim Petersa64dc242002-08-01 02:13:36 +00001294"hint" is an index at which to begin the search, 0 <= hint < n. The closer
1295hint is to the final result, the faster this runs.
1296
1297The return value is the int k in 0..n such that
1298
1299 a[k-1] < key <= a[k]
1300
1301pretending that *(a-1) is minus infinity and a[n] is plus infinity. IOW,
1302key belongs at index k; or, IOW, the first k elements of a should precede
1303key, and the last n-k should follow key.
1304
1305Returns -1 on error. See listsort.txt for info on the method.
1306*/
Martin v. Löwis18e16552006-02-15 17:27:45 +00001307static Py_ssize_t
embg1e34da42018-01-28 20:03:23 -07001308gallop_left(MergeState *ms, PyObject *key, PyObject **a, Py_ssize_t n, Py_ssize_t hint)
Tim Petersa64dc242002-08-01 02:13:36 +00001309{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001310 Py_ssize_t ofs;
1311 Py_ssize_t lastofs;
1312 Py_ssize_t k;
Tim Petersa64dc242002-08-01 02:13:36 +00001313
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001314 assert(key && a && n > 0 && hint >= 0 && hint < n);
Tim Petersa64dc242002-08-01 02:13:36 +00001315
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001316 a += hint;
1317 lastofs = 0;
1318 ofs = 1;
1319 IFLT(*a, key) {
1320 /* a[hint] < key -- gallop right, until
1321 * a[hint + lastofs] < key <= a[hint + ofs]
1322 */
1323 const Py_ssize_t maxofs = n - hint; /* &a[n-1] is highest */
1324 while (ofs < maxofs) {
1325 IFLT(a[ofs], key) {
1326 lastofs = ofs;
1327 ofs = (ofs << 1) + 1;
1328 if (ofs <= 0) /* int overflow */
1329 ofs = maxofs;
1330 }
1331 else /* key <= a[hint + ofs] */
1332 break;
1333 }
1334 if (ofs > maxofs)
1335 ofs = maxofs;
1336 /* Translate back to offsets relative to &a[0]. */
1337 lastofs += hint;
1338 ofs += hint;
1339 }
1340 else {
1341 /* key <= a[hint] -- gallop left, until
1342 * a[hint - ofs] < key <= a[hint - lastofs]
1343 */
1344 const Py_ssize_t maxofs = hint + 1; /* &a[0] is lowest */
1345 while (ofs < maxofs) {
1346 IFLT(*(a-ofs), key)
1347 break;
1348 /* key <= a[hint - ofs] */
1349 lastofs = ofs;
1350 ofs = (ofs << 1) + 1;
1351 if (ofs <= 0) /* int overflow */
1352 ofs = maxofs;
1353 }
1354 if (ofs > maxofs)
1355 ofs = maxofs;
1356 /* Translate back to positive offsets relative to &a[0]. */
1357 k = lastofs;
1358 lastofs = hint - ofs;
1359 ofs = hint - k;
1360 }
1361 a -= hint;
Tim Petersa64dc242002-08-01 02:13:36 +00001362
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001363 assert(-1 <= lastofs && lastofs < ofs && ofs <= n);
1364 /* Now a[lastofs] < key <= a[ofs], so key belongs somewhere to the
1365 * right of lastofs but no farther right than ofs. Do a binary
1366 * search, with invariant a[lastofs-1] < key <= a[ofs].
1367 */
1368 ++lastofs;
1369 while (lastofs < ofs) {
1370 Py_ssize_t m = lastofs + ((ofs - lastofs) >> 1);
Tim Petersa64dc242002-08-01 02:13:36 +00001371
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001372 IFLT(a[m], key)
1373 lastofs = m+1; /* a[m] < key */
1374 else
1375 ofs = m; /* key <= a[m] */
1376 }
1377 assert(lastofs == ofs); /* so a[ofs-1] < key <= a[ofs] */
1378 return ofs;
Tim Petersa64dc242002-08-01 02:13:36 +00001379
1380fail:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001381 return -1;
Tim Petersa64dc242002-08-01 02:13:36 +00001382}
1383
1384/*
1385Exactly like gallop_left(), except that if key already exists in a[0:n],
1386finds the position immediately to the right of the rightmost equal value.
1387
1388The return value is the int k in 0..n such that
1389
1390 a[k-1] <= key < a[k]
1391
1392or -1 if error.
1393
1394The code duplication is massive, but this is enough different given that
1395we're sticking to "<" comparisons that it's much harder to follow if
1396written as one routine with yet another "left or right?" flag.
1397*/
Martin v. Löwis18e16552006-02-15 17:27:45 +00001398static Py_ssize_t
embg1e34da42018-01-28 20:03:23 -07001399gallop_right(MergeState *ms, PyObject *key, PyObject **a, Py_ssize_t n, Py_ssize_t hint)
Tim Petersa64dc242002-08-01 02:13:36 +00001400{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001401 Py_ssize_t ofs;
1402 Py_ssize_t lastofs;
1403 Py_ssize_t k;
Tim Petersa64dc242002-08-01 02:13:36 +00001404
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001405 assert(key && a && n > 0 && hint >= 0 && hint < n);
Tim Petersa64dc242002-08-01 02:13:36 +00001406
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001407 a += hint;
1408 lastofs = 0;
1409 ofs = 1;
1410 IFLT(key, *a) {
1411 /* key < a[hint] -- gallop left, until
1412 * a[hint - ofs] <= key < a[hint - lastofs]
1413 */
1414 const Py_ssize_t maxofs = hint + 1; /* &a[0] is lowest */
1415 while (ofs < maxofs) {
1416 IFLT(key, *(a-ofs)) {
1417 lastofs = ofs;
1418 ofs = (ofs << 1) + 1;
1419 if (ofs <= 0) /* int overflow */
1420 ofs = maxofs;
1421 }
1422 else /* a[hint - ofs] <= key */
1423 break;
1424 }
1425 if (ofs > maxofs)
1426 ofs = maxofs;
1427 /* Translate back to positive offsets relative to &a[0]. */
1428 k = lastofs;
1429 lastofs = hint - ofs;
1430 ofs = hint - k;
1431 }
1432 else {
1433 /* a[hint] <= key -- gallop right, until
1434 * a[hint + lastofs] <= key < a[hint + ofs]
1435 */
1436 const Py_ssize_t maxofs = n - hint; /* &a[n-1] is highest */
1437 while (ofs < maxofs) {
1438 IFLT(key, a[ofs])
1439 break;
1440 /* a[hint + ofs] <= key */
1441 lastofs = ofs;
1442 ofs = (ofs << 1) + 1;
1443 if (ofs <= 0) /* int overflow */
1444 ofs = maxofs;
1445 }
1446 if (ofs > maxofs)
1447 ofs = maxofs;
1448 /* Translate back to offsets relative to &a[0]. */
1449 lastofs += hint;
1450 ofs += hint;
1451 }
1452 a -= hint;
Tim Petersa64dc242002-08-01 02:13:36 +00001453
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001454 assert(-1 <= lastofs && lastofs < ofs && ofs <= n);
1455 /* Now a[lastofs] <= key < a[ofs], so key belongs somewhere to the
1456 * right of lastofs but no farther right than ofs. Do a binary
1457 * search, with invariant a[lastofs-1] <= key < a[ofs].
1458 */
1459 ++lastofs;
1460 while (lastofs < ofs) {
1461 Py_ssize_t m = lastofs + ((ofs - lastofs) >> 1);
Tim Petersa64dc242002-08-01 02:13:36 +00001462
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001463 IFLT(key, a[m])
1464 ofs = m; /* key < a[m] */
1465 else
1466 lastofs = m+1; /* a[m] <= key */
1467 }
1468 assert(lastofs == ofs); /* so a[ofs-1] <= key < a[ofs] */
1469 return ofs;
Tim Petersa64dc242002-08-01 02:13:36 +00001470
1471fail:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001472 return -1;
Tim Petersa64dc242002-08-01 02:13:36 +00001473}
1474
Tim Petersa64dc242002-08-01 02:13:36 +00001475/* Conceptually a MergeState's constructor. */
1476static void
Victor Stinner0fcab4a2011-01-04 12:59:15 +00001477merge_init(MergeState *ms, Py_ssize_t list_size, int has_keyfunc)
Tim Petersa64dc242002-08-01 02:13:36 +00001478{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001479 assert(ms != NULL);
Daniel Stutzbach98338222010-12-02 21:55:33 +00001480 if (has_keyfunc) {
1481 /* The temporary space for merging will need at most half the list
1482 * size rounded up. Use the minimum possible space so we can use the
1483 * rest of temparray for other things. In particular, if there is
1484 * enough extra space, listsort() will use it to store the keys.
1485 */
1486 ms->alloced = (list_size + 1) / 2;
1487
1488 /* ms->alloced describes how many keys will be stored at
1489 ms->temparray, but we also need to store the values. Hence,
1490 ms->alloced is capped at half of MERGESTATE_TEMP_SIZE. */
1491 if (MERGESTATE_TEMP_SIZE / 2 < ms->alloced)
1492 ms->alloced = MERGESTATE_TEMP_SIZE / 2;
1493 ms->a.values = &ms->temparray[ms->alloced];
1494 }
1495 else {
1496 ms->alloced = MERGESTATE_TEMP_SIZE;
1497 ms->a.values = NULL;
1498 }
1499 ms->a.keys = ms->temparray;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001500 ms->n = 0;
1501 ms->min_gallop = MIN_GALLOP;
Tim Petersa64dc242002-08-01 02:13:36 +00001502}
1503
1504/* Free all the temp memory owned by the MergeState. This must be called
1505 * when you're done with a MergeState, and may be called before then if
1506 * you want to free the temp memory early.
1507 */
1508static void
1509merge_freemem(MergeState *ms)
1510{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001511 assert(ms != NULL);
Daniel Stutzbach98338222010-12-02 21:55:33 +00001512 if (ms->a.keys != ms->temparray)
1513 PyMem_Free(ms->a.keys);
Tim Petersa64dc242002-08-01 02:13:36 +00001514}
1515
1516/* Ensure enough temp memory for 'need' array slots is available.
1517 * Returns 0 on success and -1 if the memory can't be gotten.
1518 */
1519static int
Martin v. Löwis18e16552006-02-15 17:27:45 +00001520merge_getmem(MergeState *ms, Py_ssize_t need)
Tim Petersa64dc242002-08-01 02:13:36 +00001521{
Daniel Stutzbach98338222010-12-02 21:55:33 +00001522 int multiplier;
1523
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001524 assert(ms != NULL);
1525 if (need <= ms->alloced)
1526 return 0;
Daniel Stutzbach98338222010-12-02 21:55:33 +00001527
1528 multiplier = ms->a.values != NULL ? 2 : 1;
1529
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001530 /* Don't realloc! That can cost cycles to copy the old data, but
1531 * we don't care what's in the block.
1532 */
1533 merge_freemem(ms);
embg1e34da42018-01-28 20:03:23 -07001534 if ((size_t)need > PY_SSIZE_T_MAX / sizeof(PyObject *) / multiplier) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001535 PyErr_NoMemory();
1536 return -1;
1537 }
embg1e34da42018-01-28 20:03:23 -07001538 ms->a.keys = (PyObject **)PyMem_Malloc(multiplier * need
Daniel Stutzbach98338222010-12-02 21:55:33 +00001539 * sizeof(PyObject *));
1540 if (ms->a.keys != NULL) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001541 ms->alloced = need;
Daniel Stutzbach98338222010-12-02 21:55:33 +00001542 if (ms->a.values != NULL)
1543 ms->a.values = &ms->a.keys[need];
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001544 return 0;
1545 }
1546 PyErr_NoMemory();
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001547 return -1;
Tim Petersa64dc242002-08-01 02:13:36 +00001548}
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001549#define MERGE_GETMEM(MS, NEED) ((NEED) <= (MS)->alloced ? 0 : \
1550 merge_getmem(MS, NEED))
Tim Petersa64dc242002-08-01 02:13:36 +00001551
Daniel Stutzbach98338222010-12-02 21:55:33 +00001552/* Merge the na elements starting at ssa with the nb elements starting at
1553 * ssb.keys = ssa.keys + na in a stable way, in-place. na and nb must be > 0.
1554 * Must also have that ssa.keys[na-1] belongs at the end of the merge, and
1555 * should have na <= nb. See listsort.txt for more info. Return 0 if
1556 * successful, -1 if error.
Tim Petersa64dc242002-08-01 02:13:36 +00001557 */
Martin v. Löwis18e16552006-02-15 17:27:45 +00001558static Py_ssize_t
Daniel Stutzbach98338222010-12-02 21:55:33 +00001559merge_lo(MergeState *ms, sortslice ssa, Py_ssize_t na,
1560 sortslice ssb, Py_ssize_t nb)
Tim Petersa64dc242002-08-01 02:13:36 +00001561{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001562 Py_ssize_t k;
Daniel Stutzbach98338222010-12-02 21:55:33 +00001563 sortslice dest;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001564 int result = -1; /* guilty until proved innocent */
1565 Py_ssize_t min_gallop;
Tim Petersa64dc242002-08-01 02:13:36 +00001566
Daniel Stutzbach98338222010-12-02 21:55:33 +00001567 assert(ms && ssa.keys && ssb.keys && na > 0 && nb > 0);
1568 assert(ssa.keys + na == ssb.keys);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001569 if (MERGE_GETMEM(ms, na) < 0)
1570 return -1;
Daniel Stutzbach98338222010-12-02 21:55:33 +00001571 sortslice_memcpy(&ms->a, 0, &ssa, 0, na);
1572 dest = ssa;
1573 ssa = ms->a;
Tim Petersa64dc242002-08-01 02:13:36 +00001574
Daniel Stutzbach98338222010-12-02 21:55:33 +00001575 sortslice_copy_incr(&dest, &ssb);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001576 --nb;
1577 if (nb == 0)
1578 goto Succeed;
1579 if (na == 1)
1580 goto CopyB;
Tim Petersa64dc242002-08-01 02:13:36 +00001581
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001582 min_gallop = ms->min_gallop;
1583 for (;;) {
1584 Py_ssize_t acount = 0; /* # of times A won in a row */
1585 Py_ssize_t bcount = 0; /* # of times B won in a row */
Tim Petersa64dc242002-08-01 02:13:36 +00001586
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001587 /* Do the straightforward thing until (if ever) one run
1588 * appears to win consistently.
1589 */
1590 for (;;) {
1591 assert(na > 1 && nb > 0);
Daniel Stutzbach98338222010-12-02 21:55:33 +00001592 k = ISLT(ssb.keys[0], ssa.keys[0]);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001593 if (k) {
1594 if (k < 0)
1595 goto Fail;
Daniel Stutzbach98338222010-12-02 21:55:33 +00001596 sortslice_copy_incr(&dest, &ssb);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001597 ++bcount;
1598 acount = 0;
1599 --nb;
1600 if (nb == 0)
1601 goto Succeed;
1602 if (bcount >= min_gallop)
1603 break;
1604 }
1605 else {
Daniel Stutzbach98338222010-12-02 21:55:33 +00001606 sortslice_copy_incr(&dest, &ssa);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001607 ++acount;
1608 bcount = 0;
1609 --na;
1610 if (na == 1)
1611 goto CopyB;
1612 if (acount >= min_gallop)
1613 break;
1614 }
1615 }
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001616
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001617 /* One run is winning so consistently that galloping may
1618 * be a huge win. So try that, and continue galloping until
1619 * (if ever) neither run appears to be winning consistently
1620 * anymore.
1621 */
1622 ++min_gallop;
1623 do {
1624 assert(na > 1 && nb > 0);
1625 min_gallop -= min_gallop > 1;
1626 ms->min_gallop = min_gallop;
embg1e34da42018-01-28 20:03:23 -07001627 k = gallop_right(ms, ssb.keys[0], ssa.keys, na, 0);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001628 acount = k;
1629 if (k) {
1630 if (k < 0)
1631 goto Fail;
Daniel Stutzbach98338222010-12-02 21:55:33 +00001632 sortslice_memcpy(&dest, 0, &ssa, 0, k);
1633 sortslice_advance(&dest, k);
1634 sortslice_advance(&ssa, k);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001635 na -= k;
1636 if (na == 1)
1637 goto CopyB;
1638 /* na==0 is impossible now if the comparison
1639 * function is consistent, but we can't assume
1640 * that it is.
1641 */
1642 if (na == 0)
1643 goto Succeed;
1644 }
Daniel Stutzbach98338222010-12-02 21:55:33 +00001645 sortslice_copy_incr(&dest, &ssb);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001646 --nb;
1647 if (nb == 0)
1648 goto Succeed;
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001649
embg1e34da42018-01-28 20:03:23 -07001650 k = gallop_left(ms, ssa.keys[0], ssb.keys, nb, 0);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001651 bcount = k;
1652 if (k) {
1653 if (k < 0)
1654 goto Fail;
Daniel Stutzbach98338222010-12-02 21:55:33 +00001655 sortslice_memmove(&dest, 0, &ssb, 0, k);
1656 sortslice_advance(&dest, k);
1657 sortslice_advance(&ssb, k);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001658 nb -= k;
1659 if (nb == 0)
1660 goto Succeed;
1661 }
Daniel Stutzbach98338222010-12-02 21:55:33 +00001662 sortslice_copy_incr(&dest, &ssa);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001663 --na;
1664 if (na == 1)
1665 goto CopyB;
1666 } while (acount >= MIN_GALLOP || bcount >= MIN_GALLOP);
1667 ++min_gallop; /* penalize it for leaving galloping mode */
1668 ms->min_gallop = min_gallop;
1669 }
Tim Petersa64dc242002-08-01 02:13:36 +00001670Succeed:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001671 result = 0;
Tim Petersa64dc242002-08-01 02:13:36 +00001672Fail:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001673 if (na)
Daniel Stutzbach98338222010-12-02 21:55:33 +00001674 sortslice_memcpy(&dest, 0, &ssa, 0, na);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001675 return result;
Tim Petersa64dc242002-08-01 02:13:36 +00001676CopyB:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001677 assert(na == 1 && nb > 0);
Daniel Stutzbach98338222010-12-02 21:55:33 +00001678 /* The last element of ssa belongs at the end of the merge. */
1679 sortslice_memmove(&dest, 0, &ssb, 0, nb);
1680 sortslice_copy(&dest, nb, &ssa, 0);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001681 return 0;
Tim Petersa64dc242002-08-01 02:13:36 +00001682}
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001683
Daniel Stutzbach98338222010-12-02 21:55:33 +00001684/* Merge the na elements starting at pa with the nb elements starting at
1685 * ssb.keys = ssa.keys + na in a stable way, in-place. na and nb must be > 0.
1686 * Must also have that ssa.keys[na-1] belongs at the end of the merge, and
1687 * should have na >= nb. See listsort.txt for more info. Return 0 if
1688 * successful, -1 if error.
Tim Petersa64dc242002-08-01 02:13:36 +00001689 */
Martin v. Löwis18e16552006-02-15 17:27:45 +00001690static Py_ssize_t
Daniel Stutzbach98338222010-12-02 21:55:33 +00001691merge_hi(MergeState *ms, sortslice ssa, Py_ssize_t na,
1692 sortslice ssb, Py_ssize_t nb)
Tim Petersa64dc242002-08-01 02:13:36 +00001693{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001694 Py_ssize_t k;
Daniel Stutzbach98338222010-12-02 21:55:33 +00001695 sortslice dest, basea, baseb;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001696 int result = -1; /* guilty until proved innocent */
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001697 Py_ssize_t min_gallop;
Tim Petersa64dc242002-08-01 02:13:36 +00001698
Daniel Stutzbach98338222010-12-02 21:55:33 +00001699 assert(ms && ssa.keys && ssb.keys && na > 0 && nb > 0);
1700 assert(ssa.keys + na == ssb.keys);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001701 if (MERGE_GETMEM(ms, nb) < 0)
1702 return -1;
Daniel Stutzbach98338222010-12-02 21:55:33 +00001703 dest = ssb;
1704 sortslice_advance(&dest, nb-1);
1705 sortslice_memcpy(&ms->a, 0, &ssb, 0, nb);
1706 basea = ssa;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001707 baseb = ms->a;
Daniel Stutzbach98338222010-12-02 21:55:33 +00001708 ssb.keys = ms->a.keys + nb - 1;
1709 if (ssb.values != NULL)
1710 ssb.values = ms->a.values + nb - 1;
1711 sortslice_advance(&ssa, na - 1);
Tim Petersa64dc242002-08-01 02:13:36 +00001712
Daniel Stutzbach98338222010-12-02 21:55:33 +00001713 sortslice_copy_decr(&dest, &ssa);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001714 --na;
1715 if (na == 0)
1716 goto Succeed;
1717 if (nb == 1)
1718 goto CopyA;
Tim Petersa64dc242002-08-01 02:13:36 +00001719
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001720 min_gallop = ms->min_gallop;
1721 for (;;) {
1722 Py_ssize_t acount = 0; /* # of times A won in a row */
1723 Py_ssize_t bcount = 0; /* # of times B won in a row */
Tim Petersa64dc242002-08-01 02:13:36 +00001724
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001725 /* Do the straightforward thing until (if ever) one run
1726 * appears to win consistently.
1727 */
1728 for (;;) {
1729 assert(na > 0 && nb > 1);
Daniel Stutzbach98338222010-12-02 21:55:33 +00001730 k = ISLT(ssb.keys[0], ssa.keys[0]);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001731 if (k) {
1732 if (k < 0)
1733 goto Fail;
Daniel Stutzbach98338222010-12-02 21:55:33 +00001734 sortslice_copy_decr(&dest, &ssa);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001735 ++acount;
1736 bcount = 0;
1737 --na;
1738 if (na == 0)
1739 goto Succeed;
1740 if (acount >= min_gallop)
1741 break;
1742 }
1743 else {
Daniel Stutzbach98338222010-12-02 21:55:33 +00001744 sortslice_copy_decr(&dest, &ssb);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001745 ++bcount;
1746 acount = 0;
1747 --nb;
1748 if (nb == 1)
1749 goto CopyA;
1750 if (bcount >= min_gallop)
1751 break;
1752 }
1753 }
Tim Petersa64dc242002-08-01 02:13:36 +00001754
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001755 /* One run is winning so consistently that galloping may
1756 * be a huge win. So try that, and continue galloping until
1757 * (if ever) neither run appears to be winning consistently
1758 * anymore.
1759 */
1760 ++min_gallop;
1761 do {
1762 assert(na > 0 && nb > 1);
1763 min_gallop -= min_gallop > 1;
1764 ms->min_gallop = min_gallop;
embg1e34da42018-01-28 20:03:23 -07001765 k = gallop_right(ms, ssb.keys[0], basea.keys, na, na-1);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001766 if (k < 0)
1767 goto Fail;
1768 k = na - k;
1769 acount = k;
1770 if (k) {
Daniel Stutzbach98338222010-12-02 21:55:33 +00001771 sortslice_advance(&dest, -k);
1772 sortslice_advance(&ssa, -k);
1773 sortslice_memmove(&dest, 1, &ssa, 1, k);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001774 na -= k;
1775 if (na == 0)
1776 goto Succeed;
1777 }
Daniel Stutzbach98338222010-12-02 21:55:33 +00001778 sortslice_copy_decr(&dest, &ssb);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001779 --nb;
1780 if (nb == 1)
1781 goto CopyA;
Tim Petersa64dc242002-08-01 02:13:36 +00001782
embg1e34da42018-01-28 20:03:23 -07001783 k = gallop_left(ms, ssa.keys[0], baseb.keys, nb, nb-1);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001784 if (k < 0)
1785 goto Fail;
1786 k = nb - k;
1787 bcount = k;
1788 if (k) {
Daniel Stutzbach98338222010-12-02 21:55:33 +00001789 sortslice_advance(&dest, -k);
1790 sortslice_advance(&ssb, -k);
1791 sortslice_memcpy(&dest, 1, &ssb, 1, k);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001792 nb -= k;
1793 if (nb == 1)
1794 goto CopyA;
1795 /* nb==0 is impossible now if the comparison
1796 * function is consistent, but we can't assume
1797 * that it is.
1798 */
1799 if (nb == 0)
1800 goto Succeed;
1801 }
Daniel Stutzbach98338222010-12-02 21:55:33 +00001802 sortslice_copy_decr(&dest, &ssa);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001803 --na;
1804 if (na == 0)
1805 goto Succeed;
1806 } while (acount >= MIN_GALLOP || bcount >= MIN_GALLOP);
1807 ++min_gallop; /* penalize it for leaving galloping mode */
1808 ms->min_gallop = min_gallop;
1809 }
Tim Petersa64dc242002-08-01 02:13:36 +00001810Succeed:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001811 result = 0;
Tim Petersa64dc242002-08-01 02:13:36 +00001812Fail:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001813 if (nb)
Daniel Stutzbach98338222010-12-02 21:55:33 +00001814 sortslice_memcpy(&dest, -(nb-1), &baseb, 0, nb);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001815 return result;
Tim Petersa64dc242002-08-01 02:13:36 +00001816CopyA:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001817 assert(nb == 1 && na > 0);
Daniel Stutzbach98338222010-12-02 21:55:33 +00001818 /* The first element of ssb belongs at the front of the merge. */
1819 sortslice_memmove(&dest, 1-na, &ssa, 1-na, na);
1820 sortslice_advance(&dest, -na);
1821 sortslice_advance(&ssa, -na);
1822 sortslice_copy(&dest, 0, &ssb, 0);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001823 return 0;
Tim Petersa64dc242002-08-01 02:13:36 +00001824}
1825
1826/* Merge the two runs at stack indices i and i+1.
1827 * Returns 0 on success, -1 on error.
1828 */
Martin v. Löwis18e16552006-02-15 17:27:45 +00001829static Py_ssize_t
1830merge_at(MergeState *ms, Py_ssize_t i)
Tim Petersa64dc242002-08-01 02:13:36 +00001831{
Daniel Stutzbach98338222010-12-02 21:55:33 +00001832 sortslice ssa, ssb;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001833 Py_ssize_t na, nb;
1834 Py_ssize_t k;
Tim Petersa64dc242002-08-01 02:13:36 +00001835
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001836 assert(ms != NULL);
1837 assert(ms->n >= 2);
1838 assert(i >= 0);
1839 assert(i == ms->n - 2 || i == ms->n - 3);
Tim Petersa64dc242002-08-01 02:13:36 +00001840
Daniel Stutzbach98338222010-12-02 21:55:33 +00001841 ssa = ms->pending[i].base;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001842 na = ms->pending[i].len;
Daniel Stutzbach98338222010-12-02 21:55:33 +00001843 ssb = ms->pending[i+1].base;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001844 nb = ms->pending[i+1].len;
1845 assert(na > 0 && nb > 0);
Daniel Stutzbach98338222010-12-02 21:55:33 +00001846 assert(ssa.keys + na == ssb.keys);
Tim Petersa64dc242002-08-01 02:13:36 +00001847
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001848 /* Record the length of the combined runs; if i is the 3rd-last
1849 * run now, also slide over the last run (which isn't involved
1850 * in this merge). The current run i+1 goes away in any case.
1851 */
1852 ms->pending[i].len = na + nb;
1853 if (i == ms->n - 3)
1854 ms->pending[i+1] = ms->pending[i+2];
1855 --ms->n;
Tim Petersa64dc242002-08-01 02:13:36 +00001856
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001857 /* Where does b start in a? Elements in a before that can be
1858 * ignored (already in place).
1859 */
embg1e34da42018-01-28 20:03:23 -07001860 k = gallop_right(ms, *ssb.keys, ssa.keys, na, 0);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001861 if (k < 0)
1862 return -1;
Daniel Stutzbach98338222010-12-02 21:55:33 +00001863 sortslice_advance(&ssa, k);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001864 na -= k;
1865 if (na == 0)
1866 return 0;
Tim Petersa64dc242002-08-01 02:13:36 +00001867
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001868 /* Where does a end in b? Elements in b after that can be
1869 * ignored (already in place).
1870 */
embg1e34da42018-01-28 20:03:23 -07001871 nb = gallop_left(ms, ssa.keys[na-1], ssb.keys, nb, nb-1);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001872 if (nb <= 0)
1873 return nb;
Tim Petersa64dc242002-08-01 02:13:36 +00001874
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001875 /* Merge what remains of the runs, using a temp array with
1876 * min(na, nb) elements.
1877 */
1878 if (na <= nb)
Daniel Stutzbach98338222010-12-02 21:55:33 +00001879 return merge_lo(ms, ssa, na, ssb, nb);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001880 else
Daniel Stutzbach98338222010-12-02 21:55:33 +00001881 return merge_hi(ms, ssa, na, ssb, nb);
Tim Petersa64dc242002-08-01 02:13:36 +00001882}
1883
1884/* Examine the stack of runs waiting to be merged, merging adjacent runs
1885 * until the stack invariants are re-established:
1886 *
1887 * 1. len[-3] > len[-2] + len[-1]
1888 * 2. len[-2] > len[-1]
1889 *
1890 * See listsort.txt for more info.
1891 *
1892 * Returns 0 on success, -1 on error.
1893 */
1894static int
1895merge_collapse(MergeState *ms)
1896{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001897 struct s_slice *p = ms->pending;
Tim Petersa64dc242002-08-01 02:13:36 +00001898
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001899 assert(ms);
1900 while (ms->n > 1) {
1901 Py_ssize_t n = ms->n - 2;
Benjamin Petersonb808d592015-02-25 10:12:26 -05001902 if ((n > 0 && p[n-1].len <= p[n].len + p[n+1].len) ||
1903 (n > 1 && p[n-2].len <= p[n-1].len + p[n].len)) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001904 if (p[n-1].len < p[n+1].len)
1905 --n;
1906 if (merge_at(ms, n) < 0)
1907 return -1;
1908 }
1909 else if (p[n].len <= p[n+1].len) {
embg1e34da42018-01-28 20:03:23 -07001910 if (merge_at(ms, n) < 0)
1911 return -1;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001912 }
1913 else
1914 break;
1915 }
1916 return 0;
Tim Petersa64dc242002-08-01 02:13:36 +00001917}
1918
1919/* Regardless of invariants, merge all runs on the stack until only one
1920 * remains. This is used at the end of the mergesort.
1921 *
1922 * Returns 0 on success, -1 on error.
1923 */
1924static int
1925merge_force_collapse(MergeState *ms)
1926{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001927 struct s_slice *p = ms->pending;
Tim Petersa64dc242002-08-01 02:13:36 +00001928
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001929 assert(ms);
1930 while (ms->n > 1) {
1931 Py_ssize_t n = ms->n - 2;
1932 if (n > 0 && p[n-1].len < p[n+1].len)
1933 --n;
1934 if (merge_at(ms, n) < 0)
1935 return -1;
1936 }
1937 return 0;
Tim Petersa64dc242002-08-01 02:13:36 +00001938}
1939
1940/* Compute a good value for the minimum run length; natural runs shorter
1941 * than this are boosted artificially via binary insertion.
1942 *
1943 * If n < 64, return n (it's too small to bother with fancy stuff).
1944 * Else if n is an exact power of 2, return 32.
1945 * Else return an int k, 32 <= k <= 64, such that n/k is close to, but
1946 * strictly less than, an exact power of 2.
1947 *
1948 * See listsort.txt for more info.
1949 */
Martin v. Löwis18e16552006-02-15 17:27:45 +00001950static Py_ssize_t
1951merge_compute_minrun(Py_ssize_t n)
Tim Petersa64dc242002-08-01 02:13:36 +00001952{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001953 Py_ssize_t r = 0; /* becomes 1 if any 1 bits are shifted off */
Tim Petersa64dc242002-08-01 02:13:36 +00001954
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001955 assert(n >= 0);
1956 while (n >= 64) {
1957 r |= n & 1;
1958 n >>= 1;
1959 }
1960 return n + r;
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001961}
Guido van Rossuma119c0d1998-05-29 17:56:32 +00001962
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00001963static void
Daniel Stutzbach98338222010-12-02 21:55:33 +00001964reverse_sortslice(sortslice *s, Py_ssize_t n)
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00001965{
Daniel Stutzbach98338222010-12-02 21:55:33 +00001966 reverse_slice(s->keys, &s->keys[n]);
1967 if (s->values != NULL)
1968 reverse_slice(s->values, &s->values[n]);
Raymond Hettinger42b1ba32003-10-16 03:41:09 +00001969}
1970
embg1e34da42018-01-28 20:03:23 -07001971/* Here we define custom comparison functions to optimize for the cases one commonly
1972 * encounters in practice: homogeneous lists, often of one of the basic types. */
1973
/* The comparison function and helper functions selected in the pre-sort
 * check are stored in the MergeState (ms->key_compare, ms->key_richcompare
 * and ms->tuple_elem_compare). */
1976
1977/* These are the special case compare functions.
1978 * ms->key_compare will always point to one of these: */
1979
1980/* Heterogeneous compare: default, always safe to fall back on. */
1981static int
1982safe_object_compare(PyObject *v, PyObject *w, MergeState *ms)
1983{
1984 /* No assumptions necessary! */
1985 return PyObject_RichCompareBool(v, w, Py_LT);
1986}
1987
1988/* Homogeneous compare: safe for any two compareable objects of the same type.
1989 * (ms->key_richcompare is set to ob_type->tp_richcompare in the
1990 * pre-sort check.)
1991 */
1992static int
1993unsafe_object_compare(PyObject *v, PyObject *w, MergeState *ms)
1994{
1995 PyObject *res_obj; int res;
1996
1997 /* No assumptions, because we check first: */
1998 if (v->ob_type->tp_richcompare != ms->key_richcompare)
1999 return PyObject_RichCompareBool(v, w, Py_LT);
2000
2001 assert(ms->key_richcompare != NULL);
2002 res_obj = (*(ms->key_richcompare))(v, w, Py_LT);
2003
2004 if (res_obj == Py_NotImplemented) {
2005 Py_DECREF(res_obj);
2006 return PyObject_RichCompareBool(v, w, Py_LT);
2007 }
2008 if (res_obj == NULL)
2009 return -1;
2010
2011 if (PyBool_Check(res_obj)) {
2012 res = (res_obj == Py_True);
2013 }
2014 else {
2015 res = PyObject_IsTrue(res_obj);
2016 }
2017 Py_DECREF(res_obj);
2018
2019 /* Note that we can't assert
2020 * res == PyObject_RichCompareBool(v, w, Py_LT);
2021 * because of evil compare functions like this:
2022 * lambda a, b: int(random.random() * 3) - 1)
2023 * (which is actually in test_sort.py) */
2024 return res;
2025}
2026
2027/* Latin string compare: safe for any two latin (one byte per char) strings. */
2028static int
2029unsafe_latin_compare(PyObject *v, PyObject *w, MergeState *ms)
2030{
Victor Stinner8017b802018-01-29 13:47:06 +01002031 Py_ssize_t len;
2032 int res;
embg1e34da42018-01-28 20:03:23 -07002033
2034 /* Modified from Objects/unicodeobject.c:unicode_compare, assuming: */
2035 assert(v->ob_type == w->ob_type);
2036 assert(v->ob_type == &PyUnicode_Type);
2037 assert(PyUnicode_KIND(v) == PyUnicode_KIND(w));
2038 assert(PyUnicode_KIND(v) == PyUnicode_1BYTE_KIND);
2039
2040 len = Py_MIN(PyUnicode_GET_LENGTH(v), PyUnicode_GET_LENGTH(w));
2041 res = memcmp(PyUnicode_DATA(v), PyUnicode_DATA(w), len);
2042
2043 res = (res != 0 ?
2044 res < 0 :
2045 PyUnicode_GET_LENGTH(v) < PyUnicode_GET_LENGTH(w));
2046
2047 assert(res == PyObject_RichCompareBool(v, w, Py_LT));;
2048 return res;
2049}
2050
2051/* Bounded int compare: compare any two longs that fit in a single machine word. */
2052static int
2053unsafe_long_compare(PyObject *v, PyObject *w, MergeState *ms)
2054{
2055 PyLongObject *vl, *wl; sdigit v0, w0; int res;
2056
2057 /* Modified from Objects/longobject.c:long_compare, assuming: */
2058 assert(v->ob_type == w->ob_type);
2059 assert(v->ob_type == &PyLong_Type);
2060 assert(Py_ABS(Py_SIZE(v)) <= 1);
2061 assert(Py_ABS(Py_SIZE(w)) <= 1);
2062
2063 vl = (PyLongObject*)v;
2064 wl = (PyLongObject*)w;
2065
2066 v0 = Py_SIZE(vl) == 0 ? 0 : (sdigit)vl->ob_digit[0];
2067 w0 = Py_SIZE(wl) == 0 ? 0 : (sdigit)wl->ob_digit[0];
2068
2069 if (Py_SIZE(vl) < 0)
2070 v0 = -v0;
2071 if (Py_SIZE(wl) < 0)
2072 w0 = -w0;
2073
2074 res = v0 < w0;
2075 assert(res == PyObject_RichCompareBool(v, w, Py_LT));
2076 return res;
2077}
2078
2079/* Float compare: compare any two floats. */
2080static int
2081unsafe_float_compare(PyObject *v, PyObject *w, MergeState *ms)
2082{
2083 int res;
2084
2085 /* Modified from Objects/floatobject.c:float_richcompare, assuming: */
2086 assert(v->ob_type == w->ob_type);
2087 assert(v->ob_type == &PyFloat_Type);
2088
2089 res = PyFloat_AS_DOUBLE(v) < PyFloat_AS_DOUBLE(w);
2090 assert(res == PyObject_RichCompareBool(v, w, Py_LT));
2091 return res;
2092}
2093
2094/* Tuple compare: compare *any* two tuples, using
2095 * ms->tuple_elem_compare to compare the first elements, which is set
2096 * using the same pre-sort check as we use for ms->key_compare,
2097 * but run on the list [x[0] for x in L]. This allows us to optimize compares
2098 * on two levels (as long as [x[0] for x in L] is type-homogeneous.) The idea is
2099 * that most tuple compares don't involve x[1:]. */
2100static int
2101unsafe_tuple_compare(PyObject *v, PyObject *w, MergeState *ms)
2102{
2103 PyTupleObject *vt, *wt;
2104 Py_ssize_t i, vlen, wlen;
2105 int k;
2106
2107 /* Modified from Objects/tupleobject.c:tuplerichcompare, assuming: */
2108 assert(v->ob_type == w->ob_type);
2109 assert(v->ob_type == &PyTuple_Type);
2110 assert(Py_SIZE(v) > 0);
2111 assert(Py_SIZE(w) > 0);
2112
2113 vt = (PyTupleObject *)v;
2114 wt = (PyTupleObject *)w;
2115
2116 vlen = Py_SIZE(vt);
2117 wlen = Py_SIZE(wt);
2118
2119 for (i = 0; i < vlen && i < wlen; i++) {
2120 k = PyObject_RichCompareBool(vt->ob_item[i], wt->ob_item[i], Py_EQ);
2121 if (k < 0)
2122 return -1;
2123 if (!k)
2124 break;
2125 }
2126
2127 if (i >= vlen || i >= wlen)
2128 return vlen < wlen;
2129
2130 if (i == 0)
2131 return ms->tuple_elem_compare(vt->ob_item[i], wt->ob_item[i], ms);
2132 else
2133 return PyObject_RichCompareBool(vt->ob_item[i], wt->ob_item[i], Py_LT);
2134}
2135
Tim Petersa64dc242002-08-01 02:13:36 +00002136/* An adaptive, stable, natural mergesort. See listsort.txt.
2137 * Returns Py_None on success, NULL on error. Even in case of error, the
2138 * list will be some permutation of its input state (nothing is lost or
2139 * duplicated).
2140 */
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002141/*[clinic input]
2142list.sort
2143
2144 *
2145 key as keyfunc: object = None
Serhiy Storchaka202fda52017-03-12 10:10:47 +02002146 reverse: bool(accept={int}) = False
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002147
2148Stable sort *IN PLACE*.
2149[clinic start generated code]*/
2150
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002151static PyObject *
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002152list_sort_impl(PyListObject *self, PyObject *keyfunc, int reverse)
Serhiy Storchaka202fda52017-03-12 10:10:47 +02002153/*[clinic end generated code: output=57b9f9c5e23fbe42 input=b0fcf743982c5b90]*/
Guido van Rossum3f236de1996-12-10 23:55:39 +00002154{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002155 MergeState ms;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002156 Py_ssize_t nremaining;
2157 Py_ssize_t minrun;
Daniel Stutzbach98338222010-12-02 21:55:33 +00002158 sortslice lo;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002159 Py_ssize_t saved_ob_size, saved_allocated;
2160 PyObject **saved_ob_item;
2161 PyObject **final_ob_item;
2162 PyObject *result = NULL; /* guilty until proved innocent */
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002163 Py_ssize_t i;
Daniel Stutzbach98338222010-12-02 21:55:33 +00002164 PyObject **keys;
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00002165
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002166 assert(self != NULL);
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002167 assert(PyList_Check(self));
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002168 if (keyfunc == Py_None)
2169 keyfunc = NULL;
Raymond Hettinger42b1ba32003-10-16 03:41:09 +00002170
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002171 /* The list is temporarily made empty, so that mutations performed
2172 * by comparison functions can't affect the slice of memory we're
2173 * sorting (allowing mutations during sorting is a core-dump
2174 * factory, since ob_item may change).
2175 */
2176 saved_ob_size = Py_SIZE(self);
2177 saved_ob_item = self->ob_item;
2178 saved_allocated = self->allocated;
2179 Py_SIZE(self) = 0;
2180 self->ob_item = NULL;
2181 self->allocated = -1; /* any operation will reset it to >= 0 */
Tim Peters330f9e92002-07-19 07:05:44 +00002182
Daniel Stutzbach98338222010-12-02 21:55:33 +00002183 if (keyfunc == NULL) {
2184 keys = NULL;
2185 lo.keys = saved_ob_item;
2186 lo.values = NULL;
2187 }
2188 else {
2189 if (saved_ob_size < MERGESTATE_TEMP_SIZE/2)
2190 /* Leverage stack space we allocated but won't otherwise use */
2191 keys = &ms.temparray[saved_ob_size+1];
2192 else {
2193 keys = PyMem_MALLOC(sizeof(PyObject *) * saved_ob_size);
Benjamin Peterson0823ffb2015-04-23 17:04:36 -04002194 if (keys == NULL) {
2195 PyErr_NoMemory();
2196 goto keyfunc_fail;
2197 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002198 }
Daniel Stutzbach98338222010-12-02 21:55:33 +00002199
2200 for (i = 0; i < saved_ob_size ; i++) {
Victor Stinnerde4ae3d2016-12-04 22:59:09 +01002201 keys[i] = PyObject_CallFunctionObjArgs(keyfunc, saved_ob_item[i],
2202 NULL);
Daniel Stutzbach98338222010-12-02 21:55:33 +00002203 if (keys[i] == NULL) {
2204 for (i=i-1 ; i>=0 ; i--)
2205 Py_DECREF(keys[i]);
Benjamin Peterson4a42cd42014-03-15 12:21:28 -05002206 if (saved_ob_size >= MERGESTATE_TEMP_SIZE/2)
Daniel Stutzbach8eda5f72011-03-02 23:37:50 +00002207 PyMem_FREE(keys);
Daniel Stutzbach98338222010-12-02 21:55:33 +00002208 goto keyfunc_fail;
2209 }
2210 }
2211
2212 lo.keys = keys;
2213 lo.values = saved_ob_item;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002214 }
Michael W. Hudson1df0f652003-12-04 11:25:46 +00002215
embg1e34da42018-01-28 20:03:23 -07002216
2217 /* The pre-sort check: here's where we decide which compare function to use.
2218 * How much optimization is safe? We test for homogeneity with respect to
2219 * several properties that are expensive to check at compare-time, and
2220 * set ms appropriately. */
2221 if (saved_ob_size > 1) {
2222 /* Assume the first element is representative of the whole list. */
2223 int keys_are_in_tuples = (lo.keys[0]->ob_type == &PyTuple_Type &&
2224 Py_SIZE(lo.keys[0]) > 0);
2225
2226 PyTypeObject* key_type = (keys_are_in_tuples ?
2227 PyTuple_GET_ITEM(lo.keys[0], 0)->ob_type :
2228 lo.keys[0]->ob_type);
2229
2230 int keys_are_all_same_type = 1;
2231 int strings_are_latin = 1;
2232 int ints_are_bounded = 1;
2233
2234 /* Prove that assumption by checking every key. */
embg1e34da42018-01-28 20:03:23 -07002235 for (i=0; i < saved_ob_size; i++) {
2236
2237 if (keys_are_in_tuples &&
2238 !(lo.keys[i]->ob_type == &PyTuple_Type && Py_SIZE(lo.keys[i]) != 0)) {
2239 keys_are_in_tuples = 0;
2240 keys_are_all_same_type = 0;
2241 break;
2242 }
2243
2244 /* Note: for lists of tuples, key is the first element of the tuple
2245 * lo.keys[i], not lo.keys[i] itself! We verify type-homogeneity
2246 * for lists of tuples in the if-statement directly above. */
2247 PyObject *key = (keys_are_in_tuples ?
2248 PyTuple_GET_ITEM(lo.keys[i], 0) :
2249 lo.keys[i]);
2250
2251 if (key->ob_type != key_type) {
2252 keys_are_all_same_type = 0;
2253 break;
2254 }
2255
2256 if (key_type == &PyLong_Type) {
2257 if (ints_are_bounded && Py_ABS(Py_SIZE(key)) > 1)
2258 ints_are_bounded = 0;
2259 }
2260 else if (key_type == &PyUnicode_Type){
2261 if (strings_are_latin &&
2262 PyUnicode_KIND(key) != PyUnicode_1BYTE_KIND)
2263 strings_are_latin = 0;
2264 }
2265 }
2266
2267 /* Choose the best compare, given what we now know about the keys. */
2268 if (keys_are_all_same_type) {
2269
2270 if (key_type == &PyUnicode_Type && strings_are_latin) {
2271 ms.key_compare = unsafe_latin_compare;
2272 }
2273 else if (key_type == &PyLong_Type && ints_are_bounded) {
2274 ms.key_compare = unsafe_long_compare;
2275 }
2276 else if (key_type == &PyFloat_Type) {
2277 ms.key_compare = unsafe_float_compare;
2278 }
2279 else if ((ms.key_richcompare = key_type->tp_richcompare) != NULL) {
2280 ms.key_compare = unsafe_object_compare;
2281 }
2282 }
2283 else {
2284 ms.key_compare = safe_object_compare;
2285 }
2286
2287 if (keys_are_in_tuples) {
2288 /* Make sure we're not dealing with tuples of tuples
2289 * (remember: here, key_type refers list [key[0] for key in keys]) */
2290 if (key_type == &PyTuple_Type)
2291 ms.tuple_elem_compare = safe_object_compare;
2292 else
2293 ms.tuple_elem_compare = ms.key_compare;
2294
2295 ms.key_compare = unsafe_tuple_compare;
2296 }
2297 }
2298 /* End of pre-sort check: ms is now set properly! */
2299
Daniel Stutzbach98338222010-12-02 21:55:33 +00002300 merge_init(&ms, saved_ob_size, keys != NULL);
Michael W. Hudson1df0f652003-12-04 11:25:46 +00002301
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002302 nremaining = saved_ob_size;
2303 if (nremaining < 2)
2304 goto succeed;
Tim Peters330f9e92002-07-19 07:05:44 +00002305
Benjamin Peterson05380642010-08-23 19:35:39 +00002306 /* Reverse sort stability achieved by initially reversing the list,
2307 applying a stable forward sort, then reversing the final result. */
Daniel Stutzbach98338222010-12-02 21:55:33 +00002308 if (reverse) {
2309 if (keys != NULL)
2310 reverse_slice(&keys[0], &keys[saved_ob_size]);
2311 reverse_slice(&saved_ob_item[0], &saved_ob_item[saved_ob_size]);
2312 }
Benjamin Peterson05380642010-08-23 19:35:39 +00002313
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002314 /* March over the array once, left to right, finding natural runs,
2315 * and extending short natural runs to minrun elements.
2316 */
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002317 minrun = merge_compute_minrun(nremaining);
2318 do {
2319 int descending;
2320 Py_ssize_t n;
Tim Peters330f9e92002-07-19 07:05:44 +00002321
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002322 /* Identify next run. */
embg1e34da42018-01-28 20:03:23 -07002323 n = count_run(&ms, lo.keys, lo.keys + nremaining, &descending);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002324 if (n < 0)
2325 goto fail;
2326 if (descending)
Daniel Stutzbach98338222010-12-02 21:55:33 +00002327 reverse_sortslice(&lo, n);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002328 /* If short, extend to min(minrun, nremaining). */
2329 if (n < minrun) {
2330 const Py_ssize_t force = nremaining <= minrun ?
2331 nremaining : minrun;
embg1e34da42018-01-28 20:03:23 -07002332 if (binarysort(&ms, lo, lo.keys + force, lo.keys + n) < 0)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002333 goto fail;
2334 n = force;
2335 }
2336 /* Push run onto pending-runs stack, and maybe merge. */
2337 assert(ms.n < MAX_MERGE_PENDING);
2338 ms.pending[ms.n].base = lo;
2339 ms.pending[ms.n].len = n;
2340 ++ms.n;
2341 if (merge_collapse(&ms) < 0)
2342 goto fail;
2343 /* Advance to find next run. */
Daniel Stutzbach98338222010-12-02 21:55:33 +00002344 sortslice_advance(&lo, n);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002345 nremaining -= n;
2346 } while (nremaining);
Tim Peters330f9e92002-07-19 07:05:44 +00002347
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002348 if (merge_force_collapse(&ms) < 0)
2349 goto fail;
2350 assert(ms.n == 1);
Daniel Stutzbach98338222010-12-02 21:55:33 +00002351 assert(keys == NULL
2352 ? ms.pending[0].base.keys == saved_ob_item
2353 : ms.pending[0].base.keys == &keys[0]);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002354 assert(ms.pending[0].len == saved_ob_size);
Daniel Stutzbach98338222010-12-02 21:55:33 +00002355 lo = ms.pending[0].base;
Tim Petersa64dc242002-08-01 02:13:36 +00002356
2357succeed:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002358 result = Py_None;
Tim Peters330f9e92002-07-19 07:05:44 +00002359fail:
Daniel Stutzbach98338222010-12-02 21:55:33 +00002360 if (keys != NULL) {
2361 for (i = 0; i < saved_ob_size; i++)
2362 Py_DECREF(keys[i]);
Benjamin Petersonef87f8c2014-03-14 21:54:31 -05002363 if (saved_ob_size >= MERGESTATE_TEMP_SIZE/2)
Daniel Stutzbach98338222010-12-02 21:55:33 +00002364 PyMem_FREE(keys);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002365 }
Michael W. Hudson1df0f652003-12-04 11:25:46 +00002366
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002367 if (self->allocated != -1 && result != NULL) {
2368 /* The user mucked with the list during the sort,
2369 * and we don't already have another error to report.
2370 */
2371 PyErr_SetString(PyExc_ValueError, "list modified during sort");
2372 result = NULL;
2373 }
Michael W. Hudson1df0f652003-12-04 11:25:46 +00002374
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002375 if (reverse && saved_ob_size > 1)
2376 reverse_slice(saved_ob_item, saved_ob_item + saved_ob_size);
Michael W. Hudson1df0f652003-12-04 11:25:46 +00002377
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002378 merge_freemem(&ms);
Michael W. Hudson1df0f652003-12-04 11:25:46 +00002379
Daniel Stutzbach98338222010-12-02 21:55:33 +00002380keyfunc_fail:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002381 final_ob_item = self->ob_item;
2382 i = Py_SIZE(self);
2383 Py_SIZE(self) = saved_ob_size;
2384 self->ob_item = saved_ob_item;
2385 self->allocated = saved_allocated;
2386 if (final_ob_item != NULL) {
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002387 /* we cannot use _list_clear() for this because it does not
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002388 guarantee that the list is really empty when it returns */
2389 while (--i >= 0) {
2390 Py_XDECREF(final_ob_item[i]);
2391 }
2392 PyMem_FREE(final_ob_item);
2393 }
2394 Py_XINCREF(result);
2395 return result;
Guido van Rossum3f236de1996-12-10 23:55:39 +00002396}
Tim Peters330f9e92002-07-19 07:05:44 +00002397#undef IFLT
Tim Peters66860f62002-08-04 17:47:26 +00002398#undef ISLT
Tim Peters330f9e92002-07-19 07:05:44 +00002399
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00002400int
Fred Drakea2f55112000-07-09 15:16:51 +00002401PyList_Sort(PyObject *v)
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00002402{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002403 if (v == NULL || !PyList_Check(v)) {
2404 PyErr_BadInternalCall();
2405 return -1;
2406 }
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002407 v = list_sort_impl((PyListObject *)v, NULL, 0);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002408 if (v == NULL)
2409 return -1;
2410 Py_DECREF(v);
2411 return 0;
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00002412}
2413
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002414/*[clinic input]
2415list.reverse
2416
2417Reverse *IN PLACE*.
2418[clinic start generated code]*/
2419
Guido van Rossumb86c5492001-02-12 22:06:02 +00002420static PyObject *
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002421list_reverse_impl(PyListObject *self)
2422/*[clinic end generated code: output=482544fc451abea9 input=eefd4c3ae1bc9887]*/
Guido van Rossumb86c5492001-02-12 22:06:02 +00002423{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002424 if (Py_SIZE(self) > 1)
2425 reverse_slice(self->ob_item, self->ob_item + Py_SIZE(self));
2426 Py_RETURN_NONE;
Guido van Rossumed98d481991-03-06 13:07:53 +00002427}
2428
Guido van Rossum84c76f51990-10-30 13:32:20 +00002429int
Fred Drakea2f55112000-07-09 15:16:51 +00002430PyList_Reverse(PyObject *v)
Guido van Rossumb0fe3a91995-01-17 16:34:45 +00002431{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002432 PyListObject *self = (PyListObject *)v;
Tim Peters6063e262002-08-08 01:06:39 +00002433
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002434 if (v == NULL || !PyList_Check(v)) {
2435 PyErr_BadInternalCall();
2436 return -1;
2437 }
2438 if (Py_SIZE(self) > 1)
2439 reverse_slice(self->ob_item, self->ob_item + Py_SIZE(self));
2440 return 0;
Guido van Rossumb0fe3a91995-01-17 16:34:45 +00002441}
2442
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002443PyObject *
Fred Drakea2f55112000-07-09 15:16:51 +00002444PyList_AsTuple(PyObject *v)
Guido van Rossum6cd2fe01994-08-29 12:45:32 +00002445{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002446 PyObject *w;
2447 PyObject **p, **q;
2448 Py_ssize_t n;
2449 if (v == NULL || !PyList_Check(v)) {
2450 PyErr_BadInternalCall();
2451 return NULL;
2452 }
2453 n = Py_SIZE(v);
2454 w = PyTuple_New(n);
2455 if (w == NULL)
2456 return NULL;
2457 p = ((PyTupleObject *)w)->ob_item;
2458 q = ((PyListObject *)v)->ob_item;
2459 while (--n >= 0) {
2460 Py_INCREF(*q);
2461 *p = *q;
2462 p++;
2463 q++;
2464 }
2465 return w;
Guido van Rossum6cd2fe01994-08-29 12:45:32 +00002466}
2467
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002468/*[clinic input]
2469list.index
Guido van Rossum4aa24f92000-02-24 15:23:03 +00002470
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002471 value: object
Serhiy Storchaka80ec8362017-03-19 19:37:40 +02002472 start: slice_index(accept={int}) = 0
2473 stop: slice_index(accept={int}, c_default="PY_SSIZE_T_MAX") = sys.maxsize
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002474 /
2475
2476Return first index of value.
2477
2478Raises ValueError if the value is not present.
2479[clinic start generated code]*/
2480
2481static PyObject *
2482list_index_impl(PyListObject *self, PyObject *value, Py_ssize_t start,
2483 Py_ssize_t stop)
Serhiy Storchaka80ec8362017-03-19 19:37:40 +02002484/*[clinic end generated code: output=ec51b88787e4e481 input=40ec5826303a0eb1]*/
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002485{
2486 Py_ssize_t i;
2487
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002488 if (start < 0) {
2489 start += Py_SIZE(self);
2490 if (start < 0)
2491 start = 0;
2492 }
2493 if (stop < 0) {
2494 stop += Py_SIZE(self);
2495 if (stop < 0)
2496 stop = 0;
2497 }
2498 for (i = start; i < stop && i < Py_SIZE(self); i++) {
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002499 int cmp = PyObject_RichCompareBool(self->ob_item[i], value, Py_EQ);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002500 if (cmp > 0)
2501 return PyLong_FromSsize_t(i);
2502 else if (cmp < 0)
2503 return NULL;
2504 }
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002505 PyErr_Format(PyExc_ValueError, "%R is not in list", value);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002506 return NULL;
Guido van Rossumed98d481991-03-06 13:07:53 +00002507}
2508
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002509/*[clinic input]
2510list.count
2511
2512 value: object
2513 /
2514
2515Return number of occurrences of value.
2516[clinic start generated code]*/
2517
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002518static PyObject *
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002519list_count(PyListObject *self, PyObject *value)
2520/*[clinic end generated code: output=b1f5d284205ae714 input=3bdc3a5e6f749565]*/
Guido van Rossume6f7d181991-10-20 20:20:40 +00002521{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002522 Py_ssize_t count = 0;
2523 Py_ssize_t i;
Guido van Rossum4aa24f92000-02-24 15:23:03 +00002524
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002525 for (i = 0; i < Py_SIZE(self); i++) {
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002526 int cmp = PyObject_RichCompareBool(self->ob_item[i], value, Py_EQ);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002527 if (cmp > 0)
2528 count++;
2529 else if (cmp < 0)
2530 return NULL;
2531 }
2532 return PyLong_FromSsize_t(count);
Guido van Rossume6f7d181991-10-20 20:20:40 +00002533}
2534
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002535/*[clinic input]
2536list.remove
2537
2538 value: object
2539 /
2540
2541Remove first occurrence of value.
2542
2543Raises ValueError if the value is not present.
2544[clinic start generated code]*/
2545
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002546static PyObject *
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002547list_remove(PyListObject *self, PyObject *value)
2548/*[clinic end generated code: output=f087e1951a5e30d1 input=2dc2ba5bb2fb1f82]*/
Guido van Rossumed98d481991-03-06 13:07:53 +00002549{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002550 Py_ssize_t i;
Guido van Rossum4aa24f92000-02-24 15:23:03 +00002551
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002552 for (i = 0; i < Py_SIZE(self); i++) {
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002553 int cmp = PyObject_RichCompareBool(self->ob_item[i], value, Py_EQ);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002554 if (cmp > 0) {
2555 if (list_ass_slice(self, i, i+1,
2556 (PyObject *)NULL) == 0)
2557 Py_RETURN_NONE;
2558 return NULL;
2559 }
2560 else if (cmp < 0)
2561 return NULL;
2562 }
2563 PyErr_SetString(PyExc_ValueError, "list.remove(x): x not in list");
2564 return NULL;
Guido van Rossumed98d481991-03-06 13:07:53 +00002565}
2566
Jeremy Hylton8caad492000-06-23 14:18:11 +00002567static int
2568list_traverse(PyListObject *o, visitproc visit, void *arg)
2569{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002570 Py_ssize_t i;
Jeremy Hylton8caad492000-06-23 14:18:11 +00002571
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002572 for (i = Py_SIZE(o); --i >= 0; )
2573 Py_VISIT(o->ob_item[i]);
2574 return 0;
Jeremy Hylton8caad492000-06-23 14:18:11 +00002575}
2576
Guido van Rossum65e1cea2001-01-17 22:11:59 +00002577static PyObject *
2578list_richcompare(PyObject *v, PyObject *w, int op)
2579{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002580 PyListObject *vl, *wl;
2581 Py_ssize_t i;
Guido van Rossum65e1cea2001-01-17 22:11:59 +00002582
Brian Curtindfc80e32011-08-10 20:28:54 -05002583 if (!PyList_Check(v) || !PyList_Check(w))
2584 Py_RETURN_NOTIMPLEMENTED;
Guido van Rossum65e1cea2001-01-17 22:11:59 +00002585
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002586 vl = (PyListObject *)v;
2587 wl = (PyListObject *)w;
Guido van Rossum65e1cea2001-01-17 22:11:59 +00002588
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002589 if (Py_SIZE(vl) != Py_SIZE(wl) && (op == Py_EQ || op == Py_NE)) {
2590 /* Shortcut: if the lengths differ, the lists differ */
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002591 if (op == Py_EQ)
stratakise8b19652017-11-02 11:32:54 +01002592 Py_RETURN_FALSE;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002593 else
stratakise8b19652017-11-02 11:32:54 +01002594 Py_RETURN_TRUE;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002595 }
Guido van Rossum65e1cea2001-01-17 22:11:59 +00002596
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002597 /* Search for the first index where items are different */
2598 for (i = 0; i < Py_SIZE(vl) && i < Py_SIZE(wl); i++) {
2599 int k = PyObject_RichCompareBool(vl->ob_item[i],
2600 wl->ob_item[i], Py_EQ);
2601 if (k < 0)
2602 return NULL;
2603 if (!k)
2604 break;
2605 }
Guido van Rossum65e1cea2001-01-17 22:11:59 +00002606
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002607 if (i >= Py_SIZE(vl) || i >= Py_SIZE(wl)) {
2608 /* No more items to compare -- compare sizes */
stratakise8b19652017-11-02 11:32:54 +01002609 Py_RETURN_RICHCOMPARE(Py_SIZE(vl), Py_SIZE(wl), op);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002610 }
Guido van Rossum65e1cea2001-01-17 22:11:59 +00002611
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002612 /* We have an item that differs -- shortcuts for EQ/NE */
2613 if (op == Py_EQ) {
Serhiy Storchaka228b12e2017-01-23 09:47:21 +02002614 Py_RETURN_FALSE;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002615 }
2616 if (op == Py_NE) {
Serhiy Storchaka228b12e2017-01-23 09:47:21 +02002617 Py_RETURN_TRUE;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002618 }
Guido van Rossum65e1cea2001-01-17 22:11:59 +00002619
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002620 /* Compare the final item again using the proper operator */
2621 return PyObject_RichCompare(vl->ob_item[i], wl->ob_item[i], op);
Guido van Rossum65e1cea2001-01-17 22:11:59 +00002622}
2623
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002624/*[clinic input]
2625list.__init__
2626
2627 iterable: object(c_default="NULL") = ()
2628 /
2629
2630Built-in mutable sequence.
2631
2632If no argument is given, the constructor creates a new empty list.
2633The argument must be an iterable if specified.
2634[clinic start generated code]*/
2635
Tim Peters6d6c1a32001-08-02 04:15:00 +00002636static int
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002637list___init___impl(PyListObject *self, PyObject *iterable)
2638/*[clinic end generated code: output=0f3c21379d01de48 input=b3f3fe7206af8f6b]*/
Tim Peters6d6c1a32001-08-02 04:15:00 +00002639{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002640 /* Verify list invariants established by PyType_GenericAlloc() */
2641 assert(0 <= Py_SIZE(self));
2642 assert(Py_SIZE(self) <= self->allocated || self->allocated == -1);
2643 assert(self->ob_item != NULL ||
2644 self->allocated == 0 || self->allocated == -1);
Raymond Hettingerc0aaa2d2004-07-29 23:31:29 +00002645
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002646 /* Empty previous contents */
2647 if (self->ob_item != NULL) {
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002648 (void)_list_clear(self);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002649 }
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002650 if (iterable != NULL) {
2651 PyObject *rv = list_extend(self, iterable);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002652 if (rv == NULL)
2653 return -1;
2654 Py_DECREF(rv);
2655 }
2656 return 0;
Tim Peters6d6c1a32001-08-02 04:15:00 +00002657}
2658
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002659/*[clinic input]
2660list.__sizeof__
2661
2662Return the size of the list in memory, in bytes.
2663[clinic start generated code]*/
2664
Martin v. Löwis00709aa2008-06-04 14:18:43 +00002665static PyObject *
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002666list___sizeof___impl(PyListObject *self)
2667/*[clinic end generated code: output=3417541f95f9a53e input=b8030a5d5ce8a187]*/
Martin v. Löwis00709aa2008-06-04 14:18:43 +00002668{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002669 Py_ssize_t res;
Martin v. Löwis00709aa2008-06-04 14:18:43 +00002670
Serhiy Storchaka5c4064e2015-12-19 20:05:25 +02002671 res = _PyObject_SIZE(Py_TYPE(self)) + self->allocated * sizeof(void*);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002672 return PyLong_FromSsize_t(res);
Martin v. Löwis00709aa2008-06-04 14:18:43 +00002673}
2674
Raymond Hettinger1021c442003-11-07 15:38:09 +00002675static PyObject *list_iter(PyObject *seq);
Raymond Hettinger8f5cdaa2003-12-13 11:26:12 +00002676static PyObject *list_subscript(PyListObject*, PyObject*);
2677
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002678static PyMethodDef list_methods[] = {
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002679 {"__getitem__", (PyCFunction)list_subscript, METH_O|METH_COEXIST, "x.__getitem__(y) <==> x[y]"},
2680 LIST___REVERSED___METHODDEF
2681 LIST___SIZEOF___METHODDEF
2682 LIST_CLEAR_METHODDEF
2683 LIST_COPY_METHODDEF
2684 LIST_APPEND_METHODDEF
2685 LIST_INSERT_METHODDEF
2686 LIST_EXTEND_METHODDEF
2687 LIST_POP_METHODDEF
2688 LIST_REMOVE_METHODDEF
2689 LIST_INDEX_METHODDEF
2690 LIST_COUNT_METHODDEF
2691 LIST_REVERSE_METHODDEF
2692 LIST_SORT_METHODDEF
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002693 {NULL, NULL} /* sentinel */
Guido van Rossum85a5fbb1990-10-14 12:07:46 +00002694};
2695
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002696static PySequenceMethods list_as_sequence = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002697 (lenfunc)list_length, /* sq_length */
2698 (binaryfunc)list_concat, /* sq_concat */
2699 (ssizeargfunc)list_repeat, /* sq_repeat */
2700 (ssizeargfunc)list_item, /* sq_item */
2701 0, /* sq_slice */
2702 (ssizeobjargproc)list_ass_item, /* sq_ass_item */
2703 0, /* sq_ass_slice */
2704 (objobjproc)list_contains, /* sq_contains */
2705 (binaryfunc)list_inplace_concat, /* sq_inplace_concat */
2706 (ssizeargfunc)list_inplace_repeat, /* sq_inplace_repeat */
Guido van Rossum85a5fbb1990-10-14 12:07:46 +00002707};
2708
Jeremy Hyltona4b4c3b2002-07-13 03:51:17 +00002709static PyObject *
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002710list_subscript(PyListObject* self, PyObject* item)
2711{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002712 if (PyIndex_Check(item)) {
2713 Py_ssize_t i;
2714 i = PyNumber_AsSsize_t(item, PyExc_IndexError);
2715 if (i == -1 && PyErr_Occurred())
2716 return NULL;
2717 if (i < 0)
2718 i += PyList_GET_SIZE(self);
2719 return list_item(self, i);
2720 }
2721 else if (PySlice_Check(item)) {
2722 Py_ssize_t start, stop, step, slicelength, cur, i;
2723 PyObject* result;
2724 PyObject* it;
2725 PyObject **src, **dest;
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002726
Serhiy Storchakab879fe82017-04-08 09:53:51 +03002727 if (PySlice_Unpack(item, &start, &stop, &step) < 0) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002728 return NULL;
2729 }
Serhiy Storchakab879fe82017-04-08 09:53:51 +03002730 slicelength = PySlice_AdjustIndices(Py_SIZE(self), &start, &stop,
2731 step);
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002732
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002733 if (slicelength <= 0) {
2734 return PyList_New(0);
2735 }
2736 else if (step == 1) {
2737 return list_slice(self, start, stop);
2738 }
2739 else {
2740 result = PyList_New(slicelength);
2741 if (!result) return NULL;
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002742
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002743 src = self->ob_item;
2744 dest = ((PyListObject *)result)->ob_item;
2745 for (cur = start, i = 0; i < slicelength;
Mark Dickinsonc7d93b72011-09-25 15:34:32 +01002746 cur += (size_t)step, i++) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002747 it = src[cur];
2748 Py_INCREF(it);
2749 dest[i] = it;
2750 }
Tim Peters3b01a122002-07-19 02:35:45 +00002751
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002752 return result;
2753 }
2754 }
2755 else {
2756 PyErr_Format(PyExc_TypeError,
Terry Jan Reedyffff1442014-08-02 01:30:37 -04002757 "list indices must be integers or slices, not %.200s",
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002758 item->ob_type->tp_name);
2759 return NULL;
2760 }
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002761}
2762
Tim Peters3b01a122002-07-19 02:35:45 +00002763static int
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002764list_ass_subscript(PyListObject* self, PyObject* item, PyObject* value)
2765{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002766 if (PyIndex_Check(item)) {
2767 Py_ssize_t i = PyNumber_AsSsize_t(item, PyExc_IndexError);
2768 if (i == -1 && PyErr_Occurred())
2769 return -1;
2770 if (i < 0)
2771 i += PyList_GET_SIZE(self);
2772 return list_ass_item(self, i, value);
2773 }
2774 else if (PySlice_Check(item)) {
2775 Py_ssize_t start, stop, step, slicelength;
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002776
Serhiy Storchakab879fe82017-04-08 09:53:51 +03002777 if (PySlice_Unpack(item, &start, &stop, &step) < 0) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002778 return -1;
2779 }
Serhiy Storchakab879fe82017-04-08 09:53:51 +03002780 slicelength = PySlice_AdjustIndices(Py_SIZE(self), &start, &stop,
2781 step);
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002782
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002783 if (step == 1)
2784 return list_ass_slice(self, start, stop, value);
Michael W. Hudson9c14bad2002-06-19 15:44:15 +00002785
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002786 /* Make sure s[5:2] = [..] inserts at the right place:
2787 before 5, not before 2. */
2788 if ((step < 0 && start < stop) ||
2789 (step > 0 && start > stop))
2790 stop = start;
Thomas Woutersed03b412007-08-28 21:37:11 +00002791
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002792 if (value == NULL) {
2793 /* delete slice */
2794 PyObject **garbage;
2795 size_t cur;
2796 Py_ssize_t i;
Victor Stinner35f28032013-11-21 12:16:35 +01002797 int res;
Tim Peters3b01a122002-07-19 02:35:45 +00002798
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002799 if (slicelength <= 0)
2800 return 0;
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002801
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002802 if (step < 0) {
2803 stop = start + 1;
2804 start = stop + step*(slicelength - 1) - 1;
2805 step = -step;
2806 }
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002807
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002808 garbage = (PyObject**)
2809 PyMem_MALLOC(slicelength*sizeof(PyObject*));
2810 if (!garbage) {
2811 PyErr_NoMemory();
2812 return -1;
2813 }
Tim Peters3b01a122002-07-19 02:35:45 +00002814
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002815 /* drawing pictures might help understand these for
2816 loops. Basically, we memmove the parts of the
2817 list that are *not* part of the slice: step-1
2818 items for each item that is part of the slice,
2819 and then tail end of the list that was not
2820 covered by the slice */
2821 for (cur = start, i = 0;
2822 cur < (size_t)stop;
2823 cur += step, i++) {
2824 Py_ssize_t lim = step - 1;
Michael W. Hudson56796f62002-07-29 14:35:04 +00002825
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002826 garbage[i] = PyList_GET_ITEM(self, cur);
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002827
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002828 if (cur + step >= (size_t)Py_SIZE(self)) {
2829 lim = Py_SIZE(self) - cur - 1;
2830 }
Michael W. Hudson56796f62002-07-29 14:35:04 +00002831
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002832 memmove(self->ob_item + cur - i,
2833 self->ob_item + cur + 1,
2834 lim * sizeof(PyObject *));
2835 }
Mark Dickinsonc7d93b72011-09-25 15:34:32 +01002836 cur = start + (size_t)slicelength * step;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002837 if (cur < (size_t)Py_SIZE(self)) {
2838 memmove(self->ob_item + cur - slicelength,
2839 self->ob_item + cur,
2840 (Py_SIZE(self) - cur) *
2841 sizeof(PyObject *));
2842 }
Raymond Hettingera6366fe2004-03-09 13:05:22 +00002843
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002844 Py_SIZE(self) -= slicelength;
Victor Stinner35f28032013-11-21 12:16:35 +01002845 res = list_resize(self, Py_SIZE(self));
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002846
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002847 for (i = 0; i < slicelength; i++) {
2848 Py_DECREF(garbage[i]);
2849 }
2850 PyMem_FREE(garbage);
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002851
Victor Stinner35f28032013-11-21 12:16:35 +01002852 return res;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002853 }
2854 else {
2855 /* assign slice */
2856 PyObject *ins, *seq;
2857 PyObject **garbage, **seqitems, **selfitems;
2858 Py_ssize_t cur, i;
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002859
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002860 /* protect against a[::-1] = a */
2861 if (self == (PyListObject*)value) {
2862 seq = list_slice((PyListObject*)value, 0,
2863 PyList_GET_SIZE(value));
2864 }
2865 else {
2866 seq = PySequence_Fast(value,
2867 "must assign iterable "
2868 "to extended slice");
2869 }
2870 if (!seq)
2871 return -1;
Michael W. Hudsona69c0302002-12-05 21:32:32 +00002872
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002873 if (PySequence_Fast_GET_SIZE(seq) != slicelength) {
2874 PyErr_Format(PyExc_ValueError,
2875 "attempt to assign sequence of "
2876 "size %zd to extended slice of "
2877 "size %zd",
2878 PySequence_Fast_GET_SIZE(seq),
2879 slicelength);
2880 Py_DECREF(seq);
2881 return -1;
2882 }
Michael W. Hudsona69c0302002-12-05 21:32:32 +00002883
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002884 if (!slicelength) {
2885 Py_DECREF(seq);
2886 return 0;
2887 }
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002888
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002889 garbage = (PyObject**)
2890 PyMem_MALLOC(slicelength*sizeof(PyObject*));
2891 if (!garbage) {
2892 Py_DECREF(seq);
2893 PyErr_NoMemory();
2894 return -1;
2895 }
Tim Peters3b01a122002-07-19 02:35:45 +00002896
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002897 selfitems = self->ob_item;
2898 seqitems = PySequence_Fast_ITEMS(seq);
2899 for (cur = start, i = 0; i < slicelength;
Mark Dickinsonc7d93b72011-09-25 15:34:32 +01002900 cur += (size_t)step, i++) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002901 garbage[i] = selfitems[cur];
2902 ins = seqitems[i];
2903 Py_INCREF(ins);
2904 selfitems[cur] = ins;
2905 }
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002906
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002907 for (i = 0; i < slicelength; i++) {
2908 Py_DECREF(garbage[i]);
2909 }
Tim Peters3b01a122002-07-19 02:35:45 +00002910
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002911 PyMem_FREE(garbage);
2912 Py_DECREF(seq);
Tim Peters3b01a122002-07-19 02:35:45 +00002913
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002914 return 0;
2915 }
2916 }
2917 else {
2918 PyErr_Format(PyExc_TypeError,
Terry Jan Reedyffff1442014-08-02 01:30:37 -04002919 "list indices must be integers or slices, not %.200s",
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002920 item->ob_type->tp_name);
2921 return -1;
2922 }
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002923}
2924
2925static PyMappingMethods list_as_mapping = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002926 (lenfunc)list_length,
2927 (binaryfunc)list_subscript,
2928 (objobjargproc)list_ass_subscript
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002929};
2930
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002931PyTypeObject PyList_Type = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002932 PyVarObject_HEAD_INIT(&PyType_Type, 0)
2933 "list",
2934 sizeof(PyListObject),
2935 0,
2936 (destructor)list_dealloc, /* tp_dealloc */
2937 0, /* tp_print */
2938 0, /* tp_getattr */
2939 0, /* tp_setattr */
2940 0, /* tp_reserved */
2941 (reprfunc)list_repr, /* tp_repr */
2942 0, /* tp_as_number */
2943 &list_as_sequence, /* tp_as_sequence */
2944 &list_as_mapping, /* tp_as_mapping */
Georg Brandl00da4e02010-10-18 07:32:48 +00002945 PyObject_HashNotImplemented, /* tp_hash */
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002946 0, /* tp_call */
2947 0, /* tp_str */
2948 PyObject_GenericGetAttr, /* tp_getattro */
2949 0, /* tp_setattro */
2950 0, /* tp_as_buffer */
2951 Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC |
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002952 Py_TPFLAGS_BASETYPE | Py_TPFLAGS_LIST_SUBCLASS, /* tp_flags */
2953 list___init____doc__, /* tp_doc */
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002954 (traverseproc)list_traverse, /* tp_traverse */
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002955 (inquiry)_list_clear, /* tp_clear */
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002956 list_richcompare, /* tp_richcompare */
2957 0, /* tp_weaklistoffset */
2958 list_iter, /* tp_iter */
2959 0, /* tp_iternext */
2960 list_methods, /* tp_methods */
2961 0, /* tp_members */
2962 0, /* tp_getset */
2963 0, /* tp_base */
2964 0, /* tp_dict */
2965 0, /* tp_descr_get */
2966 0, /* tp_descr_set */
2967 0, /* tp_dictoffset */
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002968 (initproc)list___init__, /* tp_init */
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002969 PyType_GenericAlloc, /* tp_alloc */
2970 PyType_GenericNew, /* tp_new */
2971 PyObject_GC_Del, /* tp_free */
Guido van Rossum85a5fbb1990-10-14 12:07:46 +00002972};
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00002973
Raymond Hettinger14bd6de2002-05-31 21:40:38 +00002974/*********************** List Iterator **************************/
2975
2976typedef struct {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002977 PyObject_HEAD
Victor Stinner7660b882013-06-24 23:59:24 +02002978 Py_ssize_t it_index;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002979 PyListObject *it_seq; /* Set to NULL when iterator is exhausted */
Raymond Hettinger14bd6de2002-05-31 21:40:38 +00002980} listiterobject;
2981
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00002982static void listiter_dealloc(listiterobject *);
2983static int listiter_traverse(listiterobject *, visitproc, void *);
2984static PyObject *listiter_next(listiterobject *);
2985static PyObject *listiter_len(listiterobject *);
Kristján Valur Jónsson31668b82012-04-03 10:49:41 +00002986static PyObject *listiter_reduce_general(void *_it, int forward);
2987static PyObject *listiter_reduce(listiterobject *);
2988static PyObject *listiter_setstate(listiterobject *, PyObject *state);
Raymond Hettinger435bf582004-03-18 22:43:10 +00002989
Armin Rigof5b3e362006-02-11 21:32:43 +00002990PyDoc_STRVAR(length_hint_doc, "Private method returning an estimate of len(list(it)).");
Kristján Valur Jónsson31668b82012-04-03 10:49:41 +00002991PyDoc_STRVAR(reduce_doc, "Return state information for pickling.");
2992PyDoc_STRVAR(setstate_doc, "Set state information for unpickling.");
Raymond Hettinger6b27cda2005-09-24 21:23:05 +00002993
2994static PyMethodDef listiter_methods[] = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002995 {"__length_hint__", (PyCFunction)listiter_len, METH_NOARGS, length_hint_doc},
Kristján Valur Jónsson31668b82012-04-03 10:49:41 +00002996 {"__reduce__", (PyCFunction)listiter_reduce, METH_NOARGS, reduce_doc},
2997 {"__setstate__", (PyCFunction)listiter_setstate, METH_O, setstate_doc},
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002998 {NULL, NULL} /* sentinel */
Raymond Hettinger435bf582004-03-18 22:43:10 +00002999};
3000
Raymond Hettinger14bd6de2002-05-31 21:40:38 +00003001PyTypeObject PyListIter_Type = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003002 PyVarObject_HEAD_INIT(&PyType_Type, 0)
3003 "list_iterator", /* tp_name */
3004 sizeof(listiterobject), /* tp_basicsize */
3005 0, /* tp_itemsize */
3006 /* methods */
3007 (destructor)listiter_dealloc, /* tp_dealloc */
3008 0, /* tp_print */
3009 0, /* tp_getattr */
3010 0, /* tp_setattr */
3011 0, /* tp_reserved */
3012 0, /* tp_repr */
3013 0, /* tp_as_number */
3014 0, /* tp_as_sequence */
3015 0, /* tp_as_mapping */
3016 0, /* tp_hash */
3017 0, /* tp_call */
3018 0, /* tp_str */
3019 PyObject_GenericGetAttr, /* tp_getattro */
3020 0, /* tp_setattro */
3021 0, /* tp_as_buffer */
3022 Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC,/* tp_flags */
3023 0, /* tp_doc */
3024 (traverseproc)listiter_traverse, /* tp_traverse */
3025 0, /* tp_clear */
3026 0, /* tp_richcompare */
3027 0, /* tp_weaklistoffset */
3028 PyObject_SelfIter, /* tp_iter */
3029 (iternextfunc)listiter_next, /* tp_iternext */
3030 listiter_methods, /* tp_methods */
3031 0, /* tp_members */
Raymond Hettinger14bd6de2002-05-31 21:40:38 +00003032};
Raymond Hettinger1021c442003-11-07 15:38:09 +00003033
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00003034
3035static PyObject *
3036list_iter(PyObject *seq)
3037{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003038 listiterobject *it;
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00003039
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003040 if (!PyList_Check(seq)) {
3041 PyErr_BadInternalCall();
3042 return NULL;
3043 }
3044 it = PyObject_GC_New(listiterobject, &PyListIter_Type);
3045 if (it == NULL)
3046 return NULL;
3047 it->it_index = 0;
3048 Py_INCREF(seq);
3049 it->it_seq = (PyListObject *)seq;
3050 _PyObject_GC_TRACK(it);
3051 return (PyObject *)it;
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00003052}
3053
3054static void
3055listiter_dealloc(listiterobject *it)
3056{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003057 _PyObject_GC_UNTRACK(it);
3058 Py_XDECREF(it->it_seq);
3059 PyObject_GC_Del(it);
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00003060}
3061
3062static int
3063listiter_traverse(listiterobject *it, visitproc visit, void *arg)
3064{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003065 Py_VISIT(it->it_seq);
3066 return 0;
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00003067}
3068
3069static PyObject *
3070listiter_next(listiterobject *it)
3071{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003072 PyListObject *seq;
3073 PyObject *item;
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00003074
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003075 assert(it != NULL);
3076 seq = it->it_seq;
3077 if (seq == NULL)
3078 return NULL;
3079 assert(PyList_Check(seq));
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00003080
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003081 if (it->it_index < PyList_GET_SIZE(seq)) {
3082 item = PyList_GET_ITEM(seq, it->it_index);
3083 ++it->it_index;
3084 Py_INCREF(item);
3085 return item;
3086 }
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00003087
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003088 it->it_seq = NULL;
Serhiy Storchakafbb1c5e2016-03-30 20:40:02 +03003089 Py_DECREF(seq);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003090 return NULL;
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00003091}
3092
3093static PyObject *
3094listiter_len(listiterobject *it)
3095{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003096 Py_ssize_t len;
3097 if (it->it_seq) {
3098 len = PyList_GET_SIZE(it->it_seq) - it->it_index;
3099 if (len >= 0)
3100 return PyLong_FromSsize_t(len);
3101 }
3102 return PyLong_FromLong(0);
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00003103}
Kristján Valur Jónsson31668b82012-04-03 10:49:41 +00003104
3105static PyObject *
3106listiter_reduce(listiterobject *it)
3107{
3108 return listiter_reduce_general(it, 1);
3109}
3110
3111static PyObject *
3112listiter_setstate(listiterobject *it, PyObject *state)
3113{
Victor Stinner7660b882013-06-24 23:59:24 +02003114 Py_ssize_t index = PyLong_AsSsize_t(state);
Kristján Valur Jónsson31668b82012-04-03 10:49:41 +00003115 if (index == -1 && PyErr_Occurred())
3116 return NULL;
3117 if (it->it_seq != NULL) {
3118 if (index < 0)
3119 index = 0;
Kristján Valur Jónsson25dded02014-03-05 13:47:57 +00003120 else if (index > PyList_GET_SIZE(it->it_seq))
3121 index = PyList_GET_SIZE(it->it_seq); /* iterator exhausted */
Kristján Valur Jónsson31668b82012-04-03 10:49:41 +00003122 it->it_index = index;
3123 }
3124 Py_RETURN_NONE;
3125}
3126
/*********************** List Reverse Iterator **************************/
3128
3129typedef struct {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003130 PyObject_HEAD
3131 Py_ssize_t it_index;
3132 PyListObject *it_seq; /* Set to NULL when iterator is exhausted */
Raymond Hettinger1021c442003-11-07 15:38:09 +00003133} listreviterobject;
3134
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00003135static void listreviter_dealloc(listreviterobject *);
3136static int listreviter_traverse(listreviterobject *, visitproc, void *);
3137static PyObject *listreviter_next(listreviterobject *);
Raymond Hettingerf5b64112008-12-02 21:33:45 +00003138static PyObject *listreviter_len(listreviterobject *);
Kristján Valur Jónsson31668b82012-04-03 10:49:41 +00003139static PyObject *listreviter_reduce(listreviterobject *);
3140static PyObject *listreviter_setstate(listreviterobject *, PyObject *);
Raymond Hettingeref9bf402004-03-10 10:10:42 +00003141
Raymond Hettingerf5b64112008-12-02 21:33:45 +00003142static PyMethodDef listreviter_methods[] = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003143 {"__length_hint__", (PyCFunction)listreviter_len, METH_NOARGS, length_hint_doc},
Kristján Valur Jónsson31668b82012-04-03 10:49:41 +00003144 {"__reduce__", (PyCFunction)listreviter_reduce, METH_NOARGS, reduce_doc},
3145 {"__setstate__", (PyCFunction)listreviter_setstate, METH_O, setstate_doc},
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003146 {NULL, NULL} /* sentinel */
Raymond Hettingeref9bf402004-03-10 10:10:42 +00003147};
3148
Raymond Hettinger1021c442003-11-07 15:38:09 +00003149PyTypeObject PyListRevIter_Type = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003150 PyVarObject_HEAD_INIT(&PyType_Type, 0)
3151 "list_reverseiterator", /* tp_name */
3152 sizeof(listreviterobject), /* tp_basicsize */
3153 0, /* tp_itemsize */
3154 /* methods */
3155 (destructor)listreviter_dealloc, /* tp_dealloc */
3156 0, /* tp_print */
3157 0, /* tp_getattr */
3158 0, /* tp_setattr */
3159 0, /* tp_reserved */
3160 0, /* tp_repr */
3161 0, /* tp_as_number */
3162 0, /* tp_as_sequence */
3163 0, /* tp_as_mapping */
3164 0, /* tp_hash */
3165 0, /* tp_call */
3166 0, /* tp_str */
3167 PyObject_GenericGetAttr, /* tp_getattro */
3168 0, /* tp_setattro */
3169 0, /* tp_as_buffer */
3170 Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC,/* tp_flags */
3171 0, /* tp_doc */
3172 (traverseproc)listreviter_traverse, /* tp_traverse */
3173 0, /* tp_clear */
3174 0, /* tp_richcompare */
3175 0, /* tp_weaklistoffset */
3176 PyObject_SelfIter, /* tp_iter */
3177 (iternextfunc)listreviter_next, /* tp_iternext */
3178 listreviter_methods, /* tp_methods */
3179 0,
Raymond Hettinger1021c442003-11-07 15:38:09 +00003180};
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00003181
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02003182/*[clinic input]
3183list.__reversed__
3184
3185Return a reverse iterator over the list.
3186[clinic start generated code]*/
3187
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00003188static PyObject *
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02003189list___reversed___impl(PyListObject *self)
3190/*[clinic end generated code: output=b166f073208c888c input=eadb6e17f8a6a280]*/
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00003191{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003192 listreviterobject *it;
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00003193
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003194 it = PyObject_GC_New(listreviterobject, &PyListRevIter_Type);
3195 if (it == NULL)
3196 return NULL;
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02003197 assert(PyList_Check(self));
3198 it->it_index = PyList_GET_SIZE(self) - 1;
3199 Py_INCREF(self);
3200 it->it_seq = self;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003201 PyObject_GC_Track(it);
3202 return (PyObject *)it;
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00003203}
3204
3205static void
3206listreviter_dealloc(listreviterobject *it)
3207{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003208 PyObject_GC_UnTrack(it);
3209 Py_XDECREF(it->it_seq);
3210 PyObject_GC_Del(it);
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00003211}
3212
3213static int
3214listreviter_traverse(listreviterobject *it, visitproc visit, void *arg)
3215{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003216 Py_VISIT(it->it_seq);
3217 return 0;
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00003218}
3219
3220static PyObject *
3221listreviter_next(listreviterobject *it)
3222{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003223 PyObject *item;
Serhiy Storchakafbb1c5e2016-03-30 20:40:02 +03003224 Py_ssize_t index;
3225 PyListObject *seq;
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00003226
Serhiy Storchakafbb1c5e2016-03-30 20:40:02 +03003227 assert(it != NULL);
3228 seq = it->it_seq;
3229 if (seq == NULL) {
3230 return NULL;
3231 }
3232 assert(PyList_Check(seq));
3233
3234 index = it->it_index;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003235 if (index>=0 && index < PyList_GET_SIZE(seq)) {
3236 item = PyList_GET_ITEM(seq, index);
3237 it->it_index--;
3238 Py_INCREF(item);
3239 return item;
3240 }
3241 it->it_index = -1;
Serhiy Storchakafbb1c5e2016-03-30 20:40:02 +03003242 it->it_seq = NULL;
3243 Py_DECREF(seq);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003244 return NULL;
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00003245}
3246
Raymond Hettingerf5b64112008-12-02 21:33:45 +00003247static PyObject *
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00003248listreviter_len(listreviterobject *it)
3249{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003250 Py_ssize_t len = it->it_index + 1;
3251 if (it->it_seq == NULL || PyList_GET_SIZE(it->it_seq) < len)
3252 len = 0;
3253 return PyLong_FromSsize_t(len);
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00003254}
Kristján Valur Jónsson31668b82012-04-03 10:49:41 +00003255
3256static PyObject *
3257listreviter_reduce(listreviterobject *it)
3258{
3259 return listiter_reduce_general(it, 0);
3260}
3261
3262static PyObject *
3263listreviter_setstate(listreviterobject *it, PyObject *state)
3264{
3265 Py_ssize_t index = PyLong_AsSsize_t(state);
3266 if (index == -1 && PyErr_Occurred())
3267 return NULL;
3268 if (it->it_seq != NULL) {
3269 if (index < -1)
3270 index = -1;
3271 else if (index > PyList_GET_SIZE(it->it_seq) - 1)
3272 index = PyList_GET_SIZE(it->it_seq) - 1;
3273 it->it_index = index;
3274 }
3275 Py_RETURN_NONE;
3276}
3277
/* common pickling support */
3279
3280static PyObject *
3281listiter_reduce_general(void *_it, int forward)
3282{
3283 PyObject *list;
3284
3285 /* the objects are not the same, index is of different types! */
3286 if (forward) {
3287 listiterobject *it = (listiterobject *)_it;
3288 if (it->it_seq)
Victor Stinner7660b882013-06-24 23:59:24 +02003289 return Py_BuildValue("N(O)n", _PyObject_GetBuiltin("iter"),
Kristján Valur Jónsson31668b82012-04-03 10:49:41 +00003290 it->it_seq, it->it_index);
3291 } else {
3292 listreviterobject *it = (listreviterobject *)_it;
3293 if (it->it_seq)
Antoine Pitroua7013882012-04-05 00:04:20 +02003294 return Py_BuildValue("N(O)n", _PyObject_GetBuiltin("reversed"),
Kristján Valur Jónsson31668b82012-04-03 10:49:41 +00003295 it->it_seq, it->it_index);
3296 }
3297 /* empty iterator, create an empty list */
3298 list = PyList_New(0);
3299 if (list == NULL)
3300 return NULL;
Antoine Pitroua7013882012-04-05 00:04:20 +02003301 return Py_BuildValue("N(N)", _PyObject_GetBuiltin("iter"), list);
Kristján Valur Jónsson31668b82012-04-03 10:49:41 +00003302}