blob: d795f66e6e053588becfc1124c12e7a534823889 [file] [log] [blame]
Guido van Rossum85a5fbb1990-10-14 12:07:46 +00001/* List object implementation */
2
Guido van Rossumc0b618a1997-05-02 03:12:38 +00003#include "Python.h"
Eric Snow2ebc5ce2017-09-07 23:51:28 -06004#include "internal/pystate.h"
Antoine Pitrou0197ff92012-03-22 14:38:16 +01005#include "accu.h"
Guido van Rossumc0b618a1997-05-02 03:12:38 +00006
Guido van Rossum6cd2fe01994-08-29 12:45:32 +00007#ifdef STDC_HEADERS
8#include <stddef.h>
9#else
Antoine Pitrouf95a1b32010-05-09 15:52:27 +000010#include <sys/types.h> /* For size_t */
Guido van Rossum6cd2fe01994-08-29 12:45:32 +000011#endif
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000012
Serhiy Storchakafdd42c42017-03-11 09:19:20 +020013/*[clinic input]
14class list "PyListObject *" "&PyList_Type"
15[clinic start generated code]*/
16/*[clinic end generated code: output=da39a3ee5e6b4b0d input=f9b222678f9f71e0]*/
17
18#include "clinic/listobject.c.h"
19
Tim Peters8d9eb102004-07-31 02:24:20 +000020/* Ensure ob_item has room for at least newsize elements, and set
21 * ob_size to newsize. If newsize > ob_size on entry, the content
22 * of the new slots at exit is undefined heap trash; it's the caller's
Ezio Melotti13925002011-03-16 11:05:33 +020023 * responsibility to overwrite them with sane values.
Tim Peters8d9eb102004-07-31 02:24:20 +000024 * The number of allocated elements may grow, shrink, or stay the same.
25 * Failure is impossible if newsize <= self.allocated on entry, although
26 * that partly relies on an assumption that the system realloc() never
27 * fails when passed a number of bytes <= the number of bytes last
28 * allocated (the C standard doesn't guarantee this, but it's hard to
29 * imagine a realloc implementation where it wouldn't be true).
30 * Note that self->ob_item may change, and even if newsize is less
31 * than ob_size on entry.
32 */
Guido van Rossuma46d51d1995-01-26 22:59:43 +000033static int
Martin v. Löwis18e16552006-02-15 17:27:45 +000034list_resize(PyListObject *self, Py_ssize_t newsize)
Guido van Rossuma46d51d1995-01-26 22:59:43 +000035{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +000036 PyObject **items;
Xiang Zhang4cee0492017-02-22 12:32:30 +080037 size_t new_allocated, num_allocated_bytes;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +000038 Py_ssize_t allocated = self->allocated;
Tim Peters65b8b842001-05-26 05:28:40 +000039
Antoine Pitrouf95a1b32010-05-09 15:52:27 +000040 /* Bypass realloc() when a previous overallocation is large enough
41 to accommodate the newsize. If the newsize falls lower than half
42 the allocated size, then proceed with the realloc() to shrink the list.
43 */
44 if (allocated >= newsize && newsize >= (allocated >> 1)) {
45 assert(self->ob_item != NULL || newsize == 0);
46 Py_SIZE(self) = newsize;
47 return 0;
48 }
Raymond Hettinger4bb95402004-02-13 11:36:39 +000049
Antoine Pitrouf95a1b32010-05-09 15:52:27 +000050 /* This over-allocates proportional to the list size, making room
51 * for additional growth. The over-allocation is mild, but is
52 * enough to give linear-time amortized behavior over a long
53 * sequence of appends() in the presence of a poorly-performing
54 * system realloc().
55 * The growth pattern is: 0, 4, 8, 16, 25, 35, 46, 58, 72, 88, ...
Xiang Zhang4cee0492017-02-22 12:32:30 +080056 * Note: new_allocated won't overflow because the largest possible value
57 * is PY_SSIZE_T_MAX * (9 / 8) + 6 which always fits in a size_t.
Antoine Pitrouf95a1b32010-05-09 15:52:27 +000058 */
Xiang Zhang4cee0492017-02-22 12:32:30 +080059 new_allocated = (size_t)newsize + (newsize >> 3) + (newsize < 9 ? 3 : 6);
60 if (new_allocated > (size_t)PY_SSIZE_T_MAX / sizeof(PyObject *)) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +000061 PyErr_NoMemory();
62 return -1;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +000063 }
Amaury Forgeot d'Arc9c74b142008-06-18 00:47:36 +000064
Antoine Pitrouf95a1b32010-05-09 15:52:27 +000065 if (newsize == 0)
66 new_allocated = 0;
Xiang Zhang4cee0492017-02-22 12:32:30 +080067 num_allocated_bytes = new_allocated * sizeof(PyObject *);
68 items = (PyObject **)PyMem_Realloc(self->ob_item, num_allocated_bytes);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +000069 if (items == NULL) {
70 PyErr_NoMemory();
71 return -1;
72 }
73 self->ob_item = items;
74 Py_SIZE(self) = newsize;
75 self->allocated = new_allocated;
76 return 0;
Raymond Hettinger4bb95402004-02-13 11:36:39 +000077}
Guido van Rossuma46d51d1995-01-26 22:59:43 +000078
/* Debug statistic to compare allocations with reuse through the free list */
#undef SHOW_ALLOC_COUNT
#ifdef SHOW_ALLOC_COUNT
static size_t count_alloc = 0;
static size_t count_reuse = 0;

/* Write the list allocation and free-list reuse counters to stderr.
   Prints nothing when the current interpreter's
   core_config.show_alloc_count flag is not set. */
static void
show_alloc(void)
{
    PyInterpreterState *interp = PyThreadState_GET()->interp;

    if (interp->core_config.show_alloc_count) {
        fprintf(stderr, "List allocations: %" PY_FORMAT_SIZE_T "d\n",
                count_alloc);
        fprintf(stderr, "List reuse through freelist: %" PY_FORMAT_SIZE_T
                "d\n", count_reuse);
        fprintf(stderr, "%.2f%% reuse rate\n\n",
                (100.0*count_reuse/(count_alloc+count_reuse)));
    }
}
#endif
101
Raymond Hettinger0468e412004-05-05 05:37:53 +0000102/* Empty list reuse scheme to save calls to malloc and free */
Christian Heimes2202f872008-02-06 14:31:34 +0000103#ifndef PyList_MAXFREELIST
104#define PyList_MAXFREELIST 80
105#endif
106static PyListObject *free_list[PyList_MAXFREELIST];
107static int numfree = 0;
Raymond Hettinger0468e412004-05-05 05:37:53 +0000108
Antoine Pitrou9a812cb2011-11-15 00:00:12 +0100109int
110PyList_ClearFreeList(void)
Raymond Hettingerfb09f0e2004-10-07 03:58:07 +0000111{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000112 PyListObject *op;
Antoine Pitrou9a812cb2011-11-15 00:00:12 +0100113 int ret = numfree;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000114 while (numfree) {
115 op = free_list[--numfree];
116 assert(PyList_CheckExact(op));
117 PyObject_GC_Del(op);
118 }
Antoine Pitrou9a812cb2011-11-15 00:00:12 +0100119 return ret;
120}
121
/* Finalization hook for the list type: empties the free list. */
void
PyList_Fini(void)
{
    /* The count of released objects is of no interest here. */
    (void)PyList_ClearFreeList();
}
127
David Malcolm49526f42012-06-22 14:55:41 -0400128/* Print summary info about the state of the optimized allocator */
129void
130_PyList_DebugMallocStats(FILE *out)
131{
132 _PyDebugAllocatorStats(out,
133 "free PyListObject",
134 numfree, sizeof(PyListObject));
135}
136
Guido van Rossumc0b618a1997-05-02 03:12:38 +0000137PyObject *
Martin v. Löwis18e16552006-02-15 17:27:45 +0000138PyList_New(Py_ssize_t size)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000139{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000140 PyListObject *op;
Christian Heimes77c02eb2008-02-09 02:18:51 +0000141#ifdef SHOW_ALLOC_COUNT
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000142 static int initialized = 0;
143 if (!initialized) {
144 Py_AtExit(show_alloc);
145 initialized = 1;
146 }
Christian Heimes77c02eb2008-02-09 02:18:51 +0000147#endif
Tim Peters3986d4e2004-07-29 02:28:42 +0000148
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000149 if (size < 0) {
150 PyErr_BadInternalCall();
151 return NULL;
152 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000153 if (numfree) {
154 numfree--;
155 op = free_list[numfree];
156 _Py_NewReference((PyObject *)op);
Christian Heimes77c02eb2008-02-09 02:18:51 +0000157#ifdef SHOW_ALLOC_COUNT
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000158 count_reuse++;
Christian Heimes77c02eb2008-02-09 02:18:51 +0000159#endif
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000160 } else {
161 op = PyObject_GC_New(PyListObject, &PyList_Type);
162 if (op == NULL)
163 return NULL;
Christian Heimes77c02eb2008-02-09 02:18:51 +0000164#ifdef SHOW_ALLOC_COUNT
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000165 count_alloc++;
Christian Heimes77c02eb2008-02-09 02:18:51 +0000166#endif
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000167 }
168 if (size <= 0)
169 op->ob_item = NULL;
170 else {
Mark Dickinson5d132382016-08-21 08:55:15 +0100171 op->ob_item = (PyObject **) PyMem_Calloc(size, sizeof(PyObject *));
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000172 if (op->ob_item == NULL) {
173 Py_DECREF(op);
174 return PyErr_NoMemory();
175 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000176 }
177 Py_SIZE(op) = size;
178 op->allocated = size;
179 _PyObject_GC_TRACK(op);
180 return (PyObject *) op;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000181}
182
Martin v. Löwis18e16552006-02-15 17:27:45 +0000183Py_ssize_t
Fred Drakea2f55112000-07-09 15:16:51 +0000184PyList_Size(PyObject *op)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000185{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000186 if (!PyList_Check(op)) {
187 PyErr_BadInternalCall();
188 return -1;
189 }
190 else
191 return Py_SIZE(op);
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000192}
193
Raymond Hettingerfdfe6182004-05-05 06:28:16 +0000194static PyObject *indexerr = NULL;
Guido van Rossum929f1b81996-08-09 20:51:27 +0000195
Guido van Rossumc0b618a1997-05-02 03:12:38 +0000196PyObject *
Martin v. Löwis18e16552006-02-15 17:27:45 +0000197PyList_GetItem(PyObject *op, Py_ssize_t i)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000198{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000199 if (!PyList_Check(op)) {
200 PyErr_BadInternalCall();
201 return NULL;
202 }
203 if (i < 0 || i >= Py_SIZE(op)) {
204 if (indexerr == NULL) {
205 indexerr = PyUnicode_FromString(
206 "list index out of range");
207 if (indexerr == NULL)
208 return NULL;
209 }
210 PyErr_SetObject(PyExc_IndexError, indexerr);
211 return NULL;
212 }
213 return ((PyListObject *)op) -> ob_item[i];
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000214}
215
216int
Antoine Pitrou9ed5f272013-08-13 20:18:52 +0200217PyList_SetItem(PyObject *op, Py_ssize_t i,
218 PyObject *newitem)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000219{
Antoine Pitrou9ed5f272013-08-13 20:18:52 +0200220 PyObject **p;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000221 if (!PyList_Check(op)) {
222 Py_XDECREF(newitem);
223 PyErr_BadInternalCall();
224 return -1;
225 }
226 if (i < 0 || i >= Py_SIZE(op)) {
227 Py_XDECREF(newitem);
228 PyErr_SetString(PyExc_IndexError,
229 "list assignment index out of range");
230 return -1;
231 }
232 p = ((PyListObject *)op) -> ob_item + i;
Serhiy Storchakaec397562016-04-06 09:50:03 +0300233 Py_XSETREF(*p, newitem);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000234 return 0;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000235}
236
237static int
Martin v. Löwis18e16552006-02-15 17:27:45 +0000238ins1(PyListObject *self, Py_ssize_t where, PyObject *v)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000239{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000240 Py_ssize_t i, n = Py_SIZE(self);
241 PyObject **items;
242 if (v == NULL) {
243 PyErr_BadInternalCall();
244 return -1;
245 }
246 if (n == PY_SSIZE_T_MAX) {
247 PyErr_SetString(PyExc_OverflowError,
248 "cannot add more objects to list");
249 return -1;
250 }
Tim Petersb38e2b62004-07-29 02:29:26 +0000251
Raymond Hettinger0dceb912016-01-25 10:33:30 -0800252 if (list_resize(self, n+1) < 0)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000253 return -1;
Raymond Hettinger4bb95402004-02-13 11:36:39 +0000254
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000255 if (where < 0) {
256 where += n;
257 if (where < 0)
258 where = 0;
259 }
260 if (where > n)
261 where = n;
262 items = self->ob_item;
263 for (i = n; --i >= where; )
264 items[i+1] = items[i];
265 Py_INCREF(v);
266 items[where] = v;
267 return 0;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000268}
269
270int
Martin v. Löwis18e16552006-02-15 17:27:45 +0000271PyList_Insert(PyObject *op, Py_ssize_t where, PyObject *newitem)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000272{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000273 if (!PyList_Check(op)) {
274 PyErr_BadInternalCall();
275 return -1;
276 }
277 return ins1((PyListObject *)op, where, newitem);
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000278}
279
Raymond Hettinger40a03822004-04-12 13:05:09 +0000280static int
281app1(PyListObject *self, PyObject *v)
282{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000283 Py_ssize_t n = PyList_GET_SIZE(self);
Raymond Hettinger40a03822004-04-12 13:05:09 +0000284
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000285 assert (v != NULL);
286 if (n == PY_SSIZE_T_MAX) {
287 PyErr_SetString(PyExc_OverflowError,
288 "cannot add more objects to list");
289 return -1;
290 }
Raymond Hettinger40a03822004-04-12 13:05:09 +0000291
Raymond Hettinger0dceb912016-01-25 10:33:30 -0800292 if (list_resize(self, n+1) < 0)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000293 return -1;
Raymond Hettinger40a03822004-04-12 13:05:09 +0000294
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000295 Py_INCREF(v);
296 PyList_SET_ITEM(self, n, v);
297 return 0;
Raymond Hettinger40a03822004-04-12 13:05:09 +0000298}
299
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000300int
Fred Drakea2f55112000-07-09 15:16:51 +0000301PyList_Append(PyObject *op, PyObject *newitem)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000302{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000303 if (PyList_Check(op) && (newitem != NULL))
304 return app1((PyListObject *)op, newitem);
305 PyErr_BadInternalCall();
306 return -1;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000307}
308
309/* Methods */
310
311static void
Fred Drakea2f55112000-07-09 15:16:51 +0000312list_dealloc(PyListObject *op)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000313{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000314 Py_ssize_t i;
315 PyObject_GC_UnTrack(op);
316 Py_TRASHCAN_SAFE_BEGIN(op)
317 if (op->ob_item != NULL) {
318 /* Do it backwards, for Christian Tismer.
319 There's a simple test case where somehow this reduces
320 thrashing when a *very* large list is created and
321 immediately deleted. */
322 i = Py_SIZE(op);
323 while (--i >= 0) {
324 Py_XDECREF(op->ob_item[i]);
325 }
326 PyMem_FREE(op->ob_item);
327 }
328 if (numfree < PyList_MAXFREELIST && PyList_CheckExact(op))
329 free_list[numfree++] = op;
330 else
331 Py_TYPE(op)->tp_free((PyObject *)op);
332 Py_TRASHCAN_SAFE_END(op)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000333}
334
Guido van Rossumc0b618a1997-05-02 03:12:38 +0000335static PyObject *
Fred Drakea2f55112000-07-09 15:16:51 +0000336list_repr(PyListObject *v)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000337{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000338 Py_ssize_t i;
Victor Stinner5c733472013-11-18 21:11:57 +0100339 PyObject *s;
Victor Stinner5c733472013-11-18 21:11:57 +0100340 _PyUnicodeWriter writer;
Antoine Pitroueeb7eea2011-10-06 18:57:27 +0200341
342 if (Py_SIZE(v) == 0) {
343 return PyUnicode_FromString("[]");
344 }
345
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000346 i = Py_ReprEnter((PyObject*)v);
347 if (i != 0) {
348 return i > 0 ? PyUnicode_FromString("[...]") : NULL;
349 }
Tim Petersa7259592001-06-16 05:11:17 +0000350
Victor Stinner5c733472013-11-18 21:11:57 +0100351 _PyUnicodeWriter_Init(&writer);
352 writer.overallocate = 1;
Victor Stinnerb8fb1972013-11-18 22:15:44 +0100353 /* "[" + "1" + ", 2" * (len - 1) + "]" */
354 writer.min_length = 1 + 1 + (2 + 1) * (Py_SIZE(v) - 1) + 1;
Tim Petersa7259592001-06-16 05:11:17 +0000355
Victor Stinner5c733472013-11-18 21:11:57 +0100356 if (_PyUnicodeWriter_WriteChar(&writer, '[') < 0)
Antoine Pitroueeb7eea2011-10-06 18:57:27 +0200357 goto error;
Tim Petersa7259592001-06-16 05:11:17 +0000358
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000359 /* Do repr() on each element. Note that this may mutate the list,
360 so must refetch the list size on each iteration. */
361 for (i = 0; i < Py_SIZE(v); ++i) {
Victor Stinner5c733472013-11-18 21:11:57 +0100362 if (i > 0) {
Victor Stinner4a587072013-11-19 12:54:53 +0100363 if (_PyUnicodeWriter_WriteASCIIString(&writer, ", ", 2) < 0)
Victor Stinner5c733472013-11-18 21:11:57 +0100364 goto error;
365 }
366
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000367 s = PyObject_Repr(v->ob_item[i]);
Victor Stinner5c733472013-11-18 21:11:57 +0100368 if (s == NULL)
Antoine Pitroueeb7eea2011-10-06 18:57:27 +0200369 goto error;
Victor Stinner5c733472013-11-18 21:11:57 +0100370
371 if (_PyUnicodeWriter_WriteStr(&writer, s) < 0) {
372 Py_DECREF(s);
Antoine Pitroueeb7eea2011-10-06 18:57:27 +0200373 goto error;
Victor Stinner5c733472013-11-18 21:11:57 +0100374 }
375 Py_DECREF(s);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000376 }
Victor Stinner5c733472013-11-18 21:11:57 +0100377
Victor Stinner4d3f1092013-11-19 12:09:00 +0100378 writer.overallocate = 0;
Victor Stinner5c733472013-11-18 21:11:57 +0100379 if (_PyUnicodeWriter_WriteChar(&writer, ']') < 0)
Antoine Pitroueeb7eea2011-10-06 18:57:27 +0200380 goto error;
Tim Petersa7259592001-06-16 05:11:17 +0000381
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000382 Py_ReprLeave((PyObject *)v);
Victor Stinner5c733472013-11-18 21:11:57 +0100383 return _PyUnicodeWriter_Finish(&writer);
Antoine Pitroueeb7eea2011-10-06 18:57:27 +0200384
385error:
Victor Stinner5c733472013-11-18 21:11:57 +0100386 _PyUnicodeWriter_Dealloc(&writer);
Antoine Pitroueeb7eea2011-10-06 18:57:27 +0200387 Py_ReprLeave((PyObject *)v);
388 return NULL;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000389}
390
Martin v. Löwis18e16552006-02-15 17:27:45 +0000391static Py_ssize_t
Fred Drakea2f55112000-07-09 15:16:51 +0000392list_length(PyListObject *a)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000393{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000394 return Py_SIZE(a);
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000395}
396
Jeremy Hylton37b1a262000-04-27 21:41:03 +0000397static int
Fred Drakea2f55112000-07-09 15:16:51 +0000398list_contains(PyListObject *a, PyObject *el)
Jeremy Hylton37b1a262000-04-27 21:41:03 +0000399{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000400 Py_ssize_t i;
401 int cmp;
Jeremy Hylton37b1a262000-04-27 21:41:03 +0000402
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000403 for (i = 0, cmp = 0 ; cmp == 0 && i < Py_SIZE(a); ++i)
404 cmp = PyObject_RichCompareBool(el, PyList_GET_ITEM(a, i),
405 Py_EQ);
406 return cmp;
Jeremy Hylton37b1a262000-04-27 21:41:03 +0000407}
408
Guido van Rossumc0b618a1997-05-02 03:12:38 +0000409static PyObject *
Martin v. Löwis18e16552006-02-15 17:27:45 +0000410list_item(PyListObject *a, Py_ssize_t i)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000411{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000412 if (i < 0 || i >= Py_SIZE(a)) {
413 if (indexerr == NULL) {
414 indexerr = PyUnicode_FromString(
415 "list index out of range");
416 if (indexerr == NULL)
417 return NULL;
418 }
419 PyErr_SetObject(PyExc_IndexError, indexerr);
420 return NULL;
421 }
422 Py_INCREF(a->ob_item[i]);
423 return a->ob_item[i];
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000424}
425
Guido van Rossumc0b618a1997-05-02 03:12:38 +0000426static PyObject *
Martin v. Löwis18e16552006-02-15 17:27:45 +0000427list_slice(PyListObject *a, Py_ssize_t ilow, Py_ssize_t ihigh)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000428{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000429 PyListObject *np;
430 PyObject **src, **dest;
431 Py_ssize_t i, len;
432 if (ilow < 0)
433 ilow = 0;
434 else if (ilow > Py_SIZE(a))
435 ilow = Py_SIZE(a);
436 if (ihigh < ilow)
437 ihigh = ilow;
438 else if (ihigh > Py_SIZE(a))
439 ihigh = Py_SIZE(a);
440 len = ihigh - ilow;
441 np = (PyListObject *) PyList_New(len);
442 if (np == NULL)
443 return NULL;
Raymond Hettinger99842b62004-03-08 05:56:15 +0000444
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000445 src = a->ob_item + ilow;
446 dest = np->ob_item;
447 for (i = 0; i < len; i++) {
448 PyObject *v = src[i];
449 Py_INCREF(v);
450 dest[i] = v;
451 }
452 return (PyObject *)np;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000453}
454
Guido van Rossumc0b618a1997-05-02 03:12:38 +0000455PyObject *
Martin v. Löwis18e16552006-02-15 17:27:45 +0000456PyList_GetSlice(PyObject *a, Py_ssize_t ilow, Py_ssize_t ihigh)
Guido van Rossum234f9421993-06-17 12:35:49 +0000457{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000458 if (!PyList_Check(a)) {
459 PyErr_BadInternalCall();
460 return NULL;
461 }
462 return list_slice((PyListObject *)a, ilow, ihigh);
Guido van Rossum234f9421993-06-17 12:35:49 +0000463}
464
Guido van Rossumc0b618a1997-05-02 03:12:38 +0000465static PyObject *
Fred Drakea2f55112000-07-09 15:16:51 +0000466list_concat(PyListObject *a, PyObject *bb)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000467{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000468 Py_ssize_t size;
469 Py_ssize_t i;
470 PyObject **src, **dest;
471 PyListObject *np;
472 if (!PyList_Check(bb)) {
473 PyErr_Format(PyExc_TypeError,
474 "can only concatenate list (not \"%.200s\") to list",
475 bb->ob_type->tp_name);
476 return NULL;
477 }
Guido van Rossumc0b618a1997-05-02 03:12:38 +0000478#define b ((PyListObject *)bb)
Martin Panterb93d8632016-07-25 02:39:20 +0000479 if (Py_SIZE(a) > PY_SSIZE_T_MAX - Py_SIZE(b))
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000480 return PyErr_NoMemory();
Martin Panterb93d8632016-07-25 02:39:20 +0000481 size = Py_SIZE(a) + Py_SIZE(b);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000482 np = (PyListObject *) PyList_New(size);
483 if (np == NULL) {
484 return NULL;
485 }
486 src = a->ob_item;
487 dest = np->ob_item;
488 for (i = 0; i < Py_SIZE(a); i++) {
489 PyObject *v = src[i];
490 Py_INCREF(v);
491 dest[i] = v;
492 }
493 src = b->ob_item;
494 dest = np->ob_item + Py_SIZE(a);
495 for (i = 0; i < Py_SIZE(b); i++) {
496 PyObject *v = src[i];
497 Py_INCREF(v);
498 dest[i] = v;
499 }
500 return (PyObject *)np;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000501#undef b
502}
503
Guido van Rossumc0b618a1997-05-02 03:12:38 +0000504static PyObject *
Martin v. Löwis18e16552006-02-15 17:27:45 +0000505list_repeat(PyListObject *a, Py_ssize_t n)
Guido van Rossumed98d481991-03-06 13:07:53 +0000506{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000507 Py_ssize_t i, j;
508 Py_ssize_t size;
509 PyListObject *np;
510 PyObject **p, **items;
511 PyObject *elem;
512 if (n < 0)
513 n = 0;
Mark Dickinsonc0420fd2011-09-19 19:18:37 +0100514 if (n > 0 && Py_SIZE(a) > PY_SSIZE_T_MAX / n)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000515 return PyErr_NoMemory();
Mark Dickinsonc0420fd2011-09-19 19:18:37 +0100516 size = Py_SIZE(a) * n;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000517 if (size == 0)
518 return PyList_New(0);
519 np = (PyListObject *) PyList_New(size);
520 if (np == NULL)
521 return NULL;
Raymond Hettinger6624e682003-05-21 05:58:46 +0000522
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000523 items = np->ob_item;
524 if (Py_SIZE(a) == 1) {
525 elem = a->ob_item[0];
526 for (i = 0; i < n; i++) {
527 items[i] = elem;
528 Py_INCREF(elem);
529 }
530 return (PyObject *) np;
531 }
532 p = np->ob_item;
533 items = a->ob_item;
534 for (i = 0; i < n; i++) {
535 for (j = 0; j < Py_SIZE(a); j++) {
536 *p = items[j];
537 Py_INCREF(*p);
538 p++;
539 }
540 }
541 return (PyObject *) np;
Guido van Rossumed98d481991-03-06 13:07:53 +0000542}
543
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000544static int
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200545_list_clear(PyListObject *a)
Armin Rigo93677f02004-07-29 12:40:23 +0000546{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000547 Py_ssize_t i;
548 PyObject **item = a->ob_item;
549 if (item != NULL) {
550 /* Because XDECREF can recursively invoke operations on
551 this list, we make it empty first. */
552 i = Py_SIZE(a);
553 Py_SIZE(a) = 0;
554 a->ob_item = NULL;
555 a->allocated = 0;
556 while (--i >= 0) {
557 Py_XDECREF(item[i]);
558 }
559 PyMem_FREE(item);
560 }
561 /* Never fails; the return value can be ignored.
562 Note that there is no guarantee that the list is actually empty
563 at this point, because XDECREF may have populated it again! */
564 return 0;
Armin Rigo93677f02004-07-29 12:40:23 +0000565}
566
Tim Peters8fc4a912004-07-31 21:53:19 +0000567/* a[ilow:ihigh] = v if v != NULL.
568 * del a[ilow:ihigh] if v == NULL.
569 *
570 * Special speed gimmick: when v is NULL and ihigh - ilow <= 8, it's
571 * guaranteed the call cannot fail.
572 */
Armin Rigo93677f02004-07-29 12:40:23 +0000573static int
Martin v. Löwis18e16552006-02-15 17:27:45 +0000574list_ass_slice(PyListObject *a, Py_ssize_t ilow, Py_ssize_t ihigh, PyObject *v)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000575{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000576 /* Because [X]DECREF can recursively invoke list operations on
577 this list, we must postpone all [X]DECREF activity until
578 after the list is back in its canonical shape. Therefore
579 we must allocate an additional array, 'recycle', into which
580 we temporarily copy the items that are deleted from the
581 list. :-( */
582 PyObject *recycle_on_stack[8];
583 PyObject **recycle = recycle_on_stack; /* will allocate more if needed */
584 PyObject **item;
585 PyObject **vitem = NULL;
586 PyObject *v_as_SF = NULL; /* PySequence_Fast(v) */
587 Py_ssize_t n; /* # of elements in replacement list */
588 Py_ssize_t norig; /* # of elements in list getting replaced */
589 Py_ssize_t d; /* Change in size */
590 Py_ssize_t k;
591 size_t s;
592 int result = -1; /* guilty until proved innocent */
Guido van Rossumc0b618a1997-05-02 03:12:38 +0000593#define b ((PyListObject *)v)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000594 if (v == NULL)
595 n = 0;
596 else {
597 if (a == b) {
598 /* Special case "a[i:j] = a" -- copy b first */
599 v = list_slice(b, 0, Py_SIZE(b));
600 if (v == NULL)
601 return result;
602 result = list_ass_slice(a, ilow, ihigh, v);
603 Py_DECREF(v);
604 return result;
605 }
606 v_as_SF = PySequence_Fast(v, "can only assign an iterable");
607 if(v_as_SF == NULL)
608 goto Error;
609 n = PySequence_Fast_GET_SIZE(v_as_SF);
610 vitem = PySequence_Fast_ITEMS(v_as_SF);
611 }
612 if (ilow < 0)
613 ilow = 0;
614 else if (ilow > Py_SIZE(a))
615 ilow = Py_SIZE(a);
Tim Peters8d9eb102004-07-31 02:24:20 +0000616
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000617 if (ihigh < ilow)
618 ihigh = ilow;
619 else if (ihigh > Py_SIZE(a))
620 ihigh = Py_SIZE(a);
Armin Rigo93677f02004-07-29 12:40:23 +0000621
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000622 norig = ihigh - ilow;
623 assert(norig >= 0);
624 d = n - norig;
625 if (Py_SIZE(a) + d == 0) {
626 Py_XDECREF(v_as_SF);
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200627 return _list_clear(a);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000628 }
629 item = a->ob_item;
630 /* recycle the items that we are about to remove */
631 s = norig * sizeof(PyObject *);
Benjamin Peterson5a7d9232016-09-06 17:58:25 -0700632 /* If norig == 0, item might be NULL, in which case we may not memcpy from it. */
633 if (s) {
634 if (s > sizeof(recycle_on_stack)) {
635 recycle = (PyObject **)PyMem_MALLOC(s);
636 if (recycle == NULL) {
637 PyErr_NoMemory();
638 goto Error;
639 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000640 }
Benjamin Peterson5a7d9232016-09-06 17:58:25 -0700641 memcpy(recycle, &item[ilow], s);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000642 }
Tim Peters8d9eb102004-07-31 02:24:20 +0000643
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000644 if (d < 0) { /* Delete -d items */
Victor Stinner2c40f642013-07-19 23:06:21 +0200645 Py_ssize_t tail;
646 tail = (Py_SIZE(a) - ihigh) * sizeof(PyObject *);
647 memmove(&item[ihigh+d], &item[ihigh], tail);
648 if (list_resize(a, Py_SIZE(a) + d) < 0) {
649 memmove(&item[ihigh], &item[ihigh+d], tail);
650 memcpy(&item[ilow], recycle, s);
651 goto Error;
652 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000653 item = a->ob_item;
654 }
655 else if (d > 0) { /* Insert d items */
656 k = Py_SIZE(a);
657 if (list_resize(a, k+d) < 0)
658 goto Error;
659 item = a->ob_item;
660 memmove(&item[ihigh+d], &item[ihigh],
661 (k - ihigh)*sizeof(PyObject *));
662 }
663 for (k = 0; k < n; k++, ilow++) {
664 PyObject *w = vitem[k];
665 Py_XINCREF(w);
666 item[ilow] = w;
667 }
668 for (k = norig - 1; k >= 0; --k)
669 Py_XDECREF(recycle[k]);
670 result = 0;
Tim Peters8d9eb102004-07-31 02:24:20 +0000671 Error:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000672 if (recycle != recycle_on_stack)
673 PyMem_FREE(recycle);
674 Py_XDECREF(v_as_SF);
675 return result;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000676#undef b
677}
678
Guido van Rossum234f9421993-06-17 12:35:49 +0000679int
Martin v. Löwis18e16552006-02-15 17:27:45 +0000680PyList_SetSlice(PyObject *a, Py_ssize_t ilow, Py_ssize_t ihigh, PyObject *v)
Guido van Rossum234f9421993-06-17 12:35:49 +0000681{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000682 if (!PyList_Check(a)) {
683 PyErr_BadInternalCall();
684 return -1;
685 }
686 return list_ass_slice((PyListObject *)a, ilow, ihigh, v);
Guido van Rossum234f9421993-06-17 12:35:49 +0000687}
688
Thomas Wouterse289e0b2000-08-24 20:08:19 +0000689static PyObject *
Martin v. Löwis18e16552006-02-15 17:27:45 +0000690list_inplace_repeat(PyListObject *self, Py_ssize_t n)
Thomas Wouterse289e0b2000-08-24 20:08:19 +0000691{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000692 PyObject **items;
693 Py_ssize_t size, i, j, p;
Thomas Wouterse289e0b2000-08-24 20:08:19 +0000694
695
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000696 size = PyList_GET_SIZE(self);
697 if (size == 0 || n == 1) {
698 Py_INCREF(self);
699 return (PyObject *)self;
700 }
Thomas Wouterse289e0b2000-08-24 20:08:19 +0000701
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000702 if (n < 1) {
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200703 (void)_list_clear(self);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000704 Py_INCREF(self);
705 return (PyObject *)self;
706 }
Thomas Wouterse289e0b2000-08-24 20:08:19 +0000707
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000708 if (size > PY_SSIZE_T_MAX / n) {
709 return PyErr_NoMemory();
710 }
Christian Heimesaf98da12008-01-27 15:18:18 +0000711
Raymond Hettinger0dceb912016-01-25 10:33:30 -0800712 if (list_resize(self, size*n) < 0)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000713 return NULL;
Raymond Hettinger4bb95402004-02-13 11:36:39 +0000714
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000715 p = size;
716 items = self->ob_item;
717 for (i = 1; i < n; i++) { /* Start counting at 1, not 0 */
718 for (j = 0; j < size; j++) {
719 PyObject *o = items[j];
720 Py_INCREF(o);
721 items[p++] = o;
722 }
723 }
724 Py_INCREF(self);
725 return (PyObject *)self;
Thomas Wouterse289e0b2000-08-24 20:08:19 +0000726}
727
Guido van Rossum4a450d01991-04-03 19:05:18 +0000728static int
Martin v. Löwis18e16552006-02-15 17:27:45 +0000729list_ass_item(PyListObject *a, Py_ssize_t i, PyObject *v)
Guido van Rossum4a450d01991-04-03 19:05:18 +0000730{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000731 if (i < 0 || i >= Py_SIZE(a)) {
732 PyErr_SetString(PyExc_IndexError,
733 "list assignment index out of range");
734 return -1;
735 }
736 if (v == NULL)
737 return list_ass_slice(a, i, i+1, v);
738 Py_INCREF(v);
Serhiy Storchakaf01e4082016-04-10 18:12:01 +0300739 Py_SETREF(a->ob_item[i], v);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000740 return 0;
Guido van Rossum4a450d01991-04-03 19:05:18 +0000741}
742
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200743/*[clinic input]
744list.insert
745
746 index: Py_ssize_t
747 object: object
748 /
749
750Insert object before index.
751[clinic start generated code]*/
752
Guido van Rossumc0b618a1997-05-02 03:12:38 +0000753static PyObject *
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200754list_insert_impl(PyListObject *self, Py_ssize_t index, PyObject *object)
755/*[clinic end generated code: output=7f35e32f60c8cb78 input=858514cf894c7eab]*/
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000756{
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200757 if (ins1(self, index, object) == 0)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000758 Py_RETURN_NONE;
759 return NULL;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000760}
761
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200762/*[clinic input]
763list.clear
764
765Remove all items from list.
766[clinic start generated code]*/
767
Guido van Rossumc0b618a1997-05-02 03:12:38 +0000768static PyObject *
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200769list_clear_impl(PyListObject *self)
770/*[clinic end generated code: output=67a1896c01f74362 input=ca3c1646856742f6]*/
Eli Benderskycbbaa962011-02-25 05:47:53 +0000771{
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200772 _list_clear(self);
Eli Benderskycbbaa962011-02-25 05:47:53 +0000773 Py_RETURN_NONE;
774}
775
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200776/*[clinic input]
777list.copy
778
779Return a shallow copy of the list.
780[clinic start generated code]*/
781
Eli Benderskycbbaa962011-02-25 05:47:53 +0000782static PyObject *
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200783list_copy_impl(PyListObject *self)
784/*[clinic end generated code: output=ec6b72d6209d418e input=6453ab159e84771f]*/
Eli Benderskycbbaa962011-02-25 05:47:53 +0000785{
786 return list_slice(self, 0, Py_SIZE(self));
787}
788
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200789/*[clinic input]
790list.append
791
792 object: object
793 /
794
795Append object to the end of the list.
796[clinic start generated code]*/
797
Eli Benderskycbbaa962011-02-25 05:47:53 +0000798static PyObject *
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200799list_append(PyListObject *self, PyObject *object)
800/*[clinic end generated code: output=7c096003a29c0eae input=43a3fe48a7066e91]*/
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000801{
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200802 if (app1(self, object) == 0)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000803 Py_RETURN_NONE;
804 return NULL;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000805}
806
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200807/*[clinic input]
808list.extend
809
810 iterable: object
811 /
812
813Extend list by appending elements from the iterable.
814[clinic start generated code]*/
815
Barry Warsawdedf6d61998-10-09 16:37:25 +0000816static PyObject *
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200817list_extend(PyListObject *self, PyObject *iterable)
818/*[clinic end generated code: output=630fb3bca0c8e789 input=9ec5ba3a81be3a4d]*/
Thomas Wouterse289e0b2000-08-24 20:08:19 +0000819{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000820 PyObject *it; /* iter(v) */
821 Py_ssize_t m; /* size of self */
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200822 Py_ssize_t n; /* guess for size of iterable */
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000823 Py_ssize_t mn; /* m + n */
824 Py_ssize_t i;
825 PyObject *(*iternext)(PyObject *);
Thomas Wouterse289e0b2000-08-24 20:08:19 +0000826
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000827 /* Special cases:
828 1) lists and tuples which can use PySequence_Fast ops
829 2) extending self to self requires making a copy first
830 */
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200831 if (PyList_CheckExact(iterable) || PyTuple_CheckExact(iterable) ||
832 (PyObject *)self == iterable) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000833 PyObject **src, **dest;
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200834 iterable = PySequence_Fast(iterable, "argument must be iterable");
835 if (!iterable)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000836 return NULL;
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200837 n = PySequence_Fast_GET_SIZE(iterable);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000838 if (n == 0) {
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200839 /* short circuit when iterable is empty */
840 Py_DECREF(iterable);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000841 Py_RETURN_NONE;
842 }
843 m = Py_SIZE(self);
Martin Panter94b39ce2017-01-14 06:30:37 +0000844 /* It should not be possible to allocate a list large enough to cause
845 an overflow on any relevant platform */
846 assert(m < PY_SSIZE_T_MAX - n);
Raymond Hettinger0dceb912016-01-25 10:33:30 -0800847 if (list_resize(self, m + n) < 0) {
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200848 Py_DECREF(iterable);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000849 return NULL;
850 }
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200851 /* note that we may still have self == iterable here for the
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000852 * situation a.extend(a), but the following code works
853 * in that case too. Just make sure to resize self
854 * before calling PySequence_Fast_ITEMS.
855 */
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200856 /* populate the end of self with iterable's items */
857 src = PySequence_Fast_ITEMS(iterable);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000858 dest = self->ob_item + m;
859 for (i = 0; i < n; i++) {
860 PyObject *o = src[i];
861 Py_INCREF(o);
862 dest[i] = o;
863 }
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200864 Py_DECREF(iterable);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000865 Py_RETURN_NONE;
866 }
Raymond Hettinger90a39bf2004-02-15 03:57:00 +0000867
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200868 it = PyObject_GetIter(iterable);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000869 if (it == NULL)
870 return NULL;
871 iternext = *it->ob_type->tp_iternext;
Thomas Wouterse289e0b2000-08-24 20:08:19 +0000872
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000873 /* Guess a result list size. */
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200874 n = PyObject_LengthHint(iterable, 8);
Raymond Hettinger0dceb912016-01-25 10:33:30 -0800875 if (n < 0) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000876 Py_DECREF(it);
877 return NULL;
878 }
879 m = Py_SIZE(self);
Martin Panterb93d8632016-07-25 02:39:20 +0000880 if (m > PY_SSIZE_T_MAX - n) {
881 /* m + n overflowed; on the chance that n lied, and there really
882 * is enough room, ignore it. If n was telling the truth, we'll
883 * eventually run out of memory during the loop.
884 */
885 }
886 else {
887 mn = m + n;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000888 /* Make room. */
Raymond Hettinger0dceb912016-01-25 10:33:30 -0800889 if (list_resize(self, mn) < 0)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000890 goto error;
891 /* Make the list sane again. */
892 Py_SIZE(self) = m;
893 }
Thomas Wouterse289e0b2000-08-24 20:08:19 +0000894
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000895 /* Run iterator to exhaustion. */
896 for (;;) {
897 PyObject *item = iternext(it);
898 if (item == NULL) {
899 if (PyErr_Occurred()) {
900 if (PyErr_ExceptionMatches(PyExc_StopIteration))
901 PyErr_Clear();
902 else
903 goto error;
904 }
905 break;
906 }
907 if (Py_SIZE(self) < self->allocated) {
908 /* steals ref */
909 PyList_SET_ITEM(self, Py_SIZE(self), item);
910 ++Py_SIZE(self);
911 }
912 else {
913 int status = app1(self, item);
914 Py_DECREF(item); /* append creates a new ref */
915 if (status < 0)
916 goto error;
917 }
918 }
Raymond Hettinger90a39bf2004-02-15 03:57:00 +0000919
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000920 /* Cut back result list if initial guess was too large. */
Victor Stinner32fd6ea2013-07-16 21:45:58 +0200921 if (Py_SIZE(self) < self->allocated) {
922 if (list_resize(self, Py_SIZE(self)) < 0)
923 goto error;
924 }
Raymond Hettingeraa241e02004-09-26 19:24:20 +0000925
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000926 Py_DECREF(it);
927 Py_RETURN_NONE;
Raymond Hettinger90a39bf2004-02-15 03:57:00 +0000928
929 error:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000930 Py_DECREF(it);
931 return NULL;
Thomas Wouterse289e0b2000-08-24 20:08:19 +0000932}
933
/* Non-static entry point that forwards to list_extend(); the result of
 * list_extend() is returned unchanged.
 */
PyObject *
_PyList_Extend(PyListObject *self, PyObject *iterable)
{
    return list_extend(self, iterable);
}
939
Thomas Wouterse289e0b2000-08-24 20:08:19 +0000940static PyObject *
Raymond Hettinger97bc6182004-03-11 07:34:19 +0000941list_inplace_concat(PyListObject *self, PyObject *other)
942{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000943 PyObject *result;
Raymond Hettinger97bc6182004-03-11 07:34:19 +0000944
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200945 result = list_extend(self, other);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000946 if (result == NULL)
947 return result;
948 Py_DECREF(result);
949 Py_INCREF(self);
950 return (PyObject *)self;
Raymond Hettinger97bc6182004-03-11 07:34:19 +0000951}
952
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200953/*[clinic input]
954list.pop
955
956 index: Py_ssize_t = -1
957 /
958
959Remove and return item at index (default last).
960
961Raises IndexError if list is empty or index is out of range.
962[clinic start generated code]*/
963
Raymond Hettinger97bc6182004-03-11 07:34:19 +0000964static PyObject *
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200965list_pop_impl(PyListObject *self, Py_ssize_t index)
966/*[clinic end generated code: output=6bd69dcb3f17eca8 input=b83675976f329e6f]*/
Guido van Rossum3dd7f3f1998-06-30 15:36:32 +0000967{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000968 PyObject *v;
969 int status;
Raymond Hettinger9eb86b32004-02-17 11:36:16 +0000970
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000971 if (Py_SIZE(self) == 0) {
972 /* Special-case most common failure cause */
973 PyErr_SetString(PyExc_IndexError, "pop from empty list");
974 return NULL;
975 }
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200976 if (index < 0)
977 index += Py_SIZE(self);
978 if (index < 0 || index >= Py_SIZE(self)) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000979 PyErr_SetString(PyExc_IndexError, "pop index out of range");
980 return NULL;
981 }
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200982 v = self->ob_item[index];
983 if (index == Py_SIZE(self) - 1) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000984 status = list_resize(self, Py_SIZE(self) - 1);
Victor Stinnerb27cd3e2013-07-08 22:20:44 +0200985 if (status >= 0)
986 return v; /* and v now owns the reference the list had */
987 else
988 return NULL;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000989 }
990 Py_INCREF(v);
Serhiy Storchakafdd42c42017-03-11 09:19:20 +0200991 status = list_ass_slice(self, index, index+1, (PyObject *)NULL);
Victor Stinner095d99f2013-07-17 21:58:01 +0200992 if (status < 0) {
993 Py_DECREF(v);
994 return NULL;
995 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000996 return v;
Guido van Rossum3dd7f3f1998-06-30 15:36:32 +0000997}
998
Tim Peters8e2e7ca2002-07-19 02:33:08 +0000999/* Reverse a slice of a list in place, from lo up to (exclusive) hi. */
1000static void
1001reverse_slice(PyObject **lo, PyObject **hi)
1002{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001003 assert(lo && hi);
Tim Peters8e2e7ca2002-07-19 02:33:08 +00001004
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001005 --hi;
1006 while (lo < hi) {
1007 PyObject *t = *lo;
1008 *lo = *hi;
1009 *hi = t;
1010 ++lo;
1011 --hi;
1012 }
Tim Peters8e2e7ca2002-07-19 02:33:08 +00001013}
1014
Tim Petersa64dc242002-08-01 02:13:36 +00001015/* Lots of code for an adaptive, stable, natural mergesort. There are many
1016 * pieces to this algorithm; read listsort.txt for overviews and details.
1017 */
Guido van Rossum3f236de1996-12-10 23:55:39 +00001018
Daniel Stutzbach98338222010-12-02 21:55:33 +00001019/* A sortslice contains a pointer to an array of keys and a pointer to
1020 * an array of corresponding values. In other words, keys[i]
1021 * corresponds with values[i]. If values == NULL, then the keys are
1022 * also the values.
1023 *
1024 * Several convenience routines are provided here, so that keys and
1025 * values are always moved in sync.
1026 */
1027
typedef struct {
    PyObject **keys;    /* array of sort keys */
    PyObject **values;  /* parallel array of values, or NULL if keys are the values */
} sortslice;
1032
1033Py_LOCAL_INLINE(void)
1034sortslice_copy(sortslice *s1, Py_ssize_t i, sortslice *s2, Py_ssize_t j)
1035{
1036 s1->keys[i] = s2->keys[j];
1037 if (s1->values != NULL)
1038 s1->values[i] = s2->values[j];
1039}
1040
1041Py_LOCAL_INLINE(void)
Benjamin Peterson9efdcca2010-12-03 01:44:10 +00001042sortslice_copy_incr(sortslice *dst, sortslice *src)
1043{
Daniel Stutzbach98338222010-12-02 21:55:33 +00001044 *dst->keys++ = *src->keys++;
1045 if (dst->values != NULL)
1046 *dst->values++ = *src->values++;
1047}
1048
1049Py_LOCAL_INLINE(void)
Benjamin Peterson9efdcca2010-12-03 01:44:10 +00001050sortslice_copy_decr(sortslice *dst, sortslice *src)
1051{
Daniel Stutzbach98338222010-12-02 21:55:33 +00001052 *dst->keys-- = *src->keys--;
1053 if (dst->values != NULL)
1054 *dst->values-- = *src->values--;
1055}
1056
1057
1058Py_LOCAL_INLINE(void)
1059sortslice_memcpy(sortslice *s1, Py_ssize_t i, sortslice *s2, Py_ssize_t j,
Benjamin Peterson9efdcca2010-12-03 01:44:10 +00001060 Py_ssize_t n)
1061{
Daniel Stutzbach98338222010-12-02 21:55:33 +00001062 memcpy(&s1->keys[i], &s2->keys[j], sizeof(PyObject *) * n);
1063 if (s1->values != NULL)
1064 memcpy(&s1->values[i], &s2->values[j], sizeof(PyObject *) * n);
1065}
1066
1067Py_LOCAL_INLINE(void)
1068sortslice_memmove(sortslice *s1, Py_ssize_t i, sortslice *s2, Py_ssize_t j,
Benjamin Peterson9efdcca2010-12-03 01:44:10 +00001069 Py_ssize_t n)
1070{
Daniel Stutzbach98338222010-12-02 21:55:33 +00001071 memmove(&s1->keys[i], &s2->keys[j], sizeof(PyObject *) * n);
1072 if (s1->values != NULL)
1073 memmove(&s1->values[i], &s2->values[j], sizeof(PyObject *) * n);
1074}
1075
1076Py_LOCAL_INLINE(void)
Benjamin Peterson9efdcca2010-12-03 01:44:10 +00001077sortslice_advance(sortslice *slice, Py_ssize_t n)
1078{
Daniel Stutzbach98338222010-12-02 21:55:33 +00001079 slice->keys += n;
1080 if (slice->values != NULL)
1081 slice->values += n;
1082}
1083
/* Comparison function: ms->key_compare, which is set at run-time in
 * listsort_impl to optimize for various special cases.
 * Returns -1 on error, 1 if x < y, 0 if x >= y.
 * The expansion refers to a variable named "ms" (a MergeState pointer),
 * which must be in scope wherever ISLT is used.
 */

#define ISLT(X, Y) (*(ms->key_compare))(X, Y, ms)

/* Compare X to Y via "<".  Goto "fail" if the comparison raises an
   error.  Else "k" is set to true iff X<Y, and an "if (k)" block is
   started.  It makes more sense in context <wink>.  X and Y are PyObject*s.

   The expansion needs an integer variable "k", a label "fail" and (through
   ISLT) "ms" in the enclosing function.  It expands to TWO statements, the
   second being a bare "if (k)", so it must not be used as the unbraced body
   of another if/else/loop.
*/
#define IFLT(X, Y) if ((k = ISLT(X, Y)) < 0) goto fail;  \
           if (k)
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001097
/* The maximum number of entries in a MergeState's pending-runs stack.
 * This is enough to sort arrays of size up to about
 *     32 * phi ** MAX_MERGE_PENDING
 * where phi ~= 1.618.  85 is ridiculously large, good for an array
 * with 2**64 elements.
 */
#define MAX_MERGE_PENDING 85

/* When we get into galloping mode, we stay there until both runs win less
 * often than MIN_GALLOP consecutive times.  See listsort.txt for more info.
 */
#define MIN_GALLOP 7

/* Avoid malloc for small temp arrays: this is the number of PyObject*
 * slots in the temparray embedded in each MergeState.
 */
#define MERGESTATE_TEMP_SIZE 256
1113
/* One MergeState exists on the stack per invocation of mergesort.  It's just
 * a convenient way to pass state around among the helper functions.
 *
 * struct s_slice describes one entry of the MergeState's pending-runs
 * stack: where a run starts and how many elements it has.
 */
struct s_slice {
    sortslice base;     /* start of the run (keys, and values if any) */
    Py_ssize_t len;     /* number of elements in the run */
};
1121
typedef struct s_MergeState MergeState;
struct s_MergeState {
    /* This controls when we get *into* galloping mode.  It's initialized
     * to MIN_GALLOP.  merge_lo and merge_hi tend to nudge it higher for
     * random data, and lower for highly structured data.
     */
    Py_ssize_t min_gallop;

    /* 'a' is temp storage to help with merges.  It contains room for
     * alloced entries.
     */
    sortslice a;        /* may point to temparray below */
    Py_ssize_t alloced;

    /* A stack of n pending runs yet to be merged.  Run #i starts at
     * address pending[i].base and extends for pending[i].len elements.
     * It's always true (so long as the indices are in bounds) that
     *
     *     pending[i].base + pending[i].len == pending[i+1].base
     *
     * so we could cut the storage for this, but it's a minor amount,
     * and keeping all the info explicit simplifies the code.
     */
    int n;
    struct s_slice pending[MAX_MERGE_PENDING];

    /* 'a' points to this when possible, rather than muck with malloc. */
    PyObject *temparray[MERGESTATE_TEMP_SIZE];

    /* This is the function we will use to compare two keys,
     * even when none of our special cases apply and we have to use
     * safe_object_compare.  It is what the ISLT macro calls. */
    int (*key_compare)(PyObject *, PyObject *, MergeState *);

    /* This function is used by unsafe_object_compare to optimize comparisons
     * when we know our list is type-homogeneous but we can't assume anything else.
     * In the pre-sort check it is set equal to key->ob_type->tp_richcompare */
    PyObject *(*key_richcompare)(PyObject *, PyObject *, int);

    /* This function is used by unsafe_tuple_compare to compare the first elements
     * of tuples. It may be set to safe_object_compare, but the idea is that hopefully
     * we can assume more, and use one of the special-case compares. */
    int (*tuple_elem_compare)(PyObject *, PyObject *, MergeState *);
};
1166
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001167/* binarysort is the best method for sorting small arrays: it does
1168 few compares, but can do data movement quadratic in the number of
1169 elements.
Guido van Rossum42812581998-06-17 14:15:44 +00001170 [lo, hi) is a contiguous slice of a list, and is sorted via
Tim Petersa8c974c2002-07-19 03:30:57 +00001171 binary insertion. This sort is stable.
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001172 On entry, must have lo <= start <= hi, and that [lo, start) is already
1173 sorted (pass start == lo if you don't know!).
Tim Petersa8c974c2002-07-19 03:30:57 +00001174 If islt() complains return -1, else 0.
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001175 Even in case of error, the output slice will be some permutation of
1176 the input (nothing is lost or duplicated).
1177*/
Guido van Rossum3f236de1996-12-10 23:55:39 +00001178static int
embg1e34da42018-01-28 20:03:23 -07001179binarysort(MergeState *ms, sortslice lo, PyObject **hi, PyObject **start)
Guido van Rossum3f236de1996-12-10 23:55:39 +00001180{
Antoine Pitrou9ed5f272013-08-13 20:18:52 +02001181 Py_ssize_t k;
1182 PyObject **l, **p, **r;
1183 PyObject *pivot;
Guido van Rossum3f236de1996-12-10 23:55:39 +00001184
Daniel Stutzbach98338222010-12-02 21:55:33 +00001185 assert(lo.keys <= start && start <= hi);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001186 /* assert [lo, start) is sorted */
Daniel Stutzbach98338222010-12-02 21:55:33 +00001187 if (lo.keys == start)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001188 ++start;
1189 for (; start < hi; ++start) {
1190 /* set l to where *start belongs */
Daniel Stutzbach98338222010-12-02 21:55:33 +00001191 l = lo.keys;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001192 r = start;
1193 pivot = *r;
1194 /* Invariants:
1195 * pivot >= all in [lo, l).
1196 * pivot < all in [r, start).
1197 * The second is vacuously true at the start.
1198 */
1199 assert(l < r);
1200 do {
1201 p = l + ((r - l) >> 1);
1202 IFLT(pivot, *p)
1203 r = p;
1204 else
1205 l = p+1;
1206 } while (l < r);
1207 assert(l == r);
1208 /* The invariants still hold, so pivot >= all in [lo, l) and
1209 pivot < all in [l, start), so pivot belongs at l. Note
1210 that if there are elements equal to pivot, l points to the
1211 first slot after them -- that's why this sort is stable.
1212 Slide over to make room.
1213 Caution: using memmove is much slower under MSVC 5;
1214 we're not usually moving many slots. */
1215 for (p = start; p > l; --p)
1216 *p = *(p-1);
1217 *l = pivot;
Daniel Stutzbach98338222010-12-02 21:55:33 +00001218 if (lo.values != NULL) {
1219 Py_ssize_t offset = lo.values - lo.keys;
1220 p = start + offset;
1221 pivot = *p;
1222 l += offset;
1223 for (p = start + offset; p > l; --p)
1224 *p = *(p-1);
1225 *l = pivot;
1226 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001227 }
1228 return 0;
Guido van Rossuma119c0d1998-05-29 17:56:32 +00001229
1230 fail:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001231 return -1;
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001232}
1233
Tim Petersa64dc242002-08-01 02:13:36 +00001234/*
1235Return the length of the run beginning at lo, in the slice [lo, hi). lo < hi
1236is required on entry. "A run" is the longest ascending sequence, with
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001237
Tim Petersa64dc242002-08-01 02:13:36 +00001238 lo[0] <= lo[1] <= lo[2] <= ...
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001239
Tim Petersa64dc242002-08-01 02:13:36 +00001240or the longest descending sequence, with
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001241
Tim Petersa64dc242002-08-01 02:13:36 +00001242 lo[0] > lo[1] > lo[2] > ...
Tim Peters3b01a122002-07-19 02:35:45 +00001243
Tim Petersa64dc242002-08-01 02:13:36 +00001244Boolean *descending is set to 0 in the former case, or to 1 in the latter.
1245For its intended use in a stable mergesort, the strictness of the defn of
1246"descending" is needed so that the caller can safely reverse a descending
1247sequence without violating stability (strict > ensures there are no equal
1248elements to get out of order).
1249
1250Returns -1 in case of error.
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001251*/
Martin v. Löwis18e16552006-02-15 17:27:45 +00001252static Py_ssize_t
embg1e34da42018-01-28 20:03:23 -07001253count_run(MergeState *ms, PyObject **lo, PyObject **hi, int *descending)
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001254{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001255 Py_ssize_t k;
1256 Py_ssize_t n;
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001257
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001258 assert(lo < hi);
1259 *descending = 0;
1260 ++lo;
1261 if (lo == hi)
1262 return 1;
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001263
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001264 n = 2;
1265 IFLT(*lo, *(lo-1)) {
1266 *descending = 1;
1267 for (lo = lo+1; lo < hi; ++lo, ++n) {
1268 IFLT(*lo, *(lo-1))
1269 ;
1270 else
1271 break;
1272 }
1273 }
1274 else {
1275 for (lo = lo+1; lo < hi; ++lo, ++n) {
1276 IFLT(*lo, *(lo-1))
1277 break;
1278 }
1279 }
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001280
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001281 return n;
Tim Petersa64dc242002-08-01 02:13:36 +00001282fail:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001283 return -1;
Tim Petersa64dc242002-08-01 02:13:36 +00001284}
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001285
Tim Petersa64dc242002-08-01 02:13:36 +00001286/*
1287Locate the proper position of key in a sorted vector; if the vector contains
1288an element equal to key, return the position immediately to the left of
1289the leftmost equal element. [gallop_right() does the same except returns
1290the position to the right of the rightmost equal element (if any).]
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001291
Tim Petersa64dc242002-08-01 02:13:36 +00001292"a" is a sorted vector with n elements, starting at a[0]. n must be > 0.
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001293
Tim Petersa64dc242002-08-01 02:13:36 +00001294"hint" is an index at which to begin the search, 0 <= hint < n. The closer
1295hint is to the final result, the faster this runs.
1296
1297The return value is the int k in 0..n such that
1298
1299 a[k-1] < key <= a[k]
1300
1301pretending that *(a-1) is minus infinity and a[n] is plus infinity. IOW,
1302key belongs at index k; or, IOW, the first k elements of a should precede
1303key, and the last n-k should follow key.
1304
1305Returns -1 on error. See listsort.txt for info on the method.
1306*/
Martin v. Löwis18e16552006-02-15 17:27:45 +00001307static Py_ssize_t
embg1e34da42018-01-28 20:03:23 -07001308gallop_left(MergeState *ms, PyObject *key, PyObject **a, Py_ssize_t n, Py_ssize_t hint)
Tim Petersa64dc242002-08-01 02:13:36 +00001309{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001310 Py_ssize_t ofs;
1311 Py_ssize_t lastofs;
1312 Py_ssize_t k;
Tim Petersa64dc242002-08-01 02:13:36 +00001313
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001314 assert(key && a && n > 0 && hint >= 0 && hint < n);
Tim Petersa64dc242002-08-01 02:13:36 +00001315
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001316 a += hint;
1317 lastofs = 0;
1318 ofs = 1;
1319 IFLT(*a, key) {
1320 /* a[hint] < key -- gallop right, until
1321 * a[hint + lastofs] < key <= a[hint + ofs]
1322 */
1323 const Py_ssize_t maxofs = n - hint; /* &a[n-1] is highest */
1324 while (ofs < maxofs) {
1325 IFLT(a[ofs], key) {
1326 lastofs = ofs;
1327 ofs = (ofs << 1) + 1;
1328 if (ofs <= 0) /* int overflow */
1329 ofs = maxofs;
1330 }
1331 else /* key <= a[hint + ofs] */
1332 break;
1333 }
1334 if (ofs > maxofs)
1335 ofs = maxofs;
1336 /* Translate back to offsets relative to &a[0]. */
1337 lastofs += hint;
1338 ofs += hint;
1339 }
1340 else {
1341 /* key <= a[hint] -- gallop left, until
1342 * a[hint - ofs] < key <= a[hint - lastofs]
1343 */
1344 const Py_ssize_t maxofs = hint + 1; /* &a[0] is lowest */
1345 while (ofs < maxofs) {
1346 IFLT(*(a-ofs), key)
1347 break;
1348 /* key <= a[hint - ofs] */
1349 lastofs = ofs;
1350 ofs = (ofs << 1) + 1;
1351 if (ofs <= 0) /* int overflow */
1352 ofs = maxofs;
1353 }
1354 if (ofs > maxofs)
1355 ofs = maxofs;
1356 /* Translate back to positive offsets relative to &a[0]. */
1357 k = lastofs;
1358 lastofs = hint - ofs;
1359 ofs = hint - k;
1360 }
1361 a -= hint;
Tim Petersa64dc242002-08-01 02:13:36 +00001362
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001363 assert(-1 <= lastofs && lastofs < ofs && ofs <= n);
1364 /* Now a[lastofs] < key <= a[ofs], so key belongs somewhere to the
1365 * right of lastofs but no farther right than ofs. Do a binary
1366 * search, with invariant a[lastofs-1] < key <= a[ofs].
1367 */
1368 ++lastofs;
1369 while (lastofs < ofs) {
1370 Py_ssize_t m = lastofs + ((ofs - lastofs) >> 1);
Tim Petersa64dc242002-08-01 02:13:36 +00001371
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001372 IFLT(a[m], key)
1373 lastofs = m+1; /* a[m] < key */
1374 else
1375 ofs = m; /* key <= a[m] */
1376 }
1377 assert(lastofs == ofs); /* so a[ofs-1] < key <= a[ofs] */
1378 return ofs;
Tim Petersa64dc242002-08-01 02:13:36 +00001379
1380fail:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001381 return -1;
Tim Petersa64dc242002-08-01 02:13:36 +00001382}
1383
1384/*
1385Exactly like gallop_left(), except that if key already exists in a[0:n],
1386finds the position immediately to the right of the rightmost equal value.
1387
1388The return value is the int k in 0..n such that
1389
1390 a[k-1] <= key < a[k]
1391
1392or -1 if error.
1393
1394The code duplication is massive, but this is enough different given that
1395we're sticking to "<" comparisons that it's much harder to follow if
1396written as one routine with yet another "left or right?" flag.
1397*/
Martin v. Löwis18e16552006-02-15 17:27:45 +00001398static Py_ssize_t
embg1e34da42018-01-28 20:03:23 -07001399gallop_right(MergeState *ms, PyObject *key, PyObject **a, Py_ssize_t n, Py_ssize_t hint)
Tim Petersa64dc242002-08-01 02:13:36 +00001400{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001401 Py_ssize_t ofs;
1402 Py_ssize_t lastofs;
1403 Py_ssize_t k;
Tim Petersa64dc242002-08-01 02:13:36 +00001404
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001405 assert(key && a && n > 0 && hint >= 0 && hint < n);
Tim Petersa64dc242002-08-01 02:13:36 +00001406
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001407 a += hint;
1408 lastofs = 0;
1409 ofs = 1;
1410 IFLT(key, *a) {
1411 /* key < a[hint] -- gallop left, until
1412 * a[hint - ofs] <= key < a[hint - lastofs]
1413 */
1414 const Py_ssize_t maxofs = hint + 1; /* &a[0] is lowest */
1415 while (ofs < maxofs) {
1416 IFLT(key, *(a-ofs)) {
1417 lastofs = ofs;
1418 ofs = (ofs << 1) + 1;
1419 if (ofs <= 0) /* int overflow */
1420 ofs = maxofs;
1421 }
1422 else /* a[hint - ofs] <= key */
1423 break;
1424 }
1425 if (ofs > maxofs)
1426 ofs = maxofs;
1427 /* Translate back to positive offsets relative to &a[0]. */
1428 k = lastofs;
1429 lastofs = hint - ofs;
1430 ofs = hint - k;
1431 }
1432 else {
1433 /* a[hint] <= key -- gallop right, until
1434 * a[hint + lastofs] <= key < a[hint + ofs]
1435 */
1436 const Py_ssize_t maxofs = n - hint; /* &a[n-1] is highest */
1437 while (ofs < maxofs) {
1438 IFLT(key, a[ofs])
1439 break;
1440 /* a[hint + ofs] <= key */
1441 lastofs = ofs;
1442 ofs = (ofs << 1) + 1;
1443 if (ofs <= 0) /* int overflow */
1444 ofs = maxofs;
1445 }
1446 if (ofs > maxofs)
1447 ofs = maxofs;
1448 /* Translate back to offsets relative to &a[0]. */
1449 lastofs += hint;
1450 ofs += hint;
1451 }
1452 a -= hint;
Tim Petersa64dc242002-08-01 02:13:36 +00001453
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001454 assert(-1 <= lastofs && lastofs < ofs && ofs <= n);
1455 /* Now a[lastofs] <= key < a[ofs], so key belongs somewhere to the
1456 * right of lastofs but no farther right than ofs. Do a binary
1457 * search, with invariant a[lastofs-1] <= key < a[ofs].
1458 */
1459 ++lastofs;
1460 while (lastofs < ofs) {
1461 Py_ssize_t m = lastofs + ((ofs - lastofs) >> 1);
Tim Petersa64dc242002-08-01 02:13:36 +00001462
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001463 IFLT(key, a[m])
1464 ofs = m; /* key < a[m] */
1465 else
1466 lastofs = m+1; /* a[m] <= key */
1467 }
1468 assert(lastofs == ofs); /* so a[ofs-1] <= key < a[ofs] */
1469 return ofs;
Tim Petersa64dc242002-08-01 02:13:36 +00001470
1471fail:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001472 return -1;
Tim Petersa64dc242002-08-01 02:13:36 +00001473}
1474
Tim Petersa64dc242002-08-01 02:13:36 +00001475/* Conceptually a MergeState's constructor. */
1476static void
Victor Stinner0fcab4a2011-01-04 12:59:15 +00001477merge_init(MergeState *ms, Py_ssize_t list_size, int has_keyfunc)
Tim Petersa64dc242002-08-01 02:13:36 +00001478{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001479 assert(ms != NULL);
Daniel Stutzbach98338222010-12-02 21:55:33 +00001480 if (has_keyfunc) {
1481 /* The temporary space for merging will need at most half the list
1482 * size rounded up. Use the minimum possible space so we can use the
1483 * rest of temparray for other things. In particular, if there is
1484 * enough extra space, listsort() will use it to store the keys.
1485 */
1486 ms->alloced = (list_size + 1) / 2;
1487
1488 /* ms->alloced describes how many keys will be stored at
1489 ms->temparray, but we also need to store the values. Hence,
1490 ms->alloced is capped at half of MERGESTATE_TEMP_SIZE. */
1491 if (MERGESTATE_TEMP_SIZE / 2 < ms->alloced)
1492 ms->alloced = MERGESTATE_TEMP_SIZE / 2;
1493 ms->a.values = &ms->temparray[ms->alloced];
1494 }
1495 else {
1496 ms->alloced = MERGESTATE_TEMP_SIZE;
1497 ms->a.values = NULL;
1498 }
1499 ms->a.keys = ms->temparray;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001500 ms->n = 0;
1501 ms->min_gallop = MIN_GALLOP;
Tim Petersa64dc242002-08-01 02:13:36 +00001502}
1503
1504/* Free all the temp memory owned by the MergeState. This must be called
1505 * when you're done with a MergeState, and may be called before then if
1506 * you want to free the temp memory early.
1507 */
1508static void
1509merge_freemem(MergeState *ms)
1510{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001511 assert(ms != NULL);
Daniel Stutzbach98338222010-12-02 21:55:33 +00001512 if (ms->a.keys != ms->temparray)
1513 PyMem_Free(ms->a.keys);
Tim Petersa64dc242002-08-01 02:13:36 +00001514}
1515
1516/* Ensure enough temp memory for 'need' array slots is available.
1517 * Returns 0 on success and -1 if the memory can't be gotten.
1518 */
1519static int
Martin v. Löwis18e16552006-02-15 17:27:45 +00001520merge_getmem(MergeState *ms, Py_ssize_t need)
Tim Petersa64dc242002-08-01 02:13:36 +00001521{
Daniel Stutzbach98338222010-12-02 21:55:33 +00001522 int multiplier;
1523
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001524 assert(ms != NULL);
1525 if (need <= ms->alloced)
1526 return 0;
Daniel Stutzbach98338222010-12-02 21:55:33 +00001527
1528 multiplier = ms->a.values != NULL ? 2 : 1;
1529
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001530 /* Don't realloc! That can cost cycles to copy the old data, but
1531 * we don't care what's in the block.
1532 */
1533 merge_freemem(ms);
embg1e34da42018-01-28 20:03:23 -07001534 if ((size_t)need > PY_SSIZE_T_MAX / sizeof(PyObject *) / multiplier) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001535 PyErr_NoMemory();
1536 return -1;
1537 }
embg1e34da42018-01-28 20:03:23 -07001538 ms->a.keys = (PyObject **)PyMem_Malloc(multiplier * need
Daniel Stutzbach98338222010-12-02 21:55:33 +00001539 * sizeof(PyObject *));
1540 if (ms->a.keys != NULL) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001541 ms->alloced = need;
Daniel Stutzbach98338222010-12-02 21:55:33 +00001542 if (ms->a.values != NULL)
1543 ms->a.values = &ms->a.keys[need];
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001544 return 0;
1545 }
1546 PyErr_NoMemory();
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001547 return -1;
Tim Petersa64dc242002-08-01 02:13:36 +00001548}
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001549#define MERGE_GETMEM(MS, NEED) ((NEED) <= (MS)->alloced ? 0 : \
1550 merge_getmem(MS, NEED))
Tim Petersa64dc242002-08-01 02:13:36 +00001551
/* Merge the na elements starting at ssa with the nb elements starting at
 * ssb.keys = ssa.keys + na in a stable way, in-place.  na and nb must be > 0.
 * Must also have that ssa.keys[na-1] belongs at the end of the merge, and
 * should have na <= nb.  See listsort.txt for more info.  Return 0 if
 * successful, -1 if error.
 *
 * Outline: run A is first copied into the temp area (ms->a), then the merge
 * proceeds left to right, writing through 'dest' into the space A used to
 * occupy.  The very first element is taken from B without a comparison
 * (presumably because merge_at() has already skipped the part of A that
 * sorts before ssb.keys[0] -- confirm against the caller).
 *
 * On a comparison error (ISLT or a gallop returning < 0) the elements of A
 * still sitting in the temp area are copied back before returning, so no
 * element is dropped from the destination.
 */
static Py_ssize_t
merge_lo(MergeState *ms, sortslice ssa, Py_ssize_t na,
         sortslice ssb, Py_ssize_t nb)
{
    Py_ssize_t k;
    sortslice dest;
    int result = -1;            /* guilty until proved innocent */
    Py_ssize_t min_gallop;

    assert(ms && ssa.keys && ssb.keys && na > 0 && nb > 0);
    assert(ssa.keys + na == ssb.keys);
    /* Need temp room for all of A (the shorter run, per the contract). */
    if (MERGE_GETMEM(ms, na) < 0)
        return -1;
    /* Move A out of the way; from here on ssa refers to the temp copy and
     * dest to the start of the region being filled.
     */
    sortslice_memcpy(&ms->a, 0, &ssa, 0, na);
    dest = ssa;
    ssa = ms->a;

    /* First output element comes from B unconditionally. */
    sortslice_copy_incr(&dest, &ssb);
    --nb;
    if (nb == 0)
        goto Succeed;
    if (na == 1)
        goto CopyB;

    min_gallop = ms->min_gallop;
    for (;;) {
        Py_ssize_t acount = 0;          /* # of times A won in a row */
        Py_ssize_t bcount = 0;          /* # of times B won in a row */

        /* Do the straightforward thing until (if ever) one run
         * appears to win consistently.
         */
        for (;;) {
            assert(na > 1 && nb > 0);
            /* k > 0: B's head is smaller; k == 0: take from A (keeps the
             * merge stable on ties); k < 0: the comparison failed.
             */
            k = ISLT(ssb.keys[0], ssa.keys[0]);
            if (k) {
                if (k < 0)
                    goto Fail;
                sortslice_copy_incr(&dest, &ssb);
                ++bcount;
                acount = 0;
                --nb;
                if (nb == 0)
                    goto Succeed;
                if (bcount >= min_gallop)
                    break;
            }
            else {
                sortslice_copy_incr(&dest, &ssa);
                ++acount;
                bcount = 0;
                --na;
                if (na == 1)
                    goto CopyB;
                if (acount >= min_gallop)
                    break;
            }
        }

        /* One run is winning so consistently that galloping may
         * be a huge win.  So try that, and continue galloping until
         * (if ever) neither run appears to be winning consistently
         * anymore.
         */
        ++min_gallop;
        do {
            assert(na > 1 && nb > 0);
            /* Each trip through galloping mode makes it cheaper to enter
             * again, but the threshold never drops below 1.
             */
            min_gallop -= min_gallop > 1;
            ms->min_gallop = min_gallop;
            /* How many leading elements of A go before B's head? */
            k = gallop_right(ms, ssb.keys[0], ssa.keys, na, 0);
            acount = k;
            if (k) {
                if (k < 0)
                    goto Fail;
                /* Source is the temp area, so a plain memcpy is used. */
                sortslice_memcpy(&dest, 0, &ssa, 0, k);
                sortslice_advance(&dest, k);
                sortslice_advance(&ssa, k);
                na -= k;
                if (na == 1)
                    goto CopyB;
                /* na==0 is impossible now if the comparison
                 * function is consistent, but we can't assume
                 * that it is.
                 */
                if (na == 0)
                    goto Succeed;
            }
            sortslice_copy_incr(&dest, &ssb);
            --nb;
            if (nb == 0)
                goto Succeed;

            /* How many leading elements of B go before A's head? */
            k = gallop_left(ms, ssa.keys[0], ssb.keys, nb, 0);
            bcount = k;
            if (k) {
                if (k < 0)
                    goto Fail;
                /* dest and ssb lie in the same array here, hence memmove
                 * rather than memcpy.
                 */
                sortslice_memmove(&dest, 0, &ssb, 0, k);
                sortslice_advance(&dest, k);
                sortslice_advance(&ssb, k);
                nb -= k;
                if (nb == 0)
                    goto Succeed;
            }
            sortslice_copy_incr(&dest, &ssa);
            --na;
            if (na == 1)
                goto CopyB;
        } while (acount >= MIN_GALLOP || bcount >= MIN_GALLOP);
        ++min_gallop;           /* penalize it for leaving galloping mode */
        ms->min_gallop = min_gallop;
    }
Succeed:
    result = 0;
    /* Falls through: whatever is left of A must be copied back either way. */
Fail:
    if (na)
        sortslice_memcpy(&dest, 0, &ssa, 0, na);
    return result;
CopyB:
    assert(na == 1 && nb > 0);
    /* The last element of ssa belongs at the end of the merge. */
    sortslice_memmove(&dest, 0, &ssb, 0, nb);
    sortslice_copy(&dest, nb, &ssa, 0);
    return 0;
}
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001683
/* Merge the na elements starting at ssa with the nb elements starting at
 * ssb.keys = ssa.keys + na in a stable way, in-place.  na and nb must be > 0.
 * Must also have that ssa.keys[na-1] belongs at the end of the merge, and
 * should have na >= nb.  See listsort.txt for more info.  Return 0 if
 * successful, -1 if error.
 *
 * Outline: this is the mirror image of merge_lo().  Run B is copied into the
 * temp area (ms->a) and the merge proceeds right to left, writing through
 * 'dest' starting at the last slot B used to occupy.  The very first element
 * written is the last element of A, taken without a comparison (that is the
 * precondition stated above).
 *
 * On a comparison error (ISLT or a gallop returning < 0) the elements of B
 * still sitting in the temp area are copied back before returning, so no
 * element is dropped from the destination.
 */
static Py_ssize_t
merge_hi(MergeState *ms, sortslice ssa, Py_ssize_t na,
         sortslice ssb, Py_ssize_t nb)
{
    Py_ssize_t k;
    sortslice dest, basea, baseb;
    int result = -1;            /* guilty until proved innocent */
    Py_ssize_t min_gallop;

    assert(ms && ssa.keys && ssb.keys && na > 0 && nb > 0);
    assert(ssa.keys + na == ssb.keys);
    /* Need temp room for all of B (the shorter run, per the contract). */
    if (MERGE_GETMEM(ms, nb) < 0)
        return -1;
    /* dest starts at the last slot of B's original location. */
    dest = ssb;
    sortslice_advance(&dest, nb-1);
    sortslice_memcpy(&ms->a, 0, &ssb, 0, nb);
    /* basea/baseb remember where each run starts; ssa/ssb are moved to the
     * LAST element of their run and walk backwards from there.
     */
    basea = ssa;
    baseb = ms->a;
    ssb.keys = ms->a.keys + nb - 1;
    if (ssb.values != NULL)
        ssb.values = ms->a.values + nb - 1;
    sortslice_advance(&ssa, na - 1);

    /* Last output element comes from A unconditionally. */
    sortslice_copy_decr(&dest, &ssa);
    --na;
    if (na == 0)
        goto Succeed;
    if (nb == 1)
        goto CopyA;

    min_gallop = ms->min_gallop;
    for (;;) {
        Py_ssize_t acount = 0;          /* # of times A won in a row */
        Py_ssize_t bcount = 0;          /* # of times B won in a row */

        /* Do the straightforward thing until (if ever) one run
         * appears to win consistently.
         */
        for (;;) {
            assert(na > 0 && nb > 1);
            /* k > 0: B's tail is smaller, so A's tail is output next;
             * k == 0: take from B (keeps the merge stable on ties);
             * k < 0: the comparison failed.
             */
            k = ISLT(ssb.keys[0], ssa.keys[0]);
            if (k) {
                if (k < 0)
                    goto Fail;
                sortslice_copy_decr(&dest, &ssa);
                ++acount;
                bcount = 0;
                --na;
                if (na == 0)
                    goto Succeed;
                if (acount >= min_gallop)
                    break;
            }
            else {
                sortslice_copy_decr(&dest, &ssb);
                ++bcount;
                acount = 0;
                --nb;
                if (nb == 1)
                    goto CopyA;
                if (bcount >= min_gallop)
                    break;
            }
        }

        /* One run is winning so consistently that galloping may
         * be a huge win.  So try that, and continue galloping until
         * (if ever) neither run appears to be winning consistently
         * anymore.
         */
        ++min_gallop;
        do {
            assert(na > 0 && nb > 1);
            /* Each trip through galloping mode makes it cheaper to enter
             * again, but the threshold never drops below 1.
             */
            min_gallop -= min_gallop > 1;
            ms->min_gallop = min_gallop;
            /* Search the remaining na elements of A (from its base, with
             * the hint at the right end) for B's current tail.
             */
            k = gallop_right(ms, ssb.keys[0], basea.keys, na, na-1);
            if (k < 0)
                goto Fail;
            /* Convert the position into the count of trailing A elements
             * that sort after B's tail.
             */
            k = na - k;
            acount = k;
            if (k) {
                sortslice_advance(&dest, -k);
                sortslice_advance(&ssa, -k);
                /* dest and ssa lie in the same array here, hence memmove
                 * rather than memcpy.
                 */
                sortslice_memmove(&dest, 1, &ssa, 1, k);
                na -= k;
                if (na == 0)
                    goto Succeed;
            }
            sortslice_copy_decr(&dest, &ssb);
            --nb;
            if (nb == 1)
                goto CopyA;

            /* Search the remaining nb elements of B (in the temp area) for
             * A's current tail.
             */
            k = gallop_left(ms, ssa.keys[0], baseb.keys, nb, nb-1);
            if (k < 0)
                goto Fail;
            /* Count of trailing B elements that go after A's tail. */
            k = nb - k;
            bcount = k;
            if (k) {
                sortslice_advance(&dest, -k);
                sortslice_advance(&ssb, -k);
                /* Source is the temp area, so a plain memcpy is used. */
                sortslice_memcpy(&dest, 1, &ssb, 1, k);
                nb -= k;
                if (nb == 1)
                    goto CopyA;
                /* nb==0 is impossible now if the comparison
                 * function is consistent, but we can't assume
                 * that it is.
                 */
                if (nb == 0)
                    goto Succeed;
            }
            sortslice_copy_decr(&dest, &ssa);
            --na;
            if (na == 0)
                goto Succeed;
        } while (acount >= MIN_GALLOP || bcount >= MIN_GALLOP);
        ++min_gallop;           /* penalize it for leaving galloping mode */
        ms->min_gallop = min_gallop;
    }
Succeed:
    result = 0;
    /* Falls through: whatever is left of B must be copied back either way. */
Fail:
    if (nb)
        sortslice_memcpy(&dest, -(nb-1), &baseb, 0, nb);
    return result;
CopyA:
    assert(nb == 1 && na > 0);
    /* The first element of ssb belongs at the front of the merge. */
    sortslice_memmove(&dest, 1-na, &ssa, 1-na, na);
    sortslice_advance(&dest, -na);
    sortslice_advance(&ssa, -na);
    sortslice_copy(&dest, 0, &ssb, 0);
    return 0;
}
1825
1826/* Merge the two runs at stack indices i and i+1.
1827 * Returns 0 on success, -1 on error.
1828 */
Martin v. Löwis18e16552006-02-15 17:27:45 +00001829static Py_ssize_t
1830merge_at(MergeState *ms, Py_ssize_t i)
Tim Petersa64dc242002-08-01 02:13:36 +00001831{
Daniel Stutzbach98338222010-12-02 21:55:33 +00001832 sortslice ssa, ssb;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001833 Py_ssize_t na, nb;
1834 Py_ssize_t k;
Tim Petersa64dc242002-08-01 02:13:36 +00001835
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001836 assert(ms != NULL);
1837 assert(ms->n >= 2);
1838 assert(i >= 0);
1839 assert(i == ms->n - 2 || i == ms->n - 3);
Tim Petersa64dc242002-08-01 02:13:36 +00001840
Daniel Stutzbach98338222010-12-02 21:55:33 +00001841 ssa = ms->pending[i].base;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001842 na = ms->pending[i].len;
Daniel Stutzbach98338222010-12-02 21:55:33 +00001843 ssb = ms->pending[i+1].base;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001844 nb = ms->pending[i+1].len;
1845 assert(na > 0 && nb > 0);
Daniel Stutzbach98338222010-12-02 21:55:33 +00001846 assert(ssa.keys + na == ssb.keys);
Tim Petersa64dc242002-08-01 02:13:36 +00001847
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001848 /* Record the length of the combined runs; if i is the 3rd-last
1849 * run now, also slide over the last run (which isn't involved
1850 * in this merge). The current run i+1 goes away in any case.
1851 */
1852 ms->pending[i].len = na + nb;
1853 if (i == ms->n - 3)
1854 ms->pending[i+1] = ms->pending[i+2];
1855 --ms->n;
Tim Petersa64dc242002-08-01 02:13:36 +00001856
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001857 /* Where does b start in a? Elements in a before that can be
1858 * ignored (already in place).
1859 */
embg1e34da42018-01-28 20:03:23 -07001860 k = gallop_right(ms, *ssb.keys, ssa.keys, na, 0);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001861 if (k < 0)
1862 return -1;
Daniel Stutzbach98338222010-12-02 21:55:33 +00001863 sortslice_advance(&ssa, k);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001864 na -= k;
1865 if (na == 0)
1866 return 0;
Tim Petersa64dc242002-08-01 02:13:36 +00001867
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001868 /* Where does a end in b? Elements in b after that can be
1869 * ignored (already in place).
1870 */
embg1e34da42018-01-28 20:03:23 -07001871 nb = gallop_left(ms, ssa.keys[na-1], ssb.keys, nb, nb-1);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001872 if (nb <= 0)
1873 return nb;
Tim Petersa64dc242002-08-01 02:13:36 +00001874
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001875 /* Merge what remains of the runs, using a temp array with
1876 * min(na, nb) elements.
1877 */
1878 if (na <= nb)
Daniel Stutzbach98338222010-12-02 21:55:33 +00001879 return merge_lo(ms, ssa, na, ssb, nb);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001880 else
Daniel Stutzbach98338222010-12-02 21:55:33 +00001881 return merge_hi(ms, ssa, na, ssb, nb);
Tim Petersa64dc242002-08-01 02:13:36 +00001882}
1883
1884/* Examine the stack of runs waiting to be merged, merging adjacent runs
1885 * until the stack invariants are re-established:
1886 *
1887 * 1. len[-3] > len[-2] + len[-1]
1888 * 2. len[-2] > len[-1]
1889 *
1890 * See listsort.txt for more info.
1891 *
1892 * Returns 0 on success, -1 on error.
1893 */
1894static int
1895merge_collapse(MergeState *ms)
1896{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001897 struct s_slice *p = ms->pending;
Tim Petersa64dc242002-08-01 02:13:36 +00001898
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001899 assert(ms);
1900 while (ms->n > 1) {
1901 Py_ssize_t n = ms->n - 2;
Benjamin Petersonb808d592015-02-25 10:12:26 -05001902 if ((n > 0 && p[n-1].len <= p[n].len + p[n+1].len) ||
1903 (n > 1 && p[n-2].len <= p[n-1].len + p[n].len)) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001904 if (p[n-1].len < p[n+1].len)
1905 --n;
1906 if (merge_at(ms, n) < 0)
1907 return -1;
1908 }
1909 else if (p[n].len <= p[n+1].len) {
embg1e34da42018-01-28 20:03:23 -07001910 if (merge_at(ms, n) < 0)
1911 return -1;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001912 }
1913 else
1914 break;
1915 }
1916 return 0;
Tim Petersa64dc242002-08-01 02:13:36 +00001917}
1918
1919/* Regardless of invariants, merge all runs on the stack until only one
1920 * remains. This is used at the end of the mergesort.
1921 *
1922 * Returns 0 on success, -1 on error.
1923 */
1924static int
1925merge_force_collapse(MergeState *ms)
1926{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001927 struct s_slice *p = ms->pending;
Tim Petersa64dc242002-08-01 02:13:36 +00001928
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001929 assert(ms);
1930 while (ms->n > 1) {
1931 Py_ssize_t n = ms->n - 2;
1932 if (n > 0 && p[n-1].len < p[n+1].len)
1933 --n;
1934 if (merge_at(ms, n) < 0)
1935 return -1;
1936 }
1937 return 0;
Tim Petersa64dc242002-08-01 02:13:36 +00001938}
1939
1940/* Compute a good value for the minimum run length; natural runs shorter
1941 * than this are boosted artificially via binary insertion.
1942 *
1943 * If n < 64, return n (it's too small to bother with fancy stuff).
1944 * Else if n is an exact power of 2, return 32.
1945 * Else return an int k, 32 <= k <= 64, such that n/k is close to, but
1946 * strictly less than, an exact power of 2.
1947 *
1948 * See listsort.txt for more info.
1949 */
Martin v. Löwis18e16552006-02-15 17:27:45 +00001950static Py_ssize_t
1951merge_compute_minrun(Py_ssize_t n)
Tim Petersa64dc242002-08-01 02:13:36 +00001952{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001953 Py_ssize_t r = 0; /* becomes 1 if any 1 bits are shifted off */
Tim Petersa64dc242002-08-01 02:13:36 +00001954
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001955 assert(n >= 0);
1956 while (n >= 64) {
1957 r |= n & 1;
1958 n >>= 1;
1959 }
1960 return n + r;
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001961}
Guido van Rossuma119c0d1998-05-29 17:56:32 +00001962
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00001963static void
Daniel Stutzbach98338222010-12-02 21:55:33 +00001964reverse_sortslice(sortslice *s, Py_ssize_t n)
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00001965{
Daniel Stutzbach98338222010-12-02 21:55:33 +00001966 reverse_slice(s->keys, &s->keys[n]);
1967 if (s->values != NULL)
1968 reverse_slice(s->values, &s->values[n]);
Raymond Hettinger42b1ba32003-10-16 03:41:09 +00001969}
1970
embg1e34da42018-01-28 20:03:23 -07001971/* Here we define custom comparison functions to optimize for the cases one commonly
1972 * encounters in practice: homogeneous lists, often of one of the basic types. */
1973
/* The comparison function and its helpers are selected in the pre-sort
 * check and stored in the MergeState (ms->key_compare, ms->key_richcompare
 * and ms->tuple_elem_compare). */
1976
1977/* These are the special case compare functions.
1978 * ms->key_compare will always point to one of these: */
1979
1980/* Heterogeneous compare: default, always safe to fall back on. */
1981static int
1982safe_object_compare(PyObject *v, PyObject *w, MergeState *ms)
1983{
1984 /* No assumptions necessary! */
1985 return PyObject_RichCompareBool(v, w, Py_LT);
1986}
1987
1988/* Homogeneous compare: safe for any two compareable objects of the same type.
1989 * (ms->key_richcompare is set to ob_type->tp_richcompare in the
1990 * pre-sort check.)
1991 */
1992static int
1993unsafe_object_compare(PyObject *v, PyObject *w, MergeState *ms)
1994{
1995 PyObject *res_obj; int res;
1996
1997 /* No assumptions, because we check first: */
1998 if (v->ob_type->tp_richcompare != ms->key_richcompare)
1999 return PyObject_RichCompareBool(v, w, Py_LT);
2000
2001 assert(ms->key_richcompare != NULL);
2002 res_obj = (*(ms->key_richcompare))(v, w, Py_LT);
2003
2004 if (res_obj == Py_NotImplemented) {
2005 Py_DECREF(res_obj);
2006 return PyObject_RichCompareBool(v, w, Py_LT);
2007 }
2008 if (res_obj == NULL)
2009 return -1;
2010
2011 if (PyBool_Check(res_obj)) {
2012 res = (res_obj == Py_True);
2013 }
2014 else {
2015 res = PyObject_IsTrue(res_obj);
2016 }
2017 Py_DECREF(res_obj);
2018
2019 /* Note that we can't assert
2020 * res == PyObject_RichCompareBool(v, w, Py_LT);
2021 * because of evil compare functions like this:
2022 * lambda a, b: int(random.random() * 3) - 1)
2023 * (which is actually in test_sort.py) */
2024 return res;
2025}
2026
2027/* Latin string compare: safe for any two latin (one byte per char) strings. */
2028static int
2029unsafe_latin_compare(PyObject *v, PyObject *w, MergeState *ms)
2030{
Victor Stinner8017b802018-01-29 13:47:06 +01002031 Py_ssize_t len;
2032 int res;
embg1e34da42018-01-28 20:03:23 -07002033
2034 /* Modified from Objects/unicodeobject.c:unicode_compare, assuming: */
2035 assert(v->ob_type == w->ob_type);
2036 assert(v->ob_type == &PyUnicode_Type);
2037 assert(PyUnicode_KIND(v) == PyUnicode_KIND(w));
2038 assert(PyUnicode_KIND(v) == PyUnicode_1BYTE_KIND);
2039
2040 len = Py_MIN(PyUnicode_GET_LENGTH(v), PyUnicode_GET_LENGTH(w));
2041 res = memcmp(PyUnicode_DATA(v), PyUnicode_DATA(w), len);
2042
2043 res = (res != 0 ?
2044 res < 0 :
2045 PyUnicode_GET_LENGTH(v) < PyUnicode_GET_LENGTH(w));
2046
2047 assert(res == PyObject_RichCompareBool(v, w, Py_LT));;
2048 return res;
2049}
2050
2051/* Bounded int compare: compare any two longs that fit in a single machine word. */
2052static int
2053unsafe_long_compare(PyObject *v, PyObject *w, MergeState *ms)
2054{
2055 PyLongObject *vl, *wl; sdigit v0, w0; int res;
2056
2057 /* Modified from Objects/longobject.c:long_compare, assuming: */
2058 assert(v->ob_type == w->ob_type);
2059 assert(v->ob_type == &PyLong_Type);
2060 assert(Py_ABS(Py_SIZE(v)) <= 1);
2061 assert(Py_ABS(Py_SIZE(w)) <= 1);
2062
2063 vl = (PyLongObject*)v;
2064 wl = (PyLongObject*)w;
2065
2066 v0 = Py_SIZE(vl) == 0 ? 0 : (sdigit)vl->ob_digit[0];
2067 w0 = Py_SIZE(wl) == 0 ? 0 : (sdigit)wl->ob_digit[0];
2068
2069 if (Py_SIZE(vl) < 0)
2070 v0 = -v0;
2071 if (Py_SIZE(wl) < 0)
2072 w0 = -w0;
2073
2074 res = v0 < w0;
2075 assert(res == PyObject_RichCompareBool(v, w, Py_LT));
2076 return res;
2077}
2078
2079/* Float compare: compare any two floats. */
2080static int
2081unsafe_float_compare(PyObject *v, PyObject *w, MergeState *ms)
2082{
2083 int res;
2084
2085 /* Modified from Objects/floatobject.c:float_richcompare, assuming: */
2086 assert(v->ob_type == w->ob_type);
2087 assert(v->ob_type == &PyFloat_Type);
2088
2089 res = PyFloat_AS_DOUBLE(v) < PyFloat_AS_DOUBLE(w);
2090 assert(res == PyObject_RichCompareBool(v, w, Py_LT));
2091 return res;
2092}
2093
2094/* Tuple compare: compare *any* two tuples, using
2095 * ms->tuple_elem_compare to compare the first elements, which is set
2096 * using the same pre-sort check as we use for ms->key_compare,
2097 * but run on the list [x[0] for x in L]. This allows us to optimize compares
2098 * on two levels (as long as [x[0] for x in L] is type-homogeneous.) The idea is
2099 * that most tuple compares don't involve x[1:]. */
2100static int
2101unsafe_tuple_compare(PyObject *v, PyObject *w, MergeState *ms)
2102{
2103 PyTupleObject *vt, *wt;
2104 Py_ssize_t i, vlen, wlen;
2105 int k;
2106
2107 /* Modified from Objects/tupleobject.c:tuplerichcompare, assuming: */
2108 assert(v->ob_type == w->ob_type);
2109 assert(v->ob_type == &PyTuple_Type);
2110 assert(Py_SIZE(v) > 0);
2111 assert(Py_SIZE(w) > 0);
2112
2113 vt = (PyTupleObject *)v;
2114 wt = (PyTupleObject *)w;
2115
2116 vlen = Py_SIZE(vt);
2117 wlen = Py_SIZE(wt);
2118
2119 for (i = 0; i < vlen && i < wlen; i++) {
2120 k = PyObject_RichCompareBool(vt->ob_item[i], wt->ob_item[i], Py_EQ);
2121 if (k < 0)
2122 return -1;
2123 if (!k)
2124 break;
2125 }
2126
2127 if (i >= vlen || i >= wlen)
2128 return vlen < wlen;
2129
2130 if (i == 0)
2131 return ms->tuple_elem_compare(vt->ob_item[i], wt->ob_item[i], ms);
2132 else
2133 return PyObject_RichCompareBool(vt->ob_item[i], wt->ob_item[i], Py_LT);
2134}
2135
Tim Petersa64dc242002-08-01 02:13:36 +00002136/* An adaptive, stable, natural mergesort. See listsort.txt.
2137 * Returns Py_None on success, NULL on error. Even in case of error, the
2138 * list will be some permutation of its input state (nothing is lost or
2139 * duplicated).
2140 */
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002141/*[clinic input]
2142list.sort
2143
2144 *
2145 key as keyfunc: object = None
Serhiy Storchaka202fda52017-03-12 10:10:47 +02002146 reverse: bool(accept={int}) = False
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002147
2148Stable sort *IN PLACE*.
2149[clinic start generated code]*/
2150
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002151static PyObject *
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002152list_sort_impl(PyListObject *self, PyObject *keyfunc, int reverse)
Serhiy Storchaka202fda52017-03-12 10:10:47 +02002153/*[clinic end generated code: output=57b9f9c5e23fbe42 input=b0fcf743982c5b90]*/
Guido van Rossum3f236de1996-12-10 23:55:39 +00002154{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002155 MergeState ms;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002156 Py_ssize_t nremaining;
2157 Py_ssize_t minrun;
Daniel Stutzbach98338222010-12-02 21:55:33 +00002158 sortslice lo;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002159 Py_ssize_t saved_ob_size, saved_allocated;
2160 PyObject **saved_ob_item;
2161 PyObject **final_ob_item;
2162 PyObject *result = NULL; /* guilty until proved innocent */
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002163 Py_ssize_t i;
Daniel Stutzbach98338222010-12-02 21:55:33 +00002164 PyObject **keys;
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00002165
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002166 assert(self != NULL);
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002167 assert(PyList_Check(self));
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002168 if (keyfunc == Py_None)
2169 keyfunc = NULL;
Raymond Hettinger42b1ba32003-10-16 03:41:09 +00002170
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002171 /* The list is temporarily made empty, so that mutations performed
2172 * by comparison functions can't affect the slice of memory we're
2173 * sorting (allowing mutations during sorting is a core-dump
2174 * factory, since ob_item may change).
2175 */
2176 saved_ob_size = Py_SIZE(self);
2177 saved_ob_item = self->ob_item;
2178 saved_allocated = self->allocated;
2179 Py_SIZE(self) = 0;
2180 self->ob_item = NULL;
2181 self->allocated = -1; /* any operation will reset it to >= 0 */
Tim Peters330f9e92002-07-19 07:05:44 +00002182
Daniel Stutzbach98338222010-12-02 21:55:33 +00002183 if (keyfunc == NULL) {
2184 keys = NULL;
2185 lo.keys = saved_ob_item;
2186 lo.values = NULL;
2187 }
2188 else {
2189 if (saved_ob_size < MERGESTATE_TEMP_SIZE/2)
2190 /* Leverage stack space we allocated but won't otherwise use */
2191 keys = &ms.temparray[saved_ob_size+1];
2192 else {
2193 keys = PyMem_MALLOC(sizeof(PyObject *) * saved_ob_size);
Benjamin Peterson0823ffb2015-04-23 17:04:36 -04002194 if (keys == NULL) {
2195 PyErr_NoMemory();
2196 goto keyfunc_fail;
2197 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002198 }
Daniel Stutzbach98338222010-12-02 21:55:33 +00002199
2200 for (i = 0; i < saved_ob_size ; i++) {
Victor Stinnerde4ae3d2016-12-04 22:59:09 +01002201 keys[i] = PyObject_CallFunctionObjArgs(keyfunc, saved_ob_item[i],
2202 NULL);
Daniel Stutzbach98338222010-12-02 21:55:33 +00002203 if (keys[i] == NULL) {
2204 for (i=i-1 ; i>=0 ; i--)
2205 Py_DECREF(keys[i]);
Benjamin Peterson4a42cd42014-03-15 12:21:28 -05002206 if (saved_ob_size >= MERGESTATE_TEMP_SIZE/2)
Daniel Stutzbach8eda5f72011-03-02 23:37:50 +00002207 PyMem_FREE(keys);
Daniel Stutzbach98338222010-12-02 21:55:33 +00002208 goto keyfunc_fail;
2209 }
2210 }
2211
2212 lo.keys = keys;
2213 lo.values = saved_ob_item;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002214 }
Michael W. Hudson1df0f652003-12-04 11:25:46 +00002215
embg1e34da42018-01-28 20:03:23 -07002216
2217 /* The pre-sort check: here's where we decide which compare function to use.
2218 * How much optimization is safe? We test for homogeneity with respect to
2219 * several properties that are expensive to check at compare-time, and
2220 * set ms appropriately. */
2221 if (saved_ob_size > 1) {
2222 /* Assume the first element is representative of the whole list. */
2223 int keys_are_in_tuples = (lo.keys[0]->ob_type == &PyTuple_Type &&
2224 Py_SIZE(lo.keys[0]) > 0);
2225
2226 PyTypeObject* key_type = (keys_are_in_tuples ?
2227 PyTuple_GET_ITEM(lo.keys[0], 0)->ob_type :
2228 lo.keys[0]->ob_type);
2229
2230 int keys_are_all_same_type = 1;
2231 int strings_are_latin = 1;
2232 int ints_are_bounded = 1;
2233
2234 /* Prove that assumption by checking every key. */
embg1e34da42018-01-28 20:03:23 -07002235 for (i=0; i < saved_ob_size; i++) {
2236
2237 if (keys_are_in_tuples &&
2238 !(lo.keys[i]->ob_type == &PyTuple_Type && Py_SIZE(lo.keys[i]) != 0)) {
2239 keys_are_in_tuples = 0;
2240 keys_are_all_same_type = 0;
2241 break;
2242 }
2243
2244 /* Note: for lists of tuples, key is the first element of the tuple
2245 * lo.keys[i], not lo.keys[i] itself! We verify type-homogeneity
2246 * for lists of tuples in the if-statement directly above. */
2247 PyObject *key = (keys_are_in_tuples ?
2248 PyTuple_GET_ITEM(lo.keys[i], 0) :
2249 lo.keys[i]);
2250
2251 if (key->ob_type != key_type) {
2252 keys_are_all_same_type = 0;
Miss Islington (bot)9dbb09f2019-03-25 00:47:55 -07002253 /* If keys are in tuple we must loop over the whole list to make
2254 sure all items are tuples */
2255 if (!keys_are_in_tuples) {
2256 break;
2257 }
embg1e34da42018-01-28 20:03:23 -07002258 }
2259
Miss Islington (bot)9dbb09f2019-03-25 00:47:55 -07002260 if (keys_are_all_same_type) {
2261 if (key_type == &PyLong_Type &&
2262 ints_are_bounded &&
2263 Py_ABS(Py_SIZE(key)) > 1) {
2264
embg1e34da42018-01-28 20:03:23 -07002265 ints_are_bounded = 0;
Miss Islington (bot)9dbb09f2019-03-25 00:47:55 -07002266 }
2267 else if (key_type == &PyUnicode_Type &&
2268 strings_are_latin &&
2269 PyUnicode_KIND(key) != PyUnicode_1BYTE_KIND) {
2270
2271 strings_are_latin = 0;
2272 }
2273 }
embg1e34da42018-01-28 20:03:23 -07002274 }
embg1e34da42018-01-28 20:03:23 -07002275
2276 /* Choose the best compare, given what we now know about the keys. */
2277 if (keys_are_all_same_type) {
2278
2279 if (key_type == &PyUnicode_Type && strings_are_latin) {
2280 ms.key_compare = unsafe_latin_compare;
2281 }
2282 else if (key_type == &PyLong_Type && ints_are_bounded) {
2283 ms.key_compare = unsafe_long_compare;
2284 }
2285 else if (key_type == &PyFloat_Type) {
2286 ms.key_compare = unsafe_float_compare;
2287 }
2288 else if ((ms.key_richcompare = key_type->tp_richcompare) != NULL) {
2289 ms.key_compare = unsafe_object_compare;
2290 }
Miss Islington (bot)0e73ea22019-02-21 00:05:22 -08002291 else {
2292 ms.key_compare = safe_object_compare;
2293 }
embg1e34da42018-01-28 20:03:23 -07002294 }
2295 else {
2296 ms.key_compare = safe_object_compare;
2297 }
2298
2299 if (keys_are_in_tuples) {
2300 /* Make sure we're not dealing with tuples of tuples
2301 * (remember: here, key_type refers list [key[0] for key in keys]) */
Miss Islington (bot)9dbb09f2019-03-25 00:47:55 -07002302 if (key_type == &PyTuple_Type) {
embg1e34da42018-01-28 20:03:23 -07002303 ms.tuple_elem_compare = safe_object_compare;
Miss Islington (bot)9dbb09f2019-03-25 00:47:55 -07002304 }
2305 else {
embg1e34da42018-01-28 20:03:23 -07002306 ms.tuple_elem_compare = ms.key_compare;
Miss Islington (bot)9dbb09f2019-03-25 00:47:55 -07002307 }
embg1e34da42018-01-28 20:03:23 -07002308
2309 ms.key_compare = unsafe_tuple_compare;
2310 }
2311 }
2312 /* End of pre-sort check: ms is now set properly! */
2313
Daniel Stutzbach98338222010-12-02 21:55:33 +00002314 merge_init(&ms, saved_ob_size, keys != NULL);
Michael W. Hudson1df0f652003-12-04 11:25:46 +00002315
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002316 nremaining = saved_ob_size;
2317 if (nremaining < 2)
2318 goto succeed;
Tim Peters330f9e92002-07-19 07:05:44 +00002319
Benjamin Peterson05380642010-08-23 19:35:39 +00002320 /* Reverse sort stability achieved by initially reversing the list,
2321 applying a stable forward sort, then reversing the final result. */
Daniel Stutzbach98338222010-12-02 21:55:33 +00002322 if (reverse) {
2323 if (keys != NULL)
2324 reverse_slice(&keys[0], &keys[saved_ob_size]);
2325 reverse_slice(&saved_ob_item[0], &saved_ob_item[saved_ob_size]);
2326 }
Benjamin Peterson05380642010-08-23 19:35:39 +00002327
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002328 /* March over the array once, left to right, finding natural runs,
2329 * and extending short natural runs to minrun elements.
2330 */
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002331 minrun = merge_compute_minrun(nremaining);
2332 do {
2333 int descending;
2334 Py_ssize_t n;
Tim Peters330f9e92002-07-19 07:05:44 +00002335
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002336 /* Identify next run. */
embg1e34da42018-01-28 20:03:23 -07002337 n = count_run(&ms, lo.keys, lo.keys + nremaining, &descending);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002338 if (n < 0)
2339 goto fail;
2340 if (descending)
Daniel Stutzbach98338222010-12-02 21:55:33 +00002341 reverse_sortslice(&lo, n);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002342 /* If short, extend to min(minrun, nremaining). */
2343 if (n < minrun) {
2344 const Py_ssize_t force = nremaining <= minrun ?
2345 nremaining : minrun;
embg1e34da42018-01-28 20:03:23 -07002346 if (binarysort(&ms, lo, lo.keys + force, lo.keys + n) < 0)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002347 goto fail;
2348 n = force;
2349 }
2350 /* Push run onto pending-runs stack, and maybe merge. */
2351 assert(ms.n < MAX_MERGE_PENDING);
2352 ms.pending[ms.n].base = lo;
2353 ms.pending[ms.n].len = n;
2354 ++ms.n;
2355 if (merge_collapse(&ms) < 0)
2356 goto fail;
2357 /* Advance to find next run. */
Daniel Stutzbach98338222010-12-02 21:55:33 +00002358 sortslice_advance(&lo, n);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002359 nremaining -= n;
2360 } while (nremaining);
Tim Peters330f9e92002-07-19 07:05:44 +00002361
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002362 if (merge_force_collapse(&ms) < 0)
2363 goto fail;
2364 assert(ms.n == 1);
Daniel Stutzbach98338222010-12-02 21:55:33 +00002365 assert(keys == NULL
2366 ? ms.pending[0].base.keys == saved_ob_item
2367 : ms.pending[0].base.keys == &keys[0]);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002368 assert(ms.pending[0].len == saved_ob_size);
Daniel Stutzbach98338222010-12-02 21:55:33 +00002369 lo = ms.pending[0].base;
Tim Petersa64dc242002-08-01 02:13:36 +00002370
2371succeed:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002372 result = Py_None;
Tim Peters330f9e92002-07-19 07:05:44 +00002373fail:
Daniel Stutzbach98338222010-12-02 21:55:33 +00002374 if (keys != NULL) {
2375 for (i = 0; i < saved_ob_size; i++)
2376 Py_DECREF(keys[i]);
Benjamin Petersonef87f8c2014-03-14 21:54:31 -05002377 if (saved_ob_size >= MERGESTATE_TEMP_SIZE/2)
Daniel Stutzbach98338222010-12-02 21:55:33 +00002378 PyMem_FREE(keys);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002379 }
Michael W. Hudson1df0f652003-12-04 11:25:46 +00002380
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002381 if (self->allocated != -1 && result != NULL) {
2382 /* The user mucked with the list during the sort,
2383 * and we don't already have another error to report.
2384 */
2385 PyErr_SetString(PyExc_ValueError, "list modified during sort");
2386 result = NULL;
2387 }
Michael W. Hudson1df0f652003-12-04 11:25:46 +00002388
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002389 if (reverse && saved_ob_size > 1)
2390 reverse_slice(saved_ob_item, saved_ob_item + saved_ob_size);
Michael W. Hudson1df0f652003-12-04 11:25:46 +00002391
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002392 merge_freemem(&ms);
Michael W. Hudson1df0f652003-12-04 11:25:46 +00002393
Daniel Stutzbach98338222010-12-02 21:55:33 +00002394keyfunc_fail:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002395 final_ob_item = self->ob_item;
2396 i = Py_SIZE(self);
2397 Py_SIZE(self) = saved_ob_size;
2398 self->ob_item = saved_ob_item;
2399 self->allocated = saved_allocated;
2400 if (final_ob_item != NULL) {
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002401 /* we cannot use _list_clear() for this because it does not
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002402 guarantee that the list is really empty when it returns */
2403 while (--i >= 0) {
2404 Py_XDECREF(final_ob_item[i]);
2405 }
2406 PyMem_FREE(final_ob_item);
2407 }
2408 Py_XINCREF(result);
2409 return result;
Guido van Rossum3f236de1996-12-10 23:55:39 +00002410}
Tim Peters330f9e92002-07-19 07:05:44 +00002411#undef IFLT
Tim Peters66860f62002-08-04 17:47:26 +00002412#undef ISLT
Tim Peters330f9e92002-07-19 07:05:44 +00002413
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00002414int
Fred Drakea2f55112000-07-09 15:16:51 +00002415PyList_Sort(PyObject *v)
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00002416{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002417 if (v == NULL || !PyList_Check(v)) {
2418 PyErr_BadInternalCall();
2419 return -1;
2420 }
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002421 v = list_sort_impl((PyListObject *)v, NULL, 0);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002422 if (v == NULL)
2423 return -1;
2424 Py_DECREF(v);
2425 return 0;
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00002426}
2427
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002428/*[clinic input]
2429list.reverse
2430
2431Reverse *IN PLACE*.
2432[clinic start generated code]*/
2433
Guido van Rossumb86c5492001-02-12 22:06:02 +00002434static PyObject *
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002435list_reverse_impl(PyListObject *self)
2436/*[clinic end generated code: output=482544fc451abea9 input=eefd4c3ae1bc9887]*/
Guido van Rossumb86c5492001-02-12 22:06:02 +00002437{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002438 if (Py_SIZE(self) > 1)
2439 reverse_slice(self->ob_item, self->ob_item + Py_SIZE(self));
2440 Py_RETURN_NONE;
Guido van Rossumed98d481991-03-06 13:07:53 +00002441}
2442
Guido van Rossum84c76f51990-10-30 13:32:20 +00002443int
Fred Drakea2f55112000-07-09 15:16:51 +00002444PyList_Reverse(PyObject *v)
Guido van Rossumb0fe3a91995-01-17 16:34:45 +00002445{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002446 PyListObject *self = (PyListObject *)v;
Tim Peters6063e262002-08-08 01:06:39 +00002447
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002448 if (v == NULL || !PyList_Check(v)) {
2449 PyErr_BadInternalCall();
2450 return -1;
2451 }
2452 if (Py_SIZE(self) > 1)
2453 reverse_slice(self->ob_item, self->ob_item + Py_SIZE(self));
2454 return 0;
Guido van Rossumb0fe3a91995-01-17 16:34:45 +00002455}
2456
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002457PyObject *
Fred Drakea2f55112000-07-09 15:16:51 +00002458PyList_AsTuple(PyObject *v)
Guido van Rossum6cd2fe01994-08-29 12:45:32 +00002459{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002460 PyObject *w;
2461 PyObject **p, **q;
2462 Py_ssize_t n;
2463 if (v == NULL || !PyList_Check(v)) {
2464 PyErr_BadInternalCall();
2465 return NULL;
2466 }
2467 n = Py_SIZE(v);
2468 w = PyTuple_New(n);
2469 if (w == NULL)
2470 return NULL;
2471 p = ((PyTupleObject *)w)->ob_item;
2472 q = ((PyListObject *)v)->ob_item;
2473 while (--n >= 0) {
2474 Py_INCREF(*q);
2475 *p = *q;
2476 p++;
2477 q++;
2478 }
2479 return w;
Guido van Rossum6cd2fe01994-08-29 12:45:32 +00002480}
2481
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002482/*[clinic input]
2483list.index
Guido van Rossum4aa24f92000-02-24 15:23:03 +00002484
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002485 value: object
Serhiy Storchaka80ec8362017-03-19 19:37:40 +02002486 start: slice_index(accept={int}) = 0
2487 stop: slice_index(accept={int}, c_default="PY_SSIZE_T_MAX") = sys.maxsize
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002488 /
2489
2490Return first index of value.
2491
2492Raises ValueError if the value is not present.
2493[clinic start generated code]*/
2494
2495static PyObject *
2496list_index_impl(PyListObject *self, PyObject *value, Py_ssize_t start,
2497 Py_ssize_t stop)
Serhiy Storchaka80ec8362017-03-19 19:37:40 +02002498/*[clinic end generated code: output=ec51b88787e4e481 input=40ec5826303a0eb1]*/
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002499{
2500 Py_ssize_t i;
2501
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002502 if (start < 0) {
2503 start += Py_SIZE(self);
2504 if (start < 0)
2505 start = 0;
2506 }
2507 if (stop < 0) {
2508 stop += Py_SIZE(self);
2509 if (stop < 0)
2510 stop = 0;
2511 }
2512 for (i = start; i < stop && i < Py_SIZE(self); i++) {
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002513 int cmp = PyObject_RichCompareBool(self->ob_item[i], value, Py_EQ);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002514 if (cmp > 0)
2515 return PyLong_FromSsize_t(i);
2516 else if (cmp < 0)
2517 return NULL;
2518 }
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002519 PyErr_Format(PyExc_ValueError, "%R is not in list", value);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002520 return NULL;
Guido van Rossumed98d481991-03-06 13:07:53 +00002521}
2522
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002523/*[clinic input]
2524list.count
2525
2526 value: object
2527 /
2528
2529Return number of occurrences of value.
2530[clinic start generated code]*/
2531
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002532static PyObject *
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002533list_count(PyListObject *self, PyObject *value)
2534/*[clinic end generated code: output=b1f5d284205ae714 input=3bdc3a5e6f749565]*/
Guido van Rossume6f7d181991-10-20 20:20:40 +00002535{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002536 Py_ssize_t count = 0;
2537 Py_ssize_t i;
Guido van Rossum4aa24f92000-02-24 15:23:03 +00002538
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002539 for (i = 0; i < Py_SIZE(self); i++) {
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002540 int cmp = PyObject_RichCompareBool(self->ob_item[i], value, Py_EQ);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002541 if (cmp > 0)
2542 count++;
2543 else if (cmp < 0)
2544 return NULL;
2545 }
2546 return PyLong_FromSsize_t(count);
Guido van Rossume6f7d181991-10-20 20:20:40 +00002547}
2548
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002549/*[clinic input]
2550list.remove
2551
2552 value: object
2553 /
2554
2555Remove first occurrence of value.
2556
2557Raises ValueError if the value is not present.
2558[clinic start generated code]*/
2559
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002560static PyObject *
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002561list_remove(PyListObject *self, PyObject *value)
2562/*[clinic end generated code: output=f087e1951a5e30d1 input=2dc2ba5bb2fb1f82]*/
Guido van Rossumed98d481991-03-06 13:07:53 +00002563{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002564 Py_ssize_t i;
Guido van Rossum4aa24f92000-02-24 15:23:03 +00002565
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002566 for (i = 0; i < Py_SIZE(self); i++) {
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002567 int cmp = PyObject_RichCompareBool(self->ob_item[i], value, Py_EQ);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002568 if (cmp > 0) {
2569 if (list_ass_slice(self, i, i+1,
2570 (PyObject *)NULL) == 0)
2571 Py_RETURN_NONE;
2572 return NULL;
2573 }
2574 else if (cmp < 0)
2575 return NULL;
2576 }
2577 PyErr_SetString(PyExc_ValueError, "list.remove(x): x not in list");
2578 return NULL;
Guido van Rossumed98d481991-03-06 13:07:53 +00002579}
2580
Jeremy Hylton8caad492000-06-23 14:18:11 +00002581static int
2582list_traverse(PyListObject *o, visitproc visit, void *arg)
2583{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002584 Py_ssize_t i;
Jeremy Hylton8caad492000-06-23 14:18:11 +00002585
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002586 for (i = Py_SIZE(o); --i >= 0; )
2587 Py_VISIT(o->ob_item[i]);
2588 return 0;
Jeremy Hylton8caad492000-06-23 14:18:11 +00002589}
2590
Guido van Rossum65e1cea2001-01-17 22:11:59 +00002591static PyObject *
2592list_richcompare(PyObject *v, PyObject *w, int op)
2593{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002594 PyListObject *vl, *wl;
2595 Py_ssize_t i;
Guido van Rossum65e1cea2001-01-17 22:11:59 +00002596
Brian Curtindfc80e32011-08-10 20:28:54 -05002597 if (!PyList_Check(v) || !PyList_Check(w))
2598 Py_RETURN_NOTIMPLEMENTED;
Guido van Rossum65e1cea2001-01-17 22:11:59 +00002599
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002600 vl = (PyListObject *)v;
2601 wl = (PyListObject *)w;
Guido van Rossum65e1cea2001-01-17 22:11:59 +00002602
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002603 if (Py_SIZE(vl) != Py_SIZE(wl) && (op == Py_EQ || op == Py_NE)) {
2604 /* Shortcut: if the lengths differ, the lists differ */
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002605 if (op == Py_EQ)
stratakise8b19652017-11-02 11:32:54 +01002606 Py_RETURN_FALSE;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002607 else
stratakise8b19652017-11-02 11:32:54 +01002608 Py_RETURN_TRUE;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002609 }
Guido van Rossum65e1cea2001-01-17 22:11:59 +00002610
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002611 /* Search for the first index where items are different */
2612 for (i = 0; i < Py_SIZE(vl) && i < Py_SIZE(wl); i++) {
2613 int k = PyObject_RichCompareBool(vl->ob_item[i],
2614 wl->ob_item[i], Py_EQ);
2615 if (k < 0)
2616 return NULL;
2617 if (!k)
2618 break;
2619 }
Guido van Rossum65e1cea2001-01-17 22:11:59 +00002620
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002621 if (i >= Py_SIZE(vl) || i >= Py_SIZE(wl)) {
2622 /* No more items to compare -- compare sizes */
stratakise8b19652017-11-02 11:32:54 +01002623 Py_RETURN_RICHCOMPARE(Py_SIZE(vl), Py_SIZE(wl), op);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002624 }
Guido van Rossum65e1cea2001-01-17 22:11:59 +00002625
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002626 /* We have an item that differs -- shortcuts for EQ/NE */
2627 if (op == Py_EQ) {
Serhiy Storchaka228b12e2017-01-23 09:47:21 +02002628 Py_RETURN_FALSE;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002629 }
2630 if (op == Py_NE) {
Serhiy Storchaka228b12e2017-01-23 09:47:21 +02002631 Py_RETURN_TRUE;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002632 }
Guido van Rossum65e1cea2001-01-17 22:11:59 +00002633
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002634 /* Compare the final item again using the proper operator */
2635 return PyObject_RichCompare(vl->ob_item[i], wl->ob_item[i], op);
Guido van Rossum65e1cea2001-01-17 22:11:59 +00002636}
2637
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002638/*[clinic input]
2639list.__init__
2640
2641 iterable: object(c_default="NULL") = ()
2642 /
2643
2644Built-in mutable sequence.
2645
2646If no argument is given, the constructor creates a new empty list.
2647The argument must be an iterable if specified.
2648[clinic start generated code]*/
2649
Tim Peters6d6c1a32001-08-02 04:15:00 +00002650static int
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002651list___init___impl(PyListObject *self, PyObject *iterable)
2652/*[clinic end generated code: output=0f3c21379d01de48 input=b3f3fe7206af8f6b]*/
Tim Peters6d6c1a32001-08-02 04:15:00 +00002653{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002654 /* Verify list invariants established by PyType_GenericAlloc() */
2655 assert(0 <= Py_SIZE(self));
2656 assert(Py_SIZE(self) <= self->allocated || self->allocated == -1);
2657 assert(self->ob_item != NULL ||
2658 self->allocated == 0 || self->allocated == -1);
Raymond Hettingerc0aaa2d2004-07-29 23:31:29 +00002659
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002660 /* Empty previous contents */
2661 if (self->ob_item != NULL) {
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002662 (void)_list_clear(self);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002663 }
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002664 if (iterable != NULL) {
2665 PyObject *rv = list_extend(self, iterable);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002666 if (rv == NULL)
2667 return -1;
2668 Py_DECREF(rv);
2669 }
2670 return 0;
Tim Peters6d6c1a32001-08-02 04:15:00 +00002671}
2672
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002673/*[clinic input]
2674list.__sizeof__
2675
2676Return the size of the list in memory, in bytes.
2677[clinic start generated code]*/
2678
Martin v. Löwis00709aa2008-06-04 14:18:43 +00002679static PyObject *
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002680list___sizeof___impl(PyListObject *self)
2681/*[clinic end generated code: output=3417541f95f9a53e input=b8030a5d5ce8a187]*/
Martin v. Löwis00709aa2008-06-04 14:18:43 +00002682{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002683 Py_ssize_t res;
Martin v. Löwis00709aa2008-06-04 14:18:43 +00002684
Serhiy Storchaka5c4064e2015-12-19 20:05:25 +02002685 res = _PyObject_SIZE(Py_TYPE(self)) + self->allocated * sizeof(void*);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002686 return PyLong_FromSsize_t(res);
Martin v. Löwis00709aa2008-06-04 14:18:43 +00002687}
2688
Raymond Hettinger1021c442003-11-07 15:38:09 +00002689static PyObject *list_iter(PyObject *seq);
Raymond Hettinger8f5cdaa2003-12-13 11:26:12 +00002690static PyObject *list_subscript(PyListObject*, PyObject*);
2691
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002692static PyMethodDef list_methods[] = {
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002693 {"__getitem__", (PyCFunction)list_subscript, METH_O|METH_COEXIST, "x.__getitem__(y) <==> x[y]"},
2694 LIST___REVERSED___METHODDEF
2695 LIST___SIZEOF___METHODDEF
2696 LIST_CLEAR_METHODDEF
2697 LIST_COPY_METHODDEF
2698 LIST_APPEND_METHODDEF
2699 LIST_INSERT_METHODDEF
2700 LIST_EXTEND_METHODDEF
2701 LIST_POP_METHODDEF
2702 LIST_REMOVE_METHODDEF
2703 LIST_INDEX_METHODDEF
2704 LIST_COUNT_METHODDEF
2705 LIST_REVERSE_METHODDEF
2706 LIST_SORT_METHODDEF
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002707 {NULL, NULL} /* sentinel */
Guido van Rossum85a5fbb1990-10-14 12:07:46 +00002708};
2709
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002710static PySequenceMethods list_as_sequence = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002711 (lenfunc)list_length, /* sq_length */
2712 (binaryfunc)list_concat, /* sq_concat */
2713 (ssizeargfunc)list_repeat, /* sq_repeat */
2714 (ssizeargfunc)list_item, /* sq_item */
2715 0, /* sq_slice */
2716 (ssizeobjargproc)list_ass_item, /* sq_ass_item */
2717 0, /* sq_ass_slice */
2718 (objobjproc)list_contains, /* sq_contains */
2719 (binaryfunc)list_inplace_concat, /* sq_inplace_concat */
2720 (ssizeargfunc)list_inplace_repeat, /* sq_inplace_repeat */
Guido van Rossum85a5fbb1990-10-14 12:07:46 +00002721};
2722
Jeremy Hyltona4b4c3b2002-07-13 03:51:17 +00002723static PyObject *
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002724list_subscript(PyListObject* self, PyObject* item)
2725{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002726 if (PyIndex_Check(item)) {
2727 Py_ssize_t i;
2728 i = PyNumber_AsSsize_t(item, PyExc_IndexError);
2729 if (i == -1 && PyErr_Occurred())
2730 return NULL;
2731 if (i < 0)
2732 i += PyList_GET_SIZE(self);
2733 return list_item(self, i);
2734 }
2735 else if (PySlice_Check(item)) {
2736 Py_ssize_t start, stop, step, slicelength, cur, i;
2737 PyObject* result;
2738 PyObject* it;
2739 PyObject **src, **dest;
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002740
Serhiy Storchakab879fe82017-04-08 09:53:51 +03002741 if (PySlice_Unpack(item, &start, &stop, &step) < 0) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002742 return NULL;
2743 }
Serhiy Storchakab879fe82017-04-08 09:53:51 +03002744 slicelength = PySlice_AdjustIndices(Py_SIZE(self), &start, &stop,
2745 step);
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002746
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002747 if (slicelength <= 0) {
2748 return PyList_New(0);
2749 }
2750 else if (step == 1) {
2751 return list_slice(self, start, stop);
2752 }
2753 else {
2754 result = PyList_New(slicelength);
2755 if (!result) return NULL;
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002756
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002757 src = self->ob_item;
2758 dest = ((PyListObject *)result)->ob_item;
2759 for (cur = start, i = 0; i < slicelength;
Mark Dickinsonc7d93b72011-09-25 15:34:32 +01002760 cur += (size_t)step, i++) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002761 it = src[cur];
2762 Py_INCREF(it);
2763 dest[i] = it;
2764 }
Tim Peters3b01a122002-07-19 02:35:45 +00002765
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002766 return result;
2767 }
2768 }
2769 else {
2770 PyErr_Format(PyExc_TypeError,
Terry Jan Reedyffff1442014-08-02 01:30:37 -04002771 "list indices must be integers or slices, not %.200s",
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002772 item->ob_type->tp_name);
2773 return NULL;
2774 }
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002775}
2776
Tim Peters3b01a122002-07-19 02:35:45 +00002777static int
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002778list_ass_subscript(PyListObject* self, PyObject* item, PyObject* value)
2779{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002780 if (PyIndex_Check(item)) {
2781 Py_ssize_t i = PyNumber_AsSsize_t(item, PyExc_IndexError);
2782 if (i == -1 && PyErr_Occurred())
2783 return -1;
2784 if (i < 0)
2785 i += PyList_GET_SIZE(self);
2786 return list_ass_item(self, i, value);
2787 }
2788 else if (PySlice_Check(item)) {
2789 Py_ssize_t start, stop, step, slicelength;
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002790
Serhiy Storchakab879fe82017-04-08 09:53:51 +03002791 if (PySlice_Unpack(item, &start, &stop, &step) < 0) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002792 return -1;
2793 }
Serhiy Storchakab879fe82017-04-08 09:53:51 +03002794 slicelength = PySlice_AdjustIndices(Py_SIZE(self), &start, &stop,
2795 step);
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002796
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002797 if (step == 1)
2798 return list_ass_slice(self, start, stop, value);
Michael W. Hudson9c14bad2002-06-19 15:44:15 +00002799
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002800 /* Make sure s[5:2] = [..] inserts at the right place:
2801 before 5, not before 2. */
2802 if ((step < 0 && start < stop) ||
2803 (step > 0 && start > stop))
2804 stop = start;
Thomas Woutersed03b412007-08-28 21:37:11 +00002805
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002806 if (value == NULL) {
2807 /* delete slice */
2808 PyObject **garbage;
2809 size_t cur;
2810 Py_ssize_t i;
Victor Stinner35f28032013-11-21 12:16:35 +01002811 int res;
Tim Peters3b01a122002-07-19 02:35:45 +00002812
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002813 if (slicelength <= 0)
2814 return 0;
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002815
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002816 if (step < 0) {
2817 stop = start + 1;
2818 start = stop + step*(slicelength - 1) - 1;
2819 step = -step;
2820 }
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002821
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002822 garbage = (PyObject**)
2823 PyMem_MALLOC(slicelength*sizeof(PyObject*));
2824 if (!garbage) {
2825 PyErr_NoMemory();
2826 return -1;
2827 }
Tim Peters3b01a122002-07-19 02:35:45 +00002828
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002829 /* drawing pictures might help understand these for
2830 loops. Basically, we memmove the parts of the
2831 list that are *not* part of the slice: step-1
2832 items for each item that is part of the slice,
2833 and then tail end of the list that was not
2834 covered by the slice */
2835 for (cur = start, i = 0;
2836 cur < (size_t)stop;
2837 cur += step, i++) {
2838 Py_ssize_t lim = step - 1;
Michael W. Hudson56796f62002-07-29 14:35:04 +00002839
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002840 garbage[i] = PyList_GET_ITEM(self, cur);
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002841
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002842 if (cur + step >= (size_t)Py_SIZE(self)) {
2843 lim = Py_SIZE(self) - cur - 1;
2844 }
Michael W. Hudson56796f62002-07-29 14:35:04 +00002845
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002846 memmove(self->ob_item + cur - i,
2847 self->ob_item + cur + 1,
2848 lim * sizeof(PyObject *));
2849 }
Mark Dickinsonc7d93b72011-09-25 15:34:32 +01002850 cur = start + (size_t)slicelength * step;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002851 if (cur < (size_t)Py_SIZE(self)) {
2852 memmove(self->ob_item + cur - slicelength,
2853 self->ob_item + cur,
2854 (Py_SIZE(self) - cur) *
2855 sizeof(PyObject *));
2856 }
Raymond Hettingera6366fe2004-03-09 13:05:22 +00002857
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002858 Py_SIZE(self) -= slicelength;
Victor Stinner35f28032013-11-21 12:16:35 +01002859 res = list_resize(self, Py_SIZE(self));
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002860
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002861 for (i = 0; i < slicelength; i++) {
2862 Py_DECREF(garbage[i]);
2863 }
2864 PyMem_FREE(garbage);
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002865
Victor Stinner35f28032013-11-21 12:16:35 +01002866 return res;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002867 }
2868 else {
2869 /* assign slice */
2870 PyObject *ins, *seq;
2871 PyObject **garbage, **seqitems, **selfitems;
2872 Py_ssize_t cur, i;
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002873
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002874 /* protect against a[::-1] = a */
2875 if (self == (PyListObject*)value) {
2876 seq = list_slice((PyListObject*)value, 0,
2877 PyList_GET_SIZE(value));
2878 }
2879 else {
2880 seq = PySequence_Fast(value,
2881 "must assign iterable "
2882 "to extended slice");
2883 }
2884 if (!seq)
2885 return -1;
Michael W. Hudsona69c0302002-12-05 21:32:32 +00002886
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002887 if (PySequence_Fast_GET_SIZE(seq) != slicelength) {
2888 PyErr_Format(PyExc_ValueError,
2889 "attempt to assign sequence of "
2890 "size %zd to extended slice of "
2891 "size %zd",
2892 PySequence_Fast_GET_SIZE(seq),
2893 slicelength);
2894 Py_DECREF(seq);
2895 return -1;
2896 }
Michael W. Hudsona69c0302002-12-05 21:32:32 +00002897
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002898 if (!slicelength) {
2899 Py_DECREF(seq);
2900 return 0;
2901 }
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002902
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002903 garbage = (PyObject**)
2904 PyMem_MALLOC(slicelength*sizeof(PyObject*));
2905 if (!garbage) {
2906 Py_DECREF(seq);
2907 PyErr_NoMemory();
2908 return -1;
2909 }
Tim Peters3b01a122002-07-19 02:35:45 +00002910
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002911 selfitems = self->ob_item;
2912 seqitems = PySequence_Fast_ITEMS(seq);
2913 for (cur = start, i = 0; i < slicelength;
Mark Dickinsonc7d93b72011-09-25 15:34:32 +01002914 cur += (size_t)step, i++) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002915 garbage[i] = selfitems[cur];
2916 ins = seqitems[i];
2917 Py_INCREF(ins);
2918 selfitems[cur] = ins;
2919 }
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002920
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002921 for (i = 0; i < slicelength; i++) {
2922 Py_DECREF(garbage[i]);
2923 }
Tim Peters3b01a122002-07-19 02:35:45 +00002924
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002925 PyMem_FREE(garbage);
2926 Py_DECREF(seq);
Tim Peters3b01a122002-07-19 02:35:45 +00002927
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002928 return 0;
2929 }
2930 }
2931 else {
2932 PyErr_Format(PyExc_TypeError,
Terry Jan Reedyffff1442014-08-02 01:30:37 -04002933 "list indices must be integers or slices, not %.200s",
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002934 item->ob_type->tp_name);
2935 return -1;
2936 }
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002937}
2938
2939static PyMappingMethods list_as_mapping = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002940 (lenfunc)list_length,
2941 (binaryfunc)list_subscript,
2942 (objobjargproc)list_ass_subscript
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002943};
2944
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002945PyTypeObject PyList_Type = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002946 PyVarObject_HEAD_INIT(&PyType_Type, 0)
2947 "list",
2948 sizeof(PyListObject),
2949 0,
2950 (destructor)list_dealloc, /* tp_dealloc */
2951 0, /* tp_print */
2952 0, /* tp_getattr */
2953 0, /* tp_setattr */
2954 0, /* tp_reserved */
2955 (reprfunc)list_repr, /* tp_repr */
2956 0, /* tp_as_number */
2957 &list_as_sequence, /* tp_as_sequence */
2958 &list_as_mapping, /* tp_as_mapping */
Georg Brandl00da4e02010-10-18 07:32:48 +00002959 PyObject_HashNotImplemented, /* tp_hash */
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002960 0, /* tp_call */
2961 0, /* tp_str */
2962 PyObject_GenericGetAttr, /* tp_getattro */
2963 0, /* tp_setattro */
2964 0, /* tp_as_buffer */
2965 Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC |
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002966 Py_TPFLAGS_BASETYPE | Py_TPFLAGS_LIST_SUBCLASS, /* tp_flags */
2967 list___init____doc__, /* tp_doc */
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002968 (traverseproc)list_traverse, /* tp_traverse */
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002969 (inquiry)_list_clear, /* tp_clear */
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002970 list_richcompare, /* tp_richcompare */
2971 0, /* tp_weaklistoffset */
2972 list_iter, /* tp_iter */
2973 0, /* tp_iternext */
2974 list_methods, /* tp_methods */
2975 0, /* tp_members */
2976 0, /* tp_getset */
2977 0, /* tp_base */
2978 0, /* tp_dict */
2979 0, /* tp_descr_get */
2980 0, /* tp_descr_set */
2981 0, /* tp_dictoffset */
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02002982 (initproc)list___init__, /* tp_init */
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002983 PyType_GenericAlloc, /* tp_alloc */
2984 PyType_GenericNew, /* tp_new */
2985 PyObject_GC_Del, /* tp_free */
Guido van Rossum85a5fbb1990-10-14 12:07:46 +00002986};
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00002987
Raymond Hettinger14bd6de2002-05-31 21:40:38 +00002988/*********************** List Iterator **************************/
2989
2990typedef struct {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002991 PyObject_HEAD
Victor Stinner7660b882013-06-24 23:59:24 +02002992 Py_ssize_t it_index;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002993 PyListObject *it_seq; /* Set to NULL when iterator is exhausted */
Raymond Hettinger14bd6de2002-05-31 21:40:38 +00002994} listiterobject;
2995
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00002996static void listiter_dealloc(listiterobject *);
2997static int listiter_traverse(listiterobject *, visitproc, void *);
2998static PyObject *listiter_next(listiterobject *);
2999static PyObject *listiter_len(listiterobject *);
Kristján Valur Jónsson31668b82012-04-03 10:49:41 +00003000static PyObject *listiter_reduce_general(void *_it, int forward);
3001static PyObject *listiter_reduce(listiterobject *);
3002static PyObject *listiter_setstate(listiterobject *, PyObject *state);
Raymond Hettinger435bf582004-03-18 22:43:10 +00003003
Armin Rigof5b3e362006-02-11 21:32:43 +00003004PyDoc_STRVAR(length_hint_doc, "Private method returning an estimate of len(list(it)).");
Kristján Valur Jónsson31668b82012-04-03 10:49:41 +00003005PyDoc_STRVAR(reduce_doc, "Return state information for pickling.");
3006PyDoc_STRVAR(setstate_doc, "Set state information for unpickling.");
Raymond Hettinger6b27cda2005-09-24 21:23:05 +00003007
3008static PyMethodDef listiter_methods[] = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003009 {"__length_hint__", (PyCFunction)listiter_len, METH_NOARGS, length_hint_doc},
Kristján Valur Jónsson31668b82012-04-03 10:49:41 +00003010 {"__reduce__", (PyCFunction)listiter_reduce, METH_NOARGS, reduce_doc},
3011 {"__setstate__", (PyCFunction)listiter_setstate, METH_O, setstate_doc},
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003012 {NULL, NULL} /* sentinel */
Raymond Hettinger435bf582004-03-18 22:43:10 +00003013};
3014
Raymond Hettinger14bd6de2002-05-31 21:40:38 +00003015PyTypeObject PyListIter_Type = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003016 PyVarObject_HEAD_INIT(&PyType_Type, 0)
3017 "list_iterator", /* tp_name */
3018 sizeof(listiterobject), /* tp_basicsize */
3019 0, /* tp_itemsize */
3020 /* methods */
3021 (destructor)listiter_dealloc, /* tp_dealloc */
3022 0, /* tp_print */
3023 0, /* tp_getattr */
3024 0, /* tp_setattr */
3025 0, /* tp_reserved */
3026 0, /* tp_repr */
3027 0, /* tp_as_number */
3028 0, /* tp_as_sequence */
3029 0, /* tp_as_mapping */
3030 0, /* tp_hash */
3031 0, /* tp_call */
3032 0, /* tp_str */
3033 PyObject_GenericGetAttr, /* tp_getattro */
3034 0, /* tp_setattro */
3035 0, /* tp_as_buffer */
3036 Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC,/* tp_flags */
3037 0, /* tp_doc */
3038 (traverseproc)listiter_traverse, /* tp_traverse */
3039 0, /* tp_clear */
3040 0, /* tp_richcompare */
3041 0, /* tp_weaklistoffset */
3042 PyObject_SelfIter, /* tp_iter */
3043 (iternextfunc)listiter_next, /* tp_iternext */
3044 listiter_methods, /* tp_methods */
3045 0, /* tp_members */
Raymond Hettinger14bd6de2002-05-31 21:40:38 +00003046};
Raymond Hettinger1021c442003-11-07 15:38:09 +00003047
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00003048
3049static PyObject *
3050list_iter(PyObject *seq)
3051{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003052 listiterobject *it;
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00003053
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003054 if (!PyList_Check(seq)) {
3055 PyErr_BadInternalCall();
3056 return NULL;
3057 }
3058 it = PyObject_GC_New(listiterobject, &PyListIter_Type);
3059 if (it == NULL)
3060 return NULL;
3061 it->it_index = 0;
3062 Py_INCREF(seq);
3063 it->it_seq = (PyListObject *)seq;
3064 _PyObject_GC_TRACK(it);
3065 return (PyObject *)it;
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00003066}
3067
3068static void
3069listiter_dealloc(listiterobject *it)
3070{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003071 _PyObject_GC_UNTRACK(it);
3072 Py_XDECREF(it->it_seq);
3073 PyObject_GC_Del(it);
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00003074}
3075
3076static int
3077listiter_traverse(listiterobject *it, visitproc visit, void *arg)
3078{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003079 Py_VISIT(it->it_seq);
3080 return 0;
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00003081}
3082
3083static PyObject *
3084listiter_next(listiterobject *it)
3085{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003086 PyListObject *seq;
3087 PyObject *item;
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00003088
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003089 assert(it != NULL);
3090 seq = it->it_seq;
3091 if (seq == NULL)
3092 return NULL;
3093 assert(PyList_Check(seq));
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00003094
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003095 if (it->it_index < PyList_GET_SIZE(seq)) {
3096 item = PyList_GET_ITEM(seq, it->it_index);
3097 ++it->it_index;
3098 Py_INCREF(item);
3099 return item;
3100 }
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00003101
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003102 it->it_seq = NULL;
Serhiy Storchakafbb1c5e2016-03-30 20:40:02 +03003103 Py_DECREF(seq);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003104 return NULL;
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00003105}
3106
3107static PyObject *
3108listiter_len(listiterobject *it)
3109{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003110 Py_ssize_t len;
3111 if (it->it_seq) {
3112 len = PyList_GET_SIZE(it->it_seq) - it->it_index;
3113 if (len >= 0)
3114 return PyLong_FromSsize_t(len);
3115 }
3116 return PyLong_FromLong(0);
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00003117}
Kristján Valur Jónsson31668b82012-04-03 10:49:41 +00003118
3119static PyObject *
3120listiter_reduce(listiterobject *it)
3121{
3122 return listiter_reduce_general(it, 1);
3123}
3124
3125static PyObject *
3126listiter_setstate(listiterobject *it, PyObject *state)
3127{
Victor Stinner7660b882013-06-24 23:59:24 +02003128 Py_ssize_t index = PyLong_AsSsize_t(state);
Kristján Valur Jónsson31668b82012-04-03 10:49:41 +00003129 if (index == -1 && PyErr_Occurred())
3130 return NULL;
3131 if (it->it_seq != NULL) {
3132 if (index < 0)
3133 index = 0;
Kristján Valur Jónsson25dded02014-03-05 13:47:57 +00003134 else if (index > PyList_GET_SIZE(it->it_seq))
3135 index = PyList_GET_SIZE(it->it_seq); /* iterator exhausted */
Kristján Valur Jónsson31668b82012-04-03 10:49:41 +00003136 it->it_index = index;
3137 }
3138 Py_RETURN_NONE;
3139}
3140
Raymond Hettinger1021c442003-11-07 15:38:09 +00003141/*********************** List Reverse Iterator **************************/
3142
3143typedef struct {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003144 PyObject_HEAD
3145 Py_ssize_t it_index;
3146 PyListObject *it_seq; /* Set to NULL when iterator is exhausted */
Raymond Hettinger1021c442003-11-07 15:38:09 +00003147} listreviterobject;
3148
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00003149static void listreviter_dealloc(listreviterobject *);
3150static int listreviter_traverse(listreviterobject *, visitproc, void *);
3151static PyObject *listreviter_next(listreviterobject *);
Raymond Hettingerf5b64112008-12-02 21:33:45 +00003152static PyObject *listreviter_len(listreviterobject *);
Kristján Valur Jónsson31668b82012-04-03 10:49:41 +00003153static PyObject *listreviter_reduce(listreviterobject *);
3154static PyObject *listreviter_setstate(listreviterobject *, PyObject *);
Raymond Hettingeref9bf402004-03-10 10:10:42 +00003155
Raymond Hettingerf5b64112008-12-02 21:33:45 +00003156static PyMethodDef listreviter_methods[] = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003157 {"__length_hint__", (PyCFunction)listreviter_len, METH_NOARGS, length_hint_doc},
Kristján Valur Jónsson31668b82012-04-03 10:49:41 +00003158 {"__reduce__", (PyCFunction)listreviter_reduce, METH_NOARGS, reduce_doc},
3159 {"__setstate__", (PyCFunction)listreviter_setstate, METH_O, setstate_doc},
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003160 {NULL, NULL} /* sentinel */
Raymond Hettingeref9bf402004-03-10 10:10:42 +00003161};
3162
Raymond Hettinger1021c442003-11-07 15:38:09 +00003163PyTypeObject PyListRevIter_Type = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003164 PyVarObject_HEAD_INIT(&PyType_Type, 0)
3165 "list_reverseiterator", /* tp_name */
3166 sizeof(listreviterobject), /* tp_basicsize */
3167 0, /* tp_itemsize */
3168 /* methods */
3169 (destructor)listreviter_dealloc, /* tp_dealloc */
3170 0, /* tp_print */
3171 0, /* tp_getattr */
3172 0, /* tp_setattr */
3173 0, /* tp_reserved */
3174 0, /* tp_repr */
3175 0, /* tp_as_number */
3176 0, /* tp_as_sequence */
3177 0, /* tp_as_mapping */
3178 0, /* tp_hash */
3179 0, /* tp_call */
3180 0, /* tp_str */
3181 PyObject_GenericGetAttr, /* tp_getattro */
3182 0, /* tp_setattro */
3183 0, /* tp_as_buffer */
3184 Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC,/* tp_flags */
3185 0, /* tp_doc */
3186 (traverseproc)listreviter_traverse, /* tp_traverse */
3187 0, /* tp_clear */
3188 0, /* tp_richcompare */
3189 0, /* tp_weaklistoffset */
3190 PyObject_SelfIter, /* tp_iter */
3191 (iternextfunc)listreviter_next, /* tp_iternext */
3192 listreviter_methods, /* tp_methods */
3193 0,
Raymond Hettinger1021c442003-11-07 15:38:09 +00003194};
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00003195
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02003196/*[clinic input]
3197list.__reversed__
3198
3199Return a reverse iterator over the list.
3200[clinic start generated code]*/
3201
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00003202static PyObject *
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02003203list___reversed___impl(PyListObject *self)
3204/*[clinic end generated code: output=b166f073208c888c input=eadb6e17f8a6a280]*/
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00003205{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003206 listreviterobject *it;
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00003207
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003208 it = PyObject_GC_New(listreviterobject, &PyListRevIter_Type);
3209 if (it == NULL)
3210 return NULL;
Serhiy Storchakafdd42c42017-03-11 09:19:20 +02003211 assert(PyList_Check(self));
3212 it->it_index = PyList_GET_SIZE(self) - 1;
3213 Py_INCREF(self);
3214 it->it_seq = self;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003215 PyObject_GC_Track(it);
3216 return (PyObject *)it;
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00003217}
3218
3219static void
3220listreviter_dealloc(listreviterobject *it)
3221{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003222 PyObject_GC_UnTrack(it);
3223 Py_XDECREF(it->it_seq);
3224 PyObject_GC_Del(it);
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00003225}
3226
3227static int
3228listreviter_traverse(listreviterobject *it, visitproc visit, void *arg)
3229{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003230 Py_VISIT(it->it_seq);
3231 return 0;
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00003232}
3233
3234static PyObject *
3235listreviter_next(listreviterobject *it)
3236{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003237 PyObject *item;
Serhiy Storchakafbb1c5e2016-03-30 20:40:02 +03003238 Py_ssize_t index;
3239 PyListObject *seq;
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00003240
Serhiy Storchakafbb1c5e2016-03-30 20:40:02 +03003241 assert(it != NULL);
3242 seq = it->it_seq;
3243 if (seq == NULL) {
3244 return NULL;
3245 }
3246 assert(PyList_Check(seq));
3247
3248 index = it->it_index;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003249 if (index>=0 && index < PyList_GET_SIZE(seq)) {
3250 item = PyList_GET_ITEM(seq, index);
3251 it->it_index--;
3252 Py_INCREF(item);
3253 return item;
3254 }
3255 it->it_index = -1;
Serhiy Storchakafbb1c5e2016-03-30 20:40:02 +03003256 it->it_seq = NULL;
3257 Py_DECREF(seq);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003258 return NULL;
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00003259}
3260
Raymond Hettingerf5b64112008-12-02 21:33:45 +00003261static PyObject *
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00003262listreviter_len(listreviterobject *it)
3263{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003264 Py_ssize_t len = it->it_index + 1;
3265 if (it->it_seq == NULL || PyList_GET_SIZE(it->it_seq) < len)
3266 len = 0;
3267 return PyLong_FromSsize_t(len);
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00003268}
Kristján Valur Jónsson31668b82012-04-03 10:49:41 +00003269
3270static PyObject *
3271listreviter_reduce(listreviterobject *it)
3272{
3273 return listiter_reduce_general(it, 0);
3274}
3275
3276static PyObject *
3277listreviter_setstate(listreviterobject *it, PyObject *state)
3278{
3279 Py_ssize_t index = PyLong_AsSsize_t(state);
3280 if (index == -1 && PyErr_Occurred())
3281 return NULL;
3282 if (it->it_seq != NULL) {
3283 if (index < -1)
3284 index = -1;
3285 else if (index > PyList_GET_SIZE(it->it_seq) - 1)
3286 index = PyList_GET_SIZE(it->it_seq) - 1;
3287 it->it_index = index;
3288 }
3289 Py_RETURN_NONE;
3290}
3291
3292/* common pickling support */
3293
3294static PyObject *
3295listiter_reduce_general(void *_it, int forward)
3296{
3297 PyObject *list;
3298
3299 /* the objects are not the same, index is of different types! */
3300 if (forward) {
3301 listiterobject *it = (listiterobject *)_it;
3302 if (it->it_seq)
Victor Stinner7660b882013-06-24 23:59:24 +02003303 return Py_BuildValue("N(O)n", _PyObject_GetBuiltin("iter"),
Kristján Valur Jónsson31668b82012-04-03 10:49:41 +00003304 it->it_seq, it->it_index);
3305 } else {
3306 listreviterobject *it = (listreviterobject *)_it;
3307 if (it->it_seq)
Antoine Pitroua7013882012-04-05 00:04:20 +02003308 return Py_BuildValue("N(O)n", _PyObject_GetBuiltin("reversed"),
Kristján Valur Jónsson31668b82012-04-03 10:49:41 +00003309 it->it_seq, it->it_index);
3310 }
3311 /* empty iterator, create an empty list */
3312 list = PyList_New(0);
3313 if (list == NULL)
3314 return NULL;
Antoine Pitroua7013882012-04-05 00:04:20 +02003315 return Py_BuildValue("N(N)", _PyObject_GetBuiltin("iter"), list);
Kristján Valur Jónsson31668b82012-04-03 10:49:41 +00003316}