blob: f753643bd39a94987be327c791dea4eed6183cae [file] [log] [blame]
Guido van Rossum85a5fbb1990-10-14 12:07:46 +00001/* List object implementation */
2
Guido van Rossumc0b618a1997-05-02 03:12:38 +00003#include "Python.h"
4
Guido van Rossum6cd2fe01994-08-29 12:45:32 +00005#ifdef STDC_HEADERS
6#include <stddef.h>
7#else
Antoine Pitrouc83ea132010-05-09 14:46:46 +00008#include <sys/types.h> /* For size_t */
Guido van Rossum6cd2fe01994-08-29 12:45:32 +00009#endif
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000010
Tim Peters8d9eb102004-07-31 02:24:20 +000011/* Ensure ob_item has room for at least newsize elements, and set
12 * ob_size to newsize. If newsize > ob_size on entry, the content
13 * of the new slots at exit is undefined heap trash; it's the caller's
Ezio Melottic2077b02011-03-16 12:34:31 +020014 * responsibility to overwrite them with sane values.
Tim Peters8d9eb102004-07-31 02:24:20 +000015 * The number of allocated elements may grow, shrink, or stay the same.
16 * Failure is impossible if newsize <= self.allocated on entry, although
17 * that partly relies on an assumption that the system realloc() never
18 * fails when passed a number of bytes <= the number of bytes last
19 * allocated (the C standard doesn't guarantee this, but it's hard to
20 * imagine a realloc implementation where it wouldn't be true).
21 * Note that self->ob_item may change, and even if newsize is less
22 * than ob_size on entry.
23 */
Guido van Rossuma46d51d1995-01-26 22:59:43 +000024static int
Martin v. Löwis18e16552006-02-15 17:27:45 +000025list_resize(PyListObject *self, Py_ssize_t newsize)
Guido van Rossuma46d51d1995-01-26 22:59:43 +000026{
Antoine Pitrouc83ea132010-05-09 14:46:46 +000027 PyObject **items;
28 size_t new_allocated;
29 Py_ssize_t allocated = self->allocated;
Tim Peters65b8b842001-05-26 05:28:40 +000030
Antoine Pitrouc83ea132010-05-09 14:46:46 +000031 /* Bypass realloc() when a previous overallocation is large enough
32 to accommodate the newsize. If the newsize falls lower than half
33 the allocated size, then proceed with the realloc() to shrink the list.
34 */
35 if (allocated >= newsize && newsize >= (allocated >> 1)) {
36 assert(self->ob_item != NULL || newsize == 0);
37 Py_SIZE(self) = newsize;
38 return 0;
39 }
Raymond Hettinger4bb95402004-02-13 11:36:39 +000040
Antoine Pitrouc83ea132010-05-09 14:46:46 +000041 /* This over-allocates proportional to the list size, making room
42 * for additional growth. The over-allocation is mild, but is
43 * enough to give linear-time amortized behavior over a long
44 * sequence of appends() in the presence of a poorly-performing
45 * system realloc().
46 * The growth pattern is: 0, 4, 8, 16, 25, 35, 46, 58, 72, 88, ...
47 */
48 new_allocated = (newsize >> 3) + (newsize < 9 ? 3 : 6);
Gregory P. Smith9d534572008-06-11 07:41:16 +000049
Antoine Pitrouc83ea132010-05-09 14:46:46 +000050 /* check for integer overflow */
51 if (new_allocated > PY_SIZE_MAX - newsize) {
52 PyErr_NoMemory();
53 return -1;
54 } else {
55 new_allocated += newsize;
56 }
Gregory P. Smith9d534572008-06-11 07:41:16 +000057
Antoine Pitrouc83ea132010-05-09 14:46:46 +000058 if (newsize == 0)
59 new_allocated = 0;
60 items = self->ob_item;
Mark Dickinson4ac5d2c2011-09-19 19:23:55 +010061 if (new_allocated <= (PY_SIZE_MAX / sizeof(PyObject *)))
Antoine Pitrouc83ea132010-05-09 14:46:46 +000062 PyMem_RESIZE(items, PyObject *, new_allocated);
63 else
64 items = NULL;
65 if (items == NULL) {
66 PyErr_NoMemory();
67 return -1;
68 }
69 self->ob_item = items;
70 Py_SIZE(self) = newsize;
71 self->allocated = new_allocated;
72 return 0;
Raymond Hettinger4bb95402004-02-13 11:36:39 +000073}
Guido van Rossuma46d51d1995-01-26 22:59:43 +000074
Christian Heimesb4ee4a12008-02-07 17:15:30 +000075/* Debug statistic to compare allocations with reuse through the free list */
76#undef SHOW_ALLOC_COUNT
77#ifdef SHOW_ALLOC_COUNT
78static size_t count_alloc = 0;
79static size_t count_reuse = 0;
80
81static void
82show_alloc(void)
83{
Antoine Pitrouc83ea132010-05-09 14:46:46 +000084 fprintf(stderr, "List allocations: %" PY_FORMAT_SIZE_T "d\n",
85 count_alloc);
86 fprintf(stderr, "List reuse through freelist: %" PY_FORMAT_SIZE_T
87 "d\n", count_reuse);
88 fprintf(stderr, "%.2f%% reuse rate\n\n",
89 (100.0*count_reuse/(count_alloc+count_reuse)));
Christian Heimesb4ee4a12008-02-07 17:15:30 +000090}
91#endif
92
Raymond Hettinger0468e412004-05-05 05:37:53 +000093/* Empty list reuse scheme to save calls to malloc and free */
Christian Heimes5b970ad2008-02-06 13:33:44 +000094#ifndef PyList_MAXFREELIST
95#define PyList_MAXFREELIST 80
96#endif
97static PyListObject *free_list[PyList_MAXFREELIST];
98static int numfree = 0;
Raymond Hettinger0468e412004-05-05 05:37:53 +000099
Raymond Hettingerfb09f0e2004-10-07 03:58:07 +0000100void
101PyList_Fini(void)
102{
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000103 PyListObject *op;
Raymond Hettingerfb09f0e2004-10-07 03:58:07 +0000104
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000105 while (numfree) {
106 op = free_list[--numfree];
107 assert(PyList_CheckExact(op));
108 PyObject_GC_Del(op);
109 }
Raymond Hettingerfb09f0e2004-10-07 03:58:07 +0000110}
111
Guido van Rossumc0b618a1997-05-02 03:12:38 +0000112PyObject *
Martin v. Löwis18e16552006-02-15 17:27:45 +0000113PyList_New(Py_ssize_t size)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000114{
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000115 PyListObject *op;
116 size_t nbytes;
Christian Heimesb4ee4a12008-02-07 17:15:30 +0000117#ifdef SHOW_ALLOC_COUNT
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000118 static int initialized = 0;
119 if (!initialized) {
120 Py_AtExit(show_alloc);
121 initialized = 1;
122 }
Christian Heimesb4ee4a12008-02-07 17:15:30 +0000123#endif
Tim Peters3986d4e2004-07-29 02:28:42 +0000124
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000125 if (size < 0) {
126 PyErr_BadInternalCall();
127 return NULL;
128 }
129 /* Check for overflow without an actual overflow,
130 * which can cause compiler to optimise out */
131 if ((size_t)size > PY_SIZE_MAX / sizeof(PyObject *))
132 return PyErr_NoMemory();
133 nbytes = size * sizeof(PyObject *);
134 if (numfree) {
135 numfree--;
136 op = free_list[numfree];
137 _Py_NewReference((PyObject *)op);
Christian Heimesb4ee4a12008-02-07 17:15:30 +0000138#ifdef SHOW_ALLOC_COUNT
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000139 count_reuse++;
Christian Heimesb4ee4a12008-02-07 17:15:30 +0000140#endif
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000141 } else {
142 op = PyObject_GC_New(PyListObject, &PyList_Type);
143 if (op == NULL)
144 return NULL;
Christian Heimesb4ee4a12008-02-07 17:15:30 +0000145#ifdef SHOW_ALLOC_COUNT
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000146 count_alloc++;
Christian Heimesb4ee4a12008-02-07 17:15:30 +0000147#endif
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000148 }
149 if (size <= 0)
150 op->ob_item = NULL;
151 else {
152 op->ob_item = (PyObject **) PyMem_MALLOC(nbytes);
153 if (op->ob_item == NULL) {
154 Py_DECREF(op);
155 return PyErr_NoMemory();
156 }
157 memset(op->ob_item, 0, nbytes);
158 }
159 Py_SIZE(op) = size;
160 op->allocated = size;
161 _PyObject_GC_TRACK(op);
162 return (PyObject *) op;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000163}
164
Martin v. Löwis18e16552006-02-15 17:27:45 +0000165Py_ssize_t
Fred Drakea2f55112000-07-09 15:16:51 +0000166PyList_Size(PyObject *op)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000167{
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000168 if (!PyList_Check(op)) {
169 PyErr_BadInternalCall();
170 return -1;
171 }
172 else
173 return Py_SIZE(op);
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000174}
175
Raymond Hettingerfdfe6182004-05-05 06:28:16 +0000176static PyObject *indexerr = NULL;
Guido van Rossum929f1b81996-08-09 20:51:27 +0000177
Guido van Rossumc0b618a1997-05-02 03:12:38 +0000178PyObject *
Martin v. Löwis18e16552006-02-15 17:27:45 +0000179PyList_GetItem(PyObject *op, Py_ssize_t i)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000180{
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000181 if (!PyList_Check(op)) {
182 PyErr_BadInternalCall();
183 return NULL;
184 }
185 if (i < 0 || i >= Py_SIZE(op)) {
186 if (indexerr == NULL) {
187 indexerr = PyString_FromString(
188 "list index out of range");
189 if (indexerr == NULL)
190 return NULL;
191 }
192 PyErr_SetObject(PyExc_IndexError, indexerr);
193 return NULL;
194 }
195 return ((PyListObject *)op) -> ob_item[i];
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000196}
197
198int
Martin v. Löwis18e16552006-02-15 17:27:45 +0000199PyList_SetItem(register PyObject *op, register Py_ssize_t i,
Fred Drakea2f55112000-07-09 15:16:51 +0000200 register PyObject *newitem)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000201{
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000202 register PyObject *olditem;
203 register PyObject **p;
204 if (!PyList_Check(op)) {
205 Py_XDECREF(newitem);
206 PyErr_BadInternalCall();
207 return -1;
208 }
209 if (i < 0 || i >= Py_SIZE(op)) {
210 Py_XDECREF(newitem);
211 PyErr_SetString(PyExc_IndexError,
212 "list assignment index out of range");
213 return -1;
214 }
215 p = ((PyListObject *)op) -> ob_item + i;
216 olditem = *p;
217 *p = newitem;
218 Py_XDECREF(olditem);
219 return 0;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000220}
221
222static int
Martin v. Löwis18e16552006-02-15 17:27:45 +0000223ins1(PyListObject *self, Py_ssize_t where, PyObject *v)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000224{
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000225 Py_ssize_t i, n = Py_SIZE(self);
226 PyObject **items;
227 if (v == NULL) {
228 PyErr_BadInternalCall();
229 return -1;
230 }
231 if (n == PY_SSIZE_T_MAX) {
232 PyErr_SetString(PyExc_OverflowError,
233 "cannot add more objects to list");
234 return -1;
235 }
Tim Petersb38e2b62004-07-29 02:29:26 +0000236
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000237 if (list_resize(self, n+1) == -1)
238 return -1;
Raymond Hettinger4bb95402004-02-13 11:36:39 +0000239
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000240 if (where < 0) {
241 where += n;
242 if (where < 0)
243 where = 0;
244 }
245 if (where > n)
246 where = n;
247 items = self->ob_item;
248 for (i = n; --i >= where; )
249 items[i+1] = items[i];
250 Py_INCREF(v);
251 items[where] = v;
252 return 0;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000253}
254
255int
Martin v. Löwis18e16552006-02-15 17:27:45 +0000256PyList_Insert(PyObject *op, Py_ssize_t where, PyObject *newitem)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000257{
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000258 if (!PyList_Check(op)) {
259 PyErr_BadInternalCall();
260 return -1;
261 }
262 return ins1((PyListObject *)op, where, newitem);
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000263}
264
Raymond Hettinger40a03822004-04-12 13:05:09 +0000265static int
266app1(PyListObject *self, PyObject *v)
267{
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000268 Py_ssize_t n = PyList_GET_SIZE(self);
Raymond Hettinger40a03822004-04-12 13:05:09 +0000269
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000270 assert (v != NULL);
271 if (n == PY_SSIZE_T_MAX) {
272 PyErr_SetString(PyExc_OverflowError,
273 "cannot add more objects to list");
274 return -1;
275 }
Raymond Hettinger40a03822004-04-12 13:05:09 +0000276
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000277 if (list_resize(self, n+1) == -1)
278 return -1;
Raymond Hettinger40a03822004-04-12 13:05:09 +0000279
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000280 Py_INCREF(v);
281 PyList_SET_ITEM(self, n, v);
282 return 0;
Raymond Hettinger40a03822004-04-12 13:05:09 +0000283}
284
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000285int
Fred Drakea2f55112000-07-09 15:16:51 +0000286PyList_Append(PyObject *op, PyObject *newitem)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000287{
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000288 if (PyList_Check(op) && (newitem != NULL))
289 return app1((PyListObject *)op, newitem);
290 PyErr_BadInternalCall();
291 return -1;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000292}
293
294/* Methods */
295
296static void
Fred Drakea2f55112000-07-09 15:16:51 +0000297list_dealloc(PyListObject *op)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000298{
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000299 Py_ssize_t i;
300 PyObject_GC_UnTrack(op);
301 Py_TRASHCAN_SAFE_BEGIN(op)
302 if (op->ob_item != NULL) {
303 /* Do it backwards, for Christian Tismer.
304 There's a simple test case where somehow this reduces
305 thrashing when a *very* large list is created and
306 immediately deleted. */
307 i = Py_SIZE(op);
308 while (--i >= 0) {
309 Py_XDECREF(op->ob_item[i]);
310 }
311 PyMem_FREE(op->ob_item);
312 }
313 if (numfree < PyList_MAXFREELIST && PyList_CheckExact(op))
314 free_list[numfree++] = op;
315 else
316 Py_TYPE(op)->tp_free((PyObject *)op);
317 Py_TRASHCAN_SAFE_END(op)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000318}
319
Guido van Rossum90933611991-06-07 16:10:43 +0000320static int
Fred Drakea2f55112000-07-09 15:16:51 +0000321list_print(PyListObject *op, FILE *fp, int flags)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000322{
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000323 int rc;
324 Py_ssize_t i;
325 PyObject *item;
Guido van Rossumfb376de1998-04-10 22:47:27 +0000326
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000327 rc = Py_ReprEnter((PyObject*)op);
328 if (rc != 0) {
329 if (rc < 0)
330 return rc;
331 Py_BEGIN_ALLOW_THREADS
332 fprintf(fp, "[...]");
333 Py_END_ALLOW_THREADS
334 return 0;
335 }
336 Py_BEGIN_ALLOW_THREADS
337 fprintf(fp, "[");
338 Py_END_ALLOW_THREADS
339 for (i = 0; i < Py_SIZE(op); i++) {
340 item = op->ob_item[i];
341 Py_INCREF(item);
342 if (i > 0) {
343 Py_BEGIN_ALLOW_THREADS
344 fprintf(fp, ", ");
345 Py_END_ALLOW_THREADS
346 }
347 if (PyObject_Print(item, fp, 0) != 0) {
348 Py_DECREF(item);
349 Py_ReprLeave((PyObject *)op);
350 return -1;
351 }
352 Py_DECREF(item);
353 }
354 Py_BEGIN_ALLOW_THREADS
355 fprintf(fp, "]");
356 Py_END_ALLOW_THREADS
357 Py_ReprLeave((PyObject *)op);
358 return 0;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000359}
360
Guido van Rossumc0b618a1997-05-02 03:12:38 +0000361static PyObject *
Fred Drakea2f55112000-07-09 15:16:51 +0000362list_repr(PyListObject *v)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000363{
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000364 Py_ssize_t i;
365 PyObject *s, *temp;
366 PyObject *pieces = NULL, *result = NULL;
Guido van Rossumfb376de1998-04-10 22:47:27 +0000367
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000368 i = Py_ReprEnter((PyObject*)v);
369 if (i != 0) {
370 return i > 0 ? PyString_FromString("[...]") : NULL;
371 }
Tim Petersa7259592001-06-16 05:11:17 +0000372
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000373 if (Py_SIZE(v) == 0) {
374 result = PyString_FromString("[]");
375 goto Done;
376 }
Tim Petersa7259592001-06-16 05:11:17 +0000377
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000378 pieces = PyList_New(0);
379 if (pieces == NULL)
380 goto Done;
Tim Petersa7259592001-06-16 05:11:17 +0000381
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000382 /* Do repr() on each element. Note that this may mutate the list,
383 so must refetch the list size on each iteration. */
384 for (i = 0; i < Py_SIZE(v); ++i) {
385 int status;
386 if (Py_EnterRecursiveCall(" while getting the repr of a list"))
387 goto Done;
388 s = PyObject_Repr(v->ob_item[i]);
389 Py_LeaveRecursiveCall();
390 if (s == NULL)
391 goto Done;
392 status = PyList_Append(pieces, s);
393 Py_DECREF(s); /* append created a new ref */
394 if (status < 0)
395 goto Done;
396 }
Tim Petersa7259592001-06-16 05:11:17 +0000397
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000398 /* Add "[]" decorations to the first and last items. */
399 assert(PyList_GET_SIZE(pieces) > 0);
400 s = PyString_FromString("[");
401 if (s == NULL)
402 goto Done;
403 temp = PyList_GET_ITEM(pieces, 0);
404 PyString_ConcatAndDel(&s, temp);
405 PyList_SET_ITEM(pieces, 0, s);
406 if (s == NULL)
407 goto Done;
Tim Petersa7259592001-06-16 05:11:17 +0000408
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000409 s = PyString_FromString("]");
410 if (s == NULL)
411 goto Done;
412 temp = PyList_GET_ITEM(pieces, PyList_GET_SIZE(pieces) - 1);
413 PyString_ConcatAndDel(&temp, s);
414 PyList_SET_ITEM(pieces, PyList_GET_SIZE(pieces) - 1, temp);
415 if (temp == NULL)
416 goto Done;
Tim Petersa7259592001-06-16 05:11:17 +0000417
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000418 /* Paste them all together with ", " between. */
419 s = PyString_FromString(", ");
420 if (s == NULL)
421 goto Done;
422 result = _PyString_Join(s, pieces);
423 Py_DECREF(s);
Tim Petersa7259592001-06-16 05:11:17 +0000424
425Done:
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000426 Py_XDECREF(pieces);
427 Py_ReprLeave((PyObject *)v);
428 return result;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000429}
430
Martin v. Löwis18e16552006-02-15 17:27:45 +0000431static Py_ssize_t
Fred Drakea2f55112000-07-09 15:16:51 +0000432list_length(PyListObject *a)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000433{
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000434 return Py_SIZE(a);
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000435}
436
Jeremy Hylton37b1a262000-04-27 21:41:03 +0000437static int
Fred Drakea2f55112000-07-09 15:16:51 +0000438list_contains(PyListObject *a, PyObject *el)
Jeremy Hylton37b1a262000-04-27 21:41:03 +0000439{
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000440 Py_ssize_t i;
441 int cmp;
Jeremy Hylton37b1a262000-04-27 21:41:03 +0000442
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000443 for (i = 0, cmp = 0 ; cmp == 0 && i < Py_SIZE(a); ++i)
444 cmp = PyObject_RichCompareBool(el, PyList_GET_ITEM(a, i),
445 Py_EQ);
446 return cmp;
Jeremy Hylton37b1a262000-04-27 21:41:03 +0000447}
448
Guido van Rossumc0b618a1997-05-02 03:12:38 +0000449static PyObject *
Martin v. Löwis18e16552006-02-15 17:27:45 +0000450list_item(PyListObject *a, Py_ssize_t i)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000451{
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000452 if (i < 0 || i >= Py_SIZE(a)) {
453 if (indexerr == NULL) {
454 indexerr = PyString_FromString(
455 "list index out of range");
456 if (indexerr == NULL)
457 return NULL;
458 }
459 PyErr_SetObject(PyExc_IndexError, indexerr);
460 return NULL;
461 }
462 Py_INCREF(a->ob_item[i]);
463 return a->ob_item[i];
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000464}
465
Guido van Rossumc0b618a1997-05-02 03:12:38 +0000466static PyObject *
Martin v. Löwis18e16552006-02-15 17:27:45 +0000467list_slice(PyListObject *a, Py_ssize_t ilow, Py_ssize_t ihigh)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000468{
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000469 PyListObject *np;
470 PyObject **src, **dest;
471 Py_ssize_t i, len;
472 if (ilow < 0)
473 ilow = 0;
474 else if (ilow > Py_SIZE(a))
475 ilow = Py_SIZE(a);
476 if (ihigh < ilow)
477 ihigh = ilow;
478 else if (ihigh > Py_SIZE(a))
479 ihigh = Py_SIZE(a);
480 len = ihigh - ilow;
481 np = (PyListObject *) PyList_New(len);
482 if (np == NULL)
483 return NULL;
Raymond Hettinger99842b62004-03-08 05:56:15 +0000484
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000485 src = a->ob_item + ilow;
486 dest = np->ob_item;
487 for (i = 0; i < len; i++) {
488 PyObject *v = src[i];
489 Py_INCREF(v);
490 dest[i] = v;
491 }
492 return (PyObject *)np;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000493}
494
Guido van Rossumc0b618a1997-05-02 03:12:38 +0000495PyObject *
Martin v. Löwis18e16552006-02-15 17:27:45 +0000496PyList_GetSlice(PyObject *a, Py_ssize_t ilow, Py_ssize_t ihigh)
Guido van Rossum234f9421993-06-17 12:35:49 +0000497{
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000498 if (!PyList_Check(a)) {
499 PyErr_BadInternalCall();
500 return NULL;
501 }
502 return list_slice((PyListObject *)a, ilow, ihigh);
Guido van Rossum234f9421993-06-17 12:35:49 +0000503}
504
Guido van Rossumc0b618a1997-05-02 03:12:38 +0000505static PyObject *
Fred Drakea2f55112000-07-09 15:16:51 +0000506list_concat(PyListObject *a, PyObject *bb)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000507{
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000508 Py_ssize_t size;
509 Py_ssize_t i;
510 PyObject **src, **dest;
511 PyListObject *np;
512 if (!PyList_Check(bb)) {
513 PyErr_Format(PyExc_TypeError,
514 "can only concatenate list (not \"%.200s\") to list",
515 bb->ob_type->tp_name);
516 return NULL;
517 }
Guido van Rossumc0b618a1997-05-02 03:12:38 +0000518#define b ((PyListObject *)bb)
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000519 size = Py_SIZE(a) + Py_SIZE(b);
520 if (size < 0)
521 return PyErr_NoMemory();
522 np = (PyListObject *) PyList_New(size);
523 if (np == NULL) {
524 return NULL;
525 }
526 src = a->ob_item;
527 dest = np->ob_item;
528 for (i = 0; i < Py_SIZE(a); i++) {
529 PyObject *v = src[i];
530 Py_INCREF(v);
531 dest[i] = v;
532 }
533 src = b->ob_item;
534 dest = np->ob_item + Py_SIZE(a);
535 for (i = 0; i < Py_SIZE(b); i++) {
536 PyObject *v = src[i];
537 Py_INCREF(v);
538 dest[i] = v;
539 }
540 return (PyObject *)np;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000541#undef b
542}
543
Guido van Rossumc0b618a1997-05-02 03:12:38 +0000544static PyObject *
Martin v. Löwis18e16552006-02-15 17:27:45 +0000545list_repeat(PyListObject *a, Py_ssize_t n)
Guido van Rossumed98d481991-03-06 13:07:53 +0000546{
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000547 Py_ssize_t i, j;
548 Py_ssize_t size;
549 PyListObject *np;
550 PyObject **p, **items;
551 PyObject *elem;
552 if (n < 0)
553 n = 0;
Mark Dickinson4ac5d2c2011-09-19 19:23:55 +0100554 if (n > 0 && Py_SIZE(a) > PY_SSIZE_T_MAX / n)
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000555 return PyErr_NoMemory();
Mark Dickinson4ac5d2c2011-09-19 19:23:55 +0100556 size = Py_SIZE(a) * n;
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000557 if (size == 0)
558 return PyList_New(0);
559 np = (PyListObject *) PyList_New(size);
560 if (np == NULL)
561 return NULL;
Raymond Hettinger6624e682003-05-21 05:58:46 +0000562
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000563 items = np->ob_item;
564 if (Py_SIZE(a) == 1) {
565 elem = a->ob_item[0];
566 for (i = 0; i < n; i++) {
567 items[i] = elem;
568 Py_INCREF(elem);
569 }
570 return (PyObject *) np;
571 }
572 p = np->ob_item;
573 items = a->ob_item;
574 for (i = 0; i < n; i++) {
575 for (j = 0; j < Py_SIZE(a); j++) {
576 *p = items[j];
577 Py_INCREF(*p);
578 p++;
579 }
580 }
581 return (PyObject *) np;
Guido van Rossumed98d481991-03-06 13:07:53 +0000582}
583
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000584static int
Armin Rigo93677f02004-07-29 12:40:23 +0000585list_clear(PyListObject *a)
586{
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000587 Py_ssize_t i;
588 PyObject **item = a->ob_item;
589 if (item != NULL) {
590 /* Because XDECREF can recursively invoke operations on
591 this list, we make it empty first. */
592 i = Py_SIZE(a);
593 Py_SIZE(a) = 0;
594 a->ob_item = NULL;
595 a->allocated = 0;
596 while (--i >= 0) {
597 Py_XDECREF(item[i]);
598 }
599 PyMem_FREE(item);
600 }
601 /* Never fails; the return value can be ignored.
602 Note that there is no guarantee that the list is actually empty
603 at this point, because XDECREF may have populated it again! */
604 return 0;
Armin Rigo93677f02004-07-29 12:40:23 +0000605}
606
Tim Peters8fc4a912004-07-31 21:53:19 +0000607/* a[ilow:ihigh] = v if v != NULL.
608 * del a[ilow:ihigh] if v == NULL.
609 *
610 * Special speed gimmick: when v is NULL and ihigh - ilow <= 8, it's
611 * guaranteed the call cannot fail.
612 */
Armin Rigo93677f02004-07-29 12:40:23 +0000613static int
Martin v. Löwis18e16552006-02-15 17:27:45 +0000614list_ass_slice(PyListObject *a, Py_ssize_t ilow, Py_ssize_t ihigh, PyObject *v)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000615{
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000616 /* Because [X]DECREF can recursively invoke list operations on
617 this list, we must postpone all [X]DECREF activity until
618 after the list is back in its canonical shape. Therefore
619 we must allocate an additional array, 'recycle', into which
620 we temporarily copy the items that are deleted from the
621 list. :-( */
622 PyObject *recycle_on_stack[8];
623 PyObject **recycle = recycle_on_stack; /* will allocate more if needed */
624 PyObject **item;
625 PyObject **vitem = NULL;
626 PyObject *v_as_SF = NULL; /* PySequence_Fast(v) */
627 Py_ssize_t n; /* # of elements in replacement list */
628 Py_ssize_t norig; /* # of elements in list getting replaced */
629 Py_ssize_t d; /* Change in size */
630 Py_ssize_t k;
631 size_t s;
632 int result = -1; /* guilty until proved innocent */
Guido van Rossumc0b618a1997-05-02 03:12:38 +0000633#define b ((PyListObject *)v)
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000634 if (v == NULL)
635 n = 0;
636 else {
637 if (a == b) {
638 /* Special case "a[i:j] = a" -- copy b first */
639 v = list_slice(b, 0, Py_SIZE(b));
640 if (v == NULL)
641 return result;
642 result = list_ass_slice(a, ilow, ihigh, v);
643 Py_DECREF(v);
644 return result;
645 }
646 v_as_SF = PySequence_Fast(v, "can only assign an iterable");
647 if(v_as_SF == NULL)
648 goto Error;
649 n = PySequence_Fast_GET_SIZE(v_as_SF);
650 vitem = PySequence_Fast_ITEMS(v_as_SF);
651 }
652 if (ilow < 0)
653 ilow = 0;
654 else if (ilow > Py_SIZE(a))
655 ilow = Py_SIZE(a);
Tim Peters8d9eb102004-07-31 02:24:20 +0000656
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000657 if (ihigh < ilow)
658 ihigh = ilow;
659 else if (ihigh > Py_SIZE(a))
660 ihigh = Py_SIZE(a);
Armin Rigo93677f02004-07-29 12:40:23 +0000661
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000662 norig = ihigh - ilow;
663 assert(norig >= 0);
664 d = n - norig;
665 if (Py_SIZE(a) + d == 0) {
666 Py_XDECREF(v_as_SF);
667 return list_clear(a);
668 }
669 item = a->ob_item;
670 /* recycle the items that we are about to remove */
671 s = norig * sizeof(PyObject *);
672 if (s > sizeof(recycle_on_stack)) {
673 recycle = (PyObject **)PyMem_MALLOC(s);
674 if (recycle == NULL) {
675 PyErr_NoMemory();
676 goto Error;
677 }
678 }
679 memcpy(recycle, &item[ilow], s);
Tim Peters8d9eb102004-07-31 02:24:20 +0000680
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000681 if (d < 0) { /* Delete -d items */
682 memmove(&item[ihigh+d], &item[ihigh],
683 (Py_SIZE(a) - ihigh)*sizeof(PyObject *));
684 list_resize(a, Py_SIZE(a) + d);
685 item = a->ob_item;
686 }
687 else if (d > 0) { /* Insert d items */
688 k = Py_SIZE(a);
689 if (list_resize(a, k+d) < 0)
690 goto Error;
691 item = a->ob_item;
692 memmove(&item[ihigh+d], &item[ihigh],
693 (k - ihigh)*sizeof(PyObject *));
694 }
695 for (k = 0; k < n; k++, ilow++) {
696 PyObject *w = vitem[k];
697 Py_XINCREF(w);
698 item[ilow] = w;
699 }
700 for (k = norig - 1; k >= 0; --k)
701 Py_XDECREF(recycle[k]);
702 result = 0;
Tim Peters8d9eb102004-07-31 02:24:20 +0000703 Error:
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000704 if (recycle != recycle_on_stack)
705 PyMem_FREE(recycle);
706 Py_XDECREF(v_as_SF);
707 return result;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000708#undef b
709}
710
Guido van Rossum234f9421993-06-17 12:35:49 +0000711int
Martin v. Löwis18e16552006-02-15 17:27:45 +0000712PyList_SetSlice(PyObject *a, Py_ssize_t ilow, Py_ssize_t ihigh, PyObject *v)
Guido van Rossum234f9421993-06-17 12:35:49 +0000713{
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000714 if (!PyList_Check(a)) {
715 PyErr_BadInternalCall();
716 return -1;
717 }
718 return list_ass_slice((PyListObject *)a, ilow, ihigh, v);
Guido van Rossum234f9421993-06-17 12:35:49 +0000719}
720
Thomas Wouterse289e0b2000-08-24 20:08:19 +0000721static PyObject *
Martin v. Löwis18e16552006-02-15 17:27:45 +0000722list_inplace_repeat(PyListObject *self, Py_ssize_t n)
Thomas Wouterse289e0b2000-08-24 20:08:19 +0000723{
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000724 PyObject **items;
725 Py_ssize_t size, i, j, p;
Thomas Wouterse289e0b2000-08-24 20:08:19 +0000726
727
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000728 size = PyList_GET_SIZE(self);
729 if (size == 0 || n == 1) {
730 Py_INCREF(self);
731 return (PyObject *)self;
732 }
Thomas Wouterse289e0b2000-08-24 20:08:19 +0000733
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000734 if (n < 1) {
735 (void)list_clear(self);
736 Py_INCREF(self);
737 return (PyObject *)self;
738 }
Thomas Wouterse289e0b2000-08-24 20:08:19 +0000739
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000740 if (size > PY_SSIZE_T_MAX / n) {
741 return PyErr_NoMemory();
742 }
Guido van Rossum8d5cf4e2008-01-25 19:50:26 +0000743
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000744 if (list_resize(self, size*n) == -1)
745 return NULL;
Raymond Hettinger4bb95402004-02-13 11:36:39 +0000746
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000747 p = size;
748 items = self->ob_item;
749 for (i = 1; i < n; i++) { /* Start counting at 1, not 0 */
750 for (j = 0; j < size; j++) {
751 PyObject *o = items[j];
752 Py_INCREF(o);
753 items[p++] = o;
754 }
755 }
756 Py_INCREF(self);
757 return (PyObject *)self;
Thomas Wouterse289e0b2000-08-24 20:08:19 +0000758}
759
Guido van Rossum4a450d01991-04-03 19:05:18 +0000760static int
Martin v. Löwis18e16552006-02-15 17:27:45 +0000761list_ass_item(PyListObject *a, Py_ssize_t i, PyObject *v)
Guido van Rossum4a450d01991-04-03 19:05:18 +0000762{
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000763 PyObject *old_value;
764 if (i < 0 || i >= Py_SIZE(a)) {
765 PyErr_SetString(PyExc_IndexError,
766 "list assignment index out of range");
767 return -1;
768 }
769 if (v == NULL)
770 return list_ass_slice(a, i, i+1, v);
771 Py_INCREF(v);
772 old_value = a->ob_item[i];
773 a->ob_item[i] = v;
774 Py_DECREF(old_value);
775 return 0;
Guido van Rossum4a450d01991-04-03 19:05:18 +0000776}
777
Guido van Rossumc0b618a1997-05-02 03:12:38 +0000778static PyObject *
Fred Drakea2f55112000-07-09 15:16:51 +0000779listinsert(PyListObject *self, PyObject *args)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000780{
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000781 Py_ssize_t i;
782 PyObject *v;
783 if (!PyArg_ParseTuple(args, "nO:insert", &i, &v))
784 return NULL;
785 if (ins1(self, i, v) == 0)
786 Py_RETURN_NONE;
787 return NULL;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000788}
789
Guido van Rossumc0b618a1997-05-02 03:12:38 +0000790static PyObject *
Martin v. Löwise3eb1f22001-08-16 13:15:00 +0000791listappend(PyListObject *self, PyObject *v)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000792{
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000793 if (app1(self, v) == 0)
794 Py_RETURN_NONE;
795 return NULL;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000796}
797
Barry Warsawdedf6d61998-10-09 16:37:25 +0000798static PyObject *
Martin v. Löwise3eb1f22001-08-16 13:15:00 +0000799listextend(PyListObject *self, PyObject *b)
Thomas Wouterse289e0b2000-08-24 20:08:19 +0000800{
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000801 PyObject *it; /* iter(v) */
802 Py_ssize_t m; /* size of self */
803 Py_ssize_t n; /* guess for size of b */
804 Py_ssize_t mn; /* m + n */
805 Py_ssize_t i;
806 PyObject *(*iternext)(PyObject *);
Thomas Wouterse289e0b2000-08-24 20:08:19 +0000807
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000808 /* Special cases:
809 1) lists and tuples which can use PySequence_Fast ops
810 2) extending self to self requires making a copy first
811 */
812 if (PyList_CheckExact(b) || PyTuple_CheckExact(b) || (PyObject *)self == b) {
813 PyObject **src, **dest;
814 b = PySequence_Fast(b, "argument must be iterable");
815 if (!b)
816 return NULL;
817 n = PySequence_Fast_GET_SIZE(b);
818 if (n == 0) {
819 /* short circuit when b is empty */
820 Py_DECREF(b);
821 Py_RETURN_NONE;
822 }
823 m = Py_SIZE(self);
824 if (list_resize(self, m + n) == -1) {
825 Py_DECREF(b);
826 return NULL;
827 }
828 /* note that we may still have self == b here for the
829 * situation a.extend(a), but the following code works
830 * in that case too. Just make sure to resize self
831 * before calling PySequence_Fast_ITEMS.
832 */
833 /* populate the end of self with b's items */
834 src = PySequence_Fast_ITEMS(b);
835 dest = self->ob_item + m;
836 for (i = 0; i < n; i++) {
837 PyObject *o = src[i];
838 Py_INCREF(o);
839 dest[i] = o;
840 }
841 Py_DECREF(b);
842 Py_RETURN_NONE;
843 }
Raymond Hettinger90a39bf2004-02-15 03:57:00 +0000844
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000845 it = PyObject_GetIter(b);
846 if (it == NULL)
847 return NULL;
848 iternext = *it->ob_type->tp_iternext;
Thomas Wouterse289e0b2000-08-24 20:08:19 +0000849
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000850 /* Guess a result list size. */
851 n = _PyObject_LengthHint(b, 8);
852 if (n == -1) {
853 Py_DECREF(it);
854 return NULL;
855 }
856 m = Py_SIZE(self);
857 mn = m + n;
858 if (mn >= m) {
859 /* Make room. */
860 if (list_resize(self, mn) == -1)
861 goto error;
862 /* Make the list sane again. */
863 Py_SIZE(self) = m;
864 }
865 /* Else m + n overflowed; on the chance that n lied, and there really
866 * is enough room, ignore it. If n was telling the truth, we'll
867 * eventually run out of memory during the loop.
868 */
Thomas Wouterse289e0b2000-08-24 20:08:19 +0000869
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000870 /* Run iterator to exhaustion. */
871 for (;;) {
872 PyObject *item = iternext(it);
873 if (item == NULL) {
874 if (PyErr_Occurred()) {
875 if (PyErr_ExceptionMatches(PyExc_StopIteration))
876 PyErr_Clear();
877 else
878 goto error;
879 }
880 break;
881 }
882 if (Py_SIZE(self) < self->allocated) {
883 /* steals ref */
884 PyList_SET_ITEM(self, Py_SIZE(self), item);
885 ++Py_SIZE(self);
886 }
887 else {
888 int status = app1(self, item);
889 Py_DECREF(item); /* append creates a new ref */
890 if (status < 0)
891 goto error;
892 }
893 }
Raymond Hettinger90a39bf2004-02-15 03:57:00 +0000894
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000895 /* Cut back result list if initial guess was too large. */
896 if (Py_SIZE(self) < self->allocated)
897 list_resize(self, Py_SIZE(self)); /* shrinking can't fail */
Raymond Hettingeraa241e02004-09-26 19:24:20 +0000898
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000899 Py_DECREF(it);
900 Py_RETURN_NONE;
Raymond Hettinger90a39bf2004-02-15 03:57:00 +0000901
902 error:
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000903 Py_DECREF(it);
904 return NULL;
Thomas Wouterse289e0b2000-08-24 20:08:19 +0000905}
906
Raymond Hettinger8ca92ae2004-03-11 09:13:12 +0000907PyObject *
908_PyList_Extend(PyListObject *self, PyObject *b)
909{
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000910 return listextend(self, b);
Raymond Hettinger8ca92ae2004-03-11 09:13:12 +0000911}
912
Thomas Wouterse289e0b2000-08-24 20:08:19 +0000913static PyObject *
Raymond Hettinger97bc6182004-03-11 07:34:19 +0000914list_inplace_concat(PyListObject *self, PyObject *other)
915{
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000916 PyObject *result;
Raymond Hettinger97bc6182004-03-11 07:34:19 +0000917
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000918 result = listextend(self, other);
919 if (result == NULL)
920 return result;
921 Py_DECREF(result);
922 Py_INCREF(self);
923 return (PyObject *)self;
Raymond Hettinger97bc6182004-03-11 07:34:19 +0000924}
925
926static PyObject *
Fred Drakea2f55112000-07-09 15:16:51 +0000927listpop(PyListObject *self, PyObject *args)
Guido van Rossum3dd7f3f1998-06-30 15:36:32 +0000928{
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000929 Py_ssize_t i = -1;
930 PyObject *v;
931 int status;
Raymond Hettinger9eb86b32004-02-17 11:36:16 +0000932
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000933 if (!PyArg_ParseTuple(args, "|n:pop", &i))
934 return NULL;
Armin Rigo7ccbca92006-10-04 12:17:45 +0000935
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000936 if (Py_SIZE(self) == 0) {
937 /* Special-case most common failure cause */
938 PyErr_SetString(PyExc_IndexError, "pop from empty list");
939 return NULL;
940 }
941 if (i < 0)
942 i += Py_SIZE(self);
943 if (i < 0 || i >= Py_SIZE(self)) {
944 PyErr_SetString(PyExc_IndexError, "pop index out of range");
945 return NULL;
946 }
947 v = self->ob_item[i];
948 if (i == Py_SIZE(self) - 1) {
949 status = list_resize(self, Py_SIZE(self) - 1);
950 assert(status >= 0);
951 return v; /* and v now owns the reference the list had */
952 }
953 Py_INCREF(v);
954 status = list_ass_slice(self, i, i+1, (PyObject *)NULL);
955 assert(status >= 0);
956 /* Use status, so that in a release build compilers don't
957 * complain about the unused name.
958 */
959 (void) status;
Brett Cannon651dd522004-08-08 21:21:18 +0000960
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000961 return v;
Guido van Rossum3dd7f3f1998-06-30 15:36:32 +0000962}
963
Tim Peters8e2e7ca2002-07-19 02:33:08 +0000964/* Reverse a slice of a list in place, from lo up to (exclusive) hi. */
965static void
966reverse_slice(PyObject **lo, PyObject **hi)
967{
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000968 assert(lo && hi);
Tim Peters8e2e7ca2002-07-19 02:33:08 +0000969
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000970 --hi;
971 while (lo < hi) {
972 PyObject *t = *lo;
973 *lo = *hi;
974 *hi = t;
975 ++lo;
976 --hi;
977 }
Tim Peters8e2e7ca2002-07-19 02:33:08 +0000978}
979
Tim Petersa64dc242002-08-01 02:13:36 +0000980/* Lots of code for an adaptive, stable, natural mergesort. There are many
981 * pieces to this algorithm; read listsort.txt for overviews and details.
982 */
Guido van Rossum3f236de1996-12-10 23:55:39 +0000983
Guido van Rossum3f236de1996-12-10 23:55:39 +0000984/* Comparison function. Takes care of calling a user-supplied
Tim Peters66860f62002-08-04 17:47:26 +0000985 * comparison function (any callable Python object), which must not be
986 * NULL (use the ISLT macro if you don't know, or call PyObject_RichCompareBool
987 * with Py_LT if you know it's NULL).
Tim Petersa64dc242002-08-01 02:13:36 +0000988 * Returns -1 on error, 1 if x < y, 0 if x >= y.
989 */
Guido van Rossum3f236de1996-12-10 23:55:39 +0000990static int
Tim Petersa8c974c2002-07-19 03:30:57 +0000991islt(PyObject *x, PyObject *y, PyObject *compare)
Guido van Rossum3f236de1996-12-10 23:55:39 +0000992{
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000993 PyObject *res;
994 PyObject *args;
995 Py_ssize_t i;
Guido van Rossum3f236de1996-12-10 23:55:39 +0000996
Antoine Pitrouc83ea132010-05-09 14:46:46 +0000997 assert(compare != NULL);
998 /* Call the user's comparison function and translate the 3-way
999 * result into true or false (or error).
1000 */
1001 args = PyTuple_New(2);
1002 if (args == NULL)
1003 return -1;
1004 Py_INCREF(x);
1005 Py_INCREF(y);
1006 PyTuple_SET_ITEM(args, 0, x);
1007 PyTuple_SET_ITEM(args, 1, y);
1008 res = PyObject_Call(compare, args, NULL);
1009 Py_DECREF(args);
1010 if (res == NULL)
1011 return -1;
1012 if (!PyInt_Check(res)) {
1013 PyErr_Format(PyExc_TypeError,
1014 "comparison function must return int, not %.200s",
1015 res->ob_type->tp_name);
1016 Py_DECREF(res);
1017 return -1;
1018 }
1019 i = PyInt_AsLong(res);
1020 Py_DECREF(res);
1021 return i < 0;
Guido van Rossum3f236de1996-12-10 23:55:39 +00001022}
1023
Tim Peters66860f62002-08-04 17:47:26 +00001024/* If COMPARE is NULL, calls PyObject_RichCompareBool with Py_LT, else calls
1025 * islt. This avoids a layer of function call in the usual case, and
1026 * sorting does many comparisons.
1027 * Returns -1 on error, 1 if x < y, 0 if x >= y.
1028 */
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001029#define ISLT(X, Y, COMPARE) ((COMPARE) == NULL ? \
1030 PyObject_RichCompareBool(X, Y, Py_LT) : \
1031 islt(X, Y, COMPARE))
Tim Peters66860f62002-08-04 17:47:26 +00001032
1033/* Compare X to Y via "<". Goto "fail" if the comparison raises an
Tim Petersa8c974c2002-07-19 03:30:57 +00001034 error. Else "k" is set to true iff X<Y, and an "if (k)" block is
1035 started. It makes more sense in context <wink>. X and Y are PyObject*s.
1036*/
Tim Peters66860f62002-08-04 17:47:26 +00001037#define IFLT(X, Y) if ((k = ISLT(X, Y, compare)) < 0) goto fail; \
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001038 if (k)
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001039
1040/* binarysort is the best method for sorting small arrays: it does
1041 few compares, but can do data movement quadratic in the number of
1042 elements.
Guido van Rossum42812581998-06-17 14:15:44 +00001043 [lo, hi) is a contiguous slice of a list, and is sorted via
Tim Petersa8c974c2002-07-19 03:30:57 +00001044 binary insertion. This sort is stable.
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001045 On entry, must have lo <= start <= hi, and that [lo, start) is already
1046 sorted (pass start == lo if you don't know!).
Tim Petersa8c974c2002-07-19 03:30:57 +00001047 If islt() complains return -1, else 0.
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001048 Even in case of error, the output slice will be some permutation of
1049 the input (nothing is lost or duplicated).
1050*/
Guido van Rossum3f236de1996-12-10 23:55:39 +00001051static int
Fred Drakea2f55112000-07-09 15:16:51 +00001052binarysort(PyObject **lo, PyObject **hi, PyObject **start, PyObject *compare)
1053 /* compare -- comparison function object, or NULL for default */
Guido van Rossum3f236de1996-12-10 23:55:39 +00001054{
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001055 register Py_ssize_t k;
1056 register PyObject **l, **p, **r;
1057 register PyObject *pivot;
Guido van Rossum3f236de1996-12-10 23:55:39 +00001058
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001059 assert(lo <= start && start <= hi);
1060 /* assert [lo, start) is sorted */
1061 if (lo == start)
1062 ++start;
1063 for (; start < hi; ++start) {
1064 /* set l to where *start belongs */
1065 l = lo;
1066 r = start;
1067 pivot = *r;
1068 /* Invariants:
1069 * pivot >= all in [lo, l).
1070 * pivot < all in [r, start).
1071 * The second is vacuously true at the start.
1072 */
1073 assert(l < r);
1074 do {
1075 p = l + ((r - l) >> 1);
1076 IFLT(pivot, *p)
1077 r = p;
1078 else
1079 l = p+1;
1080 } while (l < r);
1081 assert(l == r);
1082 /* The invariants still hold, so pivot >= all in [lo, l) and
1083 pivot < all in [l, start), so pivot belongs at l. Note
1084 that if there are elements equal to pivot, l points to the
1085 first slot after them -- that's why this sort is stable.
1086 Slide over to make room.
1087 Caution: using memmove is much slower under MSVC 5;
1088 we're not usually moving many slots. */
1089 for (p = start; p > l; --p)
1090 *p = *(p-1);
1091 *l = pivot;
1092 }
1093 return 0;
Guido van Rossuma119c0d1998-05-29 17:56:32 +00001094
1095 fail:
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001096 return -1;
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001097}
1098
Tim Petersa64dc242002-08-01 02:13:36 +00001099/*
1100Return the length of the run beginning at lo, in the slice [lo, hi). lo < hi
1101is required on entry. "A run" is the longest ascending sequence, with
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001102
Tim Petersa64dc242002-08-01 02:13:36 +00001103 lo[0] <= lo[1] <= lo[2] <= ...
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001104
Tim Petersa64dc242002-08-01 02:13:36 +00001105or the longest descending sequence, with
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001106
Tim Petersa64dc242002-08-01 02:13:36 +00001107 lo[0] > lo[1] > lo[2] > ...
Tim Peters3b01a122002-07-19 02:35:45 +00001108
Tim Petersa64dc242002-08-01 02:13:36 +00001109Boolean *descending is set to 0 in the former case, or to 1 in the latter.
1110For its intended use in a stable mergesort, the strictness of the defn of
1111"descending" is needed so that the caller can safely reverse a descending
1112sequence without violating stability (strict > ensures there are no equal
1113elements to get out of order).
1114
1115Returns -1 in case of error.
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001116*/
Martin v. Löwis18e16552006-02-15 17:27:45 +00001117static Py_ssize_t
Tim Petersa64dc242002-08-01 02:13:36 +00001118count_run(PyObject **lo, PyObject **hi, PyObject *compare, int *descending)
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001119{
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001120 Py_ssize_t k;
1121 Py_ssize_t n;
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001122
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001123 assert(lo < hi);
1124 *descending = 0;
1125 ++lo;
1126 if (lo == hi)
1127 return 1;
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001128
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001129 n = 2;
1130 IFLT(*lo, *(lo-1)) {
1131 *descending = 1;
1132 for (lo = lo+1; lo < hi; ++lo, ++n) {
1133 IFLT(*lo, *(lo-1))
1134 ;
1135 else
1136 break;
1137 }
1138 }
1139 else {
1140 for (lo = lo+1; lo < hi; ++lo, ++n) {
1141 IFLT(*lo, *(lo-1))
1142 break;
1143 }
1144 }
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001145
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001146 return n;
Tim Petersa64dc242002-08-01 02:13:36 +00001147fail:
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001148 return -1;
Tim Petersa64dc242002-08-01 02:13:36 +00001149}
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001150
Tim Petersa64dc242002-08-01 02:13:36 +00001151/*
1152Locate the proper position of key in a sorted vector; if the vector contains
1153an element equal to key, return the position immediately to the left of
1154the leftmost equal element. [gallop_right() does the same except returns
1155the position to the right of the rightmost equal element (if any).]
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001156
Tim Petersa64dc242002-08-01 02:13:36 +00001157"a" is a sorted vector with n elements, starting at a[0]. n must be > 0.
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001158
Tim Petersa64dc242002-08-01 02:13:36 +00001159"hint" is an index at which to begin the search, 0 <= hint < n. The closer
1160hint is to the final result, the faster this runs.
1161
1162The return value is the int k in 0..n such that
1163
1164 a[k-1] < key <= a[k]
1165
1166pretending that *(a-1) is minus infinity and a[n] is plus infinity. IOW,
1167key belongs at index k; or, IOW, the first k elements of a should precede
1168key, and the last n-k should follow key.
1169
1170Returns -1 on error. See listsort.txt for info on the method.
1171*/
Martin v. Löwis18e16552006-02-15 17:27:45 +00001172static Py_ssize_t
1173gallop_left(PyObject *key, PyObject **a, Py_ssize_t n, Py_ssize_t hint, PyObject *compare)
Tim Petersa64dc242002-08-01 02:13:36 +00001174{
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001175 Py_ssize_t ofs;
1176 Py_ssize_t lastofs;
1177 Py_ssize_t k;
Tim Petersa64dc242002-08-01 02:13:36 +00001178
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001179 assert(key && a && n > 0 && hint >= 0 && hint < n);
Tim Petersa64dc242002-08-01 02:13:36 +00001180
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001181 a += hint;
1182 lastofs = 0;
1183 ofs = 1;
1184 IFLT(*a, key) {
1185 /* a[hint] < key -- gallop right, until
1186 * a[hint + lastofs] < key <= a[hint + ofs]
1187 */
1188 const Py_ssize_t maxofs = n - hint; /* &a[n-1] is highest */
1189 while (ofs < maxofs) {
1190 IFLT(a[ofs], key) {
1191 lastofs = ofs;
1192 ofs = (ofs << 1) + 1;
1193 if (ofs <= 0) /* int overflow */
1194 ofs = maxofs;
1195 }
1196 else /* key <= a[hint + ofs] */
1197 break;
1198 }
1199 if (ofs > maxofs)
1200 ofs = maxofs;
1201 /* Translate back to offsets relative to &a[0]. */
1202 lastofs += hint;
1203 ofs += hint;
1204 }
1205 else {
1206 /* key <= a[hint] -- gallop left, until
1207 * a[hint - ofs] < key <= a[hint - lastofs]
1208 */
1209 const Py_ssize_t maxofs = hint + 1; /* &a[0] is lowest */
1210 while (ofs < maxofs) {
1211 IFLT(*(a-ofs), key)
1212 break;
1213 /* key <= a[hint - ofs] */
1214 lastofs = ofs;
1215 ofs = (ofs << 1) + 1;
1216 if (ofs <= 0) /* int overflow */
1217 ofs = maxofs;
1218 }
1219 if (ofs > maxofs)
1220 ofs = maxofs;
1221 /* Translate back to positive offsets relative to &a[0]. */
1222 k = lastofs;
1223 lastofs = hint - ofs;
1224 ofs = hint - k;
1225 }
1226 a -= hint;
Tim Petersa64dc242002-08-01 02:13:36 +00001227
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001228 assert(-1 <= lastofs && lastofs < ofs && ofs <= n);
1229 /* Now a[lastofs] < key <= a[ofs], so key belongs somewhere to the
1230 * right of lastofs but no farther right than ofs. Do a binary
1231 * search, with invariant a[lastofs-1] < key <= a[ofs].
1232 */
1233 ++lastofs;
1234 while (lastofs < ofs) {
1235 Py_ssize_t m = lastofs + ((ofs - lastofs) >> 1);
Tim Petersa64dc242002-08-01 02:13:36 +00001236
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001237 IFLT(a[m], key)
1238 lastofs = m+1; /* a[m] < key */
1239 else
1240 ofs = m; /* key <= a[m] */
1241 }
1242 assert(lastofs == ofs); /* so a[ofs-1] < key <= a[ofs] */
1243 return ofs;
Tim Petersa64dc242002-08-01 02:13:36 +00001244
1245fail:
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001246 return -1;
Tim Petersa64dc242002-08-01 02:13:36 +00001247}
1248
1249/*
1250Exactly like gallop_left(), except that if key already exists in a[0:n],
1251finds the position immediately to the right of the rightmost equal value.
1252
1253The return value is the int k in 0..n such that
1254
1255 a[k-1] <= key < a[k]
1256
1257or -1 if error.
1258
1259The code duplication is massive, but this is enough different given that
1260we're sticking to "<" comparisons that it's much harder to follow if
1261written as one routine with yet another "left or right?" flag.
1262*/
Martin v. Löwis18e16552006-02-15 17:27:45 +00001263static Py_ssize_t
1264gallop_right(PyObject *key, PyObject **a, Py_ssize_t n, Py_ssize_t hint, PyObject *compare)
Tim Petersa64dc242002-08-01 02:13:36 +00001265{
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001266 Py_ssize_t ofs;
1267 Py_ssize_t lastofs;
1268 Py_ssize_t k;
Tim Petersa64dc242002-08-01 02:13:36 +00001269
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001270 assert(key && a && n > 0 && hint >= 0 && hint < n);
Tim Petersa64dc242002-08-01 02:13:36 +00001271
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001272 a += hint;
1273 lastofs = 0;
1274 ofs = 1;
1275 IFLT(key, *a) {
1276 /* key < a[hint] -- gallop left, until
1277 * a[hint - ofs] <= key < a[hint - lastofs]
1278 */
1279 const Py_ssize_t maxofs = hint + 1; /* &a[0] is lowest */
1280 while (ofs < maxofs) {
1281 IFLT(key, *(a-ofs)) {
1282 lastofs = ofs;
1283 ofs = (ofs << 1) + 1;
1284 if (ofs <= 0) /* int overflow */
1285 ofs = maxofs;
1286 }
1287 else /* a[hint - ofs] <= key */
1288 break;
1289 }
1290 if (ofs > maxofs)
1291 ofs = maxofs;
1292 /* Translate back to positive offsets relative to &a[0]. */
1293 k = lastofs;
1294 lastofs = hint - ofs;
1295 ofs = hint - k;
1296 }
1297 else {
1298 /* a[hint] <= key -- gallop right, until
1299 * a[hint + lastofs] <= key < a[hint + ofs]
1300 */
1301 const Py_ssize_t maxofs = n - hint; /* &a[n-1] is highest */
1302 while (ofs < maxofs) {
1303 IFLT(key, a[ofs])
1304 break;
1305 /* a[hint + ofs] <= key */
1306 lastofs = ofs;
1307 ofs = (ofs << 1) + 1;
1308 if (ofs <= 0) /* int overflow */
1309 ofs = maxofs;
1310 }
1311 if (ofs > maxofs)
1312 ofs = maxofs;
1313 /* Translate back to offsets relative to &a[0]. */
1314 lastofs += hint;
1315 ofs += hint;
1316 }
1317 a -= hint;
Tim Petersa64dc242002-08-01 02:13:36 +00001318
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001319 assert(-1 <= lastofs && lastofs < ofs && ofs <= n);
1320 /* Now a[lastofs] <= key < a[ofs], so key belongs somewhere to the
1321 * right of lastofs but no farther right than ofs. Do a binary
1322 * search, with invariant a[lastofs-1] <= key < a[ofs].
1323 */
1324 ++lastofs;
1325 while (lastofs < ofs) {
1326 Py_ssize_t m = lastofs + ((ofs - lastofs) >> 1);
Tim Petersa64dc242002-08-01 02:13:36 +00001327
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001328 IFLT(key, a[m])
1329 ofs = m; /* key < a[m] */
1330 else
1331 lastofs = m+1; /* a[m] <= key */
1332 }
1333 assert(lastofs == ofs); /* so a[ofs-1] <= key < a[ofs] */
1334 return ofs;
Tim Petersa64dc242002-08-01 02:13:36 +00001335
1336fail:
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001337 return -1;
Tim Petersa64dc242002-08-01 02:13:36 +00001338}
1339
1340/* The maximum number of entries in a MergeState's pending-runs stack.
1341 * This is enough to sort arrays of size up to about
1342 * 32 * phi ** MAX_MERGE_PENDING
1343 * where phi ~= 1.618. 85 is ridiculouslylarge enough, good for an array
1344 * with 2**64 elements.
1345 */
1346#define MAX_MERGE_PENDING 85
1347
Tim Peterse05f65a2002-08-10 05:21:15 +00001348/* When we get into galloping mode, we stay there until both runs win less
1349 * often than MIN_GALLOP consecutive times. See listsort.txt for more info.
Tim Petersa64dc242002-08-01 02:13:36 +00001350 */
Tim Peterse05f65a2002-08-10 05:21:15 +00001351#define MIN_GALLOP 7
Tim Petersa64dc242002-08-01 02:13:36 +00001352
1353/* Avoid malloc for small temp arrays. */
1354#define MERGESTATE_TEMP_SIZE 256
1355
1356/* One MergeState exists on the stack per invocation of mergesort. It's just
1357 * a convenient way to pass state around among the helper functions.
1358 */
Tim Peterse05f65a2002-08-10 05:21:15 +00001359struct s_slice {
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001360 PyObject **base;
1361 Py_ssize_t len;
Tim Peterse05f65a2002-08-10 05:21:15 +00001362};
1363
Tim Petersa64dc242002-08-01 02:13:36 +00001364typedef struct s_MergeState {
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001365 /* The user-supplied comparison function. or NULL if none given. */
1366 PyObject *compare;
Tim Petersa64dc242002-08-01 02:13:36 +00001367
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001368 /* This controls when we get *into* galloping mode. It's initialized
1369 * to MIN_GALLOP. merge_lo and merge_hi tend to nudge it higher for
1370 * random data, and lower for highly structured data.
1371 */
1372 Py_ssize_t min_gallop;
Tim Peterse05f65a2002-08-10 05:21:15 +00001373
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001374 /* 'a' is temp storage to help with merges. It contains room for
1375 * alloced entries.
1376 */
1377 PyObject **a; /* may point to temparray below */
1378 Py_ssize_t alloced;
Tim Petersa64dc242002-08-01 02:13:36 +00001379
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001380 /* A stack of n pending runs yet to be merged. Run #i starts at
1381 * address base[i] and extends for len[i] elements. It's always
1382 * true (so long as the indices are in bounds) that
1383 *
1384 * pending[i].base + pending[i].len == pending[i+1].base
1385 *
1386 * so we could cut the storage for this, but it's a minor amount,
1387 * and keeping all the info explicit simplifies the code.
1388 */
1389 int n;
1390 struct s_slice pending[MAX_MERGE_PENDING];
Tim Petersa64dc242002-08-01 02:13:36 +00001391
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001392 /* 'a' points to this when possible, rather than muck with malloc. */
1393 PyObject *temparray[MERGESTATE_TEMP_SIZE];
Tim Petersa64dc242002-08-01 02:13:36 +00001394} MergeState;
1395
1396/* Conceptually a MergeState's constructor. */
1397static void
1398merge_init(MergeState *ms, PyObject *compare)
1399{
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001400 assert(ms != NULL);
1401 ms->compare = compare;
1402 ms->a = ms->temparray;
1403 ms->alloced = MERGESTATE_TEMP_SIZE;
1404 ms->n = 0;
1405 ms->min_gallop = MIN_GALLOP;
Tim Petersa64dc242002-08-01 02:13:36 +00001406}
1407
1408/* Free all the temp memory owned by the MergeState. This must be called
1409 * when you're done with a MergeState, and may be called before then if
1410 * you want to free the temp memory early.
1411 */
1412static void
1413merge_freemem(MergeState *ms)
1414{
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001415 assert(ms != NULL);
1416 if (ms->a != ms->temparray)
1417 PyMem_Free(ms->a);
1418 ms->a = ms->temparray;
1419 ms->alloced = MERGESTATE_TEMP_SIZE;
Tim Petersa64dc242002-08-01 02:13:36 +00001420}
1421
1422/* Ensure enough temp memory for 'need' array slots is available.
1423 * Returns 0 on success and -1 if the memory can't be gotten.
1424 */
1425static int
Martin v. Löwis18e16552006-02-15 17:27:45 +00001426merge_getmem(MergeState *ms, Py_ssize_t need)
Tim Petersa64dc242002-08-01 02:13:36 +00001427{
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001428 assert(ms != NULL);
1429 if (need <= ms->alloced)
1430 return 0;
1431 /* Don't realloc! That can cost cycles to copy the old data, but
1432 * we don't care what's in the block.
1433 */
1434 merge_freemem(ms);
1435 if ((size_t)need > PY_SSIZE_T_MAX / sizeof(PyObject*)) {
1436 PyErr_NoMemory();
1437 return -1;
1438 }
1439 ms->a = (PyObject **)PyMem_Malloc(need * sizeof(PyObject*));
1440 if (ms->a) {
1441 ms->alloced = need;
1442 return 0;
1443 }
1444 PyErr_NoMemory();
1445 merge_freemem(ms); /* reset to sane state */
1446 return -1;
Tim Petersa64dc242002-08-01 02:13:36 +00001447}
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001448#define MERGE_GETMEM(MS, NEED) ((NEED) <= (MS)->alloced ? 0 : \
1449 merge_getmem(MS, NEED))
Tim Petersa64dc242002-08-01 02:13:36 +00001450
1451/* Merge the na elements starting at pa with the nb elements starting at pb
1452 * in a stable way, in-place. na and nb must be > 0, and pa + na == pb.
1453 * Must also have that *pb < *pa, that pa[na-1] belongs at the end of the
1454 * merge, and should have na <= nb. See listsort.txt for more info.
1455 * Return 0 if successful, -1 if error.
1456 */
Martin v. Löwis18e16552006-02-15 17:27:45 +00001457static Py_ssize_t
1458merge_lo(MergeState *ms, PyObject **pa, Py_ssize_t na,
1459 PyObject **pb, Py_ssize_t nb)
Tim Petersa64dc242002-08-01 02:13:36 +00001460{
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001461 Py_ssize_t k;
1462 PyObject *compare;
1463 PyObject **dest;
1464 int result = -1; /* guilty until proved innocent */
1465 Py_ssize_t min_gallop;
Tim Petersa64dc242002-08-01 02:13:36 +00001466
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001467 assert(ms && pa && pb && na > 0 && nb > 0 && pa + na == pb);
1468 if (MERGE_GETMEM(ms, na) < 0)
1469 return -1;
1470 memcpy(ms->a, pa, na * sizeof(PyObject*));
1471 dest = pa;
1472 pa = ms->a;
Tim Petersa64dc242002-08-01 02:13:36 +00001473
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001474 *dest++ = *pb++;
1475 --nb;
1476 if (nb == 0)
1477 goto Succeed;
1478 if (na == 1)
1479 goto CopyB;
Tim Petersa64dc242002-08-01 02:13:36 +00001480
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001481 min_gallop = ms->min_gallop;
1482 compare = ms->compare;
1483 for (;;) {
1484 Py_ssize_t acount = 0; /* # of times A won in a row */
1485 Py_ssize_t bcount = 0; /* # of times B won in a row */
Tim Petersa64dc242002-08-01 02:13:36 +00001486
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001487 /* Do the straightforward thing until (if ever) one run
1488 * appears to win consistently.
1489 */
1490 for (;;) {
1491 assert(na > 1 && nb > 0);
1492 k = ISLT(*pb, *pa, compare);
1493 if (k) {
1494 if (k < 0)
1495 goto Fail;
1496 *dest++ = *pb++;
1497 ++bcount;
1498 acount = 0;
1499 --nb;
1500 if (nb == 0)
1501 goto Succeed;
1502 if (bcount >= min_gallop)
1503 break;
1504 }
1505 else {
1506 *dest++ = *pa++;
1507 ++acount;
1508 bcount = 0;
1509 --na;
1510 if (na == 1)
1511 goto CopyB;
1512 if (acount >= min_gallop)
1513 break;
1514 }
1515 }
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001516
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001517 /* One run is winning so consistently that galloping may
1518 * be a huge win. So try that, and continue galloping until
1519 * (if ever) neither run appears to be winning consistently
1520 * anymore.
1521 */
1522 ++min_gallop;
1523 do {
1524 assert(na > 1 && nb > 0);
1525 min_gallop -= min_gallop > 1;
1526 ms->min_gallop = min_gallop;
1527 k = gallop_right(*pb, pa, na, 0, compare);
1528 acount = k;
1529 if (k) {
1530 if (k < 0)
1531 goto Fail;
1532 memcpy(dest, pa, k * sizeof(PyObject *));
1533 dest += k;
1534 pa += k;
1535 na -= k;
1536 if (na == 1)
1537 goto CopyB;
1538 /* na==0 is impossible now if the comparison
1539 * function is consistent, but we can't assume
1540 * that it is.
1541 */
1542 if (na == 0)
1543 goto Succeed;
1544 }
1545 *dest++ = *pb++;
1546 --nb;
1547 if (nb == 0)
1548 goto Succeed;
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001549
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001550 k = gallop_left(*pa, pb, nb, 0, compare);
1551 bcount = k;
1552 if (k) {
1553 if (k < 0)
1554 goto Fail;
1555 memmove(dest, pb, k * sizeof(PyObject *));
1556 dest += k;
1557 pb += k;
1558 nb -= k;
1559 if (nb == 0)
1560 goto Succeed;
1561 }
1562 *dest++ = *pa++;
1563 --na;
1564 if (na == 1)
1565 goto CopyB;
1566 } while (acount >= MIN_GALLOP || bcount >= MIN_GALLOP);
1567 ++min_gallop; /* penalize it for leaving galloping mode */
1568 ms->min_gallop = min_gallop;
1569 }
Tim Petersa64dc242002-08-01 02:13:36 +00001570Succeed:
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001571 result = 0;
Tim Petersa64dc242002-08-01 02:13:36 +00001572Fail:
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001573 if (na)
1574 memcpy(dest, pa, na * sizeof(PyObject*));
1575 return result;
Tim Petersa64dc242002-08-01 02:13:36 +00001576CopyB:
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001577 assert(na == 1 && nb > 0);
1578 /* The last element of pa belongs at the end of the merge. */
1579 memmove(dest, pb, nb * sizeof(PyObject *));
1580 dest[nb] = *pa;
1581 return 0;
Tim Petersa64dc242002-08-01 02:13:36 +00001582}
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001583
Tim Petersa64dc242002-08-01 02:13:36 +00001584/* Merge the na elements starting at pa with the nb elements starting at pb
1585 * in a stable way, in-place. na and nb must be > 0, and pa + na == pb.
1586 * Must also have that *pb < *pa, that pa[na-1] belongs at the end of the
1587 * merge, and should have na >= nb. See listsort.txt for more info.
1588 * Return 0 if successful, -1 if error.
1589 */
Martin v. Löwis18e16552006-02-15 17:27:45 +00001590static Py_ssize_t
1591merge_hi(MergeState *ms, PyObject **pa, Py_ssize_t na, PyObject **pb, Py_ssize_t nb)
Tim Petersa64dc242002-08-01 02:13:36 +00001592{
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001593 Py_ssize_t k;
1594 PyObject *compare;
1595 PyObject **dest;
1596 int result = -1; /* guilty until proved innocent */
1597 PyObject **basea;
1598 PyObject **baseb;
1599 Py_ssize_t min_gallop;
Tim Petersa64dc242002-08-01 02:13:36 +00001600
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001601 assert(ms && pa && pb && na > 0 && nb > 0 && pa + na == pb);
1602 if (MERGE_GETMEM(ms, nb) < 0)
1603 return -1;
1604 dest = pb + nb - 1;
1605 memcpy(ms->a, pb, nb * sizeof(PyObject*));
1606 basea = pa;
1607 baseb = ms->a;
1608 pb = ms->a + nb - 1;
1609 pa += na - 1;
Tim Petersa64dc242002-08-01 02:13:36 +00001610
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001611 *dest-- = *pa--;
1612 --na;
1613 if (na == 0)
1614 goto Succeed;
1615 if (nb == 1)
1616 goto CopyA;
Tim Petersa64dc242002-08-01 02:13:36 +00001617
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001618 min_gallop = ms->min_gallop;
1619 compare = ms->compare;
1620 for (;;) {
1621 Py_ssize_t acount = 0; /* # of times A won in a row */
1622 Py_ssize_t bcount = 0; /* # of times B won in a row */
Tim Petersa64dc242002-08-01 02:13:36 +00001623
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001624 /* Do the straightforward thing until (if ever) one run
1625 * appears to win consistently.
1626 */
1627 for (;;) {
1628 assert(na > 0 && nb > 1);
1629 k = ISLT(*pb, *pa, compare);
1630 if (k) {
1631 if (k < 0)
1632 goto Fail;
1633 *dest-- = *pa--;
1634 ++acount;
1635 bcount = 0;
1636 --na;
1637 if (na == 0)
1638 goto Succeed;
1639 if (acount >= min_gallop)
1640 break;
1641 }
1642 else {
1643 *dest-- = *pb--;
1644 ++bcount;
1645 acount = 0;
1646 --nb;
1647 if (nb == 1)
1648 goto CopyA;
1649 if (bcount >= min_gallop)
1650 break;
1651 }
1652 }
Tim Petersa64dc242002-08-01 02:13:36 +00001653
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001654 /* One run is winning so consistently that galloping may
1655 * be a huge win. So try that, and continue galloping until
1656 * (if ever) neither run appears to be winning consistently
1657 * anymore.
1658 */
1659 ++min_gallop;
1660 do {
1661 assert(na > 0 && nb > 1);
1662 min_gallop -= min_gallop > 1;
1663 ms->min_gallop = min_gallop;
1664 k = gallop_right(*pb, basea, na, na-1, compare);
1665 if (k < 0)
1666 goto Fail;
1667 k = na - k;
1668 acount = k;
1669 if (k) {
1670 dest -= k;
1671 pa -= k;
1672 memmove(dest+1, pa+1, k * sizeof(PyObject *));
1673 na -= k;
1674 if (na == 0)
1675 goto Succeed;
1676 }
1677 *dest-- = *pb--;
1678 --nb;
1679 if (nb == 1)
1680 goto CopyA;
Tim Petersa64dc242002-08-01 02:13:36 +00001681
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001682 k = gallop_left(*pa, baseb, nb, nb-1, compare);
1683 if (k < 0)
1684 goto Fail;
1685 k = nb - k;
1686 bcount = k;
1687 if (k) {
1688 dest -= k;
1689 pb -= k;
1690 memcpy(dest+1, pb+1, k * sizeof(PyObject *));
1691 nb -= k;
1692 if (nb == 1)
1693 goto CopyA;
1694 /* nb==0 is impossible now if the comparison
1695 * function is consistent, but we can't assume
1696 * that it is.
1697 */
1698 if (nb == 0)
1699 goto Succeed;
1700 }
1701 *dest-- = *pa--;
1702 --na;
1703 if (na == 0)
1704 goto Succeed;
1705 } while (acount >= MIN_GALLOP || bcount >= MIN_GALLOP);
1706 ++min_gallop; /* penalize it for leaving galloping mode */
1707 ms->min_gallop = min_gallop;
1708 }
Tim Petersa64dc242002-08-01 02:13:36 +00001709Succeed:
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001710 result = 0;
Tim Petersa64dc242002-08-01 02:13:36 +00001711Fail:
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001712 if (nb)
1713 memcpy(dest-(nb-1), baseb, nb * sizeof(PyObject*));
1714 return result;
Tim Petersa64dc242002-08-01 02:13:36 +00001715CopyA:
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001716 assert(nb == 1 && na > 0);
1717 /* The first element of pb belongs at the front of the merge. */
1718 dest -= na;
1719 pa -= na;
1720 memmove(dest+1, pa+1, na * sizeof(PyObject *));
1721 *dest = *pb;
1722 return 0;
Tim Petersa64dc242002-08-01 02:13:36 +00001723}
1724
1725/* Merge the two runs at stack indices i and i+1.
1726 * Returns 0 on success, -1 on error.
1727 */
Martin v. Löwis18e16552006-02-15 17:27:45 +00001728static Py_ssize_t
1729merge_at(MergeState *ms, Py_ssize_t i)
Tim Petersa64dc242002-08-01 02:13:36 +00001730{
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001731 PyObject **pa, **pb;
1732 Py_ssize_t na, nb;
1733 Py_ssize_t k;
1734 PyObject *compare;
Tim Petersa64dc242002-08-01 02:13:36 +00001735
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001736 assert(ms != NULL);
1737 assert(ms->n >= 2);
1738 assert(i >= 0);
1739 assert(i == ms->n - 2 || i == ms->n - 3);
Tim Petersa64dc242002-08-01 02:13:36 +00001740
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001741 pa = ms->pending[i].base;
1742 na = ms->pending[i].len;
1743 pb = ms->pending[i+1].base;
1744 nb = ms->pending[i+1].len;
1745 assert(na > 0 && nb > 0);
1746 assert(pa + na == pb);
Tim Petersa64dc242002-08-01 02:13:36 +00001747
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001748 /* Record the length of the combined runs; if i is the 3rd-last
1749 * run now, also slide over the last run (which isn't involved
1750 * in this merge). The current run i+1 goes away in any case.
1751 */
1752 ms->pending[i].len = na + nb;
1753 if (i == ms->n - 3)
1754 ms->pending[i+1] = ms->pending[i+2];
1755 --ms->n;
Tim Petersa64dc242002-08-01 02:13:36 +00001756
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001757 /* Where does b start in a? Elements in a before that can be
1758 * ignored (already in place).
1759 */
1760 compare = ms->compare;
1761 k = gallop_right(*pb, pa, na, 0, compare);
1762 if (k < 0)
1763 return -1;
1764 pa += k;
1765 na -= k;
1766 if (na == 0)
1767 return 0;
Tim Petersa64dc242002-08-01 02:13:36 +00001768
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001769 /* Where does a end in b? Elements in b after that can be
1770 * ignored (already in place).
1771 */
1772 nb = gallop_left(pa[na-1], pb, nb, nb-1, compare);
1773 if (nb <= 0)
1774 return nb;
Tim Petersa64dc242002-08-01 02:13:36 +00001775
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001776 /* Merge what remains of the runs, using a temp array with
1777 * min(na, nb) elements.
1778 */
1779 if (na <= nb)
1780 return merge_lo(ms, pa, na, pb, nb);
1781 else
1782 return merge_hi(ms, pa, na, pb, nb);
Tim Petersa64dc242002-08-01 02:13:36 +00001783}
1784
1785/* Examine the stack of runs waiting to be merged, merging adjacent runs
1786 * until the stack invariants are re-established:
1787 *
1788 * 1. len[-3] > len[-2] + len[-1]
1789 * 2. len[-2] > len[-1]
1790 *
1791 * See listsort.txt for more info.
1792 *
1793 * Returns 0 on success, -1 on error.
1794 */
1795static int
1796merge_collapse(MergeState *ms)
1797{
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001798 struct s_slice *p = ms->pending;
Tim Petersa64dc242002-08-01 02:13:36 +00001799
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001800 assert(ms);
1801 while (ms->n > 1) {
1802 Py_ssize_t n = ms->n - 2;
1803 if (n > 0 && p[n-1].len <= p[n].len + p[n+1].len) {
1804 if (p[n-1].len < p[n+1].len)
1805 --n;
1806 if (merge_at(ms, n) < 0)
1807 return -1;
1808 }
1809 else if (p[n].len <= p[n+1].len) {
1810 if (merge_at(ms, n) < 0)
1811 return -1;
1812 }
1813 else
1814 break;
1815 }
1816 return 0;
Tim Petersa64dc242002-08-01 02:13:36 +00001817}
1818
1819/* Regardless of invariants, merge all runs on the stack until only one
1820 * remains. This is used at the end of the mergesort.
1821 *
1822 * Returns 0 on success, -1 on error.
1823 */
1824static int
1825merge_force_collapse(MergeState *ms)
1826{
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001827 struct s_slice *p = ms->pending;
Tim Petersa64dc242002-08-01 02:13:36 +00001828
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001829 assert(ms);
1830 while (ms->n > 1) {
1831 Py_ssize_t n = ms->n - 2;
1832 if (n > 0 && p[n-1].len < p[n+1].len)
1833 --n;
1834 if (merge_at(ms, n) < 0)
1835 return -1;
1836 }
1837 return 0;
Tim Petersa64dc242002-08-01 02:13:36 +00001838}
1839
1840/* Compute a good value for the minimum run length; natural runs shorter
1841 * than this are boosted artificially via binary insertion.
1842 *
1843 * If n < 64, return n (it's too small to bother with fancy stuff).
1844 * Else if n is an exact power of 2, return 32.
1845 * Else return an int k, 32 <= k <= 64, such that n/k is close to, but
1846 * strictly less than, an exact power of 2.
1847 *
1848 * See listsort.txt for more info.
1849 */
Martin v. Löwis18e16552006-02-15 17:27:45 +00001850static Py_ssize_t
1851merge_compute_minrun(Py_ssize_t n)
Tim Petersa64dc242002-08-01 02:13:36 +00001852{
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001853 Py_ssize_t r = 0; /* becomes 1 if any 1 bits are shifted off */
Tim Petersa64dc242002-08-01 02:13:36 +00001854
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001855 assert(n >= 0);
1856 while (n >= 64) {
1857 r |= n & 1;
1858 n >>= 1;
1859 }
1860 return n + r;
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00001861}
Guido van Rossuma119c0d1998-05-29 17:56:32 +00001862
Raymond Hettinger42b1ba32003-10-16 03:41:09 +00001863/* Special wrapper to support stable sorting using the decorate-sort-undecorate
Andrew M. Kuchling55be9ea2004-09-10 12:59:54 +00001864 pattern. Holds a key which is used for comparisons and the original record
Tim Petersb38e2b62004-07-29 02:29:26 +00001865 which is returned during the undecorate phase. By exposing only the key
1866 during comparisons, the underlying sort stability characteristics are left
1867 unchanged. Also, if a custom comparison function is used, it will only see
Raymond Hettinger42b1ba32003-10-16 03:41:09 +00001868 the key instead of a full record. */
1869
1870typedef struct {
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001871 PyObject_HEAD
1872 PyObject *key;
1873 PyObject *value;
Raymond Hettinger42b1ba32003-10-16 03:41:09 +00001874} sortwrapperobject;
1875
Raymond Hettinger42b1ba32003-10-16 03:41:09 +00001876PyDoc_STRVAR(sortwrapper_doc, "Object wrapper with a custom sort key.");
Anthony Baxter377be112006-04-11 06:54:30 +00001877static PyObject *
1878sortwrapper_richcompare(sortwrapperobject *, sortwrapperobject *, int);
1879static void
1880sortwrapper_dealloc(sortwrapperobject *);
Raymond Hettinger42b1ba32003-10-16 03:41:09 +00001881
1882static PyTypeObject sortwrapper_type = {
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001883 PyVarObject_HEAD_INIT(&PyType_Type, 0)
1884 "sortwrapper", /* tp_name */
1885 sizeof(sortwrapperobject), /* tp_basicsize */
1886 0, /* tp_itemsize */
1887 /* methods */
1888 (destructor)sortwrapper_dealloc, /* tp_dealloc */
1889 0, /* tp_print */
1890 0, /* tp_getattr */
1891 0, /* tp_setattr */
1892 0, /* tp_compare */
1893 0, /* tp_repr */
1894 0, /* tp_as_number */
1895 0, /* tp_as_sequence */
1896 0, /* tp_as_mapping */
1897 0, /* tp_hash */
1898 0, /* tp_call */
1899 0, /* tp_str */
1900 PyObject_GenericGetAttr, /* tp_getattro */
1901 0, /* tp_setattro */
1902 0, /* tp_as_buffer */
1903 Py_TPFLAGS_DEFAULT |
1904 Py_TPFLAGS_HAVE_RICHCOMPARE, /* tp_flags */
1905 sortwrapper_doc, /* tp_doc */
1906 0, /* tp_traverse */
1907 0, /* tp_clear */
1908 (richcmpfunc)sortwrapper_richcompare, /* tp_richcompare */
Raymond Hettinger42b1ba32003-10-16 03:41:09 +00001909};
1910
Anthony Baxter377be112006-04-11 06:54:30 +00001911
1912static PyObject *
1913sortwrapper_richcompare(sortwrapperobject *a, sortwrapperobject *b, int op)
1914{
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001915 if (!PyObject_TypeCheck(b, &sortwrapper_type)) {
1916 PyErr_SetString(PyExc_TypeError,
1917 "expected a sortwrapperobject");
1918 return NULL;
1919 }
1920 return PyObject_RichCompare(a->key, b->key, op);
Anthony Baxter377be112006-04-11 06:54:30 +00001921}
1922
1923static void
1924sortwrapper_dealloc(sortwrapperobject *so)
1925{
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001926 Py_XDECREF(so->key);
1927 Py_XDECREF(so->value);
1928 PyObject_Del(so);
Anthony Baxter377be112006-04-11 06:54:30 +00001929}
1930
Raymond Hettinger42b1ba32003-10-16 03:41:09 +00001931/* Returns a new reference to a sortwrapper.
1932 Consumes the references to the two underlying objects. */
1933
1934static PyObject *
1935build_sortwrapper(PyObject *key, PyObject *value)
1936{
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001937 sortwrapperobject *so;
Tim Petersb38e2b62004-07-29 02:29:26 +00001938
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001939 so = PyObject_New(sortwrapperobject, &sortwrapper_type);
1940 if (so == NULL)
1941 return NULL;
1942 so->key = key;
1943 so->value = value;
1944 return (PyObject *)so;
Raymond Hettinger42b1ba32003-10-16 03:41:09 +00001945}
1946
1947/* Returns a new reference to the value underlying the wrapper. */
1948static PyObject *
1949sortwrapper_getvalue(PyObject *so)
1950{
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001951 PyObject *value;
Raymond Hettinger42b1ba32003-10-16 03:41:09 +00001952
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001953 if (!PyObject_TypeCheck(so, &sortwrapper_type)) {
1954 PyErr_SetString(PyExc_TypeError,
1955 "expected a sortwrapperobject");
1956 return NULL;
1957 }
1958 value = ((sortwrapperobject *)so)->value;
1959 Py_INCREF(value);
1960 return value;
Raymond Hettinger42b1ba32003-10-16 03:41:09 +00001961}
1962
1963/* Wrapper for user specified cmp functions in combination with a
1964 specified key function. Makes sure the cmp function is presented
1965 with the actual key instead of the sortwrapper */
1966
1967typedef struct {
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001968 PyObject_HEAD
1969 PyObject *func;
Raymond Hettinger42b1ba32003-10-16 03:41:09 +00001970} cmpwrapperobject;
1971
1972static void
1973cmpwrapper_dealloc(cmpwrapperobject *co)
1974{
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001975 Py_XDECREF(co->func);
1976 PyObject_Del(co);
Raymond Hettinger42b1ba32003-10-16 03:41:09 +00001977}
1978
1979static PyObject *
1980cmpwrapper_call(cmpwrapperobject *co, PyObject *args, PyObject *kwds)
1981{
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001982 PyObject *x, *y, *xx, *yy;
Raymond Hettinger42b1ba32003-10-16 03:41:09 +00001983
Antoine Pitrouc83ea132010-05-09 14:46:46 +00001984 if (!PyArg_UnpackTuple(args, "", 2, 2, &x, &y))
1985 return NULL;
1986 if (!PyObject_TypeCheck(x, &sortwrapper_type) ||
1987 !PyObject_TypeCheck(y, &sortwrapper_type)) {
1988 PyErr_SetString(PyExc_TypeError,
1989 "expected a sortwrapperobject");
1990 return NULL;
1991 }
1992 xx = ((sortwrapperobject *)x)->key;
1993 yy = ((sortwrapperobject *)y)->key;
1994 return PyObject_CallFunctionObjArgs(co->func, xx, yy, NULL);
Raymond Hettinger42b1ba32003-10-16 03:41:09 +00001995}
1996
1997PyDoc_STRVAR(cmpwrapper_doc, "cmp() wrapper for sort with custom keys.");
1998
1999static PyTypeObject cmpwrapper_type = {
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002000 PyVarObject_HEAD_INIT(&PyType_Type, 0)
2001 "cmpwrapper", /* tp_name */
2002 sizeof(cmpwrapperobject), /* tp_basicsize */
2003 0, /* tp_itemsize */
2004 /* methods */
2005 (destructor)cmpwrapper_dealloc, /* tp_dealloc */
2006 0, /* tp_print */
2007 0, /* tp_getattr */
2008 0, /* tp_setattr */
2009 0, /* tp_compare */
2010 0, /* tp_repr */
2011 0, /* tp_as_number */
2012 0, /* tp_as_sequence */
2013 0, /* tp_as_mapping */
2014 0, /* tp_hash */
2015 (ternaryfunc)cmpwrapper_call, /* tp_call */
2016 0, /* tp_str */
2017 PyObject_GenericGetAttr, /* tp_getattro */
2018 0, /* tp_setattro */
2019 0, /* tp_as_buffer */
2020 Py_TPFLAGS_DEFAULT, /* tp_flags */
2021 cmpwrapper_doc, /* tp_doc */
Raymond Hettinger42b1ba32003-10-16 03:41:09 +00002022};
2023
2024static PyObject *
2025build_cmpwrapper(PyObject *cmpfunc)
2026{
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002027 cmpwrapperobject *co;
Tim Petersb38e2b62004-07-29 02:29:26 +00002028
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002029 co = PyObject_New(cmpwrapperobject, &cmpwrapper_type);
2030 if (co == NULL)
2031 return NULL;
2032 Py_INCREF(cmpfunc);
2033 co->func = cmpfunc;
2034 return (PyObject *)co;
Raymond Hettinger42b1ba32003-10-16 03:41:09 +00002035}
2036
Tim Petersa64dc242002-08-01 02:13:36 +00002037/* An adaptive, stable, natural mergesort. See listsort.txt.
2038 * Returns Py_None on success, NULL on error. Even in case of error, the
2039 * list will be some permutation of its input state (nothing is lost or
2040 * duplicated).
2041 */
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002042static PyObject *
Raymond Hettinger42b1ba32003-10-16 03:41:09 +00002043listsort(PyListObject *self, PyObject *args, PyObject *kwds)
Guido van Rossum3f236de1996-12-10 23:55:39 +00002044{
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002045 MergeState ms;
2046 PyObject **lo, **hi;
2047 Py_ssize_t nremaining;
2048 Py_ssize_t minrun;
2049 Py_ssize_t saved_ob_size, saved_allocated;
2050 PyObject **saved_ob_item;
2051 PyObject **final_ob_item;
2052 PyObject *compare = NULL;
2053 PyObject *result = NULL; /* guilty until proved innocent */
2054 int reverse = 0;
2055 PyObject *keyfunc = NULL;
2056 Py_ssize_t i;
2057 PyObject *key, *value, *kvpair;
2058 static char *kwlist[] = {"cmp", "key", "reverse", 0};
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00002059
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002060 assert(self != NULL);
2061 assert (PyList_Check(self));
2062 if (args != NULL) {
2063 if (!PyArg_ParseTupleAndKeywords(args, kwds, "|OOi:sort",
2064 kwlist, &compare, &keyfunc, &reverse))
2065 return NULL;
2066 }
2067 if (compare == Py_None)
2068 compare = NULL;
2069 if (compare != NULL &&
2070 PyErr_WarnPy3k("the cmp argument is not supported in 3.x", 1) < 0)
2071 return NULL;
2072 if (keyfunc == Py_None)
2073 keyfunc = NULL;
2074 if (compare != NULL && keyfunc != NULL) {
2075 compare = build_cmpwrapper(compare);
2076 if (compare == NULL)
2077 return NULL;
2078 } else
2079 Py_XINCREF(compare);
Raymond Hettinger42b1ba32003-10-16 03:41:09 +00002080
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002081 /* The list is temporarily made empty, so that mutations performed
2082 * by comparison functions can't affect the slice of memory we're
2083 * sorting (allowing mutations during sorting is a core-dump
2084 * factory, since ob_item may change).
2085 */
2086 saved_ob_size = Py_SIZE(self);
2087 saved_ob_item = self->ob_item;
2088 saved_allocated = self->allocated;
2089 Py_SIZE(self) = 0;
2090 self->ob_item = NULL;
2091 self->allocated = -1; /* any operation will reset it to >= 0 */
Tim Peters330f9e92002-07-19 07:05:44 +00002092
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002093 if (keyfunc != NULL) {
2094 for (i=0 ; i < saved_ob_size ; i++) {
2095 value = saved_ob_item[i];
2096 key = PyObject_CallFunctionObjArgs(keyfunc, value,
2097 NULL);
2098 if (key == NULL) {
2099 for (i=i-1 ; i>=0 ; i--) {
2100 kvpair = saved_ob_item[i];
2101 value = sortwrapper_getvalue(kvpair);
2102 saved_ob_item[i] = value;
2103 Py_DECREF(kvpair);
2104 }
2105 goto dsu_fail;
2106 }
2107 kvpair = build_sortwrapper(key, value);
2108 if (kvpair == NULL)
2109 goto dsu_fail;
2110 saved_ob_item[i] = kvpair;
2111 }
2112 }
Michael W. Hudson1df0f652003-12-04 11:25:46 +00002113
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002114 /* Reverse sort stability achieved by initially reversing the list,
2115 applying a stable forward sort, then reversing the final result. */
2116 if (reverse && saved_ob_size > 1)
2117 reverse_slice(saved_ob_item, saved_ob_item + saved_ob_size);
Michael W. Hudson1df0f652003-12-04 11:25:46 +00002118
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002119 merge_init(&ms, compare);
Michael W. Hudson1df0f652003-12-04 11:25:46 +00002120
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002121 nremaining = saved_ob_size;
2122 if (nremaining < 2)
2123 goto succeed;
Tim Peters330f9e92002-07-19 07:05:44 +00002124
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002125 /* March over the array once, left to right, finding natural runs,
2126 * and extending short natural runs to minrun elements.
2127 */
2128 lo = saved_ob_item;
2129 hi = lo + nremaining;
2130 minrun = merge_compute_minrun(nremaining);
2131 do {
2132 int descending;
2133 Py_ssize_t n;
Tim Peters330f9e92002-07-19 07:05:44 +00002134
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002135 /* Identify next run. */
2136 n = count_run(lo, hi, compare, &descending);
2137 if (n < 0)
2138 goto fail;
2139 if (descending)
2140 reverse_slice(lo, lo + n);
2141 /* If short, extend to min(minrun, nremaining). */
2142 if (n < minrun) {
2143 const Py_ssize_t force = nremaining <= minrun ?
2144 nremaining : minrun;
2145 if (binarysort(lo, lo + force, lo + n, compare) < 0)
2146 goto fail;
2147 n = force;
2148 }
2149 /* Push run onto pending-runs stack, and maybe merge. */
2150 assert(ms.n < MAX_MERGE_PENDING);
2151 ms.pending[ms.n].base = lo;
2152 ms.pending[ms.n].len = n;
2153 ++ms.n;
2154 if (merge_collapse(&ms) < 0)
2155 goto fail;
2156 /* Advance to find next run. */
2157 lo += n;
2158 nremaining -= n;
2159 } while (nremaining);
2160 assert(lo == hi);
Tim Peters330f9e92002-07-19 07:05:44 +00002161
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002162 if (merge_force_collapse(&ms) < 0)
2163 goto fail;
2164 assert(ms.n == 1);
2165 assert(ms.pending[0].base == saved_ob_item);
2166 assert(ms.pending[0].len == saved_ob_size);
Tim Petersa64dc242002-08-01 02:13:36 +00002167
2168succeed:
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002169 result = Py_None;
Tim Peters330f9e92002-07-19 07:05:44 +00002170fail:
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002171 if (keyfunc != NULL) {
2172 for (i=0 ; i < saved_ob_size ; i++) {
2173 kvpair = saved_ob_item[i];
2174 value = sortwrapper_getvalue(kvpair);
2175 saved_ob_item[i] = value;
2176 Py_DECREF(kvpair);
2177 }
2178 }
Michael W. Hudson1df0f652003-12-04 11:25:46 +00002179
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002180 if (self->allocated != -1 && result != NULL) {
2181 /* The user mucked with the list during the sort,
2182 * and we don't already have another error to report.
2183 */
2184 PyErr_SetString(PyExc_ValueError, "list modified during sort");
2185 result = NULL;
2186 }
Michael W. Hudson1df0f652003-12-04 11:25:46 +00002187
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002188 if (reverse && saved_ob_size > 1)
2189 reverse_slice(saved_ob_item, saved_ob_item + saved_ob_size);
Michael W. Hudson1df0f652003-12-04 11:25:46 +00002190
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002191 merge_freemem(&ms);
Michael W. Hudson1df0f652003-12-04 11:25:46 +00002192
2193dsu_fail:
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002194 final_ob_item = self->ob_item;
2195 i = Py_SIZE(self);
2196 Py_SIZE(self) = saved_ob_size;
2197 self->ob_item = saved_ob_item;
2198 self->allocated = saved_allocated;
2199 if (final_ob_item != NULL) {
2200 /* we cannot use list_clear() for this because it does not
2201 guarantee that the list is really empty when it returns */
2202 while (--i >= 0) {
2203 Py_XDECREF(final_ob_item[i]);
2204 }
2205 PyMem_FREE(final_ob_item);
2206 }
2207 Py_XDECREF(compare);
2208 Py_XINCREF(result);
2209 return result;
Guido van Rossum3f236de1996-12-10 23:55:39 +00002210}
Tim Peters330f9e92002-07-19 07:05:44 +00002211#undef IFLT
Tim Peters66860f62002-08-04 17:47:26 +00002212#undef ISLT
Tim Peters330f9e92002-07-19 07:05:44 +00002213
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00002214int
Fred Drakea2f55112000-07-09 15:16:51 +00002215PyList_Sort(PyObject *v)
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00002216{
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002217 if (v == NULL || !PyList_Check(v)) {
2218 PyErr_BadInternalCall();
2219 return -1;
2220 }
2221 v = listsort((PyListObject *)v, (PyObject *)NULL, (PyObject *)NULL);
2222 if (v == NULL)
2223 return -1;
2224 Py_DECREF(v);
2225 return 0;
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00002226}
2227
Guido van Rossumb86c5492001-02-12 22:06:02 +00002228static PyObject *
Martin v. Löwise3eb1f22001-08-16 13:15:00 +00002229listreverse(PyListObject *self)
Guido van Rossumb86c5492001-02-12 22:06:02 +00002230{
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002231 if (Py_SIZE(self) > 1)
2232 reverse_slice(self->ob_item, self->ob_item + Py_SIZE(self));
2233 Py_RETURN_NONE;
Guido van Rossumed98d481991-03-06 13:07:53 +00002234}
2235
Guido van Rossum84c76f51990-10-30 13:32:20 +00002236int
Fred Drakea2f55112000-07-09 15:16:51 +00002237PyList_Reverse(PyObject *v)
Guido van Rossumb0fe3a91995-01-17 16:34:45 +00002238{
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002239 PyListObject *self = (PyListObject *)v;
Tim Peters6063e262002-08-08 01:06:39 +00002240
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002241 if (v == NULL || !PyList_Check(v)) {
2242 PyErr_BadInternalCall();
2243 return -1;
2244 }
2245 if (Py_SIZE(self) > 1)
2246 reverse_slice(self->ob_item, self->ob_item + Py_SIZE(self));
2247 return 0;
Guido van Rossumb0fe3a91995-01-17 16:34:45 +00002248}
2249
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002250PyObject *
Fred Drakea2f55112000-07-09 15:16:51 +00002251PyList_AsTuple(PyObject *v)
Guido van Rossum6cd2fe01994-08-29 12:45:32 +00002252{
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002253 PyObject *w;
2254 PyObject **p, **q;
2255 Py_ssize_t n;
2256 if (v == NULL || !PyList_Check(v)) {
2257 PyErr_BadInternalCall();
2258 return NULL;
2259 }
2260 n = Py_SIZE(v);
2261 w = PyTuple_New(n);
2262 if (w == NULL)
2263 return NULL;
2264 p = ((PyTupleObject *)w)->ob_item;
2265 q = ((PyListObject *)v)->ob_item;
2266 while (--n >= 0) {
2267 Py_INCREF(*q);
2268 *p = *q;
2269 p++;
2270 q++;
2271 }
2272 return w;
Guido van Rossum6cd2fe01994-08-29 12:45:32 +00002273}
2274
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002275static PyObject *
Raymond Hettingerd05abde2003-06-17 05:05:49 +00002276listindex(PyListObject *self, PyObject *args)
Guido van Rossumed98d481991-03-06 13:07:53 +00002277{
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002278 Py_ssize_t i, start=0, stop=Py_SIZE(self);
2279 PyObject *v, *format_tuple, *err_string;
2280 static PyObject *err_format = NULL;
Guido van Rossum4aa24f92000-02-24 15:23:03 +00002281
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002282 if (!PyArg_ParseTuple(args, "O|O&O&:index", &v,
2283 _PyEval_SliceIndex, &start,
2284 _PyEval_SliceIndex, &stop))
2285 return NULL;
2286 if (start < 0) {
2287 start += Py_SIZE(self);
2288 if (start < 0)
2289 start = 0;
2290 }
2291 if (stop < 0) {
2292 stop += Py_SIZE(self);
2293 if (stop < 0)
2294 stop = 0;
2295 }
2296 for (i = start; i < stop && i < Py_SIZE(self); i++) {
2297 int cmp = PyObject_RichCompareBool(self->ob_item[i], v, Py_EQ);
2298 if (cmp > 0)
2299 return PyInt_FromSsize_t(i);
2300 else if (cmp < 0)
2301 return NULL;
2302 }
2303 if (err_format == NULL) {
2304 err_format = PyString_FromString("%r is not in list");
2305 if (err_format == NULL)
2306 return NULL;
2307 }
2308 format_tuple = PyTuple_Pack(1, v);
2309 if (format_tuple == NULL)
2310 return NULL;
2311 err_string = PyString_Format(err_format, format_tuple);
2312 Py_DECREF(format_tuple);
2313 if (err_string == NULL)
2314 return NULL;
2315 PyErr_SetObject(PyExc_ValueError, err_string);
2316 Py_DECREF(err_string);
2317 return NULL;
Guido van Rossumed98d481991-03-06 13:07:53 +00002318}
2319
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002320static PyObject *
Martin v. Löwise3eb1f22001-08-16 13:15:00 +00002321listcount(PyListObject *self, PyObject *v)
Guido van Rossume6f7d181991-10-20 20:20:40 +00002322{
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002323 Py_ssize_t count = 0;
2324 Py_ssize_t i;
Guido van Rossum4aa24f92000-02-24 15:23:03 +00002325
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002326 for (i = 0; i < Py_SIZE(self); i++) {
2327 int cmp = PyObject_RichCompareBool(self->ob_item[i], v, Py_EQ);
2328 if (cmp > 0)
2329 count++;
2330 else if (cmp < 0)
2331 return NULL;
2332 }
2333 return PyInt_FromSsize_t(count);
Guido van Rossume6f7d181991-10-20 20:20:40 +00002334}
2335
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002336static PyObject *
Martin v. Löwise3eb1f22001-08-16 13:15:00 +00002337listremove(PyListObject *self, PyObject *v)
Guido van Rossumed98d481991-03-06 13:07:53 +00002338{
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002339 Py_ssize_t i;
Guido van Rossum4aa24f92000-02-24 15:23:03 +00002340
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002341 for (i = 0; i < Py_SIZE(self); i++) {
2342 int cmp = PyObject_RichCompareBool(self->ob_item[i], v, Py_EQ);
2343 if (cmp > 0) {
2344 if (list_ass_slice(self, i, i+1,
2345 (PyObject *)NULL) == 0)
2346 Py_RETURN_NONE;
2347 return NULL;
2348 }
2349 else if (cmp < 0)
2350 return NULL;
2351 }
2352 PyErr_SetString(PyExc_ValueError, "list.remove(x): x not in list");
2353 return NULL;
Guido van Rossumed98d481991-03-06 13:07:53 +00002354}
2355
Jeremy Hylton8caad492000-06-23 14:18:11 +00002356static int
2357list_traverse(PyListObject *o, visitproc visit, void *arg)
2358{
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002359 Py_ssize_t i;
Jeremy Hylton8caad492000-06-23 14:18:11 +00002360
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002361 for (i = Py_SIZE(o); --i >= 0; )
2362 Py_VISIT(o->ob_item[i]);
2363 return 0;
Jeremy Hylton8caad492000-06-23 14:18:11 +00002364}
2365
Guido van Rossum65e1cea2001-01-17 22:11:59 +00002366static PyObject *
2367list_richcompare(PyObject *v, PyObject *w, int op)
2368{
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002369 PyListObject *vl, *wl;
2370 Py_ssize_t i;
Guido van Rossum65e1cea2001-01-17 22:11:59 +00002371
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002372 if (!PyList_Check(v) || !PyList_Check(w)) {
2373 Py_INCREF(Py_NotImplemented);
2374 return Py_NotImplemented;
2375 }
Guido van Rossum65e1cea2001-01-17 22:11:59 +00002376
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002377 vl = (PyListObject *)v;
2378 wl = (PyListObject *)w;
Guido van Rossum65e1cea2001-01-17 22:11:59 +00002379
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002380 if (Py_SIZE(vl) != Py_SIZE(wl) && (op == Py_EQ || op == Py_NE)) {
2381 /* Shortcut: if the lengths differ, the lists differ */
2382 PyObject *res;
2383 if (op == Py_EQ)
2384 res = Py_False;
2385 else
2386 res = Py_True;
2387 Py_INCREF(res);
2388 return res;
2389 }
Guido van Rossum65e1cea2001-01-17 22:11:59 +00002390
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002391 /* Search for the first index where items are different */
2392 for (i = 0; i < Py_SIZE(vl) && i < Py_SIZE(wl); i++) {
2393 int k = PyObject_RichCompareBool(vl->ob_item[i],
2394 wl->ob_item[i], Py_EQ);
2395 if (k < 0)
2396 return NULL;
2397 if (!k)
2398 break;
2399 }
Guido van Rossum65e1cea2001-01-17 22:11:59 +00002400
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002401 if (i >= Py_SIZE(vl) || i >= Py_SIZE(wl)) {
2402 /* No more items to compare -- compare sizes */
2403 Py_ssize_t vs = Py_SIZE(vl);
2404 Py_ssize_t ws = Py_SIZE(wl);
2405 int cmp;
2406 PyObject *res;
2407 switch (op) {
2408 case Py_LT: cmp = vs < ws; break;
2409 case Py_LE: cmp = vs <= ws; break;
2410 case Py_EQ: cmp = vs == ws; break;
2411 case Py_NE: cmp = vs != ws; break;
2412 case Py_GT: cmp = vs > ws; break;
2413 case Py_GE: cmp = vs >= ws; break;
2414 default: return NULL; /* cannot happen */
2415 }
2416 if (cmp)
2417 res = Py_True;
2418 else
2419 res = Py_False;
2420 Py_INCREF(res);
2421 return res;
2422 }
Guido van Rossum65e1cea2001-01-17 22:11:59 +00002423
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002424 /* We have an item that differs -- shortcuts for EQ/NE */
2425 if (op == Py_EQ) {
2426 Py_INCREF(Py_False);
2427 return Py_False;
2428 }
2429 if (op == Py_NE) {
2430 Py_INCREF(Py_True);
2431 return Py_True;
2432 }
Guido van Rossum65e1cea2001-01-17 22:11:59 +00002433
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002434 /* Compare the final item again using the proper operator */
2435 return PyObject_RichCompare(vl->ob_item[i], wl->ob_item[i], op);
Guido van Rossum65e1cea2001-01-17 22:11:59 +00002436}
2437
Tim Peters6d6c1a32001-08-02 04:15:00 +00002438static int
2439list_init(PyListObject *self, PyObject *args, PyObject *kw)
2440{
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002441 PyObject *arg = NULL;
2442 static char *kwlist[] = {"sequence", 0};
Tim Peters6d6c1a32001-08-02 04:15:00 +00002443
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002444 if (!PyArg_ParseTupleAndKeywords(args, kw, "|O:list", kwlist, &arg))
2445 return -1;
Raymond Hettingerc0aaa2d2004-07-29 23:31:29 +00002446
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002447 /* Verify list invariants established by PyType_GenericAlloc() */
2448 assert(0 <= Py_SIZE(self));
2449 assert(Py_SIZE(self) <= self->allocated || self->allocated == -1);
2450 assert(self->ob_item != NULL ||
2451 self->allocated == 0 || self->allocated == -1);
Raymond Hettingerc0aaa2d2004-07-29 23:31:29 +00002452
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002453 /* Empty previous contents */
2454 if (self->ob_item != NULL) {
2455 (void)list_clear(self);
2456 }
2457 if (arg != NULL) {
2458 PyObject *rv = listextend(self, arg);
2459 if (rv == NULL)
2460 return -1;
2461 Py_DECREF(rv);
2462 }
2463 return 0;
Tim Peters6d6c1a32001-08-02 04:15:00 +00002464}
2465
Robert Schuppenies51df0642008-06-01 16:16:17 +00002466static PyObject *
2467list_sizeof(PyListObject *self)
2468{
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002469 Py_ssize_t res;
Robert Schuppenies51df0642008-06-01 16:16:17 +00002470
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002471 res = sizeof(PyListObject) + self->allocated * sizeof(void*);
2472 return PyInt_FromSsize_t(res);
Robert Schuppenies51df0642008-06-01 16:16:17 +00002473}
2474
Raymond Hettinger1021c442003-11-07 15:38:09 +00002475static PyObject *list_iter(PyObject *seq);
2476static PyObject *list_reversed(PyListObject* seq, PyObject* unused);
2477
Raymond Hettinger8f5cdaa2003-12-13 11:26:12 +00002478PyDoc_STRVAR(getitem_doc,
2479"x.__getitem__(y) <==> x[y]");
Raymond Hettinger1021c442003-11-07 15:38:09 +00002480PyDoc_STRVAR(reversed_doc,
2481"L.__reversed__() -- return a reverse iterator over the list");
Robert Schuppenies51df0642008-06-01 16:16:17 +00002482PyDoc_STRVAR(sizeof_doc,
Georg Brandl7a6de8b2008-06-01 16:42:16 +00002483"L.__sizeof__() -- size of L in memory, in bytes");
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00002484PyDoc_STRVAR(append_doc,
2485"L.append(object) -- append object to end");
2486PyDoc_STRVAR(extend_doc,
Raymond Hettingerf8bcfb12002-12-29 05:49:09 +00002487"L.extend(iterable) -- extend list by appending elements from the iterable");
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00002488PyDoc_STRVAR(insert_doc,
2489"L.insert(index, object) -- insert object before index");
2490PyDoc_STRVAR(pop_doc,
Andrew M. Kuchlingd810cdf2008-10-04 01:04:24 +00002491"L.pop([index]) -> item -- remove and return item at index (default last).\n"
2492"Raises IndexError if list is empty or index is out of range.");
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00002493PyDoc_STRVAR(remove_doc,
Andrew M. Kuchlingd810cdf2008-10-04 01:04:24 +00002494"L.remove(value) -- remove first occurrence of value.\n"
2495"Raises ValueError if the value is not present.");
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00002496PyDoc_STRVAR(index_doc,
Andrew M. Kuchlingd810cdf2008-10-04 01:04:24 +00002497"L.index(value, [start, [stop]]) -> integer -- return first index of value.\n"
2498"Raises ValueError if the value is not present.");
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00002499PyDoc_STRVAR(count_doc,
2500"L.count(value) -> integer -- return number of occurrences of value");
2501PyDoc_STRVAR(reverse_doc,
2502"L.reverse() -- reverse *IN PLACE*");
2503PyDoc_STRVAR(sort_doc,
Raymond Hettinger42b1ba32003-10-16 03:41:09 +00002504"L.sort(cmp=None, key=None, reverse=False) -- stable sort *IN PLACE*;\n\
2505cmp(x, y) -> -1, 0, 1");
Guido van Rossum3dd7f3f1998-06-30 15:36:32 +00002506
Raymond Hettinger8f5cdaa2003-12-13 11:26:12 +00002507static PyObject *list_subscript(PyListObject*, PyObject*);
2508
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002509static PyMethodDef list_methods[] = {
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002510 {"__getitem__", (PyCFunction)list_subscript, METH_O|METH_COEXIST, getitem_doc},
2511 {"__reversed__",(PyCFunction)list_reversed, METH_NOARGS, reversed_doc},
2512 {"__sizeof__", (PyCFunction)list_sizeof, METH_NOARGS, sizeof_doc},
2513 {"append", (PyCFunction)listappend, METH_O, append_doc},
2514 {"insert", (PyCFunction)listinsert, METH_VARARGS, insert_doc},
2515 {"extend", (PyCFunction)listextend, METH_O, extend_doc},
2516 {"pop", (PyCFunction)listpop, METH_VARARGS, pop_doc},
2517 {"remove", (PyCFunction)listremove, METH_O, remove_doc},
2518 {"index", (PyCFunction)listindex, METH_VARARGS, index_doc},
2519 {"count", (PyCFunction)listcount, METH_O, count_doc},
2520 {"reverse", (PyCFunction)listreverse, METH_NOARGS, reverse_doc},
2521 {"sort", (PyCFunction)listsort, METH_VARARGS | METH_KEYWORDS, sort_doc},
2522 {NULL, NULL} /* sentinel */
Guido van Rossum85a5fbb1990-10-14 12:07:46 +00002523};
2524
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002525static PySequenceMethods list_as_sequence = {
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002526 (lenfunc)list_length, /* sq_length */
2527 (binaryfunc)list_concat, /* sq_concat */
2528 (ssizeargfunc)list_repeat, /* sq_repeat */
2529 (ssizeargfunc)list_item, /* sq_item */
2530 (ssizessizeargfunc)list_slice, /* sq_slice */
2531 (ssizeobjargproc)list_ass_item, /* sq_ass_item */
2532 (ssizessizeobjargproc)list_ass_slice, /* sq_ass_slice */
2533 (objobjproc)list_contains, /* sq_contains */
2534 (binaryfunc)list_inplace_concat, /* sq_inplace_concat */
2535 (ssizeargfunc)list_inplace_repeat, /* sq_inplace_repeat */
Guido van Rossum85a5fbb1990-10-14 12:07:46 +00002536};
2537
Neal Norwitz2c2e8272002-06-14 02:04:18 +00002538PyDoc_STRVAR(list_doc,
Ezio Melottifb501122010-02-28 23:59:00 +00002539"list() -> new empty list\n"
Georg Brandlbca11692010-02-28 18:19:17 +00002540"list(iterable) -> new list initialized from iterable's items");
Tim Peters6d6c1a32001-08-02 04:15:00 +00002541
Guido van Rossum38fff8c2006-03-07 18:50:55 +00002542
Jeremy Hyltona4b4c3b2002-07-13 03:51:17 +00002543static PyObject *
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002544list_subscript(PyListObject* self, PyObject* item)
2545{
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002546 if (PyIndex_Check(item)) {
2547 Py_ssize_t i;
2548 i = PyNumber_AsSsize_t(item, PyExc_IndexError);
2549 if (i == -1 && PyErr_Occurred())
2550 return NULL;
2551 if (i < 0)
2552 i += PyList_GET_SIZE(self);
2553 return list_item(self, i);
2554 }
2555 else if (PySlice_Check(item)) {
2556 Py_ssize_t start, stop, step, slicelength, cur, i;
2557 PyObject* result;
2558 PyObject* it;
2559 PyObject **src, **dest;
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002560
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002561 if (PySlice_GetIndicesEx((PySliceObject*)item, Py_SIZE(self),
2562 &start, &stop, &step, &slicelength) < 0) {
2563 return NULL;
2564 }
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002565
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002566 if (slicelength <= 0) {
2567 return PyList_New(0);
2568 }
2569 else if (step == 1) {
2570 return list_slice(self, start, stop);
2571 }
2572 else {
2573 result = PyList_New(slicelength);
2574 if (!result) return NULL;
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002575
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002576 src = self->ob_item;
2577 dest = ((PyListObject *)result)->ob_item;
2578 for (cur = start, i = 0; i < slicelength;
2579 cur += step, i++) {
2580 it = src[cur];
2581 Py_INCREF(it);
2582 dest[i] = it;
2583 }
Tim Peters3b01a122002-07-19 02:35:45 +00002584
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002585 return result;
2586 }
2587 }
2588 else {
2589 PyErr_Format(PyExc_TypeError,
2590 "list indices must be integers, not %.200s",
2591 item->ob_type->tp_name);
2592 return NULL;
2593 }
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002594}
2595
Tim Peters3b01a122002-07-19 02:35:45 +00002596static int
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002597list_ass_subscript(PyListObject* self, PyObject* item, PyObject* value)
2598{
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002599 if (PyIndex_Check(item)) {
2600 Py_ssize_t i = PyNumber_AsSsize_t(item, PyExc_IndexError);
2601 if (i == -1 && PyErr_Occurred())
2602 return -1;
2603 if (i < 0)
2604 i += PyList_GET_SIZE(self);
2605 return list_ass_item(self, i, value);
2606 }
2607 else if (PySlice_Check(item)) {
2608 Py_ssize_t start, stop, step, slicelength;
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002609
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002610 if (PySlice_GetIndicesEx((PySliceObject*)item, Py_SIZE(self),
2611 &start, &stop, &step, &slicelength) < 0) {
2612 return -1;
2613 }
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002614
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002615 if (step == 1)
2616 return list_ass_slice(self, start, stop, value);
Michael W. Hudson9c14bad2002-06-19 15:44:15 +00002617
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002618 /* Make sure s[5:2] = [..] inserts at the right place:
2619 before 5, not before 2. */
2620 if ((step < 0 && start < stop) ||
2621 (step > 0 && start > stop))
2622 stop = start;
Thomas Wouters3ccec682007-08-28 15:28:19 +00002623
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002624 if (value == NULL) {
2625 /* delete slice */
2626 PyObject **garbage;
2627 size_t cur;
2628 Py_ssize_t i;
Tim Peters3b01a122002-07-19 02:35:45 +00002629
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002630 if (slicelength <= 0)
2631 return 0;
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002632
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002633 if (step < 0) {
2634 stop = start + 1;
2635 start = stop + step*(slicelength - 1) - 1;
2636 step = -step;
2637 }
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002638
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002639 assert((size_t)slicelength <=
2640 PY_SIZE_MAX / sizeof(PyObject*));
Gregory P. Smith9d534572008-06-11 07:41:16 +00002641
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002642 garbage = (PyObject**)
2643 PyMem_MALLOC(slicelength*sizeof(PyObject*));
2644 if (!garbage) {
2645 PyErr_NoMemory();
2646 return -1;
2647 }
Tim Peters3b01a122002-07-19 02:35:45 +00002648
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002649 /* drawing pictures might help understand these for
2650 loops. Basically, we memmove the parts of the
2651 list that are *not* part of the slice: step-1
2652 items for each item that is part of the slice,
2653 and then tail end of the list that was not
2654 covered by the slice */
2655 for (cur = start, i = 0;
2656 cur < (size_t)stop;
2657 cur += step, i++) {
2658 Py_ssize_t lim = step - 1;
Michael W. Hudson56796f62002-07-29 14:35:04 +00002659
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002660 garbage[i] = PyList_GET_ITEM(self, cur);
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002661
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002662 if (cur + step >= (size_t)Py_SIZE(self)) {
2663 lim = Py_SIZE(self) - cur - 1;
2664 }
Michael W. Hudson56796f62002-07-29 14:35:04 +00002665
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002666 memmove(self->ob_item + cur - i,
2667 self->ob_item + cur + 1,
2668 lim * sizeof(PyObject *));
2669 }
2670 cur = start + slicelength*step;
2671 if (cur < (size_t)Py_SIZE(self)) {
2672 memmove(self->ob_item + cur - slicelength,
2673 self->ob_item + cur,
2674 (Py_SIZE(self) - cur) *
2675 sizeof(PyObject *));
2676 }
Raymond Hettingera6366fe2004-03-09 13:05:22 +00002677
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002678 Py_SIZE(self) -= slicelength;
2679 list_resize(self, Py_SIZE(self));
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002680
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002681 for (i = 0; i < slicelength; i++) {
2682 Py_DECREF(garbage[i]);
2683 }
2684 PyMem_FREE(garbage);
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002685
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002686 return 0;
2687 }
2688 else {
2689 /* assign slice */
2690 PyObject *ins, *seq;
2691 PyObject **garbage, **seqitems, **selfitems;
2692 Py_ssize_t cur, i;
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002693
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002694 /* protect against a[::-1] = a */
2695 if (self == (PyListObject*)value) {
2696 seq = list_slice((PyListObject*)value, 0,
2697 PyList_GET_SIZE(value));
2698 }
2699 else {
2700 seq = PySequence_Fast(value,
2701 "must assign iterable "
2702 "to extended slice");
2703 }
2704 if (!seq)
2705 return -1;
Michael W. Hudsona69c0302002-12-05 21:32:32 +00002706
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002707 if (PySequence_Fast_GET_SIZE(seq) != slicelength) {
2708 PyErr_Format(PyExc_ValueError,
2709 "attempt to assign sequence of "
2710 "size %zd to extended slice of "
2711 "size %zd",
2712 PySequence_Fast_GET_SIZE(seq),
2713 slicelength);
2714 Py_DECREF(seq);
2715 return -1;
2716 }
Michael W. Hudsona69c0302002-12-05 21:32:32 +00002717
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002718 if (!slicelength) {
2719 Py_DECREF(seq);
2720 return 0;
2721 }
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002722
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002723 garbage = (PyObject**)
2724 PyMem_MALLOC(slicelength*sizeof(PyObject*));
2725 if (!garbage) {
2726 Py_DECREF(seq);
2727 PyErr_NoMemory();
2728 return -1;
2729 }
Tim Peters3b01a122002-07-19 02:35:45 +00002730
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002731 selfitems = self->ob_item;
2732 seqitems = PySequence_Fast_ITEMS(seq);
2733 for (cur = start, i = 0; i < slicelength;
2734 cur += step, i++) {
2735 garbage[i] = selfitems[cur];
2736 ins = seqitems[i];
2737 Py_INCREF(ins);
2738 selfitems[cur] = ins;
2739 }
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002740
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002741 for (i = 0; i < slicelength; i++) {
2742 Py_DECREF(garbage[i]);
2743 }
Tim Peters3b01a122002-07-19 02:35:45 +00002744
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002745 PyMem_FREE(garbage);
2746 Py_DECREF(seq);
Tim Peters3b01a122002-07-19 02:35:45 +00002747
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002748 return 0;
2749 }
2750 }
2751 else {
2752 PyErr_Format(PyExc_TypeError,
2753 "list indices must be integers, not %.200s",
2754 item->ob_type->tp_name);
2755 return -1;
2756 }
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002757}
2758
2759static PyMappingMethods list_as_mapping = {
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002760 (lenfunc)list_length,
2761 (binaryfunc)list_subscript,
2762 (objobjargproc)list_ass_subscript
Michael W. Hudson5efaf7e2002-06-11 10:55:12 +00002763};
2764
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002765PyTypeObject PyList_Type = {
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002766 PyVarObject_HEAD_INIT(&PyType_Type, 0)
2767 "list",
2768 sizeof(PyListObject),
2769 0,
2770 (destructor)list_dealloc, /* tp_dealloc */
2771 (printfunc)list_print, /* tp_print */
2772 0, /* tp_getattr */
2773 0, /* tp_setattr */
2774 0, /* tp_compare */
2775 (reprfunc)list_repr, /* tp_repr */
2776 0, /* tp_as_number */
2777 &list_as_sequence, /* tp_as_sequence */
2778 &list_as_mapping, /* tp_as_mapping */
2779 (hashfunc)PyObject_HashNotImplemented, /* tp_hash */
2780 0, /* tp_call */
2781 0, /* tp_str */
2782 PyObject_GenericGetAttr, /* tp_getattro */
2783 0, /* tp_setattro */
2784 0, /* tp_as_buffer */
2785 Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC |
2786 Py_TPFLAGS_BASETYPE | Py_TPFLAGS_LIST_SUBCLASS, /* tp_flags */
2787 list_doc, /* tp_doc */
2788 (traverseproc)list_traverse, /* tp_traverse */
2789 (inquiry)list_clear, /* tp_clear */
2790 list_richcompare, /* tp_richcompare */
2791 0, /* tp_weaklistoffset */
2792 list_iter, /* tp_iter */
2793 0, /* tp_iternext */
2794 list_methods, /* tp_methods */
2795 0, /* tp_members */
2796 0, /* tp_getset */
2797 0, /* tp_base */
2798 0, /* tp_dict */
2799 0, /* tp_descr_get */
2800 0, /* tp_descr_set */
2801 0, /* tp_dictoffset */
2802 (initproc)list_init, /* tp_init */
2803 PyType_GenericAlloc, /* tp_alloc */
2804 PyType_GenericNew, /* tp_new */
2805 PyObject_GC_Del, /* tp_free */
Guido van Rossum85a5fbb1990-10-14 12:07:46 +00002806};
Guido van Rossum4c4e7df1998-06-16 15:18:28 +00002807
2808
Raymond Hettinger14bd6de2002-05-31 21:40:38 +00002809/*********************** List Iterator **************************/
2810
2811typedef struct {
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002812 PyObject_HEAD
2813 long it_index;
2814 PyListObject *it_seq; /* Set to NULL when iterator is exhausted */
Raymond Hettinger14bd6de2002-05-31 21:40:38 +00002815} listiterobject;
2816
Anthony Baxter377be112006-04-11 06:54:30 +00002817static PyObject *list_iter(PyObject *);
2818static void listiter_dealloc(listiterobject *);
2819static int listiter_traverse(listiterobject *, visitproc, void *);
2820static PyObject *listiter_next(listiterobject *);
2821static PyObject *listiter_len(listiterobject *);
2822
2823PyDoc_STRVAR(length_hint_doc, "Private method returning an estimate of len(list(it)).");
2824
2825static PyMethodDef listiter_methods[] = {
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002826 {"__length_hint__", (PyCFunction)listiter_len, METH_NOARGS, length_hint_doc},
2827 {NULL, NULL} /* sentinel */
Anthony Baxter377be112006-04-11 06:54:30 +00002828};
2829
2830PyTypeObject PyListIter_Type = {
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002831 PyVarObject_HEAD_INIT(&PyType_Type, 0)
2832 "listiterator", /* tp_name */
2833 sizeof(listiterobject), /* tp_basicsize */
2834 0, /* tp_itemsize */
2835 /* methods */
2836 (destructor)listiter_dealloc, /* tp_dealloc */
2837 0, /* tp_print */
2838 0, /* tp_getattr */
2839 0, /* tp_setattr */
2840 0, /* tp_compare */
2841 0, /* tp_repr */
2842 0, /* tp_as_number */
2843 0, /* tp_as_sequence */
2844 0, /* tp_as_mapping */
2845 0, /* tp_hash */
2846 0, /* tp_call */
2847 0, /* tp_str */
2848 PyObject_GenericGetAttr, /* tp_getattro */
2849 0, /* tp_setattro */
2850 0, /* tp_as_buffer */
2851 Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC,/* tp_flags */
2852 0, /* tp_doc */
2853 (traverseproc)listiter_traverse, /* tp_traverse */
2854 0, /* tp_clear */
2855 0, /* tp_richcompare */
2856 0, /* tp_weaklistoffset */
2857 PyObject_SelfIter, /* tp_iter */
2858 (iternextfunc)listiter_next, /* tp_iternext */
2859 listiter_methods, /* tp_methods */
2860 0, /* tp_members */
Anthony Baxter377be112006-04-11 06:54:30 +00002861};
2862
Raymond Hettinger14bd6de2002-05-31 21:40:38 +00002863
Guido van Rossum5086e492002-07-16 15:56:52 +00002864static PyObject *
Raymond Hettinger14bd6de2002-05-31 21:40:38 +00002865list_iter(PyObject *seq)
2866{
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002867 listiterobject *it;
Raymond Hettinger14bd6de2002-05-31 21:40:38 +00002868
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002869 if (!PyList_Check(seq)) {
2870 PyErr_BadInternalCall();
2871 return NULL;
2872 }
2873 it = PyObject_GC_New(listiterobject, &PyListIter_Type);
2874 if (it == NULL)
2875 return NULL;
2876 it->it_index = 0;
2877 Py_INCREF(seq);
2878 it->it_seq = (PyListObject *)seq;
2879 _PyObject_GC_TRACK(it);
2880 return (PyObject *)it;
Raymond Hettinger14bd6de2002-05-31 21:40:38 +00002881}
2882
2883static void
2884listiter_dealloc(listiterobject *it)
2885{
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002886 _PyObject_GC_UNTRACK(it);
2887 Py_XDECREF(it->it_seq);
2888 PyObject_GC_Del(it);
Raymond Hettinger14bd6de2002-05-31 21:40:38 +00002889}
2890
2891static int
2892listiter_traverse(listiterobject *it, visitproc visit, void *arg)
2893{
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002894 Py_VISIT(it->it_seq);
2895 return 0;
Raymond Hettinger14bd6de2002-05-31 21:40:38 +00002896}
2897
Raymond Hettinger14bd6de2002-05-31 21:40:38 +00002898static PyObject *
Tim Peters93b2cc42002-06-01 05:22:55 +00002899listiter_next(listiterobject *it)
Raymond Hettinger14bd6de2002-05-31 21:40:38 +00002900{
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002901 PyListObject *seq;
2902 PyObject *item;
Raymond Hettinger14bd6de2002-05-31 21:40:38 +00002903
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002904 assert(it != NULL);
2905 seq = it->it_seq;
2906 if (seq == NULL)
2907 return NULL;
2908 assert(PyList_Check(seq));
Raymond Hettinger14bd6de2002-05-31 21:40:38 +00002909
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002910 if (it->it_index < PyList_GET_SIZE(seq)) {
2911 item = PyList_GET_ITEM(seq, it->it_index);
2912 ++it->it_index;
2913 Py_INCREF(item);
2914 return item;
2915 }
Guido van Rossum86103ae2002-07-16 20:07:32 +00002916
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002917 Py_DECREF(seq);
2918 it->it_seq = NULL;
2919 return NULL;
Raymond Hettinger14bd6de2002-05-31 21:40:38 +00002920}
2921
Raymond Hettinger6b27cda2005-09-24 21:23:05 +00002922static PyObject *
Raymond Hettinger435bf582004-03-18 22:43:10 +00002923listiter_len(listiterobject *it)
2924{
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002925 Py_ssize_t len;
2926 if (it->it_seq) {
2927 len = PyList_GET_SIZE(it->it_seq) - it->it_index;
2928 if (len >= 0)
2929 return PyInt_FromSsize_t(len);
2930 }
2931 return PyInt_FromLong(0);
Raymond Hettinger435bf582004-03-18 22:43:10 +00002932}
Anthony Baxter377be112006-04-11 06:54:30 +00002933/*********************** List Reverse Iterator **************************/
Raymond Hettinger435bf582004-03-18 22:43:10 +00002934
Anthony Baxter377be112006-04-11 06:54:30 +00002935typedef struct {
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002936 PyObject_HEAD
2937 Py_ssize_t it_index;
2938 PyListObject *it_seq; /* Set to NULL when iterator is exhausted */
Anthony Baxter377be112006-04-11 06:54:30 +00002939} listreviterobject;
Raymond Hettinger6b27cda2005-09-24 21:23:05 +00002940
Anthony Baxter377be112006-04-11 06:54:30 +00002941static PyObject *list_reversed(PyListObject *, PyObject *);
2942static void listreviter_dealloc(listreviterobject *);
2943static int listreviter_traverse(listreviterobject *, visitproc, void *);
2944static PyObject *listreviter_next(listreviterobject *);
Raymond Hettinger7989a4d2008-12-03 15:42:10 +00002945static PyObject *listreviter_len(listreviterobject *);
Anthony Baxter377be112006-04-11 06:54:30 +00002946
Raymond Hettinger7989a4d2008-12-03 15:42:10 +00002947static PyMethodDef listreviter_methods[] = {
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002948 {"__length_hint__", (PyCFunction)listreviter_len, METH_NOARGS, length_hint_doc},
2949 {NULL, NULL} /* sentinel */
Raymond Hettinger435bf582004-03-18 22:43:10 +00002950};
2951
Anthony Baxter377be112006-04-11 06:54:30 +00002952PyTypeObject PyListRevIter_Type = {
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002953 PyVarObject_HEAD_INIT(&PyType_Type, 0)
2954 "listreverseiterator", /* tp_name */
2955 sizeof(listreviterobject), /* tp_basicsize */
2956 0, /* tp_itemsize */
2957 /* methods */
2958 (destructor)listreviter_dealloc, /* tp_dealloc */
2959 0, /* tp_print */
2960 0, /* tp_getattr */
2961 0, /* tp_setattr */
2962 0, /* tp_compare */
2963 0, /* tp_repr */
2964 0, /* tp_as_number */
2965 0, /* tp_as_sequence */
2966 0, /* tp_as_mapping */
2967 0, /* tp_hash */
2968 0, /* tp_call */
2969 0, /* tp_str */
2970 PyObject_GenericGetAttr, /* tp_getattro */
2971 0, /* tp_setattro */
2972 0, /* tp_as_buffer */
2973 Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC,/* tp_flags */
2974 0, /* tp_doc */
2975 (traverseproc)listreviter_traverse, /* tp_traverse */
2976 0, /* tp_clear */
2977 0, /* tp_richcompare */
2978 0, /* tp_weaklistoffset */
2979 PyObject_SelfIter, /* tp_iter */
2980 (iternextfunc)listreviter_next, /* tp_iternext */
2981 listreviter_methods, /* tp_methods */
2982 0,
Raymond Hettinger14bd6de2002-05-31 21:40:38 +00002983};
Raymond Hettinger1021c442003-11-07 15:38:09 +00002984
Raymond Hettinger1021c442003-11-07 15:38:09 +00002985static PyObject *
2986list_reversed(PyListObject *seq, PyObject *unused)
2987{
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002988 listreviterobject *it;
Raymond Hettinger1021c442003-11-07 15:38:09 +00002989
Antoine Pitrouc83ea132010-05-09 14:46:46 +00002990 it = PyObject_GC_New(listreviterobject, &PyListRevIter_Type);
2991 if (it == NULL)
2992 return NULL;
2993 assert(PyList_Check(seq));
2994 it->it_index = PyList_GET_SIZE(seq) - 1;
2995 Py_INCREF(seq);
2996 it->it_seq = seq;
2997 PyObject_GC_Track(it);
2998 return (PyObject *)it;
Raymond Hettinger1021c442003-11-07 15:38:09 +00002999}
3000
3001static void
3002listreviter_dealloc(listreviterobject *it)
3003{
Antoine Pitrouc83ea132010-05-09 14:46:46 +00003004 PyObject_GC_UnTrack(it);
3005 Py_XDECREF(it->it_seq);
3006 PyObject_GC_Del(it);
Raymond Hettinger1021c442003-11-07 15:38:09 +00003007}
3008
3009static int
3010listreviter_traverse(listreviterobject *it, visitproc visit, void *arg)
3011{
Antoine Pitrouc83ea132010-05-09 14:46:46 +00003012 Py_VISIT(it->it_seq);
3013 return 0;
Raymond Hettinger1021c442003-11-07 15:38:09 +00003014}
3015
3016static PyObject *
3017listreviter_next(listreviterobject *it)
3018{
Antoine Pitrouc83ea132010-05-09 14:46:46 +00003019 PyObject *item;
3020 Py_ssize_t index = it->it_index;
3021 PyListObject *seq = it->it_seq;
Raymond Hettinger1021c442003-11-07 15:38:09 +00003022
Antoine Pitrouc83ea132010-05-09 14:46:46 +00003023 if (index>=0 && index < PyList_GET_SIZE(seq)) {
3024 item = PyList_GET_ITEM(seq, index);
3025 it->it_index--;
3026 Py_INCREF(item);
3027 return item;
3028 }
3029 it->it_index = -1;
3030 if (seq != NULL) {
3031 it->it_seq = NULL;
3032 Py_DECREF(seq);
3033 }
3034 return NULL;
Raymond Hettinger1021c442003-11-07 15:38:09 +00003035}
3036
Raymond Hettinger7989a4d2008-12-03 15:42:10 +00003037static PyObject *
Raymond Hettingeref9bf402004-03-10 10:10:42 +00003038listreviter_len(listreviterobject *it)
3039{
Antoine Pitrouc83ea132010-05-09 14:46:46 +00003040 Py_ssize_t len = it->it_index + 1;
3041 if (it->it_seq == NULL || PyList_GET_SIZE(it->it_seq) < len)
3042 len = 0;
3043 return PyLong_FromSsize_t(len);
Raymond Hettingeref9bf402004-03-10 10:10:42 +00003044}