blob: 05da5dcc0fe6895a273397781ce2f2a5c1d0735b [file] [log] [blame]
/***********************************************************
Copyright 1991-1995 by Stichting Mathematisch Centrum, Amsterdam,
The Netherlands.
All Rights Reserved
Permission to use, copy, modify, and distribute this software and its
documentation for any purpose and without fee is hereby granted,
provided that the above copyright notice appear in all copies and that
both that copyright notice and this permission notice appear in
supporting documentation, and that the names of Stichting Mathematisch
Centrum or CWI or Corporation for National Research Initiatives or
CNRI not be used in advertising or publicity pertaining to
distribution of the software without specific, written prior
permission.
While CWI is the initial source for this software, a modified version
is made available by the Corporation for National Research Initiatives
(CNRI) at the Internet address ftp://ftp.python.org.
STICHTING MATHEMATISCH CENTRUM AND CNRI DISCLAIM ALL WARRANTIES WITH
REGARD TO THIS SOFTWARE, INCLUDING ALL IMPLIED WARRANTIES OF
MERCHANTABILITY AND FITNESS, IN NO EVENT SHALL STICHTING MATHEMATISCH
CENTRUM OR CNRI BE LIABLE FOR ANY SPECIAL, INDIRECT OR CONSEQUENTIAL
DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR
PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER
TORTIOUS ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR
PERFORMANCE OF THIS SOFTWARE.
******************************************************************/
/* List object implementation */
#include "Python.h"
#ifdef STDC_HEADERS
#include <stddef.h>
#else
#include <sys/types.h> /* For size_t */
#endif
#include <limits.h> /* For INT_MAX */
/* Round n up to the next multiple of block (n itself when it already
   is a multiple). */
#define ROUNDUP(n, block) \
	((((n) + (block) - 1) / (block)) * (block))

/* Return the number of item slots to allocate for a list of n items:
   n rounded up to a multiple of 10 while n is below 500, and to a
   multiple of 100 from 500 on. */
static int
roundupsize(n)
	int n;
{
	int granule = (n < 500) ? 10 : 100;

	return ROUNDUP(n, granule);
}

/* Resize var through PyMem_RESIZE to roundupsize(nitems) elements of
   the given type. */
#define NRESIZE(var, type, nitems) PyMem_RESIZE(var, type, roundupsize(nitems))
/* Create a new list object with exactly size item slots, every slot
   set to NULL.  Returns NULL after reporting an error when size is
   negative or when memory cannot be obtained. */
PyObject *
PyList_New(size)
	int size;
{
	PyListObject *list;
	PyObject **slots;
	size_t nbytes;
	int k;

	if (size < 0) {
		PyErr_BadInternalCall();
		return NULL;
	}
	/* Detect wrap-around in size * sizeof(PyObject *). */
	nbytes = size * sizeof(PyObject *);
	if (nbytes / sizeof(PyObject *) != (size_t)size)
		return PyErr_NoMemory();

	list = (PyListObject *) malloc(sizeof(PyListObject));
	if (list == NULL)
		return PyErr_NoMemory();

	/* An empty list carries no item array at all. */
	slots = NULL;
	if (size > 0) {
		slots = (PyObject **) malloc(nbytes);
		if (slots == NULL) {
			free((ANY *)list);
			return PyErr_NoMemory();
		}
	}
	list->ob_item = slots;
	list->ob_type = &PyList_Type;
	list->ob_size = size;
	for (k = 0; k < size; k++)
		slots[k] = NULL;
	_Py_NewReference(list);
	return (PyObject *) list;
}
/* Return the number of items in list op, or -1 (after reporting a bad
   internal call) when op is not a list. */
int
PyList_Size(op)
	PyObject *op;
{
	if (PyList_Check(op))
		return ((PyListObject *)op)->ob_size;

	PyErr_BadInternalCall();
	return -1;
}
static PyObject *indexerr;
PyObject *
PyList_GetItem(op, i)
PyObject *op;
int i;
{
if (!PyList_Check(op)) {
PyErr_BadInternalCall();
return NULL;
}
if (i < 0 || i >= ((PyListObject *)op) -> ob_size) {
if (indexerr == NULL)
indexerr = PyString_FromString(
"list index out of range");
PyErr_SetObject(PyExc_IndexError, indexerr);
return NULL;
}
return ((PyListObject *)op) -> ob_item[i];
}
int
PyList_SetItem(op, i, newitem)
register PyObject *op;
register int i;
register PyObject *newitem;
{
register PyObject *olditem;
register PyObject **p;
if (!PyList_Check(op)) {
Py_XDECREF(newitem);
PyErr_BadInternalCall();
return -1;
}
if (i < 0 || i >= ((PyListObject *)op) -> ob_size) {
Py_XDECREF(newitem);
PyErr_SetString(PyExc_IndexError,
"list assignment index out of range");
return -1;
}
p = ((PyListObject *)op) -> ob_item + i;
olditem = *p;
*p = newitem;
Py_XDECREF(olditem);
return 0;
}
/* Insert v into self in front of index 'where', taking a new
   reference to v.  'where' is clamped to [0, size], so a large value
   appends.  Returns 0 on success, -1 with an error set when v is NULL
   or the item array cannot be grown. */
static int
ins1(self, where, v)
	PyListObject *self;
	int where;
	PyObject *v;
{
	PyObject **slots;
	int oldsize, k;

	if (v == NULL) {
		PyErr_BadInternalCall();
		return -1;
	}
	oldsize = self->ob_size;
	slots = self->ob_item;
	NRESIZE(slots, PyObject *, oldsize + 1);
	if (slots == NULL) {
		PyErr_NoMemory();
		return -1;
	}
	if (where < 0)
		where = 0;
	else if (where > oldsize)
		where = oldsize;
	/* Shift the tail up by one slot to open a gap at 'where'. */
	for (k = oldsize; k > where; k--)
		slots[k] = slots[k-1];
	Py_INCREF(v);
	slots[where] = v;
	self->ob_item = slots;
	self->ob_size = oldsize + 1;
	return 0;
}
/* Insert newitem into list op in front of index 'where' (see ins1).
   Returns 0 on success and -1 on failure, including when op is not a
   list. */
int
PyList_Insert(op, where, newitem)
	PyObject *op;
	int where;
	PyObject *newitem;
{
	if (PyList_Check(op))
		return ins1((PyListObject *)op, where, newitem);

	PyErr_BadInternalCall();
	return -1;
}
int
PyList_Append(op, newitem)
PyObject *op;
PyObject *newitem;
{
if (!PyList_Check(op)) {
PyErr_BadInternalCall();
return -1;
}
return ins1((PyListObject *)op,
(int) ((PyListObject *)op)->ob_size, newitem);
}
/* Methods */
/* Destructor: release every item (front to back), then the item array
   and the list object itself. */
static void
list_dealloc(op)
	PyListObject *op;
{
	int k;

	if (op->ob_item != NULL) {
		k = 0;
		while (k < op->ob_size) {
			Py_XDECREF(op->ob_item[k]);
			k++;
		}
		free((ANY *)op->ob_item);
	}
	free((ANY *)op);
}
/* Print list op to fp as "[item, item, ...]".  A list that is already
   being printed or repr'ed further up the call chain is shown as
   "[...]".  The flags argument is not used; items are always printed
   with flags 0.  Returns 0 on success, a negative value on error. */
static int
list_print(op, fp, flags)
	PyListObject *op;
	FILE *fp;
	int flags;
{
	int status, k;

	status = Py_ReprEnter((PyObject*)op);
	if (status < 0)
		return status;
	if (status > 0) {
		fprintf(fp, "[...]");
		return 0;
	}
	fprintf(fp, "[");
	for (k = 0; k < op->ob_size; k++) {
		if (k != 0)
			fprintf(fp, ", ");
		if (PyObject_Print(op->ob_item[k], fp, 0) != 0) {
			Py_ReprLeave((PyObject *)op);
			return -1;
		}
	}
	fprintf(fp, "]");
	Py_ReprLeave((PyObject *)op);
	return 0;
}
/* Build the string representation "[repr, repr, ...]" of list v.
   A list that is already being repr'ed further up the call chain
   yields "[...]".  Returns a new string object, or NULL on error. */
static PyObject *
list_repr(v)
	PyListObject *v;
{
	PyObject *result, *sep;
	int status, k;

	status = Py_ReprEnter((PyObject*)v);
	if (status > 0)
		return PyString_FromString("[...]");
	if (status < 0)
		return NULL;

	result = PyString_FromString("[");
	sep = PyString_FromString(", ");
	/* Stop early once result has become NULL. */
	k = 0;
	while (k < v->ob_size && result != NULL) {
		if (k > 0)
			PyString_Concat(&result, sep);
		PyString_ConcatAndDel(&result, PyObject_Repr(v->ob_item[k]));
		k++;
	}
	Py_XDECREF(sep);
	PyString_ConcatAndDel(&result, PyString_FromString("]"));
	Py_ReprLeave((PyObject *)v);
	return result;
}
/* Compare lists v and w item by item.  The first pair that compares
   unequal decides the result; if one list is a prefix of the other,
   the difference of the sizes is returned. */
static int
list_compare(v, w)
	PyListObject *v, *w;
{
	int k = 0;

	while (k < v->ob_size && k < w->ob_size) {
		int outcome = PyObject_Compare(v->ob_item[k], w->ob_item[k]);
		if (outcome != 0)
			return outcome;
		k++;
	}
	return v->ob_size - w->ob_size;
}
/* sq_length slot: return the number of items in list a. */
static int
list_length(a)
	PyListObject *a;
{
	int length = a->ob_size;

	return length;
}
/* sq_item slot: return a new reference to item i of list a, or NULL
   with IndexError set when i is outside [0, size). */
static PyObject *
list_item(a, i)
	PyListObject *a;
	int i;
{
	if (i >= 0 && i < a->ob_size) {
		Py_INCREF(a->ob_item[i]);
		return a->ob_item[i];
	}
	if (indexerr == NULL)
		indexerr = PyString_FromString(
			"list index out of range");
	PyErr_SetObject(PyExc_IndexError, indexerr);
	return NULL;
}
/* sq_slice slot: return a new list holding new references to the
   items a[ilow:ihigh].  Both bounds are clamped to the list, and
   ihigh is raised to ilow when it lies below it, so the result may be
   empty.  Returns NULL when the new list cannot be created. */
static PyObject *
list_slice(a, ilow, ihigh)
	PyListObject *a;
	int ilow, ihigh;
{
	PyListObject *np;
	int count, k;

	if (ilow < 0)
		ilow = 0;
	else if (ilow > a->ob_size)
		ilow = a->ob_size;
	if (ihigh < ilow)
		ihigh = ilow;
	else if (ihigh > a->ob_size)
		ihigh = a->ob_size;

	count = ihigh - ilow;
	np = (PyListObject *) PyList_New(count);
	if (np == NULL)
		return NULL;
	for (k = 0; k < count; k++) {
		PyObject *v = a->ob_item[ilow + k];
		Py_INCREF(v);
		np->ob_item[k] = v;
	}
	return (PyObject *)np;
}
/* Return a new list containing a[ilow:ihigh] (see list_slice), or
   NULL with an error set when a is not a list. */
PyObject *
PyList_GetSlice(a, ilow, ihigh)
	PyObject *a;
	int ilow, ihigh;
{
	if (PyList_Check(a))
		return list_slice((PyListObject *)a, ilow, ihigh);

	PyErr_BadInternalCall();
	return NULL;
}
/* sq_concat slot: return a new list holding the items of a followed
   by the items of bb (new references to each).  bb must be a list;
   otherwise a bad-argument error is reported.  Returns NULL on error,
   including when the combined length would not fit in an int. */
static PyObject *
list_concat(a, bb)
	PyListObject *a;
	PyObject *bb;
{
	int size;
	int i;
	PyListObject *np;
	if (!PyList_Check(bb)) {
		PyErr_BadArgument();
		return NULL;
	}
#define b ((PyListObject *)bb)
	/* Check before adding: an overflowing sum would otherwise reach
	   PyList_New() as a negative size and be reported as a bad
	   internal call rather than as running out of memory. */
	if (b->ob_size > INT_MAX - a->ob_size)
		return PyErr_NoMemory();
	size = a->ob_size + b->ob_size;
	np = (PyListObject *) PyList_New(size);
	if (np == NULL) {
		return NULL;
	}
	for (i = 0; i < a->ob_size; i++) {
		PyObject *v = a->ob_item[i];
		Py_INCREF(v);
		np->ob_item[i] = v;
	}
	for (i = 0; i < b->ob_size; i++) {
		PyObject *v = b->ob_item[i];
		Py_INCREF(v);
		np->ob_item[i + a->ob_size] = v;
	}
	return (PyObject *)np;
#undef b
}
/* sq_repeat slot: return a new list consisting of n copies of the
   items of a (new references to each).  A negative n is treated as 0
   and yields an empty list.  Returns NULL on error, including when
   the result length would not fit in an int. */
static PyObject *
list_repeat(a, n)
	PyListObject *a;
	int n;
{
	int i, j;
	int size;
	PyListObject *np;
	PyObject **p;
	if (n < 0)
		n = 0;
	/* Check before multiplying: a product that wraps around to a
	   small positive value would make the copy loops below write
	   far beyond the array PyList_New() allocated. */
	if (n > 0 && a->ob_size > INT_MAX / n)
		return PyErr_NoMemory();
	size = a->ob_size * n;
	np = (PyListObject *) PyList_New(size);
	if (np == NULL)
		return NULL;
	p = np->ob_item;
	for (i = 0; i < n; i++) {
		for (j = 0; j < a->ob_size; j++) {
			*p = a->ob_item[j];
			Py_INCREF(*p);
			p++;
		}
	}
	return (PyObject *) np;
}
/* sq_ass_slice slot: replace a[ilow:ihigh] by the items of list v, or
   delete that slice when v is NULL.  The bounds are clamped to the
   list first.  v must be a list (or NULL); "a[i:j] = a" is handled by
   assigning from a copy.  Returns 0 on success and -1 with an error
   set on failure; if the failure is an allocation failure detected
   before any item is moved, the list is left unchanged. */
static int
list_ass_slice(a, ilow, ihigh, v)
	PyListObject *a;
	int ilow, ihigh;
	PyObject *v;
{
	/* Because [X]DECREF can recursively invoke list operations on
	   this list, we must postpone all [X]DECREF activity until
	   after the list is back in its canonical shape.  Therefore
	   we must allocate an additional array, 'recycle', into which
	   we temporarily copy the items that are deleted from the
	   list. :-( */
	PyObject **recycle, **p;
	PyObject **item;
	int n; /* Size of replacement list */
	int d; /* Change in size */
	int k; /* Loop index */
#define b ((PyListObject *)v)
	if (v == NULL)
		n = 0;
	else if (PyList_Check(v)) {
		n = b->ob_size;
		if (a == b) {
			/* Special case "a[i:j] = a" -- copy b first */
			int ret;
			v = list_slice(b, 0, n);
			/* Without this check a failed copy would be
			   taken for "delete the slice" by the recursive
			   call, and the Py_DECREF below would be applied
			   to NULL. */
			if (v == NULL)
				return -1;
			ret = list_ass_slice(a, ilow, ihigh, v);
			Py_DECREF(v);
			return ret;
		}
	}
	else {
		PyErr_BadArgument();
		return -1;
	}
	if (ilow < 0)
		ilow = 0;
	else if (ilow > a->ob_size)
		ilow = a->ob_size;
	if (ihigh < ilow)
		ihigh = ilow;
	else if (ihigh > a->ob_size)
		ihigh = a->ob_size;
	item = a->ob_item;
	d = n - (ihigh-ilow);
	if (ihigh > ilow) {
		p = recycle = PyMem_NEW(PyObject *, (ihigh-ilow));
		/* The loops below store through p unconditionally, so
		   an allocation failure must be caught here, before
		   the list has been touched. */
		if (recycle == NULL) {
			PyErr_NoMemory();
			return -1;
		}
	}
	else
		p = recycle = NULL;
	if (d <= 0) { /* Delete -d items; recycle ihigh-ilow items */
		for (k = ilow; k < ihigh; k++)
			*p++ = item[k];
		if (d < 0) {
			for (/*k = ihigh*/; k < a->ob_size; k++)
				item[k+d] = item[k];
			a->ob_size += d;
			NRESIZE(item, PyObject *, a->ob_size); /* Can't fail */
			a->ob_item = item;
		}
	}
	else { /* Insert d items; recycle ihigh-ilow items */
		NRESIZE(item, PyObject *, a->ob_size + d);
		if (item == NULL) {
			PyMem_XDEL(recycle);
			PyErr_NoMemory();
			return -1;
		}
		for (k = a->ob_size; --k >= ihigh; )
			item[k+d] = item[k];
		for (/*k = ihigh-1*/; k >= ilow; --k)
			*p++ = item[k];
		a->ob_item = item;
		a->ob_size += d;
	}
	/* Fill the slice with new references to the replacement items. */
	for (k = 0; k < n; k++, ilow++) {
		PyObject *w = b->ob_item[k];
		Py_XINCREF(w);
		item[ilow] = w;
	}
	/* The list is consistent again; now the removed items may be
	   released. */
	if (recycle) {
		while (--p >= recycle)
			Py_XDECREF(*p);
		PyMem_DEL(recycle);
	}
	return 0;
#undef b
}
/* Replace a[ilow:ihigh] by the items of list v, or delete the slice
   when v is NULL (see list_ass_slice).  Returns 0 on success and -1
   on failure, including when a is not a list. */
int
PyList_SetSlice(a, ilow, ihigh, v)
	PyObject *a;
	int ilow, ihigh;
	PyObject *v;
{
	if (PyList_Check(a))
		return list_ass_slice((PyListObject *)a, ilow, ihigh, v);

	PyErr_BadInternalCall();
	return -1;
}
/* sq_ass_item slot: store a new reference to v in a[i], or delete
   a[i] when v is NULL.  Returns 0 on success, -1 with IndexError set
   when i is out of range. */
static int
list_ass_item(a, i, v)
	PyListObject *a;
	int i;
	PyObject *v;
{
	PyObject *previous;

	if (i < 0 || i >= a->ob_size) {
		PyErr_SetString(PyExc_IndexError,
				"list assignment index out of range");
		return -1;
	}
	if (v != NULL) {
		/* Plain replacement: swap in the new item, then drop
		   the old one. */
		Py_INCREF(v);
		previous = a->ob_item[i];
		a->ob_item[i] = v;
		Py_DECREF(previous);
		return 0;
	}
	/* Deletion is a one-item slice deletion. */
	return list_ass_slice(a, i, i+1, v);
}
/* Method-level wrapper around ins1(): returns a new reference to None
   on success and NULL on failure. */
static PyObject *
ins(self, where, v)
	PyListObject *self;
	int where;
	PyObject *v;
{
	if (ins1(self, where, v) == 0) {
		Py_INCREF(Py_None);
		return Py_None;
	}
	return NULL;
}
/* L.insert(index, object): parse an (int, object) argument pair and
   insert the object in front of the index. */
static PyObject *
listinsert(self, args)
	PyListObject *self;
	PyObject *args;
{
	int where;
	PyObject *item;

	if (PyArg_Parse(args, "(iO)", &where, &item))
		return ins(self, where, item);
	return NULL;
}
/* L.append(object): parse a single object argument and insert it at
   the end of the list. */
static PyObject *
listappend(self, args)
	PyListObject *self;
	PyObject *args;
{
	PyObject *item;

	if (PyArg_Parse(args, "O", &item))
		return ins(self, (int) self->ob_size, item);
	return NULL;
}
/* L.extend(list): append new references to all items of the argument
   list to self.  The argument must be a list; a.extend(a) is handled
   by extending from a temporary copy.  Returns a new reference to
   None, or NULL with an error set. */
static PyObject *
listextend(self, args)
	PyListObject *self;
	PyObject *args;
{
	PyObject *other = NULL;
	PyObject *result;
	PyObject **slots;
	int oldlen = PyList_GET_SIZE(self);
	int addlen;
	register int k;

	if (!PyArg_ParseTuple(args, "O", &other))
		return NULL;
	if (!PyList_Check(other)) {
		PyErr_SetString(PyExc_TypeError,
				"list.extend() argument must be a list");
		return NULL;
	}
	if (PyList_GET_SIZE(other) == 0) {
		/* Nothing to add. */
		Py_INCREF(Py_None);
		return Py_None;
	}

	/* From here on this function owns one reference to 'other',
	   whichever branch is taken, and must release it before
	   returning. */
	if (self != (PyListObject*)other) {
		Py_INCREF(other);
	}
	else {
		/* a.extend(a): work from a private copy of the items. */
		other = PyList_New(oldlen);
		if (!other)
			return NULL;
		for (k = 0; k < oldlen; k++) {
			PyObject *o = PyList_GET_ITEM(self, k);
			Py_INCREF(o);
			PyList_SET_ITEM(other, k, o);
		}
	}
	addlen = PyList_GET_SIZE(other);

	/* Grow self's item array to hold both sets of items. */
	slots = self->ob_item;
	NRESIZE(slots, PyObject*, oldlen + addlen);
	if (slots == NULL ) {
		PyErr_NoMemory();
		Py_XDECREF(other);
		return NULL;
	}
	self->ob_item = slots;

	/* Copy the new items onto the end of self. */
	for (k = 0; k < addlen; k++) {
		PyObject *o = PyList_GET_ITEM(other, k);
		Py_INCREF(o);
		PyList_SET_ITEM(self, self->ob_size++, o);
	}
	result = Py_None;
	Py_INCREF(result);
	Py_XDECREF(other);
	return result;
}
/* L.pop([index]): remove the item at index (default -1, the last
   item; negative indices count from the end) and return it.  Returns
   NULL with IndexError set when the list is empty or the index is out
   of range. */
static PyObject *
listpop(self, args)
	PyListObject *self;
	PyObject *args;
{
	int index = -1;
	PyObject *item;

	if (!PyArg_ParseTuple(args, "|i", &index))
		return NULL;
	if (self->ob_size == 0) {
		/* Special-case most common failure cause */
		PyErr_SetString(PyExc_IndexError, "pop from empty list");
		return NULL;
	}
	if (index < 0)
		index += self->ob_size;
	if (index < 0 || index >= self->ob_size) {
		PyErr_SetString(PyExc_IndexError, "pop index out of range");
		return NULL;
	}
	/* Hold our own reference before the list gives up its one. */
	item = self->ob_item[index];
	Py_INCREF(item);
	if (list_ass_slice(self, index, index+1, (PyObject *)NULL) == 0)
		return item;
	Py_DECREF(item);
	return NULL;
}
/* New quicksort implementation for arrays of object pointers.
Thanks to discussions with Tim Peters. */
/* CMPERROR is returned by our comparison function when an error
occurred. It is the int with only the top bit set, i.e. the most
negative int (0x80000000 when int is 32 bits wide). The expression
below computes the bit position as 8*sizeof(int) - 1, so it assumes
8-bit bytes. */
#define CMPERROR ( (int) ((unsigned int)1 << (8*sizeof(int) - 1)) )
/* Comparison function.  Compares x and y by calling the user-supplied
   comparison function 'compare' (any callable Python object), or the
   standard comparison function, PyObject_Compare(), if compare is
   NULL.

   Returns CMPERROR when an error occurred.  With a user-supplied
   function, which must return an int object, the result is normalized
   to -1, 0 or 1; with the standard comparison the value of
   PyObject_Compare() is passed through. */
static int
docompare(x, y, compare)
	PyObject *x;
	PyObject *y;
	PyObject *compare;
{
	PyObject *args, *res;
	int i;
	long outcome;

	if (compare == NULL) {
		i = PyObject_Compare(x, y);
		if (i && PyErr_Occurred())
			i = CMPERROR;
		return i;
	}
	args = Py_BuildValue("(OO)", x, y);
	if (args == NULL)
		return CMPERROR;
	res = PyEval_CallObject(compare, args);
	Py_DECREF(args);
	if (res == NULL)
		return CMPERROR;
	if (!PyInt_Check(res)) {
		Py_DECREF(res);
		PyErr_SetString(PyExc_TypeError,
				"comparison function must return int");
		return CMPERROR;
	}
	/* Test the sign on the full long value: squeezing it into an int
	   first could flip the sign or turn a nonzero result into 0 on
	   platforms where long is wider than int. */
	outcome = PyInt_AsLong(res);
	Py_DECREF(res);
	if (outcome < 0)
		return -1;
	if (outcome > 0)
		return 1;
	return 0;
}
/* MINSIZE is the smallest array that will get a full-blown samplesort
treatment; smaller arrays are sorted using binary insertion. It must
be at least 7 for the samplesort implementation to work. Binary
insertion does fewer compares, but can suffer O(N**2) data movement.
The more expensive compares, the larger MINSIZE should be. */
#define MINSIZE 100
/* MINPARTITIONSIZE is the smallest array slice samplesort will bother to
partition; smaller slices are passed to binarysort. It must be at
least 2, and no larger than MINSIZE. Setting it higher reduces the #
of compares slowly, but increases the amount of data movement quickly.
The value here was chosen assuming a compare costs ~25x more than
swapping a pair of memory-resident pointers -- but under that assumption,
changing the value by a few dozen more or less has aggregate effect
under 1%. So the value is crucial, but not touchy <wink>. */
#define MINPARTITIONSIZE 40
/* MAXMERGE is the largest number of elements we'll always merge into
a known-to-be sorted chunk via binary insertion, regardless of the
size of that chunk. Given a chunk of N sorted elements, and a group
of K unknowns, the largest K for which it's better to do insertion
(than a full-blown sort) is a complicated function of N and K mostly
involving the expected number of compares and data moves under each
approach, and the relative cost of those operations on a specific
architecture. The fixed value here is conservative, and should be a
clear win regardless of architecture or N. */
#define MAXMERGE 15
/* STACKSIZE is the size of our work stack. A rough estimate is that
this allows us to sort arrays of size N where
N / ln(N) = MINPARTITIONSIZE * 2**STACKSIZE, so 60 is more than enough
for arrays of size 2**64. Because we push the biggest partition
first, the worst case occurs when all subarrays are always partitioned
exactly in two. */
#define STACKSIZE 60
/* SETK(X,Y) stores docompare(X, Y, compare) in k and jumps to the label
"fail" when the comparison reported an error (CMPERROR). It relies on
the enclosing function providing an int variable k, a variable compare
and a label fail. Caution: it expands to a bare if statement without an
else, so do not use it as the unbraced body of an if/else. */
#define SETK(X,Y) if ((k = docompare(X,Y,compare))==CMPERROR) goto fail
/* binarysort sorts the contiguous slice [lo, hi) by binary insertion.
   It is the method of choice for small arrays: few compares, but the
   data movement can be quadratic in the number of elements.

   The caller must guarantee lo <= start <= hi and that [lo, start) is
   already sorted (pass start == lo when nothing is known).

   Returns 0 on success and -1 when docompare complains (returns
   CMPERROR).  Even in case of error the slice is still some
   permutation of the input: nothing is lost or duplicated. */
static int
binarysort(lo, hi, start, compare)
	PyObject **lo;
	PyObject **hi;
	PyObject **start;
	PyObject *compare;/* Comparison function object, or NULL for default */
{
	register int k;		/* result of the latest SETK */
	register PyObject **left, **right, **mid, **slot;
	register PyObject *pivot;

	/* A single element is trivially sorted. */
	if (start == lo)
		++start;
	while (start < hi) {
		/* Binary search in the sorted prefix [lo, start) for the
		   position where *start belongs. */
		pivot = *start;
		left = lo;
		right = start;
		do {
			mid = left + ((right - left) >> 1);
			SETK(pivot, *mid);
			if (k < 0)
				right = mid;
			else
				left = mid + 1;
		} while (left < right);
		/* The pivot goes at left: slide the elements above it up
		   by one to make room.  A plain loop is used on purpose;
		   memmove is much slower under MSVC 5 and we are not
		   usually moving many slots. */
		for (slot = start; slot > left; --slot)
			slot[0] = slot[-1];
		*left = pivot;
		++start;
	}
	return 0;

 fail:
	return -1;
}
/* samplesortslice is the sorting workhorse.
[lo, hi) is a contiguous slice of a list, to be sorted in place.
On entry, must have lo <= hi,
If docompare complains (returns CMPERROR) return -1, else 0.
Even in case of error, the output slice will be some permutation of
the input (nothing is lost or duplicated).
samplesort is basically quicksort on steroids: a power of 2 close
to n/ln(n) is computed, and that many elements (less 1) are picked at
random from the array and sorted. These 2**k - 1 elements are then
used as preselected pivots for an equal number of quicksort
partitioning steps, partitioning the slice into 2**k chunks each of
size about ln(n). These small final chunks are then usually handled
by binarysort. Note that when k=1, this is roughly the same as an
ordinary quicksort using a random pivot, and when k=2 this is roughly
a median-of-3 quicksort. From that view, using k ~= lg(n/ln(n)) makes
this a "median of n/ln(n)" quicksort. You can also view it as a kind
of bucket sort, where 2**k-1 bucket boundaries are picked dynamically.
The large number of samples makes a quadratic-time case almost
impossible, and asymptotically drives the average-case number of
compares from quicksort's 2 N ln N (or 12/7 N ln N for the median-of-
3 variant) down to N lg N.
We also play lots of low-level tricks to cut the number of compares.
Very obscure: To avoid using extra memory, the PPs are stored in the
array and shuffled around as partitioning proceeds. At the start of a
partitioning step, we'll have 2**m-1 (for some m) PPs in sorted order,
adjacent (either on the left or the right!) to a chunk of X elements
that are to be partitioned: P X or X P. In either case we need to
shuffle things *in place* so that the 2**(m-1) smaller PPs are on the
left, followed by the PP to be used for this step (that's the middle
of the PPs), followed by X, followed by the 2**(m-1) larger PPs:
P X or X P -> Psmall pivot X Plarge
and the order of the PPs must not be altered. It can take a while
to realize this isn't trivial! It can take even longer <wink> to
understand why the simple code below works, using only 2**(m-1) swaps.
The key is that the order of the X elements isn't necessarily
preserved: X can end up as some cyclic permutation of its original
order. That's OK, because X is unsorted anyway. If the order of X
had to be preserved too, the simplest method I know of using O(1)
scratch storage requires len(X) + 2**(m-1) swaps, spread over 2 passes.
Since len(X) is typically several times larger than 2**(m-1), that
would slow things down.
*/
/* One entry of the work stack used by samplesortslice(): a slice that
still has to be sorted, together with the preselected pivots (PPs)
that belong to it. */
struct SamplesortStackNode {
/* Represents a slice of the array, from (& including) lo up
to (but excluding) hi. "extra" additional & adjacent elements
are pre-selected pivots (PPs), spanning [lo-extra, lo) if
extra > 0, or [hi, hi-extra) if extra < 0. The PPs are
already sorted, but nothing is known about the other elements
in [lo, hi). |extra| is always one less than a power of 2.
When extra is 0, we're out of PPs, and the slice must be
sorted by some other means. */
PyObject **lo; /* first element of the slice */
PyObject **hi; /* one past the last element of the slice */
int extra; /* signed PP count; the sign says which side the PPs are on */
};
/* The number of PPs we want is 2**k - 1, where 2**k is as close to
N / ln(N) as possible. So k ~= lg(N / ln(N)). Calling libm routines
is undesirable, so cutoff values are canned in the "cutoff" table
below: cutoff[i] is the smallest N such that k == CUTOFFBASE + i. */
/* CUTOFFBASE is the value of k that corresponds to cutoff[0]. */
#define CUTOFFBASE 4
/* Increasing table of array sizes; samplesortslice() scans it from the
front for the first entry that is larger than n. */
static long cutoff[] = {
43, /* smallest N such that k == 4 */
106, /* etc */
250,
576,
1298,
2885,
6339,
13805,
29843,
64116,
137030,
291554,
617916,
1305130,
2748295,
5771662,
12091672,
25276798,
52734615,
109820537,
228324027,
473977813,
982548444, /* smallest N such that k == 26 */
2034159050 /* largest N that fits in signed 32-bit; k == 27 */
};
/* Sort the slice [lo, hi) in place, comparing elements with docompare()
(through SETK) using 'compare', which is NULL for the default
comparison. Returns 0 on success and -1 as soon as a comparison, a
binarysort() call or a recursive call reports an error. Already sorted
and reverse-sorted input (possibly followed by a few stray elements) and
small arrays are finished by binarysort(); everything else goes through
the partitioning loop, which keeps pending slices on a local work stack. */
static int
samplesortslice(lo, hi, compare)
PyObject **lo;
PyObject **hi;
PyObject *compare;/* Comparison function object, or NULL for default */
{
register PyObject **l, **r;
register PyObject *tmp, *pivot;
register int k;
int n, extra, top, extraOnRight;
/* Pending slices; "top" is the index of the next free slot. */
struct SamplesortStackNode stack[STACKSIZE];
/* assert lo <= hi */
n = hi - lo;
/* ----------------------------------------------------------
* Special cases
* --------------------------------------------------------*/
if (n < 2)
return 0;
/* Set r to the largest value such that [lo,r) is sorted.
This catches the already-sorted case, the all-the-same
case, and the appended-a-few-elements-to-a-sorted-list case.
If the array is unsorted, we're very likely to get out of
the loop fast, so the test is cheap if it doesn't pay off.
*/
/* assert lo < hi */
for (r = lo+1; r < hi; ++r) {
SETK(*r, *(r-1));
if (k < 0)
break;
}
/* [lo,r) is sorted, [r,hi) unknown. Get out cheap if there are
few unknowns, or few elements in total. */
if (hi - r <= MAXMERGE || n < MINSIZE)
return binarysort(lo, hi, r, compare);
/* Check for the array already being reverse-sorted. Typical
benchmark-driven silliness <wink>. */
/* assert lo < hi */
for (r = lo+1; r < hi; ++r) {
SETK(*(r-1), *r);
if (k < 0)
break;
}
if (hi - r <= MAXMERGE) {
/* Reverse the reversed prefix, then insert the tail */
PyObject **originalr = r;
l = lo;
do {
--r;
tmp = *l; *l = *r; *r = tmp;
++l;
} while (l < r);
return binarysort(lo, hi, originalr, compare);
}
/* ----------------------------------------------------------
* Normal case setup: a large array without obvious pattern.
* --------------------------------------------------------*/
/* extra := a power of 2 ~= n/ln(n), less 1.
First find the smallest extra s.t. n < cutoff[extra] */
for (extra = 0;
extra < sizeof(cutoff) / sizeof(cutoff[0]);
++extra) {
if (n < cutoff[extra])
break;
/* note that if we fall out of the loop, the value of
extra still makes *sense*, but may be smaller than
we would like (but the array has more than ~= 2**31
elements in this case!) */
}
/* Now k == extra - 1 + CUTOFFBASE. The smallest value k can
have is CUTOFFBASE-1, so
assert MINSIZE >= 2**(CUTOFFBASE-1) - 1 */
extra = (1 << (extra - 1 + CUTOFFBASE)) - 1;
/* assert extra > 0 and n >= extra */
/* Swap that many values to the start of the array. The
selection of elements is pseudo-random, but the same on
every run (this is intentional! timing algorithm changes is
a pain if timing varies across runs). */
{
unsigned int seed = n / extra; /* arbitrary */
unsigned int i;
for (i = 0; i < (unsigned)extra; ++i) {
/* j := random int in [i, n) */
unsigned int j;
/* multiply-and-add step on an unsigned int */
seed = seed * 69069 + 7;
j = i + seed % (n - i);
tmp = lo[i]; lo[i] = lo[j]; lo[j] = tmp;
}
}
/* Recursively sort the preselected pivots. */
if (samplesortslice(lo, lo + extra, compare) < 0)
goto fail;
top = 0; /* index of available stack slot */
lo += extra; /* point to first unknown */
extraOnRight = 0; /* the PPs are at the left end */
/* ----------------------------------------------------------
* Partition [lo, hi), and repeat until out of work.
* --------------------------------------------------------*/
for (;;) {
/* assert lo <= hi, so n >= 0 */
n = hi - lo;
/* We may not want, or may not be able, to partition:
If n is small, it's quicker to insert.
If extra is 0, we're out of pivots, and *must* use
another method.
*/
if (n < MINPARTITIONSIZE || extra == 0) {
if (n >= MINSIZE) {
/* assert extra == 0
This is rare, since the average size
of a final block is only about
ln(original n). */
if (samplesortslice(lo, hi, compare) < 0)
goto fail;
}
else {
/* Binary insertion should be quicker,
and we can take advantage of the PPs
already being sorted. */
if (extraOnRight && extra) {
/* swap the PPs to the left end */
k = extra;
do {
tmp = *lo;
*lo = *hi;
*hi = tmp;
++lo; ++hi;
} while (--k);
}
if (binarysort(lo - extra, hi, lo,
compare) < 0)
goto fail;
}
/* Find another slice to work on. */
if (--top < 0)
break; /* no more -- done! */
lo = stack[top].lo;
hi = stack[top].hi;
extra = stack[top].extra;
extraOnRight = 0;
/* a negative count on the stack marks PPs on the right */
if (extra < 0) {
extraOnRight = 1;
extra = -extra;
}
continue;
}
/* Pretend the PPs are indexed 0, 1, ..., extra-1.
Then our preselected pivot is at (extra-1)/2, and we
want to move the PPs before that to the left end of
the slice, and the PPs after that to the right end.
The following section changes extra, lo, hi, and the
slice such that:
[lo-extra, lo) contains the smaller PPs.
*lo == our PP.
(lo, hi) contains the unknown elements.
[hi, hi+extra) contains the larger PPs.
*/
k = extra >>= 1; /* num PPs to move */
if (extraOnRight) {
/* Swap the smaller PPs to the left end.
Note that this loop actually moves k+1 items:
the last is our PP */
do {
tmp = *lo; *lo = *hi; *hi = tmp;
++lo; ++hi;
} while (k--);
}
else {
/* Swap the larger PPs to the right end. */
while (k--) {
--lo; --hi;
tmp = *lo; *lo = *hi; *hi = tmp;
}
}
--lo; /* *lo is now our PP */
pivot = *lo;
/* Now an almost-ordinary quicksort partition step.
Note that most of the time is spent here!
Only odd thing is that we partition into < and >=,
instead of the usual <= and >=. This helps when
there are lots of duplicates of different values,
because it eventually tends to make subfiles
"pure" (all duplicates), and we special-case for
duplicates later. */
l = lo + 1;
r = hi - 1;
/* assert lo < l < r < hi (small n weeded out above) */
do {
/* slide l right, looking for key >= pivot */
do {
SETK(*l, pivot);
if (k < 0)
++l;
else
break;
} while (l < r);
/* slide r left, looking for key < pivot */
while (l < r) {
register PyObject *rval = *r--;
SETK(rval, pivot);
if (k < 0) {
/* swap and advance */
r[1] = *l;
*l++ = rval;
break;
}
}
} while (l < r);
/* assert lo < r <= l < hi
assert r == l or r+1 == l
everything to the left of l is < pivot, and
everything to the right of r is >= pivot */
if (l == r) {
SETK(*r, pivot);
if (k < 0)
++l;
else
--r;
}
/* assert lo <= r and r+1 == l and l <= hi
assert r == lo or a[r] < pivot
assert a[lo] is pivot
assert l == hi or a[l] >= pivot
Swap the pivot into "the middle", so we can henceforth
ignore it.
*/
*lo = *r;
*r = pivot;
/* The following is true now, & will be preserved:
All in [lo,r) are < pivot
All in [r,l) == pivot (& so can be ignored)
All in [l,hi) are >= pivot */
/* Check for duplicates of the pivot. One compare is
wasted if there are no duplicates, but can win big
when there are.
Tricky: we're sticking to "<" compares, so deduce
equality indirectly. We know pivot <= *l, so they're
equal iff not pivot < *l.
*/
while (l < hi) {
/* pivot <= *l known */
SETK(pivot, *l);
if (k < 0)
break;
else
/* <= and not < implies == */
++l;
}
/* assert lo <= r < l <= hi
Partitions are [lo, r) and [l, hi) */
/* push fattest first; remember we still have extra PPs
to the left of the left chunk and to the right of
the right chunk! */
/* assert top < STACKSIZE */
if (r - lo <= hi - l) {
/* second is bigger */
stack[top].lo = l;
stack[top].hi = hi;
stack[top].extra = -extra;
hi = r;
extraOnRight = 0;
}
else {
/* first is bigger */
stack[top].lo = lo;
stack[top].hi = r;
stack[top].extra = extra;
lo = l;
extraOnRight = 1;
}
++top;
} /* end of partitioning loop */
return 0;
/* Reached through SETK or after a failed binarysort()/recursive call. */
fail:
return -1;
}
/* SETK depends on locals of the two sort routines; retire it here. */
#undef SETK
/* Defined near the end of this file; needed here by listsort(). */
staticforward PyTypeObject immutable_list_type;

/* L.sort([cmpfunc]): sort the list in place with samplesortslice().
   While the sort runs, the list's type is switched to
   immutable_list_type and restored afterwards, whether or not the
   sort succeeded.  Returns a new reference to None, or NULL when the
   sort reported an error. */
static PyObject *
listsort(self, compare)
	PyListObject *self;
	PyObject *compare;
{
	int status;

	self->ob_type = &immutable_list_type;
	status = samplesortslice(self->ob_item,
				 self->ob_item + self->ob_size,
				 compare);
	self->ob_type = &PyList_Type;
	if (status >= 0) {
		Py_INCREF(Py_None);
		return Py_None;
	}
	return NULL;
}
/* Sort list v in place using the default comparison.  Returns 0 on
   success and -1 on failure, including when v is NULL or not a
   list. */
int
PyList_Sort(v)
	PyObject *v;
{
	PyObject *outcome;

	if (v == NULL || !PyList_Check(v)) {
		PyErr_BadInternalCall();
		return -1;
	}
	outcome = listsort((PyListObject *)v, (PyObject *)NULL);
	if (outcome == NULL)
		return -1;
	/* Only the success/failure distinction is of interest. */
	Py_DECREF(outcome);
	return 0;
}
/* L.reverse(): reverse the order of the items in place.  Takes no
   arguments (args must be NULL).  Returns a new reference to None, or
   NULL with an error set when arguments were passed. */
static PyObject *
listreverse(self, args)
	PyListObject *self;
	PyObject *args;
{
	register PyObject **head, **tail;
	register PyObject *held;

	if (args != NULL) {
		PyErr_BadArgument();
		return NULL;
	}
	if (self->ob_size > 1) {
		/* Swap from both ends until the pointers meet. */
		head = self->ob_item;
		tail = self->ob_item + self->ob_size - 1;
		while (head < tail) {
			held = *head;
			*head = *tail;
			*tail = held;
			head++;
			tail--;
		}
	}
	Py_INCREF(Py_None);
	return Py_None;
}
/* Reverse list v in place.  Returns 0 on success and -1 on failure,
   including when v is NULL or not a list. */
int
PyList_Reverse(v)
	PyObject *v;
{
	PyObject *outcome;

	if (v == NULL || !PyList_Check(v)) {
		PyErr_BadInternalCall();
		return -1;
	}
	outcome = listreverse((PyListObject *)v, (PyObject *)NULL);
	if (outcome == NULL)
		return -1;
	/* Only the success/failure distinction is of interest. */
	Py_DECREF(outcome);
	return 0;
}
PyObject *
PyList_AsTuple(v)
PyObject *v;
{
PyObject *w;
PyObject **p;
int n;
if (v == NULL || !PyList_Check(v)) {
PyErr_BadInternalCall();
return NULL;
}
n = ((PyListObject *)v)->ob_size;
w = PyTuple_New(n);
if (w == NULL)
return NULL;
p = ((PyTupleObject *)w)->ob_item;
memcpy((ANY *)p,
(ANY *)((PyListObject *)v)->ob_item,
n*sizeof(PyObject *));
while (--n >= 0) {
Py_INCREF(*p);
p++;
}
return w;
}
/* L.index(value): return, as an int object, the index of the first
   item that compares equal to the argument.  Returns NULL with
   ValueError set when there is no such item, or with whatever error a
   comparison raised. */
static PyObject *
listindex(self, args)
	PyListObject *self;
	PyObject *args;
{
	int k;

	if (args == NULL) {
		PyErr_BadArgument();
		return NULL;
	}
	k = 0;
	while (k < self->ob_size) {
		if (PyObject_Compare(self->ob_item[k], args) == 0)
			return PyInt_FromLong((long)k);
		if (PyErr_Occurred())
			return NULL;
		k++;
	}
	PyErr_SetString(PyExc_ValueError, "list.index(x): x not in list");
	return NULL;
}
/* L.count(value): return, as an int object, the number of items that
   compare equal to the argument.  Returns NULL with an error set when
   the argument is missing or a comparison raised an error. */
static PyObject *
listcount(self, args)
	PyListObject *self;
	PyObject *args;
{
	int matches = 0;
	int k;

	if (args == NULL) {
		PyErr_SetString(PyExc_TypeError,
				"list.count(x): argument missing");
		return NULL;
	}
	k = 0;
	while (k < self->ob_size) {
		if (PyObject_Compare(self->ob_item[k], args) == 0)
			matches++;
		if (PyErr_Occurred())
			return NULL;
		k++;
	}
	return PyInt_FromLong((long)matches);
}
/* L.remove(value): delete the first item that compares equal to the
   argument.  Returns a new reference to None on success; NULL with
   ValueError set when there is no such item, or with whatever error a
   comparison or the deletion raised. */
static PyObject *
listremove(self, args)
	PyListObject *self;
	PyObject *args;
{
	int k;

	if (args == NULL) {
		PyErr_BadArgument();
		return NULL;
	}
	k = 0;
	while (k < self->ob_size) {
		if (PyObject_Compare(self->ob_item[k], args) == 0) {
			/* Found it: delete the one-item slice. */
			if (list_ass_slice(self, k, k+1,
					   (PyObject *)NULL) != 0)
				return NULL;
			Py_INCREF(Py_None);
			return Py_None;
		}
		if (PyErr_Occurred())
			return NULL;
		k++;
	}
	PyErr_SetString(PyExc_ValueError, "list.remove(x): x not in list");
	return NULL;
}
/* Documentation strings for the list methods; each one is referenced
from the matching entry of the list_methods table. */
static char append_doc[] =
"L.append(object) -- append object to end";
static char extend_doc[] =
"L.extend(list) -- extend list by appending list elements";
static char insert_doc[] =
"L.insert(index, object) -- insert object before index";
static char pop_doc[] =
"L.pop([index]) -> item -- remove and return item at index (default last)";
static char remove_doc[] =
"L.remove(value) -- remove first occurrence of value";
static char index_doc[] =
"L.index(value) -> integer -- return index of first occurrence of value";
static char count_doc[] =
"L.count(value) -> integer -- return number of occurrences of value";
static char reverse_doc[] =
"L.reverse() -- reverse *IN PLACE*";
static char sort_doc[] =
"L.sort([cmpfunc]) -- sort *IN PLACE*; if given, cmpfunc(x, y) -> -1, 0, 1";
/* Method table for list objects, searched by list_getattr() through
Py_FindMethod(). Each entry is {name, C function, flags, doc string}.
The entries with flags 1 (extend, pop) are the ones whose functions
parse args with PyArg_ParseTuple(); the functions of the flags 0
entries use PyArg_Parse() or look at args directly. */
static PyMethodDef list_methods[] = {
{"append", (PyCFunction)listappend, 0, append_doc},
{"insert", (PyCFunction)listinsert, 0, insert_doc},
{"extend", (PyCFunction)listextend, 1, extend_doc},
{"pop", (PyCFunction)listpop, 1, pop_doc},
{"remove", (PyCFunction)listremove, 0, remove_doc},
{"index", (PyCFunction)listindex, 0, index_doc},
{"count", (PyCFunction)listcount, 0, count_doc},
{"reverse", (PyCFunction)listreverse, 0, reverse_doc},
{"sort", (PyCFunction)listsort, 0, sort_doc},
{NULL, NULL} /* sentinel */
};
/* tp_getattr slot: look up attribute 'name' of list f in the
   list_methods table. */
static PyObject *
list_getattr(f, name)
	PyListObject *f;
	char *name;
{
	PyObject *self = (PyObject *)f;

	return Py_FindMethod(list_methods, self, name);
}
/* Sequence slots for list objects, installed as tp_as_sequence of
PyList_Type. The trailing comments name the slot each function fills. */
static PySequenceMethods list_as_sequence = {
(inquiry)list_length, /*sq_length*/
(binaryfunc)list_concat, /*sq_concat*/
(intargfunc)list_repeat, /*sq_repeat*/
(intargfunc)list_item, /*sq_item*/
(intintargfunc)list_slice, /*sq_slice*/
(intobjargproc)list_ass_item, /*sq_ass_item*/
(intintobjargproc)list_ass_slice, /*sq_ass_slice*/
};
/* The type object for lists. It connects the functions defined in this
file to the type slots named in the trailing comments.
NOTE(review): the four unlabelled initializers after the head are
presumably ob_size, tp_name, tp_basicsize and tp_itemsize -- confirm
against the PyTypeObject declaration. */
PyTypeObject PyList_Type = {
PyObject_HEAD_INIT(&PyType_Type)
0,
"list",
sizeof(PyListObject),
0,
(destructor)list_dealloc, /*tp_dealloc*/
(printfunc)list_print, /*tp_print*/
(getattrfunc)list_getattr, /*tp_getattr*/
0, /*tp_setattr*/
(cmpfunc)list_compare, /*tp_compare*/
(reprfunc)list_repr, /*tp_repr*/
0, /*tp_as_number*/
&list_as_sequence, /*tp_as_sequence*/
0, /*tp_as_mapping*/
};
/* During a sort, we really can't have anyone modifying the list; it could
cause core dumps. Thus, we substitute a dummy type that raises an
explanatory exception when a modifying operation is used. Caveat:
comparisons may behave differently; but I guess it's a bad idea anyway to
compare a list that's being sorted... */
/* Stand-in for every modifying method while a list is being sorted:
   sets TypeError and returns NULL.  Declared without parameters so it
   can be used wherever a method function is expected. */
static PyObject *
immutable_list_op(/*No args!*/)
{
	static char complaint[] =
		"a list cannot be modified while it is being sorted";

	PyErr_SetString(PyExc_TypeError, complaint);
	return NULL;
}
/* Method table used while a list is being sorted (see
   immutable_list_getattr).  It mirrors list_methods: the read-only
   methods (index, count) keep their normal implementation, and every
   method that would modify the list is routed to immutable_list_op(),
   which raises an explanatory TypeError.  "extend" and "pop" are
   listed too, so that they report that error rather than simply not
   being found during a sort. */
static PyMethodDef immutable_list_methods[] = {
	{"append",	(PyCFunction)immutable_list_op},
	{"insert",	(PyCFunction)immutable_list_op},
	{"extend",	(PyCFunction)immutable_list_op},
	{"pop",		(PyCFunction)immutable_list_op},
	{"remove",	(PyCFunction)immutable_list_op},
	{"index",	(PyCFunction)listindex},
	{"count",	(PyCFunction)listcount},
	{"reverse",	(PyCFunction)immutable_list_op},
	{"sort",	(PyCFunction)immutable_list_op},
	{NULL,		NULL}		/* sentinel */
};
/* tp_getattr slot of the during-sort type: look up attribute 'name'
   of list f in the immutable_list_methods table. */
static PyObject *
immutable_list_getattr(f, name)
	PyListObject *f;
	char *name;
{
	PyObject *self = (PyObject *)f;

	return Py_FindMethod(immutable_list_methods, self, name);
}
/* Stand-in for the item and slice assignment slots while a list is
   being sorted: sets the same TypeError as immutable_list_op() and
   returns -1. */
static int
immutable_list_ass(/*No args!*/)
{
	/* Called only for the error it sets; its NULL result carries
	   no further information. */
	(void) immutable_list_op();
	return -1;
}
/* Sequence slots used while a list is being sorted. The reading slots
are the same functions as in list_as_sequence; the two assignment slots
are replaced by immutable_list_ass, which always fails. */
static PySequenceMethods immutable_list_as_sequence = {
(inquiry)list_length, /*sq_length*/
(binaryfunc)list_concat, /*sq_concat*/
(intargfunc)list_repeat, /*sq_repeat*/
(intargfunc)list_item, /*sq_item*/
(intintargfunc)list_slice, /*sq_slice*/
(intobjargproc)immutable_list_ass, /*sq_ass_item*/
(intintobjargproc)immutable_list_ass, /*sq_ass_slice*/
};
/* Temporary type that listsort() installs in a list for the duration of
a sort. Printing, repr and the reading sequence slots work as for an
ordinary list; attribute lookup and item/slice assignment go through
the immutable_* variants above.
NOTE(review): the four unlabelled initializers after the head are
presumably ob_size, tp_name, tp_basicsize and tp_itemsize -- confirm
against the PyTypeObject declaration. */
static PyTypeObject immutable_list_type = {
PyObject_HEAD_INIT(&PyType_Type)
0,
"list (immutable, during sort)",
sizeof(PyListObject),
0,
0, /*tp_dealloc*/ /* Cannot happen */
(printfunc)list_print, /*tp_print*/
(getattrfunc)immutable_list_getattr, /*tp_getattr*/
0, /*tp_setattr*/
0, /*tp_compare*/ /* Won't be called */
(reprfunc)list_repr, /*tp_repr*/
0, /*tp_as_number*/
&immutable_list_as_sequence, /*tp_as_sequence*/
0, /*tp_as_mapping*/
};