blob: 62f9662ee6bddd1e61f71f870ca2731c142a178d [file] [log] [blame]
Guido van Rossum0b191782002-08-02 18:29:53 +00001"""Unittests for heapq."""
2
Thomas Wouterscf297e42007-02-23 15:07:44 +00003from heapq import heappush, heappop, heapify, heapreplace, merge, nlargest, nsmallest
Guido van Rossum0b191782002-08-02 18:29:53 +00004import random
Raymond Hettingerbce036b2004-06-10 05:07:18 +00005import unittest
6from test import test_support
Raymond Hettinger2e3dfaf2004-06-13 05:26:33 +00007import sys
Guido van Rossum0b191782002-08-02 18:29:53 +00008
Guido van Rossum0b191782002-08-02 18:29:53 +00009
def heapiter(heap):
    """Yield the elements of *heap* smallest-first, emptying it as it goes.

    Iteration ends when heappop() raises IndexError on the exhausted heap.
    """
    try:
        while True:
            smallest = heappop(heap)
            yield smallest
    except IndexError:
        return
Tim Petersaa7d2432002-08-03 02:11:26 +000017
class TestHeap(unittest.TestCase):
    """Functional tests for the heapq API, checked against sort()/sorted()."""

    def test_push_pop(self):
        # 1) Push 256 random numbers and pop them off, verifying all's OK.
        heap = []
        data = []
        self.check_invariant(heap)
        for i in range(256):
            item = random.random()
            data.append(item)
            heappush(heap, item)
            self.check_invariant(heap)
        results = []
        while heap:
            item = heappop(heap)
            self.check_invariant(heap)
            results.append(item)
        data_sorted = data[:]
        data_sorted.sort()
        self.assertEqual(data_sorted, results)
        # 2) Check that the invariant holds for a sorted array
        self.check_invariant(results)

        self.assertRaises(TypeError, heappush, [])
        # AttributeError is tolerated as well as TypeError, as the original
        # try/except did (presumably for implementations that fail on None
        # through attribute access).  Checking each call on its own ensures
        # the heappop() case is never skipped.
        self.assertRaises((TypeError, AttributeError), heappush, None, None)
        self.assertRaises((TypeError, AttributeError), heappop, None)

    def check_invariant(self, heap):
        """Assert that every element of *heap* is >= its parent element."""
        for pos, item in enumerate(heap):
            if pos:  # pos 0 has no parent
                parentpos = (pos - 1) >> 1
                self.assertTrue(heap[parentpos] <= item)

    def test_heapify(self):
        for size in range(30):
            heap = [random.random() for dummy in range(size)]
            heapify(heap)
            self.check_invariant(heap)

        self.assertRaises(TypeError, heapify, None)

    def test_naive_nbest(self):
        data = [random.randrange(2000) for i in range(1000)]
        heap = []
        for item in data:
            heappush(heap, item)
            if len(heap) > 10:
                heappop(heap)
        heap.sort()
        self.assertEqual(heap, sorted(data)[-10:])

    def test_nbest(self):
        # Less-naive "N-best" algorithm, much faster (if len(data) is big
        # enough <wink>) than sorting all of data.  However, if we had a max
        # heap instead of a min heap, it could go faster still via
        # heapify'ing all of data (linear time), then doing 10 heappops
        # (10 log-time steps).
        data = [random.randrange(2000) for i in range(1000)]
        heap = data[:10]
        heapify(heap)
        for item in data[10:]:
            if item > heap[0]:  # this gets rarer the longer we run
                heapreplace(heap, item)
        self.assertEqual(list(heapiter(heap)), sorted(data)[-10:])

        self.assertRaises(TypeError, heapreplace, None)
        self.assertRaises(TypeError, heapreplace, None, None)
        self.assertRaises(IndexError, heapreplace, [], None)

    def test_heapsort(self):
        # Exercise everything with repeated heapsort checks
        for trial in range(100):
            size = random.randrange(50)
            data = [random.randrange(25) for i in range(size)]
            if trial & 1:  # Half of the time, use heapify
                heap = data[:]
                heapify(heap)
            else:  # The rest of the time, use heappush
                heap = []
                for item in data:
                    heappush(heap, item)
            heap_sorted = [heappop(heap) for i in range(size)]
            self.assertEqual(heap_sorted, sorted(data))

    def test_merge(self):
        inputs = []
        for i in range(random.randrange(5)):
            row = sorted(random.randrange(1000)
                         for j in range(random.randrange(10)))
            inputs.append(row)
        self.assertEqual(sorted(chain(*inputs)), list(merge(*inputs)))
        self.assertEqual(list(merge()), [])

    def test_merge_stability(self):
        class Int(int):
            pass
        inputs = [[], [], [], []]
        for i in range(20000):
            stream = random.randrange(4)
            x = random.randrange(500)
            obj = Int(x)
            # Tag each value with its source stream so that ties between
            # equal values can be checked for stream order afterwards.
            obj.pair = (x, stream)
            inputs[stream].append(obj)
        for stream in inputs:
            stream.sort()
        result = [i.pair for i in merge(*inputs)]
        self.assertEqual(result, sorted(result))

    def test_nsmallest(self):
        data = [(random.randrange(2000), i) for i in range(1000)]
        for n in (0, 1, 2, 10, 100, 400, 999, 1000, 1100):
            # The key-less comparison does not depend on the key function,
            # so it is checked once per n rather than once per key.
            self.assertEqual(list(nsmallest(n, data)), sorted(data)[:n])
            for f in (None, lambda x: x[0] * 547 % 2000):
                self.assertEqual(list(nsmallest(n, data, key=f)),
                                 sorted(data, key=f)[:n])

    def test_nlargest(self):
        data = [(random.randrange(2000), i) for i in range(1000)]
        for n in (0, 1, 2, 10, 100, 400, 999, 1000, 1100):
            # The key-less comparison does not depend on the key function,
            # so it is checked once per n rather than once per key.
            self.assertEqual(list(nlargest(n, data)),
                             sorted(data, reverse=True)[:n])
            for f in (None, lambda x: x[0] * 547 % 2000):
                self.assertEqual(list(nlargest(n, data, key=f)),
                                 sorted(data, key=f, reverse=True)[:n])
Tim Petersaa7d2432002-08-03 02:11:26 +0000145
Raymond Hettinger855d9a92004-09-28 00:03:54 +0000146
147#==============================================================================
148
class LenOnly:
    """Dummy sequence that supports len() but defines no __getitem__."""

    def __len__(self):
        # Fixed, arbitrary length; there are no items behind it.
        return 10
153
class GetOnly:
    """Dummy sequence that supports indexing but defines no __len__."""

    def __getitem__(self, ndx):
        # Every index yields the same value; IndexError is never raised.
        return 10
158
class CmpErr:
    """Dummy element whose every comparison raises ZeroDivisionError."""

    def __cmp__(self, other):
        raise ZeroDivisionError

    # Route all six rich comparisons through the same failing method.
    __eq__ = __cmp__
    __ne__ = __cmp__
    __lt__ = __cmp__
    __le__ = __cmp__
    __gt__ = __cmp__
    __ge__ = __cmp__
Raymond Hettinger855d9a92004-09-28 00:03:54 +0000164
def R(seqn):
    """Regular generator: yield each element of *seqn* in order."""
    for element in seqn:
        yield element
169
class G:
    """Sequence wrapper that exposes *seqn* through __getitem__ only."""

    def __init__(self, seqn):
        self.seqn = seqn

    def __getitem__(self, i):
        wrapped = self.seqn
        return wrapped[i]
176
class I:
    """Iterator over *seqn* implemented with __iter__/__next__."""

    def __init__(self, seqn):
        self.seqn = seqn
        self.i = 0

    def __iter__(self):
        return self

    def __next__(self):
        pos = self.i
        if pos >= len(self.seqn):
            raise StopIteration
        # Read first, then advance, so a failed lookup leaves self.i as is.
        value = self.seqn[pos]
        self.i = pos + 1
        return value
189
class Ig:
    """Iterable over *seqn* whose __iter__ is a generator function."""

    def __init__(self, seqn):
        self.seqn = seqn
        self.i = 0

    def __iter__(self):
        for element in self.seqn:
            yield element
198
class X:
    """Has __next__ but neither __getitem__ nor __iter__, so not iterable."""

    def __init__(self, seqn):
        self.seqn = seqn
        self.i = 0

    def __next__(self):
        pos = self.i
        if pos >= len(self.seqn):
            raise StopIteration
        # Read first, then advance, so a failed lookup leaves self.i as is.
        value = self.seqn[pos]
        self.i = pos + 1
        return value
209
class N:
    """Defines __iter__ returning itself but has no __next__()."""

    def __init__(self, seqn):
        self.seqn = seqn
        self.i = 0

    def __iter__(self):
        return self
217
class E:
    """Iterator whose __next__ always fails, to test exception propagation."""

    def __init__(self, seqn):
        self.seqn = seqn
        self.i = 0

    def __iter__(self):
        return self

    def __next__(self):
        # Deliberate integer division by zero: raises ZeroDivisionError.
        3 // 0
227
class S:
    """Iterator that stops immediately, ignoring the sequence it is given."""

    def __init__(self, seqn):
        pass

    def __iter__(self):
        return self

    def __next__(self):
        raise StopIteration
236
from itertools import chain
try:
    from itertools import imap
except ImportError:
    # itertools.imap does not exist on Python 3, where the built-in map()
    # is already lazy; fall back to it so this module still imports.
    imap = map


def L(seqn):
    """Test multiple tiers of iterators.

    Wraps *seqn* in G, then Ig, then R, maps an identity function over the
    result and feeds that through chain().
    """
    return chain(imap(lambda x: x, R(Ig(G(seqn)))))
241
class TestErrorHandling(unittest.TestCase):
    """Checks that heapq functions reject bad arguments and propagate errors
    raised by elements or by the iterables they consume."""

    def test_non_sequence(self):
        for f in (heapify, heappop):
            self.assertRaises(TypeError, f, 10)
        for f in (heappush, heapreplace, nlargest, nsmallest):
            self.assertRaises(TypeError, f, 10, 10)

    def test_len_only(self):
        for f in (heapify, heappop):
            self.assertRaises(TypeError, f, LenOnly())
        for f in (heappush, heapreplace):
            self.assertRaises(TypeError, f, LenOnly(), 10)
        for f in (nlargest, nsmallest):
            self.assertRaises(TypeError, f, 2, LenOnly())

    def test_get_only(self):
        for f in (heapify, heappop):
            self.assertRaises(TypeError, f, GetOnly())
        for f in (heappush, heapreplace):
            self.assertRaises(TypeError, f, GetOnly(), 10)
        # nlargest/nsmallest are deliberately not exercised with GetOnly:
        # its __getitem__ returns a value for every index and never raises
        # IndexError, so iterating it through the sequence protocol would
        # never terminate.  (This method used to be shadowed by a second
        # test_get_only definition and therefore never ran.)

    def test_cmp_err(self):
        # Previously also named test_get_only, which silently replaced the
        # GetOnly test above in the class namespace.
        seq = [CmpErr(), CmpErr(), CmpErr()]
        for f in (heapify, heappop):
            self.assertRaises(ZeroDivisionError, f, seq)
        for f in (heappush, heapreplace):
            self.assertRaises(ZeroDivisionError, f, seq, 10)
        for f in (nlargest, nsmallest):
            self.assertRaises(ZeroDivisionError, f, 2, seq)

    def test_arg_parsing(self):
        for f in (heapify, heappop, heappush, heapreplace, nlargest, nsmallest):
            self.assertRaises(TypeError, f, 10)

    def test_iterable_args(self):
        for f in (nlargest, nsmallest):
            for s in ("123", "", range(1000), (1, 1.2), range(2000, 2200, 5)):
                # Every working iterable wrapper must give the same answer
                # as the plain sequence.
                for g in (G, I, Ig, L, R):
                    self.assertEqual(list(f(2, g(s))), list(f(2, s)))
                self.assertEqual(list(f(2, S(s))), [])
                self.assertRaises(TypeError, f, 2, X(s))
                self.assertRaises(TypeError, f, 2, N(s))
                self.assertRaises(ZeroDivisionError, f, 2, E(s))
288
289#==============================================================================
290
291
def test_main(verbose=None):
    """Run the heapq test classes through test_support.run_unittest().

    TestHeap always runs; TestErrorHandling is added only when heapify is a
    built-in function.  When *verbose* is true and sys.gettotalrefcount is
    available, the tests are re-run five times and the total reference
    count after each run is collected and printed.
    """
    from types import BuiltinFunctionType

    suites = [TestHeap]
    if isinstance(heapify, BuiltinFunctionType):
        suites.append(TestErrorHandling)
    test_support.run_unittest(*suites)

    # verify reference counting
    if not (verbose and hasattr(sys, "gettotalrefcount")):
        return

    import gc
    counts = []
    for _ in range(5):
        test_support.run_unittest(*suites)
        gc.collect()
        counts.append(sys.gettotalrefcount())
    print(counts)


if __name__ == "__main__":
    test_main(verbose=True)