blob: e0c49c110f6c98112ed936a16f8c66a70c1d0b01 [file] [log] [blame]
Guido van Rossum0b191782002-08-02 18:29:53 +00001"""Unittests for heapq."""
2
Raymond Hettinger2e3dfaf2004-06-13 05:26:33 +00003import sys
Ezio Melotti8269a442011-05-09 07:15:04 +03004import random
Guido van Rossum0b191782002-08-02 18:29:53 +00005
Ezio Melotti8269a442011-05-09 07:15:04 +03006from test import support
7from unittest import TestCase, skipUnless
8
# Two independent imports of heapq: one with the _heapq accelerator blocked,
# one with _heapq imported afresh.  c_heapq may be falsy (the C-dependent
# tests below are guarded with skipUnless(c_heapq, ...)).
py_heapq = support.import_fresh_module('heapq', blocked=['_heapq'])
c_heapq = support.import_fresh_module('heapq', fresh=['_heapq'])

# _heapq.nlargest/nsmallest are saved in heapq._nlargest/_nsmallest when
# _heapq is imported, so check them there
func_names = [
    'heapify',
    'heappop',
    'heappush',
    'heappushpop',
    'heapreplace',
    '_nlargest',
    '_nsmallest',
]
16
class TestModules(TestCase):
    # Checks that each name in func_names resolves to a function that lives
    # in the expected module for the corresponding heapq import.

    def test_py_functions(self):
        # Every function of the blocked-accelerator import reports 'heapq'.
        for name in func_names:
            func = getattr(py_heapq, name)
            self.assertEqual(func.__module__, 'heapq')

    @skipUnless(c_heapq, 'requires _heapq')
    def test_c_functions(self):
        # Every function of the accelerated import reports '_heapq'.
        for name in func_names:
            func = getattr(c_heapq, name)
            self.assertEqual(func.__module__, '_heapq')
26
27
class TestHeap(TestCase):
    """Behavioural tests shared by every heapq implementation under test.

    This class is a template: concrete subclasses bind ``module`` to the
    heapq module object whose functions should be exercised.
    """

    # heapq implementation under test; concrete subclasses override this.
    module = None

    def setUp(self):
        # The template itself has nothing to exercise.  Skip rather than fail
        # with an AttributeError on None when a discovery-based runner
        # collects this class alongside its concrete subclasses.
        if self.module is None:
            self.skipTest('no heapq implementation bound to this class')

    def test_push_pop(self):
        # 1) Push 256 random numbers and pop them off, verifying all's OK.
        heap = []
        data = []
        self.check_invariant(heap)
        for i in range(256):
            item = random.random()
            data.append(item)
            self.module.heappush(heap, item)
            self.check_invariant(heap)
        results = []
        while heap:
            item = self.module.heappop(heap)
            self.check_invariant(heap)
            results.append(item)
        data_sorted = data[:]
        data_sorted.sort()
        self.assertEqual(data_sorted, results)
        # 2) Check that the invariant holds for a sorted array
        self.check_invariant(results)

        self.assertRaises(TypeError, self.module.heappush, [])
        # A non-list heap may surface as TypeError or AttributeError depending
        # on the implementation.  Accept either explicitly so that both calls
        # are always checked; wrapping them in try/except AttributeError would
        # silently skip the heappop check whenever heappush raised
        # AttributeError.
        self.assertRaises((TypeError, AttributeError),
                          self.module.heappush, None, None)
        self.assertRaises((TypeError, AttributeError),
                          self.module.heappop, None)

    def check_invariant(self, heap):
        # Check the heap invariant: no element is smaller than its parent.
        for pos, item in enumerate(heap):
            if pos:  # pos 0 has no parent
                parentpos = (pos - 1) >> 1
                self.assertLessEqual(heap[parentpos], item)

    def test_heapify(self):
        # heapify() must establish the invariant for sizes 0 through 29.
        for size in range(30):
            heap = [random.random() for dummy in range(size)]
            self.module.heapify(heap)
            self.check_invariant(heap)

        self.assertRaises(TypeError, self.module.heapify, None)

    def test_naive_nbest(self):
        # Keep the 10 largest items by pushing everything and popping the
        # smallest whenever the heap grows beyond 10 entries.
        data = [random.randrange(2000) for i in range(1000)]
        heap = []
        for item in data:
            self.module.heappush(heap, item)
            if len(heap) > 10:
                self.module.heappop(heap)
        heap.sort()
        self.assertEqual(heap, sorted(data)[-10:])

    def heapiter(self, heap):
        # An iterator returning a heap's elements, smallest-first.
        # Consumes the heap; stops when heappop() raises IndexError.
        try:
            while True:
                yield self.module.heappop(heap)
        except IndexError:
            pass

    def test_nbest(self):
        # Less-naive "N-best" algorithm, much faster (if len(data) is big
        # enough <wink>) than sorting all of data.  However, if we had a max
        # heap instead of a min heap, it could go faster still via
        # heapify'ing all of data (linear time), then doing 10 heappops
        # (10 log-time steps).
        data = [random.randrange(2000) for i in range(1000)]
        heap = data[:10]
        self.module.heapify(heap)
        for item in data[10:]:
            if item > heap[0]:  # this gets rarer the longer we run
                self.module.heapreplace(heap, item)
        self.assertEqual(list(self.heapiter(heap)), sorted(data)[-10:])

        self.assertRaises(TypeError, self.module.heapreplace, None)
        self.assertRaises(TypeError, self.module.heapreplace, None, None)
        self.assertRaises(IndexError, self.module.heapreplace, [], None)

    def test_nbest_with_pushpop(self):
        # Same N-best selection, driven by heappushpop() on every item.
        data = [random.randrange(2000) for i in range(1000)]
        heap = data[:10]
        self.module.heapify(heap)
        for item in data[10:]:
            self.module.heappushpop(heap, item)
        self.assertEqual(list(self.heapiter(heap)), sorted(data)[-10:])
        self.assertEqual(self.module.heappushpop([], 'x'), 'x')

    def test_heappushpop(self):
        # Empty heap: the pushed item comes straight back.
        h = []
        x = self.module.heappushpop(h, 10)
        self.assertEqual((h, x), ([], 10))

        # Equal values: the heap keeps its int, the pushed float is returned.
        h = [10]
        x = self.module.heappushpop(h, 10.0)
        self.assertEqual((h, x), ([10], 10.0))
        self.assertEqual(type(h[0]), int)
        self.assertEqual(type(x), float)

        # Pushed item smaller than the root: heap is left untouched.
        h = [10]
        x = self.module.heappushpop(h, 9)
        self.assertEqual((h, x), ([10], 9))

        # Pushed item larger than the root: the root is swapped out.
        h = [10]
        x = self.module.heappushpop(h, 11)
        self.assertEqual((h, x), ([11], 10))

    def test_heapsort(self):
        # Exercise everything with repeated heapsort checks
        for trial in range(100):
            size = random.randrange(50)
            data = [random.randrange(25) for i in range(size)]
            if trial & 1:  # Half of the time, use heapify
                heap = data[:]
                self.module.heapify(heap)
            else:  # The rest of the time, use heappush
                heap = []
                for item in data:
                    self.module.heappush(heap, item)
            heap_sorted = [self.module.heappop(heap) for i in range(size)]
            self.assertEqual(heap_sorted, sorted(data))

    def test_merge(self):
        # merge() of sorted rows must equal sorting their concatenation.
        inputs = []
        for i in range(random.randrange(5)):
            row = sorted(random.randrange(1000)
                         for j in range(random.randrange(10)))
            inputs.append(row)
        self.assertEqual(sorted(chain(*inputs)),
                         list(self.module.merge(*inputs)))
        self.assertEqual(list(self.module.merge()), [])

    def test_merge_stability(self):
        # Each value is tagged with (value, stream index); if merge() is
        # stable the tags come out already sorted.
        class Int(int):
            pass
        inputs = [[], [], [], []]
        for i in range(20000):
            stream = random.randrange(4)
            x = random.randrange(500)
            obj = Int(x)
            obj.pair = (x, stream)
            inputs[stream].append(obj)
        for stream in inputs:
            stream.sort()
        result = [i.pair for i in self.module.merge(*inputs)]
        self.assertEqual(result, sorted(result))

    def test_nsmallest(self):
        # Compare against slicing a full sort, with and without a key, for
        # n below, at and above len(data).
        data = [(random.randrange(2000), i) for i in range(1000)]
        for f in (None, lambda x: x[0] * 547 % 2000):
            for n in (0, 1, 2, 10, 100, 400, 999, 1000, 1100):
                self.assertEqual(list(self.module.nsmallest(n, data)),
                                 sorted(data)[:n])
                self.assertEqual(list(self.module.nsmallest(n, data, key=f)),
                                 sorted(data, key=f)[:n])

    def test_nlargest(self):
        # Mirror image of test_nsmallest, against a reversed full sort.
        data = [(random.randrange(2000), i) for i in range(1000)]
        for f in (None, lambda x: x[0] * 547 % 2000):
            for n in (0, 1, 2, 10, 100, 400, 999, 1000, 1100):
                self.assertEqual(list(self.module.nlargest(n, data)),
                                 sorted(data, reverse=True)[:n])
                self.assertEqual(list(self.module.nlargest(n, data, key=f)),
                                 sorted(data, key=f, reverse=True)[:n])

    def test_comparison_operator(self):
        # Issue 3051: Make sure heapq works with objects that define only
        # __lt__.  For python 3.0, __le__ alone is not enough.
        def hsort(data, comp):
            # Heap-sort *data* after wrapping every value in *comp*.
            data = [comp(x) for x in data]
            self.module.heapify(data)
            return [self.module.heappop(data).x for i in range(len(data))]

        class LT:
            # Inverted __lt__, so a heap-sort yields descending order.
            def __init__(self, x):
                self.x = x

            def __lt__(self, other):
                return self.x > other.x

        class LE:
            # Defines __le__ only; ordering with "<" is unsupported.
            def __init__(self, x):
                self.x = x

            def __le__(self, other):
                return self.x >= other.x

        data = [random.random() for i in range(100)]
        target = sorted(data, reverse=True)
        self.assertEqual(hsort(data, LT), target)
        # The callable under test must be hsort.  Passing the list itself
        # ("data") would raise TypeError merely because a list is not
        # callable, and the heap functions would never see an LE object.
        self.assertRaises(TypeError, hsort, data, LE)
Amaury Forgeot d'Arcfdfe62d2008-06-17 20:36:03 +0000215
Raymond Hettinger855d9a92004-09-28 00:03:54 +0000216
class TestHeapPython(TestHeap):
    # Runs the shared TestHeap cases against py_heapq, the heapq import made
    # with the _heapq accelerator blocked.
    module = py_heapq
219
220
# The whole class is skipped when c_heapq is falsy.
@skipUnless(c_heapq, 'requires _heapq')
class TestHeapC(TestHeap):
    # Runs the shared TestHeap cases against c_heapq, the heapq import made
    # with _heapq imported afresh.
    module = c_heapq
224
225
Raymond Hettinger855d9a92004-09-28 00:03:54 +0000226#==============================================================================
227
class LenOnly:
    """Sequence stand-in that reports a length but offers no __getitem__."""

    def __len__(self):
        # Fixed, arbitrary size; nothing backs it.
        return 10
232
class GetOnly:
    """Sequence stand-in that can be indexed but offers no __len__."""

    def __getitem__(self, ndx):
        # The same value comes back for every index; IndexError is never
        # raised.
        return 10
237
class CmpErr:
    """Element for which every rich comparison raises ZeroDivisionError."""

    def __eq__(self, other):
        raise ZeroDivisionError

    # The five remaining comparison operators share the very same function.
    __ne__ = __eq__
    __lt__ = __eq__
    __le__ = __eq__
    __gt__ = __eq__
    __ge__ = __eq__
Raymond Hettinger855d9a92004-09-28 00:03:54 +0000243
def R(seqn):
    """Plain generator that relays the items of *seqn* one at a time."""
    # iter() is called inside the generator body, so nothing is touched
    # until the first item is requested.
    source = iter(seqn)
    while True:
        try:
            item = next(source)
        except StopIteration:
            return
        yield item
248
class G:
    """Wrapper exposing *seqn* through __getitem__ only."""

    def __init__(self, seqn):
        self.seqn = seqn

    def __getitem__(self, i):
        # Straight delegation; any error raised by the wrapped object
        # propagates unchanged.
        wrapped = self.seqn
        return wrapped[i]
255
class I:
    """Hand-written iterator over *seqn* (defines __iter__ and __next__)."""

    def __init__(self, seqn):
        self.i = 0          # index of the next item to hand out
        self.seqn = seqn

    def __iter__(self):
        return self

    def __next__(self):
        if self.i < len(self.seqn):
            value = self.seqn[self.i]
            self.i += 1
            return value
        raise StopIteration
268
class Ig:
    """Iterable whose __iter__ is written as a generator function."""

    def __init__(self, seqn):
        self.i = 0          # set for parity with the sibling helpers; unused
        self.seqn = seqn

    def __iter__(self):
        # Every call starts a fresh pass over the wrapped object.
        source = self.seqn
        for item in source:
            yield item
277
class X:
    """Has __next__ but neither __iter__ nor __getitem__."""

    def __init__(self, seqn):
        self.i = 0          # index of the next item to hand out
        self.seqn = seqn

    def __next__(self):
        if self.i < len(self.seqn):
            value = self.seqn[self.i]
            self.i += 1
            return value
        raise StopIteration
288
class N:
    """Claims to be its own iterator but defines no __next__()."""

    def __init__(self, seqn):
        self.i = 0
        self.seqn = seqn

    def __iter__(self):
        return self
296
class E:
    """Iterator whose __next__ always fails with ZeroDivisionError."""

    def __init__(self, seqn):
        self.i = 0
        self.seqn = seqn

    def __iter__(self):
        return self

    def __next__(self):
        # Deliberate integer division by zero; used to check that errors
        # raised during iteration reach the caller.
        3 // 0
306
class S:
    """Iterator that is exhausted from the very first __next__ call."""

    def __init__(self, seqn):
        # The argument is accepted for signature parity and then ignored.
        pass

    def __iter__(self):
        return self

    def __next__(self):
        raise StopIteration
315
Raymond Hettinger736c0ab2008-03-13 02:09:15 +0000316from itertools import chain
def L(seqn):
    """Stack several iterator layers (G -> Ig -> R -> map -> chain)."""
    indexed = G(seqn)
    regenerated = Ig(indexed)
    relayed = R(regenerated)
    return chain(map(lambda x: x, relayed))
Raymond Hettinger855d9a92004-09-28 00:03:54 +0000320
Ezio Melotti8269a442011-05-09 07:15:04 +0300321
class TestErrorHandling(TestCase):
    """Error-path tests shared by every heapq implementation under test.

    This class is a template: concrete subclasses bind ``module`` to the
    heapq module object whose functions should be exercised.
    """

    # heapq implementation under test; concrete subclasses override this.
    module = None

    def setUp(self):
        # The template itself has nothing to exercise.  Skip rather than fail
        # with an AttributeError on None when a discovery-based runner
        # collects this class alongside its concrete subclasses.
        if self.module is None:
            self.skipTest('no heapq implementation bound to this class')

    def test_non_sequence(self):
        # An int in place of the heap / iterable must be rejected.
        for f in (self.module.heapify, self.module.heappop):
            self.assertRaises((TypeError, AttributeError), f, 10)
        for f in (self.module.heappush, self.module.heapreplace,
                  self.module.nlargest, self.module.nsmallest):
            self.assertRaises((TypeError, AttributeError), f, 10, 10)

    def test_len_only(self):
        # An object with __len__ but no __getitem__ must be rejected.
        for f in (self.module.heapify, self.module.heappop):
            self.assertRaises((TypeError, AttributeError), f, LenOnly())
        for f in (self.module.heappush, self.module.heapreplace):
            self.assertRaises((TypeError, AttributeError), f, LenOnly(), 10)
        for f in (self.module.nlargest, self.module.nsmallest):
            self.assertRaises(TypeError, f, 2, LenOnly())

    def test_get_only(self):
        # An object with __getitem__ but no __len__ must be rejected as a
        # heap.  Either exception type is accepted, as in test_len_only.
        for f in (self.module.heapify, self.module.heappop):
            self.assertRaises((TypeError, AttributeError), f, GetOnly())
        for f in (self.module.heappush, self.module.heapreplace):
            self.assertRaises((TypeError, AttributeError), f, GetOnly(), 10)
        # nlargest/nsmallest are deliberately not exercised here.  They
        # accept __getitem__-only iterables (see test_iterable_args), and
        # GetOnly.__getitem__ returns a value for every index without ever
        # raising IndexError, so consuming it would not terminate.

    def test_cmp_err(self):
        # An exception raised by an element comparison must propagate.
        # (This test must not reuse the name test_get_only: a second
        # definition under that name replaces the first in the class body,
        # so only one of the two would ever run.)
        seq = [CmpErr(), CmpErr(), CmpErr()]
        for f in (self.module.heapify, self.module.heappop):
            self.assertRaises(ZeroDivisionError, f, seq)
        for f in (self.module.heappush, self.module.heapreplace):
            self.assertRaises(ZeroDivisionError, f, seq, 10)
        for f in (self.module.nlargest, self.module.nsmallest):
            self.assertRaises(ZeroDivisionError, f, 2, seq)

    def test_arg_parsing(self):
        # A single int argument is invalid for every function.
        for f in (self.module.heapify, self.module.heappop,
                  self.module.heappush, self.module.heapreplace,
                  self.module.nlargest, self.module.nsmallest):
            self.assertRaises((TypeError, AttributeError), f, 10)

    def test_iterable_args(self):
        # nlargest/nsmallest must give the same answer for every working
        # iterable wrapper, and fail cleanly for the broken ones.
        for f in (self.module.nlargest, self.module.nsmallest):
            for s in ("123", "", range(1000), (1, 1.2),
                      range(2000, 2200, 5)):
                for g in (G, I, Ig, L, R):
                    self.assertEqual(list(f(2, g(s))), list(f(2, s)))
                self.assertEqual(list(f(2, S(s))), [])
                self.assertRaises(TypeError, f, 2, X(s))
                self.assertRaises(TypeError, f, 2, N(s))
                self.assertRaises(ZeroDivisionError, f, 2, E(s))
372
Christian Heimesd3eb5a152008-02-24 00:38:49 +0000373
class TestErrorHandlingPython(TestErrorHandling):
    # Runs the shared TestErrorHandling cases against py_heapq, the heapq
    # import made with the _heapq accelerator blocked.
    module = py_heapq
376
# The whole class is skipped when c_heapq is falsy.
@skipUnless(c_heapq, 'requires _heapq')
class TestErrorHandlingC(TestErrorHandling):
    # Runs the shared TestErrorHandling cases against c_heapq, the heapq
    # import made with _heapq imported afresh.
    module = c_heapq
380
Raymond Hettinger855d9a92004-09-28 00:03:54 +0000381
382#==============================================================================
383
384
def test_main(verbose=None):
    """Run every concrete test class of this module.

    When *verbose* is true and the interpreter exposes
    ``sys.gettotalrefcount``, the classes are run five more times and the
    total reference count observed after each run is printed as a list.
    """
    suites = [TestModules, TestHeapPython, TestHeapC,
              TestErrorHandlingPython, TestErrorHandlingC]
    support.run_unittest(*suites)

    # verify reference counting
    if not (verbose and hasattr(sys, "gettotalrefcount")):
        return
    import gc
    counts = [None] * 5
    for run in range(len(counts)):
        support.run_unittest(*suites)
        gc.collect()
        counts[run] = sys.gettotalrefcount()
    print(counts)
Guido van Rossum0b191782002-08-02 18:29:53 +0000399
# Executing this file directly runs the suite with verbose=True, which also
# enables the reference-count report in test_main when it is available.
if __name__ == "__main__":
    test_main(verbose=True)