Guido van Rossum | 0b19178 | 2002-08-02 18:29:53 +0000 | [diff] [blame] | 1 | """Unittests for heapq.""" |
| 2 | |
Thomas Wouters | cf297e4 | 2007-02-23 15:07:44 +0000 | [diff] [blame] | 3 | from heapq import heappush, heappop, heapify, heapreplace, merge, nlargest, nsmallest |
Guido van Rossum | 0b19178 | 2002-08-02 18:29:53 +0000 | [diff] [blame] | 4 | import random |
Raymond Hettinger | bce036b | 2004-06-10 05:07:18 +0000 | [diff] [blame] | 5 | import unittest |
| 6 | from test import test_support |
Raymond Hettinger | 2e3dfaf | 2004-06-13 05:26:33 +0000 | [diff] [blame] | 7 | import sys |
Guido van Rossum | 0b19178 | 2002-08-02 18:29:53 +0000 | [diff] [blame] | 8 | |
Guido van Rossum | 0b19178 | 2002-08-02 18:29:53 +0000 | [diff] [blame] | 9 | |
def heapiter(heap):
    """Yield the items of *heap* smallest-first, popping each one off.

    The heap is consumed: once the generator is exhausted, *heap* is empty.
    Iteration ends when heappop() raises IndexError.
    """
    while True:
        # Only the pop is guarded, so an IndexError thrown into the
        # generator by its consumer is not silently swallowed.
        try:
            smallest = heappop(heap)
        except IndexError:
            return
        yield smallest
Tim Peters | aa7d243 | 2002-08-03 02:11:26 +0000 | [diff] [blame] | 17 | |
Raymond Hettinger | bce036b | 2004-06-10 05:07:18 +0000 | [diff] [blame] | 18 | class TestHeap(unittest.TestCase): |
Tim Peters | aa7d243 | 2002-08-03 02:11:26 +0000 | [diff] [blame] | 19 | |
Raymond Hettinger | bce036b | 2004-06-10 05:07:18 +0000 | [diff] [blame] | 20 | def test_push_pop(self): |
| 21 | # 1) Push 256 random numbers and pop them off, verifying all's OK. |
| 22 | heap = [] |
| 23 | data = [] |
| 24 | self.check_invariant(heap) |
| 25 | for i in range(256): |
| 26 | item = random.random() |
| 27 | data.append(item) |
| 28 | heappush(heap, item) |
| 29 | self.check_invariant(heap) |
| 30 | results = [] |
| 31 | while heap: |
| 32 | item = heappop(heap) |
| 33 | self.check_invariant(heap) |
| 34 | results.append(item) |
| 35 | data_sorted = data[:] |
| 36 | data_sorted.sort() |
| 37 | self.assertEqual(data_sorted, results) |
| 38 | # 2) Check that the invariant holds for a sorted array |
| 39 | self.check_invariant(results) |
| 40 | |
Neal Norwitz | d7be118 | 2004-07-08 01:56:46 +0000 | [diff] [blame] | 41 | self.assertRaises(TypeError, heappush, []) |
Raymond Hettinger | e1defa4 | 2004-11-29 05:54:48 +0000 | [diff] [blame] | 42 | try: |
| 43 | self.assertRaises(TypeError, heappush, None, None) |
| 44 | self.assertRaises(TypeError, heappop, None) |
| 45 | except AttributeError: |
| 46 | pass |
Neal Norwitz | d7be118 | 2004-07-08 01:56:46 +0000 | [diff] [blame] | 47 | |
Raymond Hettinger | bce036b | 2004-06-10 05:07:18 +0000 | [diff] [blame] | 48 | def check_invariant(self, heap): |
| 49 | # Check the heap invariant. |
| 50 | for pos, item in enumerate(heap): |
| 51 | if pos: # pos 0 has no parent |
| 52 | parentpos = (pos-1) >> 1 |
| 53 | self.assert_(heap[parentpos] <= item) |
| 54 | |
| 55 | def test_heapify(self): |
| 56 | for size in range(30): |
| 57 | heap = [random.random() for dummy in range(size)] |
| 58 | heapify(heap) |
| 59 | self.check_invariant(heap) |
| 60 | |
Neal Norwitz | d7be118 | 2004-07-08 01:56:46 +0000 | [diff] [blame] | 61 | self.assertRaises(TypeError, heapify, None) |
| 62 | |
Raymond Hettinger | bce036b | 2004-06-10 05:07:18 +0000 | [diff] [blame] | 63 | def test_naive_nbest(self): |
| 64 | data = [random.randrange(2000) for i in range(1000)] |
| 65 | heap = [] |
| 66 | for item in data: |
| 67 | heappush(heap, item) |
| 68 | if len(heap) > 10: |
| 69 | heappop(heap) |
| 70 | heap.sort() |
| 71 | self.assertEqual(heap, sorted(data)[-10:]) |
| 72 | |
| 73 | def test_nbest(self): |
| 74 | # Less-naive "N-best" algorithm, much faster (if len(data) is big |
| 75 | # enough <wink>) than sorting all of data. However, if we had a max |
| 76 | # heap instead of a min heap, it could go faster still via |
| 77 | # heapify'ing all of data (linear time), then doing 10 heappops |
| 78 | # (10 log-time steps). |
| 79 | data = [random.randrange(2000) for i in range(1000)] |
| 80 | heap = data[:10] |
| 81 | heapify(heap) |
| 82 | for item in data[10:]: |
| 83 | if item > heap[0]: # this gets rarer the longer we run |
| 84 | heapreplace(heap, item) |
| 85 | self.assertEqual(list(heapiter(heap)), sorted(data)[-10:]) |
| 86 | |
Neal Norwitz | d7be118 | 2004-07-08 01:56:46 +0000 | [diff] [blame] | 87 | self.assertRaises(TypeError, heapreplace, None) |
| 88 | self.assertRaises(TypeError, heapreplace, None, None) |
| 89 | self.assertRaises(IndexError, heapreplace, [], None) |
| 90 | |
Raymond Hettinger | bce036b | 2004-06-10 05:07:18 +0000 | [diff] [blame] | 91 | def test_heapsort(self): |
| 92 | # Exercise everything with repeated heapsort checks |
| 93 | for trial in xrange(100): |
| 94 | size = random.randrange(50) |
| 95 | data = [random.randrange(25) for i in range(size)] |
| 96 | if trial & 1: # Half of the time, use heapify |
| 97 | heap = data[:] |
| 98 | heapify(heap) |
| 99 | else: # The rest of the time, use heappush |
| 100 | heap = [] |
| 101 | for item in data: |
| 102 | heappush(heap, item) |
| 103 | heap_sorted = [heappop(heap) for i in range(size)] |
| 104 | self.assertEqual(heap_sorted, sorted(data)) |
| 105 | |
Thomas Wouters | cf297e4 | 2007-02-23 15:07:44 +0000 | [diff] [blame] | 106 | def test_merge(self): |
| 107 | inputs = [] |
| 108 | for i in xrange(random.randrange(5)): |
| 109 | row = sorted(random.randrange(1000) for j in range(random.randrange(10))) |
| 110 | inputs.append(row) |
| 111 | self.assertEqual(sorted(chain(*inputs)), list(merge(*inputs))) |
| 112 | self.assertEqual(list(merge()), []) |
| 113 | |
| 114 | def test_merge_stability(self): |
| 115 | class Int(int): |
| 116 | pass |
| 117 | inputs = [[], [], [], []] |
| 118 | for i in range(20000): |
| 119 | stream = random.randrange(4) |
| 120 | x = random.randrange(500) |
| 121 | obj = Int(x) |
| 122 | obj.pair = (x, stream) |
| 123 | inputs[stream].append(obj) |
| 124 | for stream in inputs: |
| 125 | stream.sort() |
| 126 | result = [i.pair for i in merge(*inputs)] |
| 127 | self.assertEqual(result, sorted(result)) |
| 128 | |
Raymond Hettinger | bce036b | 2004-06-10 05:07:18 +0000 | [diff] [blame] | 129 | def test_nsmallest(self): |
Thomas Wouters | 902d6eb | 2007-01-09 23:18:33 +0000 | [diff] [blame] | 130 | data = [(random.randrange(2000), i) for i in range(1000)] |
| 131 | for f in (None, lambda x: x[0] * 547 % 2000): |
| 132 | for n in (0, 1, 2, 10, 100, 400, 999, 1000, 1100): |
| 133 | self.assertEqual(nsmallest(n, data), sorted(data)[:n]) |
| 134 | self.assertEqual(nsmallest(n, data, key=f), |
| 135 | sorted(data, key=f)[:n]) |
Raymond Hettinger | bce036b | 2004-06-10 05:07:18 +0000 | [diff] [blame] | 136 | |
Raymond Hettinger | 4901a1f | 2004-12-02 08:59:14 +0000 | [diff] [blame] | 137 | def test_nlargest(self): |
Thomas Wouters | 902d6eb | 2007-01-09 23:18:33 +0000 | [diff] [blame] | 138 | data = [(random.randrange(2000), i) for i in range(1000)] |
| 139 | for f in (None, lambda x: x[0] * 547 % 2000): |
| 140 | for n in (0, 1, 2, 10, 100, 400, 999, 1000, 1100): |
| 141 | self.assertEqual(nlargest(n, data), sorted(data, reverse=True)[:n]) |
| 142 | self.assertEqual(nlargest(n, data, key=f), |
| 143 | sorted(data, key=f, reverse=True)[:n]) |
Tim Peters | aa7d243 | 2002-08-03 02:11:26 +0000 | [diff] [blame] | 144 | |
Raymond Hettinger | 855d9a9 | 2004-09-28 00:03:54 +0000 | [diff] [blame] | 145 | |
| 146 | #============================================================================== |
| 147 | |
class LenOnly:
    "Stand-in sequence that reports a length but cannot be indexed."
    def __len__(self):
        # Fixed, arbitrary size; there is no __getitem__ to back it up.
        return 10
| 152 | |
class GetOnly:
    "Stand-in sequence that can be indexed but has no __len__."
    def __getitem__(self, ndx):
        # Every index yields the same value; IndexError is never raised.
        return 10
| 157 | |
class CmpErr:
    "Element whose every comparison fails with ZeroDivisionError."
    def __cmp__(self, other):
        raise ZeroDivisionError
    # Route all six rich comparisons through the same failing method.
    __lt__ = __le__ = __gt__ = __ge__ = __eq__ = __ne__ = __cmp__
Raymond Hettinger | 855d9a9 | 2004-09-28 00:03:54 +0000 | [diff] [blame] | 163 | |
def R(seqn):
    'Plain generator that yields each element of seqn in order'
    for element in seqn:
        yield element
| 168 | |
class G:
    'Wrapper exposing seqn only through __getitem__'
    def __init__(self, seqn):
        self.seqn = seqn
    def __getitem__(self, index):
        # Delegate indexing (and its IndexError) to the wrapped sequence.
        return self.seqn[index]
| 175 | |
class I:
    'Sequence using iterator protocol'
    def __init__(self, seqn):
        self.seqn = seqn
        self.i = 0  # index of the next element to hand out
    def __iter__(self):
        return self
    def next(self):
        if self.i >= len(self.seqn):
            raise StopIteration
        v = self.seqn[self.i]
        self.i += 1
        return v
    # Python 3 names the iterator step method __next__; provide both
    # spellings so the class is an iterator under either protocol.
    __next__ = next
| 188 | |
class Ig:
    'Iterable whose __iter__ is written as a generator'
    def __init__(self, seqn):
        self.seqn = seqn
        self.i = 0
    def __iter__(self):
        # Each call starts a new generator over the wrapped sequence.
        for element in self.seqn:
            yield element
| 197 | |
class X:
    'Missing __getitem__ and __iter__'
    def __init__(self, seqn):
        self.seqn = seqn
        self.i = 0  # index of the next element to hand out
    def next(self):
        if self.i >= len(self.seqn):
            raise StopIteration
        v = self.seqn[self.i]
        self.i += 1
        return v
    # Expose the step method under the Python 3 name as well.  Without
    # __iter__ or __getitem__ the object still cannot be iterated.
    __next__ = next
| 208 | |
class N:
    'Claims to be its own iterator but has no next()'
    def __init__(self, seqn):
        self.seqn = seqn
        self.i = 0
    def __iter__(self):
        # Returns an object that lacks the iterator step method.
        return self
| 216 | |
class E:
    'Test propagation of exceptions'
    def __init__(self, seqn):
        self.seqn = seqn
        self.i = 0
    def __iter__(self):
        return self
    def next(self):
        # Deliberately raises ZeroDivisionError on the first step.
        3 // 0
    # Python 3 names the iterator step method __next__; provide both
    # spellings so the error is raised under either protocol.
    __next__ = next
| 226 | |
class S:
    'Test immediate stop'
    def __init__(self, seqn):
        # The argument is accepted only for signature parity with the
        # other helper classes; it is never used.
        pass
    def __iter__(self):
        return self
    def next(self):
        raise StopIteration
    # Python 3 names the iterator step method __next__; provide both
    # spellings so the class is an (empty) iterator under either protocol.
    __next__ = next
| 235 | |
from itertools import chain
try:
    from itertools import imap
except ImportError:
    # itertools.imap does not exist on Python 3, where the builtin map is
    # already lazy.
    imap = map

def L(seqn):
    'Test multiple tiers of iterators'
    # seqn is wrapped, innermost first, by G, Ig, R, imap and chain.
    return chain(imap(lambda x: x, R(Ig(G(seqn)))))
| 240 | |
| 241 | class TestErrorHandling(unittest.TestCase): |
| 242 | |
| 243 | def test_non_sequence(self): |
| 244 | for f in (heapify, heappop): |
| 245 | self.assertRaises(TypeError, f, 10) |
| 246 | for f in (heappush, heapreplace, nlargest, nsmallest): |
| 247 | self.assertRaises(TypeError, f, 10, 10) |
| 248 | |
| 249 | def test_len_only(self): |
| 250 | for f in (heapify, heappop): |
| 251 | self.assertRaises(TypeError, f, LenOnly()) |
| 252 | for f in (heappush, heapreplace): |
| 253 | self.assertRaises(TypeError, f, LenOnly(), 10) |
| 254 | for f in (nlargest, nsmallest): |
| 255 | self.assertRaises(TypeError, f, 2, LenOnly()) |
| 256 | |
| 257 | def test_get_only(self): |
| 258 | for f in (heapify, heappop): |
| 259 | self.assertRaises(TypeError, f, GetOnly()) |
| 260 | for f in (heappush, heapreplace): |
| 261 | self.assertRaises(TypeError, f, GetOnly(), 10) |
| 262 | for f in (nlargest, nsmallest): |
| 263 | self.assertRaises(TypeError, f, 2, GetOnly()) |
| 264 | |
| 265 | def test_get_only(self): |
| 266 | seq = [CmpErr(), CmpErr(), CmpErr()] |
| 267 | for f in (heapify, heappop): |
| 268 | self.assertRaises(ZeroDivisionError, f, seq) |
| 269 | for f in (heappush, heapreplace): |
| 270 | self.assertRaises(ZeroDivisionError, f, seq, 10) |
| 271 | for f in (nlargest, nsmallest): |
| 272 | self.assertRaises(ZeroDivisionError, f, 2, seq) |
| 273 | |
| 274 | def test_arg_parsing(self): |
| 275 | for f in (heapify, heappop, heappush, heapreplace, nlargest, nsmallest): |
| 276 | self.assertRaises(TypeError, f, 10) |
| 277 | |
| 278 | def test_iterable_args(self): |
| 279 | for f in (nlargest, nsmallest): |
Guido van Rossum | 47b9ff6 | 2006-08-24 00:41:19 +0000 | [diff] [blame] | 280 | for s in ("123", "", range(1000), (1, 1.2), xrange(2000,2200,5)): |
Raymond Hettinger | 855d9a9 | 2004-09-28 00:03:54 +0000 | [diff] [blame] | 281 | for g in (G, I, Ig, L, R): |
| 282 | self.assertEqual(f(2, g(s)), f(2,s)) |
| 283 | self.assertEqual(f(2, S(s)), []) |
| 284 | self.assertRaises(TypeError, f, 2, X(s)) |
| 285 | self.assertRaises(TypeError, f, 2, N(s)) |
| 286 | self.assertRaises(ZeroDivisionError, f, 2, E(s)) |
| 287 | |
| 288 | #============================================================================== |
| 289 | |
| 290 | |
def test_main(verbose=None):
    """Run the heapq test classes.

    TestErrorHandling is included only when heapify is a builtin function.
    If *verbose* is true and the interpreter provides sys.gettotalrefcount,
    the tests are run five more times and the total reference count after
    each run is printed.
    """
    from types import BuiltinFunctionType

    test_classes = [TestHeap]
    if isinstance(heapify, BuiltinFunctionType):
        test_classes.append(TestErrorHandling)
    test_support.run_unittest(*test_classes)

    # verify reference counting
    if verbose and hasattr(sys, "gettotalrefcount"):
        import gc
        # NOTE(review): the result list is preallocated and filled by index,
        # presumably so that recording a sample does not itself change the
        # total being measured -- keep this shape unless confirmed otherwise.
        counts = [None] * 5
        for i in range(len(counts)):
            test_support.run_unittest(*test_classes)
            gc.collect()
            counts[i] = sys.gettotalrefcount()
        print(counts)
Guido van Rossum | 0b19178 | 2002-08-02 18:29:53 +0000 | [diff] [blame] | 308 | |
if __name__ == "__main__":
    # Run as a script: ask for the verbose pass as well.
    test_main(verbose=True)