Guido van Rossum | 0b19178 | 2002-08-02 18:29:53 +0000 | [diff] [blame] | 1 | """Unittests for heapq.""" |
| 2 | |
Raymond Hettinger | 33ecffb | 2004-06-10 05:03:17 +0000 | [diff] [blame] | 3 | from heapq import heappush, heappop, heapify, heapreplace, nlargest, nsmallest |
Guido van Rossum | 0b19178 | 2002-08-02 18:29:53 +0000 | [diff] [blame] | 4 | import random |
Raymond Hettinger | bce036b | 2004-06-10 05:07:18 +0000 | [diff] [blame] | 5 | import unittest |
| 6 | from test import test_support |
Raymond Hettinger | 2e3dfaf | 2004-06-13 05:26:33 +0000 | [diff] [blame] | 7 | import sys |
Guido van Rossum | 0b19178 | 2002-08-02 18:29:53 +0000 | [diff] [blame] | 8 | |
Guido van Rossum | 0b19178 | 2002-08-02 18:29:53 +0000 | [diff] [blame] | 9 | |
def heapiter(heap):
    """Yield the items of *heap* smallest-first, emptying it along the way.

    Items are removed one at a time with ``heappop``; the generator finishes
    when an ``IndexError`` (raised by popping from the exhausted heap)
    reaches the surrounding ``try``.
    """
    try:
        while True:
            smallest = heappop(heap)
            yield smallest
    except IndexError:
        return
Tim Peters | aa7d243 | 2002-08-03 02:11:26 +0000 | [diff] [blame] | 17 | |
class TestHeap(unittest.TestCase):
    """Behavioural tests for the heapq primitives operating on plain lists."""

    def test_push_pop(self):
        # 1) Push 256 random numbers and pop them off, verifying all's OK.
        heap = []
        data = []
        self.check_invariant(heap)
        for i in range(256):
            item = random.random()
            data.append(item)
            heappush(heap, item)
            self.check_invariant(heap)
        results = []
        while heap:
            item = heappop(heap)
            self.check_invariant(heap)
            results.append(item)
        self.assertEqual(sorted(data), results)
        # 2) Check that the invariant holds for a sorted array
        self.check_invariant(results)

        self.assertRaises(TypeError, heappush, [])
        # Either exception is accepted for a non-list heap, exactly as the
        # former "try: ... except AttributeError: pass" wrapper allowed.
        # Checking each call on its own means an AttributeError from
        # heappush can no longer cause the heappop check to be skipped.
        self.assertRaises((TypeError, AttributeError), heappush, None, None)
        self.assertRaises((TypeError, AttributeError), heappop, None)

    def check_invariant(self, heap):
        """Assert that no element of *heap* is smaller than its parent.

        The parent of the element at index ``pos`` is at ``(pos-1) >> 1``.
        """
        for pos, item in enumerate(heap):
            if pos: # pos 0 has no parent
                parentpos = (pos-1) >> 1
                self.assertTrue(heap[parentpos] <= item,
                                "heap invariant violated at index %d" % pos)

    def test_heapify(self):
        # heapify() must establish the invariant for every size from 0 to 29.
        for size in range(30):
            heap = [random.random() for dummy in range(size)]
            heapify(heap)
            self.check_invariant(heap)

        self.assertRaises(TypeError, heapify, None)

    def test_naive_nbest(self):
        # Keep a heap of at most 10 items while pushing everything; what is
        # left must be the 10 largest values.
        data = [random.randrange(2000) for i in range(1000)]
        heap = []
        for item in data:
            heappush(heap, item)
            if len(heap) > 10:
                heappop(heap)
        heap.sort()
        self.assertEqual(heap, sorted(data)[-10:])

    def test_nbest(self):
        # Less-naive "N-best" algorithm, much faster (if len(data) is big
        # enough <wink>) than sorting all of data.  However, if we had a max
        # heap instead of a min heap, it could go faster still via
        # heapify'ing all of data (linear time), then doing 10 heappops
        # (10 log-time steps).
        data = [random.randrange(2000) for i in range(1000)]
        heap = data[:10]
        heapify(heap)
        for item in data[10:]:
            if item > heap[0]:  # this gets rarer the longer we run
                heapreplace(heap, item)
        self.assertEqual(list(heapiter(heap)), sorted(data)[-10:])

        self.assertRaises(TypeError, heapreplace, None)
        self.assertRaises(TypeError, heapreplace, None, None)
        self.assertRaises(IndexError, heapreplace, [], None)

    def test_heapsort(self):
        # Exercise everything with repeated heapsort checks
        for trial in range(100):
            size = random.randrange(50)
            data = [random.randrange(25) for i in range(size)]
            if trial & 1:     # Half of the time, use heapify
                heap = data[:]
                heapify(heap)
            else:             # The rest of the time, use heappush
                heap = []
                for item in data:
                    heappush(heap, item)
            heap_sorted = [heappop(heap) for i in range(size)]
            self.assertEqual(heap_sorted, sorted(data))

    def test_nsmallest(self):
        # Pairing each value with its index makes every element distinct.
        data = [(random.randrange(2000), i) for i in range(1000)]
        for n in (0, 1, 2, 10, 100, 400, 999, 1000, 1100):
            # The key-less call does not depend on f, so check it once per n.
            self.assertEqual(nsmallest(n, data), sorted(data)[:n])
            for f in (None, lambda x:  x[0] * 547 % 2000):
                self.assertEqual(nsmallest(n, data, key=f),
                                 sorted(data, key=f)[:n])

    def test_nlargest(self):
        # Pairing each value with its index makes every element distinct.
        data = [(random.randrange(2000), i) for i in range(1000)]
        for n in (0, 1, 2, 10, 100, 400, 999, 1000, 1100):
            # The key-less call does not depend on f, so check it once per n.
            self.assertEqual(nlargest(n, data),
                             sorted(data, reverse=True)[:n])
            for f in (None, lambda x:  x[0] * 547 % 2000):
                self.assertEqual(nlargest(n, data, key=f),
                                 sorted(data, key=f, reverse=True)[:n])
Tim Peters | aa7d243 | 2002-08-03 02:11:26 +0000 | [diff] [blame] | 121 | |
Raymond Hettinger | 855d9a9 | 2004-09-28 00:03:54 +0000 | [diff] [blame] | 122 | |
| 123 | #============================================================================== |
| 124 | |
class LenOnly:
    """Dummy container: reports a length (always 10) but cannot be indexed."""

    def __len__(self):
        return 10
| 129 | |
class GetOnly:
    """Dummy container: indexable (every index yields 10) but has no length."""

    def __getitem__(self, ndx):
        # The index is ignored; no IndexError is ever raised.
        return 10
| 134 | |
class CmpErr:
    """Dummy element whose every comparison raises ZeroDivisionError."""

    def __cmp__(self, other):
        raise ZeroDivisionError

    # Route all six rich comparisons through the same failing method.
    __lt__ = __le__ = __gt__ = __ge__ = __eq__ = __ne__ = __cmp__
Raymond Hettinger | 855d9a9 | 2004-09-28 00:03:54 +0000 | [diff] [blame] | 140 | |
def R(seqn):
    """Regular generator: re-yield every element of *seqn* in order."""
    for element in seqn:
        yield element
| 145 | |
class G:
    """Sequence wrapper that exposes *seqn* through __getitem__ only."""

    def __init__(self, seqn):
        self.seqn = seqn

    def __getitem__(self, i):
        wrapped = self.seqn
        return wrapped[i]
| 152 | |
class I:
    """Sequence wrapper implementing the iterator protocol by hand.

    Walks ``seqn`` by index and raises StopIteration once the index reaches
    ``len(seqn)``.
    """

    def __init__(self, seqn):
        self.seqn = seqn
        self.i = 0

    def __iter__(self):
        return self

    def __next__(self):
        if self.i >= len(self.seqn):
            raise StopIteration
        v = self.seqn[self.i]
        self.i += 1
        return v

    # Python 2 looks the method up as next(); keep both spellings so the
    # class is an iterator under either protocol.
    next = __next__
| 165 | |
class Ig:
    """Sequence wrapper whose __iter__ is written as a generator."""

    def __init__(self, seqn):
        self.i = 0
        self.seqn = seqn

    def __iter__(self):
        for element in self.seqn:
            yield element
| 174 | |
class X:
    """Not iterable: has a next method but neither __getitem__ nor __iter__."""

    def __init__(self, seqn):
        self.seqn = seqn
        self.i = 0

    def __next__(self):
        if self.i >= len(self.seqn):
            raise StopIteration
        v = self.seqn[self.i]
        self.i += 1
        return v

    # Provide the Python 2 spelling as well, so that under either iterator
    # protocol the only thing missing is __iter__/__getitem__.
    next = __next__
| 185 | |
class N:
    """Broken iterator: __iter__ returns self but there is no next method."""

    def __init__(self, seqn):
        self.i = 0
        self.seqn = seqn

    def __iter__(self):
        return self
| 193 | |
class E:
    """Iterator whose first step raises ZeroDivisionError.

    Used to check that an exception raised while fetching an item is
    propagated to the caller.
    """

    def __init__(self, seqn):
        self.seqn = seqn
        self.i = 0

    def __iter__(self):
        return self

    def __next__(self):
        3 // 0  # deliberately raises ZeroDivisionError

    # Python 2 spelling of the same method.
    next = __next__
| 203 | |
class S:
    """Iterator that is exhausted immediately; *seqn* is ignored."""

    def __init__(self, seqn):
        pass

    def __iter__(self):
        return self

    def __next__(self):
        raise StopIteration

    # Python 2 spelling of the same method.
    next = __next__
| 212 | |
from itertools import chain
try:
    from itertools import imap
except ImportError:
    # Python 3 has no itertools.imap; its builtin map is already lazy.
    imap = map

def L(seqn):
    """Wrap *seqn* in several stacked iterator layers.

    The elements pass, unchanged, through G (__getitem__ access), Ig
    (generator-based __iter__), R (plain generator), an identity map and
    finally chain().
    """
    return chain(imap(lambda x:x, R(Ig(G(seqn)))))
| 217 | |
class TestErrorHandling(unittest.TestCase):
    """Checks on how the heapq functions react to unsuitable arguments."""

    def test_non_sequence(self):
        # A plain int is neither a heap nor an iterable.
        for f in (heapify, heappop):
            self.assertRaises(TypeError, f, 10)
        for f in (heappush, heapreplace, nlargest, nsmallest):
            self.assertRaises(TypeError, f, 10, 10)

    def test_len_only(self):
        for f in (heapify, heappop):
            self.assertRaises(TypeError, f, LenOnly())
        for f in (heappush, heapreplace):
            self.assertRaises(TypeError, f, LenOnly(), 10)
        for f in (nlargest, nsmallest):
            self.assertRaises(TypeError, f, 2, LenOnly())

    def test_get_only(self):
        # This test used to be shadowed by a second method of the same name
        # and therefore never ran.
        for f in (heapify, heappop):
            self.assertRaises(TypeError, f, GetOnly())
        for f in (heappush, heapreplace):
            self.assertRaises(TypeError, f, GetOnly(), 10)
        # nlargest/nsmallest are deliberately not exercised with GetOnly:
        # its __getitem__ returns 10 for every index and never raises
        # IndexError, so iterating over an instance would never terminate.

    def test_cmp_err(self):
        # Formerly a second "test_get_only", which hid the real one above.
        # seq is shared and mutated by the calls; each one must still hit a
        # comparison and let its ZeroDivisionError propagate.
        seq = [CmpErr(), CmpErr(), CmpErr()]
        for f in (heapify, heappop):
            self.assertRaises(ZeroDivisionError, f, seq)
        for f in (heappush, heapreplace):
            self.assertRaises(ZeroDivisionError, f, seq, 10)
        for f in (nlargest, nsmallest):
            self.assertRaises(ZeroDivisionError, f, 2, seq)

    def test_arg_parsing(self):
        for f in (heapify, heappop, heappush, heapreplace, nlargest, nsmallest):
            self.assertRaises(TypeError, f, 10)

    def test_iterable_args(self):
        for f in (nlargest, nsmallest):
            for s in ("123", "", range(1000), (1, 1.2), range(2000, 2200, 5)):
                # Every well-behaved wrapper must give the same answer as
                # the bare sequence.
                for g in (G, I, Ig, L, R):
                    self.assertEqual(f(2, g(s)), f(2, s))
                self.assertEqual(f(2, S(s)), [])
                self.assertRaises(TypeError, f, 2, X(s))
                self.assertRaises(TypeError, f, 2, N(s))
                self.assertRaises(ZeroDivisionError, f, 2, E(s))
| 264 | |
| 265 | #============================================================================== |
| 266 | |
| 267 | |
def test_main(verbose=None):
    """Run the heapq test classes.

    TestHeap always runs; TestErrorHandling is added only when ``heapify``
    is a builtin function.  When *verbose* is true and the interpreter
    provides ``sys.gettotalrefcount``, the suite is run five more times and
    the total reference count after each run is printed.
    """
    from types import BuiltinFunctionType

    test_classes = [TestHeap]
    if isinstance(heapify, BuiltinFunctionType):
        test_classes.append(TestErrorHandling)
    test_support.run_unittest(*test_classes)

    # verify reference counting
    if verbose and hasattr(sys, "gettotalrefcount"):
        import gc
        # NOTE(review): the list is presumably preallocated so that storing
        # a result does not itself add a reference between measurements;
        # keep the slot assignment rather than switching to append().
        counts = [None] * 5
        for i in range(len(counts)):
            test_support.run_unittest(*test_classes)
            gc.collect()
            counts[i] = sys.gettotalrefcount()
        print(counts)
Guido van Rossum | 0b19178 | 2002-08-02 18:29:53 +0000 | [diff] [blame] | 285 | |
if __name__ == "__main__":
    # Run verbosely so that test_main also performs its reference-count
    # check when sys.gettotalrefcount is available.
    test_main(verbose=True)