blob: eb2024352de18a7d1f483c91007d3d2e9e6301e0 [file] [log] [blame]
Brett Cannon23a4a7b2008-05-12 00:56:28 +00001__all__ = ['deque', 'defaultdict', 'namedtuple', 'UserDict', 'UserList',
Raymond Hettinger2d32f632009-03-02 21:24:57 +00002 'UserString', 'Counter', 'OrderedDict']
Guido van Rossumcd16bf62007-06-13 18:07:49 +00003# For bootstrapping reasons, the collection ABCs are defined in _abcoll.py.
4# They should however be considered an integral part of collections.py.
5from _abcoll import *
6import _abcoll
7__all__ += _abcoll.__all__
8
Christian Heimes99170a52007-12-19 02:07:34 +00009from _collections import deque, defaultdict
10from operator import itemgetter as _itemgetter
11from keyword import iskeyword as _iskeyword
12import sys as _sys
Raymond Hettingerb8baf632009-01-14 02:20:07 +000013import heapq as _heapq
Raymond Hettingerfa11db02010-09-12 04:12:42 +000014from weakref import proxy as _proxy
Raymond Hettingerea9f8db2009-03-02 21:28:41 +000015from itertools import repeat as _repeat, chain as _chain, starmap as _starmap
Raymond Hettinger98a5f3f2010-09-13 21:36:00 +000016from reprlib import recursive_repr as _recursive_repr
Raymond Hettinger2d32f632009-03-02 21:24:57 +000017
18################################################################################
19### OrderedDict
20################################################################################
21
class _Link(object):
    # Node of the circular doubly linked list used by OrderedDict.
    # '__weakref__' is required so that weakref proxies to a link can be made.
    __slots__ = 'prev', 'next', 'key', '__weakref__'


class OrderedDict(dict):
    'Dictionary that remembers insertion order'
    # An inherited dict maps keys to values.
    # The inherited dict provides __getitem__, __len__, __contains__, and get.
    # The remaining methods are order-aware.
    # Big-O running times for all methods are the same as regular dictionaries.

    # The internal self.__map dict maps keys to links in a doubly linked list.
    # The circular doubly linked list starts and ends with a sentinel element.
    # The sentinel element never gets deleted (this simplifies the algorithm).
    # The sentinel is in self.__hardroot with a weakref proxy in self.__root.
    # The prev links are weakref proxies (to prevent circular references).
    # Individual links are kept alive by the hard reference in self.__map.
    # Those hard references disappear when a key is deleted from an OrderedDict.

    def __init__(self, *args, **kwds):
        '''Initialize an ordered dictionary.  The signature is the same as
        regular dictionaries, but keyword arguments are not recommended because
        their insertion order is arbitrary.

        Raises TypeError if more than one positional argument is given.

        '''
        if len(args) > 1:
            raise TypeError('expected at most 1 arguments, got %d' % len(args))
        try:
            # If the sentinel already exists (__init__ called again on the
            # same instance), keep the existing list and just update it.
            self.__root
        except AttributeError:
            self.__hardroot = _Link()
            self.__root = root = _proxy(self.__hardroot)
            root.prev = root.next = root
            self.__map = {}
        self.__update(*args, **kwds)

    def __setitem__(self, key, value,
                    dict_setitem=dict.__setitem__, proxy=_proxy, Link=_Link):
        'od.__setitem__(i, y) <==> od[i]=y'
        # Setting a new item creates a new link at the end of the linked list,
        # and the inherited dictionary is updated with the new key/value pair.
        if key not in self:
            self.__map[key] = link = Link()
            root = self.__root
            last = root.prev
            link.prev, link.next, link.key = last, root, key
            last.next = link
            # Only a weak proxy is stored in the prev direction.
            root.prev = proxy(link)
        dict_setitem(self, key, value)

    def __delitem__(self, key, dict_delitem=dict.__delitem__):
        'od.__delitem__(y) <==> del od[y]'
        # Deleting an existing item uses self.__map to find the link which gets
        # removed by updating the links in the predecessor and successor nodes.
        # dict_delitem runs first so a missing key raises KeyError before the
        # linked list is touched.
        dict_delitem(self, key)
        link = self.__map.pop(key)
        link_prev = link.prev
        link_next = link.next
        link_prev.next = link_next
        link_next.prev = link_prev

    def __iter__(self):
        'od.__iter__() <==> iter(od)'
        # Traverse the linked list in order.
        root = self.__root
        curr = root.next
        while curr is not root:
            yield curr.key
            curr = curr.next

    def __reversed__(self):
        'od.__reversed__() <==> reversed(od)'
        # Traverse the linked list in reverse order.
        root = self.__root
        curr = root.prev
        while curr is not root:
            yield curr.key
            curr = curr.prev

    def clear(self):
        'od.clear() -> None.  Remove all items from od.'
        root = self.__root
        root.prev = root.next = root
        self.__map.clear()
        dict.clear(self)

    def popitem(self, last=True):
        '''od.popitem() -> (k, v), return and remove a (key, value) pair.
        Pairs are returned in LIFO order if last is true or FIFO order if false.

        Raises KeyError if the dictionary is empty.

        '''
        if not self:
            raise KeyError('dictionary is empty')
        root = self.__root
        if last:
            link = root.prev
            link_prev = link.prev
            link_prev.next = root
            root.prev = link_prev
        else:
            link = root.next
            link_next = link.next
            root.next = link_next
            link_next.prev = root
        key = link.key
        del self.__map[key]
        value = dict.pop(self, key)
        return key, value

    def move_to_end(self, key, last=True):
        '''Move an existing element to the end (or beginning if last==False).

        Raises KeyError if the element does not exist.
        When last=True, acts like a fast version of self[key]=self.pop(key).

        '''
        link = self.__map[key]
        # Unlink the node from its current position.
        link_prev = link.prev
        link_next = link.next
        link_prev.next = link_next
        link_next.prev = link_prev
        root = self.__root
        # prev links must only ever hold weak proxies; storing the link itself
        # there would create a hard reference cycle between neighbours.
        soft_link = _proxy(link)
        if last:
            tail = root.prev
            link.prev = tail
            link.next = root
            tail.next = link
            root.prev = soft_link
        else:
            first = root.next
            link.prev = root
            link.next = first
            root.next = link
            first.prev = soft_link

    def __sizeof__(self):
        'Return an estimate of the memory used, including the linked list.'
        sizeof = _sys.getsizeof
        n = len(self) + 1                       # number of links including root
        size = sizeof(self.__dict__)            # instance dictionary
        size += sizeof(self.__map) * 2          # internal dict and inherited dict
        size += sizeof(self.__hardroot) * n     # link objects
        size += sizeof(self.__root) * n         # proxy objects
        return size

    # Reuse the generic mapping implementations, which go through the
    # order-aware __iter__/__setitem__ defined above.  __update is a private
    # alias so that __init__ keeps working if a subclass overrides update().
    update = __update = MutableMapping.update
    keys = MutableMapping.keys
    values = MutableMapping.values
    items = MutableMapping.items
    __ne__ = MutableMapping.__ne__

    # Unique sentinel so that None can be passed as a real default to pop().
    __marker = object()

    def pop(self, key, default=__marker):
        '''od.pop(k[,d]) -> v, remove specified key and return the corresponding
        value.  If key is not found, d is returned if given, otherwise KeyError
        is raised.

        '''
        if key in self:
            result = self[key]
            del self[key]
            return result
        if default is self.__marker:
            raise KeyError(key)
        return default

    def setdefault(self, key, default=None):
        'od.setdefault(k[,d]) -> od.get(k,d), also set od[k]=d if k not in od'
        if key in self:
            return self[key]
        self[key] = default
        return default

    @_recursive_repr()
    def __repr__(self):
        'od.__repr__() <==> repr(od)'
        if not self:
            return '%s()' % (self.__class__.__name__,)
        return '%s(%r)' % (self.__class__.__name__, list(self.items()))

    def __reduce__(self):
        'Return state information for pickling'
        items = [[k, self[k]] for k in self]
        inst_dict = vars(self).copy()
        # Drop the bookkeeping attributes every OrderedDict has; only
        # attributes added by the user or a subclass are pickled as state.
        for k in vars(OrderedDict()):
            inst_dict.pop(k, None)
        if inst_dict:
            return (self.__class__, (items,), inst_dict)
        return self.__class__, (items,)

    def copy(self):
        'od.copy() -> a shallow copy of od'
        return self.__class__(self)

    @classmethod
    def fromkeys(cls, iterable, value=None):
        '''OD.fromkeys(S[, v]) -> New ordered dictionary with keys from S.
        If not specified, the value defaults to None.

        '''
        self = cls()
        for key in iterable:
            self[key] = value
        return self

    def __eq__(self, other):
        '''od.__eq__(y) <==> od==y.  Comparison to another OD is order-sensitive
        while comparison to a regular mapping is order-insensitive.

        '''
        if isinstance(other, OrderedDict):
            return len(self)==len(other) and \
                   all(p==q for p, q in zip(self.items(), other.items()))
        return dict.__eq__(self, other)
233
Christian Heimes99170a52007-12-19 02:07:34 +0000234
Raymond Hettinger48b8b662008-02-05 01:53:00 +0000235################################################################################
236### namedtuple
237################################################################################
238
# Source template for the generated class.  It is filled in with str.format()
# and executed by namedtuple(); the field names are validated before they are
# substituted in.
_class_template = '''\
from builtins import property as _property, tuple as _tuple
from operator import itemgetter as _itemgetter
from collections import OrderedDict

class {typename}(tuple):
    '{typename}({arg_list})'

    __slots__ = ()

    _fields = {field_names!r}

    def __new__(_cls, {arg_list}):
        'Create new instance of {typename}({arg_list})'
        return _tuple.__new__(_cls, ({arg_list}))

    @classmethod
    def _make(cls, iterable, new=tuple.__new__, len=len):
        'Make a new {typename} object from a sequence or iterable'
        result = new(cls, iterable)
        if len(result) != {num_fields:d}:
            raise TypeError('Expected {num_fields:d} arguments, got %d' % len(result))
        return result

    def __repr__(self):
        'Return a nicely formatted representation string'
        return self.__class__.__name__ + '({repr_fmt})' % self

    def _asdict(self):
        'Return a new OrderedDict which maps field names to their values'
        return OrderedDict(zip(self._fields, self))

    __dict__ = property(_asdict)

    def _replace(_self, **kwds):
        'Return a new {typename} object replacing specified fields with new values'
        result = _self._make(map(kwds.pop, {field_names!r}, _self))
        if kwds:
            raise ValueError('Got unexpected field names: %r' % list(kwds))
        return result

    def __getnewargs__(self):
        'Return self as a plain tuple. Used by copy and pickle.'
        return tuple(self)

{field_defs}
'''

# One 'name=%r' fragment per field; joined to build the __repr__ format.
_repr_template = '{name}=%r'

# One read-only property per field, indented to sit inside the class body.
_field_template = '''\
    {name} = _property(_itemgetter({index:d}), doc='Alias for field number {index:d}')
'''

def namedtuple(typename, field_names, verbose=False, rename=False):
    """Returns a new subclass of tuple with named fields.

    typename is the name of the new class.  field_names is either a sequence
    of names or a single string with names separated by whitespace and/or
    commas.  If verbose is true, the generated class definition is printed.
    If rename is true, invalid or duplicate field names are replaced with
    positional names of the form '_<index>' instead of raising.

    Raises ValueError for a type name or field name that is empty, contains
    characters other than alphanumerics and underscores, is a keyword, or
    starts with a digit; and (unless rename is true) for field names that
    start with an underscore or are duplicated.

    >>> Point = namedtuple('Point', ['x', 'y'])
    >>> Point.__doc__                   # docstring for the new class
    'Point(x, y)'
    >>> p = Point(11, y=22)             # instantiate with positional args or keywords
    >>> p[0] + p[1]                     # indexable like a plain tuple
    33
    >>> x, y = p                        # unpack like a regular tuple
    >>> x, y
    (11, 22)
    >>> p.x + p.y                       # fields also accessible by name
    33
    >>> d = p._asdict()                 # convert to a dictionary
    >>> d['x']
    11
    >>> Point(**d)                      # convert from a dictionary
    Point(x=11, y=22)
    >>> p._replace(x=100)               # _replace() is like str.replace() but targets named fields
    Point(x=100, y=22)

    """

    # Parse and validate the field names.  Validation serves two purposes,
    # generating informative error messages and preventing template injection attacks.
    if isinstance(field_names, str):
        field_names = field_names.replace(',', ' ').split() # names separated by whitespace and/or commas
    field_names = list(map(str, field_names))
    if rename:
        seen = set()
        for index, name in enumerate(field_names):
            if (not all(c.isalnum() or c=='_' for c in name)
                or _iskeyword(name)
                or not name
                or name[0].isdigit()
                or name.startswith('_')
                or name in seen):
                field_names[index] = '_%d' % index
            seen.add(name)
    for name in [typename] + field_names:
        if not all(c.isalnum() or c=='_' for c in name):
            raise ValueError('Type names and field names can only contain alphanumeric characters and underscores: %r' % name)
        if _iskeyword(name):
            raise ValueError('Type names and field names cannot be a keyword: %r' % name)
        # An empty name passes both checks above; reject it here so that it
        # is reported as a ValueError rather than an IndexError from name[0].
        if not name:
            raise ValueError('Type names and field names cannot be empty: %r' % name)
        if name[0].isdigit():
            raise ValueError('Type names and field names cannot start with a number: %r' % name)
    seen = set()
    for name in field_names:
        if name.startswith('_') and not rename:
            raise ValueError('Field names cannot start with an underscore: %r' % name)
        if name in seen:
            raise ValueError('Encountered duplicate field name: %r' % name)
        seen.add(name)

    # Fill-in the class template
    class_definition = _class_template.format(
        typename = typename,
        field_names = tuple(field_names),
        num_fields = len(field_names),
        # "('x', 'y')" -> "x, y"; a single field keeps its trailing comma
        # ("x,") so that "({arg_list})" in the template is still a tuple.
        arg_list = repr(tuple(field_names)).replace("'", "")[1:-1],
        repr_fmt = ', '.join(_repr_template.format(name=name) for name in field_names),
        field_defs = '\n'.join(_field_template.format(index=index, name=name)
                               for index, name in enumerate(field_names))
    )

    # Execute the template string in a temporary namespace and
    # support tracing utilities by setting a value for frame.f_globals['__name__']
    namespace = dict(__name__='namedtuple_%s' % typename)
    try:
        exec(class_definition, namespace)
    except SyntaxError as e:
        # Re-raise with the generated source appended to ease debugging.
        raise SyntaxError(e.msg + ':\n\n' + class_definition)
    result = namespace[typename]
    if verbose:
        print(class_definition)

    # For pickling to work, the __module__ variable needs to be set to the frame
    # where the named tuple is created.  Bypass this step in environments where
    # sys._getframe is not defined (Jython for example) or sys._getframe is not
    # defined for arguments greater than 0 (IronPython).
    try:
        result.__module__ = _sys._getframe(1).f_globals.get('__name__', '__main__')
    except (AttributeError, ValueError):
        pass

    return result
Guido van Rossumd8faa362007-04-27 19:54:29 +0000380
Guido van Rossumd8faa362007-04-27 19:54:29 +0000381
Raymond Hettingerb8baf632009-01-14 02:20:07 +0000382########################################################################
383### Counter
384########################################################################
385
Raymond Hettinger96f34102010-12-15 16:30:37 +0000386def _count_elements(mapping, iterable):
387 'Tally elements from the iterable.'
388 mapping_get = mapping.get
389 for elem in iterable:
390 mapping[elem] = mapping_get(elem, 0) + 1
391
392try: # Load C helper function if available
393 from _collections import _count_elements
394except ImportError:
395 pass
396
Raymond Hettingerb8baf632009-01-14 02:20:07 +0000397class Counter(dict):
398 '''Dict subclass for counting hashable items. Sometimes called a bag
399 or multiset. Elements are stored as dictionary keys and their counts
400 are stored as dictionary values.
401
Raymond Hettinger00d43fd2011-01-02 08:03:33 +0000402 >>> c = Counter('abcdeabcdabcaba') # count elements from a string
Raymond Hettingerb8baf632009-01-14 02:20:07 +0000403
404 >>> c.most_common(3) # three most common elements
Raymond Hettinger00d43fd2011-01-02 08:03:33 +0000405 [('a', 5), ('b', 4), ('c', 3)]
Raymond Hettingerb8baf632009-01-14 02:20:07 +0000406 >>> sorted(c) # list all unique elements
Raymond Hettinger00d43fd2011-01-02 08:03:33 +0000407 ['a', 'b', 'c', 'd', 'e']
Raymond Hettingerb8baf632009-01-14 02:20:07 +0000408 >>> ''.join(sorted(c.elements())) # list elements with repetitions
Raymond Hettinger00d43fd2011-01-02 08:03:33 +0000409 'aaaaabbbbcccdde'
Raymond Hettingerb8baf632009-01-14 02:20:07 +0000410 >>> sum(c.values()) # total of all counts
Raymond Hettinger00d43fd2011-01-02 08:03:33 +0000411 15
Raymond Hettingerb8baf632009-01-14 02:20:07 +0000412
413 >>> c['a'] # count of letter 'a'
414 5
415 >>> for elem in 'shazam': # update counts from an iterable
416 ... c[elem] += 1 # by adding 1 to each element's count
417 >>> c['a'] # now there are seven 'a'
418 7
Raymond Hettinger00d43fd2011-01-02 08:03:33 +0000419 >>> del c['b'] # remove all 'b'
420 >>> c['b'] # now there are zero 'b'
Raymond Hettingerb8baf632009-01-14 02:20:07 +0000421 0
422
423 >>> d = Counter('simsalabim') # make another counter
424 >>> c.update(d) # add in the second counter
425 >>> c['a'] # now there are nine 'a'
426 9
427
428 >>> c.clear() # empty the counter
429 >>> c
430 Counter()
431
432 Note: If a count is set to zero or reduced to zero, it will remain
433 in the counter until the entry is deleted or the counter is cleared:
434
435 >>> c = Counter('aaabbc')
436 >>> c['b'] -= 2 # reduce the count of 'b' by two
437 >>> c.most_common() # 'b' is still in, but its count is zero
438 [('a', 3), ('c', 1), ('b', 0)]
439
440 '''
441 # References:
442 # http://en.wikipedia.org/wiki/Multiset
443 # http://www.gnu.org/software/smalltalk/manual-base/html_node/Bag.html
444 # http://www.demo2s.com/Tutorial/Cpp/0380__set-multiset/Catalog0380__set-multiset.htm
445 # http://code.activestate.com/recipes/259174/
446 # Knuth, TAOCP Vol. II section 4.6.3
447
Raymond Hettinger4d2073a2009-01-20 03:41:22 +0000448 def __init__(self, iterable=None, **kwds):
Raymond Hettingerb8baf632009-01-14 02:20:07 +0000449 '''Create a new, empty Counter object. And if given, count elements
450 from an input iterable. Or, initialize the count from another mapping
451 of elements to their counts.
452
453 >>> c = Counter() # a new, empty counter
454 >>> c = Counter('gallahad') # a new counter from an iterable
455 >>> c = Counter({'a': 4, 'b': 2}) # a new counter from a mapping
Raymond Hettinger4d2073a2009-01-20 03:41:22 +0000456 >>> c = Counter(a=4, b=2) # a new counter from keyword args
Raymond Hettingerb8baf632009-01-14 02:20:07 +0000457
458 '''
Raymond Hettinger00d43fd2011-01-02 08:03:33 +0000459 super().__init__()
Raymond Hettinger4d2073a2009-01-20 03:41:22 +0000460 self.update(iterable, **kwds)
Raymond Hettingerb8baf632009-01-14 02:20:07 +0000461
462 def __missing__(self, key):
463 'The count of elements not in the Counter is zero.'
464 # Needed so that self[missing_item] does not raise KeyError
465 return 0
466
467 def most_common(self, n=None):
468 '''List the n most common elements and their counts from the most
469 common to the least. If n is None, then list all element counts.
470
Raymond Hettinger00d43fd2011-01-02 08:03:33 +0000471 >>> Counter('abcdeabcdabcaba').most_common(3)
472 [('a', 5), ('b', 4), ('c', 3)]
Raymond Hettingerb8baf632009-01-14 02:20:07 +0000473
474 '''
475 # Emulate Bag.sortedByCount from Smalltalk
476 if n is None:
477 return sorted(self.items(), key=_itemgetter(1), reverse=True)
478 return _heapq.nlargest(n, self.items(), key=_itemgetter(1))
479
480 def elements(self):
481 '''Iterator over elements repeating each as many times as its count.
482
483 >>> c = Counter('ABCABC')
484 >>> sorted(c.elements())
485 ['A', 'A', 'B', 'B', 'C', 'C']
486
487 # Knuth's example for prime factors of 1836: 2**2 * 3**3 * 17**1
488 >>> prime_factors = Counter({2: 2, 3: 3, 17: 1})
489 >>> product = 1
490 >>> for factor in prime_factors.elements(): # loop over factors
491 ... product *= factor # and multiply them
492 >>> product
493 1836
494
495 Note, if an element's count has been set to zero or is a negative
496 number, elements() will ignore it.
497
498 '''
499 # Emulate Bag.do from Smalltalk and Multiset.begin from C++.
500 return _chain.from_iterable(_starmap(_repeat, self.items()))
501
502 # Override dict methods where necessary
503
504 @classmethod
505 def fromkeys(cls, iterable, v=None):
506 # There is no equivalent method for counters because setting v=1
507 # means that no element can have a count greater than one.
508 raise NotImplementedError(
509 'Counter.fromkeys() is undefined. Use Counter(iterable) instead.')
510
Raymond Hettinger4d2073a2009-01-20 03:41:22 +0000511 def update(self, iterable=None, **kwds):
Raymond Hettingerb8baf632009-01-14 02:20:07 +0000512 '''Like dict.update() but add counts instead of replacing them.
513
514 Source can be an iterable, a dictionary, or another Counter instance.
515
516 >>> c = Counter('which')
517 >>> c.update('witch') # add elements from another iterable
518 >>> d = Counter('watch')
519 >>> c.update(d) # add elements from another counter
520 >>> c['h'] # four 'h' in which, witch, and watch
521 4
522
523 '''
524 # The regular dict.update() operation makes no sense here because the
525 # replace behavior results in the some of original untouched counts
526 # being mixed-in with all of the other counts for a mismash that
527 # doesn't have a straight-forward interpretation in most counting
Raymond Hettinger4d2073a2009-01-20 03:41:22 +0000528 # contexts. Instead, we implement straight-addition. Both the inputs
529 # and outputs are allowed to contain zero and negative counts.
Raymond Hettingerb8baf632009-01-14 02:20:07 +0000530
531 if iterable is not None:
532 if isinstance(iterable, Mapping):
Raymond Hettingerdd01f8f2009-01-22 09:09:55 +0000533 if self:
Raymond Hettingerf9092022009-06-29 18:30:43 +0000534 self_get = self.get
Raymond Hettingerdd01f8f2009-01-22 09:09:55 +0000535 for elem, count in iterable.items():
Raymond Hettingerf9092022009-06-29 18:30:43 +0000536 self[elem] = count + self_get(elem, 0)
Raymond Hettingerdd01f8f2009-01-22 09:09:55 +0000537 else:
Raymond Hettinger00d43fd2011-01-02 08:03:33 +0000538 super().update(iterable) # fast path when counter is empty
Raymond Hettingerb8baf632009-01-14 02:20:07 +0000539 else:
Raymond Hettinger96f34102010-12-15 16:30:37 +0000540 _count_elements(self, iterable)
Raymond Hettinger4d2073a2009-01-20 03:41:22 +0000541 if kwds:
542 self.update(kwds)
Raymond Hettingerb8baf632009-01-14 02:20:07 +0000543
Raymond Hettinger9c01e442010-04-03 10:32:58 +0000544 def subtract(self, iterable=None, **kwds):
545 '''Like dict.update() but subtracts counts instead of replacing them.
546 Counts can be reduced below zero. Both the inputs and outputs are
547 allowed to contain zero and negative counts.
548
549 Source can be an iterable, a dictionary, or another Counter instance.
550
551 >>> c = Counter('which')
552 >>> c.subtract('witch') # subtract elements from another iterable
553 >>> c.subtract(Counter('watch')) # subtract elements from another counter
554 >>> c['h'] # 2 in which, minus 1 in witch, minus 1 in watch
555 0
556 >>> c['w'] # 1 in which, minus 1 in witch, minus 1 in watch
557 -1
558
559 '''
560 if iterable is not None:
Raymond Hettingerfc3c9cd2010-04-11 20:41:56 +0000561 self_get = self.get
Raymond Hettinger9c01e442010-04-03 10:32:58 +0000562 if isinstance(iterable, Mapping):
Raymond Hettinger9c01e442010-04-03 10:32:58 +0000563 for elem, count in iterable.items():
564 self[elem] = self_get(elem, 0) - count
565 else:
Raymond Hettinger9c01e442010-04-03 10:32:58 +0000566 for elem in iterable:
567 self[elem] = self_get(elem, 0) - 1
568 if kwds:
569 self.subtract(kwds)
570
Raymond Hettingerb8baf632009-01-14 02:20:07 +0000571 def copy(self):
Raymond Hettinger1c746c22011-04-15 13:16:46 -0700572 'Return a shallow copy.'
573 return self.__class__(self)
Raymond Hettingerb8baf632009-01-14 02:20:07 +0000574
Raymond Hettingerff728162011-01-03 02:44:14 +0000575 def __reduce__(self):
576 return self.__class__, (dict(self),)
577
Raymond Hettinger4d2073a2009-01-20 03:41:22 +0000578 def __delitem__(self, elem):
579 'Like dict.__delitem__() but does not raise KeyError for missing values.'
580 if elem in self:
Raymond Hettinger00d43fd2011-01-02 08:03:33 +0000581 super().__delitem__(elem)
Raymond Hettinger4d2073a2009-01-20 03:41:22 +0000582
Raymond Hettingerb8baf632009-01-14 02:20:07 +0000583 def __repr__(self):
584 if not self:
585 return '%s()' % self.__class__.__name__
Raymond Hettinger4e6bf412011-11-05 13:35:26 -0700586 try:
587 items = ', '.join(map('%r: %r'.__mod__, self.most_common()))
588 return '%s({%s})' % (self.__class__.__name__, items)
589 except TypeError:
590 # handle case where values are not orderable
591 return '{0}({1!r})'.format(self.__class__.__name__, dict(self))
Raymond Hettingerb8baf632009-01-14 02:20:07 +0000592
Raymond Hettinger4d2073a2009-01-20 03:41:22 +0000593 # Multiset-style mathematical operations discussed in:
594 # Knuth TAOCP Volume II section 4.6.3 exercise 19
595 # and at http://en.wikipedia.org/wiki/Multiset
596 #
Raymond Hettinger4d2073a2009-01-20 03:41:22 +0000597 # Outputs guaranteed to only include positive counts.
598 #
599 # To strip negative and zero counts, add-in an empty counter:
600 # c += Counter()
601
602 def __add__(self, other):
603 '''Add counts from two counters.
604
605 >>> Counter('abbb') + Counter('bcc')
606 Counter({'b': 4, 'c': 2, 'a': 1})
607
608 '''
609 if not isinstance(other, Counter):
610 return NotImplemented
611 result = Counter()
Raymond Hettinger2876a8c2011-04-17 19:46:46 -0700612 for elem, count in self.items():
613 newcount = count + other[elem]
Raymond Hettinger4d2073a2009-01-20 03:41:22 +0000614 if newcount > 0:
615 result[elem] = newcount
Raymond Hettinger2876a8c2011-04-17 19:46:46 -0700616 for elem, count in other.items():
617 if elem not in self and count > 0:
618 result[elem] = count
Raymond Hettinger4d2073a2009-01-20 03:41:22 +0000619 return result
620
621 def __sub__(self, other):
622 ''' Subtract count, but keep only results with positive counts.
623
624 >>> Counter('abbbc') - Counter('bccd')
625 Counter({'b': 2, 'a': 1})
626
627 '''
628 if not isinstance(other, Counter):
629 return NotImplemented
630 result = Counter()
Raymond Hettinger2876a8c2011-04-17 19:46:46 -0700631 for elem, count in self.items():
632 newcount = count - other[elem]
Raymond Hettinger4d2073a2009-01-20 03:41:22 +0000633 if newcount > 0:
634 result[elem] = newcount
Raymond Hettinger2876a8c2011-04-17 19:46:46 -0700635 for elem, count in other.items():
636 if elem not in self and count < 0:
637 result[elem] = 0 - count
Raymond Hettinger4d2073a2009-01-20 03:41:22 +0000638 return result
639
640 def __or__(self, other):
641 '''Union is the maximum of value in either of the input counters.
642
643 >>> Counter('abbb') | Counter('bcc')
644 Counter({'b': 3, 'c': 2, 'a': 1})
645
646 '''
647 if not isinstance(other, Counter):
648 return NotImplemented
Raymond Hettinger4d2073a2009-01-20 03:41:22 +0000649 result = Counter()
Raymond Hettinger2876a8c2011-04-17 19:46:46 -0700650 for elem, count in self.items():
651 other_count = other[elem]
652 newcount = other_count if count < other_count else count
Raymond Hettinger4d2073a2009-01-20 03:41:22 +0000653 if newcount > 0:
654 result[elem] = newcount
Raymond Hettinger2876a8c2011-04-17 19:46:46 -0700655 for elem, count in other.items():
656 if elem not in self and count > 0:
657 result[elem] = count
Raymond Hettinger4d2073a2009-01-20 03:41:22 +0000658 return result
659
660 def __and__(self, other):
661 ''' Intersection is the minimum of corresponding counts.
662
663 >>> Counter('abbb') & Counter('bcc')
664 Counter({'b': 1})
665
666 '''
667 if not isinstance(other, Counter):
668 return NotImplemented
Raymond Hettinger4d2073a2009-01-20 03:41:22 +0000669 result = Counter()
Raymond Hettinger2876a8c2011-04-17 19:46:46 -0700670 for elem, count in self.items():
671 other_count = other[elem]
672 newcount = count if count < other_count else other_count
Raymond Hettinger4d2073a2009-01-20 03:41:22 +0000673 if newcount > 0:
674 result[elem] = newcount
675 return result


########################################################################
### ChainMap (helper for configparser)
########################################################################

class _ChainMap(MutableMapping):
    ''' A ChainMap groups multiple dicts (or other mappings) together
    to create a single, updateable view.

    The underlying mappings are stored in a list.  That list is public and can
    be accessed or updated using the *maps* attribute.  There is no other state.

    Lookups search the underlying mappings successively until a key is found.
    In contrast, writes, updates, and deletions only operate on the first
    mapping.

    '''

    def __init__(self, *maps):
        '''Initialize a ChainMap by setting *maps* to the given mappings.
        If no mappings are provided, a single empty dictionary is used.

        '''
        self.maps = list(maps) if maps else [{}]    # always at least one map

    def __missing__(self, key):
        raise KeyError(key)

    def __getitem__(self, key):
        for mapping in self.maps:
            try:
                value = mapping[key]    # can't use 'key in mapping' with defaultdict
            except KeyError:
                continue
            else:
                return value
        return self.__missing__(key)    # support subclasses that define __missing__

    def get(self, key, default=None):
        if key in self:
            return self[key]
        return default

    def __len__(self):
        distinct_keys = set().union(*self.maps)     # reuses stored hash values if possible
        return len(distinct_keys)

    def __iter__(self):
        distinct_keys = set().union(*self.maps)
        return iter(distinct_keys)

    def __contains__(self, key):
        for mapping in self.maps:
            if key in mapping:
                return True
        return False

    def __bool__(self):
        # True as soon as any underlying mapping is non-empty.
        for mapping in self.maps:
            if mapping:
                return True
        return False

    @_recursive_repr()
    def __repr__(self):
        inner = ', '.join(repr(mapping) for mapping in self.maps)
        return '{0.__class__.__name__}({1})'.format(self, inner)

    @classmethod
    def fromkeys(cls, iterable, *args):
        'Create a ChainMap with a single dict created from the iterable.'
        seed = dict.fromkeys(iterable, *args)
        return cls(seed)

    def copy(self):
        'New ChainMap or subclass with a new copy of maps[0] and refs to maps[1:]'
        first, rest = self.maps[0], self.maps[1:]
        return self.__class__(first.copy(), *rest)

    __copy__ = copy

    def new_child(self):                        # like Django's Context.push()
        'New ChainMap with a new dict followed by all previous maps.'
        fresh = {}
        return self.__class__(fresh, *self.maps)

    @property
    def parents(self):                          # like Django's Context.pop()
        'New ChainMap from maps[1:].'
        ancestors = self.maps[1:]
        return self.__class__(*ancestors)

    def __setitem__(self, key, value):
        first = self.maps[0]
        first[key] = value

    def __delitem__(self, key):
        first = self.maps[0]
        try:
            del first[key]
        except KeyError:
            raise KeyError('Key not found in the first mapping: {!r}'.format(key))

    def popitem(self):
        'Remove and return an item pair from maps[0]. Raise KeyError if maps[0] is empty.'
        first = self.maps[0]
        try:
            return first.popitem()
        except KeyError:
            raise KeyError('No keys found in the first mapping.')

    def pop(self, key, *args):
        'Remove *key* from maps[0] and return its value. Raise KeyError if *key* not in maps[0].'
        first = self.maps[0]
        try:
            return first.pop(key, *args)
        except KeyError:
            raise KeyError('Key not found in the first mapping: {!r}'.format(key))

    def clear(self):
        'Clear maps[0], leaving maps[1:] intact.'
        first = self.maps[0]
        first.clear()


################################################################################
### UserDict
################################################################################

class UserDict(MutableMapping):
    'Mapping wrapper that keeps its contents in a regular dict stored as self.data.'

    # Start by filling-out the abstract methods
    def __init__(self, dict=None, **kwargs):
        self.data = {}
        if dict is not None:
            self.update(dict)
        if kwargs:
            self.update(kwargs)

    def __len__(self):
        return len(self.data)

    def __getitem__(self, key):
        contents = self.data
        if key in contents:
            return contents[key]
        # Fall back to a class-level __missing__ hook when one is defined.
        cls = self.__class__
        if not hasattr(cls, "__missing__"):
            raise KeyError(key)
        return cls.__missing__(self, key)

    def __setitem__(self, key, item):
        self.data[key] = item

    def __delitem__(self, key):
        del self.data[key]

    def __iter__(self):
        return iter(self.data)

    # Modify __contains__ to work correctly when __missing__ is present
    def __contains__(self, key):
        return key in self.data

    # Now, add the methods in dicts but not in MutableMapping
    def __repr__(self):
        return repr(self.data)

    def copy(self):
        if self.__class__ is UserDict:
            return UserDict(self.data.copy())
        import copy
        # Temporarily swap in an empty dict so copy.copy() clones the instance
        # without its contents; the items are then re-added through update().
        saved = self.data
        try:
            self.data = {}
            duplicate = copy.copy(self)
        finally:
            self.data = saved
        duplicate.update(self)
        return duplicate

    @classmethod
    def fromkeys(cls, iterable, value=None):
        result = cls()
        for key in iterable:
            result[key] = value
        return result



################################################################################
### UserList
################################################################################

class UserList(MutableSequence):
    """A more or less complete user-defined wrapper around list objects.

    The wrapped list is stored in the public *data* attribute and every
    operation is forwarded to it.  Operations that build a new sequence
    (concatenation, repetition, slicing) return an instance of the
    receiver's own class.
    """

    def __init__(self, initlist=None):
        """Start empty, or with a copy of the items of *initlist*."""
        self.data = []
        if initlist is not None:
            # XXX should this accept an arbitrary sequence?
            if type(initlist) == type(self.data):
                self.data[:] = initlist
            elif isinstance(initlist, UserList):
                self.data[:] = initlist.data[:]
            else:
                self.data = list(initlist)

    def __repr__(self):
        return repr(self.data)

    # Comparisons unwrap another UserList so that the underlying lists
    # are compared directly.
    def __lt__(self, other):
        return self.data < self.__cast(other)

    def __le__(self, other):
        return self.data <= self.__cast(other)

    def __eq__(self, other):
        return self.data == self.__cast(other)

    def __ne__(self, other):
        return self.data != self.__cast(other)

    def __gt__(self, other):
        return self.data > self.__cast(other)

    def __ge__(self, other):
        return self.data >= self.__cast(other)

    def __cast(self, other):
        return other.data if isinstance(other, UserList) else other

    def __contains__(self, item):
        return item in self.data

    def __len__(self):
        return len(self.data)

    def __getitem__(self, i):
        """Return the item at index *i*, or a new instance for a slice.

        Slicing previously leaked a plain list, silently dropping the
        wrapper (and any subclass) type; a slice now yields
        ``self.__class__`` just like ``+`` and ``*`` do.
        """
        if isinstance(i, slice):
            return self.__class__(self.data[i])
        return self.data[i]

    def __setitem__(self, i, item):
        self.data[i] = item

    def __delitem__(self, i):
        del self.data[i]

    def __add__(self, other):
        if isinstance(other, UserList):
            return self.__class__(self.data + other.data)
        elif isinstance(other, type(self.data)):
            return self.__class__(self.data + other)
        return self.__class__(self.data + list(other))

    def __radd__(self, other):
        if isinstance(other, UserList):
            return self.__class__(other.data + self.data)
        elif isinstance(other, type(self.data)):
            return self.__class__(other + self.data)
        return self.__class__(list(other) + self.data)

    def __iadd__(self, other):
        if isinstance(other, UserList):
            self.data += other.data
        elif isinstance(other, type(self.data)):
            self.data += other
        else:
            self.data += list(other)
        return self

    def __mul__(self, n):
        return self.__class__(self.data * n)

    __rmul__ = __mul__

    def __imul__(self, n):
        self.data *= n
        return self

    def append(self, item):
        self.data.append(item)

    def insert(self, i, item):
        self.data.insert(i, item)

    def pop(self, i=-1):
        return self.data.pop(i)

    def remove(self, item):
        self.data.remove(item)

    def count(self, item):
        return self.data.count(item)

    def index(self, item, *args):
        return self.data.index(item, *args)

    def reverse(self):
        self.data.reverse()

    def sort(self, *args, **kwds):
        self.data.sort(*args, **kwds)

    def extend(self, other):
        if isinstance(other, UserList):
            self.data.extend(other.data)
        else:
            self.data.extend(other)



################################################################################
### UserString
################################################################################

class UserString(Sequence):
    """String-like wrapper that keeps the wrapped text in the *data* attribute.

    Methods that build a new string return an instance of the receiver's
    own class.  Methods that answer a question (searches, predicates,
    splits, ...) and encode() return the result of the corresponding str
    method unchanged.
    """

    def __init__(self, seq):
        """Wrap *seq*: a str is used as is, anything else goes through str()."""
        if isinstance(seq, str):
            self.data = seq
        elif isinstance(seq, UserString):
            self.data = seq.data[:]
        else:
            self.data = str(seq)

    def __str__(self): return str(self.data)
    def __repr__(self): return repr(self.data)
    def __int__(self): return int(self.data)
    def __float__(self): return float(self.data)
    def __complex__(self): return complex(self.data)
    def __hash__(self): return hash(self.data)

    # Comparisons unwrap another UserString and compare the plain strings.
    def __eq__(self, string):
        if isinstance(string, UserString):
            return self.data == string.data
        return self.data == string

    def __ne__(self, string):
        if isinstance(string, UserString):
            return self.data != string.data
        return self.data != string

    def __lt__(self, string):
        if isinstance(string, UserString):
            return self.data < string.data
        return self.data < string

    def __le__(self, string):
        if isinstance(string, UserString):
            return self.data <= string.data
        return self.data <= string

    def __gt__(self, string):
        if isinstance(string, UserString):
            return self.data > string.data
        return self.data > string

    def __ge__(self, string):
        if isinstance(string, UserString):
            return self.data >= string.data
        return self.data >= string

    def __contains__(self, char):
        if isinstance(char, UserString):
            char = char.data
        return char in self.data

    def __len__(self): return len(self.data)
    def __getitem__(self, index): return self.__class__(self.data[index])

    def __add__(self, other):
        if isinstance(other, UserString):
            return self.__class__(self.data + other.data)
        elif isinstance(other, str):
            return self.__class__(self.data + other)
        return self.__class__(self.data + str(other))

    def __radd__(self, other):
        if isinstance(other, str):
            return self.__class__(other + self.data)
        return self.__class__(str(other) + self.data)

    def __mul__(self, n):
        return self.__class__(self.data * n)

    __rmul__ = __mul__

    def __mod__(self, args):
        return self.__class__(self.data % args)

    # the following methods are defined in alphabetical order:
    def capitalize(self): return self.__class__(self.data.capitalize())

    def center(self, width, *args):
        return self.__class__(self.data.center(width, *args))

    def count(self, sub, start=0, end=_sys.maxsize):
        if isinstance(sub, UserString):
            sub = sub.data
        return self.data.count(sub, start, end)

    def encode(self, encoding=None, errors=None):
        """Return the wrapped text encoded to bytes.

        *encoding* defaults to 'utf-8' and *errors* to 'strict' when they
        are omitted (or None).  The result is a real bytes object: wrapping
        it in the string class, as was done before, ran str() over the
        bytes and produced text such as "b'abc'".  *errors* is now honoured
        even when *encoding* is left at its default.
        """
        encoding = encoding or 'utf-8'
        errors = errors or 'strict'
        return self.data.encode(encoding, errors)

    def endswith(self, suffix, start=0, end=_sys.maxsize):
        return self.data.endswith(suffix, start, end)

    def expandtabs(self, tabsize=8):
        return self.__class__(self.data.expandtabs(tabsize))

    def find(self, sub, start=0, end=_sys.maxsize):
        if isinstance(sub, UserString):
            sub = sub.data
        return self.data.find(sub, start, end)

    def format(self, *args, **kwds):
        return self.data.format(*args, **kwds)

    def index(self, sub, start=0, end=_sys.maxsize):
        # Unwrap a UserString argument, as find() and count() already do.
        if isinstance(sub, UserString):
            sub = sub.data
        return self.data.index(sub, start, end)

    def isalpha(self): return self.data.isalpha()
    def isalnum(self): return self.data.isalnum()
    def isdecimal(self): return self.data.isdecimal()
    def isdigit(self): return self.data.isdigit()
    def isidentifier(self): return self.data.isidentifier()
    def islower(self): return self.data.islower()
    def isnumeric(self): return self.data.isnumeric()
    def isspace(self): return self.data.isspace()
    def istitle(self): return self.data.istitle()
    def isupper(self): return self.data.isupper()
    def join(self, seq): return self.data.join(seq)

    def ljust(self, width, *args):
        return self.__class__(self.data.ljust(width, *args))

    def lower(self): return self.__class__(self.data.lower())
    def lstrip(self, chars=None): return self.__class__(self.data.lstrip(chars))

    def partition(self, sep):
        return self.data.partition(sep)

    def replace(self, old, new, maxsplit=-1):
        if isinstance(old, UserString):
            old = old.data
        if isinstance(new, UserString):
            new = new.data
        return self.__class__(self.data.replace(old, new, maxsplit))

    def rfind(self, sub, start=0, end=_sys.maxsize):
        if isinstance(sub, UserString):
            sub = sub.data
        return self.data.rfind(sub, start, end)

    def rindex(self, sub, start=0, end=_sys.maxsize):
        # Unwrap a UserString argument, as rfind() already does.
        if isinstance(sub, UserString):
            sub = sub.data
        return self.data.rindex(sub, start, end)

    def rjust(self, width, *args):
        return self.__class__(self.data.rjust(width, *args))

    def rpartition(self, sep):
        return self.data.rpartition(sep)

    def rstrip(self, chars=None):
        return self.__class__(self.data.rstrip(chars))

    def split(self, sep=None, maxsplit=-1):
        return self.data.split(sep, maxsplit)

    def rsplit(self, sep=None, maxsplit=-1):
        return self.data.rsplit(sep, maxsplit)

    def splitlines(self, keepends=0): return self.data.splitlines(keepends)

    def startswith(self, prefix, start=0, end=_sys.maxsize):
        return self.data.startswith(prefix, start, end)

    def strip(self, chars=None): return self.__class__(self.data.strip(chars))
    def swapcase(self): return self.__class__(self.data.swapcase())
    def title(self): return self.__class__(self.data.title())

    def translate(self, *args):
        return self.__class__(self.data.translate(*args))

    def upper(self): return self.__class__(self.data.upper())
    def zfill(self, width): return self.__class__(self.data.zfill(width))



################################################################################
### Simple tests
################################################################################

if __name__ == '__main__':
    # verify that instances can be pickled
    from pickle import loads, dumps
    Point = namedtuple('Point', 'x, y', True)
    p = Point(x=10, y=20)
    pickled = dumps(p)
    assert p == loads(pickled)

    # test and demonstrate ability to override methods
    class Point(namedtuple('Point', 'x y')):
        __slots__ = ()

        @property
        def hypot(self):
            return (self.x ** 2 + self.y ** 2) ** 0.5

        def __str__(self):
            return 'Point: x=%6.3f  y=%6.3f  hypot=%6.3f' % (self.x, self.y, self.hypot)

    for sample in (Point(3, 4), Point(14, 5 / 7.)):
        print(sample)

    class Point(namedtuple('Point', 'x y')):
        'Point class with optimized _make() and _replace() without error-checking'
        __slots__ = ()
        _make = classmethod(tuple.__new__)

        def _replace(self, _map=map, **kwds):
            return self._make(_map(kwds.get, ('x', 'y'), self))

    replaced = Point(11, 22)._replace(x=100)
    print(replaced)

    # extend an existing field list with one more field
    Point3D = namedtuple('Point3D', Point._fields + ('z',))
    print(Point3D.__doc__)

    # run the doctests embedded in this module's docstrings
    import doctest
    TestResults = namedtuple('TestResults', 'failed attempted')
    outcome = doctest.testmod()
    print(TestResults(*outcome))