blob: 2b6abd879fc939deacc88302d883dcfd6d20e699 [file] [log] [blame]
Brett Cannon23a4a7b2008-05-12 00:56:28 +00001__all__ = ['deque', 'defaultdict', 'namedtuple', 'UserDict', 'UserList',
Raymond Hettinger2d32f632009-03-02 21:24:57 +00002 'UserString', 'Counter', 'OrderedDict']
Guido van Rossumcd16bf62007-06-13 18:07:49 +00003# For bootstrapping reasons, the collection ABCs are defined in _abcoll.py.
4# They should however be considered an integral part of collections.py.
5from _abcoll import *
6import _abcoll
7__all__ += _abcoll.__all__
8
Christian Heimes99170a52007-12-19 02:07:34 +00009from _collections import deque, defaultdict
10from operator import itemgetter as _itemgetter
11from keyword import iskeyword as _iskeyword
12import sys as _sys
Raymond Hettingerb8baf632009-01-14 02:20:07 +000013import heapq as _heapq
Raymond Hettingerfa11db02010-09-12 04:12:42 +000014from weakref import proxy as _proxy
Raymond Hettingerea9f8db2009-03-02 21:28:41 +000015from itertools import repeat as _repeat, chain as _chain, starmap as _starmap
Raymond Hettinger98a5f3f2010-09-13 21:36:00 +000016from reprlib import recursive_repr as _recursive_repr
Raymond Hettinger2d32f632009-03-02 21:24:57 +000017
18################################################################################
19### OrderedDict
20################################################################################
21
class _Link(object):
    # One node of the circular doubly linked list that records key order.
    # '__weakref__' is listed so that weakref proxies to a link can be made.
    __slots__ = 'prev', 'next', 'key', '__weakref__'

class OrderedDict(dict):
    'Dictionary that remembers insertion order'
    # An inherited dict maps keys to values.
    # The inherited dict provides __getitem__, __len__, __contains__, and get.
    # The remaining methods are order-aware.
    # Big-O running times for all methods are the same as regular dictionaries.

    # The internal self.__map dict maps keys to links in a doubly linked list.
    # The circular doubly linked list starts and ends with a sentinel element.
    # The sentinel element never gets deleted (this simplifies the algorithm).
    # The sentinel is in self.__hardroot with a weakref proxy in self.__root.
    # Every 'prev' slot holds a weakref proxy, and every 'next' slot that
    # points back at the sentinel holds the self.__root proxy, so the list
    # never forms a cycle of hard references.
    # Individual links are kept alive by the hard reference in self.__map.
    # Those hard references disappear when a key is deleted from an OrderedDict.

    def __init__(self, *args, **kwds):
        '''Initialize an ordered dictionary.  The signature is the same as
        regular dictionaries, but keyword arguments are not recommended because
        their insertion order is arbitrary.

        Raises TypeError if more than one positional argument is given.

        '''
        if len(args) > 1:
            raise TypeError('expected at most 1 arguments, got %d' % len(args))
        try:
            # __init__ may be called again on a live instance; only build the
            # sentinel and the key->link map the first time.
            self.__root
        except AttributeError:
            self.__hardroot = _Link()
            self.__root = root = _proxy(self.__hardroot)
            root.prev = root.next = root
            self.__map = {}
        self.__update(*args, **kwds)

    def __setitem__(self, key, value,
                    dict_setitem=dict.__setitem__, proxy=_proxy, Link=_Link):
        'od.__setitem__(i, y) <==> od[i]=y'
        # Setting a new item creates a new link at the end of the linked list,
        # and the inherited dictionary is updated with the new key/value pair.
        if key not in self:
            self.__map[key] = link = Link()
            root = self.__root
            last = root.prev
            link.prev, link.next, link.key = last, root, key
            last.next = link
            # Backward pointers are always weak proxies.
            root.prev = proxy(link)
        dict_setitem(self, key, value)

    def __delitem__(self, key, dict_delitem=dict.__delitem__):
        'od.__delitem__(y) <==> del od[y]'
        # Deleting an existing item uses self.__map to find the link which gets
        # removed by updating the links in the predecessor and successor nodes.
        # dict_delitem runs first so a missing key raises KeyError before the
        # linked list is touched.
        dict_delitem(self, key)
        link = self.__map.pop(key)
        link_prev = link.prev
        link_next = link.next
        link_prev.next = link_next
        link_next.prev = link_prev

    def __iter__(self):
        'od.__iter__() <==> iter(od)'
        # Traverse the linked list in order.
        root = self.__root
        curr = root.next
        while curr is not root:
            yield curr.key
            curr = curr.next

    def __reversed__(self):
        'od.__reversed__() <==> reversed(od)'
        # Traverse the linked list in reverse order.
        root = self.__root
        curr = root.prev
        while curr is not root:
            yield curr.key
            curr = curr.prev

    def clear(self):
        'od.clear() -> None.  Remove all items from od.'
        root = self.__root
        root.prev = root.next = root
        self.__map.clear()
        dict.clear(self)

    def popitem(self, last=True):
        '''od.popitem() -> (k, v), return and remove a (key, value) pair.
        Pairs are returned in LIFO order if last is true or FIFO order if false.

        Raises KeyError if the dictionary is empty.

        '''
        if not self:
            raise KeyError('dictionary is empty')
        root = self.__root
        if last:
            link = root.prev
            link_prev = link.prev
            link_prev.next = root
            root.prev = link_prev
        else:
            link = root.next
            link_next = link.next
            root.next = link_next
            link_next.prev = root
        # Read the key before dropping the hard reference held by self.__map;
        # 'link' may be only a weak proxy at this point.
        key = link.key
        del self.__map[key]
        value = dict.pop(self, key)
        return key, value

    def move_to_end(self, key, last=True):
        '''Move an existing element to the end (or beginning if last==False).

        Raises KeyError if the element does not exist.
        When last=True, acts like a fast version of self[key]=self.pop(key).

        '''
        link = self.__map[key]
        # Only a weak proxy may be stored in a 'prev' slot; storing the link
        # itself would create a cycle of hard references between neighbours.
        soft_link = _proxy(link)
        # Unlink from the current position.
        link_prev = link.prev
        link_next = link.next
        link_prev.next = link_next
        link_next.prev = link_prev
        root = self.__root
        if last:
            # Splice in just before the sentinel.
            last = root.prev
            link.prev = last
            link.next = root
            root.prev = soft_link
            last.next = link
        else:
            # Splice in just after the sentinel.
            first = root.next
            link.prev = root
            link.next = first
            first.prev = soft_link
            root.next = link

    def __sizeof__(self):
        'Return an estimate of the memory used, including the linked list.'
        sizeof = _sys.getsizeof
        n = len(self) + 1                       # number of links including root
        size = sizeof(self.__dict__)            # instance dictionary
        size += sizeof(self.__map) * 2          # internal dict and inherited dict
        size += sizeof(self.__hardroot) * n     # link objects
        size += sizeof(self.__root) * n         # proxy objects
        return size

    # The private alias keeps __init__ working even when a subclass
    # overrides update().
    update = __update = MutableMapping.update
    keys = MutableMapping.keys
    values = MutableMapping.values
    items = MutableMapping.items
    __ne__ = MutableMapping.__ne__

    # Sentinel distinguishing "no default supplied" from default=None in pop().
    __marker = object()

    def pop(self, key, default=__marker):
        '''od.pop(k[,d]) -> v, remove specified key and return the corresponding
        value.  If key is not found, d is returned if given, otherwise KeyError
        is raised.

        '''
        if key in self:
            result = self[key]
            del self[key]
            return result
        if default is self.__marker:
            raise KeyError(key)
        return default

    def setdefault(self, key, default=None):
        'od.setdefault(k[,d]) -> od.get(k,d), also set od[k]=d if k not in od'
        if key in self:
            return self[key]
        self[key] = default
        return default

    @_recursive_repr()
    def __repr__(self):
        'od.__repr__() <==> repr(od)'
        if not self:
            return '%s()' % (self.__class__.__name__,)
        return '%s(%r)' % (self.__class__.__name__, list(self.items()))

    def __reduce__(self):
        'Return state information for pickling'
        items = [[k, self[k]] for k in self]
        inst_dict = vars(self).copy()
        # Drop the bookkeeping attributes every OrderedDict has; they are
        # rebuilt by __init__ when the items are replayed.
        for k in vars(OrderedDict()):
            inst_dict.pop(k, None)
        if inst_dict:
            return (self.__class__, (items,), inst_dict)
        return self.__class__, (items,)

    def copy(self):
        'od.copy() -> a shallow copy of od'
        return self.__class__(self)

    @classmethod
    def fromkeys(cls, iterable, value=None):
        '''OD.fromkeys(S[, v]) -> New ordered dictionary with keys from S.
        If not specified, the value defaults to None.

        '''
        self = cls()
        for key in iterable:
            self[key] = value
        return self

    def __eq__(self, other):
        '''od.__eq__(y) <==> od==y.  Comparison to another OD is order-sensitive
        while comparison to a regular mapping is order-insensitive.

        '''
        if isinstance(other, OrderedDict):
            return len(self)==len(other) and \
                   all(p==q for p, q in zip(self.items(), other.items()))
        return dict.__eq__(self, other)
233
Christian Heimes99170a52007-12-19 02:07:34 +0000234
Raymond Hettinger48b8b662008-02-05 01:53:00 +0000235################################################################################
236### namedtuple
237################################################################################
238
# Source template for the generated class; filled in by namedtuple() with
# str.format and then executed.
_class_template = '''\
from builtins import property as _property, tuple as _tuple
from operator import itemgetter as _itemgetter
from collections import OrderedDict

class {typename}(tuple):
    '{typename}({arg_list})'

    __slots__ = ()

    _fields = {field_names!r}

    def __new__(_cls, {arg_list}):
        'Create new instance of {typename}({arg_list})'
        return _tuple.__new__(_cls, ({arg_list}))

    @classmethod
    def _make(cls, iterable, new=tuple.__new__, len=len):
        'Make a new {typename} object from a sequence or iterable'
        result = new(cls, iterable)
        if len(result) != {num_fields:d}:
            raise TypeError('Expected {num_fields:d} arguments, got %d' % len(result))
        return result

    def __repr__(self):
        'Return a nicely formatted representation string'
        return self.__class__.__name__ + '({repr_fmt})' % self

    def _asdict(self):
        'Return a new OrderedDict which maps field names to their values'
        return OrderedDict(zip(self._fields, self))

    __dict__ = property(_asdict)

    def _replace(_self, **kwds):
        'Return a new {typename} object replacing specified fields with new values'
        result = _self._make(map(kwds.pop, {field_names!r}, _self))
        if kwds:
            raise ValueError('Got unexpected field names: %r' % list(kwds))
        return result

    def __getnewargs__(self):
        'Return self as a plain tuple.  Used by copy and pickle.'
        return tuple(self)

{field_defs}
'''

# One "name=%r" fragment per field; joined to build the __repr__ format.
_repr_template = '{name}=%r'

# One read-only property per field, indexing into the underlying tuple.
_field_template = '''\
    {name} = _property(_itemgetter({index:d}), doc='Alias for field number {index:d}')
'''

def namedtuple(typename, field_names, verbose=False, rename=False):
    """Returns a new subclass of tuple with named fields.

    typename is the name of the new class.  field_names is either a sequence
    of names or a single string with names separated by whitespace and/or
    commas.  If verbose is true, the generated class source is printed.  If
    rename is true, invalid or duplicate field names are replaced by
    positional names of the form '_<index>'.

    Raises ValueError for a type or field name that is empty, is a keyword,
    starts with a digit, or contains characters other than alphanumerics and
    underscores; and (unless rename is true) for a field name that starts
    with an underscore or is duplicated.

    >>> Point = namedtuple('Point', ['x', 'y'])
    >>> Point.__doc__                   # docstring for the new class
    'Point(x, y)'
    >>> p = Point(11, y=22)             # instantiate with positional args or keywords
    >>> p[0] + p[1]                     # indexable like a plain tuple
    33
    >>> x, y = p                        # unpack like a regular tuple
    >>> x, y
    (11, 22)
    >>> p.x + p.y                       # fields also accessible by name
    33
    >>> d = p._asdict()                 # convert to a dictionary
    >>> d['x']
    11
    >>> Point(**d)                      # convert from a dictionary
    Point(x=11, y=22)
    >>> p._replace(x=100)               # _replace() is like str.replace() but targets named fields
    Point(x=100, y=22)

    """

    # Parse and validate the field names.  Validation serves two purposes,
    # generating informative error messages and preventing template injection attacks.
    if isinstance(field_names, str):
        field_names = field_names.replace(',', ' ').split() # names separated by whitespace and/or commas
    field_names = list(map(str, field_names))
    if rename:
        seen = set()
        for index, name in enumerate(field_names):
            if (not all(c.isalnum() or c=='_' for c in name)
                or _iskeyword(name)
                or not name
                or name[0].isdigit()
                or name.startswith('_')
                or name in seen):
                field_names[index] = '_%d' % index
            seen.add(name)
    for name in [typename] + field_names:
        if not all(c.isalnum() or c=='_' for c in name):
            raise ValueError('Type names and field names can only contain alphanumeric characters and underscores: %r' % name)
        if _iskeyword(name):
            raise ValueError('Type names and field names cannot be a keyword: %r' % name)
        # An empty name passes the two checks above; reject it here so that
        # name[0] below cannot raise IndexError.
        if not name:
            raise ValueError('Type names and field names cannot be empty: %r' % name)
        if name[0].isdigit():
            raise ValueError('Type names and field names cannot start with a number: %r' % name)
    seen = set()
    for name in field_names:
        if name.startswith('_') and not rename:
            raise ValueError('Field names cannot start with an underscore: %r' % name)
        if name in seen:
            raise ValueError('Encountered duplicate field name: %r' % name)
        seen.add(name)

    # Fill-in the class template
    class_definition = _class_template.format(
        typename = typename,
        field_names = tuple(field_names),
        num_fields = len(field_names),
        # "('x', 'y')" -> "x, y"; a single field yields "x," which is still a
        # valid parameter list and tuple display.
        arg_list = repr(tuple(field_names)).replace("'", "")[1:-1],
        repr_fmt = ', '.join(_repr_template.format(name=name) for name in field_names),
        field_defs = '\n'.join(_field_template.format(index=index, name=name)
                               for index, name in enumerate(field_names))
    )

    # Execute the template string in a temporary namespace and
    # support tracing utilities by setting a value for frame.f_globals['__name__']
    namespace = dict(__name__='namedtuple_%s' % typename)
    try:
        exec(class_definition, namespace)
    except SyntaxError as e:
        # Re-raise with the generated source attached to ease debugging.
        raise SyntaxError(e.msg + ':\n\n' + class_definition)
    result = namespace[typename]
    if verbose:
        print(class_definition)

    # For pickling to work, the __module__ variable needs to be set to the frame
    # where the named tuple is created.  Bypass this step in environments where
    # sys._getframe is not defined (Jython for example) or sys._getframe is not
    # defined for arguments greater than 0 (IronPython).
    try:
        result.__module__ = _sys._getframe(1).f_globals.get('__name__', '__main__')
    except (AttributeError, ValueError):
        pass

    return result
Guido van Rossumd8faa362007-04-27 19:54:29 +0000380
Guido van Rossumd8faa362007-04-27 19:54:29 +0000381
Raymond Hettingerb8baf632009-01-14 02:20:07 +0000382########################################################################
383### Counter
384########################################################################
385
def _count_elements(mapping, iterable):
    'Increment mapping[item] once for every item produced by iterable.'
    # Items not yet present in the mapping start from a count of zero.
    lookup = mapping.get
    for item in iterable:
        previous = lookup(item, 0)
        mapping[item] = previous + 1

# Prefer the C implementation when the accelerator module provides one;
# otherwise keep the pure-Python definition above.
try:
    from _collections import _count_elements
except ImportError:
    pass
396
Raymond Hettingerb8baf632009-01-14 02:20:07 +0000397class Counter(dict):
398 '''Dict subclass for counting hashable items. Sometimes called a bag
399 or multiset. Elements are stored as dictionary keys and their counts
400 are stored as dictionary values.
401
Raymond Hettinger00d43fd2011-01-02 08:03:33 +0000402 >>> c = Counter('abcdeabcdabcaba') # count elements from a string
Raymond Hettingerb8baf632009-01-14 02:20:07 +0000403
404 >>> c.most_common(3) # three most common elements
Raymond Hettinger00d43fd2011-01-02 08:03:33 +0000405 [('a', 5), ('b', 4), ('c', 3)]
Raymond Hettingerb8baf632009-01-14 02:20:07 +0000406 >>> sorted(c) # list all unique elements
Raymond Hettinger00d43fd2011-01-02 08:03:33 +0000407 ['a', 'b', 'c', 'd', 'e']
Raymond Hettingerb8baf632009-01-14 02:20:07 +0000408 >>> ''.join(sorted(c.elements())) # list elements with repetitions
Raymond Hettinger00d43fd2011-01-02 08:03:33 +0000409 'aaaaabbbbcccdde'
Raymond Hettingerb8baf632009-01-14 02:20:07 +0000410 >>> sum(c.values()) # total of all counts
Raymond Hettinger00d43fd2011-01-02 08:03:33 +0000411 15
Raymond Hettingerb8baf632009-01-14 02:20:07 +0000412
413 >>> c['a'] # count of letter 'a'
414 5
415 >>> for elem in 'shazam': # update counts from an iterable
416 ... c[elem] += 1 # by adding 1 to each element's count
417 >>> c['a'] # now there are seven 'a'
418 7
Raymond Hettinger00d43fd2011-01-02 08:03:33 +0000419 >>> del c['b'] # remove all 'b'
420 >>> c['b'] # now there are zero 'b'
Raymond Hettingerb8baf632009-01-14 02:20:07 +0000421 0
422
423 >>> d = Counter('simsalabim') # make another counter
424 >>> c.update(d) # add in the second counter
425 >>> c['a'] # now there are nine 'a'
426 9
427
428 >>> c.clear() # empty the counter
429 >>> c
430 Counter()
431
432 Note: If a count is set to zero or reduced to zero, it will remain
433 in the counter until the entry is deleted or the counter is cleared:
434
435 >>> c = Counter('aaabbc')
436 >>> c['b'] -= 2 # reduce the count of 'b' by two
437 >>> c.most_common() # 'b' is still in, but its count is zero
438 [('a', 3), ('c', 1), ('b', 0)]
439
440 '''
441 # References:
442 # http://en.wikipedia.org/wiki/Multiset
443 # http://www.gnu.org/software/smalltalk/manual-base/html_node/Bag.html
444 # http://www.demo2s.com/Tutorial/Cpp/0380__set-multiset/Catalog0380__set-multiset.htm
445 # http://code.activestate.com/recipes/259174/
446 # Knuth, TAOCP Vol. II section 4.6.3
447
Raymond Hettinger4d2073a2009-01-20 03:41:22 +0000448 def __init__(self, iterable=None, **kwds):
Raymond Hettingerb8baf632009-01-14 02:20:07 +0000449 '''Create a new, empty Counter object. And if given, count elements
450 from an input iterable. Or, initialize the count from another mapping
451 of elements to their counts.
452
453 >>> c = Counter() # a new, empty counter
454 >>> c = Counter('gallahad') # a new counter from an iterable
455 >>> c = Counter({'a': 4, 'b': 2}) # a new counter from a mapping
Raymond Hettinger4d2073a2009-01-20 03:41:22 +0000456 >>> c = Counter(a=4, b=2) # a new counter from keyword args
Raymond Hettingerb8baf632009-01-14 02:20:07 +0000457
458 '''
Raymond Hettinger00d43fd2011-01-02 08:03:33 +0000459 super().__init__()
Raymond Hettinger4d2073a2009-01-20 03:41:22 +0000460 self.update(iterable, **kwds)
Raymond Hettingerb8baf632009-01-14 02:20:07 +0000461
462 def __missing__(self, key):
463 'The count of elements not in the Counter is zero.'
464 # Needed so that self[missing_item] does not raise KeyError
465 return 0
466
467 def most_common(self, n=None):
468 '''List the n most common elements and their counts from the most
469 common to the least. If n is None, then list all element counts.
470
Raymond Hettinger00d43fd2011-01-02 08:03:33 +0000471 >>> Counter('abcdeabcdabcaba').most_common(3)
472 [('a', 5), ('b', 4), ('c', 3)]
Raymond Hettingerb8baf632009-01-14 02:20:07 +0000473
474 '''
475 # Emulate Bag.sortedByCount from Smalltalk
476 if n is None:
477 return sorted(self.items(), key=_itemgetter(1), reverse=True)
478 return _heapq.nlargest(n, self.items(), key=_itemgetter(1))
479
480 def elements(self):
481 '''Iterator over elements repeating each as many times as its count.
482
483 >>> c = Counter('ABCABC')
484 >>> sorted(c.elements())
485 ['A', 'A', 'B', 'B', 'C', 'C']
486
487 # Knuth's example for prime factors of 1836: 2**2 * 3**3 * 17**1
488 >>> prime_factors = Counter({2: 2, 3: 3, 17: 1})
489 >>> product = 1
490 >>> for factor in prime_factors.elements(): # loop over factors
491 ... product *= factor # and multiply them
492 >>> product
493 1836
494
495 Note, if an element's count has been set to zero or is a negative
496 number, elements() will ignore it.
497
498 '''
499 # Emulate Bag.do from Smalltalk and Multiset.begin from C++.
500 return _chain.from_iterable(_starmap(_repeat, self.items()))
501
502 # Override dict methods where necessary
503
504 @classmethod
505 def fromkeys(cls, iterable, v=None):
506 # There is no equivalent method for counters because setting v=1
507 # means that no element can have a count greater than one.
508 raise NotImplementedError(
509 'Counter.fromkeys() is undefined. Use Counter(iterable) instead.')
510
Raymond Hettinger4d2073a2009-01-20 03:41:22 +0000511 def update(self, iterable=None, **kwds):
Raymond Hettingerb8baf632009-01-14 02:20:07 +0000512 '''Like dict.update() but add counts instead of replacing them.
513
514 Source can be an iterable, a dictionary, or another Counter instance.
515
516 >>> c = Counter('which')
517 >>> c.update('witch') # add elements from another iterable
518 >>> d = Counter('watch')
519 >>> c.update(d) # add elements from another counter
520 >>> c['h'] # four 'h' in which, witch, and watch
521 4
522
523 '''
524 # The regular dict.update() operation makes no sense here because the
525 # replace behavior results in the some of original untouched counts
526 # being mixed-in with all of the other counts for a mismash that
527 # doesn't have a straight-forward interpretation in most counting
Raymond Hettinger4d2073a2009-01-20 03:41:22 +0000528 # contexts. Instead, we implement straight-addition. Both the inputs
529 # and outputs are allowed to contain zero and negative counts.
Raymond Hettingerb8baf632009-01-14 02:20:07 +0000530
531 if iterable is not None:
532 if isinstance(iterable, Mapping):
Raymond Hettingerdd01f8f2009-01-22 09:09:55 +0000533 if self:
Raymond Hettingerf9092022009-06-29 18:30:43 +0000534 self_get = self.get
Raymond Hettingerdd01f8f2009-01-22 09:09:55 +0000535 for elem, count in iterable.items():
Raymond Hettingerf9092022009-06-29 18:30:43 +0000536 self[elem] = count + self_get(elem, 0)
Raymond Hettingerdd01f8f2009-01-22 09:09:55 +0000537 else:
Raymond Hettinger00d43fd2011-01-02 08:03:33 +0000538 super().update(iterable) # fast path when counter is empty
Raymond Hettingerb8baf632009-01-14 02:20:07 +0000539 else:
Raymond Hettinger96f34102010-12-15 16:30:37 +0000540 _count_elements(self, iterable)
Raymond Hettinger4d2073a2009-01-20 03:41:22 +0000541 if kwds:
542 self.update(kwds)
Raymond Hettingerb8baf632009-01-14 02:20:07 +0000543
Raymond Hettinger9c01e442010-04-03 10:32:58 +0000544 def subtract(self, iterable=None, **kwds):
545 '''Like dict.update() but subtracts counts instead of replacing them.
546 Counts can be reduced below zero. Both the inputs and outputs are
547 allowed to contain zero and negative counts.
548
549 Source can be an iterable, a dictionary, or another Counter instance.
550
551 >>> c = Counter('which')
552 >>> c.subtract('witch') # subtract elements from another iterable
553 >>> c.subtract(Counter('watch')) # subtract elements from another counter
554 >>> c['h'] # 2 in which, minus 1 in witch, minus 1 in watch
555 0
556 >>> c['w'] # 1 in which, minus 1 in witch, minus 1 in watch
557 -1
558
559 '''
560 if iterable is not None:
Raymond Hettingerfc3c9cd2010-04-11 20:41:56 +0000561 self_get = self.get
Raymond Hettinger9c01e442010-04-03 10:32:58 +0000562 if isinstance(iterable, Mapping):
Raymond Hettinger9c01e442010-04-03 10:32:58 +0000563 for elem, count in iterable.items():
564 self[elem] = self_get(elem, 0) - count
565 else:
Raymond Hettinger9c01e442010-04-03 10:32:58 +0000566 for elem in iterable:
567 self[elem] = self_get(elem, 0) - 1
568 if kwds:
569 self.subtract(kwds)
570
Raymond Hettingerb8baf632009-01-14 02:20:07 +0000571 def copy(self):
Raymond Hettinger1c746c22011-04-15 13:16:46 -0700572 'Return a shallow copy.'
573 return self.__class__(self)
Raymond Hettingerb8baf632009-01-14 02:20:07 +0000574
Raymond Hettingerff728162011-01-03 02:44:14 +0000575 def __reduce__(self):
576 return self.__class__, (dict(self),)
577
Raymond Hettinger4d2073a2009-01-20 03:41:22 +0000578 def __delitem__(self, elem):
579 'Like dict.__delitem__() but does not raise KeyError for missing values.'
580 if elem in self:
Raymond Hettinger00d43fd2011-01-02 08:03:33 +0000581 super().__delitem__(elem)
Raymond Hettinger4d2073a2009-01-20 03:41:22 +0000582
Raymond Hettingerb8baf632009-01-14 02:20:07 +0000583 def __repr__(self):
584 if not self:
585 return '%s()' % self.__class__.__name__
586 items = ', '.join(map('%r: %r'.__mod__, self.most_common()))
587 return '%s({%s})' % (self.__class__.__name__, items)
588
Raymond Hettinger4d2073a2009-01-20 03:41:22 +0000589 # Multiset-style mathematical operations discussed in:
590 # Knuth TAOCP Volume II section 4.6.3 exercise 19
591 # and at http://en.wikipedia.org/wiki/Multiset
592 #
Raymond Hettinger4d2073a2009-01-20 03:41:22 +0000593 # Outputs guaranteed to only include positive counts.
594 #
595 # To strip negative and zero counts, add-in an empty counter:
596 # c += Counter()
597
598 def __add__(self, other):
599 '''Add counts from two counters.
600
601 >>> Counter('abbb') + Counter('bcc')
602 Counter({'b': 4, 'c': 2, 'a': 1})
603
604 '''
605 if not isinstance(other, Counter):
606 return NotImplemented
607 result = Counter()
Raymond Hettinger2876a8c2011-04-17 19:46:46 -0700608 for elem, count in self.items():
609 newcount = count + other[elem]
Raymond Hettinger4d2073a2009-01-20 03:41:22 +0000610 if newcount > 0:
611 result[elem] = newcount
Raymond Hettinger2876a8c2011-04-17 19:46:46 -0700612 for elem, count in other.items():
613 if elem not in self and count > 0:
614 result[elem] = count
Raymond Hettinger4d2073a2009-01-20 03:41:22 +0000615 return result
616
def __sub__(self, other):
    '''Return a new counter with the counts of *other* subtracted from *self*.

    Only elements whose resulting count is positive appear in the result.

    >>> Counter('abbbc') - Counter('bccd')
    Counter({'b': 2, 'a': 1})

    '''
    if not isinstance(other, Counter):
        return NotImplemented
    difference = Counter()
    for key, mine in self.items():
        remaining = mine - other[key]
        if remaining > 0:
            difference[key] = remaining
    # A negative count found only in *other* turns positive when it is
    # subtracted from the implicit zero on the left-hand side.
    for key, theirs in other.items():
        if key in self:
            continue
        if theirs < 0:
            difference[key] = 0 - theirs
    return difference
635
def __or__(self, other):
    '''Return a new counter holding, per element, the larger of the two counts.

    Only elements whose resulting count is positive appear in the result.

    >>> Counter('abbb') | Counter('bcc')
    Counter({'b': 3, 'c': 2, 'a': 1})

    '''
    if not isinstance(other, Counter):
        return NotImplemented
    union = Counter()
    for key, mine in self.items():
        theirs = other[key]
        if mine < theirs:
            larger = theirs
        else:
            larger = mine
        if larger > 0:
            union[key] = larger
    # Elements found only in *other* are carried over when positive.
    for key, theirs in other.items():
        if key in self:
            continue
        if theirs > 0:
            union[key] = theirs
    return union
655
def __and__(self, other):
    '''Return a new counter holding, per element, the smaller of the two counts.

    Only elements whose resulting count is positive appear in the result.

    >>> Counter('abbb') & Counter('bcc')
    Counter({'b': 1})

    '''
    if not isinstance(other, Counter):
        return NotImplemented
    common = Counter()
    for key, mine in self.items():
        theirs = other[key]
        if mine < theirs:
            smaller = mine
        else:
            smaller = theirs
        if smaller > 0:
            common[key] = smaller
    return common
672
Guido van Rossumd8faa362007-04-27 19:54:29 +0000673
Raymond Hettingere6603602011-02-21 19:38:53 +0000674########################################################################
675### ChainMap (helper for configparser)
676########################################################################
677
class _ChainMap(MutableMapping):
    ''' Present several dicts (or other mappings) as one updateable view.

    The wrapped mappings live in a list exposed as the public *maps*
    attribute, which can be accessed or updated directly.  The instance
    keeps no other state.

    A lookup tries each mapping in turn and stops at the first one holding
    the key.  Writes, updates, and deletions touch only the first mapping.

    '''

    def __init__(self, *maps):
        '''Store the given mappings in *maps*.
        When called without arguments, *maps* holds one empty dictionary.

        '''
        layers = list(maps)
        if not layers:
            layers = [{}]               # always at least one map
        self.maps = layers

    def __missing__(self, key):
        raise KeyError(key)

    def __getitem__(self, key):
        for layer in self.maps:
            try:
                # can't use 'key in mapping' with defaultdict
                value = layer[key]
            except KeyError:
                continue
            else:
                return value
        # support subclasses that define __missing__
        return self.__missing__(key)

    def get(self, key, default=None):
        if key in self:
            return self[key]
        return default

    def __len__(self):
        # reuses stored hash values if possible
        distinct_keys = set().union(*self.maps)
        return len(distinct_keys)

    def __iter__(self):
        distinct_keys = set().union(*self.maps)
        return iter(distinct_keys)

    def __contains__(self, key):
        for layer in self.maps:
            if key in layer:
                return True
        return False

    def __bool__(self):
        for layer in self.maps:
            if layer:
                return True
        return False

    @_recursive_repr()
    def __repr__(self):
        shown = ', '.join(repr(layer) for layer in self.maps)
        return '{}({})'.format(self.__class__.__name__, shown)

    @classmethod
    def fromkeys(cls, iterable, *args):
        'Build a ChainMap around one dict made by dict.fromkeys() from the iterable.'
        seed = dict.fromkeys(iterable, *args)
        return cls(seed)

    def copy(self):
        'New ChainMap or subclass with a new copy of maps[0] and refs to maps[1:]'
        first_copy = self.maps[0].copy()
        return self.__class__(first_copy, *self.maps[1:])

    __copy__ = copy

    def new_child(self):                # like Django's Context.push()
        'New ChainMap whose maps are a fresh dict followed by all current maps.'
        return self.__class__({}, *self.maps)

    @property
    def parents(self):                  # like Django's Context.pop()
        'New ChainMap built from maps[1:].'
        rest = self.maps[1:]
        return self.__class__(*rest)

    def __setitem__(self, key, value):
        self.maps[0][key] = value

    def __delitem__(self, key):
        try:
            del self.maps[0][key]
        except KeyError:
            raise KeyError('Key not found in the first mapping: {!r}'.format(key))

    def popitem(self):
        'Remove and return an item pair from maps[0]. Raise KeyError if maps[0] is empty.'
        try:
            return self.maps[0].popitem()
        except KeyError:
            raise KeyError('No keys found in the first mapping.')

    def pop(self, key, *args):
        'Remove *key* from maps[0] and return its value. Raise KeyError if *key* not in maps[0].'
        try:
            return self.maps[0].pop(key, *args)
        except KeyError:
            raise KeyError('Key not found in the first mapping: {!r}'.format(key))

    def clear(self):
        'Empty maps[0]; maps[1:] are left untouched.'
        self.maps[0].clear()
775
776
Raymond Hettinger48b8b662008-02-05 01:53:00 +0000777################################################################################
778### UserDict
779################################################################################
Guido van Rossumd8faa362007-04-27 19:54:29 +0000780
class UserDict(MutableMapping):
    'Mapping wrapper that keeps its contents in the public *data* dict.'

    # Start by filling-out the abstract methods
    def __init__(self, dict=None, **kwargs):
        self.data = {}
        if dict is not None:
            self.update(dict)
        if kwargs:
            self.update(kwargs)

    def __len__(self):
        return len(self.data)

    def __getitem__(self, key):
        if key in self.data:
            return self.data[key]
        # Fall back to a class-level __missing__ hook when one exists.
        cls = self.__class__
        if not hasattr(cls, "__missing__"):
            raise KeyError(key)
        return cls.__missing__(self, key)

    def __setitem__(self, key, item):
        self.data[key] = item

    def __delitem__(self, key):
        del self.data[key]

    def __iter__(self):
        return iter(self.data)

    # Modify __contains__ to work correctly when __missing__ is present
    def __contains__(self, key):
        return key in self.data

    # Now, add the methods in dicts but not in MutableMapping
    def __repr__(self):
        return repr(self.data)

    def copy(self):
        if self.__class__ is UserDict:
            return UserDict(self.data.copy())
        import copy
        # Copy the instance while it temporarily holds an empty dict, then
        # refill the duplicate from self once the real data is restored.
        saved = self.data
        try:
            self.data = {}
            duplicate = copy.copy(self)
        finally:
            self.data = saved
        duplicate.update(self)
        return duplicate

    @classmethod
    def fromkeys(cls, iterable, value=None):
        new = cls()
        for key in iterable:
            new[key] = value
        return new
826
Raymond Hettinger48b8b662008-02-05 01:53:00 +0000827
828
829################################################################################
Raymond Hettinger53dbe392008-02-12 20:03:09 +0000830### UserList
831################################################################################
832
class UserList(MutableSequence):
    """A more or less complete user-defined wrapper around list objects.

    The wrapped list is kept in the public ``data`` attribute.  Operations
    that build a new sequence (``+``, ``*`` and slicing) return an instance
    of the receiver's class.
    """
    def __init__(self, initlist=None):
        """Fill ``data`` with a copy of the items of *initlist*, if given."""
        self.data = []
        if initlist is not None:
            # XXX should this accept an arbitrary sequence?
            if type(initlist) == type(self.data):
                self.data[:] = initlist
            elif isinstance(initlist, UserList):
                self.data[:] = initlist.data[:]
            else:
                self.data = list(initlist)
    def __repr__(self): return repr(self.data)
    # Comparisons unwrap another UserList so that the two underlying lists
    # are compared; any other operand is compared against ``data`` as-is.
    def __lt__(self, other): return self.data <  self.__cast(other)
    def __le__(self, other): return self.data <= self.__cast(other)
    def __eq__(self, other): return self.data == self.__cast(other)
    def __ne__(self, other): return self.data != self.__cast(other)
    def __gt__(self, other): return self.data >  self.__cast(other)
    def __ge__(self, other): return self.data >= self.__cast(other)
    def __cast(self, other):
        """Return ``other.data`` for a UserList, otherwise *other* unchanged."""
        return other.data if isinstance(other, UserList) else other
    def __contains__(self, item): return item in self.data
    def __len__(self): return len(self.data)
    def __getitem__(self, i):
        """Return the item at index *i*, or a new instance for a slice."""
        # A slice builds a new sequence, so wrap it in the receiver's class
        # just as __add__ and __mul__ do instead of leaking a bare list.
        if isinstance(i, slice):
            return self.__class__(self.data[i])
        return self.data[i]
    def __setitem__(self, i, item): self.data[i] = item
    def __delitem__(self, i): del self.data[i]
    def __add__(self, other):
        """Return a new instance holding ``data`` followed by *other*'s items."""
        if isinstance(other, UserList):
            return self.__class__(self.data + other.data)
        elif isinstance(other, type(self.data)):
            return self.__class__(self.data + other)
        return self.__class__(self.data + list(other))
    def __radd__(self, other):
        """Return a new instance holding *other*'s items followed by ``data``."""
        if isinstance(other, UserList):
            return self.__class__(other.data + self.data)
        elif isinstance(other, type(self.data)):
            return self.__class__(other + self.data)
        return self.__class__(list(other) + self.data)
    def __iadd__(self, other):
        """Extend ``data`` in place with *other*'s items and return self."""
        if isinstance(other, UserList):
            self.data += other.data
        elif isinstance(other, type(self.data)):
            self.data += other
        else:
            self.data += list(other)
        return self
    def __mul__(self, n):
        """Return a new instance holding ``data`` repeated *n* times."""
        return self.__class__(self.data*n)
    __rmul__ = __mul__
    def __imul__(self, n):
        """Repeat ``data`` in place *n* times and return self."""
        self.data *= n
        return self
    # The remaining methods delegate straight to the wrapped list.
    def append(self, item): self.data.append(item)
    def insert(self, i, item): self.data.insert(i, item)
    def pop(self, i=-1): return self.data.pop(i)
    def remove(self, item): self.data.remove(item)
    def count(self, item): return self.data.count(item)
    def index(self, item, *args): return self.data.index(item, *args)
    def reverse(self): self.data.reverse()
    def sort(self, *args, **kwds): self.data.sort(*args, **kwds)
    def extend(self, other):
        """Append every item of *other* (a UserList or any iterable) to ``data``."""
        if isinstance(other, UserList):
            self.data.extend(other.data)
        else:
            self.data.extend(other)
898
899
900
901################################################################################
Raymond Hettingerb3a65f82008-02-21 22:11:37 +0000902### UserString
903################################################################################
904
class UserString(Sequence):
    """Wrapper around a str kept in the public ``data`` attribute.

    Most methods that transform the text (for example ``upper`` or
    ``strip``) return an instance of the receiver's class.  The remaining
    methods return whatever the underlying str method returns.
    """
    def __init__(self, seq):
        """Store *seq* as text: a str as-is, a UserString's data, else ``str(seq)``."""
        if isinstance(seq, str):
            self.data = seq
        elif isinstance(seq, UserString):
            self.data = seq.data[:]
        else:
            self.data = str(seq)
    def __str__(self): return str(self.data)
    def __repr__(self): return repr(self.data)
    def __int__(self): return int(self.data)
    def __float__(self): return float(self.data)
    def __complex__(self): return complex(self.data)
    def __hash__(self): return hash(self.data)

    # Comparisons unwrap another UserString so the underlying strs are
    # compared; any other operand is compared against ``data`` directly.
    def __eq__(self, string):
        if isinstance(string, UserString):
            return self.data == string.data
        return self.data == string
    def __ne__(self, string):
        if isinstance(string, UserString):
            return self.data != string.data
        return self.data != string
    def __lt__(self, string):
        if isinstance(string, UserString):
            return self.data < string.data
        return self.data < string
    def __le__(self, string):
        if isinstance(string, UserString):
            return self.data <= string.data
        return self.data <= string
    def __gt__(self, string):
        if isinstance(string, UserString):
            return self.data > string.data
        return self.data > string
    def __ge__(self, string):
        if isinstance(string, UserString):
            return self.data >= string.data
        return self.data >= string

    def __contains__(self, char):
        if isinstance(char, UserString):
            char = char.data
        return char in self.data

    def __len__(self): return len(self.data)
    def __getitem__(self, index): return self.__class__(self.data[index])
    def __add__(self, other):
        """Return a new instance holding ``data`` followed by the text of *other*."""
        if isinstance(other, UserString):
            return self.__class__(self.data + other.data)
        elif isinstance(other, str):
            return self.__class__(self.data + other)
        return self.__class__(self.data + str(other))
    def __radd__(self, other):
        """Return a new instance holding the text of *other* followed by ``data``."""
        if isinstance(other, str):
            return self.__class__(other + self.data)
        return self.__class__(str(other) + self.data)
    def __mul__(self, n):
        return self.__class__(self.data*n)
    __rmul__ = __mul__
    def __mod__(self, args):
        return self.__class__(self.data % args)

    # the following methods are defined in alphabetical order:
    def capitalize(self): return self.__class__(self.data.capitalize())
    def center(self, width, *args):
        return self.__class__(self.data.center(width, *args))
    def count(self, sub, start=0, end=_sys.maxsize):
        if isinstance(sub, UserString):
            sub = sub.data
        return self.data.count(sub, start, end)
    def encode(self, encoding=None, errors=None):
        """Return the text encoded as bytes.

        A false *encoding* selects 'utf-8' and a false *errors* selects
        'strict'.
        """
        # The result must be returned as-is: wrapping it in self.__class__
        # would store str(bytes), i.e. the "b'...'" text, not the encoding.
        return self.data.encode(encoding or 'utf-8', errors or 'strict')
    def endswith(self, suffix, start=0, end=_sys.maxsize):
        return self.data.endswith(suffix, start, end)
    def expandtabs(self, tabsize=8):
        return self.__class__(self.data.expandtabs(tabsize))
    def find(self, sub, start=0, end=_sys.maxsize):
        if isinstance(sub, UserString):
            sub = sub.data
        return self.data.find(sub, start, end)
    def format(self, *args, **kwds):
        return self.data.format(*args, **kwds)
    def index(self, sub, start=0, end=_sys.maxsize):
        # Unwrap a UserString argument, as count(), find() and rfind() do.
        if isinstance(sub, UserString):
            sub = sub.data
        return self.data.index(sub, start, end)
    def isalpha(self): return self.data.isalpha()
    def isalnum(self): return self.data.isalnum()
    def isdecimal(self): return self.data.isdecimal()
    def isdigit(self): return self.data.isdigit()
    def isidentifier(self): return self.data.isidentifier()
    def islower(self): return self.data.islower()
    def isnumeric(self): return self.data.isnumeric()
    def isspace(self): return self.data.isspace()
    def istitle(self): return self.data.istitle()
    def isupper(self): return self.data.isupper()
    def join(self, seq): return self.data.join(seq)
    def ljust(self, width, *args):
        return self.__class__(self.data.ljust(width, *args))
    def lower(self): return self.__class__(self.data.lower())
    def lstrip(self, chars=None): return self.__class__(self.data.lstrip(chars))
    def partition(self, sep):
        return self.data.partition(sep)
    def replace(self, old, new, maxsplit=-1):
        if isinstance(old, UserString):
            old = old.data
        if isinstance(new, UserString):
            new = new.data
        return self.__class__(self.data.replace(old, new, maxsplit))
    def rfind(self, sub, start=0, end=_sys.maxsize):
        if isinstance(sub, UserString):
            sub = sub.data
        return self.data.rfind(sub, start, end)
    def rindex(self, sub, start=0, end=_sys.maxsize):
        # Unwrap a UserString argument, as count(), find() and rfind() do.
        if isinstance(sub, UserString):
            sub = sub.data
        return self.data.rindex(sub, start, end)
    def rjust(self, width, *args):
        return self.__class__(self.data.rjust(width, *args))
    def rpartition(self, sep):
        return self.data.rpartition(sep)
    def rstrip(self, chars=None):
        return self.__class__(self.data.rstrip(chars))
    def split(self, sep=None, maxsplit=-1):
        return self.data.split(sep, maxsplit)
    def rsplit(self, sep=None, maxsplit=-1):
        return self.data.rsplit(sep, maxsplit)
    def splitlines(self, keepends=0): return self.data.splitlines(keepends)
    def startswith(self, prefix, start=0, end=_sys.maxsize):
        return self.data.startswith(prefix, start, end)
    def strip(self, chars=None): return self.__class__(self.data.strip(chars))
    def swapcase(self): return self.__class__(self.data.swapcase())
    def title(self): return self.__class__(self.data.title())
    def translate(self, *args):
        return self.__class__(self.data.translate(*args))
    def upper(self): return self.__class__(self.data.upper())
    def zfill(self, width): return self.__class__(self.data.zfill(width))
1043
1044
1045
1046################################################################################
Raymond Hettinger48b8b662008-02-05 01:53:00 +00001047### Simple tests
1048################################################################################
Guido van Rossumd8faa362007-04-27 19:54:29 +00001049
if __name__ == '__main__':
    # A namedtuple instance must survive a pickle round trip unchanged.
    from pickle import dumps, loads
    Point = namedtuple('Point', 'x, y', True)
    p = Point(x=10, y=20)
    restored = loads(dumps(p))
    assert p == restored

    # Subclassing a namedtuple allows adding and overriding methods.
    class Point(namedtuple('Point', 'x y')):
        __slots__ = ()

        @property
        def hypot(self):
            squared = self.x ** 2 + self.y ** 2
            return squared ** 0.5

        def __str__(self):
            values = (self.x, self.y, self.hypot)
            return 'Point: x=%6.3f y=%6.3f hypot=%6.3f' % values

    samples = (Point(3, 4), Point(14, 5 / 7.))
    for p in samples:
        print(p)

    class Point(namedtuple('Point', 'x y')):
        'Point class with optimized _make() and _replace() without error-checking'
        __slots__ = ()
        _make = classmethod(tuple.__new__)

        def _replace(self, _map=map, **kwds):
            # Take each field from kwds, falling back to the current value.
            return self._make(_map(kwds.get, ('x', 'y'), self))

    print(Point(11, 22)._replace(x=100))

    # Extend an existing field list to define a related type.
    Point3D = namedtuple('Point3D', Point._fields + ('z',))
    print(Point3D.__doc__)

    # Finally run the doctests embedded in this module.
    import doctest
    TestResults = namedtuple('TestResults', 'failed attempted')
    outcome = doctest.testmod()
    print(TestResults(*outcome))