blob: b035cbb809f848a29e3d82bcb879e89f1b23c1c2 [file] [log] [blame]
Eric V. Smith2a7bacb2018-05-15 22:44:27 -04001import re
Eric V. Smithf0db54a2017-12-04 16:58:55 -05002import sys
Eric V. Smithf96ddad2018-03-24 17:20:26 -04003import copy
Eric V. Smithf0db54a2017-12-04 16:58:55 -05004import types
Eric V. Smithf0db54a2017-12-04 16:58:55 -05005import inspect
Eric V. Smith4e812962018-05-16 11:31:29 -04006import keyword
Vadim Pushtaev4d12e4d2018-08-12 14:46:05 +03007import builtins
Srinivas Thatiparthy (శ్రీనివాస్ తాటిపర్తి)dd13c882018-10-19 22:24:50 +05308import functools
9import _thread
10
Eric V. Smithf0db54a2017-12-04 16:58:55 -050011
# Names exported by "from dataclasses import *".
__all__ = [
    'dataclass',
    'field',
    'Field',
    'FrozenInstanceError',
    'InitVar',
    'MISSING',

    # Helper functions.
    'fields',
    'asdict',
    'astuple',
    'make_dataclass',
    'replace',
    'is_dataclass',
]
27
Eric V. Smithea8fc522018-01-27 19:07:40 -050028# Conditions for adding methods. The boxes indicate what action the
Eric V. Smithf8e75492018-05-16 05:14:53 -040029# dataclass decorator takes. For all of these tables, when I talk
30# about init=, repr=, eq=, order=, unsafe_hash=, or frozen=, I'm
31# referring to the arguments to the @dataclass decorator. When
32# checking if a dunder method already exists, I mean check for an
33# entry in the class's __dict__. I never check to see if an attribute
34# is defined in a base class.
Eric V. Smithea8fc522018-01-27 19:07:40 -050035
36# Key:
37# +=========+=========================================+
38# + Value | Meaning |
39# +=========+=========================================+
40# | <blank> | No action: no method is added. |
41# +---------+-----------------------------------------+
42# | add | Generated method is added. |
43# +---------+-----------------------------------------+
Eric V. Smithea8fc522018-01-27 19:07:40 -050044# | raise | TypeError is raised. |
45# +---------+-----------------------------------------+
46# | None | Attribute is set to None. |
47# +=========+=========================================+
48
49# __init__
50#
51# +--- init= parameter
52# |
53# v | | |
54# | no | yes | <--- class has __init__ in __dict__?
55# +=======+=======+=======+
56# | False | | |
57# +-------+-------+-------+
58# | True | add | | <- the default
59# +=======+=======+=======+
60
61# __repr__
62#
63# +--- repr= parameter
64# |
65# v | | |
66# | no | yes | <--- class has __repr__ in __dict__?
67# +=======+=======+=======+
68# | False | | |
69# +-------+-------+-------+
70# | True | add | | <- the default
71# +=======+=======+=======+
72
73
74# __setattr__
75# __delattr__
76#
77# +--- frozen= parameter
78# |
79# v | | |
80# | no | yes | <--- class has __setattr__ or __delattr__ in __dict__?
81# +=======+=======+=======+
82# | False | | | <- the default
83# +-------+-------+-------+
84# | True | add | raise |
85# +=======+=======+=======+
86# Raise because not adding these methods would break the "frozen-ness"
Eric V. Smithf8e75492018-05-16 05:14:53 -040087# of the class.
Eric V. Smithea8fc522018-01-27 19:07:40 -050088
89# __eq__
90#
91# +--- eq= parameter
92# |
93# v | | |
94# | no | yes | <--- class has __eq__ in __dict__?
95# +=======+=======+=======+
96# | False | | |
97# +-------+-------+-------+
98# | True | add | | <- the default
99# +=======+=======+=======+
100
101# __lt__
102# __le__
103# __gt__
104# __ge__
105#
106# +--- order= parameter
107# |
108# v | | |
109# | no | yes | <--- class has any comparison method in __dict__?
110# +=======+=======+=======+
111# | False | | | <- the default
112# +-------+-------+-------+
113# | True | add | raise |
114# +=======+=======+=======+
115# Raise because to allow this case would interfere with using
Eric V. Smithf8e75492018-05-16 05:14:53 -0400116# functools.total_ordering.
Eric V. Smithea8fc522018-01-27 19:07:40 -0500117
118# __hash__
119
Eric V. Smithdbf9cff2018-02-25 21:30:17 -0500120# +------------------- unsafe_hash= parameter
121# | +----------- eq= parameter
122# | | +--- frozen= parameter
123# | | |
124# v v v | | |
125# | no | yes | <--- class has explicitly defined __hash__
126# +=======+=======+=======+========+========+
127# | False | False | False | | | No __eq__, use the base class __hash__
128# +-------+-------+-------+--------+--------+
129# | False | False | True | | | No __eq__, use the base class __hash__
130# +-------+-------+-------+--------+--------+
131# | False | True | False | None | | <-- the default, not hashable
132# +-------+-------+-------+--------+--------+
133# | False | True | True | add | | Frozen, so hashable, allows override
134# +-------+-------+-------+--------+--------+
135# | True | False | False | add | raise | Has no __eq__, but hashable
136# +-------+-------+-------+--------+--------+
137# | True | False | True | add | raise | Has no __eq__, but hashable
138# +-------+-------+-------+--------+--------+
139# | True | True | False | add | raise | Not frozen, but hashable
140# +-------+-------+-------+--------+--------+
141# | True | True | True | add | raise | Frozen, so hashable
142# +=======+=======+=======+========+========+
Eric V. Smithea8fc522018-01-27 19:07:40 -0500143# For boxes that are blank, __hash__ is untouched and therefore
Eric V. Smithf8e75492018-05-16 05:14:53 -0400144# inherited from the base class. If the base is object, then
145# id-based hashing is used.
146#
Eric V. Smithf96ddad2018-03-24 17:20:26 -0400147# Note that a class may already have __hash__=None if it specified an
Eric V. Smithf8e75492018-05-16 05:14:53 -0400148# __eq__ method in the class body (not one that was created by
149# @dataclass).
150#
Eric V. Smithdbf9cff2018-02-25 21:30:17 -0500151# See _hash_action (below) for a coded version of this table.
Eric V. Smithea8fc522018-01-27 19:07:40 -0500152
153
class FrozenInstanceError(AttributeError):
    """Raised when an attempt is made to modify a frozen class."""
156
class _HAS_DEFAULT_FACTORY_CLASS:
    """Type of the sentinel that stands in for "a default factory is used".

    The sentinel is used as a default value, so its repr() is what
    shows up in the signature of a dataclass constructor; hence the
    readable '<factory>' text.
    """

    def __repr__(self):
        return '<factory>'


# The one shared sentinel instance.
_HAS_DEFAULT_FACTORY = _HAS_DEFAULT_FACTORY_CLASS()
164
class _MISSING_TYPE:
    """Type of the MISSING sentinel.

    A dedicated class is used (rather than a bare object()) so that
    the sentinel's repr names its type.
    """


# Sentinel used to detect whether a parameter was supplied or not.
MISSING = _MISSING_TYPE()
Eric V. Smithf0db54a2017-12-04 16:58:55 -0500170
# Per-field metadata is unused most of the time, so a single empty,
# read-only mapping is created once and shared among all fields.
_EMPTY_METADATA = types.MappingProxyType({})
174
class _FIELD_BASE:
    """Marker object identifying a kind of field or pseudo-field.

    Each marker only carries a name, which is also used as its repr.
    """

    def __init__(self, name):
        self.name = name

    def __repr__(self):
        return self.name


# The three markers: a regular field, a ClassVar pseudo-field and an
# InitVar pseudo-field.
_FIELD, _FIELD_CLASSVAR, _FIELD_INITVAR = (
    _FIELD_BASE(label)
    for label in ('_FIELD', '_FIELD_CLASSVAR', '_FIELD_INITVAR')
)
Eric V. Smithf0db54a2017-12-04 16:58:55 -0500184
# Class attribute under which the Field objects are stored.  Its
# presence is also what marks a class as a Data Class.
_FIELDS = '__dataclass_fields__'

# Class attribute under which the parameters given to @dataclass are
# stored.
_PARAMS = '__dataclass_params__'

# Name of the optional method that, if it exists, is called at the end
# of __init__.
_POST_INIT_NAME = '__post_init__'
196
# Pattern that a string annotation must match to be considered for
# ClassVar or InitVar detection.  It accepts "identifier.identifier["
# or "identifier[": group 1 is the optional module part, group 2 is
# the identifier itself.
# See https://bugs.python.org/issue33453 for details.
_MODULE_IDENTIFIER_RE = re.compile(r'^(?:\s*(\w+)\s*\.)?\s*(\w+)')
Eric V. Smithf0db54a2017-12-04 16:58:55 -0500201
class _InitVarMeta(type):
    """Metaclass that makes ``InitVar[T]`` build an InitVar instance."""

    def __getitem__(self, params):
        return InitVar(params)


class InitVar(metaclass=_InitVarMeta):
    """Annotation wrapper marking a pseudo-field as init-only.

    ``InitVar[T]`` creates an instance whose ``type`` attribute is T.
    """

    __slots__ = ('type', )

    def __init__(self, type):
        self.type = type

    def __repr__(self):
        # Only real classes are guaranteed to have __name__.  Other
        # objects that may be wrapped (typing constructs such as
        # List[int], or string annotations) fall back to their repr()
        # rather than raising AttributeError.
        if isinstance(self.type, type):
            type_name = self.type.__name__
        else:
            type_name = repr(self.type)
        return f'dataclasses.InitVar[{type_name}]'
Eric V. Smithf0db54a2017-12-04 16:58:55 -0500214
215
class Field:
    """Description of a single dataclass field.

    Instances are only ever created from within this module, and only
    by the field() function, although they are exposed externally as
    (conceptually) read-only objects.

    name and type are not known when the object is instantiated, so
    __init__ leaves them as None; they are filled in after the fact.
    By the time cls._FIELDS has been populated with Field objects,
    both will have been set.
    """

    __slots__ = (
        'name',
        'type',
        'default',
        'default_factory',
        'repr',
        'hash',
        'init',
        'compare',
        'metadata',
        '_field_type',  # Private: not to be used by user code.
    )

    def __init__(self, default, default_factory, init, repr, hash, compare,
                 metadata):
        self.name = None
        self.type = None
        self.default = default
        self.default_factory = default_factory
        self.init = init
        self.repr = repr
        self.hash = hash
        self.compare = compare
        # Wrap the metadata in a read-only view; when there is none,
        # reuse the shared empty mapping.
        if metadata is None:
            self.metadata = _EMPTY_METADATA
        else:
            self.metadata = types.MappingProxyType(metadata)
        self._field_type = None

    def __repr__(self):
        parts = [
            f'name={self.name!r}',
            f'type={self.type!r}',
            f'default={self.default!r}',
            f'default_factory={self.default_factory!r}',
            f'init={self.init!r}',
            f'repr={self.repr!r}',
            f'hash={self.hash!r}',
            f'compare={self.compare!r}',
            f'metadata={self.metadata!r}',
            f'_field_type={self._field_type}',
        ]
        return 'Field(' + ','.join(parts) + ')'

    # Support for the PEP 487 __set_name__ protocol when the default
    # value of a field is a descriptor.  For details on __set_name__,
    # see
    # https://www.python.org/dev/peps/pep-0487/#implementation-details.
    #
    # In _process_class this Field object is overwritten with the
    # default value, so the end result is a descriptor that had
    # __set_name__ called on it at the right time.
    def __set_name__(self, owner, name):
        # Look the hook up on the type of the default, as is done for
        # special methods, not on the default instance.
        set_name = getattr(type(self.default), '__set_name__', None)
        if not set_name:
            return
        # The default defines __set_name__: forward the call to it.
        set_name(self.default, owner, name)
Eric V. Smithde7a2f02018-03-26 13:29:16 -0400282
Eric V. Smithf0db54a2017-12-04 16:58:55 -0500283
class _DataclassParams:
    """Record of the arguments that were passed to @dataclass."""

    __slots__ = ('init', 'repr', 'eq', 'order', 'unsafe_hash', 'frozen')

    def __init__(self, init, repr, eq, order, unsafe_hash, frozen):
        self.init = init
        self.repr = repr
        self.eq = eq
        self.order = order
        self.unsafe_hash = unsafe_hash
        self.frozen = frozen

    def __repr__(self):
        parts = [
            f'init={self.init!r}',
            f'repr={self.repr!r}',
            f'eq={self.eq!r}',
            f'order={self.order!r}',
            f'unsafe_hash={self.unsafe_hash!r}',
            f'frozen={self.frozen!r}',
        ]
        return '_DataclassParams(' + ','.join(parts) + ')'
310
Eric V. Smithf96ddad2018-03-24 17:20:26 -0400311
# Field objects are created through this function rather than by
# exposing the Field constructor, so that a type checker can be told
# (via overloads) that the function's type depends on its parameters.
def field(*, default=MISSING, default_factory=MISSING, init=True, repr=True,
          hash=None, compare=True, metadata=None):
    """Return an object to identify dataclass fields.

    default is the default value of the field.  default_factory is a
    0-argument function called to initialize a field's value.  If init
    is True, the field will be a parameter to the class's __init__()
    function.  If repr is True, the field will be included in the
    object's repr().  If hash is True, the field will be included in
    the object's hash().  If compare is True, the field will be used
    in comparison functions.  metadata, if specified, must be a
    mapping which is stored but not otherwise examined by dataclass.

    It is an error to specify both default and default_factory.
    """
    has_default = default is not MISSING
    has_factory = default_factory is not MISSING
    if has_default and has_factory:
        raise ValueError('cannot specify both default and default_factory')
    return Field(default, default_factory, init, repr, hash, compare,
                 metadata)
335
336
def _tuple_str(obj_name, fields):
    """Return source text for a tuple of obj_name's field attributes.

    Each field contributes "obj_name.fieldname".  For fields named 'x'
    and 'y' and obj_name "self", the result is "(self.x,self.y,)".
    """
    # The 0-tuple has to be spelled without any comma.
    if not fields:
        return '()'
    members = [f'{obj_name}.{f.name}' for f in fields]
    # The trailing comma is always emitted; it is required when this
    # turns out to be a 1-tuple.
    return '(' + ','.join(members) + ',)'
347
348
# The logic below is copied from the "recursive_repr" function in the
# reprlib module, to avoid a dependency on it.
def _recursive_repr(user_function):
    """Decorator making a repr function return '...' on a recursive call."""
    # (object id, thread id) pairs for the repr calls in progress.
    active = set()

    @functools.wraps(user_function)
    def wrapper(self):
        token = (id(self), _thread.get_ident())
        if token in active:
            # Already computing the repr of this object in this thread.
            return '...'
        active.add(token)
        try:
            return user_function(self)
        finally:
            active.discard(token)

    return wrapper
368
369
def _create_fn(name, args, body, *, globals=None, locals=None,
               return_type=MISSING):
    """Build a function from source text and return it.

    name is the function name, args is an iterable of parameter
    strings and body is an iterable of source lines.  When return_type
    is given, it is used as the function's return annotation.

    Note that locals is mutated when exec() is called, and globals may
    gain a '__builtins__' entry.  Caller beware!  The only callers are
    internal to this module, so there are no external callers to worry
    about.
    """
    if locals is None:
        locals = {}
    # __builtins__ may be the "builtins" module or the value of its
    # "__dict__", so make sure "__builtins__" is the module.
    if globals is not None and '__builtins__' not in globals:
        globals['__builtins__'] = builtins

    if return_type is MISSING:
        return_annotation = ''
    else:
        # The annotation is referenced by name from the generated
        # source, so the object itself is placed in locals.
        locals['_return_type'] = return_type
        return_annotation = '->_return_type'

    params = ','.join(args)
    indented_body = '\n'.join(f' {line}' for line in body)

    # The text of the entire function.
    source = f'def {name}({params}){return_annotation}:\n{indented_body}'

    exec(source, globals, locals)
    return locals[name]
394
395
def _field_assign(frozen, name, value, self_name):
    """Return the source line that assigns value to the field name.

    A simple attribute assignment is used, except for a frozen class,
    where the assignment goes through object.__setattr__.

    self_name is what "self" is called in the generated function: it
    must not be hard-coded as "self", since that might be a field name.
    """
    if not frozen:
        return f'{self_name}.{name}={value}'
    return f'__builtins__.object.__setattr__({self_name},{name!r},{value})'
406
407
def _field_init(f, frozen, globals, self_name):
    """Return the line of the __init__ body that initializes field f.

    None is returned when no assignment statement is needed.  As a
    side effect, the field's default value or default factory (if any)
    is stored in globals under the name '_dflt_<fieldname>'.
    """
    default_name = f'_dflt_{f.name}'
    has_factory = f.default_factory is not MISSING

    if not has_factory and not f.init:
        # This field does not need initialization.  Signify that to
        # the caller by returning None.
        return None

    if has_factory:
        globals[default_name] = f.default_factory
        factory_call = f'{default_name}()'
        if f.init:
            # If a parameter is given, use it.  If not, call the
            # factory.
            value = (f'{factory_call} '
                     f'if {f.name} is _HAS_DEFAULT_FACTORY '
                     f'else {f.name}')
        else:
            # The field is not an __init__ parameter but has a default
            # factory, so it must be initialized here by calling the
            # factory: there's no other way to initialize it.
            #
            # For a field with default=defaultvalue, the class dict
            # just holds the default (cls.fieldname=defaultvalue).
            # That won't work for a default factory: it must be called
            # in __init__ and the result assigned to self.fieldname.
            # We can't fall back to the class dict's value, both
            # because it's not set, and because it might be different
            # per-class (which, after all, is why we have a factory
            # function!).
            value = factory_call
    else:
        # No default factory, and the field is an __init__ parameter:
        # assign from the parameter.  A plain default, if there is
        # one, is made available under default_name.
        if f.default is not MISSING:
            globals[default_name] = f.default
        value = f.name

    # Only test this now, so that the variables for the default have
    # been created.  However, return None to signify that no
    # assignment statement is generated for InitVars.
    if f._field_type is _FIELD_INITVAR:
        return None

    # Now, actually generate the field assignment.
    return _field_assign(frozen, f.name, value, self_name)
460
461
def _init_param(f):
    """Return the __init__ parameter string for field f.

    This is the equivalent of 'x:int=3', except that instead of 'int'
    a variable set to int is referenced, and instead of '3' a variable
    set to 3 is referenced.
    """
    if f.default is not MISSING:
        # There's a default; this is the name used to look it up.
        suffix = f'=_dflt_{f.name}'
    elif f.default_factory is not MISSING:
        # There's a factory function.  Set a marker.
        suffix = '=_HAS_DEFAULT_FACTORY'
    else:
        # Neither a default nor a default_factory: just output the
        # variable name and type.
        suffix = ''
    return f'{f.name}:_type_{f.name}{suffix}'
479
480
def _init_fn(fields, frozen, has_post_init, self_name):
    """Create and return the __init__ function for a dataclass.

    fields contains both real fields and InitVar pseudo-fields.
    self_name is the name given to the first parameter of the
    generated function.

    Raises TypeError if an __init__ field without a default follows
    one with a default.
    """
    # Fields without defaults must not follow fields with defaults.
    # This would be caught when exec-ing the function source code, but
    # catching it here gives a better error message, and future-proofs
    # us in case we build up the function using ast.
    seen_default = False
    for f in fields:
        # Only fields in the __init__ call are considered.
        if not f.init:
            continue
        if f.default is MISSING and f.default_factory is MISSING:
            if seen_default:
                raise TypeError(f'non-default argument {f.name!r} '
                                'follows default argument')
        else:
            seen_default = True

    globals = {'MISSING': MISSING,
               '_HAS_DEFAULT_FACTORY': _HAS_DEFAULT_FACTORY}

    # A None line means the field requires no initialization (it's a
    # pseudo-field); such lines are skipped.
    candidate_lines = (_field_init(f, frozen, globals, self_name)
                       for f in fields)
    body_lines = [line for line in candidate_lines if line]

    # Does this class have a post-init function?  If so it is called
    # last, with the InitVar pseudo-fields as arguments.
    if has_post_init:
        params_str = ','.join(f.name for f in fields
                              if f._field_type is _FIELD_INITVAR)
        body_lines.append(f'{self_name}.{_POST_INIT_NAME}({params_str})')

    # A function body cannot be empty.
    if not body_lines:
        body_lines = ['pass']

    # Parameter annotations refer to these names.
    locals = {f'_type_{f.name}': f.type for f in fields}

    params = [self_name]
    params.extend(_init_param(f) for f in fields if f.init)
    return _create_fn('__init__',
                      params,
                      body_lines,
                      locals=locals,
                      globals=globals,
                      return_type=None)
527
528
def _repr_fn(fields):
    """Create and return the __repr__ function for the given fields.

    The generated function returns the class's __qualname__ followed
    by "name=value" pairs in parentheses, and is wrapped so that a
    recursive call yields '...'.
    """
    # The doubled braces survive this f-string as single braces, so
    # they become replacement fields of the f-string in the generated
    # source.
    pairs = ', '.join(f"{f.name}={{self.{f.name}!r}}" for f in fields)
    body_line = 'return self.__class__.__qualname__ + f"(' + pairs + ')"'
    fn = _create_fn('__repr__', ('self',), [body_line])
    return _recursive_repr(fn)
Eric V. Smithf0db54a2017-12-04 16:58:55 -0500537
538
def _frozen_get_del_attr(cls, fields):
    """Return a (__setattr__, __delattr__) pair for a frozen class.

    The generated functions raise FrozenInstanceError when the
    instance's type is exactly cls or when the attribute name is one
    of the given fields; otherwise they defer to the next
    implementation after cls via super().
    """
    # XXX: globals is modified on the first call to _create_fn, then
    # the modified version is used in the second call.  Is this okay?
    globals = {'cls': cls,
               'FrozenInstanceError': FrozenInstanceError}

    if not fields:
        # Special case for the zero-length tuple.
        fields_str = '()'
    else:
        quoted_names = ','.join([repr(f.name) for f in fields])
        fields_str = '(' + quoted_names + ',)'

    # Both functions share the same guard condition.
    guard = f'if type(self) is cls or name in {fields_str}:'

    setattr_fn = _create_fn(
        '__setattr__',
        ('self', 'name', 'value'),
        (guard,
         ' raise FrozenInstanceError(f"cannot assign to field {name!r}")',
         'super(cls, self).__setattr__(name, value)'),
        globals=globals)
    delattr_fn = _create_fn(
        '__delattr__',
        ('self', 'name'),
        (guard,
         ' raise FrozenInstanceError(f"cannot delete field {name!r}")',
         'super(cls, self).__delattr__(name)'),
        globals=globals)
    return (setattr_fn, delattr_fn)
Eric V. Smithf0db54a2017-12-04 16:58:55 -0500562
563
def _cmp_fn(name, op, self_tuple, other_tuple):
    """Create and return the comparison function called name.

    If the fields in the object are named 'x' and 'y', then self_tuple
    is the string '(self.x,self.y)' and other_tuple is the string
    '(other.x,other.y)'.  The generated function compares the two
    tuples with op when both operands have exactly the same class, and
    returns NotImplemented otherwise.
    """
    body = [
        'if other.__class__ is self.__class__:',
        f' return {self_tuple}{op}{other_tuple}',
        'return NotImplemented',
    ]
    return _create_fn(name, ('self', 'other'), body)
575
576
def _hash_fn(fields):
    """Create and return a __hash__ that hashes a tuple of the fields."""
    hashed_tuple = _tuple_str('self', fields)
    body = [f'return hash({hashed_tuple})']
    return _create_fn('__hash__', ('self',), body)
582
583
def _is_classvar(a_type, typing):
    """Return True if a_type is ClassVar or a subscripted ClassVar.

    typing is the typing module, passed in by the caller.
    """
    if a_type is typing.ClassVar:
        return True
    # This test uses a typing internal class, but it's the best way to
    # test if this is a ClassVar.
    if type(a_type) is not typing._GenericAlias:
        return False
    return a_type.__origin__ is typing.ClassVar
Eric V. Smith2a7bacb2018-05-15 22:44:27 -0400590
591
def _is_initvar(a_type, dataclasses):
    """Return True if a_type is InitVar itself or an InitVar instance.

    dataclasses is the module we're checking against, which is the
    module we're currently in (dataclasses.py).
    """
    initvar = dataclasses.InitVar
    if a_type is initvar:
        return True
    return type(a_type) is initvar
Eric V. Smith2a7bacb2018-05-15 22:44:27 -0400597
598
def _is_type(annotation, cls, a_module, a_type, is_type_predicate):
    """Return True if a string annotation refers to a_type in a_module.

    For example, when checking that annotation denotes a ClassVar,
    a_module is typing and a_type is typing.ClassVar.

    - annotation is a string type annotation
    - cls is the class that this annotation was found in
    - a_module is the module we want to match
    - a_type is the type in that module we want to match
    - is_type_predicate is a function called with (obj, a_module)
      that determines if obj is of the desired type.

    False is returned when the annotation cannot be resolved,
    including when the module of cls is not present in sys.modules.
    """
    # It's possible to look up a_module given a_type, but it involves
    # looking in sys.modules (again!), and seems like a waste since
    # the caller already knows a_module.

    # Since this test does not do a local namespace lookup (and
    # instead only a module (global) lookup), there are some things it
    # gets wrong.

    # With string annotations, cv0 will be detected as a ClassVar:
    #   CV = ClassVar
    #   @dataclass
    #   class C0:
    #     cv0: CV

    # But in this example cv1 will not be detected as a ClassVar:
    #   @dataclass
    #   class C1:
    #     CV = ClassVar
    #     cv1: CV

    # In C1, the code in this function will look up "CV" in the module
    # and not find it, so it will not consider cv1 as a ClassVar.
    # This is a fairly obscure corner case, and the best way to fix it
    # would be to eval() the string "CV" with the correct global and
    # local namespaces.  However that would involve an eval() penalty
    # for every single field of every dataclass that's defined.  It
    # was judged not worth it.

    match = _MODULE_IDENTIFIER_RE.match(annotation)
    if not match:
        return False

    # The module the class was defined in.  It can be missing from
    # sys.modules; in that case nothing can be resolved, so report
    # "no match" instead of failing with AttributeError on None.
    module = sys.modules.get(cls.__module__)
    if module is None:
        return False

    ns = None
    module_name = match.group(1)
    if not module_name:
        # No module name, assume the class's module did
        # "from dataclasses import InitVar".
        ns = module.__dict__
    elif module.__dict__.get(module_name) is a_module:
        # module_name, looked up in the class's module, is the module
        # we want: resolve the identifier in a_type's own module.
        type_module = sys.modules.get(a_type.__module__)
        if type_module is not None:
            ns = type_module.__dict__

    return bool(ns and is_type_predicate(ns.get(match.group(2)), a_module))
656
657
def _get_field(cls, a_name, a_type):
    # Return a Field object for this field name and type.  ClassVars
    # and InitVars are also returned, but marked as such (see
    # f._field_type).
    #
    # cls is the class being processed, a_name is the annotated
    # attribute name and a_type is its annotation (an object or a
    # string).  Raises TypeError if a ClassVar or InitVar specifies a
    # default_factory, and ValueError if a regular field uses a list,
    # dict or set instance as its default.

    # If the default value isn't derived from Field, then it's only a
    # normal default value.  Convert it to a Field().
    default = getattr(cls, a_name, MISSING)
    if isinstance(default, Field):
        f = default
    else:
        if isinstance(default, types.MemberDescriptorType):
            # This is a field in __slots__, so it has no default value.
            default = MISSING
        f = field(default=default)

    # Only at this point do we know the name and the type.  Set them.
    f.name = a_name
    f.type = a_type

    # Assume it's a normal field until proven otherwise.  We're next
    # going to decide if it's a ClassVar or InitVar, everything else
    # is just a normal field.
    f._field_type = _FIELD

    # In addition to checking for actual types here, also check for
    # string annotations.  get_type_hints() won't always work for us
    # (see https://github.com/python/typing/issues/508 for example),
    # plus it's expensive and would require an eval for every string
    # annotation.  So, make a best effort to see if this is a ClassVar
    # or InitVar using regex's and checking that the thing referenced
    # is actually of the correct type.

    # For the complete discussion, see https://bugs.python.org/issue33453

    # If typing has not been imported, then it's impossible for any
    # annotation to be a ClassVar.  So, only look for ClassVar if
    # typing has been imported by any module (not necessarily cls's
    # module).
    typing = sys.modules.get('typing')
    if typing:
        if (_is_classvar(a_type, typing)
            or (isinstance(f.type, str)
                and _is_type(f.type, cls, typing, typing.ClassVar,
                             _is_classvar))):
            f._field_type = _FIELD_CLASSVAR

    # If the type is InitVar, or if it's a matching string annotation,
    # then it's an InitVar.
    if f._field_type is _FIELD:
        # The module we're checking against is the module we're
        # currently in (dataclasses.py).
        dataclasses = sys.modules[__name__]
        if (_is_initvar(a_type, dataclasses)
            or (isinstance(f.type, str)
                and _is_type(f.type, cls, dataclasses, dataclasses.InitVar,
                             _is_initvar))):
            f._field_type = _FIELD_INITVAR

    # Validations for individual fields.  This is delayed until now,
    # instead of in the Field() constructor, since only here do we
    # know the field name, which allows for better error reporting.

    # Special restrictions for ClassVar and InitVar.
    if f._field_type in (_FIELD_CLASSVAR, _FIELD_INITVAR):
        if f.default_factory is not MISSING:
            raise TypeError(f'field {f.name} cannot have a '
                            'default factory')
        # Should I check for other field settings? default_factory
        # seems the most serious to check for.  Maybe add others.  For
        # example, how about init=False (or really,
        # init=<not-the-default-init-value>)?  It makes no sense for
        # ClassVar and InitVar to specify init=<anything>.

    # For real fields, disallow mutable defaults for known types.
    if f._field_type is _FIELD and isinstance(f.default, (list, dict, set)):
        raise ValueError(f'mutable default {type(f.default)} for field '
                         f'{f.name} is not allowed: use default_factory')

    return f
738
739
def _set_new_attribute(cls, name, value):
    # Set cls.<name> to value unless the class itself already defines
    # that name.  Never overwrites an existing attribute.  Only cls's
    # own __dict__ is consulted, so attributes inherited from base
    # classes do not count as existing.  Returns True if the attribute
    # already exists (nothing was set), False if it was added.
    if name in cls.__dict__:
        return True
    setattr(cls, name, value)
    return False
Eric V. Smithf0db54a2017-12-04 16:58:55 -0500747
748
# Decide if/how we're going to create a hash function.  Key is
# (unsafe_hash, eq, frozen, does-hash-exist).  Value is the action to
# take.  The common case is to do nothing, so instead of providing a
# function that is a no-op, use None to signify that.
Eric V. Smith01d618c2018-03-24 22:10:14 -0400753
def _hash_set_none(cls, fields):
    # Hash action: the value to store as __hash__ is None.  Both
    # arguments are accepted only so that every hash action shares the
    # same (cls, fields) call signature; they are not used.
    return None
756
def _hash_add(cls, fields):
    # Hash action: build a __hash__ from the participating fields.  A
    # field participates according to its 'hash' setting; when that is
    # None the decision falls back to its 'compare' setting.  cls is
    # unused and is present only for the shared action signature.
    flds = [f for f in fields if (f.compare if f.hash is None else f.hash)]
    return _hash_fn(flds)
760
def _hash_exception(cls, fields):
    # Hash action: refuse to replace a __hash__ that already exists.
    # Always raises TypeError naming the class; fields is unused and is
    # present only for the shared action signature.
    raise TypeError('Cannot overwrite attribute __hash__ '
                    f'in class {cls.__name__}')
765
# Lookup table mapping the four boolean inputs to the hash action to
# run.  A value of None means "leave __hash__ alone"; otherwise the
# value is a callable taking (cls, fields).
#
#                +-------------------------------------- unsafe_hash?
#                |      +------------------------------- eq?
#                |      |      +------------------------ frozen?
#                |      |      |      +----------------  has-explicit-hash?
#                |      |      |      |
#                |      |      |      |        +-------  action
#                |      |      |      |        |
#                v      v      v      v        v
_hash_action = {(False, False, False, False): None,
                (False, False, False, True ): None,
                (False, False, True,  False): None,
                (False, False, True,  True ): None,
                (False, True,  False, False): _hash_set_none,
                (False, True,  False, True ): None,
                (False, True,  True,  False): _hash_add,
                (False, True,  True,  True ): None,
                (True,  False, False, False): _hash_add,
                (True,  False, False, True ): _hash_exception,
                (True,  False, True,  False): _hash_add,
                (True,  False, True,  True ): _hash_exception,
                (True,  True,  False, False): _hash_add,
                (True,  True,  False, True ): _hash_exception,
                (True,  True,  True,  False): _hash_add,
                (True,  True,  True,  True ): _hash_exception,
                }
# See https://bugs.python.org/issue32929#msg312829 for an if-statement
# version of this table.
Eric V. Smithdbf9cff2018-02-25 21:30:17 -0500794
795
def _process_class(cls, init, repr, eq, order, unsafe_hash, frozen):
    # Turn cls into a dataclass in place and return it.  The remaining
    # arguments are the flags given to the @dataclass decorator.
    #
    # Raises TypeError for a Field without an annotation, for mixing
    # frozen and non-frozen dataclasses in one hierarchy, and when a
    # generated ordering/frozen/hash method would overwrite one the
    # class already defines.  Raises ValueError if order is true but
    # eq is not.

    # Now that dicts retain insertion order, there's no reason to use
    # an ordered dict.  I am leveraging that ordering here, because
    # derived class fields overwrite base class fields, but the order
    # is defined by the base class, which is found first.
    fields = {}

    setattr(cls, _PARAMS, _DataclassParams(init, repr, eq, order,
                                           unsafe_hash, frozen))

    # Find our base classes in reverse MRO order, and exclude
    # ourselves.  In reversed order so that more derived classes
    # override earlier field definitions in base classes.  As long as
    # we're iterating over them, see if any are frozen.
    any_frozen_base = False
    has_dataclass_bases = False
    for b in cls.__mro__[-1:0:-1]:
        # Only process classes that have been processed by our
        # decorator.  That is, they have a _FIELDS attribute.  Compare
        # against None rather than testing truthiness: a dataclass
        # with no fields has an empty (falsy) dict here, and must
        # still take part in the frozen checks below.
        base_fields = getattr(b, _FIELDS, None)
        if base_fields is not None:
            has_dataclass_bases = True
            for f in base_fields.values():
                fields[f.name] = f
            if getattr(b, _PARAMS).frozen:
                any_frozen_base = True

    # Annotations that are defined in this class (not in base
    # classes).  If __annotations__ isn't present, then this class
    # adds no new annotations.  We use this to compute fields that are
    # added by this class.
    #
    # Fields are found from cls_annotations, which is guaranteed to be
    # ordered.  Default values are from class attributes, if a field
    # has a default.  If the default value is a Field(), then it
    # contains additional info beyond (and possibly including) the
    # actual default value.  Pseudo-fields ClassVars and InitVars are
    # included, despite the fact that they're not real fields.  That's
    # dealt with later.
    cls_annotations = cls.__dict__.get('__annotations__', {})

    # Now find fields in our class.  While doing so, validate some
    # things, and set the default values (as class attributes) where
    # we can.
    cls_fields = [_get_field(cls, name, tp)
                  for name, tp in cls_annotations.items()]
    for f in cls_fields:
        fields[f.name] = f

        # If the class attribute (which is the default value for this
        # field) exists and is of type 'Field', replace it with the
        # real default.  This is so that normal class introspection
        # sees a real default value, not a Field.
        if isinstance(getattr(cls, f.name, None), Field):
            if f.default is MISSING:
                # If there's no default, delete the class attribute.
                # This happens if we specify field(repr=False), for
                # example (that is, we specified a field object, but
                # no default value).  Also if we're using a default
                # factory.  The class attribute should not be set at
                # all in the post-processed class.
                delattr(cls, f.name)
            else:
                setattr(cls, f.name, f.default)

    # Do we have any Field members that don't also have annotations?
    for name, value in cls.__dict__.items():
        if isinstance(value, Field) and name not in cls_annotations:
            raise TypeError(f'{name!r} is a field but has no type annotation')

    # Check rules that apply if we are derived from any dataclasses.
    if has_dataclass_bases:
        # Raise an exception if any of our bases are frozen, but we're not.
        if any_frozen_base and not frozen:
            raise TypeError('cannot inherit non-frozen dataclass from a '
                            'frozen one')

        # Raise an exception if we're frozen, but none of our bases are.
        if not any_frozen_base and frozen:
            raise TypeError('cannot inherit frozen dataclass from a '
                            'non-frozen one')

    # Remember all of the fields on our class (including bases).  This
    # also marks this class as being a dataclass.
    setattr(cls, _FIELDS, fields)

    # Was this class defined with an explicit __hash__?  Note that if
    # __eq__ is defined in this class, then python will automatically
    # set __hash__ to None.  This is a heuristic, as it's possible
    # that such a __hash__ == None was not auto-generated, but it's
    # close enough.
    class_hash = cls.__dict__.get('__hash__', MISSING)
    has_explicit_hash = not (class_hash is MISSING or
                             (class_hash is None and '__eq__' in cls.__dict__))

    # If we're generating ordering methods, we must be generating the
    # eq methods.
    if order and not eq:
        raise ValueError('eq must be true if order is true')

    if init:
        # Does this class have a post-init function?
        has_post_init = hasattr(cls, _POST_INIT_NAME)

        # Include InitVars and regular fields (so, not ClassVars).
        flds = [f for f in fields.values()
                if f._field_type in (_FIELD, _FIELD_INITVAR)]
        _set_new_attribute(cls, '__init__',
                           _init_fn(flds,
                                    frozen,
                                    has_post_init,
                                    # The name to use for the "self"
                                    # param in __init__.  Use "self"
                                    # if possible.
                                    '__dataclass_self__' if 'self' in fields
                                            else 'self',
                          ))

    # Get the fields as a list, and include only real fields.  This is
    # used in all of the following methods.
    field_list = [f for f in fields.values() if f._field_type is _FIELD]

    if repr:
        flds = [f for f in field_list if f.repr]
        _set_new_attribute(cls, '__repr__', _repr_fn(flds))

    if eq:
        # Create __eq__ method.  There's no need for a __ne__ method,
        # since python will call __eq__ and negate it.
        flds = [f for f in field_list if f.compare]
        self_tuple = _tuple_str('self', flds)
        other_tuple = _tuple_str('other', flds)
        _set_new_attribute(cls, '__eq__',
                           _cmp_fn('__eq__', '==',
                                   self_tuple, other_tuple))

    if order:
        # Create and set the ordering methods.
        flds = [f for f in field_list if f.compare]
        self_tuple = _tuple_str('self', flds)
        other_tuple = _tuple_str('other', flds)
        for name, op in [('__lt__', '<'),
                         ('__le__', '<='),
                         ('__gt__', '>'),
                         ('__ge__', '>='),
                         ]:
            if _set_new_attribute(cls, name,
                                  _cmp_fn(name, op, self_tuple, other_tuple)):
                raise TypeError(f'Cannot overwrite attribute {name} '
                                f'in class {cls.__name__}. Consider using '
                                'functools.total_ordering')

    if frozen:
        for fn in _frozen_get_del_attr(cls, field_list):
            if _set_new_attribute(cls, fn.__name__, fn):
                raise TypeError(f'Cannot overwrite attribute {fn.__name__} '
                                f'in class {cls.__name__}')

    # Decide if/how we're going to create a hash function.
    hash_action = _hash_action[bool(unsafe_hash),
                               bool(eq),
                               bool(frozen),
                               has_explicit_hash]
    if hash_action:
        # No need to call _set_new_attribute here, since by the time
        # we're here the overwriting is unconditional.
        cls.__hash__ = hash_action(cls, field_list)

    if not getattr(cls, '__doc__'):
        # Create a class doc-string.
        cls.__doc__ = (cls.__name__ +
                       str(inspect.signature(cls)).replace(' -> None', ''))

    return cls
970
971
def dataclass(cls=None, /, *, init=True, repr=True, eq=True, order=False,
              unsafe_hash=False, frozen=False):
    """Returns the same class as was passed in, with dunder methods
    added based on the fields defined in the class.

    Examines PEP 526 __annotations__ to determine fields.

    If init is true, an __init__() method is added to the class. If
    repr is true, a __repr__() method is added. If eq is true, an
    __eq__() method is added. If order is true, rich comparison dunder
    methods are added. If unsafe_hash is true, a __hash__() method
    function is added. If frozen is true, fields may not be assigned
    to after instance creation.

    May be used either as @dataclass or as @dataclass(...); in the
    second form a decorator is returned that is then applied to the
    class.
    """

    def wrap(cls):
        return _process_class(cls, init, repr, eq, order, unsafe_hash, frozen)

    # See if we're being called as @dataclass or @dataclass().
    if cls is None:
        # We're called with parens.
        return wrap

    # We're called as @dataclass without parens.
    return wrap(cls)
997
def fields(class_or_instance):
    """Return a tuple describing the fields of this dataclass.

    Accepts a dataclass or an instance of one. Tuple elements are of
    type Field.

    Raises TypeError if the argument is neither a dataclass nor an
    instance of one.
    """

    # Might it be worth caching this, per class?
    try:
        field_map = getattr(class_or_instance, _FIELDS)
    except AttributeError:
        # The AttributeError is an implementation detail; don't chain
        # it onto the error the caller sees.
        raise TypeError('must be called with a dataclass type or instance') from None

    # Exclude pseudo-fields.  Note that the mapping is sorted by
    # insertion order, so the order of the tuple is as the fields were
    # defined.
    return tuple(f for f in field_map.values() if f._field_type is _FIELD)
1014
1015
def _is_dataclass_instance(obj):
    """Returns True if obj is an instance of a dataclass."""
    # Look the marker up on the type, not on obj itself.  This is False
    # for a dataclass class (its type is the metaclass), and it cannot
    # be fooled by an object whose __getattr__ answers for any name.
    return hasattr(type(obj), _FIELDS)
Eric V. Smithf0db54a2017-12-04 16:58:55 -05001019
1020
def is_dataclass(obj):
    """Returns True if obj is a dataclass or an instance of a
    dataclass."""
    # Always test the class: checking an instance directly would report
    # True for any object whose __getattr__ answers for every name.
    cls = obj if isinstance(obj, type) else type(obj)
    return hasattr(cls, _FIELDS)
Eric V. Smithe7ba0132018-01-06 12:41:53 -05001025
1026
def asdict(obj, *, dict_factory=dict):
    """Return the fields of a dataclass instance as a new dictionary mapping
    field names to field values.

    Example usage:

      @dataclass
      class C:
          x: int
          y: int

      c = C(1, 2)
      assert asdict(c) == {'x': 1, 'y': 2}

    If given, 'dict_factory' will be used instead of built-in dict.
    The function applies recursively to field values that are
    dataclass instances. This will also look into built-in containers:
    tuples, lists, and dicts.

    Raises TypeError if obj is not a dataclass instance (a dataclass
    class itself is rejected too).
    """
    if not _is_dataclass_instance(obj):
        raise TypeError("asdict() should be called on dataclass instances")
    return _asdict_inner(obj, dict_factory)
1049
Eric V. Smithdbf9cff2018-02-25 21:30:17 -05001050
def _asdict_inner(obj, dict_factory):
    # Recursive worker for asdict().  Dataclass instances become
    # dict_factory(...) of (name, value) pairs; namedtuples, lists,
    # tuples and dicts are rebuilt as the same type with converted
    # contents; anything else is deep-copied.
    if _is_dataclass_instance(obj):
        result = []
        for f in fields(obj):
            value = _asdict_inner(getattr(obj, f.name), dict_factory)
            result.append((f.name, value))
        return dict_factory(result)
    elif isinstance(obj, tuple) and hasattr(obj, '_fields'):
        # obj is a namedtuple.  Recurse into it, but the returned
        # object is another namedtuple of the same type.  This is
        # similar to how other list- or tuple-derived classes are
        # treated (see below), but we just need to create them
        # differently because a namedtuple's __init__ needs to be
        # called differently (see bpo-34363).

        # I'm not using namedtuple's _asdict()
        # method, because:
        # - it does not recurse in to the namedtuple fields and
        #   convert them to dicts (using dict_factory).
        # - I don't actually want to return a dict here.  The main
        #   use case here is json.dumps, and it handles converting
        #   namedtuples to lists.  Admittedly we're losing some
        #   information here when we produce a json list instead of a
        #   dict.  Note that if we returned dicts here instead of
        #   namedtuples, we could no longer call asdict() on a data
        #   structure where a namedtuple was used as a dict key.

        return type(obj)(*[_asdict_inner(v, dict_factory) for v in obj])
    elif isinstance(obj, (list, tuple)):
        # Assume we can create an object of this type by passing in a
        # generator (which is not true for namedtuples, handled
        # above).
        return type(obj)(_asdict_inner(v, dict_factory) for v in obj)
    elif isinstance(obj, dict):
        if hasattr(type(obj), 'default_factory'):
            # obj is a defaultdict, whose constructor takes the
            # default_factory as its first argument rather than the
            # items.  Build an empty one and fill it in.
            result = type(obj)(getattr(obj, 'default_factory'))
            for k, v in obj.items():
                result[_asdict_inner(k, dict_factory)] = \
                    _asdict_inner(v, dict_factory)
            return result
        return type(obj)((_asdict_inner(k, dict_factory),
                          _asdict_inner(v, dict_factory))
                         for k, v in obj.items())
    else:
        return copy.deepcopy(obj)
Eric V. Smithf0db54a2017-12-04 16:58:55 -05001090
1091
def astuple(obj, *, tuple_factory=tuple):
    """Return the fields of a dataclass instance as a new tuple of field values.

    Example usage::

      @dataclass
      class C:
          x: int
          y: int

      c = C(1, 2)
      assert astuple(c) == (1, 2)

    If given, 'tuple_factory' will be used instead of built-in tuple.
    The function applies recursively to field values that are
    dataclass instances. This will also look into built-in containers:
    tuples, lists, and dicts.

    Raises TypeError if obj is not a dataclass instance (a dataclass
    class itself is rejected too).
    """

    if not _is_dataclass_instance(obj):
        raise TypeError("astuple() should be called on dataclass instances")
    return _astuple_inner(obj, tuple_factory)
1114
Eric V. Smithdbf9cff2018-02-25 21:30:17 -05001115
def _astuple_inner(obj, tuple_factory):
    # Recursive worker for astuple().  Dataclass instances become
    # tuple_factory(...) of their field values; namedtuples, lists,
    # tuples and dicts are rebuilt as the same type with converted
    # contents; anything else is deep-copied.
    if _is_dataclass_instance(obj):
        result = []
        for f in fields(obj):
            value = _astuple_inner(getattr(obj, f.name), tuple_factory)
            result.append(value)
        return tuple_factory(result)
    elif isinstance(obj, tuple) and hasattr(obj, '_fields'):
        # obj is a namedtuple.  Recurse into it, but the returned
        # object is another namedtuple of the same type.  This is
        # similar to how other list- or tuple-derived classes are
        # treated (see below), but we just need to create them
        # differently because a namedtuple's __init__ needs to be
        # called differently (see bpo-34363).
        return type(obj)(*[_astuple_inner(v, tuple_factory) for v in obj])
    elif isinstance(obj, (list, tuple)):
        # Assume we can create an object of this type by passing in a
        # generator (which is not true for namedtuples, handled
        # above).
        return type(obj)(_astuple_inner(v, tuple_factory) for v in obj)
    elif isinstance(obj, dict):
        if hasattr(type(obj), 'default_factory'):
            # obj is a defaultdict, whose constructor takes the
            # default_factory as its first argument rather than the
            # items.  Build an empty one and fill it in.
            result = type(obj)(getattr(obj, 'default_factory'))
            for k, v in obj.items():
                result[_astuple_inner(k, tuple_factory)] = \
                    _astuple_inner(v, tuple_factory)
            return result
        return type(obj)((_astuple_inner(k, tuple_factory),
                          _astuple_inner(v, tuple_factory))
                         for k, v in obj.items())
    else:
        return copy.deepcopy(obj)
Eric V. Smithf0db54a2017-12-04 16:58:55 -05001141
1142
def make_dataclass(cls_name, fields, *, bases=(), namespace=None, init=True,
                   repr=True, eq=True, order=False, unsafe_hash=False,
                   frozen=False):
    """Return a new dynamically created dataclass.

    The dataclass name will be 'cls_name'.  'fields' is an iterable
    of either (name), (name, type) or (name, type, Field) objects. If type is
    omitted, use the string 'typing.Any'.  Field objects are created by
    the equivalent of calling 'field(name, type [, Field-info])'.

      C = make_dataclass('C', ['x', ('y', int), ('z', int, field(init=False))], bases=(Base,))

    is equivalent to:

      @dataclass
      class C(Base):
          x: 'typing.Any'
          y: int
          z: int = field(init=False)

    For the bases and namespace parameters, see the builtin type() function.

    The parameters init, repr, eq, order, unsafe_hash, and frozen are passed to
    dataclass().

    Raises TypeError if an item of 'fields' has the wrong shape, or if
    a field name is not a valid identifier, is a keyword, or is
    duplicated.
    """

    if namespace is None:
        namespace = {}
    else:
        # Copy namespace since we're going to mutate it.
        namespace = namespace.copy()

    # While we're looking through the field names, validate that they
    # are identifiers, are not keywords, and not duplicates.
    seen = set()
    anns = {}
    for item in fields:
        if isinstance(item, str):
            name = item
            tp = 'typing.Any'
        elif len(item) == 2:
            name, tp = item
        elif len(item) == 3:
            name, tp, spec = item
            namespace[name] = spec
        else:
            raise TypeError(f'Invalid field: {item!r}')

        if not isinstance(name, str) or not name.isidentifier():
            raise TypeError(f'Field names must be valid identifiers: {name!r}')
        if keyword.iskeyword(name):
            raise TypeError(f'Field names must not be keywords: {name!r}')
        if name in seen:
            raise TypeError(f'Field name duplicated: {name!r}')

        seen.add(name)
        anns[name] = tp

    namespace['__annotations__'] = anns
    # We use `types.new_class()` instead of simply `type()` to allow dynamic creation
    # of generic dataclasses.
    cls = types.new_class(cls_name, bases, {}, lambda ns: ns.update(namespace))
    return dataclass(cls, init=init, repr=repr, eq=eq, order=order,
                     unsafe_hash=unsafe_hash, frozen=frozen)
1207
Eric V. Smithf0db54a2017-12-04 16:58:55 -05001208
def replace(obj, **changes):
    """Return a new object replacing specified fields with new values.

    This is especially useful for frozen classes.  Example usage:

      @dataclass(frozen=True)
      class C:
          x: int
          y: int

      c = C(1, 2)
      c1 = replace(c, x=3)
      assert c1.x == 3 and c1.y == 2

    Raises TypeError if obj is not a dataclass instance.  Raises
    ValueError if 'changes' names a field declared with init=False, or
    omits an InitVar that has no default value.
    """

    # We're going to mutate 'changes', but that's okay because it's a
    # new dict, even if called with 'replace(obj, **my_changes)'.

    if not _is_dataclass_instance(obj):
        raise TypeError("replace() should be called on dataclass instances")

    # It's an error to have init=False fields in 'changes'.
    # If a field is not in 'changes', read its value from the provided obj.

    for f in getattr(obj, _FIELDS).values():
        # Only consider normal fields or InitVars.
        if f._field_type is _FIELD_CLASSVAR:
            continue

        if not f.init:
            # Error if this field is specified in changes.
            if f.name in changes:
                raise ValueError(f'field {f.name} is declared with '
                                 'init=False, it cannot be specified with '
                                 'replace()')
            continue

        if f.name not in changes:
            # An InitVar without a default has no value to read back
            # from obj, so the caller has to supply it.
            if f._field_type is _FIELD_INITVAR and f.default is MISSING:
                raise ValueError(f"InitVar {f.name!r} "
                                 'must be specified with replace()')
            changes[f.name] = getattr(obj, f.name)

    # Create the new object, which calls __init__() and
    # __post_init__() (if defined), using all of the init fields we've
    # added and/or left in 'changes'.  If there are values supplied in
    # changes that aren't fields, this will correctly raise a
    # TypeError.
    return obj.__class__(**changes)
Eric V. Smithf0db54a2017-12-04 16:58:55 -05001257 return obj.__class__(**changes)