Coverage for /pythoncovmergedfiles/medio/medio/usr/lib/python3.9/dataclasses.py: 57%
393 statements
« prev ^ index » next coverage.py v7.3.2, created at 2023-10-20 07:00 +0000
« prev ^ index » next coverage.py v7.3.2, created at 2023-10-20 07:00 +0000
1import re
2import sys
3import copy
4import types
5import inspect
6import keyword
7import builtins
8import functools
9import _thread
10from types import GenericAlias
13__all__ = ['dataclass',
14 'field',
15 'Field',
16 'FrozenInstanceError',
17 'InitVar',
18 'MISSING',
20 # Helper functions.
21 'fields',
22 'asdict',
23 'astuple',
24 'make_dataclass',
25 'replace',
26 'is_dataclass',
27 ]
29# Conditions for adding methods. The boxes indicate what action the
30# dataclass decorator takes. For all of these tables, when I talk
31# about init=, repr=, eq=, order=, unsafe_hash=, or frozen=, I'm
32# referring to the arguments to the @dataclass decorator. When
33# checking if a dunder method already exists, I mean check for an
34# entry in the class's __dict__. I never check to see if an attribute
35# is defined in a base class.
37# Key:
38# +=========+=========================================+
39# + Value | Meaning |
40# +=========+=========================================+
41# | <blank> | No action: no method is added. |
42# +---------+-----------------------------------------+
43# | add | Generated method is added. |
44# +---------+-----------------------------------------+
45# | raise | TypeError is raised. |
46# +---------+-----------------------------------------+
47# | None | Attribute is set to None. |
48# +=========+=========================================+
50# __init__
51#
52# +--- init= parameter
53# |
54# v | | |
55# | no | yes | <--- class has __init__ in __dict__?
56# +=======+=======+=======+
57# | False | | |
58# +-------+-------+-------+
59# | True | add | | <- the default
60# +=======+=======+=======+
62# __repr__
63#
64# +--- repr= parameter
65# |
66# v | | |
67# | no | yes | <--- class has __repr__ in __dict__?
68# +=======+=======+=======+
69# | False | | |
70# +-------+-------+-------+
71# | True | add | | <- the default
72# +=======+=======+=======+
75# __setattr__
76# __delattr__
77#
78# +--- frozen= parameter
79# |
80# v | | |
81# | no | yes | <--- class has __setattr__ or __delattr__ in __dict__?
82# +=======+=======+=======+
83# | False | | | <- the default
84# +-------+-------+-------+
85# | True | add | raise |
86# +=======+=======+=======+
87# Raise because not adding these methods would break the "frozen-ness"
88# of the class.
90# __eq__
91#
92# +--- eq= parameter
93# |
94# v | | |
95# | no | yes | <--- class has __eq__ in __dict__?
96# +=======+=======+=======+
97# | False | | |
98# +-------+-------+-------+
99# | True | add | | <- the default
100# +=======+=======+=======+
102# __lt__
103# __le__
104# __gt__
105# __ge__
106#
107# +--- order= parameter
108# |
109# v | | |
110# | no | yes | <--- class has any comparison method in __dict__?
111# +=======+=======+=======+
112# | False | | | <- the default
113# +-------+-------+-------+
114# | True | add | raise |
115# +=======+=======+=======+
116# Raise because to allow this case would interfere with using
117# functools.total_ordering.
119# __hash__
121# +------------------- unsafe_hash= parameter
122# | +----------- eq= parameter
123# | | +--- frozen= parameter
124# | | |
125# v v v | | |
126# | no | yes | <--- class has explicitly defined __hash__
127# +=======+=======+=======+========+========+
128# | False | False | False | | | No __eq__, use the base class __hash__
129# +-------+-------+-------+--------+--------+
130# | False | False | True | | | No __eq__, use the base class __hash__
131# +-------+-------+-------+--------+--------+
132# | False | True | False | None | | <-- the default, not hashable
133# +-------+-------+-------+--------+--------+
134# | False | True | True | add | | Frozen, so hashable, allows override
135# +-------+-------+-------+--------+--------+
136# | True | False | False | add | raise | Has no __eq__, but hashable
137# +-------+-------+-------+--------+--------+
138# | True | False | True | add | raise | Has no __eq__, but hashable
139# +-------+-------+-------+--------+--------+
140# | True | True | False | add | raise | Not frozen, but hashable
141# +-------+-------+-------+--------+--------+
142# | True | True | True | add | raise | Frozen, so hashable
143# +=======+=======+=======+========+========+
144# For boxes that are blank, __hash__ is untouched and therefore
145# inherited from the base class. If the base is object, then
146# id-based hashing is used.
147#
148# Note that a class may already have __hash__=None if it specified an
149# __eq__ method in the class body (not one that was created by
150# @dataclass).
151#
152# See _hash_action (below) for a coded version of this table.
155# Raised when an attempt is made to modify a frozen class.
156class FrozenInstanceError(AttributeError): pass
158# A sentinel object for default values to signal that a default
159# factory will be used. This is given a nice repr() which will appear
160# in the function signature of dataclasses' constructors.
161class _HAS_DEFAULT_FACTORY_CLASS:
162 def __repr__(self):
163 return '<factory>'
164_HAS_DEFAULT_FACTORY = _HAS_DEFAULT_FACTORY_CLASS()
166# A sentinel object to detect if a parameter is supplied or not. Use
167# a class to give it a better repr.
168class _MISSING_TYPE:
169 pass
170MISSING = _MISSING_TYPE()
172# Since most per-field metadata will be unused, create an empty
173# read-only proxy that can be shared among all fields.
174_EMPTY_METADATA = types.MappingProxyType({})
176# Markers for the various kinds of fields and pseudo-fields.
177class _FIELD_BASE:
178 def __init__(self, name):
179 self.name = name
180 def __repr__(self):
181 return self.name
182_FIELD = _FIELD_BASE('_FIELD')
183_FIELD_CLASSVAR = _FIELD_BASE('_FIELD_CLASSVAR')
184_FIELD_INITVAR = _FIELD_BASE('_FIELD_INITVAR')
186# The name of an attribute on the class where we store the Field
187# objects. Also used to check if a class is a Data Class.
188_FIELDS = '__dataclass_fields__'
190# The name of an attribute on the class that stores the parameters to
191# @dataclass.
192_PARAMS = '__dataclass_params__'
194# The name of the function, that if it exists, is called at the end of
195# __init__.
196_POST_INIT_NAME = '__post_init__'
198# String regex that string annotations for ClassVar or InitVar must match.
199# Allows "identifier.identifier[" or "identifier[".
200# https://bugs.python.org/issue33453 for details.
201_MODULE_IDENTIFIER_RE = re.compile(r'^(?:\s*(\w+)\s*\.)?\s*(\w+)')
203class InitVar:
204 __slots__ = ('type', )
206 def __init__(self, type):
207 self.type = type
209 def __repr__(self):
210 if isinstance(self.type, type):
211 type_name = self.type.__name__
212 else:
213 # typing objects, e.g. List[int]
214 type_name = repr(self.type)
215 return f'dataclasses.InitVar[{type_name}]'
217 def __class_getitem__(cls, type):
218 return InitVar(type)
221# Instances of Field are only ever created from within this module,
222# and only from the field() function, although Field instances are
223# exposed externally as (conceptually) read-only objects.
224#
225# name and type are filled in after the fact, not in __init__.
226# They're not known at the time this class is instantiated, but it's
227# convenient if they're available later.
228#
229# When cls._FIELDS is filled in with a list of Field objects, the name
230# and type fields will have been populated.
231class Field:
232 __slots__ = ('name',
233 'type',
234 'default',
235 'default_factory',
236 'repr',
237 'hash',
238 'init',
239 'compare',
240 'metadata',
241 '_field_type', # Private: not to be used by user code.
242 )
244 def __init__(self, default, default_factory, init, repr, hash, compare,
245 metadata):
246 self.name = None
247 self.type = None
248 self.default = default
249 self.default_factory = default_factory
250 self.init = init
251 self.repr = repr
252 self.hash = hash
253 self.compare = compare
254 self.metadata = (_EMPTY_METADATA
255 if metadata is None else
256 types.MappingProxyType(metadata))
257 self._field_type = None
259 def __repr__(self):
260 return ('Field('
261 f'name={self.name!r},'
262 f'type={self.type!r},'
263 f'default={self.default!r},'
264 f'default_factory={self.default_factory!r},'
265 f'init={self.init!r},'
266 f'repr={self.repr!r},'
267 f'hash={self.hash!r},'
268 f'compare={self.compare!r},'
269 f'metadata={self.metadata!r},'
270 f'_field_type={self._field_type}'
271 ')')
273 # This is used to support the PEP 487 __set_name__ protocol in the
274 # case where we're using a field that contains a descriptor as a
275 # default value. For details on __set_name__, see
276 # https://www.python.org/dev/peps/pep-0487/#implementation-details.
277 #
278 # Note that in _process_class, this Field object is overwritten
279 # with the default value, so the end result is a descriptor that
280 # had __set_name__ called on it at the right time.
281 def __set_name__(self, owner, name):
282 func = getattr(type(self.default), '__set_name__', None)
283 if func:
284 # There is a __set_name__ method on the descriptor, call
285 # it.
286 func(self.default, owner, name)
288 __class_getitem__ = classmethod(GenericAlias)
291class _DataclassParams:
292 __slots__ = ('init',
293 'repr',
294 'eq',
295 'order',
296 'unsafe_hash',
297 'frozen',
298 )
300 def __init__(self, init, repr, eq, order, unsafe_hash, frozen):
301 self.init = init
302 self.repr = repr
303 self.eq = eq
304 self.order = order
305 self.unsafe_hash = unsafe_hash
306 self.frozen = frozen
308 def __repr__(self):
309 return ('_DataclassParams('
310 f'init={self.init!r},'
311 f'repr={self.repr!r},'
312 f'eq={self.eq!r},'
313 f'order={self.order!r},'
314 f'unsafe_hash={self.unsafe_hash!r},'
315 f'frozen={self.frozen!r}'
316 ')')
319# This function is used instead of exposing Field creation directly,
320# so that a type checker can be told (via overloads) that this is a
321# function whose type depends on its parameters.
322def field(*, default=MISSING, default_factory=MISSING, init=True, repr=True,
323 hash=None, compare=True, metadata=None):
324 """Return an object to identify dataclass fields.
326 default is the default value of the field. default_factory is a
327 0-argument function called to initialize a field's value. If init
328 is True, the field will be a parameter to the class's __init__()
329 function. If repr is True, the field will be included in the
330 object's repr(). If hash is True, the field will be included in
331 the object's hash(). If compare is True, the field will be used
332 in comparison functions. metadata, if specified, must be a
333 mapping which is stored but not otherwise examined by dataclass.
335 It is an error to specify both default and default_factory.
336 """
338 if default is not MISSING and default_factory is not MISSING:
339 raise ValueError('cannot specify both default and default_factory')
340 return Field(default, default_factory, init, repr, hash, compare,
341 metadata)
344def _tuple_str(obj_name, fields):
345 # Return a string representing each field of obj_name as a tuple
346 # member. So, if fields is ['x', 'y'] and obj_name is "self",
347 # return "(self.x,self.y)".
349 # Special case for the 0-tuple.
350 if not fields:
351 return '()'
352 # Note the trailing comma, needed if this turns out to be a 1-tuple.
353 return f'({",".join([f"{obj_name}.{f.name}" for f in fields])},)'
356# This function's logic is copied from "recursive_repr" function in
357# reprlib module to avoid dependency.
358def _recursive_repr(user_function):
359 # Decorator to make a repr function return "..." for a recursive
360 # call.
361 repr_running = set()
363 @functools.wraps(user_function)
364 def wrapper(self):
365 key = id(self), _thread.get_ident()
366 if key in repr_running:
367 return '...'
368 repr_running.add(key)
369 try:
370 result = user_function(self)
371 finally:
372 repr_running.discard(key)
373 return result
374 return wrapper
377def _create_fn(name, args, body, *, globals=None, locals=None,
378 return_type=MISSING):
379 # Note that we mutate locals when exec() is called. Caller
380 # beware! The only callers are internal to this module, so no
381 # worries about external callers.
382 if locals is None:
383 locals = {}
384 if 'BUILTINS' not in locals:
385 locals['BUILTINS'] = builtins
386 return_annotation = ''
387 if return_type is not MISSING:
388 locals['_return_type'] = return_type
389 return_annotation = '->_return_type'
390 args = ','.join(args)
391 body = '\n'.join(f' {b}' for b in body)
393 # Compute the text of the entire function.
394 txt = f' def {name}({args}){return_annotation}:\n{body}'
396 local_vars = ', '.join(locals.keys())
397 txt = f"def __create_fn__({local_vars}):\n{txt}\n return {name}"
399 ns = {}
400 exec(txt, globals, ns)
401 return ns['__create_fn__'](**locals)
404def _field_assign(frozen, name, value, self_name):
405 # If we're a frozen class, then assign to our fields in __init__
406 # via object.__setattr__. Otherwise, just use a simple
407 # assignment.
408 #
409 # self_name is what "self" is called in this function: don't
410 # hard-code "self", since that might be a field name.
411 if frozen:
412 return f'BUILTINS.object.__setattr__({self_name},{name!r},{value})'
413 return f'{self_name}.{name}={value}'
416def _field_init(f, frozen, globals, self_name):
417 # Return the text of the line in the body of __init__ that will
418 # initialize this field.
420 default_name = f'_dflt_{f.name}'
421 if f.default_factory is not MISSING:
422 if f.init:
423 # This field has a default factory. If a parameter is
424 # given, use it. If not, call the factory.
425 globals[default_name] = f.default_factory
426 value = (f'{default_name}() '
427 f'if {f.name} is _HAS_DEFAULT_FACTORY '
428 f'else {f.name}')
429 else:
430 # This is a field that's not in the __init__ params, but
431 # has a default factory function. It needs to be
432 # initialized here by calling the factory function,
433 # because there's no other way to initialize it.
435 # For a field initialized with a default=defaultvalue, the
436 # class dict just has the default value
437 # (cls.fieldname=defaultvalue). But that won't work for a
438 # default factory, the factory must be called in __init__
439 # and we must assign that to self.fieldname. We can't
440 # fall back to the class dict's value, both because it's
441 # not set, and because it might be different per-class
442 # (which, after all, is why we have a factory function!).
444 globals[default_name] = f.default_factory
445 value = f'{default_name}()'
446 else:
447 # No default factory.
448 if f.init:
449 if f.default is MISSING:
450 # There's no default, just do an assignment.
451 value = f.name
452 elif f.default is not MISSING:
453 globals[default_name] = f.default
454 value = f.name
455 else:
456 # This field does not need initialization. Signify that
457 # to the caller by returning None.
458 return None
460 # Only test this now, so that we can create variables for the
461 # default. However, return None to signify that we're not going
462 # to actually do the assignment statement for InitVars.
463 if f._field_type is _FIELD_INITVAR:
464 return None
466 # Now, actually generate the field assignment.
467 return _field_assign(frozen, f.name, value, self_name)
470def _init_param(f):
471 # Return the __init__ parameter string for this field. For
472 # example, the equivalent of 'x:int=3' (except instead of 'int',
473 # reference a variable set to int, and instead of '3', reference a
474 # variable set to 3).
475 if f.default is MISSING and f.default_factory is MISSING:
476 # There's no default, and no default_factory, just output the
477 # variable name and type.
478 default = ''
479 elif f.default is not MISSING:
480 # There's a default, this will be the name that's used to look
481 # it up.
482 default = f'=_dflt_{f.name}'
483 elif f.default_factory is not MISSING:
484 # There's a factory function. Set a marker.
485 default = '=_HAS_DEFAULT_FACTORY'
486 return f'{f.name}:_type_{f.name}{default}'
489def _init_fn(fields, frozen, has_post_init, self_name, globals):
490 # fields contains both real fields and InitVar pseudo-fields.
492 # Make sure we don't have fields without defaults following fields
493 # with defaults. This actually would be caught when exec-ing the
494 # function source code, but catching it here gives a better error
495 # message, and future-proofs us in case we build up the function
496 # using ast.
497 seen_default = False
498 for f in fields:
499 # Only consider fields in the __init__ call.
500 if f.init:
501 if not (f.default is MISSING and f.default_factory is MISSING):
502 seen_default = True
503 elif seen_default:
504 raise TypeError(f'non-default argument {f.name!r} '
505 'follows default argument')
507 locals = {f'_type_{f.name}': f.type for f in fields}
508 locals.update({
509 'MISSING': MISSING,
510 '_HAS_DEFAULT_FACTORY': _HAS_DEFAULT_FACTORY,
511 })
513 body_lines = []
514 for f in fields:
515 line = _field_init(f, frozen, locals, self_name)
516 # line is None means that this field doesn't require
517 # initialization (it's a pseudo-field). Just skip it.
518 if line:
519 body_lines.append(line)
521 # Does this class have a post-init function?
522 if has_post_init:
523 params_str = ','.join(f.name for f in fields
524 if f._field_type is _FIELD_INITVAR)
525 body_lines.append(f'{self_name}.{_POST_INIT_NAME}({params_str})')
527 # If no body lines, use 'pass'.
528 if not body_lines:
529 body_lines = ['pass']
531 return _create_fn('__init__',
532 [self_name] + [_init_param(f) for f in fields if f.init],
533 body_lines,
534 locals=locals,
535 globals=globals,
536 return_type=None)
539def _repr_fn(fields, globals):
540 fn = _create_fn('__repr__',
541 ('self',),
542 ['return self.__class__.__qualname__ + f"(' +
543 ', '.join([f"{f.name}={{self.{f.name}!r}}"
544 for f in fields]) +
545 ')"'],
546 globals=globals)
547 return _recursive_repr(fn)
550def _frozen_get_del_attr(cls, fields, globals):
551 locals = {'cls': cls,
552 'FrozenInstanceError': FrozenInstanceError}
553 if fields:
554 fields_str = '(' + ','.join(repr(f.name) for f in fields) + ',)'
555 else:
556 # Special case for the zero-length tuple.
557 fields_str = '()'
558 return (_create_fn('__setattr__',
559 ('self', 'name', 'value'),
560 (f'if type(self) is cls or name in {fields_str}:',
561 ' raise FrozenInstanceError(f"cannot assign to field {name!r}")',
562 f'super(cls, self).__setattr__(name, value)'),
563 locals=locals,
564 globals=globals),
565 _create_fn('__delattr__',
566 ('self', 'name'),
567 (f'if type(self) is cls or name in {fields_str}:',
568 ' raise FrozenInstanceError(f"cannot delete field {name!r}")',
569 f'super(cls, self).__delattr__(name)'),
570 locals=locals,
571 globals=globals),
572 )
575def _cmp_fn(name, op, self_tuple, other_tuple, globals):
576 # Create a comparison function. If the fields in the object are
577 # named 'x' and 'y', then self_tuple is the string
578 # '(self.x,self.y)' and other_tuple is the string
579 # '(other.x,other.y)'.
581 return _create_fn(name,
582 ('self', 'other'),
583 [ 'if other.__class__ is self.__class__:',
584 f' return {self_tuple}{op}{other_tuple}',
585 'return NotImplemented'],
586 globals=globals)
589def _hash_fn(fields, globals):
590 self_tuple = _tuple_str('self', fields)
591 return _create_fn('__hash__',
592 ('self',),
593 [f'return hash({self_tuple})'],
594 globals=globals)
597def _is_classvar(a_type, typing):
598 # This test uses a typing internal class, but it's the best way to
599 # test if this is a ClassVar.
600 return (a_type is typing.ClassVar
601 or (type(a_type) is typing._GenericAlias
602 and a_type.__origin__ is typing.ClassVar))
605def _is_initvar(a_type, dataclasses):
606 # The module we're checking against is the module we're
607 # currently in (dataclasses.py).
608 return (a_type is dataclasses.InitVar
609 or type(a_type) is dataclasses.InitVar)
612def _is_type(annotation, cls, a_module, a_type, is_type_predicate):
613 # Given a type annotation string, does it refer to a_type in
614 # a_module? For example, when checking that annotation denotes a
615 # ClassVar, then a_module is typing, and a_type is
616 # typing.ClassVar.
618 # It's possible to look up a_module given a_type, but it involves
619 # looking in sys.modules (again!), and seems like a waste since
620 # the caller already knows a_module.
622 # - annotation is a string type annotation
623 # - cls is the class that this annotation was found in
624 # - a_module is the module we want to match
625 # - a_type is the type in that module we want to match
626 # - is_type_predicate is a function called with (obj, a_module)
627 # that determines if obj is of the desired type.
629 # Since this test does not do a local namespace lookup (and
630 # instead only a module (global) lookup), there are some things it
631 # gets wrong.
633 # With string annotations, cv0 will be detected as a ClassVar:
634 # CV = ClassVar
635 # @dataclass
636 # class C0:
637 # cv0: CV
639 # But in this example cv1 will not be detected as a ClassVar:
640 # @dataclass
641 # class C1:
642 # CV = ClassVar
643 # cv1: CV
645 # In C1, the code in this function (_is_type) will look up "CV" in
646 # the module and not find it, so it will not consider cv1 as a
647 # ClassVar. This is a fairly obscure corner case, and the best
648 # way to fix it would be to eval() the string "CV" with the
649 # correct global and local namespaces. However that would involve
650 # a eval() penalty for every single field of every dataclass
651 # that's defined. It was judged not worth it.
653 match = _MODULE_IDENTIFIER_RE.match(annotation)
654 if match:
655 ns = None
656 module_name = match.group(1)
657 if not module_name:
658 # No module name, assume the class's module did
659 # "from dataclasses import InitVar".
660 ns = sys.modules.get(cls.__module__).__dict__
661 else:
662 # Look up module_name in the class's module.
663 module = sys.modules.get(cls.__module__)
664 if module and module.__dict__.get(module_name) is a_module:
665 ns = sys.modules.get(a_type.__module__).__dict__
666 if ns and is_type_predicate(ns.get(match.group(2)), a_module):
667 return True
668 return False
671def _get_field(cls, a_name, a_type):
672 # Return a Field object for this field name and type. ClassVars
673 # and InitVars are also returned, but marked as such (see
674 # f._field_type).
676 # If the default value isn't derived from Field, then it's only a
677 # normal default value. Convert it to a Field().
678 default = getattr(cls, a_name, MISSING)
679 if isinstance(default, Field):
680 f = default
681 else:
682 if isinstance(default, types.MemberDescriptorType):
683 # This is a field in __slots__, so it has no default value.
684 default = MISSING
685 f = field(default=default)
687 # Only at this point do we know the name and the type. Set them.
688 f.name = a_name
689 f.type = a_type
691 # Assume it's a normal field until proven otherwise. We're next
692 # going to decide if it's a ClassVar or InitVar, everything else
693 # is just a normal field.
694 f._field_type = _FIELD
696 # In addition to checking for actual types here, also check for
697 # string annotations. get_type_hints() won't always work for us
698 # (see https://github.com/python/typing/issues/508 for example),
699 # plus it's expensive and would require an eval for every string
700 # annotation. So, make a best effort to see if this is a ClassVar
701 # or InitVar using regex's and checking that the thing referenced
702 # is actually of the correct type.
704 # For the complete discussion, see https://bugs.python.org/issue33453
706 # If typing has not been imported, then it's impossible for any
707 # annotation to be a ClassVar. So, only look for ClassVar if
708 # typing has been imported by any module (not necessarily cls's
709 # module).
710 typing = sys.modules.get('typing')
711 if typing:
712 if (_is_classvar(a_type, typing)
713 or (isinstance(f.type, str)
714 and _is_type(f.type, cls, typing, typing.ClassVar,
715 _is_classvar))):
716 f._field_type = _FIELD_CLASSVAR
718 # If the type is InitVar, or if it's a matching string annotation,
719 # then it's an InitVar.
720 if f._field_type is _FIELD:
721 # The module we're checking against is the module we're
722 # currently in (dataclasses.py).
723 dataclasses = sys.modules[__name__]
724 if (_is_initvar(a_type, dataclasses)
725 or (isinstance(f.type, str)
726 and _is_type(f.type, cls, dataclasses, dataclasses.InitVar,
727 _is_initvar))):
728 f._field_type = _FIELD_INITVAR
730 # Validations for individual fields. This is delayed until now,
731 # instead of in the Field() constructor, since only here do we
732 # know the field name, which allows for better error reporting.
734 # Special restrictions for ClassVar and InitVar.
735 if f._field_type in (_FIELD_CLASSVAR, _FIELD_INITVAR):
736 if f.default_factory is not MISSING:
737 raise TypeError(f'field {f.name} cannot have a '
738 'default factory')
739 # Should I check for other field settings? default_factory
740 # seems the most serious to check for. Maybe add others. For
741 # example, how about init=False (or really,
742 # init=<not-the-default-init-value>)? It makes no sense for
743 # ClassVar and InitVar to specify init=<anything>.
745 # For real fields, disallow mutable defaults for known types.
746 if f._field_type is _FIELD and isinstance(f.default, (list, dict, set)):
747 raise ValueError(f'mutable default {type(f.default)} for field '
748 f'{f.name} is not allowed: use default_factory')
750 return f
753def _set_new_attribute(cls, name, value):
754 # Never overwrites an existing attribute. Returns True if the
755 # attribute already exists.
756 if name in cls.__dict__:
757 return True
758 setattr(cls, name, value)
759 return False
762# Decide if/how we're going to create a hash function. Key is
763# (unsafe_hash, eq, frozen, does-hash-exist). Value is the action to
764# take. The common case is to do nothing, so instead of providing a
765# function that is a no-op, use None to signify that.
767def _hash_set_none(cls, fields, globals):
768 return None
770def _hash_add(cls, fields, globals):
771 flds = [f for f in fields if (f.compare if f.hash is None else f.hash)]
772 return _hash_fn(flds, globals)
774def _hash_exception(cls, fields, globals):
775 # Raise an exception.
776 raise TypeError(f'Cannot overwrite attribute __hash__ '
777 f'in class {cls.__name__}')
779#
780# +-------------------------------------- unsafe_hash?
781# | +------------------------------- eq?
782# | | +------------------------ frozen?
783# | | | +---------------- has-explicit-hash?
784# | | | |
785# | | | | +------- action
786# | | | | |
787# v v v v v
788_hash_action = {(False, False, False, False): None,
789 (False, False, False, True ): None,
790 (False, False, True, False): None,
791 (False, False, True, True ): None,
792 (False, True, False, False): _hash_set_none,
793 (False, True, False, True ): None,
794 (False, True, True, False): _hash_add,
795 (False, True, True, True ): None,
796 (True, False, False, False): _hash_add,
797 (True, False, False, True ): _hash_exception,
798 (True, False, True, False): _hash_add,
799 (True, False, True, True ): _hash_exception,
800 (True, True, False, False): _hash_add,
801 (True, True, False, True ): _hash_exception,
802 (True, True, True, False): _hash_add,
803 (True, True, True, True ): _hash_exception,
804 }
805# See https://bugs.python.org/issue32929#msg312829 for an if-statement
806# version of this table.
809def _process_class(cls, init, repr, eq, order, unsafe_hash, frozen):
810 # Now that dicts retain insertion order, there's no reason to use
811 # an ordered dict. I am leveraging that ordering here, because
812 # derived class fields overwrite base class fields, but the order
813 # is defined by the base class, which is found first.
814 fields = {}
816 if cls.__module__ in sys.modules:
817 globals = sys.modules[cls.__module__].__dict__
818 else:
819 # Theoretically this can happen if someone writes
820 # a custom string to cls.__module__. In which case
821 # such dataclass won't be fully introspectable
822 # (w.r.t. typing.get_type_hints) but will still function
823 # correctly.
824 globals = {}
826 setattr(cls, _PARAMS, _DataclassParams(init, repr, eq, order,
827 unsafe_hash, frozen))
829 # Find our base classes in reverse MRO order, and exclude
830 # ourselves. In reversed order so that more derived classes
831 # override earlier field definitions in base classes. As long as
832 # we're iterating over them, see if any are frozen.
833 any_frozen_base = False
834 has_dataclass_bases = False
835 for b in cls.__mro__[-1:0:-1]:
836 # Only process classes that have been processed by our
837 # decorator. That is, they have a _FIELDS attribute.
838 base_fields = getattr(b, _FIELDS, None)
839 if base_fields is not None:
840 has_dataclass_bases = True
841 for f in base_fields.values():
842 fields[f.name] = f
843 if getattr(b, _PARAMS).frozen:
844 any_frozen_base = True
846 # Annotations that are defined in this class (not in base
847 # classes). If __annotations__ isn't present, then this class
848 # adds no new annotations. We use this to compute fields that are
849 # added by this class.
850 #
851 # Fields are found from cls_annotations, which is guaranteed to be
852 # ordered. Default values are from class attributes, if a field
853 # has a default. If the default value is a Field(), then it
854 # contains additional info beyond (and possibly including) the
855 # actual default value. Pseudo-fields ClassVars and InitVars are
856 # included, despite the fact that they're not real fields. That's
857 # dealt with later.
858 cls_annotations = cls.__dict__.get('__annotations__', {})
860 # Now find fields in our class. While doing so, validate some
861 # things, and set the default values (as class attributes) where
862 # we can.
863 cls_fields = [_get_field(cls, name, type)
864 for name, type in cls_annotations.items()]
865 for f in cls_fields:
866 fields[f.name] = f
868 # If the class attribute (which is the default value for this
869 # field) exists and is of type 'Field', replace it with the
870 # real default. This is so that normal class introspection
871 # sees a real default value, not a Field.
872 if isinstance(getattr(cls, f.name, None), Field):
873 if f.default is MISSING:
874 # If there's no default, delete the class attribute.
875 # This happens if we specify field(repr=False), for
876 # example (that is, we specified a field object, but
877 # no default value). Also if we're using a default
878 # factory. The class attribute should not be set at
879 # all in the post-processed class.
880 delattr(cls, f.name)
881 else:
882 setattr(cls, f.name, f.default)
884 # Do we have any Field members that don't also have annotations?
885 for name, value in cls.__dict__.items():
886 if isinstance(value, Field) and not name in cls_annotations:
887 raise TypeError(f'{name!r} is a field but has no type annotation')
889 # Check rules that apply if we are derived from any dataclasses.
890 if has_dataclass_bases:
891 # Raise an exception if any of our bases are frozen, but we're not.
892 if any_frozen_base and not frozen:
893 raise TypeError('cannot inherit non-frozen dataclass from a '
894 'frozen one')
896 # Raise an exception if we're frozen, but none of our bases are.
897 if not any_frozen_base and frozen:
898 raise TypeError('cannot inherit frozen dataclass from a '
899 'non-frozen one')
901 # Remember all of the fields on our class (including bases). This
902 # also marks this class as being a dataclass.
903 setattr(cls, _FIELDS, fields)
905 # Was this class defined with an explicit __hash__? Note that if
906 # __eq__ is defined in this class, then python will automatically
907 # set __hash__ to None. This is a heuristic, as it's possible
908 # that such a __hash__ == None was not auto-generated, but it
909 # close enough.
910 class_hash = cls.__dict__.get('__hash__', MISSING)
911 has_explicit_hash = not (class_hash is MISSING or
912 (class_hash is None and '__eq__' in cls.__dict__))
914 # If we're generating ordering methods, we must be generating the
915 # eq methods.
916 if order and not eq:
917 raise ValueError('eq must be true if order is true')
919 if init:
920 # Does this class have a post-init function?
921 has_post_init = hasattr(cls, _POST_INIT_NAME)
923 # Include InitVars and regular fields (so, not ClassVars).
924 flds = [f for f in fields.values()
925 if f._field_type in (_FIELD, _FIELD_INITVAR)]
926 _set_new_attribute(cls, '__init__',
927 _init_fn(flds,
928 frozen,
929 has_post_init,
930 # The name to use for the "self"
931 # param in __init__. Use "self"
932 # if possible.
933 '__dataclass_self__' if 'self' in fields
934 else 'self',
935 globals,
936 ))
938 # Get the fields as a list, and include only real fields. This is
939 # used in all of the following methods.
940 field_list = [f for f in fields.values() if f._field_type is _FIELD]
942 if repr:
943 flds = [f for f in field_list if f.repr]
944 _set_new_attribute(cls, '__repr__', _repr_fn(flds, globals))
946 if eq:
947 # Create _eq__ method. There's no need for a __ne__ method,
948 # since python will call __eq__ and negate it.
949 flds = [f for f in field_list if f.compare]
950 self_tuple = _tuple_str('self', flds)
951 other_tuple = _tuple_str('other', flds)
952 _set_new_attribute(cls, '__eq__',
953 _cmp_fn('__eq__', '==',
954 self_tuple, other_tuple,
955 globals=globals))
957 if order:
958 # Create and set the ordering methods.
959 flds = [f for f in field_list if f.compare]
960 self_tuple = _tuple_str('self', flds)
961 other_tuple = _tuple_str('other', flds)
962 for name, op in [('__lt__', '<'),
963 ('__le__', '<='),
964 ('__gt__', '>'),
965 ('__ge__', '>='),
966 ]:
967 if _set_new_attribute(cls, name,
968 _cmp_fn(name, op, self_tuple, other_tuple,
969 globals=globals)):
970 raise TypeError(f'Cannot overwrite attribute {name} '
971 f'in class {cls.__name__}. Consider using '
972 'functools.total_ordering')
974 if frozen:
975 for fn in _frozen_get_del_attr(cls, field_list, globals):
976 if _set_new_attribute(cls, fn.__name__, fn):
977 raise TypeError(f'Cannot overwrite attribute {fn.__name__} '
978 f'in class {cls.__name__}')
980 # Decide if/how we're going to create a hash function.
981 hash_action = _hash_action[bool(unsafe_hash),
982 bool(eq),
983 bool(frozen),
984 has_explicit_hash]
985 if hash_action:
986 # No need to call _set_new_attribute here, since by the time
987 # we're here the overwriting is unconditional.
988 cls.__hash__ = hash_action(cls, field_list, globals)
990 if not getattr(cls, '__doc__'):
991 # Create a class doc-string.
992 cls.__doc__ = (cls.__name__ +
993 str(inspect.signature(cls)).replace(' -> None', ''))
995 return cls
998def dataclass(cls=None, /, *, init=True, repr=True, eq=True, order=False,
999 unsafe_hash=False, frozen=False):
1000 """Returns the same class as was passed in, with dunder methods
1001 added based on the fields defined in the class.
1003 Examines PEP 526 __annotations__ to determine fields.
1005 If init is true, an __init__() method is added to the class. If
1006 repr is true, a __repr__() method is added. If order is true, rich
1007 comparison dunder methods are added. If unsafe_hash is true, a
1008 __hash__() method function is added. If frozen is true, fields may
1009 not be assigned to after instance creation.
1010 """
1012 def wrap(cls):
1013 return _process_class(cls, init, repr, eq, order, unsafe_hash, frozen)
1015 # See if we're being called as @dataclass or @dataclass().
1016 if cls is None:
1017 # We're called with parens.
1018 return wrap
1020 # We're called as @dataclass without parens.
1021 return wrap(cls)
1024def fields(class_or_instance):
1025 """Return a tuple describing the fields of this dataclass.
1027 Accepts a dataclass or an instance of one. Tuple elements are of
1028 type Field.
1029 """
1031 # Might it be worth caching this, per class?
1032 try:
1033 fields = getattr(class_or_instance, _FIELDS)
1034 except AttributeError:
1035 raise TypeError('must be called with a dataclass type or instance')
1037 # Exclude pseudo-fields. Note that fields is sorted by insertion
1038 # order, so the order of the tuple is as the fields were defined.
1039 return tuple(f for f in fields.values() if f._field_type is _FIELD)
1042def _is_dataclass_instance(obj):
1043 """Returns True if obj is an instance of a dataclass."""
1044 return hasattr(type(obj), _FIELDS)
1047def is_dataclass(obj):
1048 """Returns True if obj is a dataclass or an instance of a
1049 dataclass."""
1050 cls = obj if isinstance(obj, type) else type(obj)
1051 return hasattr(cls, _FIELDS)
1054def asdict(obj, *, dict_factory=dict):
1055 """Return the fields of a dataclass instance as a new dictionary mapping
1056 field names to field values.
1058 Example usage:
1060 @dataclass
1061 class C:
1062 x: int
1063 y: int
1065 c = C(1, 2)
1066 assert asdict(c) == {'x': 1, 'y': 2}
1068 If given, 'dict_factory' will be used instead of built-in dict.
1069 The function applies recursively to field values that are
1070 dataclass instances. This will also look into built-in containers:
1071 tuples, lists, and dicts.
1072 """
1073 if not _is_dataclass_instance(obj):
1074 raise TypeError("asdict() should be called on dataclass instances")
1075 return _asdict_inner(obj, dict_factory)
1078def _asdict_inner(obj, dict_factory):
1079 if _is_dataclass_instance(obj):
1080 result = []
1081 for f in fields(obj):
1082 value = _asdict_inner(getattr(obj, f.name), dict_factory)
1083 result.append((f.name, value))
1084 return dict_factory(result)
1085 elif isinstance(obj, tuple) and hasattr(obj, '_fields'):
1086 # obj is a namedtuple. Recurse into it, but the returned
1087 # object is another namedtuple of the same type. This is
1088 # similar to how other list- or tuple-derived classes are
1089 # treated (see below), but we just need to create them
1090 # differently because a namedtuple's __init__ needs to be
1091 # called differently (see bpo-34363).
1093 # I'm not using namedtuple's _asdict()
1094 # method, because:
1095 # - it does not recurse in to the namedtuple fields and
1096 # convert them to dicts (using dict_factory).
1097 # - I don't actually want to return a dict here. The main
1098 # use case here is json.dumps, and it handles converting
1099 # namedtuples to lists. Admittedly we're losing some
1100 # information here when we produce a json list instead of a
1101 # dict. Note that if we returned dicts here instead of
1102 # namedtuples, we could no longer call asdict() on a data
1103 # structure where a namedtuple was used as a dict key.
1105 return type(obj)(*[_asdict_inner(v, dict_factory) for v in obj])
1106 elif isinstance(obj, (list, tuple)):
1107 # Assume we can create an object of this type by passing in a
1108 # generator (which is not true for namedtuples, handled
1109 # above).
1110 return type(obj)(_asdict_inner(v, dict_factory) for v in obj)
1111 elif isinstance(obj, dict):
1112 return type(obj)((_asdict_inner(k, dict_factory),
1113 _asdict_inner(v, dict_factory))
1114 for k, v in obj.items())
1115 else:
1116 return copy.deepcopy(obj)
1119def astuple(obj, *, tuple_factory=tuple):
1120 """Return the fields of a dataclass instance as a new tuple of field values.
1122 Example usage::
1124 @dataclass
1125 class C:
1126 x: int
1127 y: int
1129 c = C(1, 2)
1130 assert astuple(c) == (1, 2)
1132 If given, 'tuple_factory' will be used instead of built-in tuple.
1133 The function applies recursively to field values that are
1134 dataclass instances. This will also look into built-in containers:
1135 tuples, lists, and dicts.
1136 """
1138 if not _is_dataclass_instance(obj):
1139 raise TypeError("astuple() should be called on dataclass instances")
1140 return _astuple_inner(obj, tuple_factory)
1143def _astuple_inner(obj, tuple_factory):
1144 if _is_dataclass_instance(obj):
1145 result = []
1146 for f in fields(obj):
1147 value = _astuple_inner(getattr(obj, f.name), tuple_factory)
1148 result.append(value)
1149 return tuple_factory(result)
1150 elif isinstance(obj, tuple) and hasattr(obj, '_fields'):
1151 # obj is a namedtuple. Recurse into it, but the returned
1152 # object is another namedtuple of the same type. This is
1153 # similar to how other list- or tuple-derived classes are
1154 # treated (see below), but we just need to create them
1155 # differently because a namedtuple's __init__ needs to be
1156 # called differently (see bpo-34363).
1157 return type(obj)(*[_astuple_inner(v, tuple_factory) for v in obj])
1158 elif isinstance(obj, (list, tuple)):
1159 # Assume we can create an object of this type by passing in a
1160 # generator (which is not true for namedtuples, handled
1161 # above).
1162 return type(obj)(_astuple_inner(v, tuple_factory) for v in obj)
1163 elif isinstance(obj, dict):
1164 return type(obj)((_astuple_inner(k, tuple_factory), _astuple_inner(v, tuple_factory))
1165 for k, v in obj.items())
1166 else:
1167 return copy.deepcopy(obj)
1170def make_dataclass(cls_name, fields, *, bases=(), namespace=None, init=True,
1171 repr=True, eq=True, order=False, unsafe_hash=False,
1172 frozen=False):
1173 """Return a new dynamically created dataclass.
1175 The dataclass name will be 'cls_name'. 'fields' is an iterable
1176 of either (name), (name, type) or (name, type, Field) objects. If type is
1177 omitted, use the string 'typing.Any'. Field objects are created by
1178 the equivalent of calling 'field(name, type [, Field-info])'.
1180 C = make_dataclass('C', ['x', ('y', int), ('z', int, field(init=False))], bases=(Base,))
1182 is equivalent to:
1184 @dataclass
1185 class C(Base):
1186 x: 'typing.Any'
1187 y: int
1188 z: int = field(init=False)
1190 For the bases and namespace parameters, see the builtin type() function.
1192 The parameters init, repr, eq, order, unsafe_hash, and frozen are passed to
1193 dataclass().
1194 """
1196 if namespace is None:
1197 namespace = {}
1198 else:
1199 # Copy namespace since we're going to mutate it.
1200 namespace = namespace.copy()
1202 # While we're looking through the field names, validate that they
1203 # are identifiers, are not keywords, and not duplicates.
1204 seen = set()
1205 anns = {}
1206 for item in fields:
1207 if isinstance(item, str):
1208 name = item
1209 tp = 'typing.Any'
1210 elif len(item) == 2:
1211 name, tp, = item
1212 elif len(item) == 3:
1213 name, tp, spec = item
1214 namespace[name] = spec
1215 else:
1216 raise TypeError(f'Invalid field: {item!r}')
1218 if not isinstance(name, str) or not name.isidentifier():
1219 raise TypeError(f'Field names must be valid identifiers: {name!r}')
1220 if keyword.iskeyword(name):
1221 raise TypeError(f'Field names must not be keywords: {name!r}')
1222 if name in seen:
1223 raise TypeError(f'Field name duplicated: {name!r}')
1225 seen.add(name)
1226 anns[name] = tp
1228 namespace['__annotations__'] = anns
1229 # We use `types.new_class()` instead of simply `type()` to allow dynamic creation
1230 # of generic dataclassses.
1231 cls = types.new_class(cls_name, bases, {}, lambda ns: ns.update(namespace))
1232 return dataclass(cls, init=init, repr=repr, eq=eq, order=order,
1233 unsafe_hash=unsafe_hash, frozen=frozen)
1236def replace(obj, /, **changes):
1237 """Return a new object replacing specified fields with new values.
1239 This is especially useful for frozen classes. Example usage:
1241 @dataclass(frozen=True)
1242 class C:
1243 x: int
1244 y: int
1246 c = C(1, 2)
1247 c1 = replace(c, x=3)
1248 assert c1.x == 3 and c1.y == 2
1249 """
1251 # We're going to mutate 'changes', but that's okay because it's a
1252 # new dict, even if called with 'replace(obj, **my_changes)'.
1254 if not _is_dataclass_instance(obj):
1255 raise TypeError("replace() should be called on dataclass instances")
1257 # It's an error to have init=False fields in 'changes'.
1258 # If a field is not in 'changes', read its value from the provided obj.
1260 for f in getattr(obj, _FIELDS).values():
1261 # Only consider normal fields or InitVars.
1262 if f._field_type is _FIELD_CLASSVAR:
1263 continue
1265 if not f.init:
1266 # Error if this field is specified in changes.
1267 if f.name in changes:
1268 raise ValueError(f'field {f.name} is declared with '
1269 'init=False, it cannot be specified with '
1270 'replace()')
1271 continue
1273 if f.name not in changes:
1274 if f._field_type is _FIELD_INITVAR and f.default is MISSING:
1275 raise ValueError(f"InitVar {f.name!r} "
1276 'must be specified with replace()')
1277 changes[f.name] = getattr(obj, f.name)
1279 # Create the new object, which calls __init__() and
1280 # __post_init__() (if defined), using all of the init fields we've
1281 # added and/or left in 'changes'. If there are values supplied in
1282 # changes that aren't fields, this will correctly raise a
1283 # TypeError.
1284 return obj.__class__(**changes)