mypy/typestate.py - third_party/github.com/python/mypy - Git at Google

 """
 A shared state for all TypeInfos that holds global cache and dependency information,
 and potentially other mutable TypeInfo state. This module contains mutable global state.
 """

 from typing import Dict, Set, Tuple, Optional, List
 from typing_extensions import ClassVar, Final, TypeAlias as _TypeAlias

 from mypy.nodes import TypeInfo
 from mypy.types import Instance, TypeAliasType, get_proper_type, Type
 from mypy.server.trigger import make_trigger

 # A (left, right) pair recording that the 'left' instance is a subtype of the 'right' instance.
 SubtypeRelationship: _TypeAlias = Tuple[Instance, Instance]

 # A tuple of flags encoding the specific conditions under which we performed the subtype
 # check (e.g. did we want a proper subtype? A regular subtype while ignoring variance?).
 # It serves as the inner dictionary key of SubtypeCache below.
 SubtypeKind: _TypeAlias = Tuple[bool, ...]

 # A cache that maps a TypeInfo to, for every kind of subtype check, the set of
 # subtype relationships recorded for that TypeInfo.
 SubtypeCache: _TypeAlias = Dict[TypeInfo, Dict[SubtypeKind, Set[SubtypeRelationship]]]


 class TypeState:
     """Global holder of subtype caches and fine grained protocol dependencies.

     Subtype check results are cached here to make repeated checks cheaper, and the
     protocol dependencies used in fine grained mode are stored here as well.

     Note: the subtype caches are purely a performance optimisation, so clearing them for
     a class has no semantic effect. To avoid leaking global state, call
     'reset_all_subtype_caches()' once a build has finished and after a daemon shutdown.
     Protocol dependencies, in contrast, are stored nowhere else and should only be
     dropped when they are no longer needed (e.g. during daemon shutdown).
     """
     # Maps a supertype's TypeInfo to the (subtype, supertype) instance pairs recorded
     # for it. The pairs are grouped by the *kind* of subtyping relationship, an arbitrary
     # hashable tuple that also reflects whether the check was done in strict optional mode.
     # These caches exist because subtype checks for structural types are very slow.
     _subtype_caches: Final[SubtypeCache] = {}

     # Protocol dependencies produced by a full build or by an update. They get special
     # treatment for two reasons:
     #   * They are a global property of the program; i.e. some dependencies for imported
     #     classes can be generated in the importing modules.
     #   * As a consequence, they are serialized separately, after a full run,
     #     or a full update.
     # The value is None when deserialization failed or produced data inconsistent with
     # the other cache files. A blocking error is generated in that case, since we can't
     # proceed safely. The kinds of protocol dependencies, with examples, are described
     # in _snapshot_protocol_deps.
     proto_deps: ClassVar[Optional[Dict[str, Set[str]]]] = {}

     # Full names of the protocols that a given class attempted to implement.
     # This drives the calculation of fine grained protocol dependencies and narrows
     # protocol subtype cache invalidation in fine grained mode. For instance, passing a
     # value of type a.A to a function expecting something compatible with protocol p.P
     # yields 'a.A' -> {'p.P', ...}. The map is flushed after every incremental update.
     _attempted_protocols: Final[Dict[str, Set[str]]] = {}
     # Members of the protocols above, snapshotted per class. For instance, passing a value
     # of type a.A to a function expecting something compatible with Iterable yields
     # 'a.A' -> {'__iter__', ...}. This map is flushed after every incremental update too.
     # It lets us generate precise dependencies such as <a.A.__iter__> -> <a.A> rather than
     # a wildcard, which would invalidate classes unnecessarily.
     _checked_against_members: Final[Dict[str, Set[str]]] = {}
     # TypeInfos seen as the left type (subtype) of a subtype check since the latest
     # dependency snapshot update. This is an optimisation for fine grained mode: a full
     # run takes a single snapshot at the very end, so the set then holds every
     # subtype-checked TypeInfo, whereas after a fine grained update we only need the new
     # dependencies from the (typically) few TypeInfos that were subtype-checked
     # (i.e. appeared as r.h.s. in an assignment or an argument in a function call in
     # a re-checked target) during the update.
     _rechecked_types: Final[Set[TypeInfo]] = set()

     # Assumption stacks for subtyping relationships between recursive type aliases.
     # Passing the assumptions as an extra argument to is_subtype() would be the normal
     # approach, but it would require updating dozens of related functions to thread it
     # through all callsites (see also comment for TypeInfo.assuming).
     _assuming: Final[List[Tuple[TypeAliasType, TypeAliasType]]] = []
     _assuming_proper: Final[List[Tuple[TypeAliasType, TypeAliasType]]] = []
     # Same idea, for inference of generic constraints against recursive type aliases.
     _inferring: Final[List[TypeAliasType]] = []

     # N.B: Every method below is a staticmethod that reaches these attributes through
     # TypeState directly (rather than a classmethod going through cls), since mypyc can
     # optimize accesses to Final attributes of a directly referenced type.

     @staticmethod
     def is_assumed_subtype(left: Type, right: Type) -> bool:
         """Tell whether (left, right) matches an entry of the subtype assumption stack.

         The stack is scanned from its most recent entry; both sides are compared after
         being passed through get_proper_type().
         """
         for assumed_left, assumed_right in reversed(TypeState._assuming):
             if get_proper_type(assumed_left) == get_proper_type(left):
                 if get_proper_type(assumed_right) == get_proper_type(right):
                     return True
         return False

     @staticmethod
     def is_assumed_proper_subtype(left: Type, right: Type) -> bool:
         """Tell whether (left, right) matches an entry of the proper subtype assumption stack.

         The stack is scanned from its most recent entry; both sides are compared after
         being passed through get_proper_type().
         """
         for assumed_left, assumed_right in reversed(TypeState._assuming_proper):
             if get_proper_type(assumed_left) == get_proper_type(left):
                 if get_proper_type(assumed_right) == get_proper_type(right):
                     return True
         return False

     @staticmethod
     def reset_all_subtype_caches() -> None:
         """Drop every subtype cache entry, for all TypeInfos."""
         TypeState._subtype_caches.clear()

     @staticmethod
     def reset_subtype_caches_for(info: TypeInfo) -> None:
         """Empty the subtype caches of the supertype TypeInfo 'info', if it has any."""
         per_kind = TypeState._subtype_caches.get(info)
         if per_kind is not None:
             per_kind.clear()

     @staticmethod
     def reset_all_subtype_caches_for(info: TypeInfo) -> None:
         """Empty the subtype caches of 'info' and of every TypeInfo in its MRO."""
         for ancestor in info.mro:
             TypeState.reset_subtype_caches_for(ancestor)

     @staticmethod
     def is_cached_subtype_check(kind: SubtypeKind, left: Instance, right: Instance) -> bool:
         """Tell whether (left, right) was recorded for the given kind of subtype check."""
         if not (left.last_known_value is None and right.last_known_value is None):
             # Instances carrying a literal last known value are never looked up: the
             # number of potential types to cache is unbounded, which makes caching
             # less effective.
             return False
         per_kind = TypeState._subtype_caches.get(right.type)
         if per_kind is None:
             return False
         recorded = per_kind.get(kind)
         return recorded is not None and (left, right) in recorded

     @staticmethod
     def record_subtype_cache_entry(kind: SubtypeKind,
                                    left: Instance, right: Instance) -> None:
         """Record (left, right) for the given kind of check, keyed by the type of 'right'."""
         # Instances with a literal last known value are skipped: given the large space
         # of possible values they are unlikely to match, and would only grow the cache.
         if left.last_known_value is None and right.last_known_value is None:
             per_kind = TypeState._subtype_caches.setdefault(right.type, {})
             per_kind.setdefault(kind, set()).add((left, right))

     @staticmethod
     def reset_protocol_deps() -> None:
         """Forget all protocol dependencies (after a full run or before a daemon shutdown)."""
         TypeState._rechecked_types.clear()
         TypeState._checked_against_members.clear()
         TypeState._attempted_protocols.clear()
         TypeState.proto_deps = {}

     @staticmethod
     def record_protocol_subtype_check(left_type: TypeInfo, right_type: TypeInfo) -> None:
         """Register that 'left_type' was checked against the protocol 'right_type'.

         The protocol's full name and its members are stored under the full name of
         'left_type', and 'left_type' is marked as re-checked.
         """
         assert right_type.is_protocol
         checked_name = left_type.fullname
         TypeState._rechecked_types.add(left_type)
         attempted = TypeState._attempted_protocols.setdefault(checked_name, set())
         attempted.add(right_type.fullname)
         members = TypeState._checked_against_members.setdefault(checked_name, set())
         members.update(right_type.protocol_members)

     @staticmethod
     def _snapshot_protocol_deps() -> Dict[str, Set[str]]:
         """Build protocol attribute dependencies from the subtype checks registered so far.

         Protocol dependencies come in three kinds. For example, after a subtype check:

             x: Proto = C()

         these dependencies will be generated:
             1. ..., <SuperProto[wildcard]>, <Proto[wildcard]> -> <Proto>
             2. ..., <B.attr>, <C.attr> -> <C> [for every attr in Proto members]
             3. <C> -> Proto  # this one to invalidate the subtype cache

         Kind 1 is generated immediately per-module in deps.py (which also has an example
         motivating it). Kinds 2 and 3 are generated here, once all modules are type
         checked and all the subtype checks have been recorded. To see what they are for,
         consider a simple example:

             class A:
                 def __iter__(self) -> Iterator[int]:
                     ...

             it: Iterable[int] = A()

         <a.A.__iter__> -> <a.A> is added so that the assignment (module target in this
         case) is invalidated whenever the signature of a.A.__iter__ changes, and
         <a.A> -> typing.Iterable is added so that the subtype caches of the latter are
         invalidated. (The same logic applies to proper subtype checks, and to calculating
         meets and joins, if this involves calling 'subtypes.is_protocol_implementation'.)
         """
         snapshot: Dict[str, Set[str]] = {}
         for checked in TypeState._rechecked_types:
             for member in TypeState._checked_against_members[checked.fullname]:
                 # Going over the MRO (all entries but the last) is needed for a subtle
                 # reason: during an update, base classes of a concrete class may not be
                 # reprocessed, so not all <B.x> -> <C.x> deps are added.
                 for base in checked.mro[:-1]:
                     member_trigger = make_trigger('%s.%s' % (base.fullname, member))
                     # TODO: avoid everything from typeshed
                     if 'typing' not in member_trigger and 'builtins' not in member_trigger:
                         snapshot.setdefault(member_trigger, set()).add(
                             make_trigger(checked.fullname))
             for protocol_name in TypeState._attempted_protocols[checked.fullname]:
                 class_trigger = make_trigger(checked.fullname)
                 if 'typing' not in class_trigger and 'builtins' not in class_trigger:
                     # A change to any class that was checked against a protocol must
                     # reset the subtype cache for that protocol.
                     #
                     # Note: strictly speaking, the protocol doesn't need to be
                     # re-checked, we only need to reset the cache, and its uses
                     # elsewhere are still valid (unless invalidated by other deps).
                     snapshot.setdefault(class_trigger, set()).add(protocol_name)
         return snapshot

     @staticmethod
     def update_protocol_deps(second_map: Optional[Dict[str, Set[str]]] = None) -> None:
         """Merge freshly collected protocol dependencies into the global map.

         The global map is updated incrementally, from a snapshot that only covers
         recently type checked types. When second_map is given it receives the same
         additions; this is currently used by FineGrainedBuildManager that maintains
         normal (non-protocol) dependencies. The per-update bookkeeping is cleared
         afterwards.
         """
         global_deps = TypeState.proto_deps
         assert global_deps is not None, (
             "This should not be called after failed cache load")
         fresh = TypeState._snapshot_protocol_deps()
         for trigger, targets in fresh.items():
             global_deps.setdefault(trigger, set()).update(targets)
             if second_map is not None:
                 second_map.setdefault(trigger, set()).update(targets)
         TypeState._checked_against_members.clear()
         TypeState._attempted_protocols.clear()
         TypeState._rechecked_types.clear()

     @staticmethod
     def add_all_protocol_deps(deps: Dict[str, Set[str]]) -> None:
         """Merge every known protocol dependency into 'deps'.

         Used by tests and debug output, and also when gathering all collected or
         loaded dependencies as part of build.
         """
         TypeState.update_protocol_deps()  # just in case
         known = TypeState.proto_deps
         if known is None:
             return
         for trigger, targets in known.items():
             deps.setdefault(trigger, set()).update(targets)


 def reset_global_state() -> None:
     """Clear most of the existing global state.

     The bulk of that state currently lives in this module; the few exceptions are the
     strict optional status and functools.lru_cache.
     """
     TypeState.reset_protocol_deps()
     TypeState.reset_all_subtype_caches()
	"""
	A shared state for all TypeInfos that holds global cache and dependency information,
	and potentially other mutable TypeInfo state. This module contains mutable global state.
	"""

	from typing import Dict, Set, Tuple, Optional, List
	from typing_extensions import ClassVar, Final, TypeAlias as _TypeAlias

	from mypy.nodes import TypeInfo
	from mypy.types import Instance, TypeAliasType, get_proper_type, Type
	from mypy.server.trigger import make_trigger

	# A (left, right) pair recording that the 'left' instance is a subtype of the 'right' instance.
	SubtypeRelationship: _TypeAlias = Tuple[Instance, Instance]

	# A tuple of flags encoding the specific conditions under which we performed the subtype
	# check (e.g. did we want a proper subtype? A regular subtype while ignoring variance?).
	# It serves as the inner dictionary key of SubtypeCache below.
	SubtypeKind: _TypeAlias = Tuple[bool, ...]

	# A cache that maps a TypeInfo to, for every kind of subtype check, the set of
	# subtype relationships recorded for that TypeInfo.
	SubtypeCache: _TypeAlias = Dict[TypeInfo, Dict[SubtypeKind, Set[SubtypeRelationship]]]


	class TypeState:
	    """This class provides subtype caching to improve performance of subtype checks.
	    It also holds protocol fine grained dependencies.

	    Note: to avoid leaking global state, 'reset_all_subtype_caches()' should be called
	    after a build has finished and after a daemon shutdown. This subtype cache only exists for
	    performance reasons, resetting subtype caches for a class has no semantic effect.
	    The protocol dependencies however are only stored here, and shouldn't be deleted unless
	    not needed any more (e.g. during daemon shutdown).
	    """
	    # '_subtype_caches' keeps track of (subtype, supertype) pairs where supertypes are
	    # instances of the given TypeInfo. The cache also keeps track of whether the check
	    # was done in strict optional mode and of the specific kind of subtyping relationship,
	    # which we represent as an arbitrary hashable tuple.
	    # We need the caches, since subtype checks for structural types are very slow.
	    _subtype_caches: Final[SubtypeCache] = {}

	    # This contains protocol dependencies generated after running a full build,
	    # or after an update. These dependencies are special because:
	    #   * They are a global property of the program; i.e. some dependencies for imported
	    #     classes can be generated in the importing modules.
	    #   * Because of the above, they are serialized separately, after a full run,
	    #     or a full update.
	    # `proto_deps` can be None if after deserialization it turns out that they are
	    # inconsistent with the other cache files (or an error occurred during deserialization).
	    # A blocking error will be generated in this case, since we can't proceed safely.
	    # For the description of kinds of protocol dependencies and corresponding examples,
	    # see _snapshot_protocol_deps.
	    proto_deps: ClassVar[Optional[Dict[str, Set[str]]]] = {}

	    # Protocols (full names) a given class attempted to implement.
	    # Used to calculate fine grained protocol dependencies and optimize protocol
	    # subtype cache invalidation in fine grained mode. For example, if we pass a value
	    # of type a.A to a function expecting something compatible with protocol p.P,
	    # we'd have 'a.A' -> {'p.P', ...} in the map. This map is flushed after every incremental
	    # update.
	    _attempted_protocols: Final[Dict[str, Set[str]]] = {}
	    # We also snapshot protocol members of the above protocols. For example, if we pass
	    # a value of type a.A to a function expecting something compatible with Iterable, we'd have
	    # 'a.A' -> {'__iter__', ...} in the map. This map is also flushed after every incremental
	    # update. This map is needed to only generate dependencies like <a.A.__iter__> -> <a.A>
	    # instead of a wildcard to avoid unnecessarily invalidating classes.
	    _checked_against_members: Final[Dict[str, Set[str]]] = {}
	    # TypeInfos that appeared as a left type (subtype) in a subtype check since latest
	    # dependency snapshot update. This is an optimisation for fine grained mode; during a full
	    # run we only take a dependency snapshot at the very end, so this set will contain all
	    # subtype-checked TypeInfos. After a fine grained update however, we can gather only new
	    # dependencies generated from (typically) few TypeInfos that were subtype-checked
	    # (i.e. appeared as r.h.s. in an assignment or an argument in a function call in
	    # a re-checked target) during the update.
	    _rechecked_types: Final[Set[TypeInfo]] = set()

	    # The two attributes below are assumption stacks for subtyping relationships between
	    # recursive type aliases. Normally, one would pass type assumptions as an additional
	    # arguments to is_subtype(), but this would mean updating dozens of related functions
	    # threading this through all callsites (see also comment for TypeInfo.assuming).
	    _assuming: Final[List[Tuple[TypeAliasType, TypeAliasType]]] = []
	    _assuming_proper: Final[List[Tuple[TypeAliasType, TypeAliasType]]] = []
	    # Ditto for inference of generic constraints against recursive type aliases.
	    _inferring: Final[List[TypeAliasType]] = []

	    # N.B: We do all of the accesses to these properties through
	    # TypeState, instead of making these classmethods and accessing
	    # via the cls parameter, since mypyc can optimize accesses to
	    # Final attributes of a directly referenced type.

	    @staticmethod
	    def is_assumed_subtype(left: Type, right: Type) -> bool:
	        """Return True if (left, right) matches an entry of the '_assuming' stack.

	        Entries are visited from the most recently pushed one, and both sides are
	        compared after calling get_proper_type() on them.
	        """
	        for (l, r) in reversed(TypeState._assuming):
	            if (get_proper_type(l) == get_proper_type(left)
	                    and get_proper_type(r) == get_proper_type(right)):
	                return True
	        return False

	    @staticmethod
	    def is_assumed_proper_subtype(left: Type, right: Type) -> bool:
	        """Return True if (left, right) matches an entry of the '_assuming_proper' stack.

	        Entries are visited from the most recently pushed one, and both sides are
	        compared after calling get_proper_type() on them.
	        """
	        for (l, r) in reversed(TypeState._assuming_proper):
	            if (get_proper_type(l) == get_proper_type(left)
	                    and get_proper_type(r) == get_proper_type(right)):
	                return True
	        return False

	    @staticmethod
	    def reset_all_subtype_caches() -> None:
	        """Completely reset all known subtype caches."""
	        TypeState._subtype_caches.clear()

	    @staticmethod
	    def reset_subtype_caches_for(info: TypeInfo) -> None:
	        """Reset subtype caches (if any) for a given supertype TypeInfo."""
	        if info in TypeState._subtype_caches:
	            TypeState._subtype_caches[info].clear()

	    @staticmethod
	    def reset_all_subtype_caches_for(info: TypeInfo) -> None:
	        """Reset subtype caches (if any) for a given supertype TypeInfo and its MRO."""
	        for item in info.mro:
	            TypeState.reset_subtype_caches_for(item)

	    @staticmethod
	    def is_cached_subtype_check(kind: SubtypeKind, left: Instance, right: Instance) -> bool:
	        """Return True if (left, right) was recorded for the given kind of subtype check."""
	        if left.last_known_value is not None or right.last_known_value is not None:
	            # If there is a literal last known value, give up. There
	            # will be an unbounded number of potential types to cache,
	            # making caching less effective.
	            return False
	        info = right.type
	        cache = TypeState._subtype_caches.get(info)
	        if cache is None:
	            return False
	        subcache = cache.get(kind)
	        if subcache is None:
	            return False
	        return (left, right) in subcache

	    @staticmethod
	    def record_subtype_cache_entry(kind: SubtypeKind,
	                                   left: Instance, right: Instance) -> None:
	        """Record (left, right) for the given kind of check, keyed by the type of 'right'."""
	        if left.last_known_value is not None or right.last_known_value is not None:
	            # These are unlikely to match, due to the large space of
	            # possible values.  Avoid uselessly increasing cache sizes.
	            return
	        cache = TypeState._subtype_caches.setdefault(right.type, dict())
	        cache.setdefault(kind, set()).add((left, right))

	    @staticmethod
	    def reset_protocol_deps() -> None:
	        """Reset dependencies after a full run or before a daemon shutdown."""
	        TypeState.proto_deps = {}
	        TypeState._attempted_protocols.clear()
	        TypeState._checked_against_members.clear()
	        TypeState._rechecked_types.clear()

	    @staticmethod
	    def record_protocol_subtype_check(left_type: TypeInfo, right_type: TypeInfo) -> None:
	        """Record that 'left_type' was checked against the protocol 'right_type'.

	        The protocol's full name and members are stored under the full name of
	        'left_type', and 'left_type' is added to the set of re-checked types.
	        """
	        assert right_type.is_protocol
	        TypeState._rechecked_types.add(left_type)
	        TypeState._attempted_protocols.setdefault(
	            left_type.fullname, set()).add(right_type.fullname)
	        TypeState._checked_against_members.setdefault(
	            left_type.fullname,
	            set()).update(right_type.protocol_members)

	    @staticmethod
	    def _snapshot_protocol_deps() -> Dict[str, Set[str]]:
	        """Collect protocol attribute dependencies found so far from registered subtype checks.

	        There are three kinds of protocol dependencies. For example, after a subtype check:

	            x: Proto = C()

	        the following dependencies will be generated:
	            1. ..., <SuperProto[wildcard]>, <Proto[wildcard]> -> <Proto>
	            2. ..., <B.attr>, <C.attr> -> <C> [for every attr in Proto members]
	            3. <C> -> Proto  # this one to invalidate the subtype cache

	        The first kind is generated immediately per-module in deps.py (see also an example there
	        for motivation why it is needed). While two other kinds are generated here after all
	        modules are type checked and we have recorded all the subtype checks. To understand these
	        two kinds, consider a simple example:

	            class A:
	                def __iter__(self) -> Iterator[int]:
	                    ...

	            it: Iterable[int] = A()

	        We add <a.A.__iter__> -> <a.A> to invalidate the assignment (module target in this case),
	        whenever the signature of a.A.__iter__ changes. We also add <a.A> -> typing.Iterable,
	        to invalidate the subtype caches of the latter. (Note that the same logic applies to
	        proper subtype checks, and calculating meets and joins, if this involves calling
	        'subtypes.is_protocol_implementation').
	        """
	        deps: Dict[str, Set[str]] = {}
	        for info in TypeState._rechecked_types:
	            for attr in TypeState._checked_against_members[info.fullname]:
	                # The need for full MRO here is subtle, during an update, base classes of
	                # a concrete class may not be reprocessed, so not all <B.x> -> <C.x> deps
	                # are added.
	                for base_info in info.mro[:-1]:
	                    trigger = make_trigger('%s.%s' % (base_info.fullname, attr))
	                    if 'typing' in trigger or 'builtins' in trigger:
	                        # TODO: avoid everything from typeshed
	                        continue
	                    deps.setdefault(trigger, set()).add(make_trigger(info.fullname))
	            for proto in TypeState._attempted_protocols[info.fullname]:
	                trigger = make_trigger(info.fullname)
	                if 'typing' in trigger or 'builtins' in trigger:
	                    continue
	                # If any class that was checked against a protocol changes,
	                # we need to reset the subtype cache for the protocol.
	                #
	                # Note: strictly speaking, the protocol doesn't need to be
	                # re-checked, we only need to reset the cache, and its uses
	                # elsewhere are still valid (unless invalidated by other deps).
	                deps.setdefault(trigger, set()).add(proto)
	        return deps

	    @staticmethod
	    def update_protocol_deps(second_map: Optional[Dict[str, Set[str]]] = None) -> None:
	        """Update global protocol dependency map.

	        We update the global map incrementally, using a snapshot only from recently
	        type checked types. If second_map is given, update it as well. This is currently used
	        by FineGrainedBuildManager that maintains normal (non-protocol) dependencies.
	        """
	        assert TypeState.proto_deps is not None, (
	            "This should not be called after failed cache load")
	        new_deps = TypeState._snapshot_protocol_deps()
	        for trigger, targets in new_deps.items():
	            TypeState.proto_deps.setdefault(trigger, set()).update(targets)
	        if second_map is not None:
	            for trigger, targets in new_deps.items():
	                second_map.setdefault(trigger, set()).update(targets)
	        # The snapshot has been merged, so the per-update bookkeeping can be dropped.
	        TypeState._rechecked_types.clear()
	        TypeState._attempted_protocols.clear()
	        TypeState._checked_against_members.clear()

	    @staticmethod
	    def add_all_protocol_deps(deps: Dict[str, Set[str]]) -> None:
	        """Add all known protocol dependencies to deps.

	        This is used by tests and debug output, and also when collecting
	        all collected or loaded dependencies as part of build.
	        """
	        TypeState.update_protocol_deps()  # just in case
	        if TypeState.proto_deps is not None:
	            for trigger, targets in TypeState.proto_deps.items():
	                deps.setdefault(trigger, set()).update(targets)


	def reset_global_state() -> None:
	    """Reset most existing global state.

	    Currently most of it is in this module. Few exceptions are strict optional status
	    and functools.lru_cache.
	    """
	    TypeState.reset_all_subtype_caches()
	    TypeState.reset_protocol_deps()