| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702
70370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193119411951196119711981199120012011202120312041205120612071208120912101211121212131214121512161217121812191220122112221223122412251226122712281229123012311232123312341235123612371238123912401241124212431244124512461247124812491250125112521253125412551256125712581259126012611262126312641265126612671268126912701271127212731274127512761
277127812791280128112821283128412851286128712881289129012911292129312941295 |
- """
- This module provides Source classes that track the origins of values in PyTorch Dynamo.
- Sources represent where values come from (e.g. local variables, globals, attributes) and
- are used for guard generation and code reconstruction during compilation.
- The module includes specialized sources for:
- - Local variables and synthetic locals
- - Global variables and constants
- - Object attributes and method calls
- - NN module specialization (specialized vs unspecialized)
- - Random values and tensor properties
- - Default argument handling
- - FSDP (Fully Sharded Data Parallel) modules
- Sources play a key role in Dynamo's guard system by tracking value origins for
- guard generation, and in code reconstruction by providing methods to rebuild
- the code needed to recreate values.
- """
- import dataclasses
- import enum
- import functools
- from collections.abc import Callable
- from typing import Any, Optional, TYPE_CHECKING, Union
- from torch import device as device_type
- from torch._guards import (
- ChainedSource,
- dataclass_with_cached_hash,
- Guard,
- GuardSource,
- Source,
- )
- from . import utils
- from .bytecode_transformation import (
- create_binary_subscr,
- create_build_tuple,
- create_call_function,
- )
- if TYPE_CHECKING:
- from .codegen import PyCodegen
- # It shouldn't be supported to construct an NNModuleVariable inside an FSDP module,
- # so those cases are omitted intentionally
- # represents nn.Modules tracked with NNModuleVariable (specialized is implicit in the variable name)
# Lookup table: guard source of the base -> guard source to report for a
# value tracked as a specialized nn.Module.
_GUARD_SOURCE_SPECIALIZED_NN_MODULE: dict[GuardSource, GuardSource] = {
    # Plain locals / globals are promoted to their specialized variants.
    GuardSource.LOCAL: GuardSource.LOCAL_SPECIALIZED_NN_MODULE,
    GuardSource.GLOBAL: GuardSource.GLOBAL_SPECIALIZED_NN_MODULE,
    # Already-specialized sources stay as they are.
    **{
        kind: kind
        for kind in (
            GuardSource.LOCAL_SPECIALIZED_NN_MODULE,
            GuardSource.GLOBAL_SPECIALIZED_NN_MODULE,
        )
    },
    # Just to ensure that guard_source() works: these kinds map to themselves.
    **{
        kind: kind
        for kind in (
            GuardSource.LOCAL_UNSPECIALIZED_NN_MODULE,
            GuardSource.GLOBAL_UNSPECIALIZED_NN_MODULE,
            GuardSource.LOCAL_UNSPECIALIZED_BUILTIN_NN_MODULE,
            GuardSource.GLOBAL_UNSPECIALIZED_BUILTIN_NN_MODULE,
            GuardSource.LOCAL_FSDP_MODULE,
            GuardSource.GLOBAL_FSDP_MODULE,
        )
    },
}
- # represents nn.Modules tracked with UnspecializedNNModuleVariable
# Lookup table: guard source of the base -> guard source to report for a
# value tracked as an unspecialized nn.Module.
_GUARD_SOURCE_UNSPECIALIZED_NN_MODULE: dict[GuardSource, GuardSource] = {
    # Plain locals / globals are promoted to their unspecialized variants.
    GuardSource.LOCAL: GuardSource.LOCAL_UNSPECIALIZED_NN_MODULE,
    GuardSource.GLOBAL: GuardSource.GLOBAL_UNSPECIALIZED_NN_MODULE,
    # Already-unspecialized sources stay as they are.
    **{
        kind: kind
        for kind in (
            GuardSource.LOCAL_UNSPECIALIZED_NN_MODULE,
            GuardSource.GLOBAL_UNSPECIALIZED_NN_MODULE,
        )
    },
    # this happens for an UnspecializedNNModule submodule on a NNModuleVariable
    GuardSource.LOCAL_SPECIALIZED_NN_MODULE: GuardSource.LOCAL_UNSPECIALIZED_NN_MODULE,
    GuardSource.GLOBAL_SPECIALIZED_NN_MODULE: GuardSource.GLOBAL_UNSPECIALIZED_NN_MODULE,
    # Just to ensure that guard_source() works: these kinds map to themselves.
    **{
        kind: kind
        for kind in (
            GuardSource.LOCAL_UNSPECIALIZED_BUILTIN_NN_MODULE,
            GuardSource.GLOBAL_UNSPECIALIZED_BUILTIN_NN_MODULE,
            GuardSource.LOCAL_FSDP_MODULE,
            GuardSource.GLOBAL_FSDP_MODULE,
        )
    },
}
- # represents nn.Modules tracked with UnspecializedBuiltinNNModuleVariable
# Lookup table: guard source of the base -> guard source to report for a
# value tracked as an unspecialized *builtin* nn.Module.
_GUARD_SOURCE_UNSPECIALIZED_BUILTIN_NN_MODULE: dict[GuardSource, GuardSource] = {
    # Plain, unspecialized and specialized bases all collapse onto the
    # unspecialized-builtin variant of the same scope (local / global).
    GuardSource.LOCAL: GuardSource.LOCAL_UNSPECIALIZED_BUILTIN_NN_MODULE,
    GuardSource.GLOBAL: GuardSource.GLOBAL_UNSPECIALIZED_BUILTIN_NN_MODULE,
    GuardSource.LOCAL_UNSPECIALIZED_NN_MODULE: GuardSource.LOCAL_UNSPECIALIZED_BUILTIN_NN_MODULE,
    GuardSource.GLOBAL_UNSPECIALIZED_NN_MODULE: GuardSource.GLOBAL_UNSPECIALIZED_BUILTIN_NN_MODULE,
    GuardSource.LOCAL_SPECIALIZED_NN_MODULE: GuardSource.LOCAL_UNSPECIALIZED_BUILTIN_NN_MODULE,
    GuardSource.GLOBAL_SPECIALIZED_NN_MODULE: GuardSource.GLOBAL_UNSPECIALIZED_BUILTIN_NN_MODULE,
    # Just to ensure that guard_source() works: these kinds map to themselves.
    **{
        kind: kind
        for kind in (
            GuardSource.LOCAL_UNSPECIALIZED_BUILTIN_NN_MODULE,
            GuardSource.GLOBAL_UNSPECIALIZED_BUILTIN_NN_MODULE,
            GuardSource.LOCAL_FSDP_MODULE,
            GuardSource.GLOBAL_FSDP_MODULE,
        )
    },
}
# Lookup table: guard source of the base -> guard source to report for a
# value tracked as an FSDP module. Every local-scoped kind maps to
# LOCAL_FSDP_MODULE and every global-scoped kind to GLOBAL_FSDP_MODULE.
_GUARD_SOURCE_FSDP_MODULE: dict[GuardSource, GuardSource] = {
    kind: fsdp_kind
    # (local kind, global kind) pairs, in the table's insertion order.
    for local_kind, global_kind in (
        (GuardSource.LOCAL, GuardSource.GLOBAL),
        (
            GuardSource.LOCAL_SPECIALIZED_NN_MODULE,
            GuardSource.GLOBAL_SPECIALIZED_NN_MODULE,
        ),
        (GuardSource.LOCAL_FSDP_MODULE, GuardSource.GLOBAL_FSDP_MODULE),
        (
            GuardSource.LOCAL_UNSPECIALIZED_NN_MODULE,
            GuardSource.GLOBAL_UNSPECIALIZED_NN_MODULE,
        ),
        (
            GuardSource.LOCAL_UNSPECIALIZED_BUILTIN_NN_MODULE,
            GuardSource.GLOBAL_UNSPECIALIZED_BUILTIN_NN_MODULE,
        ),
    )
    for kind, fsdp_kind in (
        (local_kind, GuardSource.LOCAL_FSDP_MODULE),
        (global_kind, GuardSource.GLOBAL_FSDP_MODULE),
    )
}
def is_constant_source(source: Source) -> bool:
    """Tell whether ``source`` denotes a constant.

    A source counts as constant when it is a ``ConstantSource`` instance or
    when its ``guard_source`` equals ``GuardSource.CONSTANT``. A source whose
    ``guard_source`` raises ``NotImplementedError`` is reported as
    non-constant.
    """
    if isinstance(source, ConstantSource):
        return True
    try:
        reports_constant = source.guard_source == GuardSource.CONSTANT
    except NotImplementedError:
        # Sources without a guard source cannot be constant.
        reports_constant = False
    return True if reports_constant else False
- def _get_source_debug_name(source: Optional[Source]) -> str:
- if source is None:
- return "<unknown source>"
- else:
- try:
- return source.name
- except NotImplementedError:
- return "<unknown source>"
- def _esc_str(s: Any, apply_repr: bool = False) -> str:
- """
- Escapes curly brackets for format strings.
- e.g. "frozenset({0})" becomes "frozenset({{0}})".
- This is used by _name_template for example, because it's
- expected to return a format string, but we may wish to include
- strings that should not be accidentally formatted.
- """
- if apply_repr:
- s = repr(s)
- else:
- s = str(s)
- return s.replace("{", "{{").replace("}", "}}")
@dataclass_with_cached_hash(frozen=True)
class LocalSource(Source):
    """Source for a value loaded from a frame local, named ``L[<local_name>]``."""

    local_name: str

    # Whether this local is an input to the root frame.
    is_input: bool = False

    # Whether we know this input is dynamic (based on example_inputs)
    # For non tensors, we simply look at the first index of the tuple
    dynamism: Optional[frozenset[str]] = None

    # Whether the item at this source is the _content_ of a cell that is
    # dereferenced from the root frame, i.e., it's a part of the `co_cellvars`
    # or `co_freevars`.
    is_derefed_cell_contents: bool = False

    def reconstruct(self, codegen: "PyCodegen") -> None:
        """Emit a deref load for cell contents, a plain load otherwise."""
        if not self.is_derefed_cell_contents:
            codegen.append_output(codegen.create_load(self.local_name))
            return
        codegen.load_deref(self.local_name)

    @property
    def guard_source(self) -> GuardSource:
        return GuardSource.LOCAL

    @functools.cached_property
    def _name_template(self) -> str:
        quoted_name = _esc_str(self.local_name, apply_repr=True)
        return f"L[{quoted_name}]"
@dataclass_with_cached_hash(frozen=True)
class TempLocalSource(Source):
    """Like LocalSource, but cannot be guarded on."""

    local_name: str

    def reconstruct(self, codegen: "PyCodegen") -> None:
        """Emit a load of the local named ``local_name``."""
        load_instruction = codegen.create_load(self.local_name)
        codegen.append_output(load_instruction)

    @property
    def guard_source(self) -> GuardSource:
        return GuardSource.TEMP_LOCAL

    @property
    def _name_template(self) -> str:
        # There is deliberately no name: asking for one means a guard is
        # being built on this source.
        raise NotImplementedError(
            "Cannot create guard on TempLocalSource - this is an internal Dynamo bug. Please file an issue on GitHub."
        )
@dataclass_with_cached_hash(frozen=True)
class SyntheticLocalSource(Source):
    """Source for a synthetic local, named ``SYNTHETIC_LOCAL[<local_name>]``."""

    local_name: str

    def reconstruct(self, codegen: "PyCodegen") -> None:
        """Emit a load of the local named ``local_name``."""
        load_instruction = codegen.create_load(self.local_name)
        codegen.append_output(load_instruction)

    @property
    def guard_source(self) -> GuardSource:
        return GuardSource.SYNTHETIC_LOCAL

    @functools.cached_property
    def _name_template(self) -> str:
        quoted_name = _esc_str(self.local_name, apply_repr=True)
        return f"SYNTHETIC_LOCAL[{quoted_name}]"
@dataclass_with_cached_hash(frozen=True)
class RandomValueSource(Source):
    """Source for one entry of the output graph's random-values variable."""

    # Position of this value inside the random-values container.
    random_call_index: int

    @property
    def guard_source(self) -> GuardSource:
        return GuardSource.RANDOM_VALUE

    def reconstruct(self, codegen: "PyCodegen") -> None:
        """Emit ``<random_values_var>[random_call_index]``."""
        emit = codegen.append_output
        # Container first, then the index, then the subscript itself.
        emit(codegen.create_load(codegen.tx.output.random_values_var))
        emit(codegen.create_load_const(self.random_call_index))
        emit(create_binary_subscr())

    @functools.cached_property
    def _name_template(self) -> str:
        index_text = _esc_str(self.random_call_index)
        return f"random_value_{index_text}"
@dataclass_with_cached_hash(frozen=True)
class GlobalSource(Source):
    """Source for a value loaded from a global, named ``G[<global_name>]``."""

    global_name: str

    def reconstruct(self, codegen: "PyCodegen") -> None:
        """Emit a global load of ``global_name``."""
        load_instruction = codegen.create_load_global(self.global_name, add=True)
        codegen.append_output(load_instruction)

    @property
    def guard_source(self) -> GuardSource:
        return GuardSource.GLOBAL

    @functools.cached_property
    def _name_template(self) -> str:
        quoted_name = _esc_str(self.global_name, apply_repr=True)
        return f"G[{quoted_name}]"
@dataclass_with_cached_hash(frozen=True)
class GlobalWeakRefSource(Source):
    """Source for the result of calling a global with no arguments.

    The name is ``G[<global_name>]()``.
    """

    global_name: str

    def reconstruct(self, codegen: "PyCodegen") -> None:
        """Emit a load of the global followed by a zero-argument call."""

        def load_callee() -> None:
            codegen.append_output(
                codegen.create_load_global(self.global_name, add=True)
            )

        codegen.add_push_null(load_callee)
        codegen.extend_output(create_call_function(0, False))

    @property
    def guard_source(self) -> GuardSource:
        return GuardSource.GLOBAL

    @functools.cached_property
    def _name_template(self) -> str:
        quoted_name = _esc_str(self.global_name, apply_repr=True)
        return f"G[{quoted_name}]()"
@dataclass_with_cached_hash(frozen=True)
class WeakRefCallSource(ChainedSource):
    """Source for the result of calling the base with no arguments: ``{0}()``."""

    def reconstruct(self, codegen: "PyCodegen") -> None:
        """Emit the base followed by a zero-argument call."""

        def load_callee() -> None:
            codegen(self.base)

        codegen.add_push_null(load_callee)
        codegen.extend_output(create_call_function(0, False))

    @property
    def _name_template(self) -> str:
        return "{0}()"
@dataclass_with_cached_hash(frozen=True)
class CallFunctionNoArgsSource(WeakRefCallSource):
    """Distinct type that inherits all behavior from WeakRefCallSource."""
@dataclass_with_cached_hash(frozen=True)
class AttrSource(ChainedSource):
    """Source for attribute ``member`` of the base source.

    The name is ``{0}.<member>`` when ``member`` is a valid identifier and
    ``getattr({0}, <repr of member>)`` otherwise.
    """

    member: str

    def __post_init__(self) -> None:
        # Validate that there is a base and that ``member`` is one attribute.
        assert self.base, "Can't construct an AttrSource without a valid base source"
        has_dot = "." in self.member
        assert not has_dot, (
            f"AttrSource member must not contain '.', got {self.member!r}. "
            "Use OutputGraph.get_chained_attr_source() for dotted paths."
        )

    def reconstruct(self, codegen: "PyCodegen") -> None:
        """Emit the base followed by the attribute load for ``member``."""
        codegen(self.base)
        attr_loads = codegen.create_load_attrs(self.member)
        codegen.extend_output(attr_loads)

    @functools.cached_property
    def _name_template(self) -> str:
        if self.member.isidentifier():
            return f"{{0}}.{_esc_str(self.member)}"
        # Dotted syntax is impossible for non-identifiers; spell out getattr.
        return f"getattr({{0}}, {_esc_str(self.member, apply_repr=True)})"
@dataclass_with_cached_hash(frozen=True)
class CellContentsSource(AttrSource):
    """
    AttrSource for a closure cell's ``cell_contents`` that also records the
    freevar name, so guard failure messages can show which variable the
    closure cell refers to.
    """

    freevar_name: str = dataclasses.field(default="")

    def __post_init__(self) -> None:
        # Replaces the parent's validation: ``member`` is pinned to a single
        # known value instead of being checked for dots.
        assert self.base, (
            "Can't construct a CellContentsSource without a valid base source"
        )
        targets_cell_contents = self.member == "cell_contents"
        assert targets_cell_contents, (
            "CellContentsSource should only be used for cell_contents"
        )
@dataclass_with_cached_hash(frozen=True)
class GenericAttrSource(ChainedSource):
    """Source for attribute ``member`` of the base source.

    The name is ``object.__getattribute__({0}, <repr of member>)``.
    """

    member: str

    def __post_init__(self) -> None:
        # Validate that there is a base and that ``member`` is one attribute.
        assert self.base, (
            "Can't construct a GenericAttrSource without a valid base source"
        )
        has_dot = "." in self.member
        assert not has_dot, (
            f"GenericAttrSource member must not contain '.', got {self.member!r}. "
            "Use OutputGraph.get_chained_attr_source() for dotted paths."
        )

    def reconstruct(self, codegen: "PyCodegen") -> None:
        """Emit the base followed by the attribute load for ``member``."""
        codegen(self.base)
        attr_loads = codegen.create_load_attrs(self.member)
        codegen.extend_output(attr_loads)

    @functools.cached_property
    def _name_template(self) -> str:
        quoted_member = _esc_str(self.member, apply_repr=True)
        return f"object.__getattribute__({{0}}, {quoted_member})"
- # Represents obj.__dict__ where obj is a type object
@dataclass_with_cached_hash(frozen=True)
class TypeDictSource(ChainedSource):
    """Source for ``__dict__`` of the base, named ``dict({0}.__dict__)``."""

    def reconstruct(self, codegen: "PyCodegen") -> None:
        """Emit the base followed by a load of its ``__dict__`` attribute."""
        codegen(self.base)
        dict_loads = codegen.create_load_attrs("__dict__")
        codegen.extend_output(dict_loads)

    @property
    def _name_template(self) -> str:
        # type(ob).__dict__ can return a proxy of the dict. But in the C++
        # guard accessor, we use type->tp_dict, which is a dict. So,
        # forcefully pass a dict object to ensure that the GuardManager
        # registers that it is working on a dict object.
        return "dict({0}.__dict__)"
- # Represents obj.__mro__ where obj is a type object
@dataclass_with_cached_hash(frozen=True)
class TypeMROSource(ChainedSource):
    """Source for ``__mro__`` of the base, named ``{0}.__mro__``."""

    def reconstruct(self, codegen: "PyCodegen") -> None:
        """Emit the base followed by a load of its ``__mro__`` attribute."""
        codegen(self.base)
        mro_loads = codegen.create_load_attrs("__mro__")
        codegen.extend_output(mro_loads)

    @property
    def _name_template(self) -> str:
        return "{0}.__mro__"
@dataclass_with_cached_hash(frozen=True)
class LocalCellSource(Source):
    """
    Conceptually the `LocalSource` counterpart for cell objects that Python
    generates implicitly (e.g., captured variables).
    """

    local_name: str

    def reconstruct(self, codegen: "PyCodegen") -> None:
        """Emit a closure load of ``local_name``."""
        # Although `LOAD_FAST` and `LOAD_CLOSURE` have the same semantics,
        # Dynamo's bytecode transformation differentiates them slightly, so we
        # always emit `LOAD_CLOSURE` here.
        closure_load = codegen.create_load_closure(self.local_name)
        codegen.append_output(closure_load)

    # All the other methods are intentionally unimplemented because e.g., a
    # local cell object should never be used for guards.
- # Represents obj.__code__ where obj is a function object
@dataclass_with_cached_hash(frozen=True)
class CodeSource(ChainedSource):
    """Source for ``__code__`` of the base, named ``{0}.__code__``."""

    def reconstruct(self, codegen: "PyCodegen") -> None:
        """Emit the base followed by a load of its ``__code__`` attribute."""
        codegen(self.base)
        code_loads = codegen.create_load_attrs("__code__")
        codegen.extend_output(code_loads)

    @property
    def _name_template(self) -> str:
        return "{0}.__code__"
- # Represents obj.__closure__ where obj is a function object
@dataclass_with_cached_hash(frozen=True)
class ClosureSource(ChainedSource):
    """Source for ``__closure__`` of the base, named ``{0}.__closure__``."""

    def reconstruct(self, codegen: "PyCodegen") -> None:
        """Emit the base followed by a load of its ``__closure__`` attribute."""
        codegen(self.base)
        closure_loads = codegen.create_load_attrs("__closure__")
        codegen.extend_output(closure_loads)

    @property
    def _name_template(self) -> str:
        return "{0}.__closure__"
- # Represents tensor.grad source. It could be represented by AttrSource as well.
- # But, we could access grad field on tensor directly in C++ without going
- # through the Python bytecodes. Therefore, we use a separate source for grad
- # field.
@dataclass_with_cached_hash(frozen=True)
class GradSource(ChainedSource):
    """Source for the ``grad`` field of the base, named ``{0}.<member>``."""

    # Attribute to read; defaults to "grad".
    member: str = "grad"

    def reconstruct(self, codegen: "PyCodegen") -> None:
        """Emit the base followed by the attribute load for ``member``."""
        codegen(self.base)
        attr_loads = codegen.create_load_attrs(self.member)
        codegen.extend_output(attr_loads)

    @functools.cached_property
    def _name_template(self) -> str:
        member_text = _esc_str(self.member)
        return f"{{0}}.{member_text}"
@dataclass_with_cached_hash(frozen=True)
class ParamBufferSource(AttrSource):
    """AttrSource whose guard source is the specialized-nn-module variant of its base's."""

    @functools.cached_property
    def guard_source(self) -> GuardSource:
        # Translate the base's guard source through the specialized table.
        base_kind = self.base.guard_source
        return _GUARD_SOURCE_SPECIALIZED_NN_MODULE[base_kind]
- # Special AttrSource to differentiate module._buffers or module._parameters
@dataclass_with_cached_hash(frozen=True)
class UnspecializedParamBufferSource(AttrSource):
    """Special AttrSource to differentiate module._buffers or module._parameters."""
- # This source is intended to be used in places where a source is needed but it is expected
- # that the symbol will be simplified out later on. Symbols with ephemeral sources are
- # prioritized to be simplified out when e.g. compared against a symbol without an ephemeral
- # source. Guarding on this source is an error.
- #
- # Example: During subclass view fake-ification, any closed-over ViewFunc state should be
- # symbolicized / fake-ified to avoid invalid specialization during view replay. This source
- # is useful for symbols utilized in the middle of the view chain that are not expected to be
- # present within the final view shape metadata.
@dataclass_with_cached_hash(frozen=True)
class EphemeralSource(Source):
    """Placeholder source that cannot be guarded on.

    The name is ``<ephemeral>`` or, when ``desc`` is given,
    ``<ephemeral: desc>``.
    """

    # Optional human-readable description included in the name.
    desc: Optional[str] = None

    @property
    def guard_source(self) -> GuardSource:
        return GuardSource.EPHEMERAL

    @functools.cached_property
    def _name_template(self) -> str:
        if self.desc is None:
            suffix = ""
        else:
            suffix = ": " + self.desc
        return f"<ephemeral{_esc_str(suffix)}>"

    def make_guard(self, fn: Callable[..., Any]) -> Guard:
        # Guarding on an ephemeral source is an error.
        raise NotImplementedError

    def is_ephemeral(self) -> bool:
        return True
@dataclass_with_cached_hash(frozen=True)
class SkipGuardSource(ChainedSource):
    """Wrapper that reconstructs and is named exactly like its base."""

    def reconstruct(self, codegen: "PyCodegen") -> None:
        """Delegate to the base's own ``reconstruct``."""
        wrapped = self.base
        wrapped.reconstruct(codegen)

    @property
    def _name_template(self) -> str:
        return "{0}"
class TensorProperty(enum.Enum):
    """Tensor metadata kinds that a TensorPropertySource can refer to."""

    SIZE = 0
    STRIDE = 1
    STORAGE_OFFSET = 2

    def method_name(self) -> str:
        """Return the method name matching this property.

        Raises:
            AssertionError: if the member has no associated method name.
        """
        names_by_property = {
            TensorProperty.SIZE: "size",
            TensorProperty.STRIDE: "stride",
            TensorProperty.STORAGE_OFFSET: "storage_offset",
        }
        method = names_by_property.get(self)
        if method is None:
            raise AssertionError(f"unhandled {_esc_str(self)}")
        return method
@dataclass_with_cached_hash(frozen=True)
class TensorPropertySource(ChainedSource):
    """Source for a size / stride entry or the storage offset of the base.

    Names are ``{0}.size()[idx]``, ``{0}.stride()[idx]`` and
    ``{0}.storage_offset()``.
    """

    prop: TensorProperty
    idx: Optional[int] = None  # None for STORAGE_OFFSET

    def __post_init__(self) -> None:
        assert self.base is not None
        # ``idx`` must be absent for STORAGE_OFFSET and present otherwise.
        wants_no_index = self.prop is TensorProperty.STORAGE_OFFSET
        assert (self.idx is None) == wants_no_index

    def reconstruct(self, codegen: "PyCodegen") -> None:
        """Emit a call to the ``call_<method>`` helper from the utils module.

        The base is the first argument; ``idx`` is passed as the second
        argument when it is set.
        """

        def load_helper() -> None:
            helper_name = f"call_{_esc_str(self.prop.method_name())}"
            codegen.load_import_from(utils.__name__, helper_name)

        codegen.add_push_null(load_helper)
        codegen(self.base)
        has_index = self.idx is not None
        if has_index:
            codegen.append_output(codegen.create_load_const(self.idx))
        arg_count = 2 if has_index else 1
        codegen.extend_output(create_call_function(arg_count, False))

    @functools.cached_property
    def _name_template(self) -> str:
        prop = self.prop
        if prop is TensorProperty.SIZE:
            return f"{{0}}.size()[{_esc_str(self.idx)}]"
        if prop is TensorProperty.STRIDE:
            return f"{{0}}.stride()[{_esc_str(self.idx)}]"
        if prop is TensorProperty.STORAGE_OFFSET:
            assert self.idx is None
            return "{0}.storage_offset()"
        raise AssertionError(f"unhandled {_esc_str(self.prop)}")
@dataclass_with_cached_hash(frozen=True)
class IndexedSource(ChainedSource):
    """Base source paired with an integer, named ``(<idx>, {0})``."""

    idx: int

    def __post_init__(self) -> None:
        assert self.base is not None

    def reconstruct(self, codegen: "PyCodegen") -> None:
        # Reconstruction is not supported for this source.
        raise NotImplementedError

    @functools.cached_property
    def _name_template(self) -> str:
        index_text = _esc_str(self.idx)
        return f"({index_text}, {{0}})"
@dataclass_with_cached_hash(frozen=True)
class NegateSource(ChainedSource):
    """Negation of the base source, named ``{0}.__neg__()``."""

    def __post_init__(self) -> None:
        assert self.base is not None

    def reconstruct(self, codegen: "PyCodegen") -> None:
        # Reconstruction is not supported for this source.
        raise NotImplementedError

    @property
    def _name_template(self) -> str:
        # NB: use method call so that function stripping regexes work
        return "{0}.__neg__()"
@dataclass_with_cached_hash(frozen=True)
class ConvertIntSource(ChainedSource):
    """Base source named as ``cast_symbool_to_symint_guardless({0})``."""

    def __post_init__(self) -> None:
        assert self.base is not None

    def reconstruct(self, codegen: "PyCodegen") -> None:
        """Emit only the base; no conversion is emitted here."""
        codegen(self.base)

    @property
    def _name_template(self) -> str:
        return "cast_symbool_to_symint_guardless({0})"
@dataclass_with_cached_hash(frozen=True)
class DynamicScalarSource(ChainedSource):
    """Base source wrapped in an ``int(...)`` call, named ``int({0})``."""

    is_int: bool

    def __post_init__(self) -> None:
        assert self.base is not None

    def reconstruct(self, codegen: "PyCodegen") -> None:
        """Emit ``builtins.int(<base>)``."""
        # Integer casting at reconstruction helps reduce the amount of DynamicInts returned
        # to the user, in favor of plain ints.
        # For example, a compiled region that only does int arithmetic could return a
        # DynamicInt without the casting here.

        def load_int_builtin() -> None:
            codegen.load_import_from("builtins", "int")

        codegen.add_push_null(load_int_builtin)
        codegen(self.base)
        codegen.extend_output(create_call_function(1, False))

    @property
    def _name_template(self) -> str:
        return "int({0})"
@dataclass_with_cached_hash(frozen=True)
class FlattenScriptObjectSource(ChainedSource):
    """Base source named as ``{0}.__obj_flatten__()``."""

    def __post_init__(self) -> None:
        assert self.base is not None

    def reconstruct(self, codegen: "PyCodegen") -> None:
        """Emit only the base; the flatten call is not emitted here."""
        codegen(self.base)

    @property
    def _name_template(self) -> str:
        return "{0}.__obj_flatten__()"
@dataclass_with_cached_hash(frozen=True)
class ScriptObjectQualifiedNameSource(ChainedSource):
    """Base source named as ``{0}._type().qualified_name()``."""

    def __post_init__(self) -> None:
        assert self.base is not None

    def reconstruct(self, codegen: "PyCodegen") -> None:
        """Emit only the base; the name lookup is not emitted here."""
        codegen(self.base)

    @property
    def _name_template(self) -> str:
        return "{0}._type().qualified_name()"
# NOTE(review): unlike the neighbouring sources, this class is not decorated
# with @dataclass_with_cached_hash; it presumably relies on what it inherits
# from ChainedSource. Confirm that this is intentional.
class AttrProxySource(ChainedSource):
    """Base source named as ``{0}.get_base()``."""

    def reconstruct(self, codegen: "PyCodegen") -> None:
        """Emit only the base; the ``get_base()`` call is not emitted here."""
        codegen(self.base)

    @property
    def _name_template(self) -> str:
        return "{0}.get_base()"
@dataclass_with_cached_hash(frozen=True)
class DefaultsSource(ChainedSource):
    """Source for one default argument value of the base.

    Keyword defaults are read from ``__kwdefaults__[<name>]``; positional
    defaults from ``__defaults__[<index>]``.
    """

    idx_key: Union[int, str]
    is_kw: bool = False
    # Derived in __post_init__: attribute holding the defaults, and the
    # precomputed name template.
    field: str = dataclasses.field(init=False, repr=False, compare=False)
    _name: str = dataclasses.field(init=False, repr=False, compare=False)

    def __post_init__(self) -> None:
        assert self.base, (
            "Base must be a valid source in order to properly track and guard this Defaults to its origin."
        )
        if self.is_kw:
            assert isinstance(self.idx_key, str)
            defaults_attr = "__kwdefaults__"
            subscript = f"'{_esc_str(self.idx_key)}'"
        else:
            assert isinstance(self.idx_key, int)
            defaults_attr = "__defaults__"
            subscript = _esc_str(self.idx_key)
        # The dataclass is frozen, so go through object.__setattr__.
        object.__setattr__(self, "field", defaults_attr)
        object.__setattr__(
            self, "_name", f"{{0}}.{_esc_str(self.field)}[{subscript}]"
        )

    def reconstruct(self, codegen: "PyCodegen") -> None:
        """Emit ``<base>.<field>[idx_key]``."""
        codegen(self.base)
        codegen.extend_output(codegen.create_load_attrs(self.field))
        key_load = codegen.create_load_const(self.idx_key)
        codegen.append_output(key_load)
        codegen.append_output(create_binary_subscr())

    @functools.cached_property
    def _name_template(self) -> str:
        return self._name
@dataclass_with_cached_hash(frozen=True)
class GetItemSource(ChainedSource):
    """Source for ``base[index]``, where ``index`` is a constant or a slice."""

    index: Any
    # Set by __post_init__ when ``index`` was given as a slice.
    index_is_slice: bool = False

    def __post_init__(self) -> None:
        assert self.base is not None
        if not isinstance(self.index, slice):
            return
        # store the hashable version of the slice so the whole GetItemSource is hashable
        reduced_slice = self.index.__reduce__()
        super().__setattr__("index", reduced_slice)
        super().__setattr__("index_is_slice", True)

    def reconstruct(self, codegen: "PyCodegen") -> None:
        """Emit ``<base>[<index>]``, rebuilding the slice when needed."""
        codegen(self.base)
        subscript = self.unpack_slice() if self.index_is_slice else self.index
        codegen.append_output(codegen.create_load_const(subscript))
        codegen.append_output(create_binary_subscr())

    def unpack_slice(self) -> slice:
        """Rebuild the slice from the reduced form stored in ``index``."""
        assert self.index_is_slice
        constructor, constructor_args = self.index
        return constructor(*constructor_args)

    @functools.cached_property
    def _name_template(self) -> str:
        # Index can be of following types
        # 1) index is a slice - example 1:4
        # 2) index is a constant - example string, integer
        assert not isinstance(self.index, Source)
        subscript = self.unpack_slice() if self.index_is_slice else self.index
        return f"{{0}}[{_esc_str(subscript, apply_repr=True)}]"
@dataclass_with_cached_hash(frozen=True)
class ConstDictKeySource(ChainedSource):
    """Source for the key at position ``index`` of the base dict.

    The name is ``list(dict.keys({0}))[<index>]``.
    """

    index: Any

    def reconstruct(self, codegen: "PyCodegen") -> None:
        """Emit a call to the utils helper ``dict_keys_getitem(<base>, index)``."""

        def load_helper() -> None:
            codegen.load_import_from(utils.__name__, "dict_keys_getitem")

        codegen.add_push_null(load_helper)
        codegen(self.base)
        codegen.append_output(codegen.create_load_const(self.index))
        codegen.extend_output(create_call_function(2, False))

    @functools.cached_property
    def _name_template(self) -> str:
        # The list creation will be CSE'd by PyExprCSEPass
        index_text = _esc_str(self.index, apply_repr=True)
        return f"list(dict.keys({{0}}))[{index_text}]"

    def is_dict_key(self) -> bool:
        return True
@dataclass_with_cached_hash(frozen=True)
class NonSerializableSetGetItemSource(ChainedSource):
    """Source for the item at position ``index`` of the base set.

    The name is ``list({0})[<index>]``.
    """

    index: int

    def __post_init__(self) -> None:
        # Imported here rather than at module level.
        from .variables import ConstantVariable

        index_is_literal = ConstantVariable.is_literal(self.index)
        assert index_is_literal

    def reconstruct(self, codegen: "PyCodegen") -> None:
        """Emit a call to the utils helper ``set_getitem(<base>, index)``."""

        def load_helper() -> None:
            codegen.load_import_from(utils.__name__, "set_getitem")

        codegen.add_push_null(load_helper)
        codegen(self.base)
        codegen.append_output(codegen.create_load_const(self.index))
        codegen.extend_output(create_call_function(2, False))

    @functools.cached_property
    def _name_template(self) -> str:
        # set ordering might not be stable
        index_text = _esc_str(self.index, apply_repr=True)
        return f"list({{0}})[{index_text}]"

    def is_dict_key(self) -> bool:
        return False
- # Used to access an item from the dictionary
@dataclass_with_cached_hash(frozen=True)
class DictGetItemSource(ChainedSource):
    """Source for ``base[index]`` on a dictionary."""

    # Key to access in the dictionary. It can be one of the following types
    # 1) ConstDictKeySource
    # 2) constant - like string, integer
    index: Any

    def __post_init__(self) -> None:
        # Imported here rather than at module level.
        from .variables import ConstantVariable

        key_is_source = isinstance(self.index, ConstDictKeySource)
        assert key_is_source or ConstantVariable.is_literal(self.index)

    def reconstruct(self, codegen: "PyCodegen") -> None:
        """Emit ``<dict>[<key>]``; a Source key is itself reconstructed."""
        # Load dict
        codegen(self.base)

        # Load key
        key = self.index
        if isinstance(key, Source):
            codegen(key)
        else:
            codegen.append_output(codegen.create_load_const(key))
        codegen.append_output(create_binary_subscr())

    @functools.cached_property
    def _name_template(self) -> str:
        key = self.index
        if isinstance(key, ConstDictKeySource):
            # Source keys are rendered by name, constants by repr.
            key_text = _esc_str(key.name)
        else:
            key_text = _esc_str(key, apply_repr=True)
        return f"{{0}}[{key_text}]"
- # Same as DictGetItemSource but used for dict.__getitem__ calls to ensure that
- # torch.compile does not run the overridden __getitem__ method
@dataclass_with_cached_hash(frozen=True)
class DictSubclassGetItemSource(ChainedSource):
    """Dictionary item source that is reconstructed through a helper call.

    Reconstruction calls the utils helper ``dict_getitem`` instead of
    emitting a subscript.
    """

    # Key to access in the dictionary. It can be one of the following types
    # 1) ConstDictKeySource
    # 2) constant - like string, integer
    index: Any

    def __post_init__(self) -> None:
        # Imported here rather than at module level.
        from .variables import ConstantVariable

        key_is_source = isinstance(self.index, ConstDictKeySource)
        assert key_is_source or ConstantVariable.is_literal(self.index)

    def reconstruct(self, codegen: "PyCodegen") -> None:
        """Emit ``dict_getitem(<dict>, <key>)``; a Source key is reconstructed."""
        # reconstruct dict.__getitem__(dct, key)

        def load_helper() -> None:
            codegen.load_import_from(utils.__name__, "dict_getitem")

        # Load dict.__getitem__
        codegen.add_push_null(load_helper)

        # Load dict
        codegen(self.base)

        # Load key
        key = self.index
        if isinstance(key, Source):
            codegen(key)
        else:
            codegen.append_output(codegen.create_load_const(key))

        codegen.extend_output(create_call_function(2, False))

    @functools.cached_property
    def _name_template(self) -> str:
        key = self.index
        if not isinstance(key, ConstDictKeySource):
            # Constant keys use plain subscript syntax in the name.
            return f"{{0}}[{_esc_str(key, apply_repr=True)}]"
        return f"dict.__getitem__({{0}}, {_esc_str(key.name)})"
@dataclass_with_cached_hash(frozen=True)
class ListGetItemSource(GetItemSource):
    """
    GetItemSource variant whose reconstruct and name are list specific.
    Slice indices are rejected with a RuntimeError.
    """

    def reconstruct(self, codegen: "PyCodegen") -> None:
        """Emit a call to the utils helper ``list_getitem(<list>, index)``.

        Raises:
            RuntimeError: if the index is a slice (raised after the helper
                and the list have already been emitted).
        """
        # Reconstruct list.__getitem__(lst, index) to avoid any side effects
        # from possibly overridden __getitem__.

        def load_helper() -> None:
            codegen.load_import_from(utils.__name__, "list_getitem")

        # Load list.__getitem__
        codegen.add_push_null(load_helper)

        # Load the list
        codegen(self.base)

        # Load the index
        if self.index_is_slice:
            raise RuntimeError(
                "List[slice] is a temporary object and should not have a source"
            )
        codegen.append_output(codegen.create_load_const(self.index))

        codegen.extend_output(create_call_function(2, False))

    @functools.cached_property
    def _name_template(self) -> str:
        # Index can be of following types
        # 1) index is a slice - example 1:4
        # 2) index is a constant - example string, integer
        assert not isinstance(self.index, Source)
        if self.index_is_slice:
            raise RuntimeError(
                "List[slice] is a temporary object and should not have a source"
            )
        index_text = _esc_str(self.index, apply_repr=True)
        return f"list.__getitem__({{0}}, {index_text})"
@dataclass_with_cached_hash(frozen=True)
class TupleIteratorGetItemSource(GetItemSource):
    """GetItemSource variant that indexes via ``tuple_iterator_getitem``."""

    @functools.cached_property
    def _name_template(self) -> str:
        # {0} is the placeholder for the base; the index is rendered via repr.
        index_repr = _esc_str(self.index, apply_repr=True)
        return f"___tuple_iterator_getitem({{0}}, {index_repr})"

    def reconstruct(self, codegen: "PyCodegen") -> None:
        # Emits tuple_iterator_getitem(<base>, <index>), with the helper
        # loaded by name from the utils module.
        def load_getter():
            return codegen.load_import_from(utils.__name__, "tuple_iterator_getitem")

        codegen.add_push_null(load_getter)
        codegen(self.base)
        index_load = codegen.create_load_const(self.index)
        codegen.append_output(index_load)
        codegen.extend_output(create_call_function(2, False))
@dataclass_with_cached_hash(frozen=True)
class NamedTupleFieldsSource(ChainedSource):
    """Source for the ``_fields`` attribute of the base value."""

    @property
    def _name_template(self) -> str:
        # {0} is the placeholder for the base.
        return "___namedtuple_fields({0})"

    def reconstruct(self, codegen: "PyCodegen") -> None:
        # Load the base, then read its ``_fields`` attribute.
        codegen(self.base)
        fields_load = codegen.create_load_attrs("_fields")
        codegen.extend_output(fields_load)
@dataclass_with_cached_hash(frozen=True)
class DataclassFieldsSource(ChainedSource):
    """Source obtained by calling ``dataclass_fields`` on the base value."""

    @property
    def _name_template(self) -> str:
        # {0} is the placeholder for the base.
        return "___dataclass_fields({0})"

    def reconstruct(self, codegen: "PyCodegen") -> None:
        # Emits dataclass_fields(<base>), with the helper loaded by name from
        # the utils module.
        def load_helper():
            return codegen.load_import_from(utils.__name__, "dataclass_fields")

        codegen.add_push_null(load_helper)
        codegen(self.base)
        codegen.extend_output(create_call_function(1, False))
@dataclass_with_cached_hash(frozen=True)
class TypeSource(ChainedSource):
    """Source for ``type(<base>)``."""

    def __post_init__(self) -> None:
        # A TypeSource without a base is meaningless.
        assert self.base is not None

    @property
    def _name_template(self) -> str:
        # {0} is the placeholder for the base.
        return "type({0})"

    def reconstruct(self, codegen: "PyCodegen") -> None:
        # Emits builtins.type(<base>).
        def load_type():
            return codegen.load_import_from("builtins", "type")

        codegen.add_push_null(load_type)
        codegen(self.base)
        codegen.extend_output(create_call_function(1, False))
@dataclass_with_cached_hash(frozen=True)
class OptimizerSource(ChainedSource):
    """Wrapper source that reconstructs and is named exactly like its base."""

    @property
    def _name_template(self) -> str:
        # The name is the base's name, unchanged.
        return "{0}"

    def reconstruct(self, codegen: "PyCodegen") -> None:
        # Nothing extra to emit: reconstructing the base is sufficient.
        codegen(self.base)
@dataclass_with_cached_hash(frozen=True)
class NNModuleSource(ChainedSource):
    """Wrapper source that is named and reconstructed like its base.

    Only ``guard_source`` differs: the base's guard source is mapped through
    ``_GUARD_SOURCE_SPECIALIZED_NN_MODULE``.
    """

    @property
    def _name_template(self) -> str:
        # The name is the base's name, unchanged.
        return "{0}"

    @functools.cached_property
    def guard_source(self) -> GuardSource:
        base_kind = self.base.guard_source
        return _GUARD_SOURCE_SPECIALIZED_NN_MODULE[base_kind]

    def reconstruct(self, codegen: "PyCodegen") -> None:
        # Reconstructing the base is sufficient.
        codegen(self.base)
@dataclass_with_cached_hash(frozen=True)
class UnspecializedNNModuleSource(NNModuleSource):
    """NNModuleSource whose guard source is taken from the unspecialized table."""

    @functools.cached_property
    def guard_source(self) -> GuardSource:
        # Map the base's guard source through the unspecialized-module table.
        base_kind = self.base.guard_source
        return _GUARD_SOURCE_UNSPECIALIZED_NN_MODULE[base_kind]
@dataclass_with_cached_hash(frozen=True)
class UnspecializedBuiltinNNModuleSource(UnspecializedNNModuleSource):
    """UnspecializedNNModuleSource using the unspecialized-builtin guard table."""

    @functools.cached_property
    def guard_source(self) -> GuardSource:
        # Map the base's guard source through the unspecialized-builtin table.
        base_kind = self.base.guard_source
        return _GUARD_SOURCE_UNSPECIALIZED_BUILTIN_NN_MODULE[base_kind]
@dataclass_with_cached_hash(frozen=True)
class FSDPNNModuleSource(NNModuleSource):
    """NNModuleSource whose guard source is taken from the FSDP module table."""

    @functools.cached_property
    def guard_source(self) -> GuardSource:
        # Map the base's guard source through the FSDP-module table.
        base_kind = self.base.guard_source
        return _GUARD_SOURCE_FSDP_MODULE[base_kind]
@dataclass_with_cached_hash(frozen=True)
class GlobalStateSource(Source):
    """Source with an empty name whose guard source is ``GuardSource.GLOBAL``."""

    @property
    def guard_source(self) -> GuardSource:
        return GuardSource.GLOBAL

    @property
    def _name_template(self) -> str:
        # This source has no name of its own.
        return ""
@dataclass_with_cached_hash(frozen=True)
class ImportSource(Source):
    """Points to an imported module.

    Used instead of GlobalSource in case the user has overridden the module
    name in their local namespace.
    """

    module_name: str

    def __post_init__(self) -> None:
        # Creating the source immediately installs an ID_MATCH guard on it.
        from .guards import GuardBuilder, install_guard

        id_guard = self.make_guard(GuardBuilder.ID_MATCH)
        install_guard(id_guard)

    @property
    def guard_source(self) -> GuardSource:
        return GuardSource.GLOBAL

    @functools.cached_property
    def _name_template(self) -> str:
        return f"__import__('{self.module_name}')"

    def reconstruct(self, codegen: "PyCodegen") -> None:
        # Instructions are created in the order they are emitted: the import
        # level, the (empty) fromlist, then the import itself.
        level = codegen.create_load_const(0)
        fromlist = create_build_tuple(0)
        import_module = codegen.create_import_name(self.module_name)
        codegen.extend_output([level, fromlist, import_module])
@dataclass_with_cached_hash(frozen=True)
class TorchFunctionModeStackSource(Source):
    """Source for one entry of the torch function mode stack.

    The name is spelled ``___get_torch_function_mode_stack_at(<index>)`` and
    ``reconstruct`` calls ``get_torch_function_mode_stack_at`` from the utils
    module; in both cases the index comes from ``_get_index``.
    """

    ind: int

    def _get_index(self) -> int:
        # Translate the stored ``ind`` through
        # TorchFunctionModeStackVariable.get_mode_index (imported at call time).
        from .variables.torch_function import TorchFunctionModeStackVariable

        return TorchFunctionModeStackVariable.get_mode_index(self.ind)

    @property
    def guard_source(self) -> GuardSource:
        return GuardSource.GLOBAL

    @functools.cached_property
    def _name_template(self) -> str:
        stack_index = _esc_str(self._get_index())
        return f"___get_torch_function_mode_stack_at({stack_index})"

    def reconstruct(self, codegen: "PyCodegen") -> None:
        def load_accessor():
            return codegen.load_import_from(
                utils.__name__, "get_torch_function_mode_stack_at"
            )

        codegen.add_push_null(load_accessor)
        index_load = codegen.create_load_const(self._get_index())
        codegen.extend_output([index_load])
        # Single positional argument: the stack index.
        codegen.extend_output(create_call_function(1, False))
@dataclass_with_cached_hash(frozen=True)
class ConstantSource(Source):
    """Source named ``source_name`` and reconstructed as a global load of it."""

    source_name: str

    @property
    def guard_source(self) -> GuardSource:
        return GuardSource.CONSTANT

    @functools.cached_property
    def _name_template(self) -> str:
        # The name is the stored ``source_name`` itself.
        return self.source_name

    def make_guard(self, fn: Any) -> Any:
        # Guards cannot be built from this kind of source.
        raise NotImplementedError

    def reconstruct(self, codegen: "PyCodegen") -> None:
        global_load = codegen.create_load_global(self.source_name, add=False)
        codegen.append_output(global_load)
@dataclass_with_cached_hash(frozen=True)
class NumpyTensorSource(ChainedSource):
    """Source named ``___from_numpy(<base>)``, reconstructed via ``torch.as_tensor``."""

    def reconstruct(self, codegen: "PyCodegen") -> None:
        # Emits torch.as_tensor(<base>).
        def load_as_tensor():
            return codegen.load_import_from("torch", "as_tensor")

        codegen.add_push_null(load_as_tensor)
        codegen(self.base)
        codegen.extend_output(create_call_function(1, False))

    @property
    def _name_template(self) -> str:
        # {0} is the placeholder for the base.
        return "___from_numpy({0})"
@dataclass_with_cached_hash(frozen=True)
class SubclassAttrListSource(ChainedSource):
    """Source for element 0 of the base's ``__tensor_flatten__()`` result."""

    @property
    def _name_template(self) -> str:
        # {0} is the placeholder for the base.
        return "{0}.__tensor_flatten__()[0]"
# NB: This source is ephemeral; guards are not expected to ever be generated
# against it.
@dataclass_with_cached_hash(frozen=True)
class FloatTensorSource(ChainedSource):
    """Source named ``___as_tensor(<base>)``."""

    @property
    def _name_template(self) -> str:
        # {0} is the placeholder for the base.
        return "___as_tensor({0})"
@dataclass_with_cached_hash(frozen=True)
class CallMethodItemSource(ChainedSource):
    """Source for the result of calling ``.item()`` on the base."""

    @property
    def _name_template(self) -> str:
        # {0} is the placeholder for the base.
        return "{0}.item()"
# Synthetic source tied to the singleton shape env guard that is always
# registered for every frame. The actual guard contents come from the ambient
# ShapeEnv.
@dataclass_with_cached_hash(frozen=True)
class ShapeEnvSource(Source):
    """Source with an empty name whose guard source is ``GuardSource.SHAPE_ENV``."""

    @property
    def guard_source(self) -> GuardSource:
        return GuardSource.SHAPE_ENV

    @property
    def _name_template(self) -> str:
        # This source has no name of its own.
        return ""
@dataclass_with_cached_hash(frozen=True)
class CurrentStreamSource(Source):
    """Source obtained by calling ``get_current_stream`` on ``torch.device(...)``.

    The device is rebuilt from ``device.type`` and, when it is not None,
    ``device.index``.
    """

    device: device_type

    @property
    def guard_source(self) -> GuardSource:
        return GuardSource.GLOBAL

    @functools.cached_property
    def _name_template(self) -> str:
        dev = self.device
        return f"___get_current_stream(torch.device('{_esc_str(dev.type)}', {_esc_str(dev.index)}))"

    def reconstruct(self, codegen: "PyCodegen") -> None:
        # Emits get_current_stream(torch.device(type[, index])): outer callee
        # first, then the inner torch.device callee.
        codegen.add_push_null(
            lambda: codegen.load_import_from(utils.__name__, "get_current_stream")
        )
        codegen.add_push_null(lambda: codegen.load_import_from("torch", "device"))

        # The index is only passed to torch.device when the device has one.
        device_args = [self.device.type]
        if self.device.index is not None:
            device_args.append(self.device.index)
        for arg in device_args:
            codegen.extend_output([codegen.create_load_const(arg)])

        # Inner call builds the device; outer call fetches the stream.
        codegen.extend_output(create_call_function(len(device_args), False))
        codegen.extend_output(create_call_function(1, False))
@dataclass_with_cached_hash(frozen=True)
class BackwardStateSource(Source):
    """Source with an empty name whose guard source is ``GuardSource.BACKWARD_STATE``."""

    @property
    def guard_source(self) -> GuardSource:
        return GuardSource.BACKWARD_STATE

    @property
    def _name_template(self) -> str:
        # This source has no name of its own.
        return ""
@functools.lru_cache
def get_local_source_name(
    source: Source, *, only_allow_input: bool = False
) -> Optional[str]:
    """Return the local name at the root of ``source``'s chain, if any.

    ChainedSources are followed through ``base``. The result is None when the
    root is not a LocalSource, or when ``only_allow_input`` is set and the
    root LocalSource is not an input.
    """
    if isinstance(source, ChainedSource):
        return get_local_source_name(source.base, only_allow_input=only_allow_input)
    if isinstance(source, LocalSource) and (
        not only_allow_input or source.is_input
    ):
        return source.local_name
    return None
@functools.lru_cache
def is_from_local_source(source: Source, *, only_allow_input: bool = False) -> bool:
    """Return True when ``get_local_source_name`` finds a local name for ``source``."""
    local_name = get_local_source_name(source, only_allow_input=only_allow_input)
    return local_name is not None
@functools.lru_cache
def is_from_global_source(source: Source) -> bool:
    """Return True when ``get_global_source_name`` finds a global name for ``source``."""
    global_name = get_global_source_name(source)
    return global_name is not None
@functools.lru_cache
def get_global_source_name(source: Source | None) -> str | None:
    """Return the global name at the root of ``source``'s chain, if any.

    ChainedSources are followed through ``base``. The result is None when the
    root is not a GlobalSource (including when ``source`` is None).
    """
    if isinstance(source, ChainedSource):
        return get_global_source_name(source.base)
    return source.global_name if isinstance(source, GlobalSource) else None
@functools.lru_cache
def is_from_nonlocal_source(source: Source) -> bool:
    """Check whether the root of ``source``'s chain is a non-input derefed cell.

    ChainedSources are followed through ``base``. The root qualifies when it
    is a LocalSource with ``is_derefed_cell_contents`` set and ``is_input``
    unset.
    """
    if isinstance(source, ChainedSource):
        return is_from_nonlocal_source(source.base)
    if not isinstance(source, LocalSource):
        return False
    return source.is_derefed_cell_contents and not source.is_input
@functools.lru_cache
def is_from_closure_source(source: Source) -> bool:
    """Return True if ``source`` or any source in its base chain is a ClosureSource."""
    if isinstance(source, ClosureSource):
        return True
    # Otherwise keep looking further down the chain, if there is one.
    return isinstance(source, ChainedSource) and is_from_closure_source(source.base)
@functools.lru_cache
def is_from_source(source: Source, target: Source) -> bool:
    """Return True if ``target`` is ``source`` itself or appears in its base chain.

    Args:
        source: The source whose chain of ``base`` links is searched.
        target: The source to look for.

    Returns:
        True when ``source`` or any source reachable from it through
        ``ChainedSource.base`` compares equal to ``target``; False otherwise.
    """
    # Compare at every level, not only at the root. Testing equality only
    # after unwrapping every ChainedSource meant a ``target`` that is itself a
    # ChainedSource could never match, even when ``source == target``.
    if source == target:
        return True
    if isinstance(source, ChainedSource):
        return is_from_source(source.base, target)
    return False
@functools.lru_cache
def is_from_unspecialized_nn_module_source(source: Source) -> bool:
    """Return True if ``source`` or any source in its base chain is an
    UnspecializedNNModuleSource."""
    if isinstance(source, UnspecializedNNModuleSource):
        return True
    if not isinstance(source, ChainedSource):
        # End of the chain without a match.
        return False
    return is_from_unspecialized_nn_module_source(source.base)
@functools.lru_cache
def is_from_unspecialized_builtin_nn_module_source(source: Source) -> bool:
    """Return True if ``source`` or any source in its base chain is an
    UnspecializedBuiltinNNModuleSource."""
    if isinstance(source, UnspecializedBuiltinNNModuleSource):
        return True
    # No match here; continue with the base when there is one.
    return isinstance(
        source, ChainedSource
    ) and is_from_unspecialized_builtin_nn_module_source(source.base)
@functools.lru_cache
def is_from_unspecialized_param_buffer_source(source: Source) -> bool:
    """Return True if ``source`` or any source in its base chain is an
    UnspecializedParamBufferSource."""
    if isinstance(source, UnspecializedParamBufferSource):
        return True
    if not isinstance(source, ChainedSource):
        # End of the chain without a match.
        return False
    return is_from_unspecialized_param_buffer_source(source.base)
@functools.lru_cache
def is_from_flatten_script_object_source(source: Source) -> bool:
    """Return True if ``source`` or any source in its base chain is a
    FlattenScriptObjectSource."""
    if isinstance(source, FlattenScriptObjectSource):
        return True
    # No match here; continue with the base when there is one.
    return isinstance(
        source, ChainedSource
    ) and is_from_flatten_script_object_source(source.base)
@functools.lru_cache
def is_from_optimizer_source(source: Source) -> bool:
    """Return True if ``source`` or any source in its base chain is an OptimizerSource."""
    if isinstance(source, OptimizerSource):
        return True
    if not isinstance(source, ChainedSource):
        # End of the chain without a match.
        return False
    return is_from_optimizer_source(source.base)
# TODO: a generic "test this on everything in the chain" helper could
# probably replace these near-identical functions.
@functools.lru_cache
def is_from_defaults(source: Source) -> bool:
    """Return True if ``source`` or any source in its base chain refers to a
    function default.

    A link counts as a default when it is a DefaultsSource, a DictGetItemSource
    on an ``__kwdefaults__`` attribute, or a GetItemSource on a
    ``__defaults__`` attribute.
    """
    if isinstance(source, DefaultsSource):
        return True

    # Accessed with func.__kwdefaults__["foo"]
    if isinstance(source, DictGetItemSource):
        holder = source.base
        if isinstance(holder, AttrSource) and holder.member == "__kwdefaults__":
            return True

    # Accessed with func.__defaults__[0]
    if isinstance(source, GetItemSource):
        holder = source.base
        if isinstance(holder, AttrSource) and holder.member == "__defaults__":
            return True

    # No match at this link; continue with the base when there is one.
    return isinstance(source, ChainedSource) and is_from_defaults(source.base)
@functools.lru_cache
def is_from_skip_guard_source(source: Source) -> bool:
    """Return True if ``source`` or any source in its base chain is a SkipGuardSource."""
    if isinstance(source, SkipGuardSource):
        return True
    # No match here; continue with the base when there is one.
    return isinstance(source, ChainedSource) and is_from_skip_guard_source(source.base)
|