source.py 39 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193119411951196
  1. """
  2. This module provides Source classes that track the origins of values in PyTorch Dynamo.
  3. Sources represent where values come from (e.g. local variables, globals, attributes) and
  4. are used for guard generation and code reconstruction during compilation.
  5. The module includes specialized sources for:
  6. - Local variables and synthetic locals
  7. - Global variables and constants
  8. - Object attributes and method calls
  9. - NN module specialization (specialized vs unspecialized)
  10. - Random values and tensor properties
  11. - Default argument handling
  12. - FSDP (Fully Sharded Data Parallel) modules
  13. Sources play a key role in Dynamo's guard system by tracking value origins for
  14. guard generation, and in code reconstruction by providing methods to rebuild
  15. the code needed to recreate values.
  16. """
  17. import dataclasses
  18. import enum
  19. import functools
  20. from typing import Any, Callable, Optional, TYPE_CHECKING, Union
  21. from torch._guards import ChainedSource, Guard, GuardSource, Source
  22. from . import utils
  23. from .bytecode_transformation import create_call_function, create_instruction
  24. if TYPE_CHECKING:
  25. from .codegen import PyCodegen
  26. # It shouldn't be supported to construct an NNModuleVariable inside an FSDP module,
  27. # so those cases are omitted intentionally
  28. # represents nn.Modules tracked with NNModuleVariable (specialized is implicit in the variable name)
  29. _GUARD_SOURCE_SPECIALIZED_NN_MODULE = {
  30. GuardSource.LOCAL: GuardSource.LOCAL_SPECIALIZED_NN_MODULE,
  31. GuardSource.GLOBAL: GuardSource.GLOBAL_SPECIALIZED_NN_MODULE,
  32. GuardSource.LOCAL_SPECIALIZED_NN_MODULE: GuardSource.LOCAL_SPECIALIZED_NN_MODULE,
  33. GuardSource.GLOBAL_SPECIALIZED_NN_MODULE: GuardSource.GLOBAL_SPECIALIZED_NN_MODULE,
  34. # Just to ensure that guard_source() works
  35. GuardSource.LOCAL_UNSPECIALIZED_NN_MODULE: GuardSource.LOCAL_UNSPECIALIZED_NN_MODULE,
  36. GuardSource.GLOBAL_UNSPECIALIZED_NN_MODULE: GuardSource.GLOBAL_UNSPECIALIZED_NN_MODULE,
  37. GuardSource.LOCAL_UNSPECIALIZED_BUILTIN_NN_MODULE: GuardSource.LOCAL_UNSPECIALIZED_BUILTIN_NN_MODULE,
  38. GuardSource.GLOBAL_UNSPECIALIZED_BUILTIN_NN_MODULE: GuardSource.GLOBAL_UNSPECIALIZED_BUILTIN_NN_MODULE,
  39. GuardSource.LOCAL_FSDP_MODULE: GuardSource.LOCAL_FSDP_MODULE,
  40. GuardSource.GLOBAL_FSDP_MODULE: GuardSource.GLOBAL_FSDP_MODULE,
  41. }
  42. # represents nn.Modules tracked with UnspecializedNNModuleVariable
  43. _GUARD_SOURCE_UNSPECIALIZED_NN_MODULE = {
  44. GuardSource.LOCAL: GuardSource.LOCAL_UNSPECIALIZED_NN_MODULE,
  45. GuardSource.GLOBAL: GuardSource.GLOBAL_UNSPECIALIZED_NN_MODULE,
  46. GuardSource.LOCAL_UNSPECIALIZED_NN_MODULE: GuardSource.LOCAL_UNSPECIALIZED_NN_MODULE,
  47. GuardSource.GLOBAL_UNSPECIALIZED_NN_MODULE: GuardSource.GLOBAL_UNSPECIALIZED_NN_MODULE,
  48. # this happens for an UnspecializedNNModule submodule on a NNModuleVariable
  49. GuardSource.LOCAL_SPECIALIZED_NN_MODULE: GuardSource.LOCAL_UNSPECIALIZED_NN_MODULE,
  50. GuardSource.GLOBAL_SPECIALIZED_NN_MODULE: GuardSource.GLOBAL_UNSPECIALIZED_NN_MODULE,
  51. # Just to ensure that guard_source() works
  52. GuardSource.LOCAL_UNSPECIALIZED_BUILTIN_NN_MODULE: GuardSource.LOCAL_UNSPECIALIZED_BUILTIN_NN_MODULE,
  53. GuardSource.GLOBAL_UNSPECIALIZED_BUILTIN_NN_MODULE: GuardSource.GLOBAL_UNSPECIALIZED_BUILTIN_NN_MODULE,
  54. GuardSource.LOCAL_FSDP_MODULE: GuardSource.LOCAL_FSDP_MODULE,
  55. GuardSource.GLOBAL_FSDP_MODULE: GuardSource.GLOBAL_FSDP_MODULE,
  56. }
  57. # represents nn.Modules tracked with UnspecializedBuiltinNNModuleVariable
  58. _GUARD_SOURCE_UNSPECIALIZED_BUILTIN_NN_MODULE = {
  59. GuardSource.LOCAL: GuardSource.LOCAL_UNSPECIALIZED_BUILTIN_NN_MODULE,
  60. GuardSource.GLOBAL: GuardSource.GLOBAL_UNSPECIALIZED_BUILTIN_NN_MODULE,
  61. GuardSource.LOCAL_UNSPECIALIZED_NN_MODULE: GuardSource.LOCAL_UNSPECIALIZED_BUILTIN_NN_MODULE,
  62. GuardSource.GLOBAL_UNSPECIALIZED_NN_MODULE: GuardSource.GLOBAL_UNSPECIALIZED_BUILTIN_NN_MODULE,
  63. GuardSource.LOCAL_SPECIALIZED_NN_MODULE: GuardSource.LOCAL_UNSPECIALIZED_BUILTIN_NN_MODULE,
  64. GuardSource.GLOBAL_SPECIALIZED_NN_MODULE: GuardSource.GLOBAL_UNSPECIALIZED_BUILTIN_NN_MODULE,
  65. # Just to ensure that guard_source() works
  66. GuardSource.LOCAL_UNSPECIALIZED_BUILTIN_NN_MODULE: GuardSource.LOCAL_UNSPECIALIZED_BUILTIN_NN_MODULE,
  67. GuardSource.GLOBAL_UNSPECIALIZED_BUILTIN_NN_MODULE: GuardSource.GLOBAL_UNSPECIALIZED_BUILTIN_NN_MODULE,
  68. GuardSource.LOCAL_FSDP_MODULE: GuardSource.LOCAL_FSDP_MODULE,
  69. GuardSource.GLOBAL_FSDP_MODULE: GuardSource.GLOBAL_FSDP_MODULE,
  70. }
  71. _GUARD_SOURCE_FSDP_MODULE = {
  72. GuardSource.LOCAL: GuardSource.LOCAL_FSDP_MODULE,
  73. GuardSource.GLOBAL: GuardSource.GLOBAL_FSDP_MODULE,
  74. GuardSource.LOCAL_SPECIALIZED_NN_MODULE: GuardSource.LOCAL_FSDP_MODULE,
  75. GuardSource.GLOBAL_SPECIALIZED_NN_MODULE: GuardSource.GLOBAL_FSDP_MODULE,
  76. GuardSource.LOCAL_FSDP_MODULE: GuardSource.LOCAL_FSDP_MODULE,
  77. GuardSource.GLOBAL_FSDP_MODULE: GuardSource.GLOBAL_FSDP_MODULE,
  78. GuardSource.LOCAL_UNSPECIALIZED_NN_MODULE: GuardSource.LOCAL_FSDP_MODULE,
  79. GuardSource.GLOBAL_UNSPECIALIZED_NN_MODULE: GuardSource.GLOBAL_FSDP_MODULE,
  80. GuardSource.LOCAL_UNSPECIALIZED_BUILTIN_NN_MODULE: GuardSource.LOCAL_FSDP_MODULE,
  81. GuardSource.GLOBAL_UNSPECIALIZED_BUILTIN_NN_MODULE: GuardSource.GLOBAL_FSDP_MODULE,
  82. }
  83. def is_constant_source(source: Source) -> bool:
  84. if isinstance(source, ConstantSource):
  85. return True
  86. try:
  87. if source.guard_source() == GuardSource.CONSTANT:
  88. return True
  89. except NotImplementedError:
  90. pass
  91. return False
  92. def _get_source_debug_name(source: Source) -> str:
  93. try:
  94. return source.name()
  95. except NotImplementedError:
  96. return "<unknown source>"
  97. @dataclasses.dataclass(frozen=True)
  98. class LocalSource(Source):
  99. local_name: str
  100. # Whether this local is an input to the root frame.
  101. is_input: bool = False
  102. # Whether we know this input is dynamic (based on example_inputs)
  103. # For non tensors, we simply look at the first index of the tuple
  104. dynamism: Optional[frozenset[str]] = None
  105. # Whether the item at this source is the _content_ of a cell that is
  106. # dereferenced from the root frame, i.e., it's a part of the `co_cellvars`
  107. # or `co_freevars`.
  108. is_derefed_cell_contents: bool = False
  109. def reconstruct(self, codegen: "PyCodegen") -> None:
  110. if self.is_derefed_cell_contents:
  111. codegen.load_deref(self.local_name)
  112. else:
  113. codegen.append_output(codegen.create_load(self.local_name))
  114. def guard_source(self) -> GuardSource:
  115. return GuardSource.LOCAL
  116. def name(self) -> str:
  117. return f"L[{repr(self.local_name)}]"
  118. @dataclasses.dataclass(frozen=True)
  119. class SyntheticLocalSource(Source):
  120. local_name: str
  121. def reconstruct(self, codegen: "PyCodegen") -> None:
  122. codegen.append_output(codegen.create_load(self.local_name))
  123. def guard_source(self) -> GuardSource:
  124. return GuardSource.SYNTHETIC_LOCAL
  125. def name(self) -> str:
  126. return f"SYNTHETIC_LOCAL[{self.local_name!r}]"
  127. @dataclasses.dataclass(frozen=True)
  128. class RandomValueSource(Source):
  129. random_call_index: int
  130. def guard_source(self) -> GuardSource:
  131. return GuardSource.RANDOM_VALUE
  132. def reconstruct(self, codegen: "PyCodegen") -> None:
  133. codegen.append_output(codegen.create_load(codegen.tx.output.random_values_var))
  134. codegen.append_output(codegen.create_load_const(self.random_call_index))
  135. codegen.append_output(create_instruction("BINARY_SUBSCR"))
  136. def name(self) -> str:
  137. return f"random_value_{self.random_call_index}"
  138. @dataclasses.dataclass(frozen=True)
  139. class GlobalSource(Source):
  140. global_name: str
  141. def reconstruct(self, codegen: "PyCodegen") -> None:
  142. codegen.append_output(codegen.create_load_global(self.global_name, add=True))
  143. def guard_source(self) -> GuardSource:
  144. return GuardSource.GLOBAL
  145. def name(self) -> str:
  146. return f"G[{repr(self.global_name)}]"
  147. @dataclasses.dataclass(frozen=True)
  148. class GlobalWeakRefSource(Source):
  149. global_name: str
  150. def reconstruct(self, codegen: "PyCodegen") -> None:
  151. codegen.add_push_null(
  152. lambda: codegen.append_output(
  153. codegen.create_load_global(self.global_name, add=True)
  154. )
  155. )
  156. codegen.extend_output(create_call_function(0, False))
  157. def guard_source(self) -> GuardSource:
  158. return GuardSource.GLOBAL
  159. def name(self) -> str:
  160. return f"G[{repr(self.global_name)}]()"
  161. @dataclasses.dataclass(frozen=True)
  162. class WeakRefCallSource(ChainedSource):
  163. def reconstruct(self, codegen: "PyCodegen") -> None:
  164. codegen.add_push_null(lambda: codegen(self.base))
  165. codegen.extend_output(create_call_function(0, False))
  166. def guard_source(self) -> GuardSource:
  167. return self.base.guard_source()
  168. def name(self) -> str:
  169. return f"{self.base.name()}()"
  170. @dataclasses.dataclass(frozen=True)
  171. class CallFunctionNoArgsSource(WeakRefCallSource):
  172. pass
  173. @dataclasses.dataclass(frozen=True)
  174. class AttrSource(ChainedSource):
  175. member: str
  176. def __post_init__(self) -> None:
  177. assert self.base, "Can't construct an AttrSource without a valid base source"
  178. if "." in self.member:
  179. member_parts = self.member.split(".")
  180. object.__setattr__(
  181. self, "base", AttrSource(self.base, ".".join(member_parts[:-1]))
  182. )
  183. object.__setattr__(self, "member", member_parts[-1])
  184. def reconstruct(self, codegen: "PyCodegen") -> None:
  185. codegen(self.base)
  186. codegen.extend_output(codegen.create_load_attrs(self.member))
  187. def guard_source(self) -> GuardSource:
  188. return self.base.guard_source()
  189. def name(self) -> str:
  190. if not self.member.isidentifier():
  191. return f"getattr({self.base.name()}, {self.member!r})"
  192. return f"{self.base.name()}.{self.member}"
  193. @dataclasses.dataclass(frozen=True)
  194. class GenericAttrSource(ChainedSource):
  195. member: str
  196. def __post_init__(self) -> None:
  197. assert self.base, "Can't construct an AttrSource without a valid base source"
  198. if "." in self.member:
  199. member_parts = self.member.split(".")
  200. object.__setattr__(
  201. self, "base", AttrSource(self.base, ".".join(member_parts[:-1]))
  202. )
  203. object.__setattr__(self, "member", member_parts[-1])
  204. def reconstruct(self, codegen: "PyCodegen") -> None:
  205. codegen(self.base)
  206. codegen.extend_output(codegen.create_load_attrs(self.member))
  207. def guard_source(self) -> GuardSource:
  208. return self.base.guard_source()
  209. def name(self) -> str:
  210. return f"object.__getattribute__({self.base.name()}, {self.member!r})"
  211. # Represents obj.__dict__ where obj is a type object
  212. @dataclasses.dataclass(frozen=True)
  213. class TypeDictSource(ChainedSource):
  214. def reconstruct(self, codegen: "PyCodegen") -> None:
  215. codegen(self.base)
  216. codegen.extend_output(codegen.create_load_attrs("__dict__"))
  217. def guard_source(self) -> GuardSource:
  218. return self.base.guard_source()
  219. def name(self) -> str:
  220. # type(ob).__dict__ can return a proxy of the dict. But in the C++
  221. # guard accessor, we are use type->tp_dict which is a dict. So,
  222. # forcefully pass a dict object to ensure that the GuardManager
  223. # registers that its working on a dict object.
  224. return f"dict({self.base.name()}.__dict__)"
  225. # Represents obj.__mro__ where object is type object
  226. @dataclasses.dataclass(frozen=True)
  227. class TypeMROSource(ChainedSource):
  228. def reconstruct(self, codegen: "PyCodegen") -> None:
  229. codegen(self.base)
  230. codegen.extend_output(codegen.create_load_attrs("__mro__"))
  231. def guard_source(self) -> GuardSource:
  232. return self.base.guard_source()
  233. def name(self) -> str:
  234. return f"{self.base.name()}.__mro__"
  235. @dataclasses.dataclass(frozen=True)
  236. class LocalCellSource(Source):
  237. """
  238. Conceptually, this class is `LocalSource` for cell objects implicitly
  239. generated by Python (e.g., captured variables).
  240. """
  241. local_name: str
  242. def reconstruct(self, codegen: "PyCodegen") -> None:
  243. # Although `LOAD_FAST` and `LOAD_CLOSURE` have the same semantics,
  244. # Dynamo's bytecode transformation differentiates them slightly, so we
  245. # always emit `LOAD_CLOSURE` here.
  246. codegen.append_output(codegen.create_load_closure(self.local_name))
  247. # All the other methods are intentionally unimplemented because e.g., a
  248. # local cell object should never be used for guards.
  249. # Represents obj.__code__ where object is type object
  250. @dataclasses.dataclass(frozen=True)
  251. class CodeSource(ChainedSource):
  252. def reconstruct(self, codegen: "PyCodegen") -> None:
  253. codegen(self.base)
  254. codegen.extend_output(codegen.create_load_attrs("__code__"))
  255. def guard_source(self) -> GuardSource:
  256. return self.base.guard_source()
  257. def name(self) -> str:
  258. return f"{self.base.name()}.__code__"
  259. # Represents obj.__closure__ where object is type object
  260. @dataclasses.dataclass(frozen=True)
  261. class ClosureSource(ChainedSource):
  262. def reconstruct(self, codegen: "PyCodegen") -> None:
  263. codegen(self.base)
  264. codegen.extend_output(codegen.create_load_attrs("__closure__"))
  265. def guard_source(self) -> GuardSource:
  266. return self.base.guard_source()
  267. def name(self) -> str:
  268. return f"{self.base.name()}.__closure__"
  269. # Represents tensor.grad source. It could be represented by AttrSource as well.
  270. # But, we could access grad field on tensor directly in C++ without going
  271. # through the Python bytecodes. Therefore, we use a separate source for grad
  272. # field.
  273. @dataclasses.dataclass(frozen=True)
  274. class GradSource(ChainedSource):
  275. member: str = "grad"
  276. def reconstruct(self, codegen: "PyCodegen") -> None:
  277. codegen(self.base)
  278. codegen.extend_output(codegen.create_load_attrs(self.member))
  279. def guard_source(self) -> GuardSource:
  280. return self.base.guard_source()
  281. def name(self) -> str:
  282. return f"{self.base.name()}.{self.member}"
  283. @dataclasses.dataclass(frozen=True)
  284. class ParamBufferSource(AttrSource):
  285. def guard_source(self) -> GuardSource:
  286. return _GUARD_SOURCE_SPECIALIZED_NN_MODULE[self.base.guard_source()]
  287. # Special AttrSource to differentiate module._buffers or module._parameters
  288. @dataclasses.dataclass(frozen=True)
  289. class UnspecializedParamBufferSource(AttrSource):
  290. pass
  291. # This source is intended to be used in places where a source is needed but it is expected
  292. # that the symbol will be simplified out later on. Symbols with ephemeral sources are
  293. # prioritized to be simplified out when e.g. compared against a symbol without an ephemeral
  294. # source. Guarding on this source is an error.
  295. #
  296. # Example: During subclass view fake-ification, any close-over ViewFunc state should be
  297. # symbolicized / fake-ified to avoid invalid specialization during view replay. This source
  298. # is useful for symbols utilized in the middle of the view chain that are not expected to be
  299. # present within the final view shape metadata.
  300. @dataclasses.dataclass(frozen=True)
  301. class EphemeralSource(Source):
  302. desc: Optional[str] = None
  303. def guard_source(self) -> GuardSource:
  304. return GuardSource.EPHEMERAL
  305. def name(self) -> str:
  306. return f"<ephemeral{': ' + self.desc if self.desc is not None else ''}>"
  307. def make_guard(self, fn: Callable[..., Any]) -> Guard:
  308. raise NotImplementedError
  309. def is_ephemeral(self) -> bool:
  310. return True
  311. @dataclasses.dataclass(frozen=True)
  312. class SkipGuardSource(ChainedSource):
  313. def reconstruct(self, codegen: "PyCodegen") -> None:
  314. self.base.reconstruct(codegen)
  315. def guard_source(self) -> GuardSource:
  316. return self.base.guard_source()
  317. def name(self) -> str:
  318. return self.base.name()
  319. class TensorProperty(enum.Enum):
  320. SIZE = 0
  321. STRIDE = 1
  322. STORAGE_OFFSET = 2
  323. def method_name(self) -> str:
  324. if self is TensorProperty.SIZE:
  325. return "size"
  326. elif self is TensorProperty.STRIDE:
  327. return "stride"
  328. elif self is TensorProperty.STORAGE_OFFSET:
  329. return "storage_offset"
  330. else:
  331. raise AssertionError(f"unhandled {self}")
  332. @dataclasses.dataclass(frozen=True)
  333. class TensorPropertySource(ChainedSource):
  334. prop: TensorProperty
  335. idx: Optional[int] = None # None for STORAGE_OFFSET
  336. def __post_init__(self) -> None:
  337. assert self.base is not None
  338. if self.prop is TensorProperty.STORAGE_OFFSET:
  339. assert self.idx is None
  340. else:
  341. assert self.idx is not None
  342. def reconstruct(self, codegen: "PyCodegen") -> None:
  343. codegen.add_push_null(
  344. lambda: codegen.load_import_from(
  345. utils.__name__, f"call_{self.prop.method_name()}"
  346. )
  347. )
  348. codegen(self.base)
  349. if self.idx is not None:
  350. codegen.append_output(codegen.create_load_const(self.idx))
  351. codegen.extend_output(
  352. create_call_function(2 if self.idx is not None else 1, False)
  353. )
  354. def guard_source(self) -> GuardSource:
  355. return self.base.guard_source()
  356. def name(self) -> str:
  357. if self.prop is TensorProperty.SIZE:
  358. return f"{self.base.name()}.size()[{self.idx}]"
  359. elif self.prop is TensorProperty.STRIDE:
  360. return f"{self.base.name()}.stride()[{self.idx}]"
  361. elif self.prop is TensorProperty.STORAGE_OFFSET:
  362. assert self.idx is None
  363. return f"{self.base.name()}.storage_offset()"
  364. else:
  365. raise AssertionError(f"unhandled {self.prop}")
  366. @dataclasses.dataclass(frozen=True)
  367. class IndexedSource(ChainedSource):
  368. idx: int
  369. def __post_init__(self) -> None:
  370. assert self.base is not None
  371. def reconstruct(self, codegen: "PyCodegen") -> None:
  372. raise NotImplementedError
  373. def guard_source(self) -> GuardSource:
  374. return self.base.guard_source()
  375. def name(self) -> str:
  376. return f"({self.idx}, {self.base.name()})"
  377. @dataclasses.dataclass(frozen=True)
  378. class NegateSource(ChainedSource):
  379. def __post_init__(self) -> None:
  380. assert self.base is not None
  381. def reconstruct(self, codegen: "PyCodegen") -> None:
  382. raise NotImplementedError
  383. def guard_source(self) -> GuardSource:
  384. return self.base.guard_source()
  385. def name(self) -> str:
  386. # NB: use method call so that function stripping regexes work
  387. return f"{self.base.name()}.__neg__()"
  388. @dataclasses.dataclass(frozen=True)
  389. class ConvertIntSource(ChainedSource):
  390. def __post_init__(self) -> None:
  391. assert self.base is not None
  392. def reconstruct(self, codegen: "PyCodegen") -> None:
  393. codegen(self.base)
  394. def guard_source(self) -> GuardSource:
  395. return self.base.guard_source()
  396. def name(self) -> str:
  397. return f"cast_symbool_to_symint_guardless({self.base.name()})"
  398. @dataclasses.dataclass(frozen=True)
  399. class FlattenScriptObjectSource(ChainedSource):
  400. def __post_init__(self) -> None:
  401. assert self.base is not None
  402. def reconstruct(self, codegen: "PyCodegen") -> None:
  403. codegen(self.base)
  404. def guard_source(self) -> GuardSource:
  405. return self.base.guard_source()
  406. def name(self) -> str:
  407. return f"{self.base.name()}.__obj_flatten__()"
  408. @dataclasses.dataclass(frozen=True)
  409. class ScriptObjectQualifiedNameSource(ChainedSource):
  410. def __post_init__(self) -> None:
  411. assert self.base is not None
  412. def reconstruct(self, codegen: "PyCodegen") -> None:
  413. codegen(self.base)
  414. def guard_source(self) -> GuardSource:
  415. return self.base.guard_source()
  416. def name(self) -> str:
  417. return f"{self.base.name()}._type().qualified_name()"
  418. class AttrProxySource(ChainedSource):
  419. def reconstruct(self, codegen: "PyCodegen") -> None:
  420. codegen(self.base)
  421. def guard_source(self) -> GuardSource:
  422. return self.base.guard_source()
  423. def name(self) -> str:
  424. return f"{self.base.name()}.get_base()"
  425. @dataclasses.dataclass(frozen=True)
  426. class DefaultsSource(ChainedSource):
  427. idx_key: Union[int, str]
  428. is_kw: bool = False
  429. field: str = dataclasses.field(init=False, repr=False, compare=False)
  430. _name: str = dataclasses.field(init=False, repr=False, compare=False)
  431. def __post_init__(self) -> None:
  432. assert self.base, (
  433. "Base must be a valid source in order to properly track and guard this Defaults to its origin."
  434. )
  435. if self.is_kw:
  436. assert isinstance(self.idx_key, str)
  437. object.__setattr__(self, "field", "__kwdefaults__")
  438. object.__setattr__(
  439. self, "_name", f"{self.base.name()}.{self.field}['{self.idx_key}']"
  440. )
  441. else:
  442. assert isinstance(self.idx_key, int)
  443. object.__setattr__(self, "field", "__defaults__")
  444. object.__setattr__(
  445. self, "_name", f"{self.base.name()}.{self.field}[{self.idx_key}]"
  446. )
  447. def reconstruct(self, codegen: "PyCodegen") -> None:
  448. codegen(self.base)
  449. codegen.extend_output(codegen.create_load_attrs(self.field))
  450. codegen.append_output(codegen.create_load_const(self.idx_key))
  451. codegen.append_output(create_instruction("BINARY_SUBSCR"))
  452. def guard_source(self) -> GuardSource:
  453. return self.base.guard_source()
  454. def name(self) -> str:
  455. return self._name
  456. @dataclasses.dataclass(frozen=True)
  457. class GetItemSource(ChainedSource):
  458. index: Any
  459. index_is_slice: bool = False
  460. def __post_init__(self) -> None:
  461. assert self.base is not None
  462. if isinstance(self.index, slice):
  463. # store the hashable version of the slice so the whole GetItemSource is hashable
  464. super().__setattr__("index", self.index.__reduce__())
  465. super().__setattr__("index_is_slice", True)
  466. def reconstruct(self, codegen: "PyCodegen") -> None:
  467. codegen(self.base)
  468. if self.index_is_slice:
  469. codegen.append_output(codegen.create_load_const(self.unpack_slice()))
  470. else:
  471. codegen.append_output(codegen.create_load_const(self.index))
  472. codegen.append_output(create_instruction("BINARY_SUBSCR"))
  473. def guard_source(self) -> GuardSource:
  474. return self.base.guard_source()
  475. def unpack_slice(self) -> slice:
  476. assert self.index_is_slice
  477. slice_class, slice_args = self.index
  478. return slice_class(*slice_args)
  479. def name(self) -> str:
  480. # Index can be of following types
  481. # 1) index is a slice - example 1:4
  482. # 2) index is a constant - example string, integer
  483. assert not isinstance(self.index, Source)
  484. if self.index_is_slice:
  485. return f"{self.base.name()}[{self.unpack_slice()!r}]"
  486. else:
  487. return f"{self.base.name()}[{self.index!r}]"
  488. @dataclasses.dataclass(frozen=True)
  489. class ConstDictKeySource(ChainedSource):
  490. index: Any
  491. def guard_source(self) -> GuardSource:
  492. return self.base.guard_source()
  493. def reconstruct(self, codegen: "PyCodegen") -> None:
  494. codegen.add_push_null(
  495. lambda: codegen.load_import_from(utils.__name__, "dict_keys_getitem")
  496. )
  497. codegen(self.base)
  498. codegen.append_output(codegen.create_load_const(self.index))
  499. codegen.extend_output(create_call_function(2, False))
  500. def name(self) -> str:
  501. # The list creation will be CSE'd by PyExprCSEPass
  502. return f"list(dict.keys({self.base.name()}))[{self.index!r}]"
  503. def is_dict_key(self) -> bool:
  504. return True
  505. @dataclasses.dataclass(frozen=True)
  506. class NonSerializableSetGetItemSource(ChainedSource):
  507. index: int
  508. def __post_init__(self) -> None:
  509. from .variables import ConstantVariable
  510. assert ConstantVariable.is_literal(self.index)
  511. def guard_source(self) -> GuardSource:
  512. return self.base.guard_source()
  513. def reconstruct(self, codegen: "PyCodegen") -> None:
  514. codegen.add_push_null(
  515. lambda: codegen.load_import_from(utils.__name__, "set_getitem")
  516. )
  517. codegen(self.base)
  518. codegen.append_output(codegen.create_load_const(self.index))
  519. codegen.extend_output(create_call_function(2, False))
  520. def name(self) -> str:
  521. # set ordering might not be stable
  522. return f"list({self.base.name()})[{self.index!r}]"
  523. def is_dict_key(self) -> bool:
  524. return False
  525. # Used to access an item from the dictionary
  526. @dataclasses.dataclass(frozen=True)
  527. class DictGetItemSource(ChainedSource):
  528. # Key to access in the dictionary. It can be one of the the following types
  529. # 1) ConstDictKeySource
  530. # 2) constant - like string, integer
  531. index: Any
  532. def __post_init__(self) -> None:
  533. from .variables import ConstantVariable
  534. assert isinstance(
  535. self.index, ConstDictKeySource
  536. ) or ConstantVariable.is_literal(self.index)
  537. def guard_source(self) -> GuardSource:
  538. return self.base.guard_source()
  539. def reconstruct(self, codegen: "PyCodegen") -> None:
  540. # Load dict
  541. codegen(self.base)
  542. # Load key
  543. if isinstance(self.index, Source):
  544. codegen(self.index)
  545. else:
  546. codegen.append_output(codegen.create_load_const(self.index))
  547. codegen.append_output(create_instruction("BINARY_SUBSCR"))
  548. def name(self) -> str:
  549. if isinstance(self.index, ConstDictKeySource):
  550. return f"{self.base.name()}[{self.index.name()}]"
  551. else:
  552. return f"{self.base.name()}[{self.index!r}]"
  553. # Same as DictGetItemSource but used for dict.__getitem__ calls to ensure that
  554. # torch.compile does not run the overridden __getitem__ method
  555. @dataclasses.dataclass(frozen=True)
  556. class DictSubclassGetItemSource(ChainedSource):
  557. # Key to access in the dictionary. It can be one of the the following types
  558. # 1) ConstDictKeySource
  559. # 2) constant - like string, integer
  560. index: Any
  561. def __post_init__(self) -> None:
  562. from .variables import ConstantVariable
  563. assert isinstance(
  564. self.index, ConstDictKeySource
  565. ) or ConstantVariable.is_literal(self.index)
  566. def guard_source(self) -> GuardSource:
  567. return self.base.guard_source()
  568. def reconstruct(self, codegen: "PyCodegen") -> None:
  569. # reconstruct dict.__getitem__(dct, key)
  570. # Load dict.__getitem__
  571. codegen.add_push_null(
  572. lambda: codegen.load_import_from(utils.__name__, "dict_getitem")
  573. )
  574. # Load dict
  575. codegen(self.base)
  576. # Load key
  577. if isinstance(self.index, Source):
  578. codegen(self.index)
  579. else:
  580. codegen.append_output(codegen.create_load_const(self.index))
  581. codegen.extend_output(create_call_function(2, False))
  582. def name(self) -> str:
  583. if isinstance(self.index, ConstDictKeySource):
  584. return f"dict.__getitem__({self.base.name()}, {self.index.name()})"
  585. else:
  586. return f"{self.base.name()}[{self.index!r}]"
  587. @dataclasses.dataclass(frozen=True)
  588. class ListGetItemSource(GetItemSource):
  589. """
  590. Same as GetItemSource with reconstruct and name overridden to be list specific.
  591. """
  592. def reconstruct(self, codegen: "PyCodegen") -> None:
  593. # Reconstruct list.__getitem__(lst, index) to avoid any side effects
  594. # from possibly overridden __getitem__.
  595. # Load list.__getitem__
  596. codegen.add_push_null(
  597. lambda: codegen.load_import_from(utils.__name__, "list_getitem")
  598. )
  599. # Load the list
  600. codegen(self.base)
  601. # Load the index
  602. if self.index_is_slice:
  603. raise RuntimeError(
  604. "List[slice] is a temporary object and should not have a source"
  605. )
  606. else:
  607. codegen.append_output(codegen.create_load_const(self.index))
  608. codegen.extend_output(create_call_function(2, False))
  609. def name(self) -> str:
  610. # Index can be of following types
  611. # 1) index is a slice - example 1:4
  612. # 2) index is a constant - example string, integer
  613. assert not isinstance(self.index, Source)
  614. if self.index_is_slice:
  615. raise RuntimeError(
  616. "List[slice] is a temporary object and should not have a source"
  617. )
  618. else:
  619. return f"list.__getitem__({self.base.name()}, {self.index!r})"
  620. @dataclasses.dataclass(frozen=True)
  621. class TupleIteratorGetItemSource(GetItemSource):
  622. def reconstruct(self, codegen: "PyCodegen") -> None:
  623. codegen.add_push_null(
  624. lambda: codegen.load_import_from(utils.__name__, "tuple_iterator_getitem")
  625. )
  626. codegen(self.base)
  627. codegen.append_output(codegen.create_load_const(self.index))
  628. codegen.extend_output(create_call_function(2, False))
  629. def name(self) -> str:
  630. return f"___tuple_iterator_getitem({self.base.name()}, {self.index!r})"
  631. @dataclasses.dataclass(frozen=True)
  632. class NamedTupleFieldsSource(ChainedSource):
  633. def reconstruct(self, codegen: "PyCodegen") -> None:
  634. codegen(self.base)
  635. codegen.extend_output(codegen.create_load_attrs("_fields"))
  636. def guard_source(self) -> GuardSource:
  637. return self.base.guard_source()
  638. def name(self) -> str:
  639. return f"___namedtuple_fields({self.base.name()})"
  640. @dataclasses.dataclass(frozen=True)
  641. class DataclassFieldsSource(ChainedSource):
  642. def reconstruct(self, codegen: "PyCodegen") -> None:
  643. codegen.add_push_null(
  644. lambda: codegen.load_import_from(utils.__name__, "dataclass_fields")
  645. )
  646. codegen(self.base)
  647. codegen.extend_output(create_call_function(1, False))
  648. def guard_source(self) -> GuardSource:
  649. return self.base.guard_source()
  650. def name(self) -> str:
  651. return f"___dataclass_fields({self.base.name()})"
  652. @dataclasses.dataclass(frozen=True)
  653. class TypeSource(ChainedSource):
  654. def __post_init__(self) -> None:
  655. assert self.base is not None
  656. def reconstruct(self, codegen: "PyCodegen") -> None:
  657. codegen.add_push_null(lambda: codegen.load_import_from("builtins", "type"))
  658. codegen(self.base)
  659. codegen.extend_output(create_call_function(1, False))
  660. def guard_source(self) -> GuardSource:
  661. return self.base.guard_source()
  662. def name(self) -> str:
  663. return f"type({self.base.name()})"
  664. @dataclasses.dataclass(frozen=True)
  665. class OptimizerSource(ChainedSource):
  666. def reconstruct(self, codegen: "PyCodegen") -> None:
  667. codegen(self.base)
  668. def guard_source(self) -> GuardSource:
  669. return self.base.guard_source()
  670. def name(self) -> str:
  671. return self.base.name()
  672. @dataclasses.dataclass(frozen=True)
  673. class NNModuleSource(ChainedSource):
  674. def reconstruct(self, codegen: "PyCodegen") -> None:
  675. codegen(self.base)
  676. def guard_source(self) -> GuardSource:
  677. return _GUARD_SOURCE_SPECIALIZED_NN_MODULE[self.base.guard_source()]
  678. def name(self) -> str:
  679. return self.base.name()
  680. @dataclasses.dataclass(frozen=True)
  681. class UnspecializedNNModuleSource(NNModuleSource):
  682. def guard_source(self) -> GuardSource:
  683. return _GUARD_SOURCE_UNSPECIALIZED_NN_MODULE[self.base.guard_source()]
  684. @dataclasses.dataclass(frozen=True)
  685. class UnspecializedBuiltinNNModuleSource(UnspecializedNNModuleSource):
  686. def guard_source(self) -> GuardSource:
  687. return _GUARD_SOURCE_UNSPECIALIZED_BUILTIN_NN_MODULE[self.base.guard_source()]
  688. @dataclasses.dataclass(frozen=True)
  689. class FSDPNNModuleSource(NNModuleSource):
  690. def guard_source(self) -> GuardSource:
  691. return _GUARD_SOURCE_FSDP_MODULE[self.base.guard_source()]
  692. @dataclasses.dataclass(frozen=True)
  693. class GlobalStateSource(Source):
  694. def name(self) -> str:
  695. return ""
  696. def guard_source(self) -> GuardSource:
  697. return GuardSource.GLOBAL
  698. @dataclasses.dataclass(frozen=True)
  699. class TorchSource(Source):
  700. """Points to the actual `torch` module - used instead of GlobalSource
  701. in case the user has overridden `torch` in their local namespace"""
  702. def __init__(self, *args: Any, **kwargs: Any) -> None:
  703. super().__init__(*args, **kwargs)
  704. from .guards import GuardBuilder, install_guard
  705. install_guard(self.make_guard(GuardBuilder.ID_MATCH))
  706. def name(self) -> str:
  707. return "__import__('torch')"
  708. def reconstruct(self, codegen: "PyCodegen") -> None:
  709. codegen.extend_output(
  710. [
  711. codegen.create_load_const(0), # level
  712. create_instruction("BUILD_TUPLE", arg=0), # fromlist
  713. codegen.create_import_name("torch"),
  714. ]
  715. )
  716. def guard_source(self) -> GuardSource:
  717. return GuardSource.GLOBAL
  718. @dataclasses.dataclass(frozen=True)
  719. class TorchFunctionModeStackSource(Source):
  720. ind: int
  721. def name(self) -> str:
  722. return f"___get_torch_function_mode_stack_at({self._get_index()})"
  723. def _get_index(self) -> int:
  724. from .variables.torch_function import TorchFunctionModeStackVariable
  725. return TorchFunctionModeStackVariable.get_mode_index(self.ind)
  726. def reconstruct(self, codegen: "PyCodegen") -> None:
  727. codegen.add_push_null(
  728. lambda: codegen.load_import_from(
  729. utils.__name__, "get_torch_function_mode_stack_at"
  730. )
  731. )
  732. codegen.extend_output([codegen.create_load_const(self._get_index())])
  733. codegen.extend_output(create_call_function(1, False))
  734. def guard_source(self) -> GuardSource:
  735. return GuardSource.GLOBAL
  736. @dataclasses.dataclass(frozen=True)
  737. class ConstantSource(Source):
  738. source_name: str
  739. def reconstruct(self, codegen: "PyCodegen") -> None:
  740. codegen.append_output(codegen.create_load_global(self.source_name, add=False))
  741. def guard_source(self) -> GuardSource:
  742. return GuardSource.CONSTANT
  743. def name(self) -> str:
  744. return self.source_name
  745. def make_guard(self, fn: Any) -> Any:
  746. raise NotImplementedError
  747. @dataclasses.dataclass(frozen=True)
  748. class NumpyTensorSource(ChainedSource):
  749. def name(self) -> str:
  750. return f"___from_numpy({self.base.name()})"
  751. def guard_source(self) -> GuardSource:
  752. return self.base.guard_source()
  753. def reconstruct(self, codegen: "PyCodegen") -> None:
  754. codegen.add_push_null(lambda: codegen.load_import_from("torch", "as_tensor"))
  755. codegen(self.base)
  756. codegen.extend_output(create_call_function(1, False))
  757. @dataclasses.dataclass(frozen=True)
  758. class SubclassAttrListSource(ChainedSource):
  759. def name(self) -> str:
  760. return f"{self.base.name()}.__tensor_flatten__()[0]"
  761. def guard_source(self) -> GuardSource:
  762. return self.base.guard_source()
  763. # NB: We don't expect you to actually ever generate guards against this
  764. # source, it is ephemeral
  765. @dataclasses.dataclass(frozen=True)
  766. class FloatTensorSource(ChainedSource):
  767. def name(self) -> str:
  768. return f"___as_tensor({self.base.name()})"
  769. def guard_source(self) -> GuardSource:
  770. return self.base.guard_source()
  771. @dataclasses.dataclass(frozen=True)
  772. class CallMethodItemSource(ChainedSource):
  773. def name(self) -> str:
  774. return f"{self.base.name()}.item()"
  775. def guard_source(self) -> GuardSource:
  776. return self.base.guard_source()
  777. # This is a synthetic source that is associated with the singleton
  778. # shape env guard we always register for all frames. We get the actual
  779. # guard contents from the ambient ShapeEnv
  780. @dataclasses.dataclass(frozen=True)
  781. class ShapeEnvSource(Source):
  782. def name(self) -> str:
  783. return ""
  784. def guard_source(self) -> GuardSource:
  785. return GuardSource.SHAPE_ENV
  786. @dataclasses.dataclass(frozen=True)
  787. class BackwardStateSource(Source):
  788. def name(self) -> str:
  789. return ""
  790. def guard_source(self) -> GuardSource:
  791. return GuardSource.BACKWARD_STATE
  792. def get_local_source_name(
  793. source: Source, *, only_allow_input: bool = False
  794. ) -> Optional[str]:
  795. if isinstance(source, ChainedSource):
  796. return get_local_source_name(source.base, only_allow_input=only_allow_input)
  797. if not isinstance(source, LocalSource):
  798. return None
  799. if only_allow_input and not source.is_input:
  800. return None
  801. return source.local_name
  802. def is_from_local_source(source: Source, *, only_allow_input: bool = False) -> bool:
  803. return get_local_source_name(source, only_allow_input=only_allow_input) is not None
  804. def is_from_global_source(source: Source) -> bool:
  805. return get_global_source_name(source) is not None
  806. def get_global_source_name(source: Source) -> Optional[str]:
  807. if isinstance(source, ChainedSource):
  808. return get_global_source_name(source.base)
  809. if not isinstance(source, GlobalSource):
  810. return None
  811. return source.global_name
  812. def is_from_nonlocal_source(source: Source) -> bool:
  813. if isinstance(source, ChainedSource):
  814. return is_from_nonlocal_source(source.base)
  815. return (
  816. isinstance(source, LocalSource)
  817. and source.is_derefed_cell_contents
  818. and not source.is_input
  819. )
  820. def is_from_closure_source(source: Source) -> bool:
  821. if isinstance(source, ClosureSource):
  822. return True
  823. if isinstance(source, ChainedSource):
  824. return is_from_closure_source(source.base)
  825. return False
  826. def is_from_source(source: Source, target: Source) -> bool:
  827. if isinstance(source, ChainedSource):
  828. return is_from_source(source.base, target)
  829. return source == target
  830. @functools.lru_cache
  831. def is_from_unspecialized_nn_module_source(source: Source) -> bool:
  832. if isinstance(source, UnspecializedNNModuleSource):
  833. return True
  834. if isinstance(source, ChainedSource):
  835. return is_from_unspecialized_nn_module_source(source.base)
  836. return False
  837. @functools.lru_cache
  838. def is_from_unspecialized_builtin_nn_module_source(source: Source) -> bool:
  839. if isinstance(source, UnspecializedBuiltinNNModuleSource):
  840. return True
  841. if isinstance(source, ChainedSource):
  842. return is_from_unspecialized_builtin_nn_module_source(source.base)
  843. return False
  844. @functools.lru_cache
  845. def is_from_unspecialized_param_buffer_source(source: Source) -> bool:
  846. if isinstance(source, UnspecializedParamBufferSource):
  847. return True
  848. if isinstance(source, ChainedSource):
  849. return is_from_unspecialized_param_buffer_source(source.base)
  850. return False
  851. @functools.lru_cache
  852. def is_from_flatten_script_object_source(source: Source) -> bool:
  853. if isinstance(source, FlattenScriptObjectSource):
  854. return True
  855. elif isinstance(source, ChainedSource):
  856. return is_from_flatten_script_object_source(source.base)
  857. return False
  858. @functools.lru_cache
  859. def is_from_optimizer_source(source: Source) -> bool:
  860. if isinstance(source, OptimizerSource):
  861. return True
  862. if isinstance(source, ChainedSource):
  863. return is_from_optimizer_source(source.base)
  864. return False
  865. # TODO: can probably write a generic "test this on everything in the chain"
  866. # helper
  867. @functools.lru_cache
  868. def is_from_defaults(source: Source) -> bool:
  869. if isinstance(source, DefaultsSource):
  870. return True
  871. # Accessed with func.__kwdefaults__["foo"]
  872. if (
  873. isinstance(source, DictGetItemSource)
  874. and isinstance(source.base, AttrSource)
  875. and source.base.member == "__kwdefaults__"
  876. ):
  877. return True
  878. # Accessed with func.__defaults__[0]
  879. if (
  880. isinstance(source, GetItemSource)
  881. and isinstance(source.base, AttrSource)
  882. and source.base.member == "__defaults__"
  883. ):
  884. return True
  885. if isinstance(source, ChainedSource):
  886. return is_from_defaults(source.base)
  887. return False
  888. @functools.lru_cache
  889. def is_from_skip_guard_source(source: Source) -> bool:
  890. if isinstance(source, SkipGuardSource):
  891. return True
  892. if isinstance(source, ChainedSource):
  893. return is_from_skip_guard_source(source.base)
  894. return False