@@ -1,8 +1,6 @@
-from __future__ import annotations
-
 import re
 from dataclasses import dataclass
-from typing import cast, Sequence
+from typing import cast, Dict, List, Match, Optional, Sequence, Set, Tuple
 
 from torchgen import local
 from torchgen.api import cpp
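This import swap is the crux of the whole diff: with `from __future__ import annotations` removed, every annotation in the file is evaluated eagerly at import time, and the PEP 585/604 spellings (`tuple[str, ...]`, `str | None`) only evaluate on Python 3.9/3.10+, while the `typing` equivalents work on older interpreters too. A minimal sketch of the failure mode (not from the PR):

```python
from typing import Optional, Tuple

# The typing-module spelling is an ordinary subscriptable object, so it
# can be evaluated eagerly on Python 3.8+:
var_names: Optional[Tuple[str, ...]] = None

try:
    # This is what the old annotations did at import time once the
    # __future__ import is gone; on Python < 3.10 the `|` union of types
    # is undefined (and on 3.8, `tuple[...]` is not subscriptable).
    evaluated = eval("tuple[str, ...] | None")
except TypeError:
    evaluated = None
```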
@@ -50,16 +48,16 @@ class Derivative:
     original_formula: str
 
     # Names of the arguments for which this formula calculates derivatives.
-    var_names: tuple[str, ...]
+    var_names: Tuple[str, ...]
 
     # Saved inputs that are referenced by the formula.
-    saved_inputs: tuple[SavedAttribute, ...]
+    saved_inputs: Tuple[SavedAttribute, ...]
 
     # Saved outputs that are referenced by the formula.
-    saved_outputs: tuple[SavedAttribute, ...]
+    saved_outputs: Tuple[SavedAttribute, ...]
 
     # Gradients that are referenced by name in the formula.
-    named_gradients: set[str]
+    named_gradients: Set[str]
 
 
 # Represents a forward formula that calculates forward derivatives
@@ -73,17 +71,17 @@ class ForwardDerivative:
 
     # Name of the output arguments for which this formula calculates forward
     # derivatives
-    var_names: tuple[str, ...]
+    var_names: Tuple[str, ...]
 
     # Type of the output arguments for which this formula calculates forward
     # derivatives
-    var_types: tuple[Type, ...]
+    var_types: Tuple[Type, ...]
 
     # Inputs for which the forward derivatives are required for this formula
-    required_inputs_fw_grad: tuple[str, ...] | None
+    required_inputs_fw_grad: Optional[Tuple[str, ...]]
 
     # Inputs for which the primal is required for this formula
-    required_inputs_primal: tuple[str, ...] | None
+    required_inputs_primal: Optional[Tuple[str, ...]]
 
     # Flag to specify if this formula requires the original value of self
     # This is only used by inplace operations
@@ -118,7 +116,7 @@ class DifferentiabilityInfo:
     # The name of the generated autograd function.
     # It's set only if we will calculate a derivative, i.e.
     # 'args_with_derivatives' is not empty.
-    op: str | None
+    op: Optional[str]
 
     # The derivatives formulae for this function.
     # Note that the length of this sequence is the number of differentiable inputs
@@ -140,7 +138,7 @@ class DifferentiabilityInfo:
 
     # The named gradients that are used in any of the derivatives.
     # Invariant: all(name in available_named_gradients for name in used_named_gradients)
-    used_named_gradients: set[str]
+    used_named_gradients: Set[str]
 
     # The function's input arguments for which it calculates derivatives.
     # It's the union of 'var_names' of all 'derivatives', sorted by the
@@ -151,15 +149,15 @@ class DifferentiabilityInfo:
     non_differentiable_arg_names: Sequence[str]
 
     # Raw data read from derivatives.yaml.
-    output_differentiability: list[bool] | None
+    output_differentiability: Optional[List[bool]]
 
     # output_differentiability in derivatives.yaml can be a list of
     # conditions that express if the output is differentiable. In this case,
     # the number of conditions must match the number of outputs
     # (NB: we only support one condition right now).
     # output_differentiability gets populated with True for each condition,
     # while output_differentiability_conditions gets populated with the conditions
-    output_differentiability_conditions: list[str] | None
+    output_differentiability_conditions: Optional[List[str]]
 
     @property
     def has_derivatives(self) -> bool:
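To make the comment block above concrete, the two fields can take either of two shapes after parsing. The values below are hypothetical, not taken from derivatives.yaml:

```python
from typing import List, Optional

# Shape 1: plain booleans -- here the second output is marked
# non-differentiable outright.
output_differentiability: Optional[List[bool]] = [True, False]
output_differentiability_conditions: Optional[List[str]] = None

# Shape 2: a condition string -- the bool list is populated with True for
# each condition and the condition is kept alongside (only one condition
# is supported right now, per the comment above). The condition text here
# is made up for illustration.
output_differentiability = [True]
output_differentiability_conditions = ["grad.defined()"]
```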
@@ -172,7 +170,7 @@ def has_derivatives(self) -> bool:
     # See Note [Codegen'd {view}_copy Operators]
     def create_view_copy_from_view_derivative(
         self, g: NativeFunctionsViewGroup
-    ) -> DifferentiabilityInfo | None:
+    ) -> Optional["DifferentiabilityInfo"]:
         if g.view_copy is None:
             return None
         f = g.view_copy
@@ -203,7 +201,7 @@ def create_view_copy_from_view_derivative(
         )
 
 
-def uses_ident(info: DifferentiabilityInfo | None, ident: str) -> bool:
+def uses_ident(info: Optional[DifferentiabilityInfo], ident: str) -> bool:
     if info is None:
         return False
     for derivative in info.derivatives:
@@ -213,11 +211,11 @@ def uses_ident(info: DifferentiabilityInfo | None, ident: str) -> bool:
     return False
 
 
-def uses_retain_variables(info: DifferentiabilityInfo | None) -> bool:
+def uses_retain_variables(info: Optional[DifferentiabilityInfo]) -> bool:
     return uses_ident(info, "retain_variables")
 
 
-def uses_single_grad(info: DifferentiabilityInfo | None) -> bool:
+def uses_single_grad(info: Optional[DifferentiabilityInfo]) -> bool:
     return uses_ident(info, "grad")
 
 
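All three helpers reduce to a whole-word scan of the backward formulas for a bare identifier. A self-contained sketch, assuming `IDENT_REGEX` has the word-boundary shape `(^|\W){}($|\W)` that torchgen uses:

```python
import re

IDENT_REGEX = r"(^|\W){}($|\W)"  # assumed shape of torchgen's constant

def formula_uses(ident: str, formula: str) -> bool:
    # True only when `ident` appears as a standalone token in the formula.
    return re.search(IDENT_REGEX.format(ident), formula) is not None

assert formula_uses("grad", "grad * self.conj()")
assert not formula_uses("grad", "grads[0] * 2")  # substring, not a token
```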
@@ -255,8 +253,8 @@ class DifferentiableOutput:
 @dataclass(frozen=True)
 class NativeFunctionWithDifferentiabilityInfo:
     func: NativeFunction
-    info: dict[str, DifferentiabilityInfo] | None
-    fw_derivatives: dict[str, Sequence[ForwardDerivative]] | None
+    info: Optional[Dict[str, DifferentiabilityInfo]]
+    fw_derivatives: Optional[Dict[str, Sequence[ForwardDerivative]]]
 
 
 # TODO: Update comment below since it is out of date.
@@ -365,19 +363,19 @@ def is_reference_for_foreach(
 # TODO(crcrpar): Avoid hard coding "Default" ideally.
 def gen_foreach_derivativeinfo(
     foreach_function: NativeFunction,
-    functional_info_by_signature: dict[
-        FunctionSchema, dict[str, DifferentiabilityInfo]
+    functional_info_by_signature: Dict[
+        FunctionSchema, Dict[str, DifferentiabilityInfo]
     ],
-    non_functional_info_by_signature: dict[
-        FunctionSchema, dict[str, DifferentiabilityInfo]
+    non_functional_info_by_signature: Dict[
+        FunctionSchema, Dict[str, DifferentiabilityInfo]
     ],
     dispatch_key: str = "Default",
-) -> tuple[DifferentiabilityInfo | None, bool]:
+) -> Tuple[Optional[DifferentiabilityInfo], bool]:
     """Generate DifferentiabilityInfo for out-place foreach function, return the existing one for in-place.
 
     The second return value indicates whether the info is generated in this function.
     """
-    ref_diff_info: DifferentiabilityInfo | None = None
+    ref_diff_info: Optional[DifferentiabilityInfo] = None
 
     for function_schema, diff_info in functional_info_by_signature.items():
         if not is_reference_for_foreach(foreach_function, function_schema):
@@ -487,13 +485,13 @@ def gen_foreach_derivativeinfo(
         if arg.name in all_var_names
     ]
 
-    forward_derivatives: list[ForwardDerivative] = []
+    forward_derivatives: List[ForwardDerivative] = []
     fw_derivative: ForwardDerivative
     for fw_derivative in ref_diff_info.forward_derivatives:
-        var_names: list[str] = list(fw_derivative.var_names)  # type: ignore[no-redef]
-        var_types: list[Type] = list(fw_derivative.var_types)
-        required_inputs_fw_grad: list[str] = []
-        required_inputs_primal: list[str] = []
+        var_names: List[str] = list(fw_derivative.var_names)  # type: ignore[no-redef]
+        var_types: List[Type] = list(fw_derivative.var_types)
+        required_inputs_fw_grad: List[str] = []
+        required_inputs_primal: List[str] = []
         if fw_derivative.required_inputs_fw_grad is not None:
             required_inputs_fw_grad = list(fw_derivative.required_inputs_fw_grad)
         if fw_derivative.required_inputs_primal:
@@ -580,9 +578,9 @@ def gen_foreach_derivativeinfo(
 
 
 def match_differentiability_info(
-    native_functions: list[NativeFunction],
-    differentiability_infos: dict[FunctionSchema, dict[str, DifferentiabilityInfo]],
-) -> list[NativeFunctionWithDifferentiabilityInfo]:
+    native_functions: List[NativeFunction],
+    differentiability_infos: Dict[FunctionSchema, Dict[str, DifferentiabilityInfo]],
+) -> List[NativeFunctionWithDifferentiabilityInfo]:
     """Sets the "derivative" key on declarations to matching autograd function
     In-place functions will use the out-of-place derivative definition if there
     is no in-place specific derivative.
@@ -601,7 +599,7 @@ def match_differentiability_info(
 
     def find_info(
         f: NativeFunction,
-    ) -> tuple[dict[str, DifferentiabilityInfo] | None, bool]:
+    ) -> Tuple[Optional[Dict[str, DifferentiabilityInfo]], bool]:
         # Don't bother matching info to generated out= variants
         if "generated" in f.tags and f.func.kind() == SchemaKind.out:
             return None, False
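A hedged sketch of the fallback that `find_info` implements per the docstring above, with plain strings standing in for `FunctionSchema` (the schemas and info values are hypothetical): an exact match wins; otherwise an in-place function reuses the info registered for its out-of-place signature, and the bool reports which case occurred.

```python
from typing import Dict, Optional, Tuple

infos: Dict[str, Dict[str, str]] = {
    "abs(Tensor self) -> Tensor": {"Default": "AbsBackward"},
}

def find_info(func: str, functional_sig: str) -> Tuple[Optional[Dict[str, str]], bool]:
    if func in infos:
        return infos[func], True  # exact (e.g. in-place-specific) match
    if functional_sig in infos:
        return infos[functional_sig], False  # out-of-place fallback
    return None, False

# abs_ has no entry of its own, so it reuses abs's derivative info:
print(find_info("abs_(Tensor(a!) self) -> Tensor(a!)",
                "abs(Tensor self) -> Tensor"))
```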
@@ -655,7 +653,7 @@ def find_info(
 
         return None, False
 
-    result: list[NativeFunctionWithDifferentiabilityInfo] = []
+    result: List[NativeFunctionWithDifferentiabilityInfo] = []
     for f in native_functions:
         info_dict, is_exact_match = find_info(f)
 
@@ -679,7 +677,7 @@ def find_info(
             )
             continue
 
-        fw_derivative_dict: dict[str, Sequence[ForwardDerivative]] = {}
+        fw_derivative_dict: Dict[str, Sequence[ForwardDerivative]] = {}
         for key, info in info_dict.items():
             if not info.forward_derivatives:
                 fw_derivative_dict[key] = []
@@ -715,7 +713,7 @@ def find_info(
                 formula = fw_info.formula
 
                 def replace_self_with_original_self(formula: str, postfix: str) -> str:
-                    def repl(m: re.Match[str]) -> str:
+                    def repl(m: Match[str]) -> str:
                         return f"{m.group(1)}original_self{postfix}{m.group(2)}"
 
                     return re.sub(IDENT_REGEX.format(f"self{postfix}"), repl, formula)
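The nested `repl` above (like the `"result"` → `"self_p"` rewrite in the next hunk) keeps groups 1 and 2 so the non-word characters around the matched identifier survive the substitution. A runnable sketch under the same `IDENT_REGEX` assumption as before; `re.Match` is left unsubscripted so it runs on any interpreter, while the diff switches to `typing.Match` for its older targets:

```python
import re

IDENT_REGEX = r"(^|\W){}($|\W)"  # assumed shape of torchgen's constant

def replace_self_with_original_self(formula: str, postfix: str) -> str:
    def repl(m: re.Match) -> str:
        # Groups 1/2 are the non-word neighbors of the matched identifier.
        return f"{m.group(1)}original_self{postfix}{m.group(2)}"

    return re.sub(IDENT_REGEX.format(f"self{postfix}"), repl, formula)

print(replace_self_with_original_self("grad * self_p.conj()", "_p"))
# grad * original_self_p.conj()
```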
@@ -736,7 +734,7 @@ def repl(m: re.Match[str]) -> str:
                     formula = replace_self_with_original_self(formula, "_t")
 
                 # replace "result" from the formula by "self_p"
-                def repl(m: re.Match[str]) -> str:
+                def repl(m: Match[str]) -> str:
                     return f"{m.group(1)}self_p{m.group(2)}"
 
                 formula = re.sub(IDENT_REGEX.format("result"), repl, formula)
@@ -760,8 +758,8 @@ def repl(m: re.Match[str]) -> str:
                 # If there is a need, we can relax (2) to allow any op that has an in-place variant
                 is_single_method_on_self_t = False
                 directly_do_inplace = False
-                op_name: str | None = None
-                between_parens: str | None = None
+                op_name: Optional[str] = None
+                between_parens: Optional[str] = None
                 match = re.fullmatch(r"self_t.([\w]*)\((.*)\)", formula)
                 if match:
                     op_name, between_parens = match.group(1), match.group(2)
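For reference, the `fullmatch` above accepts only a formula that is exactly one method call on `self_t`, splitting it into the method name and the raw argument text. The formulas below are hypothetical:

```python
import re

m = re.fullmatch(r"self_t.([\w]*)\((.*)\)", "self_t.mul_(grad)")
assert m is not None
assert (m.group(1), m.group(2)) == ("mul_", "grad")

# A compound expression fails the *full* match, so the single-method
# fast path is skipped for it:
assert re.fullmatch(r"self_t.([\w]*)\((.*)\)", "self_t + grad") is None
```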
@@ -825,7 +823,7 @@ def check_parens_nest_level_gt_zero(s: str) -> bool:
 
 
 def is_differentiable(
-    name: str, type: Type, info: DifferentiabilityInfo | None
+    name: str, type: Type, info: Optional[DifferentiabilityInfo]
 ) -> bool:
     return type.is_tensor_like() and (
         info is None or name not in info.non_differentiable_arg_names
@@ -834,10 +832,10 @@ def is_differentiable(
 
 def gen_differentiable_outputs(
     fn: NativeFunctionWithDifferentiabilityInfo, key: str = "Default"
-) -> list[DifferentiableOutput]:
+) -> List[DifferentiableOutput]:
     f = fn.func
     info = fn.info[key] if fn.info else None
-    outputs: list[DifferentiableOutput] = [
+    outputs: List[DifferentiableOutput] = [
         DifferentiableOutput(
             name=name,
             type=ret.type,
@@ -852,7 +850,7 @@ def gen_differentiable_outputs(
             f"The length of output_differentiability ({len(output_differentiability)}), "
             f"does not match the number of outputs ({len(outputs)})."
         )
-    differentiable_outputs: list[DifferentiableOutput] = []
+    differentiable_outputs: List[DifferentiableOutput] = []
     if False in output_differentiability and f.func.kind() == SchemaKind.inplace:
         raise RuntimeError(
             "output_differentiability=False for inplace operation (version_counter won't get updated)"