@@ -18,6 +18,7 @@
 from typing import Any, Optional, TypedDict, Union

 import numpy as np
+import torch

 from .image_processing_utils import BaseImageProcessor, BatchFeature, get_size_dict
 from .image_transforms import (
@@ -44,7 +45,6 @@
 from .utils import (
     TensorType,
     auto_docstring,
-    is_torch_available,
     is_torchvision_available,
     is_torchvision_v2_available,
     is_vision_available,
@@ -56,8 +56,6 @@
 if is_vision_available():
     from .image_utils import PILImageResampling

-if is_torch_available():
-    import torch

 if is_torchvision_available():
     from .image_utils import pil_torch_interpolation_mapping
@@ -115,7 +113,7 @@ def validate_fast_preprocess_arguments(
         raise ValueError("Only channel first data format is currently supported.")


-def safe_squeeze(tensor: "torch.Tensor", axis: Optional[int] = None) -> "torch.Tensor":
+def safe_squeeze(tensor: torch.Tensor, axis: Optional[int] = None) -> torch.Tensor:
     """
     Squeezes a tensor, but only if the axis specified has dim 1.
     """
@@ -135,7 +133,7 @@ def max_across_indices(values: Iterable[Any]) -> list[Any]:
     return [max(values_i) for values_i in zip(*values)]


-def get_max_height_width(images: list["torch.Tensor"]) -> tuple[int]:
+def get_max_height_width(images: list[torch.Tensor]) -> tuple[int]:
     """
     Get the maximum height and width across all images in a batch.
     """
@@ -145,19 +143,17 @@ def get_max_height_width(images: list["torch.Tensor"]) -> tuple[int]:
     return (max_height, max_width)


-def divide_to_patches(
-    image: Union[np.array, "torch.Tensor"], patch_size: int
-) -> list[Union[np.array, "torch.Tensor"]]:
+def divide_to_patches(image: Union[np.array, torch.Tensor], patch_size: int) -> list[Union[np.array, torch.Tensor]]:
     """
     Divides an image into patches of a specified size.

     Args:
-        image (`Union[np.array, "torch.Tensor"]`):
+        image (`Union[np.array, torch.Tensor]`):
             The input image.
         patch_size (`int`):
             The size of each patch.
     Returns:
-        list: A list of Union[np.array, "torch.Tensor"] representing the patches.
+        list: A list of Union[np.array, torch.Tensor] representing the patches.
     """
     patches = []
     height, width = get_image_size(image, channel_dim=ChannelDimension.FIRST)
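A sketch of the patching contract (assuming standard non-overlapping, row-major patching, which the loop below the shown lines presumably implements):

    image = torch.zeros(3, 224, 224)
    patches = divide_to_patches(image, patch_size=112)
    assert len(patches) == 4                   # a 2x2 grid of patches
    assert patches[0].shape == (3, 112, 112)   # each patch keeps the channel dim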
@@ -241,12 +237,12 @@ def is_fast(self) -> bool:

     def resize(
         self,
-        image: "torch.Tensor",
+        image: torch.Tensor,
         size: SizeDict,
         interpolation: Optional["F.InterpolationMode"] = None,
         antialias: bool = True,
         **kwargs,
-    ) -> "torch.Tensor":
+    ) -> torch.Tensor:
         """
         Resize an image to `(size["height"], size["width"])`.

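Hedged usage sketch of the signature above; `processor` is a hypothetical fast image processor instance, and `SizeDict` is assumed to accept height/width keywords:

    resized = processor.resize(torch.rand(3, 480, 640), size=SizeDict(height=224, width=224))
    assert resized.shape == (3, 224, 224)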
@@ -295,11 +291,11 @@ def resize(

     @staticmethod
     def compile_friendly_resize(
-        image: "torch.Tensor",
+        image: torch.Tensor,
         new_size: tuple[int, int],
         interpolation: Optional["F.InterpolationMode"] = None,
         antialias: bool = True,
-    ) -> "torch.Tensor":
+    ) -> torch.Tensor:
         """
         A wrapper around `F.resize` so that it is compatible with torch.compile when the image is a uint8 tensor.
         """
@@ -316,10 +312,10 @@ def compile_friendly_resize(

     def rescale(
         self,
-        image: "torch.Tensor",
+        image: torch.Tensor,
         scale: float,
         **kwargs,
-    ) -> "torch.Tensor":
+    ) -> torch.Tensor:
         """
         Rescale an image by a scale factor. image = image * scale.

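A worked instance of the documented formula `image = image * scale`: with the conventional rescale factor of 1/255, uint8 pixel values land in [0, 1]:

    pixels = torch.tensor([0.0, 127.0, 255.0])
    assert torch.allclose(pixels * (1 / 255), torch.tensor([0.0, 127 / 255, 1.0]))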
@@ -336,11 +332,11 @@ def rescale(

     def normalize(
         self,
-        image: "torch.Tensor",
+        image: torch.Tensor,
         mean: Union[float, Iterable[float]],
         std: Union[float, Iterable[float]],
         **kwargs,
-    ) -> "torch.Tensor":
+    ) -> torch.Tensor:
         """
         Normalize an image. image = (image - image_mean) / image_std.

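A worked instance of `image = (image - image_mean) / image_std`: a value equal to the mean maps to 0, and a value one standard deviation above it maps to 1:

    x = torch.tensor([0.5, 0.726])
    out = (x - 0.5) / 0.226
    assert torch.allclose(out, torch.tensor([0.0, 1.0]))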
@@ -376,13 +372,13 @@ def _fuse_mean_std_and_rescale_factor(

     def rescale_and_normalize(
         self,
-        images: "torch.Tensor",
+        images: torch.Tensor,
         do_rescale: bool,
         rescale_factor: float,
         do_normalize: bool,
         image_mean: Union[float, list[float]],
         image_std: Union[float, list[float]],
-    ) -> "torch.Tensor":
+    ) -> torch.Tensor:
         """
         Rescale and normalize images.
         """
@@ -404,16 +400,16 @@ def rescale_and_normalize(

     def center_crop(
         self,
-        image: "torch.Tensor",
+        image: torch.Tensor,
         size: dict[str, int],
         **kwargs,
-    ) -> "torch.Tensor":
+    ) -> torch.Tensor:
         """
         Center crop an image to `(size["height"], size["width"])`. If the input size is smaller than `crop_size` along
         any edge, the image is padded with 0's and then center cropped.

         Args:
-            image (`"torch.Tensor"`):
+            image (`torch.Tensor`):
                 Image to center crop.
             size (`dict[str, int]`):
                 Size of the output image.
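An illustration of the documented pad-then-crop behavior for undersized inputs (`processor` again a hypothetical instance):

    small = torch.ones(3, 100, 100)
    out = processor.center_crop(small, size={"height": 128, "width": 128})
    assert out.shape == (3, 128, 128)
    assert out[:, 0, 0].sum() == 0  # zero-padded corner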
@@ -479,7 +475,7 @@ def _process_image(
         do_convert_rgb: Optional[bool] = None,
         input_data_format: Optional[Union[str, ChannelDimension]] = None,
         device: Optional["torch.device"] = None,
-    ) -> "torch.Tensor":
+    ) -> torch.Tensor:
         image_type = get_image_type(image)
         if image_type not in [ImageType.PIL, ImageType.TORCH, ImageType.NUMPY]:
             raise ValueError(f"Unsupported input image type {image_type}")
@@ -518,7 +514,7 @@ def _prepare_image_like_inputs(
         input_data_format: Optional[Union[str, ChannelDimension]] = None,
         device: Optional["torch.device"] = None,
         expected_ndims: int = 3,
-    ) -> list["torch.Tensor"]:
+    ) -> list[torch.Tensor]:
         """
         Prepare image-like inputs for processing.

@@ -685,7 +681,7 @@ def _preprocess_image_like_inputs(

     def _preprocess(
         self,
-        images: list["torch.Tensor"],
+        images: list[torch.Tensor],
         do_resize: bool,
         size: SizeDict,
         interpolation: Optional["F.InterpolationMode"],