
Reduced number of graphs for compiled resize #8108

Merged: 8 commits, Nov 22, 2023
27 changes: 18 additions & 9 deletions torchvision/transforms/v2/functional/_geometry.py
@@ -188,6 +188,21 @@ def resize(
     return kernel(inpt, size=size, interpolation=interpolation, max_size=max_size, antialias=antialias)


+# This is an internal helper method for resize_image. We should put it here instead of keeping it
+# inside resize_image due to torchscript.
+# uint8 dtype support for bilinear and bicubic is limited to cpu and
+# according to our benchmarks, non-AVX CPUs should still prefer u8->f32->interpolate->u8 path for bilinear
+# For torch.compile we use uint8 input and let decomposition work
Member:
I think we should be clear that the reason we always use uint8 for dynamo is simply that it doesn't support get_cpu_capability(), so with the suggested comment below, this comment is probably unnecessary

Suggested change (delete this line):
- # For torch.compile we use uint8 input and let decomposition work
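To make the point above concrete, here is a minimal illustrative sketch (not code from this PR): branching on an untraceable call like get_cpu_capability() inside a compiled function is what forces dynamo to split the graph, which is why the helper in this diff short-circuits when compiling. The exact fallback behaviour depends on the PyTorch version.

import torch

# Illustrative only: dynamo cannot trace get_cpu_capability(), so using its
# result in a Python-level branch inside a compiled function triggers a
# graph break (or an error, depending on the PyTorch version).
@torch.compile
def branch_on_cpu_capability(x: torch.Tensor) -> torch.Tensor:
    if "AVX2" in torch.backends.cpu.get_cpu_capability():  # untraceable call
        return x.float()
    return x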

Collaborator Author:

A decomposition can also lack uint8 support, so the reason we return True instead of False is that we believe the decomposition does work with the uint8 dtype.
Even if dynamo "supported" get_cpu_capability(), the heuristic of performing u8->f32->interpolate->u8 on non-AVX systems could be wrong for the compiled version.
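(For context, a minimal sketch of the u8->f32->interpolate->u8 path discussed here, assuming an NCHW uint8 input; resize_u8_via_f32 is a hypothetical name, not a torchvision function.)

import torch
import torch.nn.functional as F

# Illustrative only: the eager-mode fallback for bilinear uint8 resize on
# non-AVX CPUs; upcast to float32, resize, then round/clamp back to uint8.
def resize_u8_via_f32(image: torch.Tensor, size: tuple) -> torch.Tensor:
    out = F.interpolate(image.to(torch.float32), size=size, mode="bilinear", antialias=True)
    return out.round_().clamp_(0, 255).to(torch.uint8)

img = torch.randint(0, 256, (1, 3, 64, 64), dtype=torch.uint8)
small = resize_u8_via_f32(img, (32, 32))  # uint8 output, shape (1, 3, 32, 32)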

Member:

OK, that makes sense. I added a suggestion above to clarify that the benchmarks were only relevant for eager.

We can merge now and iterate a bit later, but do you think our conditions could be simplified a bit? I think we should be able to do something like

def _do_native_uint8_resize_on_cpu(interpolation: InterpolationMode) -> bool:
    if torch._dynamo.is_compiling():
        return True  # both bilinear and bicubic are OK, right?
    # then conditions as before

And IDK if that's true, but perhaps torch.compile works for bilinear and bicubic on GPU as well, in which case we can probably write that condition much earlier?

Collaborator Author (@vfdev-5, Nov 14, 2023):

    if torch._dynamo.is_compiling():
        return True  # both bilinear and bicubic are OK, right?

Well, right now it may be safer to return False, since pytorch/pytorch#104182 is not merged yet.

+def _do_native_uint8_resize_on_cpu(interpolation: Union[InterpolationMode, int]) -> bool:
+    if interpolation == InterpolationMode.BILINEAR:
+        if torch._dynamo.is_compiling():
+            return True
+        else:
+            return "AVX2" in torch.backends.cpu.get_cpu_capability()
+
+    return interpolation == InterpolationMode.BICUBIC
+
+
 @_register_kernel_internal(resize, torch.Tensor)
 @_register_kernel_internal(resize, tv_tensors.Image)
 def resize_image(
@@ -215,21 +230,15 @@ def resize_image(
     if (new_height, new_width) == (old_height, old_width):
         return image
     elif numel > 0:
-        image = image.reshape(-1, num_channels, old_height, old_width)
-
         dtype = image.dtype
         acceptable_dtypes = [torch.float32, torch.float64]
         if interpolation == InterpolationMode.NEAREST or interpolation == InterpolationMode.NEAREST_EXACT:
             # uint8 dtype can be included for cpu and cuda input if nearest mode
             acceptable_dtypes.append(torch.uint8)
-        elif image.device.type == "cpu":
-            # uint8 dtype support for bilinear and bicubic is limited to cpu and
-            # according to our benchmarks, non-AVX CPUs should still prefer u8->f32->interpolate->u8 path for bilinear
-            if (interpolation == InterpolationMode.BILINEAR and "AVX2" in torch.backends.cpu.get_cpu_capability()) or (
-                interpolation == InterpolationMode.BICUBIC
-            ):
-                acceptable_dtypes.append(torch.uint8)
+        elif image.device.type == "cpu" and _do_native_uint8_resize_on_cpu(interpolation):
+            acceptable_dtypes.append(torch.uint8)

+        image = image.reshape(-1, num_channels, old_height, old_width)
         strides = image.stride()
         if image.is_contiguous(memory_format=torch.channels_last) and image.shape[0] == 1 and numel != strides[0]:
             # There is a weird behaviour in torch core where the output tensor of `interpolate()` can be allocated as
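As a closing illustration of the PR title, here is a hedged sketch (not part of this PR) of how one might count the graphs dynamo produces for a compiled uint8 resize. torch._dynamo.explain reports graph and graph-break counts for a traced call; field names such as graph_count follow the PyTorch 2.1-era ExplainOutput and may differ in other releases.

import torch
import torch._dynamo
from torchvision.transforms.v2 import functional as F

# Illustrative only: trace a uint8 resize and report how many graphs (and
# graph breaks) dynamo produced; fewer graphs is the goal of this PR.
img = torch.randint(0, 256, (3, 224, 224), dtype=torch.uint8)
explanation = torch._dynamo.explain(F.resize)(img, size=[128, 128], antialias=True)
print(explanation.graph_count, explanation.graph_break_count)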