Annotate integer-valued parameters that are passed as str or None; extract the OpenCV frame conversion into a helper method

Dan-Flores · Dan-Flores · commit b97e7bfb7947 · 2025-06-12T11:33:44.000-07:00
diff --git a/benchmarks/decoders/benchmark_decoders_library.py b/benchmarks/decoders/benchmark_decoders_library.py
@@ -174,11 +174,7 @@ def decode_frames(self, video_file, pts_list):
             if current_frame in approx_frame_indices:  # only decompress needed
                 ret, frame = cap.retrieve()
                 if ret:
-                    # OpenCV uses BGR, change to RGB
-                    frame = self.cv2.cvtColor(frame, self.cv2.COLOR_BGR2RGB)
-                    # Update to C, H, W
-                    frame = np.transpose(frame, (2, 0, 1))
-                    frame = torch.from_numpy(frame)
+                    frame = self.convert_frame_to_rgb_tensor(frame)
                     frames.append(frame)
 
             if len(frames) == len(approx_frame_indices):
@@ -200,11 +196,7 @@ def decode_first_n_frames(self, video_file, n):
                 raise ValueError("Could not grab video frame")
             ret, frame = cap.retrieve()
             if ret:
-                # OpenCV uses BGR, change to RGB
-                frame = self.cv2.cvtColor(frame, self.cv2.COLOR_BGR2RGB)
-                # Update to C, H, W
-                frame = np.transpose(frame, (2, 0, 1))
-                frame = torch.from_numpy(frame)
+                frame = self.convert_frame_to_rgb_tensor(frame)
                 frames.append(frame)
         cap.release()
         assert len(frames) == n
@@ -219,9 +211,23 @@ def decode_and_resize(self, video_file, pts_list, height, width, device):
         ]
         return frames
 
+    def convert_frame_to_rgb_tensor(self, frame):
+        # OpenCV returns frames in BGR channel order; convert them to RGB.
+        frame = self.cv2.cvtColor(frame, self.cv2.COLOR_BGR2RGB)
+        # Move the channel axis to the front: (H, W, C) -> (C, H, W).
+        frame = np.transpose(frame, (2, 0, 1))
+        # Convert the NumPy array to a torch tensor.
+        frame = torch.from_numpy(frame)
+        return frame
+
 
 class TorchCodecCore(AbstractDecoder):
-    def __init__(self, num_threads=None, color_conversion_library=None, device="cpu"):
+    def __init__(
+        self,
+        num_threads: str | None = None,
+        color_conversion_library=None,
+        device="cpu",
+    ):
         self._num_threads = int(num_threads) if num_threads else None
         self._color_conversion_library = color_conversion_library
         self._device = device
@@ -259,7 +265,12 @@ def decode_first_n_frames(self, video_file, n):
 
 
 class TorchCodecCoreNonBatch(AbstractDecoder):
-    def __init__(self, num_threads=None, color_conversion_library=None, device="cpu"):
+    def __init__(
+        self,
+        num_threads: str | None = None,
+        color_conversion_library=None,
+        device="cpu",
+    ):
         self._num_threads = num_threads
         self._color_conversion_library = color_conversion_library
         self._device = device
@@ -328,7 +339,12 @@ def decode_and_resize(self, video_file, pts_list, height, width, device):
 
 
 class TorchCodecCoreBatch(AbstractDecoder):
-    def __init__(self, num_threads=None, color_conversion_library=None, device="cpu"):
+    def __init__(
+        self,
+        num_threads: str | None = None,
+        color_conversion_library=None,
+        device="cpu",
+    ):
         self._print_each_iteration_time = False
         self._num_threads = int(num_threads) if num_threads else None
         self._color_conversion_library = color_conversion_library
@@ -369,10 +385,10 @@ def decode_first_n_frames(self, video_file, n):
 class TorchCodecPublic(AbstractDecoder):
     def __init__(
         self,
-        num_ffmpeg_threads=None,
+        num_ffmpeg_threads: str | None = None,
         device="cpu",
         seek_mode="exact",
-        stream_index=None,
+        stream_index: str | None = None,
     ):
         self._num_ffmpeg_threads = num_ffmpeg_threads
         self._device = device
@@ -433,7 +449,12 @@ def decode_and_resize(self, video_file, pts_list, height, width, device):
 
 
 class TorchCodecPublicNonBatch(AbstractDecoder):
-    def __init__(self, num_ffmpeg_threads=None, device="cpu", seek_mode="approximate"):
+    def __init__(
+        self,
+        num_ffmpeg_threads: str | None = None,
+        device="cpu",
+        seek_mode="approximate",
+    ):
         self._num_ffmpeg_threads = num_ffmpeg_threads
         self._device = device
         self._seek_mode = seek_mode
@@ -536,7 +557,7 @@ def decode_first_n_frames(self, video_file, n):
 
 
 class TorchAudioDecoder(AbstractDecoder):
-    def __init__(self, stream_index=None):
+    def __init__(self, stream_index: str | None = None):
         import torchaudio  # noqa: F401
 
         self.torchaudio = torchaudio