[general] Add strict=True to all zip() calls as per new ruff lint

Breakthrough · Breakthrough · commit 75243b026465 · 2026-01-21T19:55:18.000-05:00
diff --git a/benchmark/autoshot_dataset.py b/benchmark/autoshot_dataset.py
@@ -17,7 +17,7 @@ def __init__(self, dataset_dir: str):
         self._scene_files = [
             file for file in sorted(glob.glob(os.path.join(dataset_dir, "annotations", "*.txt")))
         ]
-        for video_file, scene_file in zip(self._video_files, self._scene_files):
+        for video_file, scene_file in zip(self._video_files, self._scene_files, strict=True):
             video_id = os.path.basename(video_file).split(".")[0]
             scene_id = os.path.basename(scene_file).split(".")[0]
             assert video_id == scene_id
diff --git a/benchmark/bbc_dataset.py b/benchmark/bbc_dataset.py
@@ -18,7 +18,7 @@ def __init__(self, dataset_dir: str):
             file for file in sorted(glob.glob(os.path.join(dataset_dir, "fixed", "*.txt")))
         ]
         assert len(self._video_files) == len(self._scene_files)
-        for video_file, scene_file in zip(self._video_files, self._scene_files):
+        for video_file, scene_file in zip(self._video_files, self._scene_files, strict=True):
             video_id = os.path.basename(video_file).replace("bbc_", "").split(".")[0]
             scene_id = os.path.basename(scene_file).split("-")[0]
             assert video_id == scene_id
diff --git a/scenedetect/detectors/content_detector.py b/scenedetect/detectors/content_detector.py
@@ -173,7 +173,8 @@ def _calculate_frame_score(self, timecode: FrameTimecode, frame_img: numpy.ndarr
         )
 
         frame_score: float = sum(
-            component * weight for (component, weight) in zip(score_components, self._weights)
+            component * weight
+            for (component, weight) in zip(score_components, self._weights, strict=True)
         ) / sum(abs(weight) for weight in self._weights)
 
         # Record components and frame score if needed for analysis.
diff --git a/scenedetect/detectors/transnet_v2.py b/scenedetect/detectors/transnet_v2.py
@@ -0,0 +1,213 @@
+#
+#            PySceneDetect: Python-Based Video Scene Detector
+#   -------------------------------------------------------------------
+#     [  Site:    https://scenedetect.com                           ]
+#     [  Docs:    https://scenedetect.com/docs/                     ]
+#     [  Github:  https://github.com/Breakthrough/PySceneDetect/    ]
+#
+# Copyright (C) 2014-2024 Brandon Castellano <http://www.bcastell.com>.
+# PySceneDetect is licensed under the BSD 3-Clause License; see the
+# included LICENSE file, or visit one of the above pages for details.
+#
+""":class:`TransnetV2Detector` uses a pretrained neural network.
+
+This detector is available from the command-line as the `detect-transnetv2` command.
+"""
+
+import typing as ty
+import warnings
+from enum import Enum
+from logging import getLogger
+from pathlib import Path
+
+import cv2
+import numpy as np
+
+from scenedetect.common import FrameTimecode, Timecode
+from scenedetect.detector import FlashFilter, SceneDetector
+
+logger = getLogger("pyscenedetect")
+
+
+class Detector:
+    """Turn per-frame scores into cut timestamps across successive batches.
+
+    A cut is reported at the first frame whose score rises above ``threshold``
+    right after a frame that was at or below it. The previous frame's state is
+    kept between :meth:`push` calls, so a rise that straddles two batches is
+    still detected.
+    """
+
+    def __init__(self, threshold: float, flash_filter: FlashFilter):
+        # Number of scores consumed so far over all `push` calls.
+        self.i = 0
+        # Thresholded value (0 or 1) of the most recently consumed score.
+        self.y_prev = 0
+        self.threshold = threshold
+        # Only stored here; nothing in this class reads it.
+        self.flash_filter = flash_filter
+
+    def push(self, ys: np.ndarray, ts: np.ndarray):
+        """Consume one batch of scores and return the timestamps of new cuts.
+
+        Args:
+            ys: Per-frame scores; each is compared with ``threshold`` using ``>``.
+            ts: Timestamps paired element-wise with ``ys``.
+
+        Returns:
+            A list with the entries of ``ts`` at which the thresholded score
+            changed from 0 to 1. The very first score ever pushed never
+            produces a cut.
+
+        Raises:
+            ValueError: If ``ys`` and ``ts`` have different lengths (raised by
+                ``zip(..., strict=True)``).
+        """
+        above = (ys > self.threshold).astype(np.uint8)
+
+        found = []
+        for flag, stamp in zip(above, ts, strict=True):
+            rising_edge = self.y_prev == 0 and flag == 1
+            # `self.i > 0` keeps the first score of the stream from being a cut.
+            if rising_edge and self.i > 0:
+                found.append(stamp)
+            self.y_prev = flag
+            self.i += 1
+
+        return found
+
+
+class Predictor:
+    """Run the ONNX model over overlapping 100-frame windows of a frame stream.
+
+    Frames arrive in chunks through :meth:`push`. Every call builds two
+    100-frame windows that overlap the previous chunk, runs them through the
+    model as one batch, and feeds the middle 50 scores of each window to a
+    :class:`Detector`, which turns them into cut timestamps.
+    """
+
+    def __init__(
+        self,
+        model_path: ty.Union[str, Path],
+        flash_filter: FlashFilter,
+        onnx_providers: ty.Union[ty.List[str], None],
+        threshold: float,
+    ):
+        """Create the inference session and the cut detector.
+
+        Args:
+            model_path: Location of the ONNX model file.
+            flash_filter: Passed through to the internal :class:`Detector`.
+            onnx_providers: Execution providers for ONNX Runtime. ``None``
+                selects every provider ``onnxruntime`` reports as available.
+            threshold: Score above which a frame counts as a transition.
+        """
+        # Imported lazily so the module can be imported without onnxruntime.
+        import onnxruntime as ort
+
+        ort.set_default_logger_severity(3)
+
+        if onnx_providers is None:
+            onnx_providers = ort.get_available_providers()
+
+        sess_opt = ort.SessionOptions()
+        sess_opt.log_severity_level = 3
+
+        # Some onnxruntime releases only accept `str`/`bytes` for the model.
+        if isinstance(model_path, Path):
+            model_path = str(model_path)
+
+        # The keyword is `sess_options`; any other name ends up in **kwargs and
+        # the session options would be silently ignored.
+        self.session = ort.InferenceSession(
+            model_path, sess_options=sess_opt, providers=onnx_providers
+        )
+
+        # Most recent chunk handed to `push` (kept by reference, not copied).
+        self.pixels = None
+        self.time = None
+
+        self.det = Detector(threshold, flash_filter)
+
+    def _inference(self, pixels: np.ndarray, time: np.ndarray):
+        """Score a batch of windows and return the cut timestamps found.
+
+        Args:
+            pixels: Batch of frame windows fed to the model input ``"input"``.
+            time: Timestamps matching ``pixels`` along the first two axes.
+
+        Returns:
+            List of timestamps reported by the detector, in window order.
+        """
+        pred = np.array(self.session.run(["output"], {"input": pixels}))[0]
+
+        cuts = []
+        for i in range(pred.shape[0]):
+            # Only the middle 50 positions of every 100-frame window are used;
+            # consecutive windows are offset by 50 frames, so each real frame
+            # is scored once.
+            cuts.extend(self.det.push(pred[i, 25:75, 0], time[i, 25:75]))
+        return cuts
+
+    def push(self, pixels: np.ndarray, time: np.ndarray):
+        """Feed the next chunk of frames and return newly detected cuts.
+
+        Args:
+            pixels: Frames of the chunk, indexed by frame along axis 0. The
+                slicing below assumes 100 frames per chunk.
+            time: One timestamp per frame of ``pixels``.
+
+        Returns:
+            List of timestamps (taken from ``time`` of this or the previous
+            chunk) at which a cut was detected.
+
+        Note:
+            The chunk is stored by reference for use by the next call, so the
+            caller must not overwrite it before pushing the following chunk.
+        """
+        prev_pixels, prev_time = self.pixels, self.time
+        self.pixels, self.time = pixels, time
+
+        if prev_pixels is None:
+            # First chunk: nothing precedes it, so the first frame is repeated
+            # as padding. Window 0 is padding only; window 1 is 25 padding
+            # frames followed by the first 75 frames of the chunk.
+            lead_px = np.repeat(pixels[:1], 100, axis=0)
+            lead_t = np.repeat(time[:1], 100)
+            windows = np.stack((lead_px, np.concatenate((lead_px[:25], pixels[:75]), 0)))
+            stamps = np.stack((lead_t, np.concatenate((lead_t[:25], time[:75]), 0)))
+        else:
+            # Later chunks: two windows straddling the previous and the current
+            # chunk, starting at offsets 25 and 75 of the previous chunk.
+            windows = np.stack(
+                (
+                    np.concatenate((prev_pixels[25:], pixels[:25]), 0),
+                    np.concatenate((prev_pixels[75:], pixels[:75]), 0),
+                )
+            )
+            stamps = np.stack(
+                (
+                    np.concatenate((prev_time[25:], time[:25]), 0),
+                    np.concatenate((prev_time[75:], time[:75]), 0),
+                )
+            )
+
+        return self._inference(windows, stamps)
+
+
+class TransnetV2Detector(SceneDetector):
+    """Scene detector that scores frames with an ONNX model via :class:`Predictor`.
+
+    Each incoming frame is resized to 48x27 and stored in one of two
+    alternating 100-frame buffers. Whenever a buffer fills up it is handed to
+    the predictor, and the cut timestamps that come back are converted to
+    :class:`FrameTimecode` objects and passed through a :class:`FlashFilter`.
+    """
+
+    def __init__(
+        self,
+        model_path: ty.Union[str, Path] = "tests/resources/transnetv2.onnx",
+        onnx_providers: ty.Union[ty.List[str], None] = None,
+        threshold: float = 0.5,
+        min_scene_len: int = 15,
+        filter_mode: FlashFilter.Mode = FlashFilter.Mode.MERGE,
+    ):
+        """Set up the frame buffers, the predictor and the flash filter.
+
+        Args:
+            model_path: Path of the ONNX model, forwarded to :class:`Predictor`.
+            onnx_providers: ONNX Runtime providers, forwarded to
+                :class:`Predictor`.
+            threshold: Detection threshold, forwarded to :class:`Predictor`.
+            min_scene_len: ``length`` given to the :class:`FlashFilter`
+                (currently expressed in frames, see the TODO below).
+            filter_mode: ``mode`` given to the :class:`FlashFilter`.
+        """
+        super().__init__()
+
+        # Two chunk buffers of 100 frames each; `self.j` selects the one being
+        # filled and `self.i` is the next free slot inside it.
+        self.px = np.zeros((2, 100, 27, 48, 3), dtype=np.uint8)
+        self.time = np.zeros((2, 100), dtype=np.int64)
+
+        # All-zero frame used as padding when flushing in `post_process`.
+        self.blank = np.zeros(self.px.shape[2:], dtype=np.uint8)
+
+        self.i = 0
+        self.j = 0
+
+        self.predictor = Predictor(
+            model_path=model_path,
+            flash_filter=FlashFilter(mode=filter_mode, length=min_scene_len),
+            onnx_providers=onnx_providers,
+            threshold=threshold,
+        )
+        # TODO(https://scenedetect.com/issue/168): Figure out a better long term plan for handling
+        # `min_scene_len` which should be specified in seconds, not frames.
+        self._flash_filter = FlashFilter(mode=filter_mode, length=min_scene_len)
+
+    def mk_ft(self, pts: int):
+        """Convert a presentation timestamp into a :class:`FrameTimecode`.
+
+        Uses the time base and frame rate captured from the most recent frame
+        given to :meth:`process_frame`, so it is only valid after at least one
+        frame has been processed.
+        """
+        seconds = float(pts * self.time_base)
+        return FrameTimecode(seconds, fps=self._fps)
+
+    def _filter_cuts(self, cuts) -> ty.List[FrameTimecode]:
+        """Pass raw cut timestamps through the flash filter, in order."""
+        accepted = []
+        for pts in cuts:
+            accepted.extend(self._flash_filter.filter(self.mk_ft(pts), True))
+        return accepted
+
+    def process_frame(
+        self, timecode: FrameTimecode, frame_img: np.ndarray
+    ) -> ty.List[FrameTimecode]:
+        """Buffer one frame and run the predictor once a chunk is complete.
+
+        Args:
+            timecode: Timecode of ``frame_img``; its ``pts`` is stored with the
+                frame and its time base / rate are remembered for `mk_ft`.
+            frame_img: Frame image; resized to 48x27 before being stored.
+
+        Returns:
+            Filtered cuts found by the predictor when this frame completes a
+            100-frame chunk, otherwise an empty list.
+        """
+        self.time_base = timecode.time_base
+        self._fps = timecode._rate
+
+        small = cv2.resize(frame_img, (48, 27), interpolation=cv2.INTER_AREA)
+
+        self.px[self.j, self.i] = small
+        self.time[self.j, self.i] = timecode.pts
+        self.i += 1
+
+        if self.i < 100:
+            return []
+
+        raw_cuts = self.predictor.push(self.px[self.j], self.time[self.j])
+        # Switch to the other buffer; the predictor keeps a reference to the
+        # one just pushed and reads it again on the next push.
+        self.j = 1 - self.j
+        self.i = 0
+        return self._filter_cuts(raw_cuts)
+
+    def post_process(self, timecode: FrameTimecode) -> ty.List[FrameTimecode]:
+        """Flush frames still buffered and return any remaining cuts.
+
+        The unused tail of the current buffer is filled with blank frames
+        stamped with ``timecode.pts`` and pushed, followed by one more chunk
+        consisting only of blank frames. The second push is needed because the
+        predictor scores frames with a lag relative to what it has been given.
+
+        NOTE(review): padding with all-zero frames may itself look like a
+        transition to the model at the end of the video - confirm whether
+        padding with the last real frame would be preferable.
+        """
+        final_pts = timecode.pts
+
+        self.px[self.j, self.i :] = self.blank
+        self.time[self.j, self.i :] = final_pts
+        raw_cuts = list(self.predictor.push(self.px[self.j], self.time[self.j]))
+
+        self.j = 1 - self.j
+
+        self.px[self.j, :] = self.blank
+        self.time[self.j, :] = final_pts
+        raw_cuts.extend(self.predictor.push(self.px[self.j], self.time[self.j]))
+
+        return self._filter_cuts(raw_cuts)

Original file line number	Diff line number	Diff line change
`@@ -17,7 +17,7 @@ def __init__(self, dataset_dir: str):`
`17`	`17`	`self._scene_files = [`
`18`	`18`	`file for file in sorted(glob.glob(os.path.join(dataset_dir, "annotations", "*.txt")))`
`19`	`19`	`]`
`20`		`- for video_file, scene_file in zip(self._video_files, self._scene_files):`
	`20`	`+ for video_file, scene_file in zip(self._video_files, self._scene_files, strict=True):`
`21`	`21`	`video_id = os.path.basename(video_file).split(".")[0]`
`22`	`22`	`scene_id = os.path.basename(scene_file).split(".")[0]`
`23`	`23`	`assert video_id == scene_id`
Original file line number	Diff line number	Diff line change
`@@ -18,7 +18,7 @@ def __init__(self, dataset_dir: str):`
`18`	`18`	`file for file in sorted(glob.glob(os.path.join(dataset_dir, "fixed", "*.txt")))`
`19`	`19`	`]`
`20`	`20`	`assert len(self._video_files) == len(self._scene_files)`
`21`		`- for video_file, scene_file in zip(self._video_files, self._scene_files):`
	`21`	`+ for video_file, scene_file in zip(self._video_files, self._scene_files, strict=True):`
`22`	`22`	`video_id = os.path.basename(video_file).replace("bbc_", "").split(".")[0]`
`23`	`23`	`scene_id = os.path.basename(scene_file).split("-")[0]`
`24`	`24`	`assert video_id == scene_id`
Original file line number	Diff line number	Diff line change
`@@ -173,7 +173,8 @@ def _calculate_frame_score(self, timecode: FrameTimecode, frame_img: numpy.ndarr`
`173`	`173`	`)`
`174`	`174`
`175`	`175`	`frame_score: float = sum(`
`176`		`- component * weight for (component, weight) in zip(score_components, self._weights)`
	`176`	`+ component * weight`
	`177`	`+ for (component, weight) in zip(score_components, self._weights, strict=True)`
`177`	`178`	`) / sum(abs(weight) for weight in self._weights)`
`178`	`179`
`179`	`180`	`# Record components and frame score if needed for analysis.`