[api] Strengthen type hints for detectors

Breakthrough · Breakthrough · commit 006fe37b48fa · 2026-04-25T13:56:37.000-04:00
diff --git a/docs/api/migration_guide.rst b/docs/api/migration_guide.rst
@@ -160,7 +160,37 @@ All backends now return presentation timestamp (PTS) backed values from ``VideoS
 ``StatsManager`` Changes
 =======================================================================
 
-The ``StatsManager`` methods ``get_metrics()``, ``set_metrics()``, and ``metrics_exist()`` now take a ``FrameTimecode`` instead of ``int`` for the frame identifier, matching the detector interface change.
+The ``StatsManager`` methods ``get_metrics()``, ``set_metrics()``, and ``metrics_exist()`` now formally accept either a ``FrameTimecode`` or a plain ``int`` frame number for the timecode argument. Passing a ``FrameTimecode`` is preferred and matches the detector interface; the ``int`` form is retained for compatibility with the deprecated ``load_from_csv()`` path, which keys metrics by integer frame number.
+
+``StatsManager.load_from_csv()`` also accepts ``os.PathLike`` (e.g. ``pathlib.Path``) in addition to ``str`` / ``bytes`` / file handles.
+
+
+=======================================================================
+``SceneDetector`` Annotation Fixes
+=======================================================================
+
+``SceneDetector.post_process()`` now declares its parameter as ``timecode: FrameTimecode`` (previously typed as ``int``). The method already received a ``FrameTimecode`` at runtime and concrete detectors (e.g. ``ThresholdDetector``, ``ContentDetector``) already used the ``FrameTimecode`` type — only the abstract-base-class annotation was inconsistent. No call-site changes are needed; this just brings the signature into agreement with the documented and actual behavior.
+
+
+=======================================================================
+``SceneManager.detect_scenes()`` Time Arguments
+=======================================================================
+
+The ``duration`` and ``end_time`` arguments now formally accept ``int`` (frames), ``float`` (seconds), ``str`` (timecode string, e.g. ``"00:00:05.000"``), or ``FrameTimecode``. The internal code already validated these forms; the annotation was previously narrower than the documented behavior.
+
+.. code:: python
+
+    # All of these were always supported at runtime; now they type-check too:
+    scene_manager.detect_scenes(video=video, end_time=15.0)         # seconds
+    scene_manager.detect_scenes(video=video, end_time=1500)         # frames
+    scene_manager.detect_scenes(video=video, end_time="00:01:00")   # timecode
+
+
+=======================================================================
+``save_images()`` Path Handling
+=======================================================================
+
+The ``output_dir`` argument of :func:`scenedetect.output.save_images` now accepts ``os.PathLike`` (e.g. ``pathlib.Path``) in addition to ``str``. No changes are required for existing string-based callers.
 
 
 =======================================================================
diff --git a/pyproject.toml b/pyproject.toml
@@ -61,6 +61,9 @@ unfixable = []
 
 [tool.pyright]
 include = ["scenedetect", "tests"]
+# Vendored third-party code: don't type-check upstream source (mirrors the ruff
+# per-file-ignores convention).
+exclude = ["scenedetect/_thirdparty"]
 # Run pyright from inside an activated venv (or pass `--pythonpath` /
 # configure your editor's interpreter) so cv2 / av / numpy / moviepy
 # resolve. Without this, pyright uses its bundled Python and the report
diff --git a/scenedetect/_cli/context.py b/scenedetect/_cli/context.py
@@ -206,6 +206,7 @@ def handle_options(
 
         # The `scenedetect` command was just started, let's initialize logging and try to load any
         # config files that were specified.
+        init_log: list = []
         try:
             init_failure = not self.config.initialized
             init_log = self.config.get_init_log()
@@ -305,9 +306,9 @@ def handle_options(
             scene_manager.auto_downscale = True
         else:
             scene_manager.auto_downscale = False
-            downscale = self.config.get_value("global", "downscale", downscale)
+            downscale_value: int = self.config.get_value("global", "downscale", downscale)
             try:
-                scene_manager.downscale = downscale
+                scene_manager.downscale = downscale_value
             except ValueError as ex:
                 logger.debug(str(ex))
                 raise click.BadParameter(str(ex), param_hint="downscale factor") from ex
@@ -532,11 +533,13 @@ def _open_video_stream(
                     framerate=framerate,
                     backend=backend,
                 )
+            duration = self.video_stream.duration
+            duration_str = f"{duration} ({duration.frame_num} frames)" if duration else "unknown"
             logger.debug(f"""Video information:
   Backend:      {type(self.video_stream).__name__}
   Resolution:   {self.video_stream.frame_size}
   Framerate:    {self.video_stream.frame_rate}
-  Duration:     {self.video_stream.duration} ({self.video_stream.duration.frame_num} frames)""")
+  Duration:     {duration_str}""")
 
         except FrameRateUnavailable as ex:
             if __debug__:
diff --git a/scenedetect/detector.py b/scenedetect/detector.py
@@ -61,7 +61,7 @@ def process_frame(
 
     # Optional Methods
 
-    def post_process(self, timecode: int) -> list[FrameTimecode]:
+    def post_process(self, timecode: FrameTimecode) -> list[FrameTimecode]:
         """Called after there are no more frames to process.
 
         Args:
diff --git a/scenedetect/detectors/adaptive_detector.py b/scenedetect/detectors/adaptive_detector.py
@@ -100,6 +100,10 @@ def get_metrics(self) -> list[str]:
     def process_frame(self, timecode: FrameTimecode, frame_img: np.ndarray) -> list[FrameTimecode]:
         super().process_frame(timecode=timecode, frame_img=frame_img)
 
+        # If the parent could not calculate a frame score, there's nothing to buffer.
+        if self._frame_score is None:
+            return []
+
         # Initialize last scene cut point at the beginning of the frames of interest.
         if self._last_cut is None:
             self._last_cut = timecode
diff --git a/scenedetect/detectors/content_detector.py b/scenedetect/detectors/content_detector.py
@@ -169,7 +169,9 @@ def _calculate_frame_score(self, timecode: FrameTimecode, frame_img: numpy.ndarr
             delta_sat=_mean_pixel_distance(sat, self._last_frame.sat),
             delta_lum=_mean_pixel_distance(lum, self._last_frame.lum),
             delta_edges=(
-                0.0 if edges is None else _mean_pixel_distance(edges, self._last_frame.edges)
+                0.0
+                if edges is None or self._last_frame.edges is None
+                else _mean_pixel_distance(edges, self._last_frame.edges)
             ),
         )
 
diff --git a/scenedetect/detectors/transnet_v2.py b/scenedetect/detectors/transnet_v2.py
@@ -107,6 +107,8 @@ def push(self, pixels: np.ndarray, time: np.ndarray):
                 ),
             )
         else:
+            # `self.time` is set in lockstep with `self.pixels` above, so it is non-None here.
+            assert self.time is not None
             c1 = self.pixels
             c2 = pixels
 
diff --git a/scenedetect/output/image.py b/scenedetect/output/image.py
@@ -28,7 +28,7 @@
     Interpolation,
     SceneList,
 )
-from scenedetect.platform import get_and_create_path, get_cv2_imwrite_params, tqdm
+from scenedetect.platform import StrPath, get_and_create_path, get_cv2_imwrite_params, tqdm
 from scenedetect.video_stream import VideoStream
 
 logger = logging.getLogger("pyscenedetect")
@@ -162,7 +162,7 @@ def run(
         self,
         video: VideoStream,
         scene_list: SceneList,
-        output_dir: str | None = None,
+        output_dir: StrPath | None = None,
         show_progress=False,
     ) -> dict[int, list[str]]:
         """Run image extraction on `video` using the current parameters. Thread-safe.
@@ -355,7 +355,7 @@ def save_images(
     image_extension: str = "jpg",
     encoder_param: int = 95,
     image_name_template: str = "$VIDEO_NAME-Scene-$SCENE_NUMBER-$IMAGE_NUMBER",
-    output_dir: str | None = None,
+    output_dir: StrPath | None = None,
     show_progress: bool | None = False,
     scale: float | None = None,
     height: int | None = None,
diff --git a/scenedetect/scene_manager.py b/scenedetect/scene_manager.py
@@ -419,8 +419,8 @@ def stop(self) -> None:
     def detect_scenes(
         self,
         video: VideoStream | None = None,
-        duration: FrameTimecode | None = None,
-        end_time: FrameTimecode | None = None,
+        duration: "int | float | str | FrameTimecode | None" = None,
+        end_time: "int | float | str | FrameTimecode | None" = None,
         frame_skip: int = 0,
         show_progress: bool = False,
         callback: ty.Callable[[np.ndarray, FrameTimecode], None] | None = None,
diff --git a/scenedetect/stats_manager.py b/scenedetect/stats_manager.py
@@ -96,19 +96,22 @@ class StatsManager:
     Only metrics consisting of `float` or `int` should be used currently.
     """
 
-    def __init__(self, base_timecode: FrameTimecode | None = None):
+    def __init__(self, base_timecode: int | FrameTimecode | None = None):
         """Initialize a new StatsManager.
 
         Arguments:
             base_timecode: Timecode associated with this object. Must not be None (default value
                 will be removed in a future release).
         """
-        # Frame metrics is a dict of frame (int): metric_dict (Dict[str, float])
-        # of each frame metric key and the value it represents (usually float).
-        self._frame_metrics: dict[FrameTimecode, dict[str, float]] = dict()
+        # Per-frame metrics, keyed by either an `int` frame number or a `FrameTimecode`. The two
+        # forms hash and compare equal for the same frame (`FrameTimecode.__hash__` returns
+        # `frame_num`), so the public methods accept either one interchangeably.
+        self._frame_metrics: dict[int | FrameTimecode, dict[str, float]] = dict()
         self._metric_keys: set[str] = set()
         self._metrics_updated: bool = False  # Flag indicating if metrics require saving.
-        self._base_timecode: FrameTimecode | None = base_timecode  # Used for timing calculations.
+        self._base_timecode: int | FrameTimecode | None = (
+            base_timecode  # Used for timing calculations.
+        )
 
     @property
     def metric_keys(self) -> ty.Iterable[str]:
@@ -120,7 +123,9 @@ def register_metrics(self, metric_keys: ty.Iterable[str]) -> None:
 
     # TODO(https://scenedetect.com/issues/507): We should support the dictionary protocol instead
     # of using this bespoke interface. It would be useful for Pandas compatibility as well.
-    def get_metrics(self, timecode: FrameTimecode, metric_keys: ty.Iterable[str]) -> list[ty.Any]:
+    def get_metrics(
+        self, timecode: int | FrameTimecode, metric_keys: ty.Iterable[str]
+    ) -> list[ty.Any]:
         """Return the requested statistics/metrics for a given timecode.
 
         Returns:
@@ -129,7 +134,7 @@ def get_metrics(self, timecode: FrameTimecode, metric_keys: ty.Iterable[str]) ->
         """
         return [self._get_metric(timecode, metric_key) for metric_key in metric_keys]
 
-    def set_metrics(self, timecode: FrameTimecode, metric_kv_dict: dict[str, ty.Any]) -> None:
+    def set_metrics(self, timecode: int | FrameTimecode, metric_kv_dict: dict[str, ty.Any]) -> None:
         """Set Metrics: Sets the provided statistics/metrics for a given frame.
 
         Arguments:
@@ -139,7 +144,7 @@ def set_metrics(self, timecode: FrameTimecode, metric_kv_dict: dict[str, ty.Any]
         for metric_key in metric_kv_dict:
             self._set_metric(timecode, metric_key, metric_kv_dict[metric_key])
 
-    def metrics_exist(self, timecode: FrameTimecode, metric_keys: ty.Iterable[str]) -> bool:
+    def metrics_exist(self, timecode: int | FrameTimecode, metric_keys: ty.Iterable[str]) -> bool:
         """Metrics Exist: Checks if the given metrics/stats exist for the given frame.
 
         Returns:
@@ -188,6 +193,10 @@ def save_to_csv(
         frame_keys = sorted(self._frame_metrics.keys())
         logger.info("Writing %d frames to CSV...", len(frame_keys))
         for frame_key in frame_keys:
+            # `frame_key` may be a bare `int` if the deprecated `load_from_csv` populated the dict.
+            # Skip such rows: a timecode cannot be recovered from a frame number without a framerate.
+            # NOTE(review): skipped rows are still included in the frame count logged above.
+            if not isinstance(frame_key, FrameTimecode):
+                continue
             csv_writer.writerow(
                 [frame_key.frame_num + 1, frame_key.get_timecode()]
                 + [str(metric) for metric in self.get_metrics(frame_key, metric_keys)]
@@ -209,7 +218,7 @@ def valid_header(row: list[str]) -> bool:
 
     # TODO(v1.0): Create a replacement for a calculation cache that functions like load_from_csv
     # did, but is better integrated with detectors for cached calculations instead of statistics.
-    def load_from_csv(self, csv_file: str | bytes | ty.TextIO) -> int | None:
+    def load_from_csv(self, csv_file: StrPath | bytes | ty.TextIO) -> int | None:
         """[DEPRECATED] DO NOT USE
 
         Load all metrics stored in a CSV file into the StatsManager instance. Will be removed in a
@@ -233,7 +242,7 @@ def load_from_csv(self, csv_file: str | bytes | ty.TextIO) -> int | None:
 
         # If we get a path instead of an open file handle, check that it exists, and if so,
         # recursively call ourselves again but with file set instead of path.
-        if isinstance(csv_file, (str, bytes, Path)):
+        if isinstance(csv_file, (str, bytes, os.PathLike)):
             if os.path.exists(csv_file):
                 with open(csv_file) as file:
                     return self.load_from_csv(csv_file=file)
@@ -288,16 +297,18 @@ def load_from_csv(self, csv_file: str | bytes | ty.TextIO) -> int | None:
 
     # TODO: Get rid of these functions and simplify the implementation of this class.
 
-    def _get_metric(self, timecode: FrameTimecode, metric_key: str) -> ty.Any | None:
+    def _get_metric(self, timecode: int | FrameTimecode, metric_key: str) -> ty.Any | None:
         if self._metric_exists(timecode, metric_key):
             return self._frame_metrics[timecode][metric_key]
         return None
 
-    def _set_metric(self, timecode: FrameTimecode, metric_key: str, metric_value: ty.Any) -> None:
+    def _set_metric(
+        self, timecode: int | FrameTimecode, metric_key: str, metric_value: ty.Any
+    ) -> None:
         self._metrics_updated = True
         if timecode not in self._frame_metrics:
             self._frame_metrics[timecode] = dict()
         self._frame_metrics[timecode][metric_key] = metric_value
 
-    def _metric_exists(self, timecode: FrameTimecode, metric_key: str) -> bool:
+    def _metric_exists(self, timecode: int | FrameTimecode, metric_key: str) -> bool:
         return timecode in self._frame_metrics and metric_key in self._frame_metrics[timecode]
diff --git a/tests/test_api.py b/tests/test_api.py
@@ -101,18 +101,19 @@ def test_api_stats_manager(test_video_file: str):
     scene_manager.detect_scenes(video=video)
     # Save per-frame statistics to disk.
     filename = f"{test_video_file}.stats.csv"
+    assert scene_manager.stats_manager is not None
     scene_manager.stats_manager.save_to_csv(csv_file=filename)
 
 
 def test_api_scene_manager_callback(test_video_file: str):
     """Demonstrate how to use a callback with the SceneManager detect_scenes method."""
     import numpy
 
-    from scenedetect import ContentDetector, SceneManager, open_video
+    from scenedetect import ContentDetector, FrameTimecode, SceneManager, open_video
 
     # Callback to invoke on the first frame of every new scene detection.
-    def on_new_scene(frame_img: numpy.ndarray, frame_num: int):
-        print(f"New scene found at frame {frame_num}.")
+    def on_new_scene(frame_img: numpy.ndarray, position: FrameTimecode):
+        print(f"New scene found at frame {position.frame_num}.")
 
     video = open_video(test_video_file)
     scene_manager = SceneManager()
@@ -127,11 +128,11 @@ def test_api_device_callback(test_video_file: str):
     import cv2
     import numpy
 
-    from scenedetect import ContentDetector, SceneManager, VideoCaptureAdapter
+    from scenedetect import ContentDetector, FrameTimecode, SceneManager, VideoCaptureAdapter
 
     # Callback to invoke on the first frame of every new scene detection.
-    def on_new_scene(frame_img: numpy.ndarray, frame_num: int):
-        print(f"New scene found at frame {frame_num}.")
+    def on_new_scene(frame_img: numpy.ndarray, position: FrameTimecode):
+        print(f"New scene found at frame {position.frame_num}.")
 
     # We open a file just for test purposes, but we can also use a device or pipe here.
     cap = cv2.VideoCapture(test_video_file)
diff --git a/tests/test_backend_opencv.py b/tests/test_backend_opencv.py
@@ -31,6 +31,7 @@ def test_open_image_sequence(test_image_sequence: str):
     sequence = VideoStreamCv2(test_image_sequence, framerate=25.0)
     assert sequence.is_seekable
     assert sequence.frame_size[0] > 0 and sequence.frame_size[1] > 0
+    assert sequence.duration is not None
     assert sequence.duration.frame_num == 30
     assert sequence.read() is not False
     sequence.seek(100)
diff --git a/tests/test_cli.py b/tests/test_cli.py
@@ -37,6 +37,7 @@
 
 import scenedetect
 from scenedetect.output import is_ffmpeg_available, is_mkvmerge_available
+from scenedetect.platform import StrPath
 from tests.helpers import invoke_cli
 
 SCENEDETECT_CMD = sys.executable + " -m scenedetect"
@@ -66,7 +67,7 @@
 
 def invoke_scenedetect(
     args: str = "",
-    output_dir: str | None = None,
+    output_dir: StrPath | None = None,
     config_file: str | None = DEFAULT_CONFIG_FILE,
     **kwargs,
 ):
@@ -536,7 +537,7 @@ def test_cli_save_images(tmp_path: Path):
     # Should detect two scenes and generate 3 images per scene with above params.
     assert len(images) == 6
     # Open one of the created images and make sure it has the correct resolution.
-    image = cv2.imread(images[0])
+    image = cv2.imread(str(images[0]))
     assert image.shape == (544, 1280, 3)
 
 
@@ -575,7 +576,7 @@ def test_cli_save_images_rotation(rotated_video_file, tmp_path: Path):
     images = [image for image in tmp_path.glob("*.jpg")]
     # Should detect two scenes and generate 3 images per scene with above params.
     assert len(images) == 6
-    image = cv2.imread(images[0])
+    image = cv2.imread(str(images[0]))
     # Note same resolution as in test_cli_save_images but rotated 90 degrees.
     assert image.shape == (1280, 544, 3)
 
diff --git a/tests/test_detectors.py b/tests/test_detectors.py
@@ -31,14 +31,16 @@
     ThresholdDetector,
 )
 
-FAST_CUT_DETECTORS: tuple[type[SceneDetector]] = (
+# Left unannotated so the type checker infers each entry's concrete `type[...]`, which the
+# parameterized construction below relies on (those calls pass detector-specific kwargs such as
+# `min_scene_len`).
+FAST_CUT_DETECTORS = (
     AdaptiveDetector,
     ContentDetector,
     HashDetector,
     HistogramDetector,
 )
 
-ALL_DETECTORS: tuple[type[SceneDetector]] = (*FAST_CUT_DETECTORS, ThresholdDetector)
+ALL_DETECTORS = (*FAST_CUT_DETECTORS, ThresholdDetector)
 
 # TODO(https://scenedetect.com/issues/53): Add a test that verifies algorithms output relatively
 # consistent frame scores regardless of resolution. This will ensure that threshold values will hold
diff --git a/tests/test_platform.py b/tests/test_platform.py
@@ -37,4 +37,4 @@ def test_long_command():
     """
     if platform.system() == "Windows":
         with pytest.raises(CommandTooLong):
-            invoke_command("x" * 2**15)
+            invoke_command(["x" * 2**15])
diff --git a/tests/test_scene_manager.py b/tests/test_scene_manager.py
@@ -198,15 +198,15 @@ def test_detect_scenes_crop(test_video_file):
 
 def test_crop_invalid():
     sm = SceneManager()
-    sm.crop = None
+    sm.crop = None  # type: ignore[assignment]
     sm.crop = (0, 0, 0, 0)
     sm.crop = (1, 1, 0, 0)
     sm.crop = (0, 0, 1, 1)
     with pytest.raises(TypeError):
-        sm.crop = 1
+        sm.crop = 1  # type: ignore[assignment]
     with pytest.raises(TypeError):
-        sm.crop = (1, 1)
+        sm.crop = (1, 1)  # type: ignore[assignment]
     with pytest.raises(TypeError):
-        sm.crop = (1, 1, 1)
+        sm.crop = (1, 1, 1)  # type: ignore[assignment]
     with pytest.raises(ValueError):
         sm.crop = (1, 1, 1, -1)
diff --git a/tests/test_timecode.py b/tests/test_timecode.py
diff --git a/tests/test_video_stream.py b/tests/test_video_stream.py
diff --git a/website/pages/changelog.md b/website/pages/changelog.md

Original file line number	Diff line number	Diff line change
`@@ -107,6 +107,8 @@ def push(self, pixels: np.ndarray, time: np.ndarray):`
`107`	`107`	`),`
`108`	`108`	`)`
`109`	`109`	`else:`
	`110`	+ # `self.time` is set in lockstep with `self.pixels` above, so it is non-None here.
	`111`	`+ assert self.time is not None`
`110`	`112`	`c1 = self.pixels`
`111`	`113`	`c2 = pixels`
`112`	`114`