Merge branch 'main' into issue-496-deflake-moviepy-tests

Breakthrough · web-flow · commit a68e94715049 · 2026-04-19T19:35:36.000-04:00
diff --git a/.github/actions/setup-ffmpeg/action.yml b/.github/actions/setup-ffmpeg/action.yml
@@ -1,41 +1,68 @@
 name: 'Setup FFmpeg'
+description: 'Ensure ffmpeg is available on the runner, using OS package managers as a fallback.'
 inputs:
   github-token:
-    required: true
+    description: 'Unused; kept for backward compatibility with existing callers.'
+    required: false
+    default: ''
 
 runs:
   using: 'composite'
   steps:
-    - name: Setup FFmpeg (latest)
-      id: latest
-      continue-on-error: true
-      uses: FedericoCarboni/setup-ffmpeg@v3
-      with:
-        github-token: ${{ inputs.github-token }}
+    - name: Check for preinstalled ffmpeg
+      id: check
+      shell: bash
+      run: |
+        if command -v ffmpeg >/dev/null 2>&1; then
+          echo "ffmpeg already available at: $(command -v ffmpeg)"
+          ffmpeg -version | head -n 1
+          echo "installed=true" >> "$GITHUB_OUTPUT"
+        else
+          echo "ffmpeg not found on PATH; will install via package manager."
+          echo "installed=false" >> "$GITHUB_OUTPUT"
+        fi
 
-    - name: Setup FFmpeg (7.0.0)
-      if: ${{ steps.latest.outcome == 'failure' }}
-      id: v7-0-0
-      continue-on-error: true
-      uses: FedericoCarboni/setup-ffmpeg@v3
-      with:
-        github-token: ${{ inputs.github-token }}
-        ffmpeg-version: "7.0.0"
+    - name: Install ffmpeg (Linux)
+      if: ${{ steps.check.outputs.installed == 'false' && runner.os == 'Linux' }}
+      shell: bash
+      run: |
+        for attempt in 1 2 3; do
+          echo "apt-get attempt $attempt"
+          if sudo apt-get update && sudo apt-get install -y ffmpeg; then
+            exit 0
+          fi
+          sleep 10
+        done
+        echo "Failed to install ffmpeg via apt-get after 3 attempts" >&2
+        exit 1
 
-    - name: Setup FFmpeg (6.1.1)
-      if: ${{ steps.v7-0-0.outcome == 'failure' }}
-      id: v6-1-1
-      continue-on-error: true
-      uses: FedericoCarboni/setup-ffmpeg@v3
-      with:
-        github-token: ${{ inputs.github-token }}
-        ffmpeg-version: "6.1.1"
+    - name: Install ffmpeg (macOS)
+      if: ${{ steps.check.outputs.installed == 'false' && runner.os == 'macOS' }}
+      shell: bash
+      run: |
+        for attempt in 1 2 3; do
+          echo "brew attempt $attempt"
+          if brew install ffmpeg; then
+            exit 0
+          fi
+          sleep 10
+        done
+        echo "Failed to install ffmpeg via brew after 3 attempts" >&2
+        exit 1
 
-  # The oldest version we allow falling back to must not have `continue-on-error: true`
-    - name: Setup FFmpeg (6.1.0)
-      if: ${{ steps.v6-1-1.outcome == 'failure' }}
-      id: v6-1-0
-      uses: FedericoCarboni/setup-ffmpeg@v3
-      with:
-        github-token: ${{ inputs.github-token }}
-        ffmpeg-version: "6.1.0"
+    - name: Install ffmpeg (Windows)
+      if: ${{ steps.check.outputs.installed == 'false' && runner.os == 'Windows' }}
+      shell: pwsh
+      run: |
+        for ($attempt = 1; $attempt -le 3; $attempt++) {
+          Write-Host "choco attempt $attempt"
+          choco install ffmpeg -y --no-progress
+          if ($LASTEXITCODE -eq 0) { exit 0 }
+          Start-Sleep -Seconds 10
+        }
+        Write-Error "Failed to install ffmpeg via choco after 3 attempts"
+        exit 1
+
+    - name: Verify ffmpeg
+      shell: bash
+      run: ffmpeg -version | head -n 1
diff --git a/.github/workflows/build.yml b/.github/workflows/build.yml
@@ -36,9 +36,6 @@ jobs:
       - uses: actions/checkout@v4
 
       - name: Setup FFmpeg
-        # TODO: This action currently does not work for non-x64 builders (e.g. macos-14):
-        # https://github.com/federicocarboni/setup-ffmpeg/issues/21
-        if: ${{ runner.arch == 'X64' }}
         uses: ./.github/actions/setup-ffmpeg
         with:
           github-token: ${{ secrets.GITHUB_TOKEN }}
diff --git a/scenedetect.cfg b/scenedetect.cfg
@@ -227,7 +227,8 @@
 # Compression amount for png images (0 to 9). Only affects size, not quality.
 #compression = 3
 
-# Number of frames to ignore around each scene cut when selecting frames.
+# Padding around each scene cut when selecting frames. Accepts a number of frames (1),
+# seconds with `s` suffix (0.1s), or timecode (00:00:00.100).
 #frame-margin = 1
 
 # Resize by scale factor (0.5 = half, 1.0 = same, 2.0 = double).
diff --git a/scenedetect/_cli/__init__.py b/scenedetect/_cli/__init__.py
@@ -1397,11 +1397,11 @@ def split_video_command(
 @click.option(
     "-m",
     "--frame-margin",
-    metavar="N",
+    metavar="DURATION",
     default=None,
-    type=click.INT,
-    help="Number of frames to ignore at beginning/end of scenes when saving images. Controls temporal padding on scene boundaries.%s"
-    % (USER_CONFIG.get_help_string("save-images", "num-images")),
+    type=click.STRING,
+    help="Padding around the beginning/end of each scene used when selecting which frames to extract. DURATION can be specified in frames (-m 1), in seconds with `s` suffix (-m 0.1s), or timecode (-m 00:00:00.100).%s"
+    % (USER_CONFIG.get_help_string("save-images", "frame-margin")),
 )
 @click.option(
     "--scale",
@@ -1441,7 +1441,7 @@ def save_images_command(
     quality: ty.Optional[int] = None,
     png: bool = False,
     compression: ty.Optional[int] = None,
-    frame_margin: ty.Optional[int] = None,
+    frame_margin: ty.Optional[str] = None,
     scale: ty.Optional[float] = None,
     height: ty.Optional[int] = None,
     width: ty.Optional[int] = None,
diff --git a/scenedetect/_cli/config.py b/scenedetect/_cli/config.py
@@ -412,7 +412,7 @@ class XmlFormat(Enum):
         "compression": RangeValue(3, min_val=0, max_val=9),
         "filename": "$VIDEO_NAME-Scene-$SCENE_NUMBER-$IMAGE_NUMBER",
         "format": "jpeg",
-        "frame-margin": 1,
+        "frame-margin": TimecodeValue(1),
         "height": 0,
         "num-images": 3,
         "output": None,
diff --git a/scenedetect/detector.py b/scenedetect/detector.py
@@ -24,6 +24,7 @@
     event (in, out, cut, etc...).
 """
 
+import math
 import typing as ty
 from abc import ABC, abstractmethod
 from enum import Enum
@@ -114,26 +115,48 @@ class Mode(Enum):
         SUPPRESS = 1
         """Suppress consecutive cuts until the filter length has passed."""
 
-    def __init__(self, mode: Mode, length: int):
+    def __init__(self, mode: Mode, length: ty.Union[int, float, str]):
         """
         Arguments:
             mode: The mode to use when enforcing `length`.
-            length: Number of frames to use when filtering cuts.
+            length: Minimum scene length. Accepts an `int` or digit-only `str` (number of frames),
+                `float` (seconds), or timecode `str` (e.g. ``"0.6s"`` or ``"00:00:00.600"``).
         """
         self._mode = mode
-        self._filter_length = length  # Number of frames to use for activating the filter.
-        self._filter_secs: ty.Optional[float] = None  # Threshold in seconds, computed on first use.
+        # Frame count (int) and seconds (float) representations of `length`. Exactly one is
+        # populated up front; the other is computed on the first frame once the framerate is
+        # known. Temporal inputs (float/non-digit str) populate `_filter_secs`; integer inputs
+        # (int/digit str) populate `_filter_length`.
+        self._filter_length: int = 0
+        self._filter_secs: ty.Optional[float] = None
+        if isinstance(length, float):
+            self._filter_secs = length
+        elif isinstance(length, str) and not length.strip().isdigit():
+            self._filter_secs = FrameTimecode(timecode=length, fps=100.0).seconds
+        else:
+            self._filter_length = int(length)
         self._last_above = None  # Last frame above threshold.
         self._merge_enabled = False  # Used to disable merging until at least one cut was found.
         self._merge_triggered = False  # True when the merge filter is active.
         self._merge_start = None  # Frame number where we started the merge filter.
 
     @property
     def max_behind(self) -> int:
-        return 0 if self._mode == FlashFilter.Mode.SUPPRESS else self._filter_length
+        if self._mode == FlashFilter.Mode.SUPPRESS:
+            return 0
+        if self._filter_secs is not None:
+            # Framerate is unknown here; assume up to 240fps so the event buffer is large enough.
+            return math.ceil(self._filter_secs * 240.0)
+        return self._filter_length
+
+    @property
+    def _is_disabled(self) -> bool:
+        if self._filter_secs is not None:
+            return self._filter_secs <= 0.0
+        return self._filter_length <= 0
 
     def filter(self, timecode: FrameTimecode, above_threshold: bool) -> ty.List[FrameTimecode]:
-        if not self._filter_length > 0:
+        if self._is_disabled:
             return [timecode] if above_threshold else []
         if self._last_above is None:
             self._last_above = timecode
diff --git a/scenedetect/detectors/adaptive_detector.py b/scenedetect/detectors/adaptive_detector.py
@@ -38,7 +38,7 @@ class AdaptiveDetector(ContentDetector):
     def __init__(
         self,
         adaptive_threshold: float = 3.0,
-        min_scene_len: int = 15,
+        min_scene_len: ty.Union[int, float, str] = 15,
         window_width: int = 2,
         min_content_val: float = 15.0,
         weights: ContentDetector.Components = ContentDetector.DEFAULT_COMPONENT_WEIGHTS,
@@ -49,8 +49,9 @@ def __init__(
         Arguments:
             adaptive_threshold: Threshold (float) that score ratio must exceed to trigger a
                 new scene (see frame metric adaptive_ratio in stats file).
-            min_scene_len: Once a cut is detected, this many frames must pass before a new one can
-                be added to the scene list. Can be an int or FrameTimecode type.
+            min_scene_len: Once a cut is detected, this much time must pass before a new one can
+                be added to the scene list. Accepts an int (frames), float (seconds), or
+                str (e.g. ``"0.6s"``, ``"00:00:00.600"``).
             window_width: Size of window (number of frames) before and after each frame to
                 average together in order to detect deviations from the mean. Must be at least 1.
             min_content_val: Minimum threshold (float) that the content_val must exceed in order to
diff --git a/scenedetect/detectors/content_detector.py b/scenedetect/detectors/content_detector.py
@@ -104,7 +104,7 @@ class _FrameData:
     def __init__(
         self,
         threshold: float = 27.0,
-        min_scene_len: int = 15,
+        min_scene_len: ty.Union[int, float, str] = 15,
         weights: "ContentDetector.Components" = DEFAULT_COMPONENT_WEIGHTS,
         luma_only: bool = False,
         kernel_size: ty.Optional[int] = None,
@@ -113,8 +113,9 @@ def __init__(
         """
         Arguments:
             threshold: Threshold the average change in pixel intensity must exceed to trigger a cut.
-            min_scene_len: Once a cut is detected, this many frames must pass before a new one can
-                be added to the scene list. Can be an int or FrameTimecode type.
+            min_scene_len: Once a cut is detected, this much time must pass before a new one can
+                be added to the scene list. Accepts an int (frames), float (seconds), or
+                str (e.g. ``"0.6s"``, ``"00:00:00.600"``).
             weights: Weight to place on each component when calculating frame score
                 (`content_val` in a statsfile, the value `threshold` is compared against).
             luma_only: If True, only considers changes in the luminance channel of the video.
diff --git a/scenedetect/detectors/hash_detector.py b/scenedetect/detectors/hash_detector.py
@@ -41,16 +41,17 @@ class HashDetector(SceneDetector):
         size: Size of square of low frequency data to use for the DCT
         lowpass:  How much high frequency information to filter from the DCT. A value of 2 means
             keep lower 1/2 of the frequency data, 4 means only keep 1/4, etc...
-        min_scene_len: Once a cut is detected, this many frames must pass before a new one can
-                be added to the scene list. Can be an int or FrameTimecode type.
+        min_scene_len: Once a cut is detected, this much time must pass before a new one can
+                be added to the scene list. Accepts an int (frames), float (seconds), or
+                str (e.g. ``"0.6s"``, ``"00:00:00.600"``).
     """
 
     def __init__(
         self,
         threshold: float = 0.395,
         size: int = 16,
         lowpass: int = 2,
-        min_scene_len: int = 15,
+        min_scene_len: ty.Union[int, float, str] = 15,
     ):
         super(HashDetector, self).__init__()
         self._threshold = threshold
diff --git a/scenedetect/detectors/histogram_detector.py b/scenedetect/detectors/histogram_detector.py
@@ -30,16 +30,22 @@ class HistogramDetector(SceneDetector):
 
     METRIC_KEYS = ["hist_diff"]
 
-    def __init__(self, threshold: float = 0.05, bins: int = 256, min_scene_len: int = 15):
+    def __init__(
+        self,
+        threshold: float = 0.05,
+        bins: int = 256,
+        min_scene_len: ty.Union[int, float, str] = 15,
+    ):
         """
         Arguments:
             threshold: maximum relative difference between 0.0 and 1.0 that the histograms can
                 differ. Histograms are calculated on the Y channel after converting the frame to
                 YUV, and normalized based on the number of bins. Higher dicfferences imply greater
                 change in content, so larger threshold values are less sensitive to cuts.
             bins: Number of bins to use for the histogram.
-            min_scene_len:   Once a cut is detected, this many frames must pass before a new one can
-                be added to the scene list. Can be an int or FrameTimecode type.
+            min_scene_len:   Once a cut is detected, this much time must pass before a new one can
+                be added to the scene list. Accepts an int (frames), float (seconds), or
+                str (e.g. ``"0.6s"``, ``"00:00:00.600"``).
         """
         super().__init__()
         # Internally, threshold represents the correlation between two histograms and has values
diff --git a/scenedetect/detectors/threshold_detector.py b/scenedetect/detectors/threshold_detector.py
@@ -48,7 +48,7 @@ class Method(Enum):
     def __init__(
         self,
         threshold: float = 12,
-        min_scene_len: int = 15,
+        min_scene_len: ty.Union[int, float, str] = 15,
         fade_bias: float = 0.0,
         add_final_scene: bool = False,
         method: Method = Method.FLOOR,
@@ -58,8 +58,9 @@ def __init__(
         Arguments:
             threshold:  8-bit intensity value that each pixel value (R, G, and B)
                 must be <= to in order to trigger a fade in/out.
-            min_scene_len:   Once a cut is detected, this many frames must pass before a new one can
-                be added to the scene list. Can be an int or FrameTimecode type.
+            min_scene_len:   Once a cut is detected, this much time must pass before a new one can
+                be added to the scene list. Accepts an int (frames), float (seconds), or
+                str (e.g. ``"0.6s"``, ``"00:00:00.600"``).
             fade_bias:  Float between -1.0 and +1.0 representing the percentage of
                 timecode skew for the start of a scene (-1.0 causing a cut at the
                 fade-to-black, 0.0 in the middle, and +1.0 causing the cut to be
diff --git a/scenedetect/detectors/transnet_v2.py b/scenedetect/detectors/transnet_v2.py
@@ -135,7 +135,7 @@ def __init__(
         model_path: ty.Union[str, Path] = "tests/resources/transnetv2.onnx",
         onnx_providers: ty.Union[ty.List[str], None] = None,
         threshold: float = 0.5,
-        min_scene_len: int = 15,
+        min_scene_len: ty.Union[int, float, str] = 15,
         filter_mode: FlashFilter.Mode = FlashFilter.Mode.MERGE,
     ):
         super().__init__()
diff --git a/scenedetect/output/image.py b/scenedetect/output/image.py
diff --git a/tests/test_detectors.py b/tests/test_detectors.py
diff --git a/tests/test_output.py b/tests/test_output.py
diff --git a/website/pages/changelog.md b/website/pages/changelog.md