EvolvingLMMs-Lab
diff --git a/‎.gitignore‎
Lines changed: 10 additions & 0 deletions b/‎.gitignore‎
Lines changed: 10 additions & 0 deletions
diff --git a/‎llava_next/.dockerignore‎
Lines changed: 47 additions & 0 deletions b/‎llava_next/.dockerignore‎
Lines changed: 47 additions & 0 deletions
diff --git a/‎llava_next/Compressed_Video_Reader/README.md‎
Lines changed: 55 additions & 0 deletions b/‎llava_next/Compressed_Video_Reader/README.md‎
Lines changed: 55 additions & 0 deletions
diff --git a/‎llava_next/Compressed_Video_Reader/dockerfile‎
Lines changed: 53 additions & 0 deletions b/‎llava_next/Compressed_Video_Reader/dockerfile‎
Lines changed: 53 additions & 0 deletions
@@ -107,6 +107,7 @@ secret/
 *.log
 log/
 logs/
+eval_log/
 *.pid
 *.pid.lock
 *.seed
@@ -369,6 +370,7 @@ autogen/
 .openapi/
 openapi_generated/
 swagger_generated/
+.huggingface_cache/
 
 ########################################
 # Distributed / cluster training logs
@@ -506,3 +508,11 @@ ckpts
 .gitginore
 
 _codeql*
+
+# ===========================================
+# Allow example training data demo files
+# ===========================================
+!llava_next/examples/training_data_demo/output/
+!llava_next/examples/training_data_demo/output/**
+!llava_next/examples/training_data_demo/videos/
+!llava_next/examples/training_data_demo/videos/*.mp4
@@ -0,0 +1,47 @@
+# Exclude model checkpoints (very large)
+checkpoints/
+*.pt
+*.pth
+*.bin
+*.safetensors
+*.ckpt
+
+# Exclude Git-related files
+.git/
+.gitignore
+
+# Exclude Python cache
+__pycache__/
+*.py[cod]
+*$py.class
+*.so
+.Python
+*.egg-info/
+*.egg
+dist/
+build/
+eggs/
+.eggs/
+
+# Exclude editor and IDE files
+.vscode/
+.idea/
+*.swp
+*.swo
+*~
+.DS_Store
+
+# Exclude logs and temporary files
+*.log
+logs/
+wandb/
+runs/
+outputs/
+temp/
+tmp/
+
+# Exclude test data (if large)
+Compressed_Video_Reader/test_data/
+
+# Exclude build artifacts (FFmpeg will be recompiled inside the image)
+Compressed_Video_Reader/ffmpeg/ffmpeg_source/
@@ -0,0 +1,55 @@
+# Compressed Video Reader
+
+The Compressed Video Reader is designed to read motion vectors and residuals from H.264/H.265 encoded videos.
+
+## Installation
+
+To install the reader, you can run the installation script located in the project root:
+
+```shell
+bash install.sh
+```
+
+The script will perform the following tasks:
+
+1. Download the source code of FFmpeg
+2. Apply patches to the source code
+3. Configure and compile the FFmpeg package
+4. Build and install the reader
+
+To test if the reader has been successfully installed, run the following command:
+
+```bash
+# Test if the reader is installed successfully.
+cv_reader -h || echo "Installation failed!"
+```
+
+## Python API
+
+```python
+import cv_reader
+video_frames = cv_reader.read_video(video_path=path_to_video, with_residual=True)
+```
+
+## Command-Line Interface
+
+You can use the following command to extract motion vectors and residuals from a compressed video:
+
+```text
+$ cv_reader -h
+usage: Compressed Video Reader [-h] video output
+
+positional arguments:
+  video       Path to h.264/h.265 video file
+  output      Path to save extracted motion vectors and residuals
+
+optional arguments:
+  -h, --help  show this help message and exit
+```
+
+To run the extraction process on the example videos, execute the following commands:
+
+```bash
+python debug_vis_mvres.py --video ../test_videos/h264_sample.mp4 --num_frames 16 --out_dir ./h264_debug
+python debug_vis_mvres.py --video ../test_videos/h265_sample.mp4 --num_frames 16 --out_dir ./h265_debug
+```
@@ -0,0 +1,53 @@
+# Image for the Compressed Video Reader: install.sh builds FFmpeg and installs cv_reader
+FROM pytorch/pytorch:2.7.0-cuda11.8-cudnn9-runtime
+
+# Avoid interactive prompts during installation (ARG: build-time only, not kept in the runtime env)
+ARG DEBIAN_FRONTEND=noninteractive
+
+RUN apt-get update && \
+    apt-get install -y --no-install-recommends \
+        build-essential \
+        pkg-config \
+        wget \
+        # These are common dependencies used by ffmpeg/install_ffmpeg.sh
+        libass-dev \
+        libfreetype6-dev \
+        libsdl2-dev \
+        libtool \
+        libva-dev \
+        libvdpau-dev \
+        libvorbis-dev \
+        libxcb1-dev \
+        libxcb-shm0-dev \
+        libxcb-xfixes0-dev \
+        texinfo \
+        zlib1g-dev \
+        nasm \
+        yasm \
+        libx264-dev \
+        libx265-dev \
+        libnuma-dev \
+        libvpx-dev \
+        libmp3lame-dev \
+        libopus-dev \
+        libgl1 \
+        libglib2.0-0 \
+        libsm6 \
+        libxext6 \
+        libxrender1 \
+        vim \
+    && apt-get clean && rm -rf /var/lib/apt/lists/*
+
+# cv_reader CLI imports cv2, install headless version suitable for containers.
+# Installed before COPY so that source changes do not invalidate this cached layer.
+RUN pip install --no-cache-dir opencv-python-headless
+
+# /workspace is the build directory and also the default working directory at runtime
+WORKDIR /workspace
+COPY . .
+
+# Execute install.sh to install ffmpeg / cv_reader etc
+RUN bash install.sh
+
+# Start bash by default for debugging
+CMD ["bash"]