Skip to content

Commit d63732d

Browse files
authored
Merge pull request #209 from LightricksResearch/sync_public_main
sync: Update tests, fp8 configs, and minor fixes
2 parents 34625c3 + 98a0ce6 commit d63732d

19 files changed

Lines changed: 1227 additions & 1216 deletions

.gitattributes

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -2,3 +2,4 @@
22
*.jpeg filter=lfs diff=lfs merge=lfs -text
33
*.png filter=lfs diff=lfs merge=lfs -text
44
*.gif filter=lfs diff=lfs merge=lfs -text
5+
tests/utils/car.png filter=lfs diff=lfs merge=lfs -text

.github/workflows/pylint.yml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -10,9 +10,9 @@ jobs:
1010
python-version: ["3.10"]
1111
steps:
1212
- name: Checkout repository and submodules
13-
uses: actions/checkout@v3
13+
uses: actions/checkout@v4
1414
- name: Set up Python ${{ matrix.python-version }}
15-
uses: actions/setup-python@v3
15+
uses: actions/setup-python@v5
1616
with:
1717
python-version: ${{ matrix.python-version }}
1818
- name: Install dependencies

.gitignore

Lines changed: 3 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -163,4 +163,6 @@ cython_debug/
163163

164164
# From inference.py
165165
outputs/
166-
video_output_*.mp4
166+
*.mp4
167+
*.png
168+
!tests/utils/car.png

README.md

Lines changed: 36 additions & 30 deletions
Large diffs are not rendered by default.

__init__.py

Whitespace-only changes.
Lines changed: 34 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -0,0 +1,34 @@
---
# Multi-scale pipeline settings for the FP8 "dev" checkpoint named in
# checkpoint_path.
pipeline_type: multi-scale
checkpoint_path: "ltxv-13b-0.9.7-dev-fp8.safetensors"
downscale_factor: 0.6666666
spatial_upscaler_model_path: "ltxv-spatial-upscaler-0.9.7.safetensors"
stg_mode: "attention_values"  # options: "attention_values", "attention_skip", "residual", "transformer_block"
decode_timestep: 0.05
decode_noise_scale: 0.025
text_encoder_model_name_or_path: "PixArt-alpha/PixArt-XL-2-1024-MS"
precision: "float8_e4m3fn"  # options: "float8_e4m3fn", "bfloat16", "mixed_precision"
sampler: "from_checkpoint"  # options: "uniform", "linear-quadratic", "from_checkpoint"
prompt_enhancement_words_threshold: 120
prompt_enhancer_image_caption_model_name_or_path: "MiaoshouAI/Florence-2-large-PromptGen-v2.0"
prompt_enhancer_llm_model_name_or_path: "unsloth/Llama-3.2-3B-Instruct"
stochastic_sampling: false

# Settings below are nested per pass; the same key names appear in both
# passes, so they must not sit at the top level (they would collide).
first_pass:
  # Every list-valued setting here has seven entries, the same length as
  # guidance_timesteps. Presumably entry i takes effect at
  # guidance_timesteps[i] -- TODO confirm against the pipeline code.
  guidance_scale: [1, 1, 6, 8, 6, 1, 1]
  stg_scale: [0, 0, 4, 4, 4, 2, 1]
  rescaling_scale: [1, 1, 0.5, 0.5, 1, 1, 1]
  guidance_timesteps: [1.0, 0.996, 0.9933, 0.9850, 0.9767, 0.9008, 0.6180]
  skip_block_list: [[], [11, 25, 35, 39], [22, 35, 39], [28], [28], [28], [28]]
  num_inference_steps: 30
  skip_final_inference_steps: 3
  cfg_star_rescale: true

second_pass:
  guidance_scale: [1]
  stg_scale: [1]
  rescaling_scale: [1]
  guidance_timesteps: [1.0]
  # NOTE(review): this is a flat list, whereas first_pass uses a list of
  # lists -- confirm the consumer accepts both shapes.
  skip_block_list: [27]
  num_inference_steps: 30
  skip_initial_inference_steps: 17
  cfg_star_rescale: true
Lines changed: 28 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -0,0 +1,28 @@
---
# Multi-scale pipeline settings for the FP8 "distilled" checkpoint named in
# checkpoint_path.
pipeline_type: multi-scale
checkpoint_path: "ltxv-13b-0.9.7-distilled-fp8.safetensors"
downscale_factor: 0.6666666
spatial_upscaler_model_path: "ltxv-spatial-upscaler-0.9.7.safetensors"
stg_mode: "attention_values"  # options: "attention_values", "attention_skip", "residual", "transformer_block"
decode_timestep: 0.05
decode_noise_scale: 0.025
text_encoder_model_name_or_path: "PixArt-alpha/PixArt-XL-2-1024-MS"
precision: "float8_e4m3fn"  # options: "float8_e4m3fn", "bfloat16", "mixed_precision"
sampler: "from_checkpoint"  # options: "uniform", "linear-quadratic", "from_checkpoint"
prompt_enhancement_words_threshold: 120
prompt_enhancer_image_caption_model_name_or_path: "MiaoshouAI/Florence-2-large-PromptGen-v2.0"
prompt_enhancer_llm_model_name_or_path: "unsloth/Llama-3.2-3B-Instruct"
stochastic_sampling: false

# Settings below are nested per pass; the same key names appear in both
# passes, so they must not sit at the top level (they would collide).
first_pass:
  # Explicit list of seven timesteps; the guidance settings are scalars.
  timesteps: [1.0000, 0.9937, 0.9875, 0.9812, 0.9750, 0.9094, 0.7250]
  guidance_scale: 1
  stg_scale: 0
  rescaling_scale: 1
  skip_block_list: [42]

second_pass:
  # The first two values (0.9094, 0.7250) repeat the last two timesteps of
  # first_pass.
  timesteps: [0.9094, 0.7250, 0.4219]
  guidance_scale: 1
  stg_scale: 0
  rescaling_scale: 1
  skip_block_list: [42]

0 commit comments

Comments
 (0)