Skip to content

Commit 3afb621

Browse files
committed
Add NVIDIA distributed platform configs
1 parent 1674697 commit 3afb621

9 files changed

Lines changed: 264 additions & 0 deletions
Lines changed: 27 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,27 @@
1+
{
2+
"model_cls": "flux2_dev",
3+
"task": "t2i",
4+
"infer_steps": 50,
5+
"aspect_ratio": "16:9",
6+
"sample_guide_scale": 4.0,
7+
"vae_scale_factor": 16,
8+
"feature_caching": "None",
9+
"enable_cfg": false,
10+
"patch_size": 2,
11+
"tokenizer_max_length": 512,
12+
"text_encoder_out_layers": [
13+
10,
14+
20,
15+
30
16+
],
17+
"attn_type": "flash_attn2",
18+
"cpu_offload": false,
19+
"offload_granularity": "block",
20+
"modulate_type": "torch",
21+
"rope_type": "torch",
22+
"layer_norm_type": "torch",
23+
"rms_norm_type": "torch",
24+
"parallel": {
25+
"tensor_p_size": 8
26+
}
27+
}
Lines changed: 26 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,26 @@
1+
{
2+
"infer_steps": 50,
3+
"transformer_model_name": "480p_i2v",
4+
"fps": 24,
5+
"target_video_length": 121,
6+
"vae_stride": [
7+
4,
8+
16,
9+
16
10+
],
11+
"sample_shift": 5.0,
12+
"sample_guide_scale": 6.0,
13+
"aspect_ratio": "16:9",
14+
"enable_cfg": true,
15+
"attn_type": "flash_attn2",
16+
"modulate_type": "torch",
17+
"rope_type": "torch",
18+
"layer_norm_type": "torch",
19+
"rms_norm_type": "torch",
20+
"parallel": {
21+
"seq_p_size": 4,
22+
"seq_p_attn_type": "ulysses",
23+
"cfg_p_size": 2
24+
},
25+
"align_single_card_shape": true
26+
}
Lines changed: 24 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,24 @@
1+
{
2+
"infer_steps": 50,
3+
"aspect_ratio": "16:9",
4+
"attn_type": "flash_attn2",
5+
"enable_cfg": true,
6+
"sample_guide_scale": 4.0,
7+
"enable_cfg_renorm": true,
8+
"cfg_renorm_min": 0.0,
9+
"axes_dims_rope": [
10+
16,
11+
56,
12+
56
13+
],
14+
"dit_quant_scheme": "Default",
15+
"rms_norm_type": "torch",
16+
"modulate_type": "torch",
17+
"rope_type": "torch",
18+
"layer_norm_type": "torch",
19+
"parallel": {
20+
"seq_p_size": 4,
21+
"seq_p_attn_type": "ulysses",
22+
"cfg_p_size": 2
23+
}
24+
}
Lines changed: 57 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,57 @@
1+
{
2+
"infer_steps": 30,
3+
"target_video_length": 121,
4+
"target_height": 512,
5+
"target_width": 768,
6+
"attn_type": "flash_attn2",
7+
"sample_guide_scale": 3.0,
8+
"sample_shift": [
9+
2.05,
10+
0.95
11+
],
12+
"enable_cfg": true,
13+
"cpu_offload": false,
14+
"gemma_cpu_offload": true,
15+
"vae_cpu_offload": false,
16+
"norm_modulate_backend": "torch",
17+
"modulate_type": "torch",
18+
"rope_type": "torch",
19+
"layer_norm_type": "torch",
20+
"rms_norm_type": "torch",
21+
"num_channels_latents": 128,
22+
"fps": 24,
23+
"audio_fps": 24000,
24+
"audio_mel_bins": 16,
25+
"double_precision_rope": false,
26+
"use_tiling_vae": false,
27+
"dit_original_ckpt": "/data/nvme1/wushuo/hf_models/models/LTX-2.3/ltx-2.3-22b-dev.safetensors",
28+
"caption_proj_before_connector": true,
29+
"cross_attention_adaln": true,
30+
"apply_gated_attention": true,
31+
"mm_guider": {
32+
"enabled": true,
33+
"video": {
34+
"cfg_scale": 3.0,
35+
"stg_scale": 1.0,
36+
"stg_blocks": [
37+
28
38+
],
39+
"modality_scale": 3.0,
40+
"rescale_scale": 0.7,
41+
"skip_step": 0
42+
},
43+
"audio": {
44+
"cfg_scale": 7.0,
45+
"stg_scale": 1.0,
46+
"stg_blocks": [
47+
28
48+
],
49+
"modality_scale": 3.0,
50+
"rescale_scale": 0.7,
51+
"skip_step": 0
52+
}
53+
},
54+
"parallel": {
55+
"tensor_p_size": 8
56+
}
57+
}
Lines changed: 20 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,20 @@
1+
{
2+
"infer_steps": 50,
3+
"aspect_ratio": "16:9",
4+
"prompt_template_encode": "<|im_start|>system\nDescribe the image by detailing the color, shape, size, texture, quantity, text, spatial relationships of the objects and background:<|im_end|>\n<|im_start|>user\n{}<|im_end|>\n<|im_start|>assistant\n",
5+
"prompt_template_encode_start_idx": 34,
6+
"attn_type": "flash_attn2",
7+
"enable_cfg": true,
8+
"sample_guide_scale": 4.0,
9+
"cpu_offload": false,
10+
"offload_granularity": "model",
11+
"modulate_type": "torch",
12+
"rope_type": "torch",
13+
"layer_norm_type": "torch",
14+
"rms_norm_type": "torch",
15+
"parallel": {
16+
"seq_p_size": 4,
17+
"seq_p_attn_type": "ulysses",
18+
"cfg_p_size": 2
19+
}
20+
}
Lines changed: 30 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,30 @@
1+
{
2+
"infer_steps": 40,
3+
"target_video_length": 81,
4+
"text_len": 512,
5+
"target_height": 720,
6+
"target_width": 1280,
7+
"self_attn_1_type": "flash_attn2",
8+
"cross_attn_1_type": "flash_attn2",
9+
"cross_attn_2_type": "flash_attn2",
10+
"sample_guide_scale": [
11+
4.0,
12+
3.0
13+
],
14+
"sample_shift": 12.0,
15+
"enable_cfg": true,
16+
"cpu_offload": false,
17+
"offload_granularity": "model",
18+
"t5_cpu_offload": false,
19+
"vae_cpu_offload": false,
20+
"boundary": 0.875,
21+
"modulate_type": "torch",
22+
"rope_type": "torch",
23+
"layer_norm_type": "torch",
24+
"rms_norm_type": "torch",
25+
"parallel": {
26+
"seq_p_size": 4,
27+
"seq_p_attn_type": "ulysses",
28+
"cfg_p_size": 2
29+
}
30+
}
Lines changed: 24 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,24 @@
1+
{
2+
"infer_steps": 50,
3+
"target_video_length": 81,
4+
"text_len": 512,
5+
"target_height": 480,
6+
"target_width": 832,
7+
"self_attn_1_type": "flash_attn2",
8+
"cross_attn_1_type": "flash_attn2",
9+
"cross_attn_2_type": "flash_attn2",
10+
"sample_guide_scale": 6,
11+
"sample_shift": 8,
12+
"enable_cfg": true,
13+
"cpu_offload": false,
14+
"offload_granularity": "model",
15+
"modulate_type": "torch",
16+
"rope_type": "torch",
17+
"layer_norm_type": "torch",
18+
"rms_norm_type": "torch",
19+
"parallel": {
20+
"seq_p_size": 4,
21+
"seq_p_attn_type": "ulysses",
22+
"cfg_p_size": 2
23+
}
24+
}
Lines changed: 37 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,37 @@
1+
{
2+
"infer_steps": 4,
3+
"target_video_length": 81,
4+
"text_len": 512,
5+
"target_height": 480,
6+
"target_width": 832,
7+
"self_attn_1_type": "flash_attn2",
8+
"cross_attn_1_type": "flash_attn2",
9+
"cross_attn_2_type": "flash_attn2",
10+
"sample_guide_scale": 1,
11+
"sample_shift": 5.0,
12+
"enable_cfg": false,
13+
"cpu_offload": false,
14+
"dit_original_ckpt": "/data/nvme1/wushuo/hf_models/models/Self-Forcing/checkpoints/self_forcing_dmd.pt",
15+
"causal_rope_type": "torch",
16+
"modulate_type": "torch",
17+
"rope_type": "torch",
18+
"layer_norm_type": "torch",
19+
"rms_norm_type": "torch",
20+
"ar_config": {
21+
"local_attn_size": -1,
22+
"num_frame_per_chunk": 3,
23+
"timesteps_index": [
24+
0,
25+
179,
26+
358,
27+
679
28+
],
29+
"kv_offload": false,
30+
"async_vae_decode": false
31+
},
32+
"parallel": {
33+
"seq_p_size": 4,
34+
"cfg_p_size": 2,
35+
"seq_p_attn_type": "ulysses"
36+
}
37+
}
Lines changed: 19 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,19 @@
1+
{
2+
"aspect_ratio": "16:9",
3+
"num_channels_latents": 16,
4+
"infer_steps": 9,
5+
"attn_type": "flash_attn2",
6+
"enable_cfg": false,
7+
"sample_guide_scale": 0.0,
8+
"patch_size": 2,
9+
"cpu_offload": false,
10+
"offload_granularity": "model",
11+
"modulate_type": "torch",
12+
"rope_type": "torch",
13+
"layer_norm_type": "torch",
14+
"rms_norm_type": "torch",
15+
"parallel": {
16+
"seq_p_size": 2,
17+
"seq_p_attn_type": "ulysses"
18+
}
19+
}

0 commit comments

Comments
 (0)