You signed in with another tab or window. Reload to refresh your session.You signed out in another tab or window. Reload to refresh your session.You switched accounts on another tab or window. Reload to refresh your session.Dismiss alert
# value to auto-shard based on available slices and devices.
203
206
# By default, product of the DCN axes should equal number of slices
204
207
# and product of the ICI axes should equal number of devices per slice.
205
-
dcn_data_parallelism: 1# recommended DCN axis to be auto-sharded
208
+
dcn_data_parallelism: 1
206
209
dcn_fsdp_parallelism: 1
207
-
dcn_context_parallelism: -1
210
+
dcn_context_parallelism: -1  # recommended DCN axis to be auto-sharded
208
211
dcn_tensor_parallelism: 1
209
212
ici_data_parallelism: 1
210
213
ici_fsdp_parallelism: 1
@@ -338,8 +341,8 @@ prompt: "A cat and a dog baking a cake together in a kitchen. The cat is careful
338
341
prompt_2: "A cat and a dog baking a cake together in a kitchen. The cat is carefully measuring flour, while the dog is stirring the batter with a wooden spoon. The kitchen is cozy, with sunlight streaming through the window."
339
342
negative_prompt: "Bright tones, overexposed, static, blurred details, subtitles, style, works, paintings, images, static, overall gray, worst quality, low quality, JPEG compression residue, ugly, incomplete, extra fingers, poorly drawn hands, poorly drawn faces, deformed, disfigured, misshapen limbs, fused fingers, still picture, messy background, three legs, many people in the background, walking backwards"
340
343
do_classifier_free_guidance: True
341
-
height: 480
342
-
width: 832
344
+
height: 720
345
+
width: 1280
343
346
num_frames: 81
344
347
guidance_scale: 5.0
345
348
flow_shift: 3.0
@@ -348,6 +351,10 @@ flow_shift: 3.0
348
351
# Skips the unconditional forward pass on ~35% of steps via residual compensation.
349
352
# See: FasterCache (Lv et al. 2024), WAN 2.1 paper §4.4.2
350
353
use_cfg_cache: False
354
+
355
+
# Batch positive and negative prompts in text encoder to save compute.
# value to auto-shard based on available slices and devices.
191
195
# By default, product of the DCN axes should equal number of slices
192
196
# and product of the ICI axes should equal number of devices per slice.
193
-
dcn_data_parallelism: 1# recommended DCN axis to be auto-sharded
197
+
dcn_data_parallelism: 1
194
198
dcn_fsdp_parallelism: 1
195
-
dcn_context_parallelism: -1
199
+
dcn_context_parallelism: -1  # recommended DCN axis to be auto-sharded
196
200
dcn_tensor_parallelism: 1
197
201
ici_data_parallelism: 1
198
202
ici_fsdp_parallelism: 1
@@ -304,17 +308,17 @@ prompt: "A cat and a dog baking a cake together in a kitchen. The cat is careful
304
308
prompt_2: "A cat and a dog baking a cake together in a kitchen. The cat is carefully measuring flour, while the dog is stirring the batter with a wooden spoon. The kitchen is cozy, with sunlight streaming through the window."
305
309
negative_prompt: "Bright tones, overexposed, static, blurred details, subtitles, style, works, paintings, images, static, overall gray, worst quality, low quality, JPEG compression residue, ugly, incomplete, extra fingers, poorly drawn hands, poorly drawn faces, deformed, disfigured, misshapen limbs, fused fingers, still picture, messy background, three legs, many people in the background, walking backwards"
306
310
do_classifier_free_guidance: True
307
-
height: 480
308
-
width: 832
311
+
height: 720
312
+
width: 1280
309
313
num_frames: 81
310
314
flow_shift: 3.0
311
315
312
316
# Reference for below guidance scale and boundary values: https://github.com/Wan-Video/Wan2.2/blob/main/wan/configs/wan_t2v_A14B.py
313
317
# guidance scale factor for low noise transformer
314
-
guidance_scale_low: 3.0
318
+
guidance_scale_low: 3.0
315
319
316
320
# guidance scale factor for high noise transformer
317
-
guidance_scale_high: 4.0
321
+
guidance_scale_high: 4.0
318
322
319
323
# The timestep threshold. If `t` is at or above this value,
320
324
# the `high_noise_model` is considered as the required model.
@@ -323,14 +327,19 @@ boundary_ratio: 0.875
323
327
324
328
# Diffusion CFG cache (FasterCache-style)
325
329
use_cfg_cache: False
330
+
331
+
# Batch positive and negative prompts in text encoder to save compute.
0 commit comments