You signed in with another tab or window. Reload to refresh your session. You signed out in another tab or window. Reload to refresh your session. You switched accounts on another tab or window. Reload to refresh your session. Dismiss alert
Copy file name to clipboard. Expand all lines: src/maxdiffusion/configs/base_wan_14b.yml
+8-2Lines changed: 8 additions & 2 deletions
Original file line number
Diff line number
Diff line change
@@ -244,7 +244,7 @@ num_eval_samples: 420
244
244
245
245
warmup_steps_fraction: 0.1
246
246
learning_rate_schedule_steps: -1 # By default the length of the schedule is set to the number of steps.
247
-
save_optimizer: False
247
+
save_optimizer: True
248
248
249
249
# However you may choose a longer schedule (learning_rate_schedule_steps > steps), in which case the training will end before
250
250
# dropping fully down. Or you may choose a shorter schedule, where the unspecified steps will have a learning rate of 0.
@@ -326,4 +326,10 @@ eval_data_dir: ""
326
326
enable_generate_video_for_eval: False # This will increase the used TPU memory.
327
327
eval_max_number_of_samples_in_bucket: 60 # The number of samples per bucket for evaluation. This is calculated by num_eval_samples / len(timesteps_list).
328
328
329
-
enable_ssim: False
329
+
enable_ssim: False
330
+
331
+
# Model surgery
332
+
override_model_dims: True
333
+
# If target_head_dim is doubled, num_heads must be halved.
0 commit comments