File tree Expand file tree Collapse file tree
Expand file tree Collapse file tree Original file line number Diff line number Diff line change @@ -342,7 +342,6 @@ After installation completes, run the training script.
342342 num_frames=81 \
343343 num_inference_steps=50 \
344344 jax_cache_dir=${OUTPUT_DIR}/jax_cache/ \
345- max_train_steps=1000 \
346345 enable_profiler=True \
347346 dataset_save_location=${SAVE_DATASET_DIR} \
348347 remat_policy='HIDDEN_STATE_WITH_OFFLOAD' \
@@ -353,7 +352,17 @@ After installation completes, run the training script.
353352 per_device_batch_size=0.25 \
354353 ici_data_parallelism=64 \
355354 ici_fsdp_parallelism=2 \
356- ici_tensor_parallelism=1"
355+ ici_tensor_parallelism=1 \
356+ max_train_steps=5000 \
357+ eval_every=100 \
358+ eval_data_dir=${EVAL_DATA_DIR} \
359+ enable_generate_video_for_eval=True \
360+ warmup_steps_fraction=0.025" \
361+ --base-docker-image=${IMAGE_DIR} \
362+ --enable-debug-logs \
363+ --workload=${RUN_NAME} \
364+ --priority=medium \
365+ --max-restarts=0
357366 ```
358367
359368 ## Flux Training
You can’t perform that action at this time.
0 commit comments