Skip to content

Commit 7af151a

Browse files
committed
change base branch
1 parent 535c75e commit 7af151a

4 files changed

Lines changed: 1397 additions & 1307 deletions

File tree

Lines changed: 70 additions & 24 deletions
Original file line number | Diff line number | Diff line change
@@ -1,18 +1,3 @@
1-
# Copyright 2025 Google LLC
2-
3-
# Licensed under the Apache License, Version 2.0 (the "License");
4-
# you may not use this file except in compliance with the License.
5-
# You may obtain a copy of the License at
6-
7-
# https://www.apache.org/licenses/LICENSE-2.0
8-
9-
# Unless required by applicable law or agreed to in writing, software
10-
# distributed under the License is distributed on an "AS IS" BASIS,
11-
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12-
# See the License for the specific language governing permissions and
13-
# limitations under the License.
14-
15-
161
#hardware
172
hardware: 'tpu'
183
skip_jax_distributed_system: False
@@ -25,30 +10,91 @@ activations_dtype: 'bfloat16'
2510
run_name: ''
2611
output_dir: 'ltx-video-output'
2712
save_config_to_gcs: False
13+
#Checkpoints
14+
text_encoder_model_name_or_path: "ariG23498/t5-v1-1-xxl-flax"
15+
prompt_enhancer_image_caption_model_name_or_path: "MiaoshouAI/Florence-2-large-PromptGen-v2.0"
16+
prompt_enhancer_llm_model_name_or_path: "unsloth/Llama-3.2-3B-Instruct"
17+
frame_rate: 30
18+
max_sequence_length: 512
19+
sampler: "from_checkpoint"
20+
21+
2822

29-
#parallelism
30-
mesh_axes: ['data', 'fsdp', 'tensor']
23+
24+
25+
# Generation parameters
26+
pipeline_type: multi-scale
27+
prompt: ["A man in a dimly lit room talks on a vintage telephone, hangs up, and looks down with a sad expression. He holds the black rotary phone to his right ear with his right hand, his left hand holding a rocks glass with amber liquid. He wears a brown suit jacket over a white shirt, and a gold ring on his left ring finger. His short hair is neatly combed, and he has light skin with visible wrinkles around his eyes. The camera remains stationary, focused on his face and upper body. The room is dark, lit only by a warm light source off-screen to the left, casting shadows on the wall behind him. The scene appears to be from a movie.", "A man walks towards a window, looks out, and then turns around. He has short, dark hair, dark skin, and is wearing a brown coat over a red and gray scarf. He walks from left to right towards a window, his gaze fixed on something outside. The camera follows him from behind at a medium distance. The room is brightly lit, with white walls and a large window covered by a white curtain. As he approaches the window, he turns his head slightly to the left, then back to the right. He then turns his entire body to the right, facing the window. The camera remains stationary as he stands in front of the window. The scene is captured in real-life footage."]
28+
height: 512
29+
width: 512
30+
num_frames: 88 #344
31+
flow_shift: 5.0
32+
downscale_factor: 0.6666666
33+
spatial_upscaler_model_path: "ltxv-spatial-upscaler-0.9.7.safetensors"
34+
prompt_enhancement_words_threshold: 120
35+
# guidance_scale: [1, 1, 6, 8, 6, 1, 1] #4.5
36+
# stg_scale: [0, 0, 4, 4, 4, 2, 1] #1.0
37+
# rescaling_scale: [1, 1, 0.5, 0.5, 1, 1, 1] #0.7
38+
# num_inference_steps: 30
39+
# skip_final_inference_steps: 3
40+
# skip_initial_inference_steps: 0
41+
# guidance_timesteps: [1.0, 0.996, 0.9933, 0.9850, 0.9767, 0.9008, 0.6180]
42+
# skip_block_list: [[], [11, 25, 35, 39], [22, 35, 39], [28], [28], [28], [28]]
43+
stg_mode: "attention_values"
44+
decode_timestep: 0.05
45+
decode_noise_scale: 0.025
46+
# cfg_star_rescale: True
47+
48+
49+
first_pass:
50+
guidance_scale: [1, 1, 6, 8, 6, 1, 1]
51+
stg_scale: [0, 0, 4, 4, 4, 2, 1]
52+
rescaling_scale: [1, 1, 0.5, 0.5, 1, 1, 1]
53+
guidance_timesteps: [1.0, 0.996, 0.9933, 0.9850, 0.9767, 0.9008, 0.6180]
54+
skip_block_list: [[], [11, 25, 35, 39], [22, 35, 39], [28], [28], [28], [28]]
55+
num_inference_steps: 30
56+
skip_final_inference_steps: 3
57+
skip_initial_inference_steps: 0
58+
cfg_star_rescale: True
59+
60+
second_pass:
61+
guidance_scale: [1]
62+
stg_scale: [1]
63+
rescaling_scale: [1]
64+
guidance_timesteps: [1.0]
65+
skip_block_list: [27]
66+
num_inference_steps: 30
67+
skip_initial_inference_steps: 17
68+
skip_final_inference_steps: 0
69+
cfg_star_rescale: True
70+
71+
#Parallelism
72+
mesh_axes: ['data', 'fsdp', 'tensor', 'fsdp_transpose', 'expert', 'tensor_transpose', 'tensor_sequence', 'sequence']
3173
logical_axis_rules: [
3274
['batch', 'data'],
33-
['activation_heads', 'fsdp'],
3475
['activation_batch', ['data','fsdp']],
76+
['activation_heads', 'tensor'],
3577
['activation_kv', 'tensor'],
3678
['mlp','tensor'],
3779
['embed','fsdp'],
3880
['heads', 'tensor'],
39-
['norm', 'fsdp'],
4081
['conv_batch', ['data','fsdp']],
4182
['out_channels', 'tensor'],
4283
['conv_out', 'fsdp'],
43-
['conv_in', 'fsdp']
4484
]
45-
data_sharding: [['data', 'fsdp', 'tensor']]
85+
data_sharding: [['data', 'fsdp', 'tensor', 'fsdp_transpose', 'expert', 'tensor_transpose', 'tensor_sequence', 'sequence']]
4686
dcn_data_parallelism: 1 # recommended DCN axis to be auto-sharded
4787
dcn_fsdp_parallelism: -1
4888
dcn_tensor_parallelism: 1
49-
ici_data_parallelism: 1
50-
ici_fsdp_parallelism: -1 # recommended ICI axis to be auto-sharded
89+
90+
ici_data_parallelism: -1
91+
ici_fsdp_parallelism: 1 # fixed at 1 here; the -1 (auto-sharded) ICI setting is on ici_data_parallelism. NOTE(review): confirm this swap is intended
5192
ici_tensor_parallelism: 1
93+
ici_fsdp_transpose_parallelism: 1
94+
ici_sequence_parallelism: 1
95+
ici_tensor_transpose_parallelism: 1
96+
ici_expert_parallelism: 1
97+
# ICI degree for the 'tensor_sequence' mesh axis. This line previously repeated
# ici_sequence_parallelism (a duplicate key, silently last-wins in most loaders),
# leaving 'tensor_sequence' as the only mesh axis without an ici_* entry.
# NOTE(review): confirm the consumer reads this key name.
ici_tensor_sequence_parallelism: 1
5298

5399

54100

@@ -65,4 +111,4 @@ per_device_batch_size: 1
65111
compile_topology_num_slices: -1
66112
quantization_local_shard_count: -1
67113
jit_initializers: True
68-
enable_single_replica_ckpt_restoring: False
114+
enable_single_replica_ckpt_restoring: False

0 commit comments

Comments
 (0)