Skip to content

Commit eafd8fb

Browse files
committed
Update cross-attention dim (8192 → 4096) and vocoder upsampler kernel weight loading
1 parent d79b6dd commit eafd8fb

2 files changed

Lines changed: 2 additions & 2 deletions

File tree

src/maxdiffusion/models/ltx2/ltx2_3_utils.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -389,7 +389,7 @@ def load_vocoder_weights_2_3(
389389

390390
if flax_key[-1] == "kernel":
391391
if "upsamplers" in flax_key:
392-
tensor = tensor.transpose(2, 0, 1)[::-1, :, :]
392+
tensor = tensor.transpose(2, 0, 1)
393393
else:
394394
tensor = tensor.transpose(2, 1, 0)
395395

src/maxdiffusion/pipelines/ltx2/ltx2_pipeline.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -119,7 +119,7 @@ def create_model(rngs: nnx.Rngs, ltx2_config: dict):
119119
"in_channels": 128,
120120
"num_attention_heads": 32,
121121
"attention_head_dim": 128,
122-
"cross_attention_dim": 8192,
122+
"cross_attention_dim": 4096,
123123
"audio_in_channels": 128,
124124
"audio_num_attention_heads": 32,
125125
"audio_attention_head_dim": 64,

0 commit comments

Comments
 (0)