Skip to content

Commit 1118ae5

Browse files
committed
changes for vae mean and std
1 parent f4de876 commit 1118ae5

2 files changed

Lines changed: 7 additions & 6 deletions

File tree

src/maxdiffusion/pipelines/ltx2/ltx2_pipeline.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -242,8 +242,8 @@ def __init__(
242 242
self.transformer_spatial_patch_size = getattr(self.transformer.config, "patch_size", 1)
243 243
self.transformer_temporal_patch_size = getattr(self.transformer.config, "patch_size_t", 1)
244 244

245-
self.audio_sampling_rate = getattr(self.audio_vae.config, "sample_rate", 16000)
246-
self.audio_hop_length = getattr(self.audio_vae.config, "mel_hop_length", 160)
245+
self.audio_sampling_rate = getattr(self.audio_vae.config, "sample_rate", 16000) if getattr(self, "audio_vae", None) is not None else 16000
246+
self.audio_hop_length = getattr(self.audio_vae.config, "mel_hop_length", 160) if getattr(self, "audio_vae", None) is not None else 160
247 247

248 248
# Initialize video processor
249 249
self.video_processor = VideoProcessor(vae_scale_factor=self.vae_spatial_compression_ratio)

test_vae_load.py

Lines changed: 5 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -6,7 +6,8 @@
6 6
argv = ["", "src/maxdiffusion/configs/ltx2_video.yml"]
7 7
pyconfig.initialize(argv)
8 8

9-
pipeline = LTX2Pipeline.from_pretrained(pyconfig.config, vae_only=True)
10-
print("latents_mean:", pipeline.vae.latents_mean.value[:10])
11-
print("latents_std:", pipeline.vae.latents_std.value[:10])
12-
print("audio_latents_mean:", pipeline.audio_vae.latents_mean.value[:10])
9+
pipeline = LTX2Pipeline.from_pretrained(pyconfig.config, load_transformer=False)
10+
print("latents_mean (Video VAE):", pipeline.vae.latents_mean.value[:5])
11+
print("latents_std (Video VAE):", pipeline.vae.latents_std.value[:5])
12+
print("latents_mean (Audio VAE):", pipeline.audio_vae.latents_mean.value[:5])
13+
print("latents_std (Audio VAE):", pipeline.audio_vae.latents_std.value[:5])

0 commit comments

Comments (0)