Skip to content

Commit 5f2affa

Browse files
committed
debug for generated mel spectrogram
1 parent 13f1cbd commit 5f2affa

1 file changed

Lines changed: 3 additions & 0 deletions

File tree

src/maxdiffusion/pipelines/ltx2/ltx2_pipeline.py

Lines changed: 3 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -1729,6 +1729,9 @@ def convert_to_vel(lat, x0):
17291729
audio_latents = audio_latents.astype(self.audio_vae.dtype)
17301730
generated_mel_spectrograms = self.audio_vae.decode(audio_latents, return_dict=False)[0]
17311731
print(f"DEBUG: generated_mel_spectrograms shape: {generated_mel_spectrograms.shape}")
1732+
print(f"DEBUG: generated_mel_spectrograms min: {generated_mel_spectrograms.min()}")
1733+
print(f"DEBUG: generated_mel_spectrograms max: {generated_mel_spectrograms.max()}")
1734+
print(f"DEBUG: generated_mel_spectrograms mean: {generated_mel_spectrograms.mean()}")
17321735

17331736
# Audio VAE outputs (B, T, F, C), Vocoder expects (B, Channels, Time, MelBins)
17341737
generated_mel_spectrograms = generated_mel_spectrograms.transpose(0, 3, 1, 2)

0 commit comments

Comments
 (0)