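pipeline fix: repeat LTX2 cross-attn scale/shift and gate tensors along axis 0 when their leading dim is smaller than batch_size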

prishajain1 · prishajain1 · commit 5ed0991eab89 · 2026-04-27T12:38:19.000+05:30
diff --git a/src/maxdiffusion/models/ltx2/transformer_ltx2.py b/src/maxdiffusion/models/ltx2/transformer_ltx2.py
@@ -1089,6 +1089,12 @@ def __call__(
           video_ca_timestep * timestep_cross_attn_gate_scale_factor,
           hidden_dtype=hidden_states.dtype,
       )
+      
+      if video_cross_attn_scale_shift.shape[0] < batch_size:
+        video_cross_attn_scale_shift = jnp.repeat(video_cross_attn_scale_shift, batch_size // video_cross_attn_scale_shift.shape[0], axis=0)
+      if video_cross_attn_a2v_gate.shape[0] < batch_size:
+        video_cross_attn_a2v_gate = jnp.repeat(video_cross_attn_a2v_gate, batch_size // video_cross_attn_a2v_gate.shape[0], axis=0)
+        
       video_cross_attn_scale_shift = video_cross_attn_scale_shift.reshape(
           batch_size, -1, video_cross_attn_scale_shift.shape[-1]
       )
@@ -1102,6 +1108,12 @@ def __call__(
           audio_ca_timestep * timestep_cross_attn_gate_scale_factor,
           hidden_dtype=audio_hidden_states.dtype,
       )
+      
+      if audio_cross_attn_scale_shift.shape[0] < batch_size:
+        audio_cross_attn_scale_shift = jnp.repeat(audio_cross_attn_scale_shift, batch_size // audio_cross_attn_scale_shift.shape[0], axis=0)
+      if audio_cross_attn_v2a_gate.shape[0] < batch_size:
+        audio_cross_attn_v2a_gate = jnp.repeat(audio_cross_attn_v2a_gate, batch_size // audio_cross_attn_v2a_gate.shape[0], axis=0)
+        
       audio_cross_attn_scale_shift = audio_cross_attn_scale_shift.reshape(
           batch_size, -1, audio_cross_attn_scale_shift.shape[-1]
       )