@@ -768,6 +768,24 @@ def translate_ltx2_nnx_path_to_diffusers_lora(nnx_path_str, scan_layers=False):
768768 "av_cross_attn_audio_v2a_gate.linear" : "diffusion_model.av_ca_v2a_gate_adaln_single.linear" ,
769769 "av_cross_attn_audio_scale_shift.linear" : "diffusion_model.av_ca_audio_scale_shift_adaln_single.linear" ,
770770 "av_cross_attn_video_scale_shift.linear" : "diffusion_model.av_ca_video_scale_shift_adaln_single.linear" ,
771+
772+ # Nested conditioning layers
773+ "time_embed.emb.timestep_embedder.linear_1" : "diffusion_model.adaln_single.emb.timestep_embedder.linear_1" ,
774+ "time_embed.emb.timestep_embedder.linear_2" : "diffusion_model.adaln_single.emb.timestep_embedder.linear_2" ,
775+ "audio_time_embed.emb.timestep_embedder.linear_1" : "diffusion_model.audio_adaln_single.emb.timestep_embedder.linear_1" ,
776+ "audio_time_embed.emb.timestep_embedder.linear_2" : "diffusion_model.audio_adaln_single.emb.timestep_embedder.linear_2" ,
777+ "av_cross_attn_video_scale_shift.emb.timestep_embedder.linear_1" : "diffusion_model.av_ca_video_scale_shift_adaln_single.emb.timestep_embedder.linear_1" ,
778+ "av_cross_attn_video_scale_shift.emb.timestep_embedder.linear_2" : "diffusion_model.av_ca_video_scale_shift_adaln_single.emb.timestep_embedder.linear_2" ,
779+ "av_cross_attn_audio_scale_shift.emb.timestep_embedder.linear_1" : "diffusion_model.av_ca_audio_scale_shift_adaln_single.emb.timestep_embedder.linear_1" ,
780+ "av_cross_attn_audio_scale_shift.emb.timestep_embedder.linear_2" : "diffusion_model.av_ca_audio_scale_shift_adaln_single.emb.timestep_embedder.linear_2" ,
781+ "av_cross_attn_video_a2v_gate.emb.timestep_embedder.linear_1" : "diffusion_model.av_ca_a2v_gate_adaln_single.emb.timestep_embedder.linear_1" ,
782+ "av_cross_attn_video_a2v_gate.emb.timestep_embedder.linear_2" : "diffusion_model.av_ca_a2v_gate_adaln_single.emb.timestep_embedder.linear_2" ,
783+ "av_cross_attn_audio_v2a_gate.emb.timestep_embedder.linear_1" : "diffusion_model.av_ca_v2a_gate_adaln_single.emb.timestep_embedder.linear_1" ,
784+ "av_cross_attn_audio_v2a_gate.emb.timestep_embedder.linear_2" : "diffusion_model.av_ca_v2a_gate_adaln_single.emb.timestep_embedder.linear_2" ,
785+ "caption_projection.linear_1" : "diffusion_model.caption_projection.linear_1" ,
786+ "caption_projection.linear_2" : "diffusion_model.caption_projection.linear_2" ,
787+ "audio_caption_projection.linear_1" : "diffusion_model.audio_caption_projection.linear_1" ,
788+ "audio_caption_projection.linear_2" : "diffusion_model.audio_caption_projection.linear_2" ,
771789 }
772790
773791 if nnx_path_str in global_map :
0 commit comments