File tree Expand file tree Collapse file tree
src/maxdiffusion/models/ltx2/text_encoders Expand file tree Collapse file tree Original file line number Diff line number Diff line change @@ -34,8 +34,8 @@ class LTX2VideoGemmaTextEncoder(nnx.Module):
3434 def __init__ (
3535 self ,
3636 # Feature Extractor Config
37- gemma_dim : int = 3072 , # Gemma-2-9b or similar
38- gemma_layers : int = 42 ,
37+ gemma_dim : int = 3840 , # Gemma-3-12b
38+ gemma_layers : int = 49 , # Gemma-3-12b: 48 transformer layers + 1 embedding output = 49 hidden states
3939 projection_dim : int = 4096 , # LTX-2 conditioning dim
4040 # Connector Config
4141 connector_heads : int = 32 ,
@@ -93,8 +93,8 @@ class LTX2AudioVideoGemmaTextEncoder(nnx.Module):
9393 def __init__ (
9494 self ,
9595 # Feature Extractor Config (Shared)
96- gemma_dim : int = 3072 ,
97- gemma_layers : int = 42 ,
96+ gemma_dim : int = 3840 , # Gemma-3-12b
97+ gemma_layers : int = 49 , # Gemma-3-12b: 48 transformer layers + 1 embedding output = 49 hidden states
9898 projection_dim : int = 4096 ,
9999 # Connector Config
100100 connector_heads : int = 32 ,
You can’t perform that action at this time.
0 commit comments