Skip to content

Commit 95fcbd5

Browse files
author
James
committed
Merge teamA/James into ltx2-dev
2 parents 0606006 + b7831ee commit 95fcbd5

1 file changed

Lines changed: 4 additions & 4 deletions

File tree

src/maxdiffusion/models/ltx2/text_encoders/text_encoders_ltx2.py

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -34,8 +34,8 @@ class LTX2VideoGemmaTextEncoder(nnx.Module):
34 34
def __init__(
35 35
self,
36 36
# Feature Extractor Config
37-
gemma_dim: int = 3072, # Gemma-2-9b or similar
38-
gemma_layers: int = 42,
37+
gemma_dim: int = 3840, # Gemma-3-12b
38+
gemma_layers: int = 49, # Gemma-3 has 48 layers + 1 embedding layer output = 49 hidden states
39 39
projection_dim: int = 4096, # LTX-2 conditioning dim
40 40
# Connector Config
41 41
connector_heads: int = 32,
@@ -93,8 +93,8 @@ class LTX2AudioVideoGemmaTextEncoder(nnx.Module):
93 93
def __init__(
94 94
self,
95 95
# Feature Extractor Config (Shared)
96-
gemma_dim: int = 3072,
97-
gemma_layers: int = 42,
96+
gemma_dim: int = 3840, # Gemma-3-12b
97+
gemma_layers: int = 49, # Gemma-3 has 48 layers + 1 embedding layer output = 49 hidden states
98 98
projection_dim: int = 4096,
99 99
# Connector Config
100 100
connector_heads: int = 32,

0 commit comments

Comments
 (0)