Skip to content

Commit 0b5e567

Browse files
committed
Update Tokamax Splash attention config to use base2 exp and experimental scheduler
1 parent ad3b565 commit 0b5e567

1 file changed

Lines changed: 3 additions & 1 deletion

File tree

src/maxdiffusion/models/attention_flax.py

Lines changed: 3 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -198,7 +198,8 @@ def convert_to_tokamax_splash_config(
198198
residual_checkpoint_name: str | None = None,
199199
attn_logits_soft_cap: float | None = None,
200200
fuse_reciprocal: bool = True,
201-
use_base2_exp: bool = False,
201+
use_base2_exp: bool = True,
202+
use_experimental_scheduler: bool = True,
202203
max_logit_const: float | None = None,
203204
interpret: bool = False,
204205
dq_reduction_steps: int | None = None,
@@ -221,6 +222,7 @@ def convert_to_tokamax_splash_config(
221222
attn_logits_soft_cap=attn_logits_soft_cap,
222223
fuse_reciprocal=fuse_reciprocal,
223224
use_base2_exp=use_base2_exp,
225+
use_experimental_scheduler=use_experimental_scheduler,
224226
max_logit_const=max_logit_const,
225227
interpret=interpret,
226228
dq_reduction_steps=dq_reduction_steps,

0 commit comments

Comments
 (0)