@@ -91,7 +91,7 @@ def setUpClass(cls):
9191 "ici_context_parallelism=4" ,
9292 "ici_tensor_parallelism=1" ,
9393 "flash_min_seq_length=0" ,
94- 'flash_block_sizes={"block_q":3024,"block_kv_compute":1024,"block_kv":2048,"block_q_dkv":3024,"block_kv_dkv":2048,"block_kv_dkv_compute":1024,"use_fused_bwd_kernel":false }' ,
94+ 'flash_block_sizes={"block_q":3024,"block_kv_compute":1024,"block_kv":2048,"block_q_dkv":3024,"block_kv_dkv":2048,"block_kv_dkv_compute":1024,"use_fused_bwd_kernel":true }' ,
9595 ],
9696 unittest = True ,
9797 )
@@ -167,7 +167,7 @@ def setUpClass(cls):
167167 "ici_context_parallelism=4" ,
168168 "ici_tensor_parallelism=1" ,
169169 "flash_min_seq_length=0" ,
170- 'flash_block_sizes={"block_q":3024,"block_kv_compute":1024,"block_kv":2048,"block_q_dkv":3024,"block_kv_dkv":2048,"block_kv_dkv_compute":1024,"use_fused_bwd_kernel":false }' ,
170+ 'flash_block_sizes={"block_q":3024,"block_kv_compute":1024,"block_kv":2048,"block_q_dkv":3024,"block_kv_dkv":2048,"block_kv_dkv_compute":1024,"use_fused_bwd_kernel":true }' ,
171171 ],
172172 unittest = True ,
173173 )
@@ -246,7 +246,7 @@ def setUpClass(cls):
246246 "ici_context_parallelism=4" ,
247247 "ici_tensor_parallelism=1" ,
248248 "flash_min_seq_length=0" ,
249- 'flash_block_sizes={"block_q":3024,"block_kv_compute":1024,"block_kv":2048,"block_q_dkv":3024,"block_kv_dkv":2048,"block_kv_dkv_compute":1024,"use_fused_bwd_kernel":false }' ,
249+ 'flash_block_sizes={"block_q":3024,"block_kv_compute":1024,"block_kv":2048,"block_q_dkv":3024,"block_kv_dkv":2048,"block_kv_dkv_compute":1024,"use_fused_bwd_kernel":true }' ,
250250 ],
251251 unittest = True ,
252252 )
@@ -327,7 +327,7 @@ def setUpClass(cls):
327327 "ici_context_parallelism=4" ,
328328 "ici_tensor_parallelism=1" ,
329329 "flash_min_seq_length=0" ,
330- 'flash_block_sizes={"block_q":3024,"block_kv_compute":1024,"block_kv":2048,"block_q_dkv":3024,"block_kv_dkv":2048,"block_kv_dkv_compute":1024,"use_fused_bwd_kernel":false }' ,
330+ 'flash_block_sizes={"block_q":3024,"block_kv_compute":1024,"block_kv":2048,"block_q_dkv":3024,"block_kv_dkv":2048,"block_kv_dkv_compute":1024,"use_fused_bwd_kernel":true }' ,
331331 ],
332332 unittest = True ,
333333 )
0 commit comments