mirror of
https://github.com/deepseek-ai/FlashMLA
synced 2025-06-26 18:15:54 +00:00
enable fp8 api
This commit is contained in:
@@ -63,5 +63,6 @@ def flash_mla_with_kvcache(
|
||||
causal,
|
||||
tile_scheduler_metadata,
|
||||
num_splits,
|
||||
None, None, None,
|
||||
)
|
||||
return out, softmax_lse
|
||||
|
||||
Reference in New Issue
Block a user