Enable FP8 API

This commit is contained in:
chenhongmin.will
2025-02-25 22:34:01 +08:00
parent c50d29d170
commit dfe8ffc75a
3 changed files with 18 additions and 8 deletions

View File

@@ -63,5 +63,6 @@ def flash_mla_with_kvcache(
causal,
tile_scheduler_metadata,
num_splits,
None, None, None,
)
return out, softmax_lse