mirror of
https://github.com/deepseek-ai/FlashMLA
synced 2025-06-26 18:15:54 +00:00
update fp8 api
This commit is contained in:
@@ -17,6 +17,9 @@ struct Flash_fwd_mla_params {
|
||||
void *__restrict__ o_ptr;
|
||||
void *__restrict__ softmax_lse_ptr;
|
||||
|
||||
float* __restrict__ descale_q_ptr = nullptr;
|
||||
float* __restrict__ descale_k_ptr = nullptr;
|
||||
|
||||
index_t q_batch_stride;
|
||||
index_t k_batch_stride;
|
||||
index_t v_batch_stride;
|
||||
|
||||
Reference in New Issue
Block a user