FlashMLA/csrc/flash_fwd_mla_bf16_sm90.cu
chenhongmin.will b67a18f850 update gmem
2025-02-25 09:45:19 +08:00

4 lines
172 B
Plaintext

#include "flash_fwd_mla_kernel.h"
// Explicit instantiation definition: asks the compiler to generate
// run_mha_fwd_splitkv_mla<cutlass::bfloat16_t, cutlass::bfloat16_t, 576>
// in this translation unit, so other translation units can link against
// this specialization without instantiating the template themselves.
//
// NOTE(review): the template is presumably declared/defined in
// flash_fwd_mla_kernel.h (the only header included here). The two type
// arguments look like the input and output element types and 576 like a
// head dimension -- confirm against the template's declaration.
template void
run_mha_fwd_splitkv_mla<cutlass::bfloat16_t, cutlass::bfloat16_t, 576>(
    Flash_fwd_mla_params &params,
    cudaStream_t stream);