// FlashMLA/csrc/flash_fwd_mla_fp8_sm90.cu
// chenhongmin.will dae0690055 init fp8
// 2025-02-24 21:12:36 +08:00
//
// 3 lines
// 152 B
// Plaintext

#include "flash_fwd_mla_kernel.h"
// Explicit instantiation definition: makes the compiler emit
// run_mha_fwd_splitkv_mla<cutlass::float_e4m3_t, 576> in this translation unit.
// NOTE(review): the template is presumably declared/defined in
// flash_fwd_mla_kernel.h, and 576 is presumably the head dimension -- confirm
// against that header.
template void run_mha_fwd_splitkv_mla<cutlass::float_e4m3_t, 576>(
    Flash_fwd_mla_params &,
    cudaStream_t);