This commit is contained in:
chenhongmin.will
2025-02-24 21:12:36 +08:00
parent bcb90f2afd
commit dae0690055
2 changed files with 4 additions and 0 deletions

View File

@@ -0,0 +1,3 @@
#include "flash_fwd_mla_kernel.h"
// Explicit instantiation definition: asks the compiler to generate
// run_mha_fwd_splitkv_mla for the template arguments
// <cutlass::float_e4m3_t, 576> in this translation unit, so other
// translation units can link against it without seeing the template body.
// NOTE(review): the template itself is presumably defined in
// flash_fwd_mla_kernel.h — confirm.
// NOTE(review): 576 is presumably the head dimension handled by this
// instantiation — TODO confirm against the template's parameter list.
template void run_mha_fwd_splitkv_mla<cutlass::float_e4m3_t, 576>(
    Flash_fwd_mla_params &params,
    cudaStream_t stream);