mirror of
https://github.com/deepseek-ai/DeepEP
synced 2025-05-02 03:04:07 +00:00
Fix zero-copy mode tests
This commit is contained in:
parent
c4d12b4f8f
commit
26fa72d80f
@ -78,7 +78,7 @@ def test_main(num_tokens: int, hidden: int, num_experts: int, num_topk: int,
|
|||||||
buffer.get_next_low_latency_combine_buffer(handle)[:, :, :] = simulated_gemm_x
|
buffer.get_next_low_latency_combine_buffer(handle)[:, :, :] = simulated_gemm_x
|
||||||
out = torch.empty((num_tokens, hidden), dtype=torch.bfloat16, device='cuda')
|
out = torch.empty((num_tokens, hidden), dtype=torch.bfloat16, device='cuda')
|
||||||
combined_x, event, hook = buffer.low_latency_combine(simulated_gemm_x, topk_idx, topk_weights, handle,
|
combined_x, event, hook = buffer.low_latency_combine(simulated_gemm_x, topk_idx, topk_weights, handle,
|
||||||
async_finish=not return_recv_hook,
|
async_finish=not return_recv_hook, zero_copy=zero_copy,
|
||||||
return_recv_hook=return_recv_hook, out=out)
|
return_recv_hook=return_recv_hook, out=out)
|
||||||
hook() if return_recv_hook else event.current_stream_wait()
|
hook() if return_recv_hook else event.current_stream_wait()
|
||||||
if do_check:
|
if do_check:
|
||||||
|
Loading…
Reference in New Issue
Block a user