mirror of
https://github.com/deepseek-ai/DeepEP
synced 2025-06-26 18:28:11 +00:00
Remove the low-latency usage flag (#214)
This commit is contained in:
@@ -166,7 +166,6 @@ def test_loop(local_rank: int, num_local_ranks: int):
|
||||
print(f'Allocating buffer size: {num_rdma_bytes / 1e6} MB ...', flush=True)
|
||||
buffer = deep_ep.Buffer(group, num_rdma_bytes=num_rdma_bytes, low_latency_mode=True,
|
||||
num_qps_per_rank=num_experts // num_ranks)
|
||||
buffer.get_low_latency_usage_flag()
|
||||
test_main(num_tokens, hidden, num_experts, num_topk, rank, num_ranks, group, buffer, seed=1)
|
||||
|
||||
do_pressure_test = False
|
||||
|
||||
Reference in New Issue
Block a user