From aae9fa9a6dd0fec2a723fbb85ec4b22460fab670 Mon Sep 17 00:00:00 2001
From: Chenggang Zhao
Date: Fri, 23 May 2025 20:14:50 +0800
Subject: [PATCH] Allow NVLink traffic for low-latency kernels by default

---
 deep_ep/buffer.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/deep_ep/buffer.py b/deep_ep/buffer.py
index 8527f24..4c2c0fc 100644
--- a/deep_ep/buffer.py
+++ b/deep_ep/buffer.py
@@ -32,7 +32,7 @@ class Buffer:
     def __init__(self, group: dist.ProcessGroup,
                  num_nvl_bytes: int = 0, num_rdma_bytes: int = 0,
                  low_latency_mode: bool = False, num_qps_per_rank: int = 12,
-                 allow_nvlink_for_low_latency_mode: bool = False) -> None:
+                 allow_nvlink_for_low_latency_mode: bool = True) -> None:
         """
         Initialize the communication buffer.
 