mirror of
https://github.com/deepseek-ai/DeepEP
synced 2025-06-10 00:16:22 +00:00
Allow NVLink traffic for low-latency kernels by default
This commit is contained in:
parent
8da1b1f81e
commit
aae9fa9a6d
@@ -32,7 +32,7 @@ class Buffer:
|
|||||||
def __init__(self, group: dist.ProcessGroup,
|
def __init__(self, group: dist.ProcessGroup,
|
||||||
num_nvl_bytes: int = 0, num_rdma_bytes: int = 0,
|
num_nvl_bytes: int = 0, num_rdma_bytes: int = 0,
|
||||||
low_latency_mode: bool = False, num_qps_per_rank: int = 12,
|
low_latency_mode: bool = False, num_qps_per_rank: int = 12,
|
||||||
allow_nvlink_for_low_latency_mode: bool = False) -> None:
|
allow_nvlink_for_low_latency_mode: bool = True) -> None:
|
||||||
"""
|
"""
|
||||||
Initialize the communication buffer.
|
Initialize the communication buffer.
|
||||||
|
|
||||||
|
Loading…
Reference in New Issue
Block a user