mirror of
https://github.com/deepseek-ai/DeepEP
synced 2025-05-06 13:04:22 +00:00
comments
This commit is contained in:
parent
b3b61ef5ef
commit
50ac280ae7
@@ -498,7 +498,7 @@ class Buffer:
|
|||||||
# noinspection PyTypeChecker
|
# noinspection PyTypeChecker
|
||||||
def low_latency_combine(self, x: torch.Tensor, topk_idx: torch.Tensor, topk_weights: torch.Tensor,
|
def low_latency_combine(self, x: torch.Tensor, topk_idx: torch.Tensor, topk_weights: torch.Tensor,
|
||||||
handle: tuple, async_finish: bool = False, return_recv_hook: bool = False,
|
handle: tuple, async_finish: bool = False, return_recv_hook: bool = False,
|
||||||
out: torch.Tensor | None = None) -> \
|
out: Optional[torch.Tensor] = None) -> \
|
||||||
Tuple[torch.Tensor, EventOverlap, Callable]:
|
Tuple[torch.Tensor, EventOverlap, Callable]:
|
||||||
"""
|
"""
|
||||||
A low-latency implementation for combining tokens (reduce **with weights**) with IBGDA.
|
A low-latency implementation for combining tokens (reduce **with weights**) with IBGDA.
|
||||||
|
Loading…
Reference in New Issue
Block a user