mirror of
https://github.com/deepseek-ai/DeepEP
synced 2025-05-05 12:34:50 +00:00
comments
This commit is contained in:
parent
b3b61ef5ef
commit
50ac280ae7
@ -498,7 +498,7 @@ class Buffer:
|
||||
# noinspection PyTypeChecker
|
||||
def low_latency_combine(self, x: torch.Tensor, topk_idx: torch.Tensor, topk_weights: torch.Tensor,
|
||||
handle: tuple, async_finish: bool = False, return_recv_hook: bool = False,
|
||||
out: torch.Tensor | None = None) -> \
|
||||
out: Optional[torch.Tensor] = None) -> \
|
||||
Tuple[torch.Tensor, EventOverlap, Callable]:
|
||||
"""
|
||||
A low-latency implementation for combining tokens (reduce **with weights**) with IBGDA.
|
||||
|
Loading…
Reference in New Issue
Block a user