mirror of
https://github.com/deepseek-ai/DeepEP
synced 2025-05-02 11:11:17 +00:00
Merge pull request #96 from songhexiang/adjust_kNumThreads_of_notify_dispatch
Adjust kNumThreads of notify_dispatch
This commit is contained in:
commit
dcf46f1c26
@@ -428,7 +428,7 @@ void notify_dispatch(const int* num_tokens_per_rank, int* moe_recv_counter_mappe
|
||||
buffer_ptrs, task_fifo_ptrs, head, rank, \
|
||||
cpu_rdma_team); } break
|
||||
|
||||
constexpr int kNumThreads = 256;
|
||||
constexpr int kNumThreads = std::max(256, 32 * num_channels);
|
||||
const auto num_rdma_ranks = num_ranks / NUM_MAX_NVL_PEERS;
|
||||
|
||||
// Get clean meta
|
||||
|
Loading…
Reference in New Issue
Block a user