mirror of
https://github.com/deepseek-ai/DeepGEMM
synced 2025-06-26 23:15:49 +00:00
Fix illegal memory access when skipping m indices equal to -1 (#113)
Co-authored-by: Shixian Cui <shixian@amazon.com>
This commit is contained in:
parent
8dfa329827
commit
0c88cd0139
@@ -116,7 +116,7 @@ struct Scheduler {
|
|||||||
if constexpr (kGemmType == GemmType::Normal) {
|
if constexpr (kGemmType == GemmType::Normal) {
|
||||||
return block_idx * block_size;
|
return block_idx * block_size;
|
||||||
} else if constexpr (kGemmType == GemmType::GroupedContiguous) {
|
} else if constexpr (kGemmType == GemmType::GroupedContiguous) {
|
||||||
auto offset = kIgnoreGroupedForGroupedContiguous ? 0 : __ldg(grouped_layout + m_block_idx * BLOCK_M);
|
auto offset = kIgnoreGroupedForGroupedContiguous ? 0 : max(0, __ldg(grouped_layout + m_block_idx * BLOCK_M));
|
||||||
return offset * shape_dim + block_idx * block_size;
|
return offset * shape_dim + block_idx * block_size;
|
||||||
} else if constexpr (kGemmType == GemmType::GroupedMasked) {
|
} else if constexpr (kGemmType == GemmType::GroupedMasked) {
|
||||||
return curr_group_idx * shape_dim + block_idx * block_size;
|
return curr_group_idx * shape_dim + block_idx * block_size;
|
||||||
|
|||||||
Loading…
Reference in New Issue
Block a user