From 81de20843046b478640b5c156326361f7247872c Mon Sep 17 00:00:00 2001
From: Chenggang Zhao
Date: Tue, 27 May 2025 12:00:10 +0800
Subject: [PATCH] Format

---
 deep_gemm/include/deep_gemm/scheduler.cuh | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/deep_gemm/include/deep_gemm/scheduler.cuh b/deep_gemm/include/deep_gemm/scheduler.cuh
index d137057..81bfeba 100644
--- a/deep_gemm/include/deep_gemm/scheduler.cuh
+++ b/deep_gemm/include/deep_gemm/scheduler.cuh
@@ -34,7 +34,7 @@ struct Scheduler {
     // Only used for masked layout
     uint32_t curr_group_idx, curr_cumsum;
 
-    __device__ __forceinline__ explicit Scheduler(const uint32_t shape_m,
+    __device__ __forceinline__ explicit Scheduler(const uint32_t& shape_m,
                                                   int* grouped_layout = nullptr) {
         num_aligned_m_blocks = ceil_div(shape_m, BLOCK_M);
         if constexpr (kGemmType == GemmType::Normal) {
@@ -76,7 +76,7 @@ struct Scheduler {
         }
     }
 
-    __device__ __forceinline__ void get_swizzled_block_idx(const uint32_t num_m_blocks, uint32_t block_idx,
+    __device__ __forceinline__ void get_swizzled_block_idx(const uint32_t& num_m_blocks, const uint32_t& block_idx,
                                                            uint32_t& m_block_idx, uint32_t& n_block_idx) {
         DG_STATIC_ASSERT(kNum1DBlocksPerGroup % kNumTMAMulticast == 0, "Invalid group size");
 
@@ -111,7 +111,7 @@ struct Scheduler {
     }
 
     template
-    __device__ __forceinline__ uint32_t get_global_idx(const uint32_t shape_dim, const uint32_t block_size,
+    __device__ __forceinline__ uint32_t get_global_idx(const uint32_t& shape_dim, const uint32_t& block_size,
                                                        const uint32_t& block_idx, const uint32_t& m_block_idx=0) {
         if constexpr (kGemmType == GemmType::Normal) {
             return block_idx * block_size;