Skip to content

Commit e215ef6

Browse files
Update csrc/moe/moe_align_sum_kernels.cu
Co-authored-by: Tyler Michael Smith <[email protected]>
Signed-off-by: ElizaWszola <[email protected]>
1 parent 4c6ca52 commit e215ef6

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

csrc/moe/moe_align_sum_kernels.cu

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -38,8 +38,8 @@ __global__ void moe_align_block_size_kernel(scalar_t* __restrict__ topk_ids,
38 38
(cnts_byte_offset + sizeof(int32_t) - 1) / sizeof(int32_t);
39 39

40 40
extern __shared__ int32_t shared_mem[];
41-
token_cnts_t* tokens_cnts = (token_cnts_t*)
42-
shared_mem; // 2d tensor with shape (blockDim.x + 1, num_experts)
41+
token_cnts_t* tokens_cnts = reinterpret_cast<token_cnts_t*>(
42+
shared_mem); // 2d tensor with shape (blockDim.x + 1, num_experts)
43 43
int32_t* cumsum =
44 44
shared_mem + aligned_offset; // 1d tensor with shape (num_experts + 1)
45 45

0 commit comments

Comments
 (0)