diff --git a/python/sglang/srt/layers/moe/fused_moe_triton/fused_moe.py b/python/sglang/srt/layers/moe/fused_moe_triton/fused_moe.py index c90be69e6dac..5d3e319e5132 100644 --- a/python/sglang/srt/layers/moe/fused_moe_triton/fused_moe.py +++ b/python/sglang/srt/layers/moe/fused_moe_triton/fused_moe.py @@ -707,7 +707,7 @@ def moe_align_block_size( dtype=torch.int32, device=topk_ids.device, ) - cumsum_buffer = torch.zeros( + cumsum_buffer = torch.empty( num_experts + 1, dtype=torch.int32, device=topk_ids.device )