We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent cb5d8fa, commit 2f0bc46. Copy full SHA for 2f0bc46
python/sglang/srt/layers/moe/fused_moe_triton/fused_moe.py
@@ -152,6 +152,7 @@ def fused_moe_kernel(
152
return
153
offs_token_id = pid_m * BLOCK_SIZE_M + tl.arange(0, BLOCK_SIZE_M)
154
offs_token = tl.load(sorted_token_ids_ptr + offs_token_id)
155
+ offs_token = offs_token.to(tl.int64)
156
token_mask = offs_token < num_valid_tokens
157
158
offs_bn = (pid_n * BLOCK_SIZE_N + tl.arange(0, BLOCK_SIZE_N)) % N
0 commit comments