Skip to content

Commit

Permalink
fix kernel bug
Browse files Browse the repository at this point in the history
  • Loading branch information
sleepcoo committed Feb 16, 2025
1 parent 60d0c0a commit d802719
Showing 1 changed file with 1 addition and 3 deletions.
4 changes: 1 addition & 3 deletions python/sglang/srt/layers/moe/ep_moe/kernels.py
Original file line number Diff line number Diff line change
Expand Up @@ -295,12 +295,10 @@ def grouped_gemm_triton_kernel(
a_ptr += BLOCK_SIZE_K
b_ptr += BLOCK_SIZE_K

- if use_fp8_w8a8:
+ if use_fp8_w8a8 and not (group_k > 0 and group_n > 0):
      scale_a_value = tl.load(scale_a + expert_id)
      scale_b_value = tl.load(scale_b + expert_id)
      accumulator *= scale_a_value * scale_b_value
- elif not (group_k > 0 and group_n > 0):
-     accumulator *= a_scale * b_scale

c_tile = accumulator.to(c_dtype)

Expand Down

0 comments on commit d802719

Please sign in to comment.