Skip to content

Commit

Permalink
fix
Browse files: browse the repository at this point in the history
  • Loading branch information
sleepcoo committed Feb 16, 2025
1 parent d51b907 commit c2edfb7
Showing 1 changed file with 5 additions and 1 deletion.
6 changes: 5 additions & 1 deletion python/sglang/srt/layers/moe/ep_moe/layer.py
Original file line number Diff line number Diff line change
Expand Up @@ -78,6 +78,10 @@ def forward(
)
else:
assert weight_column_major == True
if self.quant_method.quant_config == None:
block_size = None
else:
block_size = (self.quant_method.quant_config.weight_block_size,)
c = grouped_gemm_triton(
a,
b,
Expand All @@ -89,7 +93,7 @@ def forward(
use_fp8_w8a8,
scale_a,
scale_b,
block_shape=self.quant_method.quant_config.weight_block_size,
block_shape=block_size,
)
return c

Expand Down

0 comments on commit c2edfb7

Please sign in to comment.