Skip to content

Commit 0d116b9

Browse files
authored
Clean up deprecated tile_tokens_dim for next flashinfer (sgl-project#13341)
Signed-off-by: Vincent Zhong <207368749+vincentzed@users.noreply.github.com>
1 parent 4a56fa5 commit 0d116b9

4 files changed

Lines changed: 0 additions & 4 deletions

File tree

python/sglang/srt/layers/moe/fused_moe_triton/layer.py

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1129,7 +1129,6 @@ def forward(self, hidden_states: torch.Tensor, topk_output: TopKOutput):
1129 1129
local_expert_offset=self.moe_ep_rank * self.num_local_experts,
1130 1130
local_num_experts=self.num_local_experts,
1131 1131
routed_scaling_factor=self.moe_runner_config.routed_scaling_factor,
1132 -
tile_tokens_dim=None,
1133 1132
routing_method_type=RoutingMethodType.DeepSeekV3,
1134 1133
do_finalize=True,
1135 1134
output=symm_output,

python/sglang/srt/layers/quantization/fp8.py

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1245,7 +1245,6 @@ def apply_with_router_logits(
1245 1245
routed_scaling_factor=(
1246 1246
routed_scaling_factor if routed_scaling_factor is not None else 1.0
1247 1247
),
1248 -
tile_tokens_dim=None,
1249 1248
routing_method_type=routing_method_type,
1250 1249
use_shuffled_weight=False,
1251 1250
)

python/sglang/srt/layers/quantization/modelopt_quant.py

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -695,7 +695,6 @@ def apply(
695 695
else 1.0
696 696
),
697 697
use_routing_scales_on_input=use_routing_scales_on_input,
698 -
tile_tokens_dim=None,
699 698
routing_method_type=routing_method_type,
700 699
)
701 700

python/sglang/srt/layers/quantization/mxfp4.py

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -681,7 +681,6 @@ def apply(
681 681
layer.moe_ep_rank * layer.num_local_experts, # local_expert_offset
682 682
layer.num_local_experts, # local num experts
683 683
None,
684 -
None, # tile_tokens_dim
685 684
1, # routing_method_type, renormalize
686 685
True, # do finalize
687 686
output=symm_output,

0 commit comments

Comments
 (0)