Skip to content

Commit a47d09b

Browse files
zhyncs authored and jianan-gu committed
fix: use DeepEPDispatcher on CUDA (sgl-project#5180)
1 parent 4eee521 commit a47d09b

File tree

1 file changed

+2
-1
lines changed

1 file changed

+2
-1
lines changed

python/sglang/srt/models/deepseek_v2.py

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -55,7 +55,6 @@
 )
 from sglang.srt.layers.logits_processor import LogitsProcessor
 from sglang.srt.layers.moe.ep_moe.layer import DeepEPMoE, EPMoE
-from sglang.srt.layers.moe.ep_moe.token_dispatcher import DeepEPDispatcher
 from sglang.srt.layers.moe.fused_moe_triton import FusedMoE
 from sglang.srt.layers.moe.topk import select_experts
 from sglang.srt.layers.quantization.base_config import QuantizationConfig
@@ -88,6 +87,8 @@
 
 if _is_cuda:
     from sgl_kernel import awq_dequantize, bmm_fp8
+
+    from sglang.srt.layers.moe.ep_moe.token_dispatcher import DeepEPDispatcher
 else:
     from vllm import _custom_ops as ops

0 commit comments

Comments
 (0)