We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 4eee521, commit a47d09b (Copy full SHA for a47d09b)
python/sglang/srt/models/deepseek_v2.py
@@ -55,7 +55,6 @@
55
)
56
from sglang.srt.layers.logits_processor import LogitsProcessor
57
from sglang.srt.layers.moe.ep_moe.layer import DeepEPMoE, EPMoE
58
-from sglang.srt.layers.moe.ep_moe.token_dispatcher import DeepEPDispatcher
59
from sglang.srt.layers.moe.fused_moe_triton import FusedMoE
60
from sglang.srt.layers.moe.topk import select_experts
61
from sglang.srt.layers.quantization.base_config import QuantizationConfig
@@ -88,6 +87,8 @@
88
87
89
if _is_cuda:
90
from sgl_kernel import awq_dequantize, bmm_fp8
+
91
+ from sglang.srt.layers.moe.ep_moe.token_dispatcher import DeepEPDispatcher
92
else:
93
from vllm import _custom_ops as ops
94
0 commit comments