File tree Expand file tree Collapse file tree 3 files changed +3
-3
lines changed
sglang/srt/layers/quantization Expand file tree Collapse file tree 3 files changed +3
-3
lines changed Original file line number Diff line number Diff line change @@ -47,7 +47,7 @@ runtime_common = [
47
47
48
48
srt = [
49
49
" sglang[runtime_common]" ,
50
- " sgl-kernel==0.0.8" ,
50
+ " sgl-kernel==0.0.8.post3 " ,
51
51
" flashinfer_python==0.2.3" ,
52
52
" torch==2.5.1" ,
53
53
" torchvision==0.20.1" ,
Original file line number Diff line number Diff line change 41
41
42
42
_is_cuda = is_cuda ()
43
43
if _is_cuda :
44
- import deep_gemm # `pip install "sgl-kernel>=0.0.4.post3"`
44
+ import deep_gemm
45
45
from sgl_kernel import sgl_per_token_group_quant_fp8 , sgl_per_token_quant_fp8
46
46
47
47
sm_version = get_device_sm ()
Original file line number Diff line number Diff line change @@ -20,7 +20,7 @@ pip install --upgrade pip
20
20
21
21
# Install flashinfer and sgl-kernel
22
22
pip install flashinfer_python==0.2.3 --find-links ${FLASHINFER_REPO} --no-cache-dir
23
- pip install sgl-kernel==0.0.8 --no-cache-dir
23
+ pip install sgl-kernel==0.0.8.post3 --no-cache-dir
24
24
25
25
# Install the main package
26
26
pip install -e " python[all]" --find-links ${FLASHINFER_REPO}
You can’t perform that action at this time.
0 commit comments