Skip to content

Commit 9ce081c

Browse files
yubofredwang and finger92
authored and committed
Use public model for FA3 speculative decode testing (sgl-project#5152)
1 parent 7103f81 commit 9ce081c

File tree

1 file changed

+2
-4
lines changed

1 file changed

+2
-4
lines changed

test/srt/test_fa3.py

Lines changed: 2 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -7,8 +7,6 @@
77
from sglang.srt.utils import get_device_sm, kill_process_tree
88
from sglang.test.few_shot_gsm8k import run_eval as run_eval_few_shot_gsm8k
99
from sglang.test.test_utils import (
10-
DEFAULT_EAGLE_DRAFT_MODEL_FOR_TEST,
11-
DEFAULT_EAGLE_TARGET_MODEL_FOR_TEST,
1210
DEFAULT_MLA_MODEL_NAME_FOR_TEST,
1311
DEFAULT_MODEL_NAME_FOR_TEST,
1412
DEFAULT_TIMEOUT_FOR_SERVER_LAUNCH,
@@ -125,7 +123,7 @@ def get_server_args(cls):
125123
class TestFlashAttention3SpeculativeDecode(BaseFlashAttentionTest):
126124
"""Test FlashAttention3 with speculative decode enabled."""
127125

128-
model = DEFAULT_EAGLE_TARGET_MODEL_FOR_TEST
126+
model = "meta-llama/Llama-3.1-8B-Instruct"
129127

130128
@classmethod
131129
def get_server_args(cls):
@@ -137,7 +135,7 @@ def get_server_args(cls):
137135
"--speculative-algorithm",
138136
"EAGLE3",
139137
"--speculative-draft",
140-
DEFAULT_EAGLE_DRAFT_MODEL_FOR_TEST,
138+
"jamesliu1/sglang-EAGLE3-Llama-3.1-Instruct-8B",
141139
"--speculative-num-steps",
142140
"3",
143141
"--speculative-eagle-topk",

0 commit comments

Comments
 (0)