Skip to content

Commit 408ba02

Browse files
authored
Add Llama 4 to FA3 test (#5509)
1 parent 094891c commit 408ba02

File tree

4 files changed

+178
-104
lines changed

4 files changed

+178
-104
lines changed

.github/workflows/pr-test.yml

Lines changed: 20 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -87,6 +87,26 @@ jobs:
87 87
cd test/srt
88 88
python3 run_suite.py --suite per-commit-2-gpu
89 89
90+
unit-test-backend-8-gpu:
91+
if: (github.repository == 'sgl-project/sglang' || github.event_name == 'pull_request') &&
92+
github.event.pull_request.draft == false
93+
runs-on: 8-gpu-runner
94+
steps:
95+
- name: Checkout code
96+
uses: actions/checkout@v4
97+
98+
- name: Install dependencies
99+
env:
100+
FLASHINFER_REPO: ${{ inputs.version == 'nightly' && 'https://flashinfer.ai/whl/nightly/cu124/torch2.5/flashinfer-python' || 'https://flashinfer.ai/whl/cu124/torch2.5/flashinfer-python' }}
101+
run: |
102+
bash scripts/ci_install_dependency.sh
103+
104+
- name: Run test
105+
timeout-minutes: 30
106+
run: |
107+
cd test/srt
108+
python3 run_suite.py --suite per-commit-8-gpu
109+
90 110
performance-test-1-gpu-part-1:
91 111
if: (github.repository == 'sgl-project/sglang' || github.event_name == 'pull_request') &&
92 112
github.event.pull_request.draft == false

python/sglang/test/test_utils.py

Lines changed: 6 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -44,7 +44,13 @@
44 44
)
45 45

46 46
DEFAULT_MODEL_NAME_FOR_TEST = "meta-llama/Llama-3.1-8B-Instruct"
47+
DEFAULT_MODEL_NAME_FOR_TEST_EAGLE3 = "jamesliu1/sglang-EAGLE3-Llama-3.1-Instruct-8B"
48+
DEFAULT_MODEL_NAME_FOR_TEST_MLA = "lmsys/sglang-ci-dsv3-test"
49+
DEFAULT_MODEL_NAME_FOR_TEST_MLA_NEXTN = "lmsys/sglang-ci-dsv3-test-NextN"
47 50
DEFAULT_SMALL_MODEL_NAME_FOR_TEST = "meta-llama/Llama-3.2-1B-Instruct"
51+
DEFAULT_MODEL_NAME_FOR_TEST_LOCAL_ATTENTION = (
52+
"meta-llama/Llama-4-Scout-17B-16E-Instruct"
53+
)
48 54
DEFAULT_MOE_MODEL_NAME_FOR_TEST = "mistralai/Mixtral-8x7B-Instruct-v0.1"
49 55
DEFAULT_SMALL_MOE_MODEL_NAME_FOR_TEST = "Qwen/Qwen1.5-MoE-A2.7B"
50 56
DEFAULT_SMALL_EMBEDDING_MODEL_NAME_FOR_TEST = "Alibaba-NLP/gte-Qwen2-1.5B-instruct"

test/srt/run_suite.py

Lines changed: 3 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -30,7 +30,6 @@ class TestFile:
30 30
TestFile("test_chunked_prefill.py", 336),
31 31
TestFile("test_eagle_infer.py", 500),
32 32
TestFile("test_ebnf_constrained.py"),
33-
TestFile("test_fa3.py", 200),
34 33
TestFile("test_fp8_kernel.py", 8),
35 34
TestFile("test_embedding_openai_server.py", 36),
36 35
TestFile("test_hidden_states.py", 55),
@@ -91,6 +90,9 @@ class TestFile:
91 90
TestFile("test_update_weights_from_distributed.py", 100),
92 91
TestFile("test_verl_engine.py", 100),
93 92
],
93+
"per-commit-8-gpu": [
94+
TestFile("test_fa3.py", 30),
95+
],
94 96
"nightly": [
95 97
TestFile("test_nightly_gsm8k_eval.py"),
96 98
],

0 commit comments

Comments
 (0)