@@ -29,7 +29,7 @@ concurrency:
2929jobs :
3030
3131 unit-test-frontend :
32- if : github.repository == 'sgl-project/sglang' || github.event_name == 'pull_request'
32+ if : ( github.repository == 'sgl-project/sglang' || github.event_name == 'pull_request') && github.event.pull_request.draft == false
3333 runs-on : 1-gpu-runner
3434 steps :
3535 - name : Checkout code
@@ -48,11 +48,12 @@ jobs:
4848 python3 run_suite.py --suite per-commit
4949
5050 unit-test-backend-1-gpu :
51- if : github.repository == 'sgl-project/sglang' || github.event_name == 'pull_request'
51+ if : ( github.repository == 'sgl-project/sglang' || github.event_name == 'pull_request') && github.event.pull_request.draft == false
5252 runs-on : 1-gpu-runner
5353 strategy :
54+ fail-fast : false
5455 matrix :
55- range : [0-6, 6-16, 16-23, 23-30, 30-38, 38 -100]
56+ range : [0-6, 6-15, 15-22, 22-32, 32-40, 40 -100]
5657 steps :
5758 - name : Checkout code
5859 uses : actions/checkout@v3
7576
7677
7778 unit-test-backend-2-gpu :
78- if : github.repository == 'sgl-project/sglang' || github.event_name == 'pull_request'
79+ if : ( github.repository == 'sgl-project/sglang' || github.event_name == 'pull_request') && github.event.pull_request.draft == false
7980 runs-on : 2-gpu-runner
8081 steps :
8182 - name : Checkout code
@@ -112,7 +113,7 @@ jobs:
112113 python3 test_moe_ep.py
113114
114115 performance-test-1-gpu-part-1 :
115- if : github.repository == 'sgl-project/sglang' || github.event_name == 'pull_request'
116+ if : ( github.repository == 'sgl-project/sglang' || github.event_name == 'pull_request') && github.event.pull_request.draft == false
116117 runs-on : 1-gpu-runner
117118 steps :
118119 - name : Checkout code
@@ -128,7 +129,7 @@ jobs:
128129 timeout-minutes : 10
129130 run : |
130131 cd test/srt
131- python3 -m unittest test_bench_one_batch.TestBenchOneBatch.test_default
132+ python3 -m unittest test_bench_one_batch.TestBenchOneBatch.test_bs1
132133
133134 - name : Benchmark online latency
134135 timeout-minutes : 10
@@ -148,8 +149,15 @@ jobs:
148149 cd test/srt
149150 python3 -m unittest test_bench_serving.TestBenchServing.test_offline_throughput_non_stream_small_batch_size
150151
152+ - name : Benchmark online latency (EAGLE)
153+ timeout-minutes : 10
154+ run : |
155+ cd test/srt
156+ python3 -m unittest test_bench_serving.TestBenchServing.test_online_latency_eagle
157+
158+
151159 performance-test-1-gpu-part-2 :
152- if : github.repository == 'sgl-project/sglang' || github.event_name == 'pull_request'
160+ if : ( github.repository == 'sgl-project/sglang' || github.event_name == 'pull_request') && github.event.pull_request.draft == false
153161 runs-on : 1-gpu-runner
154162 steps :
155163 - name : Checkout code
@@ -180,7 +188,7 @@ jobs:
180188 python3 -m unittest test_bench_serving.TestBenchServing.test_offline_throughput_default_fp8
181189
182190 performance-test-2-gpu :
183- if : github.repository == 'sgl-project/sglang' || github.event_name == 'pull_request'
191+ if : ( github.repository == 'sgl-project/sglang' || github.event_name == 'pull_request') && github.event.pull_request.draft == false
184192 runs-on : 2-gpu-runner
185193 steps :
186194 - name : Checkout code
@@ -196,7 +204,13 @@ jobs:
196204 timeout-minutes : 10
197205 run : |
198206 cd test/srt
199- python3 -m unittest test_bench_one_batch.TestBenchOneBatch.test_moe_default
207+ python3 -m unittest test_bench_one_batch.TestBenchOneBatch.test_moe_tp2_bs1
208+
209+ - name : Benchmark single latency + torch.compile (TP=2)
210+ timeout-minutes : 10
211+ run : |
212+ cd test/srt
213+ python3 -m unittest test_bench_one_batch.TestBenchOneBatch.test_torch_compile_tp2_bs1
200214
201215 - name : Benchmark offline throughput (TP=2)
202216 timeout-minutes : 10
@@ -210,8 +224,9 @@ jobs:
210224 cd test/srt
211225 python3 -m unittest test_bench_serving.TestBenchServing.test_moe_offline_throughput_without_radix_cache
212226
227+
213228 accuracy-test-1-gpu :
214- if : github.repository == 'sgl-project/sglang' || github.event_name == 'pull_request'
229+ if : ( github.repository == 'sgl-project/sglang' || github.event_name == 'pull_request') && github.event.pull_request.draft == false
215230 runs-on : 1-gpu-runner
216231 steps :
217232 - name : Checkout code
@@ -235,7 +250,7 @@ jobs:
235250
236251
237252 accuracy-test-2-gpu :
238- if : github.repository == 'sgl-project/sglang' || github.event_name == 'pull_request'
253+ if : ( github.repository == 'sgl-project/sglang' || github.event_name == 'pull_request') && github.event.pull_request.draft == false
239254 runs-on : 2-gpu-runner
240255 steps :
241256 - name : Checkout code
0 commit comments