@@ -36,19 +36,19 @@ jobs:
36
36
uses : actions/checkout@v4
37
37
38
38
- name : Start CI container
39
- run : bash scripts/amd_ci_start_container.sh
39
+ run : bash scripts/ci/ amd_ci_start_container.sh
40
40
env :
41
41
GITHUB_WORKSPACE : ${{ github.workspace }}
42
42
43
43
- name : Install dependencies
44
- run : bash scripts/amd_ci_install_dependency.sh
44
+ run : bash scripts/ci/ amd_ci_install_dependency.sh
45
45
46
46
- name : Evaluate Accuracy
47
47
timeout-minutes : 30
48
48
run : |
49
- bash scripts/amd_ci_exec.sh -e SGLANG_USE_AITER=0 python3 test_eval_accuracy_large.py
50
- bash scripts/amd_ci_exec.sh python3 test_eval_fp8_accuracy.py
51
- bash scripts/amd_ci_exec.sh python3 models/test_qwen_models.py
49
+ bash scripts/ci/ amd_ci_exec.sh -e SGLANG_USE_AITER=0 python3 test_eval_accuracy_large.py
50
+ bash scripts/ci/ amd_ci_exec.sh python3 test_eval_fp8_accuracy.py
51
+ bash scripts/ci/ amd_ci_exec.sh python3 models/test_qwen_models.py
52
52
53
53
accuracy-test-2-gpu-amd :
54
54
if : (github.repository == 'sgl-project/sglang' || github.event_name == 'pull_request') &&
@@ -62,17 +62,17 @@ jobs:
62
62
uses : actions/checkout@v4
63
63
64
64
- name : Start CI container
65
- run : bash scripts/amd_ci_start_container.sh
65
+ run : bash scripts/ci/ amd_ci_start_container.sh
66
66
env :
67
67
GITHUB_WORKSPACE : ${{ github.workspace }}
68
68
69
69
- name : Install dependencies
70
- run : bash scripts/amd_ci_install_dependency.sh
70
+ run : bash scripts/ci/ amd_ci_install_dependency.sh
71
71
72
72
- name : Evaluate accuracy (TP=2)
73
73
timeout-minutes : 30
74
74
run : |
75
- bash scripts/amd_ci_exec.sh -e SGLANG_USE_AITER=0 python3 test_moe_eval_accuracy_large.py
75
+ bash scripts/ci/ amd_ci_exec.sh -e SGLANG_USE_AITER=0 python3 test_moe_eval_accuracy_large.py
76
76
77
77
mla-test-1-gpu-amd :
78
78
if : (github.repository == 'sgl-project/sglang' || github.event_name == 'pull_request') &&
@@ -86,17 +86,17 @@ jobs:
86
86
uses : actions/checkout@v4
87
87
88
88
- name : Start CI container
89
- run : bash scripts/amd_ci_start_container.sh
89
+ run : bash scripts/ci/ amd_ci_start_container.sh
90
90
env :
91
91
GITHUB_WORKSPACE : ${{ github.workspace }}
92
92
93
93
- name : Install dependencies
94
- run : bash scripts/amd_ci_install_dependency.sh
94
+ run : bash scripts/ci/ amd_ci_install_dependency.sh
95
95
96
96
- name : MLA TEST
97
97
timeout-minutes : 30
98
98
run : |
99
- bash scripts/amd_ci_exec.sh python3 test_mla.py
99
+ bash scripts/ci/ amd_ci_exec.sh python3 test_mla.py
100
100
101
101
performance-test-1-gpu-part-1-amd :
102
102
if : (github.repository == 'sgl-project/sglang' || github.event_name == 'pull_request') &&
@@ -110,33 +110,33 @@ jobs:
110
110
uses : actions/checkout@v4
111
111
112
112
- name : Start CI container
113
- run : bash scripts/amd_ci_start_container.sh
113
+ run : bash scripts/ci/ amd_ci_start_container.sh
114
114
env :
115
115
GITHUB_WORKSPACE : ${{ github.workspace }}
116
116
117
117
- name : Install dependencies
118
- run : bash scripts/amd_ci_install_dependency.sh
118
+ run : bash scripts/ci/ amd_ci_install_dependency.sh
119
119
120
120
- name : Benchmark single latency
121
121
timeout-minutes : 20
122
122
run : |
123
- bash scripts/amd_ci_exec.sh python3 -m unittest test_bench_one_batch.TestBenchOneBatch.test_bs1_small
124
- bash scripts/amd_ci_exec.sh python3 -m unittest test_bench_one_batch.TestBenchOneBatch.test_bs1_default
123
+ bash scripts/ci/ amd_ci_exec.sh python3 -m unittest test_bench_one_batch.TestBenchOneBatch.test_bs1_small
124
+ bash scripts/ci/ amd_ci_exec.sh python3 -m unittest test_bench_one_batch.TestBenchOneBatch.test_bs1_default
125
125
126
126
- name : Benchmark online latency
127
127
timeout-minutes : 15
128
128
run : |
129
- bash scripts/amd_ci_exec.sh python3 -m unittest test_bench_serving.TestBenchServing.test_online_latency_default
129
+ bash scripts/ci/ amd_ci_exec.sh python3 -m unittest test_bench_serving.TestBenchServing.test_online_latency_default
130
130
131
131
- name : Benchmark offline throughput
132
132
timeout-minutes : 15
133
133
run : |
134
- bash scripts/amd_ci_exec.sh python3 -m unittest test_bench_serving.TestBenchServing.test_offline_throughput_default
134
+ bash scripts/ci/ amd_ci_exec.sh python3 -m unittest test_bench_serving.TestBenchServing.test_offline_throughput_default
135
135
136
136
- name : Benchmark offline throughput (Non-streaming, small batch size)
137
137
timeout-minutes : 15
138
138
run : |
139
- bash scripts/amd_ci_exec.sh python3 -m unittest test_bench_serving.TestBenchServing.test_offline_throughput_non_stream_small_batch_size
139
+ bash scripts/ci/ amd_ci_exec.sh python3 -m unittest test_bench_serving.TestBenchServing.test_offline_throughput_non_stream_small_batch_size
140
140
141
141
performance-test-1-gpu-part-2-amd :
142
142
if : (github.repository == 'sgl-project/sglang' || github.event_name == 'pull_request') &&
@@ -150,27 +150,27 @@ jobs:
150
150
uses : actions/checkout@v4
151
151
152
152
- name : Start CI container
153
- run : bash scripts/amd_ci_start_container.sh
153
+ run : bash scripts/ci/ amd_ci_start_container.sh
154
154
env :
155
155
GITHUB_WORKSPACE : ${{ github.workspace }}
156
156
157
157
- name : Install dependencies
158
- run : bash scripts/amd_ci_install_dependency.sh
158
+ run : bash scripts/ci/ amd_ci_install_dependency.sh
159
159
160
160
- name : Benchmark offline throughput (w/o RadixAttention)
161
161
timeout-minutes : 15
162
162
run : |
163
- bash scripts/amd_ci_exec.sh python3 -m unittest test_bench_serving.TestBenchServing.test_offline_throughput_without_radix_cache
163
+ bash scripts/ci/ amd_ci_exec.sh python3 -m unittest test_bench_serving.TestBenchServing.test_offline_throughput_without_radix_cache
164
164
165
165
- name : Benchmark offline throughput (w/ Triton)
166
166
timeout-minutes : 15
167
167
run : |
168
- bash scripts/amd_ci_exec.sh python3 -m unittest test_bench_serving.TestBenchServing.test_offline_throughput_with_triton_attention_backend
168
+ bash scripts/ci/ amd_ci_exec.sh python3 -m unittest test_bench_serving.TestBenchServing.test_offline_throughput_with_triton_attention_backend
169
169
170
170
- name : Benchmark offline throughput (w/ FP8)
171
171
timeout-minutes : 15
172
172
run : |
173
- bash scripts/amd_ci_exec.sh python3 -m unittest test_bench_serving.TestBenchServing.test_offline_throughput_default_fp8
173
+ bash scripts/ci/ amd_ci_exec.sh python3 -m unittest test_bench_serving.TestBenchServing.test_offline_throughput_default_fp8
174
174
175
175
bench-test-2-gpu-amd :
176
176
if : (github.repository == 'sgl-project/sglang' || github.event_name == 'pull_request') &&
@@ -184,37 +184,37 @@ jobs:
184
184
uses : actions/checkout@v4
185
185
186
186
- name : Start CI container
187
- run : bash scripts/amd_ci_start_container.sh
187
+ run : bash scripts/ci/ amd_ci_start_container.sh
188
188
env :
189
189
GITHUB_WORKSPACE : ${{ github.workspace }}
190
190
191
191
- name : Install dependencies
192
- run : bash scripts/amd_ci_install_dependency.sh
192
+ run : bash scripts/ci/ amd_ci_install_dependency.sh
193
193
194
194
- name : Benchmark dummy grok (TP=2)
195
195
timeout-minutes : 30
196
196
run : |
197
- bash scripts/amd_ci_exec.sh python3 models/test_dummy_grok_models.py
197
+ bash scripts/ci/ amd_ci_exec.sh python3 models/test_dummy_grok_models.py
198
198
199
199
- name : Benchmark single latency (TP=2)
200
200
timeout-minutes : 25
201
201
run : |
202
- bash scripts/amd_ci_exec.sh python3 -m unittest test_bench_one_batch.TestBenchOneBatch.test_moe_tp2_bs1
202
+ bash scripts/ci/ amd_ci_exec.sh python3 -m unittest test_bench_one_batch.TestBenchOneBatch.test_moe_tp2_bs1
203
203
204
204
- name : Benchmark single latency + torch.compile (TP=2)
205
205
timeout-minutes : 25
206
206
run : |
207
- bash scripts/amd_ci_exec.sh python3 -m unittest test_bench_one_batch.TestBenchOneBatch.test_torch_compile_tp2_bs1
207
+ bash scripts/ci/ amd_ci_exec.sh python3 -m unittest test_bench_one_batch.TestBenchOneBatch.test_torch_compile_tp2_bs1
208
208
209
209
- name : Benchmark offline throughput (TP=2)
210
210
timeout-minutes : 25
211
211
run : |
212
- bash scripts/amd_ci_exec.sh python3 -m unittest test_bench_serving.TestBenchServing.test_moe_offline_throughput_default
212
+ bash scripts/ci/ amd_ci_exec.sh python3 -m unittest test_bench_serving.TestBenchServing.test_moe_offline_throughput_default
213
213
214
214
- name : Benchmark offline throughput (w/o RadixAttention) (TP=2)
215
215
timeout-minutes : 25
216
216
run : |
217
- bash scripts/amd_ci_exec.sh python3 -m unittest test_bench_serving.TestBenchServing.test_moe_offline_throughput_without_radix_cache
217
+ bash scripts/ci/ amd_ci_exec.sh python3 -m unittest test_bench_serving.TestBenchServing.test_moe_offline_throughput_without_radix_cache
218
218
219
219
unit-test-backend-1-gpu-amd :
220
220
if : (github.repository == 'sgl-project/sglang' || github.event_name == 'pull_request') &&
@@ -230,17 +230,17 @@ jobs:
230
230
uses : actions/checkout@v4
231
231
232
232
- name : Start CI container
233
- run : bash scripts/amd_ci_start_container.sh
233
+ run : bash scripts/ci/ amd_ci_start_container.sh
234
234
env :
235
235
GITHUB_WORKSPACE : ${{ github.workspace }}
236
236
237
237
- name : Install dependencies
238
- run : bash scripts/amd_ci_install_dependency.sh
238
+ run : bash scripts/ci/ amd_ci_install_dependency.sh
239
239
240
240
- name : Run test
241
241
timeout-minutes : 50
242
242
run : |
243
- bash scripts/amd_ci_exec.sh python3 run_suite.py --suite per-commit-amd --auto-partition-id ${{ matrix.part }} --auto-partition-size 7
243
+ bash scripts/ci/ amd_ci_exec.sh python3 run_suite.py --suite per-commit-amd --auto-partition-id ${{ matrix.part }} --auto-partition-size 7
244
244
245
245
unit-test-backend-2-gpu-amd :
246
246
if : (github.repository == 'sgl-project/sglang' || github.event_name == 'pull_request') &&
@@ -254,17 +254,17 @@ jobs:
254
254
uses : actions/checkout@v4
255
255
256
256
- name : Start CI container
257
- run : bash scripts/amd_ci_start_container.sh
257
+ run : bash scripts/ci/ amd_ci_start_container.sh
258
258
env :
259
259
GITHUB_WORKSPACE : ${{ github.workspace }}
260
260
261
261
- name : Install dependencies
262
- run : bash scripts/amd_ci_install_dependency.sh
262
+ run : bash scripts/ci/ amd_ci_install_dependency.sh
263
263
264
264
- name : Run test
265
265
timeout-minutes : 40
266
266
run : |
267
- bash scripts/amd_ci_exec.sh python3 run_suite.py --suite per-commit-2-gpu-amd
267
+ bash scripts/ci/ amd_ci_exec.sh python3 run_suite.py --suite per-commit-2-gpu-amd
268
268
269
269
unit-test-backend-8-gpu-amd :
270
270
if : (github.repository == 'sgl-project/sglang' || github.event_name == 'pull_request') &&
@@ -278,22 +278,22 @@ jobs:
278
278
uses : actions/checkout@v4
279
279
280
280
- name : Start CI container
281
- run : bash scripts/amd_ci_start_container.sh
281
+ run : bash scripts/ci/ amd_ci_start_container.sh
282
282
env :
283
283
GITHUB_WORKSPACE : ${{ github.workspace }}
284
284
285
285
- name : Install dependencies
286
- run : bash scripts/amd_ci_install_dependency.sh
286
+ run : bash scripts/ci/ amd_ci_install_dependency.sh
287
287
288
288
- name : Run test
289
289
timeout-minutes : 60
290
290
run : |
291
- bash scripts/amd_ci_exec.sh python3 run_suite.py --suite per-commit-8-gpu-amd --timeout-per-file 3600
291
+ bash scripts/ci/ amd_ci_exec.sh python3 run_suite.py --suite per-commit-8-gpu-amd --timeout-per-file 3600
292
292
293
293
- name : Run CustomAllReduce test
294
294
timeout-minutes : 20
295
295
run : |
296
- bash scripts/amd_ci_exec.sh -e CUDA_VISIBLE_DEVICES=0,1,2,3,4,5,6,7 python3 -m unittest test_custom_allreduce.TestCustomAllReduce
296
+ bash scripts/ci/ amd_ci_exec.sh -e CUDA_VISIBLE_DEVICES=0,1,2,3,4,5,6,7 python3 -m unittest test_custom_allreduce.TestCustomAllReduce
297
297
298
298
unit-test-sgl-kernel-amd :
299
299
if : (github.repository == 'sgl-project/sglang' || github.event_name == 'pull_request') &&
@@ -308,13 +308,13 @@ jobs:
308
308
uses : actions/checkout@v4
309
309
310
310
- name : Start CI container
311
- run : bash scripts/amd_ci_start_container.sh
311
+ run : bash scripts/ci/ amd_ci_start_container.sh
312
312
env :
313
313
GITHUB_WORKSPACE : ${{ github.workspace }}
314
314
315
315
- name : Install dependencies
316
316
run : |
317
- bash scripts/amd_ci_install_dependency.sh
317
+ bash scripts/ci/ amd_ci_install_dependency.sh
318
318
319
319
- name : Run test
320
320
timeout-minutes : 10
0 commit comments