Skip to content

Commit 3c4e0ee

Browse files
authored
[CI] Tune threshold (#5787)
1 parent 9c08882 commit 3c4e0ee

File tree

3 files changed: 5 additions (+5) and 5 deletions (-5).

test/srt/run_suite.py

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -82,10 +82,10 @@ class TestFile:
82 | 82 |   TestFile("test_triton_moe_channel_fp8_kernel.py", 25),
83 | 83 |   ],
84 | 84 |   "per-commit-2-gpu": [
85 |    | - TestFile("models/lora/test_lora_tp.py", 300),
   | 85 | + TestFile("models/lora/test_lora_tp.py", 150),
86 | 86 |   TestFile("test_data_parallelism.py", 90),
87 |    | - TestFile("test_dp_attention.py", 90),
88 |    | - TestFile("test_mla_tp.py", 420),
   | 87 | + TestFile("test_dp_attention.py", 150),
   | 88 | + TestFile("test_mla_tp.py", 174),
89 | 89 |   TestFile("test_moe_ep.py", 220),
90 | 90 |   TestFile("test_patch_torch.py", 30),
91 | 91 |   TestFile("test_update_weights_from_distributed.py", 100),

test/srt/test_bench_one_batch.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -51,7 +51,7 @@ def test_torch_compile_tp2_bs1(self):
51 | 51 |   f"### test_torch_compile_tp2_bs1\n"
52 | 52 |   f"output_throughput : {output_throughput:.2f} token/s\n"
53 | 53 |   )
54 |    | - self.assertGreater(output_throughput, 235)
   | 54 | + self.assertGreater(output_throughput, 225)
55 | 55 |
56 | 56 |
57 | 57 |   if __name__ == "__main__":

test/srt/test_torch_native_attention_backend.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -28,7 +28,7 @@ def test_latency(self):
28 | 28 |
29 | 29 |   if is_in_ci():
30 | 30 |   # Torch native backend is expected to be slower
31 |    | - assert output_throughput > 50, f"{output_throughput=}"
   | 31 | + self.assertGreater(output_throughput, 40)
32 | 32 |
33 | 33 |   def test_mmlu(self):
34 | 34 |   model = DEFAULT_MODEL_NAME_FOR_TEST

0 commit comments

Comments
 (0)