Skip to content

Commit 2b31408

Browse files
committed
using dpsk v2 lite model
1 parent 97b8cb1 commit 2b31408

File tree

1 file changed

+3
-4
lines changed

1 file changed

+3
-4
lines changed

test/srt/test_flash_mla_attention_backend.py

Lines changed: 3 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -17,7 +17,7 @@
1717
)
1818

1919
# Use DeepSeek V3 model for testing
20-
DSV3_MODEL_FOR_TEST = "deepseek-ai/DeepSeek-V3"
20+
DSV3_MODEL_FOR_TEST = "deepseek-ai/DeepSeek-V2-Lite"
2121

2222

2323
class TestFlashMLAAttnBackend(unittest.TestCase):
@@ -30,6 +30,7 @@ def test_latency(self):
3030
"--enable-torch-compile",
3131
"--cuda-graph-max-bs",
3232
"16",
33+
"--trust-remote-code",
3334
],
3435
)
3536

@@ -56,9 +57,7 @@ def test_mmlu(self):
5657
)
5758

5859
metrics = run_eval(args)
59-
self.assertGreaterEqual(
60-
metrics["score"], 0.87
61-
) # Higher threshold based on DSV3 MMLU score from PR
60+
self.assertGreaterEqual(metrics["score"], 0.2)
6261
finally:
6362
kill_process_tree(process.pid)
6463

0 commit comments

Comments
 (0)