Skip to content

Commit afc58a9

Browse files
committed
feat: update vllm versions
1 parent 08d53e8 commit afc58a9

File tree

2 files changed

+9
-1
lines changed

2 files changed

+9
-1
lines changed

src/emd/models/engines.py

Lines changed: 7 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -118,6 +118,13 @@ class KtransformersEngine(OpenAICompitableEngine):
118118
"default_cli_args": "--max_num_seq 256 --max_model_len 16000 --chat-template emd/models/chat_templates/deepseek_r1_distill.jinja"
119119
})
120120

121+
vllm_deepseek_r1_distill_qwen_engine085 = VllmEngine(**{
122+
**vllm_engine064.model_dump(),
123+
"engine_dockerfile_config": {"VERSION":"v0.8.5"},
124+
"default_cli_args": "--max_num_seq 256 --max_model_len 16000 --chat-template emd/models/chat_templates/deepseek_r1_distill.jinja"
125+
})
126+
127+
121128
vllm_deepseek_r1_distill_llama_engine071 = vllm_deepseek_r1_distill_qwen_engine071
122129

123130
vllm_deepseek_r1_engine084 = VllmEngine(**{

src/emd/models/llms/deepseek.py

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1,6 +1,7 @@
11
from .. import Model
22
from ..engines import (
33
vllm_deepseek_r1_distill_qwen_engine071,
4+
vllm_deepseek_r1_distill_qwen_engine085,
45
vllm_deepseek_r1_distill_llama_engine071,
56
ollama_deepseek_r1_qwen2d5_1d5b_engine057,
67
llama_cpp_deepseek_r1_1d58_bit_engine_b9ab0a4,
@@ -307,7 +308,7 @@
307308
Model.register(
308309
dict(
309310
model_id = "DeepSeek-R1-0528-Qwen3-8B",
310-
supported_engines=[vllm_deepseek_r1_distill_llama_engine071],
311+
supported_engines=[vllm_deepseek_r1_distill_qwen_engine085],
311312
supported_instances=[
312313
g5dxlarge_instance,
313314
g5d2xlarge_instance,

0 commit comments

Comments
 (0)