File tree Expand file tree Collapse file tree 2 files changed +9
-1
lines changed Expand file tree Collapse file tree 2 files changed +9
-1
lines changed Original file line number Diff line number Diff line change @@ -118,6 +118,13 @@ class KtransformersEngine(OpenAICompitableEngine):
118
118
"default_cli_args" : "--max_num_seq 256 --max_model_len 16000 --chat-template emd/models/chat_templates/deepseek_r1_distill.jinja"
119
119
})
120
120
121
+ vllm_deepseek_r1_distill_qwen_engine085 = VllmEngine (** {
122
+ ** vllm_engine064 .model_dump (),
123
+ "engine_dockerfile_config" : {"VERSION" :"v0.8.5" },
124
+ "default_cli_args" : "--max_num_seq 256 --max_model_len 16000 --chat-template emd/models/chat_templates/deepseek_r1_distill.jinja"
125
+ })
126
+
127
+
121
128
vllm_deepseek_r1_distill_llama_engine071 = vllm_deepseek_r1_distill_qwen_engine071
122
129
123
130
vllm_deepseek_r1_engine084 = VllmEngine (** {
Original file line number Diff line number Diff line change 1
1
from .. import Model
2
2
from ..engines import (
3
3
vllm_deepseek_r1_distill_qwen_engine071 ,
4
+ vllm_deepseek_r1_distill_qwen_engine085 ,
4
5
vllm_deepseek_r1_distill_llama_engine071 ,
5
6
ollama_deepseek_r1_qwen2d5_1d5b_engine057 ,
6
7
llama_cpp_deepseek_r1_1d58_bit_engine_b9ab0a4 ,
307
308
Model .register (
308
309
dict (
309
310
model_id = "DeepSeek-R1-0528-Qwen3-8B" ,
310
- supported_engines = [vllm_deepseek_r1_distill_llama_engine071 ],
311
+ supported_engines = [vllm_deepseek_r1_distill_qwen_engine085 ],
311
312
supported_instances = [
312
313
g5dxlarge_instance ,
313
314
g5d2xlarge_instance ,
You can’t perform that action at this time.
0 commit comments