Skip to content

Commit d0e3041

Browse files
authored
Fix/fix qwen3 deploy (#157)
* merge * merge * add Mistral-Small-3.1-24B-Instruct-2503 * modify qwq-32b deploy * add txgemma model; * modify model list command * fix typo * add some ecs parameters * add glm4-z1 models * modify vllm backend * add qwen3 * fix cli bugs * fix * add deepseek r1/Qwen3-235B-A22B * fix local deploy account bug * add qwen 3 awq models * fix serialize_utils bugs * modify qwen3 deployment * modify docs * modify qwen3 engine; add strands client test * modify engine * merge
1 parent 58f3658 commit d0e3041

File tree

1 file changed

+11
-11
lines changed

1 file changed

+11
-11
lines changed

src/emd/models/llms/qwen.py

Lines changed: 11 additions & 11 deletions
Original file line number | Diff line number | Diff line change
@@ -539,7 +539,7 @@
539539
Model.register(
540540
dict(
541541
model_id = "Qwen3-0.6B",
542-
supported_engines=[vllm_qwen3_engin084],
542+
supported_engines=[vllm_qwen3_engin091],
543543
supported_instances=[
544544
g5d2xlarge_instance,
545545
g5d4xlarge_instance,
@@ -573,7 +573,7 @@
573573
Model.register(
574574
dict(
575575
model_id = "Qwen3-1.7B",
576-
supported_engines=[vllm_qwen3_engin084],
576+
supported_engines=[vllm_qwen3_engin091],
577577
supported_instances=[
578578
g5d2xlarge_instance,
579579
g5d4xlarge_instance,
@@ -608,7 +608,7 @@
608608
Model.register(
609609
dict(
610610
model_id = "Qwen3-4B",
611-
supported_engines=[vllm_qwen3_engin084],
611+
supported_engines=[vllm_qwen3_engin091],
612612
supported_instances=[
613613
g5d2xlarge_instance,
614614
g5d4xlarge_instance,
@@ -644,7 +644,7 @@
644644
Model.register(
645645
dict(
646646
model_id = "Qwen3-14B-AWQ",
647-
supported_engines=[vllm_qwen3_engin084],
647+
supported_engines=[vllm_qwen3_engin091],
648648
supported_instances=[
649649
g5d2xlarge_instance,
650650
g5d4xlarge_instance,
@@ -679,7 +679,7 @@
679679
Model.register(
680680
dict(
681681
model_id = "Qwen3-14B",
682-
supported_engines=[vllm_qwen3_engin084],
682+
supported_engines=[vllm_qwen3_engin091],
683683
supported_instances=[
684684
g5d12xlarge_instance,
685685
g5d24xlarge_instance,
@@ -714,7 +714,7 @@
714714
# Model.register(
715715
# dict(
716716
# model_id = "Qwen3-14B-FP8",
717-
# supported_engines=[vllm_qwen3_engin084],
717+
# supported_engines=[vllm_qwen3_engin091],
718718
# supported_instances=[
719719
# g5d2xlarge_instance,
720720
# g5d4xlarge_instance,
@@ -750,7 +750,7 @@
750750
Model.register(
751751
dict(
752752
model_id = "Qwen3-32B-AWQ",
753-
supported_engines=[vllm_qwen3_engin084],
753+
supported_engines=[vllm_qwen3_engin091],
754754
supported_instances=[
755755
g5d12xlarge_instance,
756756
g5d24xlarge_instance,
@@ -784,7 +784,7 @@
784784
Model.register(
785785
dict(
786786
model_id = "Qwen3-32B",
787-
supported_engines=[vllm_qwen3_engin084],
787+
supported_engines=[vllm_qwen3_engin091],
788788
supported_instances=[
789789
g5d12xlarge_instance,
790790
g5d24xlarge_instance,
@@ -817,7 +817,7 @@
817817
Model.register(
818818
dict(
819819
model_id = "Qwen3-30B-A3B",
820-
supported_engines=[vllm_qwen3_engin084],
820+
supported_engines=[vllm_qwen3_engin091],
821821
supported_instances=[
822822
g5d12xlarge_instance,
823823
g5d24xlarge_instance,
@@ -850,7 +850,7 @@
850850
Model.register(
851851
dict(
852852
model_id = "Qwen3-235B-A22B",
853-
supported_engines=[vllm_qwen3_engin084],
853+
supported_engines=[vllm_qwen3_engin091],
854854
supported_instances=[
855855
local_instance
856856
],
@@ -874,7 +874,7 @@
874874
Model.register(
875875
dict(
876876
model_id = "Qwen3-235B-A22B-FP8",
877-
supported_engines=[vllm_qwen3_engin084],
877+
supported_engines=[vllm_qwen3_engin091],
878878
supported_instances=[
879879
local_instance
880880
],

0 commit comments

Comments
 (0)