Skip to content

Commit 3aaf8a3

Browse files
committed
Merge remote-tracking branch 'origin/main'
2 parents 9b9944a + a8debfd commit 3aaf8a3

File tree

1 file changed

+60
-0
lines changed

1 file changed

+60
-0
lines changed

src/emd/models/llms/qwen.py

Lines changed: 60 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -846,6 +846,66 @@
846846
)
847847
)
848848

849+
# Registry entry for the instruction-tuned Qwen3-30B-A3B 2507 checkpoint.
Model.register(
    dict(
        model_id="Qwen3-30B-A3B-Instruct-2507",
        # Engines, instance types, services and frameworks this entry
        # may be deployed with.
        supported_engines=[vllm_qwen3_engin091],
        supported_instances=[
            g5d12xlarge_instance,
            g5d24xlarge_instance,
            g5d48xlarge_instance,
            local_instance,
        ],
        supported_services=[
            sagemaker_service,
            sagemaker_async_service,
            ecs_service,
            local_service,
        ],
        supported_frameworks=[
            fastapi_framework,
        ],
        allow_china_region=True,
        # Weight sources: the same repository id is used on both hubs.
        huggingface_model_id="Qwen/Qwen3-30B-A3B-Instruct-2507",
        modelscope_model_id="Qwen/Qwen3-30B-A3B-Instruct-2507",
        require_huggingface_token=False,
        # Catalogue metadata.
        application_scenario="Agent, tool use, translation, summary, instruction following, reasoning",
        description="Qwen3-30B-A3B-Instruct-2507 is an updated instruction-tuned version featuring significant improvements in general capabilities, including instruction following, logical reasoning, text comprehension, mathematics, science, coding and tool usage, with enhanced 256K long-context understanding and better alignment with user preferences.",
        model_type=ModelType.LLM,
        model_series=QWEN3_SERIES,
    )
)
878+
879+
# Registry entry for the thinking-mode Qwen3-30B-A3B 2507 checkpoint.
Model.register(
    dict(
        model_id="Qwen3-30B-A3B-Thinking-2507",
        # Engines, instance types, services and frameworks this entry
        # may be deployed with.
        supported_engines=[vllm_qwen3_engin091],
        supported_instances=[
            g5d12xlarge_instance,
            g5d24xlarge_instance,
            g5d48xlarge_instance,
            local_instance,
        ],
        supported_services=[
            sagemaker_service,
            sagemaker_async_service,
            ecs_service,
            local_service,
        ],
        supported_frameworks=[
            fastapi_framework,
        ],
        allow_china_region=True,
        # Weight sources: the same repository id is used on both hubs.
        huggingface_model_id="Qwen/Qwen3-30B-A3B-Thinking-2507",
        modelscope_model_id="Qwen/Qwen3-30B-A3B-Thinking-2507",
        require_huggingface_token=False,
        # Catalogue metadata.
        application_scenario="Advanced reasoning, mathematics, science, coding, logical reasoning, complex problem solving",
        description="Qwen3-30B-A3B-Thinking-2507 is an enhanced thinking-enabled version featuring significantly improved performance on reasoning tasks, including logical reasoning, mathematics, science, coding, and academic benchmarks. This model supports only thinking mode with enhanced 256K long-context understanding and markedly better general capabilities for highly complex reasoning tasks.",
        model_type=ModelType.LLM,
        model_series=QWEN3_SERIES,
    )
)
908+
849909

850910
Model.register(
851911
dict(

0 commit comments

Comments
 (0)