|
846 | 846 | )
|
847 | 847 | )
|
848 | 848 |
|
# Registry entry for the Qwen3-30B-A3B-Instruct-2507 model.
Model.register(
    dict(
        model_id="Qwen3-30B-A3B-Instruct-2507",
        supported_engines=[vllm_qwen3_engin091],
        supported_instances=[
            g5d12xlarge_instance,
            g5d24xlarge_instance,
            g5d48xlarge_instance,
            local_instance,
        ],
        supported_services=[
            sagemaker_service,
            sagemaker_async_service,
            ecs_service,
            local_service,
        ],
        supported_frameworks=[
            fastapi_framework,
        ],
        allow_china_region=True,
        # The same repository id is used on both Hugging Face and ModelScope.
        huggingface_model_id="Qwen/Qwen3-30B-A3B-Instruct-2507",
        modelscope_model_id="Qwen/Qwen3-30B-A3B-Instruct-2507",
        require_huggingface_token=False,
        application_scenario="Agent, tool use, translation, summary, instruction following, reasoning",
        description="Qwen3-30B-A3B-Instruct-2507 is an updated instruction-tuned version featuring significant improvements in general capabilities, including instruction following, logical reasoning, text comprehension, mathematics, science, coding and tool usage, with enhanced 256K long-context understanding and better alignment with user preferences.",
        model_type=ModelType.LLM,
        model_series=QWEN3_SERIES,
    )
)
| 878 | + |
# Registry entry for the Qwen3-30B-A3B-Thinking-2507 model.
Model.register(
    dict(
        model_id="Qwen3-30B-A3B-Thinking-2507",
        supported_engines=[vllm_qwen3_engin091],
        supported_instances=[
            g5d12xlarge_instance,
            g5d24xlarge_instance,
            g5d48xlarge_instance,
            local_instance,
        ],
        supported_services=[
            sagemaker_service,
            sagemaker_async_service,
            ecs_service,
            local_service,
        ],
        supported_frameworks=[
            fastapi_framework,
        ],
        allow_china_region=True,
        # The same repository id is used on both Hugging Face and ModelScope.
        huggingface_model_id="Qwen/Qwen3-30B-A3B-Thinking-2507",
        modelscope_model_id="Qwen/Qwen3-30B-A3B-Thinking-2507",
        require_huggingface_token=False,
        application_scenario="Advanced reasoning, mathematics, science, coding, logical reasoning, complex problem solving",
        description="Qwen3-30B-A3B-Thinking-2507 is an enhanced thinking-enabled version featuring significantly improved performance on reasoning tasks, including logical reasoning, mathematics, science, coding, and academic benchmarks. This model supports only thinking mode with enhanced 256K long-context understanding and markedly better general capabilities for highly complex reasoning tasks.",
        model_type=ModelType.LLM,
        model_series=QWEN3_SERIES,
    )
)
| 908 | + |
849 | 909 |
|
850 | 910 | Model.register(
|
851 | 911 | dict(
|
|
0 commit comments