|
| 1 | +| ModelId | ModelSeries | ModelType | Supported Engines | Supported Instances | Supported Services | Support China Region | |
| 2 | +|:----------------------------------|:-------------------------|:------------|:--------------------|:---------------------------------------------------------------------------------------------------------------------|:------------------------------|:-----------------------| |
| 3 | +| glm-4-9b-chat | glm4 | llm | vllm | g5.12xlarge,g5.24xlarge,g5.48xlarge | sagemaker,sagemaker_async,ecs | ✅ | |
| 4 | +| internlm2_5-20b-chat-4bit-awq | internlm2.5 | llm | vllm | g5.2xlarge,g5.4xlarge,g5.8xlarge,g5.12xlarge,g5.16xlarge,g5.24xlarge,g5.48xlarge | sagemaker,sagemaker_async,ecs | ✅ | |
| 5 | +| internlm2_5-20b-chat | internlm2.5 | llm | vllm | g5.12xlarge,g5.24xlarge,g5.48xlarge | sagemaker,sagemaker_async,ecs | ✅ | |
| 6 | +| internlm2_5-7b-chat | internlm2.5 | llm | vllm | g5.2xlarge,g5.4xlarge,g5.8xlarge,g5.12xlarge,g5.16xlarge,g5.24xlarge,g5.48xlarge | sagemaker,sagemaker_async,ecs | ✅ | |
| 7 | +| internlm2_5-7b-chat-4bit | internlm2.5 | llm | vllm | g5.2xlarge,g5.4xlarge,g5.8xlarge,g5.12xlarge,g5.16xlarge,g5.24xlarge,g5.48xlarge | sagemaker,sagemaker_async,ecs | ❎ | |
| 8 | +| internlm2_5-1_8b-chat | internlm2.5 | llm | vllm | g5.2xlarge,g5.4xlarge,g5.8xlarge,g5.12xlarge,g5.16xlarge,g5.24xlarge,g5.48xlarge | sagemaker,sagemaker_async,ecs | ✅ | |
| 9 | +| Qwen2.5-7B-Instruct | qwen2.5 | llm | vllm | g5.2xlarge,g5.4xlarge,g5.8xlarge,g5.12xlarge,g5.16xlarge,g5.24xlarge,g5.48xlarge | sagemaker,sagemaker_async,ecs | ✅ | |
| 10 | +| Qwen2.5-72B-Instruct-AWQ | qwen2.5 | llm | vllm,tgi | g5.12xlarge,g5.24xlarge,g5.48xlarge | sagemaker,sagemaker_async,ecs | ✅ | |
| 11 | +| Qwen2.5-72B-Instruct | qwen2.5 | llm | vllm | g5.48xlarge | sagemaker,sagemaker_async,ecs | ✅ | |
| 12 | +| Qwen2.5-72B-Instruct-AWQ-128k | qwen2.5 | llm | vllm | g5.12xlarge,g5.24xlarge,g5.48xlarge | sagemaker,sagemaker_async,ecs | ✅ | |
| 13 | +| Qwen2.5-32B-Instruct | qwen2.5 | llm | vllm | g5.12xlarge,g5.24xlarge,g5.48xlarge | sagemaker,sagemaker_async,ecs | ✅ | |
| 14 | +| Qwen2.5-0.5B-Instruct | qwen2.5 | llm | vllm,tgi | g5.2xlarge,g5.4xlarge,g5.8xlarge,g5.16xlarge,inf2.8xlarge | sagemaker,sagemaker_async,ecs | ✅ | |
| 15 | +| Qwen2.5-1.5B-Instruct | qwen2.5 | llm | vllm | g5.2xlarge,g5.4xlarge,g5.8xlarge,g5.16xlarge | sagemaker,sagemaker_async,ecs | ✅ | |
| 16 | +| Qwen2.5-3B-Instruct | qwen2.5 | llm | vllm | g5.2xlarge,g5.4xlarge,g5.8xlarge,g5.16xlarge | sagemaker,sagemaker_async,ecs | ✅ | |
| 17 | +| Qwen2.5-14B-Instruct-AWQ | qwen2.5 | llm | vllm | g5.2xlarge,g5.4xlarge,g5.8xlarge,g5.16xlarge | sagemaker,sagemaker_async,ecs | ✅ | |
| 18 | +| Qwen2.5-14B-Instruct | qwen2.5 | llm | vllm | g5.12xlarge,g5.24xlarge,g5.48xlarge | sagemaker,sagemaker_async,ecs | ✅ | |
| 19 | +| QwQ-32B-Preview | qwen reasoning model | llm | huggingface,vllm | g5.12xlarge,g5.24xlarge,g5.48xlarge | sagemaker,sagemaker_async,ecs | ✅ | |
| 20 | +| llama-3.3-70b-instruct-awq | llama | llm | tgi | g5.12xlarge,g5.24xlarge,g5.48xlarge | sagemaker,sagemaker_async,ecs | ❎ | |
| 21 | +| DeepSeek-R1-Distill-Qwen-32B | deepseek reasoning model | llm | vllm | g5.12xlarge,g5.24xlarge,g5.48xlarge | sagemaker,sagemaker_async,ecs | ❎ | |
| 22 | +| DeepSeek-R1-Distill-Qwen-14B | deepseek reasoning model | llm | vllm | g5.12xlarge,g5.24xlarge,g5.48xlarge | sagemaker,sagemaker_async,ecs | ❎ | |
| 23 | +| DeepSeek-R1-Distill-Qwen-7B | deepseek reasoning model | llm | vllm | g5.2xlarge,g5.4xlarge,g5.8xlarge,g5.16xlarge | sagemaker,sagemaker_async,ecs | ❎ | |
| 24 | +| DeepSeek-R1-Distill-Qwen-1.5B | deepseek reasoning model | llm | vllm | g5.2xlarge,g5.4xlarge,g5.8xlarge,g5.16xlarge | sagemaker,sagemaker_async,ecs | ❎ | |
| 25 | +| DeepSeek-R1-Distill-Llama-8B | deepseek reasoning model | llm | vllm | g5.2xlarge,g5.4xlarge,g5.8xlarge,g5.16xlarge | sagemaker,sagemaker_async,ecs | ❎ | |
| 26 | +| deepseek-r1-distill-llama-70b-awq | deepseek reasoning model | llm | tgi,vllm | g5.12xlarge,g5.24xlarge,g5.48xlarge | sagemaker,sagemaker_async,ecs | ✅ | |
| 27 | +| Baichuan-M1-14B-Instruct | baichuan | llm | huggingface | g5.12xlarge,g5.24xlarge,g5.48xlarge | sagemaker,sagemaker_async,ecs | ❎ | |
| 28 | +| Qwen2-VL-72B-Instruct-AWQ | qwen2vl | vlm | vllm | g5.12xlarge,g5.24xlarge,g5.48xlarge | sagemaker,sagemaker_async | ✅ | |
| 29 | +| QVQ-72B-Preview-AWQ | qwen reasoning model | vlm | vllm | g5.12xlarge,g5.24xlarge,g5.48xlarge | sagemaker,sagemaker_async | ❎ | |
| 30 | +| Qwen2-VL-7B-Instruct | qwen2vl | vlm | vllm | g5.2xlarge,g5.4xlarge,g5.8xlarge,g5.12xlarge,g5.16xlarge,g5.24xlarge,g5.48xlarge,g6e.2xlarge | sagemaker,sagemaker_async | ✅ | |
| 31 | +| InternVL2_5-78B-AWQ | internvl2.5 | vlm | lmdeploy | g5.12xlarge,g5.24xlarge,g5.48xlarge | sagemaker,sagemaker_async | ❎ | |
| 32 | +| txt2video-LTX | comfyui | video | comfyui | g5.4xlarge,g5.8xlarge,g6e.2xlarge | sagemaker_async | ❎ | |
| 33 | +| whisper | whisper | whisper | huggingface | g5.xlarge,g5.2xlarge,g5.4xlarge,g5.8xlarge,g5.16xlarge | sagemaker_async | ❎ | |
| 34 | +| bge-base-en-v1.5 | bge | embedding | vllm | g5.xlarge,g5.2xlarge,g5.4xlarge,g5.8xlarge,g5.16xlarge | sagemaker | ✅ | |
| 35 | +| bge-m3 | bge | embedding | vllm | g5.xlarge,g5.2xlarge,g5.4xlarge,g5.8xlarge,g5.16xlarge | sagemaker,ecs | ✅ | |
| 36 | +| bge-reranker-v2-m3 | bge | rerank | vllm | g5.xlarge,g5.2xlarge,g5.4xlarge,g5.8xlarge,g5.16xlarge | sagemaker | ✅ | |
0 commit comments