|
| 1 | +from ..engines import vllm_gptoss_engine |
| 2 | +from .. import Model |
| 3 | +from ..frameworks import fastapi_framework |
| 4 | +from ..services import ( |
| 5 | + sagemaker_service, |
| 6 | + sagemaker_async_service, |
| 7 | + ecs_service, |
| 8 | + local_service |
| 9 | +) |
| 10 | +from emd.models.utils.constants import ModelType |
| 11 | +from ..instances import ( |
| 12 | + g5d2xlarge_instance, |
| 13 | + g5d4xlarge_instance, |
| 14 | + g5d8xlarge_instance, |
| 15 | + g5d12xlarge_instance, |
| 16 | + g5d16xlarge_instance, |
| 17 | + g5d24xlarge_instance, |
| 18 | + g5d48xlarge_instance, |
| 19 | + g6e2xlarge_instance, |
| 20 | + local_instance |
| 21 | +) |
| 22 | +from ..utils.constants import ModelFilesDownloadSource |
| 23 | +from ..model_series import GPTOSS_SERIES |
# Register the gpt-oss-20b model configuration.
Model.register(
    {
        "model_id": "gpt-oss-20b",
        "supported_engines": [vllm_gptoss_engine],
        # NOTE: g5d24xlarge_instance and g5d48xlarge_instance are currently
        # not enabled for this model.
        "supported_instances": [
            g5d2xlarge_instance,
            g5d4xlarge_instance,
            g5d8xlarge_instance,
            g5d16xlarge_instance,
            local_instance,
        ],
        "supported_services": [
            sagemaker_service,
            sagemaker_async_service,
            ecs_service,
            local_service,
        ],
        "supported_frameworks": [fastapi_framework],
        "allow_china_region": True,
        # The same repository id is used for both download sources.
        "huggingface_model_id": "openai/gpt-oss-20b",
        "modelscope_model_id": "openai/gpt-oss-20b",
        "require_huggingface_token": False,
        "application_scenario": "Agent, tool use, translation, summary",
        "description": "GPT-OSS (GPT Open Source Software) is OpenAI's initiative to provide open-source AI models, making advanced language models accessible to developers, researchers, and organizations. These models are designed for building, experimenting, and scaling generative AI applications while fostering innovation and collaboration in the open-source AI community.",
        "model_type": ModelType.LLM,
        "model_series": GPTOSS_SERIES,
    }
)
| 56 | + |
| 57 | + |
# Register the gpt-oss-120b model configuration.
Model.register(
    {
        "model_id": "gpt-oss-120b",
        "supported_engines": [vllm_gptoss_engine],
        "supported_instances": [
            g5d12xlarge_instance,
            g5d24xlarge_instance,
            g5d48xlarge_instance,
            local_instance,
        ],
        "supported_services": [
            sagemaker_service,
            sagemaker_async_service,
            ecs_service,
            local_service,
        ],
        "supported_frameworks": [fastapi_framework],
        "allow_china_region": True,
        # The same repository id is used for both download sources.
        "huggingface_model_id": "openai/gpt-oss-120b",
        "modelscope_model_id": "openai/gpt-oss-120b",
        "require_huggingface_token": False,
        "application_scenario": "Agent, tool use, translation, summary",
        "description": "GPT-OSS (GPT Open Source Software) is OpenAI's initiative to provide open-source AI models, making advanced language models accessible to developers, researchers, and organizations. These models are designed for building, experimenting, and scaling generative AI applications while fostering innovation and collaboration in the open-source AI community.",
        "model_type": ModelType.LLM,
        "model_series": GPTOSS_SERIES,
    }
)
0 commit comments