You signed in with another tab or window. Reload to refresh your session. You signed out in another tab or window. Reload to refresh your session. You switched accounts on another tab or window. Reload to refresh your session. Dismiss alert
{{ message }}
This repository was archived by the owner on Sep 20, 2025. It is now read-only.
Copy file name to clipboard. Expand all lines: src/emd/models/model_series.py
+6 Lines changed: 6 additions & 0 deletions
Original file line number
Diff line number
Diff line change
@@ -157,3 +157,9 @@
157
157
description="General Multimodal Embedding (GME) models based on Qwen2-VL architecture, designed for unified multimodal representation learning supporting text, image, and image-text pair inputs for retrieval and search applications.",
description="dots.ocr is a powerful, multilingual document parser that unifies layout detection and content recognition within a single vision-language model while maintaining good reading order. Despite its compact 1.7B-parameter LLM foundation, it achieves state-of-the-art(SOTA) performance on text, tables, and reading order tasks with multilingual support for over 100 languages.",
from ..engines import vllm_dots_ocr_engine091, huggingface_llm_engine_4d41d2
4
+
from ..instances import (
5
+
g5d2xlarge_instance,
6
+
g5d4xlarge_instance,
7
+
g5d8xlarge_instance,
8
+
g5d12xlarge_instance,
9
+
g5d16xlarge_instance,
10
+
g5d24xlarge_instance,
11
+
g5d48xlarge_instance,
12
+
local_instance
13
+
)
14
+
from ..services import (
15
+
sagemaker_service,
16
+
sagemaker_async_service,
17
+
ecs_service,
18
+
local_service
19
+
)
20
+
from ..frameworks import fastapi_framework
21
+
from emd.models.utils.constants import ModelType
22
+
23
+
Model.register(
24
+
dict(
25
+
model_id="rednote-hilab-dots-ocr",
26
+
model_type=ModelType.VLM,
27
+
description="dots.ocr is a powerful, multilingual document parser that unifies layout detection and content recognition within a single vision-language model. Built on a compact 1.7B-parameter LLM foundation, it achieves state-of-the-art performance on text, tables, and reading order tasks with support for over 100 languages including English, Chinese, and many others.",
28
+
application_scenario="multilingual document layout parsing, OCR, document understanding, table extraction, formula recognition, reading order detection",
0 commit comments