1 file changed
+1
-1
lines changed- doc/source/_static/xllamacpp_param.png
- doc/source/getting_started/installation.rst+3-15
- doc/source/getting_started/using_docker_image.rst+3-1
- doc/source/getting_started/using_xinference.rst+11
- doc/source/locale/zh_CN/LC_MESSAGES/getting_started/installation.po+17-25
- doc/source/locale/zh_CN/LC_MESSAGES/getting_started/using_docker_image.po+45-28
- doc/source/locale/zh_CN/LC_MESSAGES/getting_started/using_xinference.po+23-11
- doc/source/locale/zh_CN/LC_MESSAGES/user_guide/backends.po+118-133
- doc/source/models/builtin/image/index.rst+2
- doc/source/models/builtin/image/qwen-image.rst+20
- doc/source/models/builtin/llm/deepseek-r1-0528.rst+1-1
- doc/source/models/builtin/llm/gpt-oss.rst+47
- doc/source/models/builtin/llm/index.rst+3-3
- doc/source/models/builtin/llm/qwen3-coder.rst+1-1
- doc/source/models/builtin/llm/qwen3-instruct.rst+1-1
- doc/source/models/model_abilities/image.rst+9-2
- doc/source/models/model_abilities/tools.rst+3
- doc/source/user_guide/backends.rst+11
- setup.cfg+3
- xinference/api/restful_api.py+2-1
- xinference/core/model.py+5
- xinference/core/supervisor.py+2-3
- xinference/core/worker.py+3-4
- xinference/deploy/docker/Dockerfile+3-1
- xinference/deploy/docker/Dockerfile.cu128+4-4
- xinference/deploy/docker/requirements/requirements-models.txt+2-2
- xinference/deploy/docker/requirements_12.8/requirements-cu128-base.txt
- xinference/deploy/docker/requirements_12.8/requirements-cu128-ml.txt
- xinference/deploy/docker/requirements_12.8/requirements-cu128-models.txt+3-3
- xinference/deploy/local.py+5
- xinference/deploy/worker.py+6
- xinference/model/core.py+3
- xinference/model/embedding/sentence_transformers/core.py+3-4
- xinference/model/embedding/vllm/core.py+4-3
- xinference/model/image/model_spec.json+69
- xinference/model/image/stable_diffusion/core.py+22
- xinference/model/llm/cache_manager.py+17-3
- xinference/model/llm/harmony.py+245
- xinference/model/llm/llm_family.json+293-8
- xinference/model/llm/llm_family.py+1-1
- xinference/model/llm/sglang/core.py+108-5
- xinference/model/llm/tests/test_harmony.py+488
- xinference/model/llm/transformers/core.py+15-7
- xinference/model/llm/transformers/gemma3.py+1-1
- xinference/model/llm/transformers/gpt_oss.py+91
- xinference/model/llm/transformers/multimodal/core.py+1-1
- xinference/model/llm/transformers/multimodal/gemma3.py+1-1
- xinference/model/llm/transformers/multimodal/glm4_1v.py+2-2
- xinference/model/llm/transformers/multimodal/ovis2.py+1-1
- xinference/model/llm/transformers/multimodal/qwen-omni.py+7-8
- xinference/model/llm/transformers/multimodal/qwen2_vl.py+9-6
- xinference/model/llm/transformers/utils.py+1-33
- xinference/model/llm/utils.py+61-7
- xinference/model/llm/vllm/core.py+38-8
- xinference/model/rerank/__init__.py+66-23
- xinference/model/rerank/cache_manager.py+35
- xinference/model/rerank/core.py+84-339
- xinference/model/rerank/custom.py+33-8
- xinference/model/rerank/model_spec.json+251-212
- xinference/model/rerank/rerank_family.py+137
- xinference/model/rerank/sentence_transformers/__init__.py+13
- xinference/model/rerank/sentence_transformers/core.py+337
- xinference/model/rerank/sentence_transformers/tests/__init__.py
- xinference/model/rerank/sentence_transformers/tests/test_sentence_transformers.py+54
- xinference/model/rerank/tests/test_rerank.py+75-76
- xinference/model/rerank/vllm/__init__.py+13
- xinference/model/rerank/vllm/core.py+106
- xinference/model/rerank/vllm/tests/__init__.py
- xinference/model/rerank/vllm/tests/test_vllm.py+52
- xinference/model/utils.py+109
- xinference/types.py+2
- xinference/ui/web/ui/src/scenes/launch_model/data/data.js+3-2
- xinference/ui/web/ui/src/scenes/launch_model/modelCard.js+5-5
- xinference/ui/web/ui/src/scenes/register_model/components/addModelSpecs.js+15-2
- xinference/ui/web/ui/src/scenes/register_model/index.js+8-2
- xinference/ui/web/ui/src/scenes/register_model/registerModel.js+16-2
- xinference/ui/web/ui/src/scenes/running_models/index.js+5-1
0 commit comments