1 file changed
+1
-1
lines changed- .github/workflows/python.yaml+1
- README.md+4-3
- README_zh_CN.md+4-3
- doc/source/getting_started/installation.rst+2-1
- doc/source/locale/zh_CN/LC_MESSAGES/user_guide/vllm_enhancement.po+73
- doc/source/models/builtin/image/hunyuandit-v1.2-distilled.rst+20
- doc/source/models/builtin/image/hunyuandit-v1.2.rst+20
- doc/source/models/builtin/image/index.rst+4
- doc/source/models/builtin/llm/index.rst+7
- doc/source/models/builtin/llm/minicpm3-4b.rst+1-1
- doc/source/models/builtin/llm/qvq-72b-preview.rst+47
- doc/source/models/builtin/video/hunyuanvideo.rst+18
- doc/source/models/builtin/video/index.rst+2
- doc/source/user_guide/backends.rst+1
- doc/source/user_guide/index.rst+1
- doc/source/user_guide/vllm_enhancement.rst+23
- setup.cfg+4-2
- xinference/api/restful_api.py+49-65
- xinference/client/tests/test_client.py+26
- xinference/core/model.py+77-19
- xinference/core/supervisor.py+81-10
- xinference/core/tests/test_continuous_batching.py-5
- xinference/core/utils.py+2-2
- xinference/core/worker.py+32
- xinference/model/image/model_spec.json+18
- xinference/model/image/model_spec_modelscope.json+20
- xinference/model/llm/__init__.py+2
- xinference/model/llm/llm_family.json+96
- xinference/model/llm/llm_family_modelscope.json+99
- xinference/model/llm/mlx/core.py+23-73
- xinference/model/llm/transformers/cogagent.py+272
- xinference/model/llm/transformers/core.py+1
- xinference/model/llm/transformers/qwen2_vl.py+10-1
- xinference/model/llm/utils.py+27-3
- xinference/model/llm/vllm/core.py+37-7
- xinference/model/llm/vllm/xavier/__init__.py+13
- xinference/model/llm/vllm/xavier/allocator.py+74
- xinference/model/llm/vllm/xavier/block.py+112
- xinference/model/llm/vllm/xavier/block_manager.py+71
- xinference/model/llm/vllm/xavier/block_tracker.py+116
- xinference/model/llm/vllm/xavier/engine.py+247
- xinference/model/llm/vllm/xavier/executor.py+132
- xinference/model/llm/vllm/xavier/scheduler.py+422
- xinference/model/llm/vllm/xavier/test/__init__.py+13
- xinference/model/llm/vllm/xavier/test/test_xavier.py+122
- xinference/model/llm/vllm/xavier/transfer.py+298
- xinference/model/video/diffusers.py+14
- xinference/model/video/model_spec.json+15
- xinference/model/video/model_spec_modelscope.json+16
- xinference/types.py+13
- xinference/web/ui/package-lock.json+69-3
- xinference/web/ui/package.json+2
- xinference/web/ui/src/App.js+16-17
- xinference/web/ui/src/components/MenuSide.js+55-44
- xinference/web/ui/src/components/Title.js+1-6
- xinference/web/ui/src/components/hotkeyFocusTextField.js+3-2
- xinference/web/ui/src/components/themeButton.js+20
- xinference/web/ui/src/components/themeContext.js+36
- xinference/web/ui/src/components/translateButton.js+74
- xinference/web/ui/src/i18n.js+24
- xinference/web/ui/src/index.js+2
- xinference/web/ui/src/locales/en.json+186
- xinference/web/ui/src/locales/zh.json+186
- xinference/web/ui/src/scenes/cluster_info/index.js+9-4
- xinference/web/ui/src/scenes/cluster_info/nodeInfo.js+52-28
- xinference/web/ui/src/scenes/launch_model/LaunchModelComponent.js+8-5
- xinference/web/ui/src/scenes/launch_model/index.js+16-9
- xinference/web/ui/src/scenes/launch_model/launchCustom.js+23-8
- xinference/web/ui/src/scenes/launch_model/launchLLM.js+16-11
- xinference/web/ui/src/scenes/launch_model/modelCard.js+238-93
- xinference/web/ui/src/scenes/launch_model/styles/modelCardStyle.css+4
- xinference/web/ui/src/scenes/register_model/components/addControlnet.js+8-4
- xinference/web/ui/src/scenes/register_model/components/addModelSpecs.js+18-12
- xinference/web/ui/src/scenes/register_model/components/addStop.js+6-3
- xinference/web/ui/src/scenes/register_model/index.js+21-7
- xinference/web/ui/src/scenes/register_model/registerModel.js+57-50
- xinference/web/ui/src/scenes/register_model/styles/registerModelStyle.css+4-4
- xinference/web/ui/src/scenes/running_models/index.js+30-28
- xinference/web/ui/src/theme.js+6-3
0 commit comments