4 files changed
+11
-2
lines changed+2-1
Original file line number | Diff line number | Diff line change | |
---|---|---|---|
| |||
145 | 145 |
| |
146 | 146 |
| |
147 | 147 |
| |
148 |
| - | |
| 148 | + | |
| 149 | + |
Original file line number | Diff line number | Diff line change | |
---|---|---|---|
| |||
26 | 26 |
| |
27 | 27 |
| |
28 | 28 |
| |
| 29 | + | |
29 | 30 |
| |
30 | 31 |
| |
31 | 32 |
| |
|
Original file line number | Diff line number | Diff line change | |
---|---|---|---|
| |||
117 | 117 |
| |
118 | 118 |
| |
119 | 119 |
| |
| 120 | + | |
| 121 | + | |
| 122 | + | |
| 123 | + | |
| 124 | + | |
| 125 | + | |
| 126 | + | |
120 | 127 |
| |
121 | 128 |
| |
122 | 129 |
| |
|
- .github/workflows/python.yaml+1
- README.md+1-1
- README_ja_JP.md+1-1
- README_zh_CN.md+1-1
- doc/source/examples/index.rst+3-3
- doc/source/getting_started/using_xinference.rst+1-1
- examples/gradio_chatinterface.py+1-1
- setup.cfg+4-1
- xinference/api/restful_api.py+76-141
- xinference/client/common.py+5-5
- xinference/client/oscar/actor_client.py+5
- xinference/client/restful/restful_client.py+5
- xinference/client/tests/test_client.py+12-1
- xinference/conftest.py+19-5
- xinference/core/chat_interface.py+4-1
- xinference/core/model.py+72-5
- xinference/core/supervisor.py+97-28
- xinference/core/tests/test_restful_api.py+149-7
- xinference/core/tests/test_types.py+80
- xinference/core/tests/test_worker.py+109-4
- xinference/core/worker.py+80-18
- xinference/deploy/__init__.py+7
- xinference/deploy/cmdline.py+71-16
- xinference/deploy/test/test_cmdline.py+1-3
- xinference/deploy/utils.py+22-5
- xinference/fields.py+133
- xinference/model/core.py+16-3
- xinference/model/embedding/__init__.py+1-1
- xinference/model/embedding/core.py+24-4
- xinference/model/embedding/tests/test_embedding_models.py+64-40
- xinference/model/image/__init__.py+1-1
- xinference/model/image/core.py+36-3
- xinference/model/image/tests/test_stable_diffusion.py+33-14
- xinference/model/llm/__init__.py+1
- xinference/model/llm/core.py+16-3
- xinference/model/llm/ggml/ctransformers.py+13-6
- xinference/model/llm/ggml/llamacpp.py+19-20
- xinference/model/llm/llm_family.json+9
- xinference/model/llm/llm_family.py+31-1
- xinference/model/llm/llm_family_modelscope.json+11
- xinference/model/llm/pytorch/core.py+54-24
- xinference/model/llm/pytorch/spec_decoding_utils.py+3-2
- xinference/model/llm/pytorch/spec_model.py+2
- xinference/model/llm/pytorch/tests/test_spec_decoding.py+1
- xinference/model/llm/pytorch/utils.py+9-6
- xinference/model/llm/tests/test_llm_family.py+72
- xinference/model/utils.py+1-1
- xinference/types.py+138-2
- xinference/web/ui/src/scenes/launch_model/embeddingCard.js+15-29
- xinference/web/ui/src/scenes/launch_model/index.js+6-10
- xinference/web/ui/src/scenes/launch_model/launchEmbedding.js+15-11
- xinference/web/ui/src/scenes/launch_model/launchLLM.js+21-33
- xinference/web/ui/src/scenes/launch_model/modelCard.js+88-27
- xinference/web/ui/src/scenes/running_models/index.js+243-11
0 commit comments