# setup.cfg -- packaging and tool configuration for xinference.
# This copy comes from a fork of xorbitsai/inference.
# Package metadata read by setuptools' declarative configuration.
[metadata]
name = xinference
description = Model Serving Made Easy
author = Qin Xuye
# NOTE(review): "[email protected]" looks like an email-obfuscation placeholder
# rather than a real address -- confirm and restore the actual contact.
author_email = [email protected]
maintainer = Qin Xuye
maintainer_email = [email protected]
license = Apache License 2.0
url = https://github.com/xorbitsai/inference
# "classifier" is accepted by setuptools as an alias of "classifiers".
classifier =
    Operating System :: OS Independent
    Programming Language :: Python
    Programming Language :: Python :: 3
    Programming Language :: Python :: 3.9
    Programming Language :: Python :: 3.10
    Programming Language :: Python :: 3.11
    Programming Language :: Python :: 3.12
    Programming Language :: Python :: Implementation :: CPython
    Topic :: Software Development :: Libraries

# Build options and the dependencies every installation needs.
[options]
# python_requires is an [options] key. Under [metadata] setuptools does not
# recognise it, so the package was built without a Requires-Python constraint.
python_requires = >=3.9
zip_safe = False
include_package_data = True
packages = find:
# Continuation lines must stay indented deeper than the key.
install_requires =
    xoscar>=0.3.0
    torch
    gradio
    pillow
    click
    tqdm>=4.27
    tabulate
    requests
    pydantic
    fastapi>=0.110.3
    uvicorn
    huggingface-hub>=0.19.4
    typing_extensions
    modelscope>=1.10.0
    sse_starlette>=1.6.5 # ensure_bytes API break change: https://github.com/sysid/sse-starlette/issues/65
    openai>1 # For typing
    python-jose[cryptography]
    passlib[bcrypt]
    aioprometheus[starlette]>=23.12.0
    nvidia-ml-py
    async-timeout
    peft
    timm
# Package discovery filter for "packages = find:".
[options.packages.find]
# Patterns for test packages and conftest modules left out of the distribution.
exclude =
    *.tests
    *.tests.*
    *.conftest*
# Optional dependency groups, installed as xinference[<name>].
[options.extras_require]
# Development toolchain.
dev =
    # Build
    cython>=0.29
    # Testing
    pytest>=3.5.0
    pytest-cov>=2.5.0
    pytest-timeout>=1.2.0
    pytest-forked>=1.0
    pytest-asyncio>=0.14.0
    pytest-mock>=3.11.1
    # Documentation
    ipython>=6.5.0
    sphinx>=3.0.0
    pydata-sphinx-theme>=0.3.0
    sphinx-intl>=0.9.9
    sphinx-tabs
    sphinx-design
    jieba>=0.42.0
    # Linting and formatting
    flake8>=3.8.0
    black
    # Other libraries
    openai>1
    langchain
    langchain-community
    orjson
# Everything: the union of the backend and modality extras, with platform markers.
# Each requirement is listed once; where a package serves several features the
# trailing note names all of them, so a pin only has to be changed in one place.
all =
    llama-cpp-python>=0.2.25,!=0.2.58
    transformers>=4.43.2
    torch>=2.0.0 # >=2.0 For CosyVoice
    accelerate>=0.28.0 # also For got_ocr2
    sentencepiece
    transformers_stream_generator
    bitsandbytes
    protobuf
    einops
    tiktoken>=0.6.0
    sentence-transformers>=3.1.0
    vllm>=0.2.6 ; sys_platform=='linux'
    diffusers>=0.30.0 # also For CosyVoice, matcha
    imageio-ffmpeg # For video
    controlnet_aux
    orjson
    auto-gptq ; sys_platform!='darwin'
    autoawq<0.2.6 ; sys_platform!='darwin' # autoawq 0.2.6 pinned torch to 2.3
    optimum
    outlines>=0.0.34
    sglang>=0.2.7 ; sys_platform=='linux'
    mlx-lm ; sys_platform=='darwin' and platform_machine=='arm64'
    attrdict # For deepseek VL
    timm>=0.9.16 # For deepseek VL
    torchvision # For deepseek VL
    FlagEmbedding # For rerank
    funasr
    omegaconf~=2.3.0 # For ChatTTS
    nemo_text_processing<1.1.0 # 1.1.0 requires pynini==2.1.6.post1
    WeTextProcessing<1.0.4 # 1.0.4 requires pynini==2.1.6
    librosa # For ChatTTS
    xxhash # For ChatTTS
    torchaudio # For ChatTTS
    ChatTTS>=0.2
    lightning>=2.0.0 # For CosyVoice, matcha
    hydra-core>=1.3.2 # For CosyVoice, matcha
    inflect # For CosyVoice, matcha
    conformer # For CosyVoice, matcha
    gdown # For CosyVoice, matcha
    pyarrow # For CosyVoice, matcha
    HyperPyYAML # For CosyVoice
    onnxruntime==1.16.0 # For CosyVoice, use onnxruntime-gpu==1.16.0 if possible
    boto3>=1.28.55,<1.28.65 # For tensorizer
    tensorizer~=2.9.0
    eva-decord # For video in VL
    jj-pytorchvideo # For CogVLM2-video
    loguru # For Fish Speech
    natsort # For Fish Speech
    loralib # For Fish Speech
    ormsgpack # For Fish Speech
    qwen-vl-utils # For qwen2-vl
    datamodel_code_generator # for minicpm-4B
    jsonschema # for minicpm-4B
    verovio>=4.3.1 # For got_ocr2
# Exactly pinned torch / Intel Extension for PyTorch pair ("+xpu" build tag).
intel =
    torch==2.1.0a0
    intel_extension_for_pytorch==2.1.10+xpu

# llama.cpp Python bindings; release 0.2.58 is excluded.
llama_cpp =
    llama-cpp-python>=0.2.25,!=0.2.58
# Hugging Face transformers backend plus quantization and vision-language helpers.
# The two quantization packages are skipped on macOS via sys_platform markers.
transformers =
    transformers>=4.43.2
    torch
    accelerate>=0.28.0
    sentencepiece
    transformers_stream_generator
    bitsandbytes
    protobuf
    einops
    tiktoken
    auto-gptq ; sys_platform!='darwin'
    autoawq<0.2.6 ; sys_platform!='darwin' # autoawq 0.2.6 pinned torch to 2.3
    optimum
    attrdict # For deepseek VL
    timm>=0.9.16 # For deepseek VL
    torchvision # For deepseek VL
    peft
    eva-decord # For video in VL
    jj-pytorchvideo # For CogVLM2-video
    qwen-vl-utils # For qwen2-vl
    datamodel_code_generator # for minicpm-4B
    jsonschema # for minicpm-4B
# vLLM engine. Unlike the "all" extra, this entry carries no platform marker.
vllm =
    vllm>=0.2.6

# SGLang engine; sglang and its vllm requirement are restricted to Linux.
sglang =
    sglang>=0.2.7 ; sys_platform=='linux'
    vllm>=0.5.2 ; sys_platform=='linux'
    outlines>=0.0.34

# MLX engine. Unlike the "all" extra, this entry carries no platform marker.
mlx =
    mlx-lm

# Embedding models.
embedding =
    sentence-transformers>=3.1.0

# Rerank models.
rerank =
    FlagEmbedding
# Image models.
image =
    diffusers>=0.30.0 # fix conflict with matcha-tts
    controlnet_aux
    deepcache
    # For got_ocr2
    verovio>=4.3.1
    transformers>=4.37.2
    tiktoken>=0.6.0
    accelerate>=0.28.0
    torch
    torchvision

# Video models.
video =
    diffusers>=0.30.0
    imageio-ffmpeg
# Audio models; the inline notes name ChatTTS, CosyVoice/matcha and Fish Speech.
audio =
    funasr
    omegaconf~=2.3.0
    nemo_text_processing<1.1.0 # 1.1.0 requires pynini==2.1.6.post1
    WeTextProcessing<1.0.4 # 1.0.4 requires pynini==2.1.6
    librosa
    xxhash
    torchaudio
    ChatTTS>=0.2
    tiktoken # For CosyVoice, openai-whisper
    # For CosyVoice, matcha
    torch>=2.0.0
    lightning>=2.0.0
    hydra-core>=1.3.2
    inflect
    conformer
    diffusers>=0.30.0
    gdown
    pyarrow
    # For CosyVoice
    HyperPyYAML
    onnxruntime==1.16.0 # use onnxruntime-gpu==1.16.0 if possible
    # For Fish Speech
    loguru
    natsort
    loralib
    ormsgpack
# Documentation build requirements.
doc =
    ipython>=6.5.0
    sphinx>=3.0.0
    pydata-sphinx-theme>=0.3.0
    sphinx-intl>=0.9.9
    sphinx-tabs
    sphinx-design
    prometheus_client
    timm

# Benchmark requirements.
benchmark =
    psutil
# Command-line executables; each maps to a callable in xinference.deploy.cmdline.
[options.entry_points]
console_scripts =
    xinference = xinference.deploy.cmdline:cli
    xinference-local = xinference.deploy.cmdline:local
    xinference-supervisor = xinference.deploy.cmdline:supervisor
    xinference-worker = xinference.deploy.cmdline:worker
# coverage.py measurement settings.
[coverage:run]
# Loads the Cython.Coverage plugin, so Cython must be importable when coverage runs.
plugins = Cython.Coverage
branch = True
relative_files = True
cover_pylib = False
# Measure only the xinference package ...
include =
    xinference/*
# ... leaving out the version file, .pxd declarations and tests.
omit =
    xinference/_version.py
    *.pxd
    */tests/*
# coverage.py reporting settings.
[coverage:report]
# One pattern per line; source lines matching any of them are excluded from the report.
exclude_lines =
    pragma: no cover
    def __repr__
    raise AssertionError
    raise NotImplementedError
    return NotImplemented
# Versioneer settings: git as the VCS, pep440 style, tags prefixed with "v".
[versioneer]
VCS = git
style = pep440
tag_prefix = v
parentdir_prefix = xinference-
# The source and build settings both point at the same version file.
versionfile_source = xinference/_version.py
versionfile_build = xinference/_version.py
# flake8 lint settings.
[flake8]
max-line-length = 100
# Explicit allow-list of check codes (E, F and W families), one code per line.
select =
    E9,
    E101,
    E111,
    E117,
    E127,
    E201,
    E202,
    E223,
    E224,
    E225,
    E231,
    E242,
    E251,
    E273,
    E274,
    E275,
    E301,
    E302,
    E303,
    E304,
    E305,
    E401,
    E703,
    E901,
    E999,
    F7,
    F63,
    F82,
    F401,
    F811,
    F821,
    F822,
    F823,
    F841,
    W191,
    W291,
    W292,
    W293,
    W391,
    W601,
    W602,
    W603,
    W604,
    W605
# Paths that are not linted.
exclude =
    __init__.py
    __pycache__
    .git/
    .github/
    build/
    ci/
    dist/
    docs/
    thirdparty
# codespell settings.
[codespell]
# Comma-separated paths and globs left unchecked.
skip = .idea,.git,./build,./docs/build,node_modules,static,generated,*.po,*.ts,*.json,*.c,*.cpp,*.cfg,thirdparty
# Comma-separated words that must not be reported as misspellings.
ignore-words-list = hist,rcall,fpr,ser,nd,inout,ot,Ba,ba,asend,hart,coo,splitted,datas,fro
# isort settings: use the black profile and skip thirdparty.
[isort]
skip = thirdparty
profile = black
# mypy settings; "key = value" spacing matches the other sections in this file.
[mypy]
exclude = thirdparty
follow_imports = skip
ignore_missing_imports = True