Create requirements.txt
Browse files- requirements.txt +41 -0
requirements.txt
ADDED
@@ -0,0 +1,41 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
psutil
|
2 |
+
sentencepiece # Required for LLaMA tokenizer.
|
3 |
+
numpy < 2.0.0
|
4 |
+
requests >= 2.26.0
|
5 |
+
tqdm
|
6 |
+
blake3
|
7 |
+
py-cpuinfo
|
8 |
+
transformers >= 4.45.2 # Required for Llama 3.2 and Qwen2-VL.
|
9 |
+
tokenizers >= 0.19.1 # Required for Llama 3.
|
10 |
+
protobuf # Required by LlamaTokenizer.
|
11 |
+
fastapi >= 0.107.0, < 0.113.0; python_version < '3.9'
|
12 |
+
fastapi >= 0.107.0, != 0.113.*, != 0.114.0; python_version >= '3.9'
|
13 |
+
aiohttp
|
14 |
+
openai >= 1.52.0 # Ensure a modern openai package (types module present and max_completion_tokens field supported)
|
15 |
+
uvicorn[standard]
|
16 |
+
pydantic >= 2.9 # Required for fastapi >= 0.113.0
|
17 |
+
prometheus_client >= 0.18.0
|
18 |
+
pillow # Required for image processing
|
19 |
+
prometheus-fastapi-instrumentator >= 7.0.0
|
20 |
+
tiktoken >= 0.6.0 # Required for DBRX tokenizer
|
21 |
+
lm-format-enforcer >= 0.10.9, < 0.11
|
22 |
+
outlines == 0.1.11
|
23 |
+
lark == 1.2.2
|
24 |
+
xgrammar >= 0.1.6; platform_machine == "x86_64"
|
25 |
+
typing_extensions >= 4.10
|
26 |
+
filelock >= 3.16.1 # needs to include https://github.com/tox-dev/filelock/pull/317
|
27 |
+
partial-json-parser # used for parsing partial JSON outputs
|
28 |
+
pyzmq
|
29 |
+
msgspec
|
30 |
+
gguf == 0.10.0
|
31 |
+
importlib_metadata
|
32 |
+
mistral_common[opencv] >= 1.5.0
|
33 |
+
pyyaml
|
34 |
+
six>=1.16.0; python_version > '3.11' # transitive dependency of pandas that needs to be the latest version for python 3.12
|
35 |
+
setuptools>=74.1.1; python_version > '3.11' # Setuptools is used by triton; we need to ensure a modern version is installed for 3.12+ so that it does not try to import distutils, which was removed in 3.12
|
36 |
+
einops # Required for Qwen2-VL.
|
37 |
+
compressed-tensors == 0.9.0 # required for compressed-tensors
|
38 |
+
depyf==0.18.0 # required for profiling and debugging with compilation config
|
39 |
+
cloudpickle # allows pickling lambda functions in model_executor/models/registry.py
|
40 |
+
ray[default] >= 2.9
|
41 |
+
nvidia-ml-py >= 12.560.30 # for pynvml package
|