21 lines
510 B
Plaintext
21 lines
510 B
Plaintext
cmake>=3.21
|
|
ninja # For faster builds.
|
|
psutil
|
|
ray >= 2.9
|
|
sentencepiece # Required for LLaMA tokenizer.
|
|
numpy
|
|
torch == 2.2.1
|
|
requests
|
|
py-cpuinfo
|
|
transformers >= 4.39.1 # Required for StarCoder2 & Llava.
|
|
xformers == 0.0.25 # Requires PyTorch 2.2.1.
|
|
fastapi
|
|
uvicorn[standard]
|
|
pydantic >= 2.0 # Required for OpenAI server.
|
|
prometheus_client >= 0.18.0
|
|
pynvml == 11.5.0
|
|
triton >= 2.1.0
|
|
outlines == 0.0.34
|
|
tiktoken == 0.6.0 # Required for the DBRX tokenizer.
|
|
vllm-nccl-cu12>=2.18,<2.19 # Used for downloading the NCCL library.
|