forked from NVIDIA/TensorRT-LLM
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathrequirements.txt
46 lines (46 loc) · 990 Bytes
/
requirements.txt
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
accelerate>=0.25.0
build
colored
cuda-python # Do not override the custom version of cuda-python installed in the NGC PyTorch image.
diffusers>=0.27.0
lark
mpi4py
numpy<2
onnx>=1.12.0
onnx_graphsurgeon>=0.5.2
openai
polygraphy
psutil
pynvml>=11.5.0
pulp
pandas
h5py==3.12.1
StrEnum
sentencepiece>=0.1.99
tensorrt~=10.8.0
# https://docs.nvidia.com/deeplearning/frameworks/pytorch-release-notes/rel-25-01.html#rel-25-01 uses 2.6.0a0.
torch>=2.5.1,<=2.6.0a0
torchvision
nvidia-modelopt[torch]~=0.23.0
nvidia-nccl-cu12
nvidia-cuda-nvrtc-cu12
# TODO: Remove the <4.48.0 constraint once https://github.com/huggingface/transformers/issues/35625 is resolved.
transformers>=4.47.0,<4.48.0
pydantic>=2.9.1
pillow==10.3.0
wheel
optimum
evaluate
mpmath>=1.3.0
click
click_option_group
aenum
pyzmq
fastapi==0.115.4
uvicorn
httpx
setuptools
ordered-set
peft
flashinfer @ git+https://github.com/flashinfer-ai/flashinfer.git@06309c4e
s2wrapper @ git+https://github.com/bfshi/scaling_on_scales.git@60da2afe