# TensorRT-LLMs/requirements.txt

accelerate>=0.25.0
build
colored
cuda-python # Do not override the custom version of cuda-python installed in the NGC PyTorch image.
diffusers>=0.27.0
lark
mpi4py
numpy<2
onnx>=1.12.0
onnx_graphsurgeon>=0.5.2
openai==1.54.3
polygraphy
psutil
pynvml>=11.5.0
pulp
pandas
h5py==3.12.1
StrEnum
sentencepiece>=0.1.99
tensorrt~=10.7.0
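# The NGC PyTorch 24.11 release uses torch 2.6.0a0, so the upper bound below must admit that pre-release build.
# See https://docs.nvidia.com/deeplearning/frameworks/pytorch-release-notes/rel-24-11.html#rel-24-11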
torch>=2.5.1,<=2.6.0a0
torchvision
nvidia-modelopt[torch]~=0.19.0
nvidia-nccl-cu12
transformers>=4.38.2,<=4.45.1
pydantic>=2.9.1
pillow==10.3.0
wheel
optimum
evaluate
mpmath>=1.3.0
click
click_option_group
aenum
pyzmq
fastapi==0.115.4
uvicorn
httpx
setuptools==70.3.0
ordered-set