mirror of
https://github.com/NVIDIA/TensorRT-LLM.git
synced 2026-01-14 06:27:45 +08:00
* Update TensorRT-LLM --------- Co-authored-by: Starrick Liu <73152103+StarrickLiu@users.noreply.github.com>
42 lines
720 B
Plaintext
42 lines
720 B
Plaintext
accelerate>=0.25.0
|
|
build
|
|
colored
|
|
cuda-python # Do not override the custom version of cuda-python installed in the NGC PyTorch image.
|
|
diffusers>=0.27.0
|
|
lark
|
|
mpi4py
|
|
numpy<2
|
|
onnx>=1.12.0
|
|
onnx_graphsurgeon>=0.5.2
|
|
openai==1.54.3
|
|
polygraphy
|
|
psutil
|
|
pynvml>=11.5.0
|
|
pulp
|
|
pandas
|
|
h5py==3.12.1
|
|
StrEnum
|
|
sentencepiece>=0.1.99
|
|
tensorrt~=10.7.0
|
|
# The NGC PyTorch 24.11 image uses torch 2.6.0a0, hence the <=2.6.0a0 upper bound on torch; see https://docs.nvidia.com/deeplearning/frameworks/pytorch-release-notes/rel-24-11.html#rel-24-11
|
|
torch>=2.5.1,<=2.6.0a0
|
|
torchvision
|
|
nvidia-modelopt[torch]~=0.19.0
|
|
nvidia-nccl-cu12
|
|
transformers>=4.38.2,<=4.45.1
|
|
pydantic>=2.9.1
|
|
pillow==10.3.0
|
|
wheel
|
|
optimum
|
|
evaluate
|
|
mpmath>=1.3.0
|
|
click
|
|
click_option_group
|
|
aenum
|
|
pyzmq
|
|
fastapi==0.115.4
|
|
uvicorn
|
|
httpx
|
|
setuptools==70.3.0
|
|
ordered-set
|