mirror of
https://github.com/NVIDIA/TensorRT-LLM.git
synced 2026-01-14 06:27:45 +08:00
16 lines
212 B
Bash
16 lines
212 B
Bash
#!/bin/bash
#
# Launches Triton Inference Server against the `llmapi_repo` model repository.
# Expects to run in an environment where /code/ exists and contains that
# repository directory (the path passed to the server is relative).

# -e: abort on the first failing command; -x: trace each command as it runs.
set -ex

# All relative paths below (notably the model repository) resolve from here.
cd /code/

#######################################
# Start Triton Inference Server in the foreground.
# Globals:
#   UCX_UD_TIMEOUT (exported, set to 120s)
#   PMIX_MCA_gds   (exported, set to hash)
# Arguments:
#   None
# Returns:
#   The exit status of the tritonserver process.
#######################################
serve() {
  # NOTE(review): presumably raises the UCX UD transport timeout so slow
  # multi-process start-up does not trip it -- confirm against UCX docs.
  export UCX_UD_TIMEOUT=120s
  # Required. NOTE(review): appears to select PMIx's "hash" GDS component;
  # the reason it is mandatory is not visible here -- confirm.
  export PMIX_MCA_gds=hash

  # `llmapi_repo` is a relative path, so the caller's working directory
  # determines which repository is served.
  /opt/tritonserver/bin/tritonserver --model-repo llmapi_repo
}

# Task: record the visible GPU state in the log, then start the server.
# Under `set -e`, a failing nvidia-smi aborts before the server is launched.
nvidia-smi

# Runs in the foreground; the script ends when the server process exits.
serve