mirror of
https://github.com/NVIDIA/TensorRT-LLM.git
synced 2026-01-13 22:18:36 +08:00
* Move TRT-LLM backend repo to TRT-LLM repo Signed-off-by: Iman Tabrizian <10105175+tabrizian@users.noreply.github.com> * Address review comments Signed-off-by: Iman Tabrizian <10105175+tabrizian@users.noreply.github.com> * debug ci Signed-off-by: Iman Tabrizian <10105175+tabrizian@users.noreply.github.com> * Update triton backend Signed-off-by: Iman Tabrizian <10105175+tabrizian@users.noreply.github.com> * Fixes after update Signed-off-by: Iman Tabrizian <10105175+tabrizian@users.noreply.github.com> --------- Signed-off-by: Iman Tabrizian <10105175+tabrizian@users.noreply.github.com>
36 lines
779 B
Bash
36 lines
779 B
Bash
#!/bin/bash
|
|
|
|
#######################################
# Wait until the server's health endpoint reports ready.
#
# Polls http://localhost:<port>/v2/health/ready about once per second until
# it answers HTTP 200, the watched process disappears, or the time budget
# is used up.
#
# Globals:
#   WAIT_RET (written) - 0 once the endpoint answers HTTP 200; 1 if the
#                        server process is not running or the wait timed out.
# Arguments:
#   $1 - PID of the server process to watch.
#   $2 - maximum number of one-second polling attempts (default: 30).
#        A value <= 0 performs no polling and reports a timeout.
#   $3 - HTTP port on localhost to probe (default: 8000).
# Outputs:
#   A "=== ..." diagnostic line on stdout when the wait fails.
# Returns:
#   Always 0; callers must inspect WAIT_RET for the outcome.
#######################################
wait_for_server_ready() {
  local spid="$1"
  local wait_time_secs="${2:-30}"
  local triton_http_port="${3:-8000}"
  local remaining_secs="$wait_time_secs"
  local http_code

  WAIT_RET=0

  # "> 0" (rather than "until == 0") guarantees termination even when the
  # caller passes a negative timeout.
  while (( remaining_secs > 0 )); do
    # Signal 0 delivers nothing; it only checks that the PID still exists.
    if ! kill -0 "$spid"; then
      echo "=== Server not running."
      WAIT_RET=1
      return 0
    fi

    sleep 1

    # -o /dev/null discards the response body so that only the status code
    # written by -w is captured. "|| true" keeps a refused connection from
    # aborting the caller under errexit, without toggling the caller's
    # shell options the way "set +e ... set -e" would.
    http_code=$(curl -s -o /dev/null -w '%{http_code}' \
      "localhost:${triton_http_port}/v2/health/ready") || true
    if [[ "$http_code" == "200" ]]; then
      return 0
    fi

    # Plain assignment instead of ((x--)): an arithmetic command that
    # evaluates to 0 has exit status 1, which would trip errexit.
    remaining_secs=$(( remaining_secs - 1 ))
  done

  echo "=== Timeout $wait_time_secs secs. Server not ready."
  WAIT_RET=1
  return 0
}
|