From 325a1ec4fbc007b7860238fff5fe4ba9e023b8cd Mon Sep 17 00:00:00 2001
From: yzong-rh
Date: Thu, 28 May 2026 19:36:31 -0400
Subject: [PATCH] [CI] Enable prefix caching in BFCL benchmark (#43925)

Signed-off-by: Yifan Zong
---
 .buildkite/scripts/tool_call/run-bfcl-eval.sh | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/.buildkite/scripts/tool_call/run-bfcl-eval.sh b/.buildkite/scripts/tool_call/run-bfcl-eval.sh
index 3748cab62c7..d50767ef0f2 100755
--- a/.buildkite/scripts/tool_call/run-bfcl-eval.sh
+++ b/.buildkite/scripts/tool_call/run-bfcl-eval.sh
@@ -70,7 +70,7 @@ echo "============================================"
 # ---- Install bfcl-eval if missing ----
 if ! python3 -c "import bfcl_eval" 2>/dev/null; then
     echo "Installing bfcl-eval..."
-    pip install "bfcl-eval>=2025.10.20.1,<2026"
+    uv pip install "bfcl-eval>=2025.10.20.1,<2026"
 fi
 
 # ---- Cleanup handler ----
@@ -100,7 +100,7 @@ SERVE_ARGS=(
     --tensor-parallel-size "$TP_SIZE"
     --max-model-len "$MAX_MODEL_LEN"
     --enforce-eager
-    --no-enable-prefix-caching
+    --enable-prefix-caching
 )
 
 # Append reasoning parser if specified