From 90ea6c1e093fc39dcba559d1086306187e160460 Mon Sep 17 00:00:00 2001 From: JunyiXu-nv <219237550+JunyiXu-nv@users.noreply.github.com> Date: Sat, 24 Jan 2026 16:04:02 +0800 Subject: [PATCH] =?UTF-8?q?[https://nvbugs/5804146][fix]=20Enable=20respon?= =?UTF-8?q?ses=20tests=20and=20remove=20ds=20to=E2=80=A6=20(#10925)?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Signed-off-by: Junyi Xu <219237550+JunyiXu-nv@users.noreply.github.com> Signed-off-by: Wangshanshan <30051912+dominicshanshan@users.noreply.github.com> --- tests/integration/test_lists/waives.txt | 1 - .../llmapi/apps/_test_openai_responses.py | 17 +++++------------ 2 files changed, 5 insertions(+), 13 deletions(-) diff --git a/tests/integration/test_lists/waives.txt b/tests/integration/test_lists/waives.txt index 702fc0d11d..4792036019 100644 --- a/tests/integration/test_lists/waives.txt +++ b/tests/integration/test_lists/waives.txt @@ -227,7 +227,6 @@ examples/test_ray.py::test_ray_disaggregated_serving[tp2] SKIP (https://nvbugs/5 unittest/executor/test_rpc_proxy.py SKIP (https://nvbugs/5605741) unittest/executor/test_rpc_worker.py SKIP (https://nvbugs/5605741) cpp/test_e2e.py::test_model[-redrafter-86] SKIP (https://nvbugs/5761642) -test_e2e.py::test_openai_responses SKIP (https://nvbugs/5804146) triton_server/test_triton.py::test_gpt_gather_logits[gpt-gather-logits] SKIP (https://nvbugs/5766960) full:sm89/accuracy/test_disaggregated_serving.py::TestLlama3_1_8BInstruct::test_ctx_pp_gen_tp_asymmetric[MMLU-gen_tp=1-ctx_pp=2] SKIP (https://nvbugs/5596337) test_e2e.py::test_eagle3_output_consistency_4gpus[Qwen3/saved_models_Qwen3-235B-A22B_fp8_hf-Qwen3/qwen3-235B-eagle3] SKIP (https://nvbugs/5685010) diff --git a/tests/unittest/llmapi/apps/_test_openai_responses.py b/tests/unittest/llmapi/apps/_test_openai_responses.py index 08b53490b1..67ae21cd91 100644 --- a/tests/unittest/llmapi/apps/_test_openai_responses.py +++ b/tests/unittest/llmapi/apps/_test_openai_responses.py @@ -13,10 +13,7 @@ pytestmark = pytest.mark.threadleak(enabled=False) @pytest.fixture(scope="module", - params=[ - "gpt_oss/gpt-oss-20b", "DeepSeek-R1-Distill-Qwen-1.5B", - "Qwen3/Qwen3-0.6B" - ]) + params=["gpt_oss/gpt-oss-20b", "Qwen3/Qwen3-0.6B"]) def model(request): return request.param @@ -35,10 +32,6 @@ def server(model: str, num_postprocess_workers: int): args = ["--num_postprocess_workers", f"{num_postprocess_workers}"] if model.startswith("Qwen3"): args.extend(["--reasoning_parser", "qwen3"]) - elif model.startswith("DeepSeek-R1"): - args.extend(["--reasoning_parser", "deepseek-r1"]) - - if not model.startswith("gpt_oss"): args.extend(["--tool_parser", "qwen3"]) with RemoteOpenAIServer(model_path, args) as remote_server: @@ -167,8 +160,8 @@ def get_current_weather(location: str, format: str = "celsius") -> dict: @pytest.mark.asyncio(loop_scope="module") async def test_tool_calls(client: openai.AsyncOpenAI, model: str): - if model.startswith("DeepSeek-R1"): - pytest.skip("DeepSeek-R1 does not support tool calls") + if model.startswith("Qwen3"): + pytest.skip("Qwen3 tool call is not stable") tool_get_current_weather = { "type": "function", @@ -241,8 +234,8 @@ async def test_streaming(client: openai.AsyncOpenAI, model: str): @pytest.mark.asyncio(loop_scope="module") async def test_streaming_tool_call(client: openai.AsyncOpenAI, model: str): - if model.startswith("DeepSeek-R1"): - pytest.skip("DeepSeek-R1 does not support tool calls") + if model.startswith("Qwen3"): + pytest.skip("Qwen3 tool call is not stable") tool_get_current_weather = { "type": "function",