mirror of
https://github.com/NVIDIA/TensorRT-LLM.git
synced 2026-02-12 05:53:33 +08:00
Waive dynamic spec decode unit test
Signed-off-by: Zheyu Fu <zheyuf@NVIDIA.com>
This commit is contained in:
parent
7c638f155b
commit
ab45d6a7c7
@@ -481,3 +481,4 @@ unittest/llmapi/apps/test_disagg_serving_perf_metrics.py SKIP (https://nvbugs/57
|
||||
unittest/_torch/attention/test_trtllm_flashinfer_symbol_collision.py::test_flashinfer_fused_moe_matches_torch_moe SKIP (https://nvbugs/5752521)
|
||||
unittest/llmapi/apps/_test_openai_responses.py::test_reasoning_effort[DeepSeek-R1-Distill-Qwen-1.5B] SKIP (https://nvbugs/5753250)
|
||||
unittest/llmapi/apps/_test_openai_responses.py::test_multi_turn_chat[Qwen3/Qwen3-0.6B] SKIP (https://nvbugs/5753250)
|
||||
unittest/_torch/speculative/test_dynamic_spec_decode.py::test_dynamic_spec_decode SKIP (https://nvbugs/5758449)
|
||||
|
||||
@@ -21,6 +21,7 @@ def enforce_single_worker(monkeypatch):
|
||||
yield
|
||||
|
||||
|
||||
@pytest.mark.skip("https://nvbugs/5758449")
|
||||
@pytest.mark.parametrize("disable_overlap_scheduler", [True, False])
|
||||
@pytest.mark.high_cuda_memory
|
||||
def test_dynamic_spec_decode(enforce_single_worker,
|
||||
|
||||
Loading…
Reference in New Issue
Block a user