Mirror of https://github.com/NVIDIA/TensorRT-LLM.git (synced 2026-01-14 06:27:45 +08:00)
test: waive flaky test_kv_cache_event_async_api (#3062)
Signed-off-by: Yuan Tong <13075180+tongyuantongyu@users.noreply.github.com>
This commit is contained in:
parent: d9acce72bb
commit: 53adb3cb4e
@ -1,6 +1,7 @@
|
||||
import asyncio
|
||||
import time
|
||||
|
||||
import pytest
|
||||
from test_llm import get_model_path
|
||||
|
||||
import tensorrt_llm
|
||||
@ -119,6 +120,7 @@ def test_expected_kv_cache_events():
|
||||
assert event[0]["data"]["type"] == "stored"
|
||||
|
||||
|
||||
@pytest.mark.skip("https://nvbugs/5150466: flaky fail")
|
||||
def test_kv_cache_event_async_api():
|
||||
llm = create_llm()
|
||||
sampling_params = SamplingParams(max_tokens=6, temperature=0.01)
|
||||
|
||||
Loading…
Reference in New Issue
Block a user