mirror of
https://github.com/NVIDIA/TensorRT-LLM.git
synced 2026-01-14 06:27:45 +08:00
[None][infra] Skip test_eagle3 test with device memory check (#6617)
Signed-off-by: leslie-fang25 <leslief@nvidia.com>
This commit is contained in:
parent
7625845365
commit
164acfa31e
@@ -1955,6 +1955,7 @@ class TestQwen3_8B(LlmapiAccuracyTestHarness):
|
||||
task = MMLU(self.MODEL_NAME)
|
||||
task.evaluate(llm)
|
||||
|
||||
@pytest.mark.skip_less_device_memory(140000) ## OOM on 80G H100
|
||||
@parametrize_with_ids("eagle3_one_model", [True, False])
|
||||
@parametrize_with_ids("enable_chunked_prefill", [False, True])
|
||||
def test_eagle3(self, enable_chunked_prefill, eagle3_one_model):
|
||||
|
||||
Loading…
Reference in New Issue
Block a user