mirror of
https://github.com/NVIDIA/TensorRT-LLM.git
synced 2026-02-16 07:53:55 +08:00
[https://nvbugs/5839569][test] update test constraint (#11054)
Signed-off-by: Ivy Zhang <25222398+crazydemo@users.noreply.github.com>
Signed-off-by: Wangshanshan <30051912+dominicshanshan@users.noreply.github.com>
This commit is contained in:
parent
03b635bb08
commit
9384cf8458
@@ -3133,6 +3133,7 @@ class TestKimiK2(LlmapiAccuracyTestHarness):
|
||||
@pytest.mark.skip_less_mpi_world_size(8)
|
||||
@skip_post_blackwell
|
||||
@skip_pre_hopper
|
||||
@pytest.mark.skip_less_device_memory(180000)
|
||||
@pytest.mark.parametrize(
|
||||
"tp_size,pp_size,ep_size,fp8kv,attention_dp,cuda_graph,overlap_scheduler,max_batch_size",
|
||||
[(8, 1, 8, False, False, True, True, 16)],
|
||||
|
||||
Loading…
Reference in New Issue
Block a user