mirror of
https://github.com/NVIDIA/TensorRT-LLM.git
synced 2026-01-13 22:18:36 +08:00
[None][test] update test case constraint (#10381)
Signed-off-by: Ivy Zhang <25222398+crazydemo@users.noreply.github.com>
This commit is contained in:
parent
1b1058279c
commit
22a1d31a27
@ -2269,6 +2269,7 @@ class TestDeepSeekR1(LlmapiAccuracyTestHarness):
|
||||
torch.cuda.empty_cache()
|
||||
|
||||
@skip_pre_blackwell
|
||||
@pytest.mark.skip_less_device_memory(95000)
|
||||
@pytest.mark.parametrize(
|
||||
"tp_size,pp_size,ep_size,mtp_nextn,fp8kv,attention_dp,cuda_graph,overlap_scheduler,max_batch_size,moe_backend",
|
||||
[
|
||||
|
||||
Loading…
Reference in New Issue
Block a user