Mirror of https://github.com/NVIDIA/TensorRT-LLM.git (synced 2026-01-13 22:18:36 +08:00)
test: add deepseek_v3_lite rcca cases (#5225)
Signed-off-by: ruodil <200874449+ruodil@users.noreply.github.com>
This commit is contained in:
parent cbc6455266
commit e05b3ff427
@@ -78,7 +78,7 @@ def get_model_yaml_config(model_label: str) -> dict:
|
||||
[1, 2, 4, 8, 16, 32, 64, 128, 256, 384]
|
||||
},
|
||||
},
|
||||
'deepseek_r1_nvfp4-bench-pytorch-streaming-float4-maxbs:2048-maxnt:8192-input_output_len:256,256-num_reqs:200-gpus:1':
|
||||
'deepseek_v3_lite_nvfp4-bench-pytorch-streaming-float4-maxbs:2048-maxnt:8192-input_output_len:256,256-reqs:200':
|
||||
{
|
||||
'pytorch_backend_config': {
|
||||
'print_iter_log': True,
|
||||
|
||||
@@ -11,7 +11,7 @@ trt_llm_release_perf_cluster_test:
|
||||
- perf/test_perf.py::test_perf[t5-bench-float16-input_output_len:128,20]
|
||||
- perf/test_perf.py::test_perf[mistral_7b_v0.1-bench-float16-input_output_len:1000,1000-quant:fp8]
|
||||
- perf/test_perf.py::test_perf[mistral_7b_v0.1-bench-float16-input_output_len:500,2000-quant:fp8]
|
||||
- perf/test_perf.py::test_perf[deepseek_r1_nvfp4-bench-pytorch-streaming-float4-maxbs:2048-maxnt:8192-input_output_len:256,256-num_reqs:200-gpus:1]
|
||||
- perf/test_perf.py::test_perf[deepseek_v3_lite_nvfp4-bench-pytorch-streaming-float4-maxbs:2048-maxnt:8192-input_output_len:256,256-reqs:200-gpus:1]
|
||||
- condition:
|
||||
ranges:
|
||||
system_gpu_count:
|
||||
|
||||
Loading…
Reference in New Issue
Block a user