mirror of
https://github.com/NVIDIA/TensorRT-LLM.git
synced 2026-01-14 06:27:45 +08:00
fix: wrong argument name enable_overlap_scheduler (#4433)
Fix wrong argument

Signed-off-by: Kaiyu Xie <26294424+kaiyux@users.noreply.github.com>
This commit is contained in:
parent
cf6cd940e5
commit
a43914619f
@@ -202,7 +202,6 @@ trtllm-bench --model $model_name throughput --dataset $dataset_file --backend py
|
||||
```yaml
|
||||
|
||||
pytorch_backend_config:
|
||||
enable_overlap_scheduler: true
|
||||
use_cuda_graph: true
|
||||
cuda_graph_padding_enabled: true
|
||||
cuda_graph_batch_sizes:
|
||||
|
||||
@@ -1415,7 +1415,6 @@ def test_ptp_quickstart_advanced_deepseek_v3_2nodes_8gpus(
|
||||
"trtllm-llmapi-launch",
|
||||
"python3",
|
||||
str(example_root / "quickstart_advanced.py"),
|
||||
"--enable_overlap_scheduler",
|
||||
"--model_dir",
|
||||
f"{llm_models_root()}/{model_path}",
|
||||
"--moe_ep_size=8",
|
||||
|
||||
Loading…
Reference in New Issue
Block a user