mirror of
https://github.com/NVIDIA/TensorRT-LLM.git
synced 2026-02-04 18:21:52 +08:00
[None][fix] AttributeError with return_perf_metrics on tensorrt backend (#10662)
Signed-off-by: Dmitry Barsukoff <riZZZhik@gmail.com> Co-authored-by: Kanghwan <861393+karljang@users.noreply.github.com>
This commit is contained in:
parent
1c8f8bed00
commit
ea49afdf0b
@@ -2182,6 +2182,12 @@ class BaseLlmArgs(StrictBaseModel):
|
||||
description="Return perf metrics.",
|
||||
status="prototype")
|
||||
|
||||
perf_metrics_max_requests: int = Field(
|
||||
default=0,
|
||||
description=
|
||||
"The maximum number of requests for perf metrics. Must also set return_perf_metrics to true to get perf metrics.",
|
||||
status="prototype")
|
||||
|
||||
orchestrator_type: Optional[Literal["rpc", "ray"]] = Field(
|
||||
default=None,
|
||||
description=
|
||||
@@ -2898,12 +2904,6 @@ class TorchLlmArgs(BaseLlmArgs):
|
||||
description="Print iteration logs.",
|
||||
status="beta")
|
||||
|
||||
perf_metrics_max_requests: int = Field(
|
||||
default=0,
|
||||
description=
|
||||
"The maximum number of requests for perf metrics. Must also set request_perf_metrics to true to get perf metrics.",
|
||||
status="prototype")
|
||||
|
||||
batch_wait_timeout_ms: float = Field(
|
||||
default=0,
|
||||
description=
|
||||
|
||||
Loading…
Reference in New Issue
Block a user