mirror of
https://github.com/NVIDIA/TensorRT-LLM.git
synced 2026-02-05 02:31:33 +08:00
Signed-off-by: Stefan Niebler <82932102+stnie@users.noreply.github.com> Signed-off-by: Yuan Tong <13075180+tongyuantongyu@users.noreply.github.com> Signed-off-by: Erin Ho <14718778+hchings@users.noreply.github.com> Co-authored-by: Yuan Tong <13075180+tongyuantongyu@users.noreply.github.com> Co-authored-by: Erin Ho <14718778+hchings@users.noreply.github.com>
23 lines
561 B
YAML
23 lines
561 B
YAML
# Reference description of a class's public surface: the parameters accepted
# by its constructor (type annotation, default value, optional stability
# status), the constructor's return annotation, and its properties.
#
# NOTE(review): nesting was reconstructed from a flattened copy in which every
# line sat at column 0 and was separated by stray `|` lines — confirm the
# hierarchy against the upstream file before relying on it.
methods:
  __init__:
    parameters:
      # Experimental features
      additional_model_outputs:
        annotation: Optional[List[str]]
        default: null
        # Only this parameter carries an explicit `status` field.
        status: prototype
      return_perf_metrics:
        annotation: bool
        default: false
      beam_width_array:
        annotation: Optional[List[int]]
        default: null
      prompt_ignore_length:
        annotation: Optional[int]
        default: null
      logprobs_mode:
        annotation: LogprobMode
        # Plain (unquoted) scalar: a YAML loader reads this as the string
        # "LogprobMode.RAW", not as an enum member.
        default: LogprobMode.RAW
    return_annotation: None
# Empty flow mapping: no properties are listed.
properties: {}