mirror of
https://github.com/NVIDIA/TensorRT-LLM.git
synced 2026-01-22 03:35:00 +08:00
* beam_width and max_new_token Signed-off-by: Superjomn <328693+Superjomn@users.noreply.github.com> * remove beam_width Signed-off-by: Superjomn <328693+Superjomn@users.noreply.github.com> * remove min_length Signed-off-by: Superjomn <328693+Superjomn@users.noreply.github.com> * remove return_num_sequences Signed-off-by: Superjomn <328693+Superjomn@users.noreply.github.com> Signed-off-by: Superjomn <328693+Superjomn@users.noreply.github.com> Signed-off-by: Superjomn <328693+Superjomn@users.noreply.github.com> Signed-off-by: Superjomn <328693+Superjomn@users.noreply.github.com> Signed-off-by: Superjomn <328693+Superjomn@users.noreply.github.com> Signed-off-by: Superjomn <328693+Superjomn@users.noreply.github.com> --------- Signed-off-by: Superjomn <328693+Superjomn@users.noreply.github.com>
16 lines
412 B
YAML
16 lines
412 B
YAML
# Describes a callable surface: `methods` maps each method name to its
# signature, and `properties` lists exposed properties (none here).
# Each entry under `parameters` gives the parameter's type annotation and
# its default value.
methods:
  __init__:
    parameters:
      # Experimental features
      additional_model_outputs:
        annotation: Optional[List[tensorrt_llm.sampling_params.AdditionalModelOutput]]
        default: null
      return_perf_metrics:
        annotation: bool
        default: false
      beam_width_array:
        annotation: Optional[List[int]]
        default: null
    # NOTE(review): nesting of return_annotation under __init__ is
    # reconstructed from key order — confirm against the upstream file.
    return_annotation: None
properties: {}